mobicham committed on
Commit
9029769
·
verified ·
1 Parent(s): c52e8b3

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +1 -1
README.md CHANGED
@@ -34,7 +34,7 @@ compute_dtype = torch.bfloat16
34
  device = 'cuda'
35
  model_id = "mobiuslabsgmbh/DeepSeek-R1-ReDistill-Qwen-1.5B-v1.1"
36
 
37
- model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=compute_dtype, attn_implementation=attn_implementation, device_map=device)
38
  tokenizer = AutoTokenizer.from_pretrained(model_id)
39
 
40
  chat = tokenizer.apply_chat_template([{"role":"user", "content":"What is 1.5+102.2?"}], tokenize=True, add_generation_prompt=True, return_tensors="pt")
 
34
  device = 'cuda'
35
  model_id = "mobiuslabsgmbh/DeepSeek-R1-ReDistill-Qwen-1.5B-v1.1"
36
 
37
+ model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=compute_dtype, attn_implementation="sdpa", device_map=device)
38
  tokenizer = AutoTokenizer.from_pretrained(model_id)
39
 
40
  chat = tokenizer.apply_chat_template([{"role":"user", "content":"What is 1.5+102.2?"}], tokenize=True, add_generation_prompt=True, return_tensors="pt")