mobiuslabsgmbh
/

DeepSeek-R1-ReDistill-Qwen-1.5B-v1.0

Text Generation

Model card Files Files and versions Community

mobicham committed on 14 days ago

Commit

9029769

·

verified ·

1 Parent(s): c52e8b3

Update README.md

Files changed (1) hide show

README.md +1 -1

README.md CHANGED Viewed

@@ -34,7 +34,7 @@ compute_dtype = torch.bfloat16
 device   = 'cuda'
 model_id = "mobiuslabsgmbh/DeepSeek-R1-ReDistill-Qwen-1.5B-v1.1"
-model     = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=compute_dtype, attn_implementation=attn_implementation, device_map=device)
 tokenizer = AutoTokenizer.from_pretrained(model_id)
 chat    = tokenizer.apply_chat_template([{"role":"user", "content":"What is 1.5+102.2?"}], tokenize=True, add_generation_prompt=True, return_tensors="pt")

 device   = 'cuda'
 model_id = "mobiuslabsgmbh/DeepSeek-R1-ReDistill-Qwen-1.5B-v1.1"
+model     = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=compute_dtype, attn_implementation="sdpa", device_map=device)
 tokenizer = AutoTokenizer.from_pretrained(model_id)
 chat    = tokenizer.apply_chat_template([{"role":"user", "content":"What is 1.5+102.2?"}], tokenize=True, add_generation_prompt=True, return_tensors="pt")