Update README.md
README.md CHANGED
````diff
@@ -116,7 +116,7 @@ import torch
 from transformers import AutoModelForCausalLM, AutoTokenizer
 
 
-model_id="nanochat-students/chat-
+model_id="nanochat-students/d20-chat-transformers"
 max_new_tokens=64
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 
@@ -137,11 +137,13 @@ inputs = tokenizer.apply_chat_template(
 
 with torch.no_grad():
     outputs = model.generate(
-        inputs,
+        **inputs,
         max_new_tokens=max_new_tokens,
     )
 
-
+# Decode only the generated tokens (excluding the input prompt)
+generated_tokens = outputs[0, inputs.input_ids.shape[1]:]
+print(tokenizer.decode(generated_tokens, skip_special_tokens=True))
 ```
 
````
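For convenience, the updated snippet can be assembled into a single runnable example. The sketch below fills in the pieces the diff does not show: the model/tokenizer loading step, the `messages` list, and the `apply_chat_template` keyword arguments are assumptions based on standard transformers usage, not lines taken from the README.

```python
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

model_id = "nanochat-students/d20-chat-transformers"
max_new_tokens = 64
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

# Assumed loading step; the diff does not show how the model and tokenizer are created.
tokenizer = AutoTokenizer.from_pretrained(model_id)
model = AutoModelForCausalLM.from_pretrained(model_id).to(device)

# Hypothetical prompt; the diff only shows the apply_chat_template( call site.
messages = [{"role": "user", "content": "Hello!"}]
inputs = tokenizer.apply_chat_template(
    messages,
    add_generation_prompt=True,  # assumed kwargs, not visible in the hunk
    return_tensors="pt",
    return_dict=True,  # returns a BatchEncoding so inputs.input_ids and **inputs both work
).to(device)

with torch.no_grad():
    outputs = model.generate(
        **inputs,  # unpacks input_ids and attention_mask, per the fix above
        max_new_tokens=max_new_tokens,
    )

# Decode only the generated tokens (excluding the input prompt)
generated_tokens = outputs[0, inputs.input_ids.shape[1]:]
print(tokenizer.decode(generated_tokens, skip_special_tokens=True))
```

Passing `**inputs` instead of `inputs` unpacks the `BatchEncoding` so that `generate` receives both `input_ids` and `attention_mask` as keyword arguments, and slicing the output at `inputs.input_ids.shape[1]` prints only the newly generated tokens instead of echoing the prompt.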