Update README.md
Browse files
README.md
CHANGED
|
@@ -51,16 +51,16 @@ pip install torch transformers
|
|
| 51 |
from transformers import AutoModelForCausalLM, AutoTokenizer
|
| 52 |
|
| 53 |
model_name = "t83714/llama-3.1-8b-instruct-limo"
|
| 54 |
-
model = AutoModelForCausalLM.from_pretrained(model_name)
|
| 55 |
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
| 56 |
|
| 57 |
prompt = "How much is (2+5)x5/7"
|
| 58 |
|
| 59 |
# Tokenize the input
|
| 60 |
-
inputs = tokenizer(prompt, return_tensors="pt")
|
| 61 |
|
| 62 |
# Generate the output
|
| 63 |
-
output = model.generate(**inputs, max_length=
|
| 64 |
print(tokenizer.decode(output[0], skip_special_tokens=True))
|
| 65 |
```
|
| 66 |
|
|
|
|
| 51 |
from transformers import AutoModelForCausalLM, AutoTokenizer
|
| 52 |
|
| 53 |
model_name = "t83714/llama-3.1-8b-instruct-limo"
|
| 54 |
+
model = AutoModelForCausalLM.from_pretrained(model_name, torch_dtype="auto", device_map="auto")
|
| 55 |
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
| 56 |
|
| 57 |
prompt = "How much is (2+5)x5/7"
|
| 58 |
|
| 59 |
# Tokenize the input
|
| 60 |
+
inputs = tokenizer(prompt, return_tensors="pt").to("cuda")
|
| 61 |
|
| 62 |
# Generate the output
|
| 63 |
+
output = model.generate(**inputs, max_length=8000)
|
| 64 |
print(tokenizer.decode(output[0], skip_special_tokens=True))
|
| 65 |
```
|
| 66 |
|