fireworks-ai
/

firefunction-v1

Text Generation

function-calling

text-generation-inference

Inference Endpoints

Model card Files Files and versions Community

pgarbacki committed on Feb 17

Commit

5a86ab7

•

1 Parent(s): 199b267

Update README.md

Files changed (1) hide show

README.md +2 -2

README.md CHANGED Viewed

@@ -37,7 +37,7 @@ import json
 device = "cuda" # the device to load the model onto
-model = AutoModelForCausalLM.from_pretrained("fireworks-ai/firefunction-v1")
 tokenizer = AutoTokenizer.from_pretrained("fireworks-ai/firefunction-v1")
 function_spec = [
@@ -87,7 +87,7 @@ messages = [
     {'role': 'user', 'content': 'Hi, can you tell me the current stock price of AAPL?'}
 ]
-model_inputs = tokenizer.apply_chat_template(messages, return_tensors="pt")
 generated_ids = model.generate(model_inputs, max_new_tokens=1000, do_sample=True)
 decoded = tokenizer.batch_decode(generated_ids)

 device = "cuda" # the device to load the model onto
+model = AutoModelForCausalLM.from_pretrained("fireworks-ai/firefunction-v1", device_map="auto")
 tokenizer = AutoTokenizer.from_pretrained("fireworks-ai/firefunction-v1")
 function_spec = [
     {'role': 'user', 'content': 'Hi, can you tell me the current stock price of AAPL?'}
 ]
+model_inputs = tokenizer.apply_chat_template(messages, return_tensors="pt").to(model.device)
 generated_ids = model.generate(model_inputs, max_new_tokens=1000, do_sample=True)
 decoded = tokenizer.batch_decode(generated_ids)