Petro committed on
Commit
66bb7d2
·
1 Parent(s): 3fa3baf
Files changed (1) hide show
  1. main.py +4 -3
main.py CHANGED
@@ -2,11 +2,12 @@ from ctransformers import AutoModelForCausalLM
2
  from fastapi import FastAPI
3
  from pydantic import BaseModel
4
 
5
- file_name = "zephyr-7b-beta.Q4_K_S.gguf"
6
  llm = AutoModelForCausalLM.from_pretrained(file_name,
7
  model_type='mistral',
8
- max_new_tokens = 1096,
9
- threads = 3,
 
10
  )
11
 
12
  #Pydantic object
 
2
  from fastapi import FastAPI
3
  from pydantic import BaseModel
4
 
5
+ file_name = "gemma-2b.Q2_K.gguf"
6
  llm = AutoModelForCausalLM.from_pretrained(file_name,
7
  model_type='mistral',
8
+ max_new_tokens=2_096,
9
+ context_length=8_000,
10
+ threads=3,
11
  )
12
 
13
  #Pydantic object