Wolf369 committed on
Commit
d064a1c
1 Parent(s): a2415d5
Files changed (1) hide show
  1. main.py +1 -1
main.py CHANGED
@@ -8,7 +8,7 @@ app = FastAPI()
8
  @app.get("/llm_inference")
9
  def read_root(
10
  prompt: str,
11
- model: str = "meta-llama/Llama-2-7b-hf",
12
  temperature: float = 0.,
13
  max_tokens: int = 1024) -> List:
14
  sampling_params = SamplingParams(temperature=temperature, max_tokens=max_tokens)
 
8
  @app.get("/llm_inference")
9
  def read_root(
10
  prompt: str,
11
+ model: str = "meta-llama/Llama-2-7B-hf",
12
  temperature: float = 0.,
13
  max_tokens: int = 1024) -> List:
14
  sampling_params = SamplingParams(temperature=temperature, max_tokens=max_tokens)