winglian committed on
Commit
d8d503d
1 Parent(s): b15e08e

update manticore's endpoint

Browse files
Files changed (1) hide show
  1. config.yml +3 -2
config.yml CHANGED
@@ -3,9 +3,10 @@ model_url: https://huggingface.co/openaccess-ai-collective/manticore-13b-chat-py
3
  typer:
4
  delay: 0.1
5
  runpod:
6
- endpoint_id: jifr1oczbrmr3n
7
  prefer_async: true
8
  llm:
 
9
  top_k:
10
  top_p:
11
  temperature:
@@ -18,4 +19,4 @@ llm:
18
  - "</s>"
19
  queue:
20
  max_size: 16
21
- concurrency_count: 1 # recommend setting this no larger than your current
 
3
  typer:
4
  delay: 0.1
5
  runpod:
6
+ endpoint_id: u6tv84bpomhfei
7
  prefer_async: true
8
  llm:
9
+ max_tokens: 600
10
  top_k:
11
  top_p:
12
  temperature:
 
19
  - "</s>"
20
  queue:
21
  max_size: 16
22
+ concurrency_count: 1 # recommend setting this no larger than your current