winglian committed on
Commit
d3e686c
•
1 Parent(s): b360328

add wizard vicuna 13b, update notes

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -121,6 +121,7 @@ AVAILABLE_MODELS = {
121
  "hermes-13b": ("p0zqb2gkcwp0ww", prompt_instruct),
122
  "manticore-13b-chat": ("u6tv84bpomhfei", prompt_chat),
123
  "airoboros-13b": ("rglzxnk80660ja", prompt_chat),
 
124
  "supercot-13b": ("0be7865dwxpwqk", prompt_instruct, ["Instruction:"]),
125
  "mpt-7b-instruct": ("jpqbvnyluj18b0", prompt_instruct),
126
  }
@@ -265,8 +266,8 @@ with gr.Blocks() as arena:
265
  ### brought to you by OpenAccess AI Collective
266
  - Checkout out [our writeup on how this was built.](https://medium.com/@winglian/inference-any-llm-with-serverless-in-15-minutes-69eeb548a41d)
267
  - This Space runs on CPU only, and uses GGML with GPU support via Runpod Serverless.
268
- - Due to limitations of Runpod Serverless, it cannot stream responses immediately
269
- - Responses WILL take AT LEAST 30 seconds to respond, probably longer
270
  - For now, this is single turn only
271
  - [💵 Consider Donating on our Patreon](http://patreon.com/OpenAccessAICollective)
272
  - Join us on [Discord](https://discord.gg/PugNNHAF5r)
 
121
  "hermes-13b": ("p0zqb2gkcwp0ww", prompt_instruct),
122
  "manticore-13b-chat": ("u6tv84bpomhfei", prompt_chat),
123
  "airoboros-13b": ("rglzxnk80660ja", prompt_chat),
124
+ "wizard-vicuna-13b": ("9vvpikt4ttyqos", prompt_chat),
125
  "supercot-13b": ("0be7865dwxpwqk", prompt_instruct, ["Instruction:"]),
126
  "mpt-7b-instruct": ("jpqbvnyluj18b0", prompt_instruct),
127
  }
 
266
  ### brought to you by OpenAccess AI Collective
267
  - Checkout out [our writeup on how this was built.](https://medium.com/@winglian/inference-any-llm-with-serverless-in-15-minutes-69eeb548a41d)
268
  - This Space runs on CPU only, and uses GGML with GPU support via Runpod Serverless.
269
+ - Responses may not stream immediately due to cold starts on Serverless.
270
+ - Some responses WILL take AT LEAST 20 seconds to respond
271
  - For now, this is single turn only
272
  - [💵 Consider Donating on our Patreon](http://patreon.com/OpenAccessAICollective)
273
  - Join us on [Discord](https://discord.gg/PugNNHAF5r)