ffreemt committed on
Commit
30289e5
1 Parent(s): fef5540

Update: remove references to other models

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -230,9 +230,9 @@ def generate(
230
  )
231
 
232
 
233
- _ = """full url: https://huggingface.co/TheBloke/mpt-30B-chat-GGML/blob/main/mpt-30b-chat.ggmlv0.q4_1.bin"""
234
 
235
- # https://huggingface.co/TheBloke/mpt-30B-chat-GGML
236
  _ = """
237
  mpt-30b-chat.ggmlv0.q4_0.bin q4_0 4 16.85 GB 19.35 GB 4-bit.
238
  mpt-30b-chat.ggmlv0.q4_1.bin q4_1 4 18.73 GB 21.23 GB 4-bit. Higher accuracy than q4_0 but not as high as q5_0. However has quicker inference than q5 models.
 
230
  )
231
 
232
 
233
+ _ = """full url: https://huggingface.co/The Bloke/mpt-30B-chat-GGML/blob/main/mpt-30b-chat.ggmlv0.q4_1.bin"""
234
 
235
+ # https://huggingface.co/The Bloke/mpt-30B-chat-GGML
236
  _ = """
237
  mpt-30b-chat.ggmlv0.q4_0.bin q4_0 4 16.85 GB 19.35 GB 4-bit.
238
  mpt-30b-chat.ggmlv0.q4_1.bin q4_1 4 18.73 GB 21.23 GB 4-bit. Higher accuracy than q4_0 but not as high as q5_0. However has quicker inference than q5 models.