vonewman committed on
Commit
d24362e
1 Parent(s): ff80f4d

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -0
app.py CHANGED
@@ -2,6 +2,13 @@ from transformers import TextIteratorStreamer
2
  from threading import Thread
3
  import gradio as gr
4
 
 
 
 
 
 
 
 
5
 
6
  MAX_INPUT_TOKEN_LENGTH = 4096
7
 
 
2
  from threading import Thread
3
  import gradio as gr
4
 
5
+ from transformers import AutoModelForCausalLM, AutoTokenizer
6
+
7
+ checkpoint_id = "sanchit-gandhi/Mistral-7B-Instruct-v0.1"
8
+
9
+ model = AutoModelForCausalLM.from_pretrained(checkpoint_id, low_cpu_mem_usage=True, load_in_4bit=True)
10
+ tokenizer = AutoTokenizer.from_pretrained(checkpoint_id)
11
+
12
 
13
  MAX_INPUT_TOKEN_LENGTH = 4096
14