udaytag committed on
Commit
cca5852
1 Parent(s): 5d570ff

Upload 2 files

Browse files
Files changed (2) hide show
  1. main.py +52 -0
  2. requirements.txt +12 -0
main.py ADDED
@@ -0,0 +1,52 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import streamlit as st
2
+ from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
3
+
# Path where the model and tokenizer are saved.
save_directory = "RAG_model"


@st.cache_resource
def load_model():
    """Load the causal language model and its tokenizer from ``save_directory``.

    The function is wrapped in ``st.cache_resource`` so that the loaded
    objects are reused across Streamlit script reruns instead of being
    re-created on every widget interaction.  ``st.cache_resource`` is the
    replacement for the deprecated ``st.cache(allow_output_mutation=True)``
    when caching unserializable, shared objects such as ML models.

    Returns:
        A ``(model, tokenizer)`` tuple.
    """
    model = AutoModelForCausalLM.from_pretrained(save_directory)
    tokenizer = AutoTokenizer.from_pretrained(save_directory)
    return model, tokenizer
14
+
15
+
model, tokenizer = load_model()

# Set up the text generation pipeline on the CPU.
# Only `device` is passed: the model object is already instantiated, and
# transformers warns that when both `device` and `device_map` are given,
# `device` overrides `device_map`.  Dropping `device_map="auto"` removes the
# contradictory setting and keeps the intended CPU placement.
query_pipeline = pipeline(
    "text-generation",
    model=model,
    tokenizer=tokenizer,
    device=-1,  # -1 selects the CPU
)
26
+
st.title("Text Generation with Llama-2 Model")
st.write("This is a simple Streamlit app to generate text using the Llama-2 model.")

# Text input for the user
user_input = st.text_area("Enter your prompt:", "")

# Upper bound on the number of tokens generated *in addition to* the prompt.
# `max_new_tokens` is used instead of `max_length` because `max_length`
# counts the prompt tokens too, so a long prompt would leave little or no
# room for generated text.
MAX_NEW_TOKENS = 200

# Generate text when the user clicks the button
if st.button("Generate"):
    # Treat a whitespace-only prompt the same as an empty one.
    if user_input.strip():
        with st.spinner("Generating..."):
            sequences = query_pipeline(
                user_input,
                do_sample=True,
                top_k=10,
                num_return_sequences=1,
                eos_token_id=tokenizer.eos_token_id,
                max_new_tokens=MAX_NEW_TOKENS,
            )
        # Each returned item is a dict; the text is under 'generated_text'.
        for seq in sequences:
            st.write("Generated text:")
            st.write(seq['generated_text'])
    else:
        st.write("Please enter a prompt to generate text.")

# Add an example usage
st.write("Example usage: Enter a prompt like 'What is Artificial Intelligence?' and click 'Generate'.")
requirements.txt ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ sentence-transformers
2
+ transformers
3
+ accelerate
4
+ einops==0.6.1
5
+ langchain==0.0.300
6
+ bitsandbytes==0.41.1
7
+ sentence_transformers==2.2.2
8
+ chromadb
9
+ faiss-cpu
10
+ git+https://github.com/huggingface/accelerate.git
11
+ git+https://github.com/huggingface/transformers.git
12
+ bitsandbytes