Artix

Runtime error

App Files Files Community

Vitrous committed on Feb 16, 2024

Commit

67c4e45

verified ·

1 Parent(s): cac49fb

Update app.py

Browse files

Files changed (1) hide show

app.py +74 -8

app.py CHANGED Viewed

@@ -39,8 +39,7 @@ model, tokenizer = load_model_norm()
 # Now we can initialize the FastAPI app
 app = FastAPI(root_path="/api/v1")
-# Function to generate a response using the model
 def generate_response(prompt: str) -> str:
     # Define the user prompt
     user_prompt = f'USER: {prompt}'
@@ -68,14 +67,49 @@ def generate_response(prompt: str) -> str:
 @app.get("/", tags=["Home"])
 async def api_home():
     return {'detail': 'Welcome to Eren Bot!'}
 # Endpoint to start a new conversation thread
 @app.post('/start_conversation/')
 async def start_conversation(request: Request):
     try:
@@ -86,23 +120,54 @@ async def start_conversation(request: Request):
         if not prompt:
             raise HTTPException(status_code=400, detail="No prompt provided")
-        # Check if conversations dictionary is empty
-       # if not conversations:
-           # raise HTTPException(status_code=404, detail="No chat history available")
         # Generate a response for the initial prompt
         response = generate_response(prompt)
         # Create a new conversation thread and store the prompt and response
-        ##conversations[thread_id] = {'prompt': prompt, 'responses': [response]}
-        #return {'thread_id': thread_id, 'response': response}
         return {'response': response}
     except HTTPException:
         raise  # Re-raise HTTPException to return it directly
     except Exception as e:
         raise HTTPException(status_code=500, detail=str(e))
 @app.get('/get_response/{thread_id}')
 async def get_response(thread_id: int):
     if thread_id not in conversations:
@@ -119,6 +184,7 @@ async def get_response(thread_id: int):
 @app.post('/chat/')
 async def chat(request: Request):
     data = await request.json()

 # Now we can initialize the FastAPI app
 app = FastAPI(root_path="/api/v1")
+#Generates a response from the model
 def generate_response(prompt: str) -> str:
     # Define the user prompt
     user_prompt = f'USER: {prompt}'
+def generate_response(persona_prompt: str, prompt: str) -> dict:
+    try:
+        # Validate inputs
+        if not persona_prompt or not prompt:
+            raise ValueError("Contextual prompt template and prompt cannot be empty.")
+        # Define the user prompt
+        user_prompt = f'USER: {prompt}'
+        # Generate the response
+        pipe = pipeline(
+            "text-generation",
+            model=model,
+            tokenizer=tokenizer,
+            max_new_tokens=512,
+            do_sample=True,
+            temperature=0.7,
+            top_p=0.95,
+            top_k=40,
+            repetition_penalty=1.1
+        )
+        generated_text = pipe(persona_prompt + user_prompt)[0]['generated_text']
+        # Extract only the assistant's response from the generated text
+        assistant_response = generated_text.split(user_prompt)[-1].strip()
+        return {"user": prompt,"assistant": assistant_response}
+    except Exception as e:
+        # Handle any exceptions and return an error message
+        return {"error": str(e)}
+# Root endpoint of the FastAPI application
 @app.get("/", tags=["Home"])
 async def api_home():
     return {'detail': 'Welcome to Eren Bot!'}
 # Endpoint to start a new conversation thread
+# Waits for the user to start a conversation and replies based on the model's persona
 @app.post('/start_conversation/')
 async def start_conversation(request: Request):
     try:
         if not prompt:
             raise HTTPException(status_code=400, detail="No prompt provided")
         # Generate a response for the initial prompt
         response = generate_response(prompt)
+        # Generate a unique thread ID
+        thread_id = len(conversations) + 1
         # Create a new conversation thread and store the prompt and response
+        conversations[thread_id] = {'prompt': prompt, 'responses': [response]}
         return {'response': response}
     except HTTPException:
         raise  # Re-raise HTTPException to return it directly
     except Exception as e:
         raise HTTPException(status_code=500, detail=str(e))
+# Endpoint to start a new chat thread
+# Starts a new chat thread and expects the prompt and the persona_prompt from the user
+@app.post('/start_chat/')
+async def start_chat(request: Request):
+    try:
+        # Read JSON data from request body
+        data = await request.json()
+        prompt = data.get('prompt')
+        persona_prompt = data.get('persona_prompt')
+        if not prompt or not persona_prompt:
+            raise HTTPException(status_code=400, detail="Both prompt and contextual_prompt are required")
+        # Generate a response for the initial prompt
+        response = generate_response(persona_prompt, prompt)
+        # Generate a unique thread ID
+        thread_id = len(conversations) + 1
+        # Create a new conversation thread and store the prompt and response
+        conversations[thread_id] = {'prompt': prompt, 'responses': [response]}
+        # Return the thread ID and response
+        return {'thread_id': thread_id, 'response': response}
+    except HTTPException:
+        raise  # Re-raise HTTPException to return it directly
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=str(e))
+# Gets the user and model responses for the conversation with the given thread ID
 @app.get('/get_response/{thread_id}')
 async def get_response(thread_id: int):
     if thread_id not in conversations:
 @app.post('/chat/')
 async def chat(request: Request):
     data = await request.json()