Spaces:
Sleeping
Sleeping
AFischer1985
committed on
Update run.py
Browse files
run.py
CHANGED
@@ -342,8 +342,8 @@ def response(message, history):
|
|
342 |
|
343 |
# Request Response from LLM:
|
344 |
system2=None # system2 can be used as fictive first words of the AI, which are not displayed or stored
|
345 |
-
print("RAG: "+rag)
|
346 |
-
print("System: "+system+"\n\nMessage: "+message)
|
347 |
prompt=extend_prompt(
|
348 |
message, # current message of the user
|
349 |
history, # complete history
|
@@ -352,7 +352,7 @@ def response(message, history):
|
|
352 |
system2, # fictive first words of the AI (neither displayed nor stored)
|
353 |
historylimit=historylimit # number of past messages to consider for response to current message
|
354 |
)
|
355 |
-
print(prompt)
|
356 |
|
357 |
## Request response from model
|
358 |
#------------------------------
|
@@ -375,10 +375,10 @@ def response(message, history):
|
|
375 |
)
|
376 |
stream = client.text_generation(prompt, **generate_kwargs, stream=True, details=True, return_full_text=False)
|
377 |
response = ""
|
378 |
-
print("User: "+message+"\nAI: ")
|
379 |
for text in stream:
|
380 |
part=text.token.text
|
381 |
-
print(part, end="", flush=True)
|
382 |
response += part
|
383 |
yield response
|
384 |
if((myType=="1a")): #add RAG-results to chat-output if appropriate
|
@@ -406,7 +406,7 @@ def response(message, history):
|
|
406 |
response="" #+"("+myType+")\n"
|
407 |
buffer=""
|
408 |
#print("URL: "+url)
|
409 |
-
print("User: "+message+"\nAI: ")
|
410 |
for text in requests.post(url, json=body, stream=True): #-H 'accept: application/json' -H 'Content-Type: application/json'
|
411 |
if buffer is None: buffer=""
|
412 |
buffer=str("".join(buffer))
|
@@ -423,7 +423,7 @@ def response(message, history):
|
|
423 |
if(part.lstrip('\n\r').startswith("data: ")): part=part.lstrip('\n\r').replace("data: ", "")
|
424 |
try:
|
425 |
part = str(json.loads(part)["choices"][0]["text"])
|
426 |
-
print(part, end="", flush=True)
|
427 |
response=response+part
|
428 |
buffer="" # reset buffer
|
429 |
except Exception as e:
|
|
|
342 |
|
343 |
# Request Response from LLM:
|
344 |
system2=None # system2 can be used as fictive first words of the AI, which are not displayed or stored
|
345 |
+
#print("RAG: "+rag)
|
346 |
+
#print("System: "+system+"\n\nMessage: "+message)
|
347 |
prompt=extend_prompt(
|
348 |
message, # current message of the user
|
349 |
history, # complete history
|
|
|
352 |
system2, # fictive first words of the AI (neither displayed nor stored)
|
353 |
historylimit=historylimit # number of past messages to consider for response to current message
|
354 |
)
|
355 |
+
print("\n\nPrompt:\n"+prompt)
|
356 |
|
357 |
## Request response from model
|
358 |
#------------------------------
|
|
|
375 |
)
|
376 |
stream = client.text_generation(prompt, **generate_kwargs, stream=True, details=True, return_full_text=False)
|
377 |
response = ""
|
378 |
+
#print("User: "+message+"\nAI: ")
|
379 |
for text in stream:
|
380 |
part=text.token.text
|
381 |
+
#print(part, end="", flush=True)
|
382 |
response += part
|
383 |
yield response
|
384 |
if((myType=="1a")): #add RAG-results to chat-output if appropriate
|
|
|
406 |
response="" #+"("+myType+")\n"
|
407 |
buffer=""
|
408 |
#print("URL: "+url)
|
409 |
+
#print("User: "+message+"\nAI: ")
|
410 |
for text in requests.post(url, json=body, stream=True): #-H 'accept: application/json' -H 'Content-Type: application/json'
|
411 |
if buffer is None: buffer=""
|
412 |
buffer=str("".join(buffer))
|
|
|
423 |
if(part.lstrip('\n\r').startswith("data: ")): part=part.lstrip('\n\r').replace("data: ", "")
|
424 |
try:
|
425 |
part = str(json.loads(part)["choices"][0]["text"])
|
426 |
+
#print(part, end="", flush=True)
|
427 |
response=response+part
|
428 |
buffer="" # reset buffer
|
429 |
except Exception as e:
|