File size: 3,455 Bytes
c368c0e
 
 
 
 
f79e201
 
609c8bf
5261070
f79e201
 
49b54f3
f79e201
5261070
f79e201
 
 
574b2df
 
f79e201
609c8bf
 
 
 
 
e3c3f07
 
 
609c8bf
 
 
 
 
 
f79e201
609c8bf
 
 
 
 
c368c0e
609c8bf
 
c368c0e
609c8bf
 
f79e201
 
609c8bf
 
574b2df
 
609c8bf
 
 
 
 
f79e201
 
 
 
 
609c8bf
 
 
 
 
 
 
f79e201
609c8bf
ddcfa7c
 
49b54f3
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
import gradio as gr
import os
import requests
import json

entire_assistant_response = ""

def get_streamed_response(message, history):

    all_message = [{
        "role": "system",
        "content": "From now on, you are an AI Therapist called Dave. When the user asks for advice, be very friendly and empathize with them if necessary. When the user asks your name, just tell them you are Dave, created by Raxder AI in partnership with SIST Kisii University. You were built to be very friendly and compassionate. Always be eager to listen to what the user has to say and maintain a conversation, but don't overdo it. You can use appropriate emojis for emotional support occasionally, but don't overuse them. Keep your responses concise to maintain a conversational flow. Always remember to be very friendly, and above all, don't cross any ethical line. From time to time, assure the user that you do not store any of their data. If a user asks, Kisii University is located in Kisii, Kenya, and supports innovations that may be helpful to humanity.",    }]
    
    for human, assistant in history:
        all_message.append({"role": "user", "content": human })
        all_message.append({"role": "assistant", "content":assistant})
    
    global entire_assistant_response
    entire_assistant_response = ""  # Reset the entire assistant response

    all_message.append({"role": "user", "content": message})

    url = "https://api.together.xyz/v1/chat/completions"
    payload = {
        "model": "NousResearch/Nous-Hermes-2-Yi-34B",
        "temperature": 1.05,
        "top_p": 0.9,
        "top_k": 50,
        "repetition_penalty": 1,
        "n": 1,
        "messages": all_message,
        "stream_tokens": True,
    }

    TOGETHER_API_KEY = os.getenv('TOGETHER_API_KEY')
    headers = {
        "accept": "application/json",
        "content-type": "application/json",
        "Authorization": f"Bearer {TOGETHER_API_KEY}",
    }

    response = requests.post(url, json=payload, headers=headers, stream=True)
    response.raise_for_status()  # Ensure HTTP request was successful

    for line in response.iter_lines():
        if line:
            decoded_line = line.decode('utf-8')

            # Check for the completion signal
            if decoded_line == "data: [DONE]":
                yield entire_assistant_response  # Yield the entire response at the end
                break

            try:
                # Decode and strip any SSE format specific prefix ("data: ")
                if decoded_line.startswith("data: "):
                    decoded_line = decoded_line.replace("data: ", "")
                    chunk_data = json.loads(decoded_line)
                    content = chunk_data['choices'][0]['delta']['content']
                    entire_assistant_response += content  # Aggregate content
                    yield entire_assistant_response

            except json.JSONDecodeError:
                print(f"Invalid JSON received: {decoded_line}")
                continue
            except KeyError as e:
                print(f"KeyError encountered: {e}")
                continue

    print(entire_assistant_response)
    all_message.append({"role": "assistant", "content": entire_assistant_response})


gr.ChatInterface(fn=get_streamed_response, title="Raxder official AI(mvp)", description="Still a minimum viable product under thorough improvement and develepment", retry_btn="Regenerate 🔁").launch()