File size: 9,298 Bytes
397ce12
fa9ac7e
 
 
 
44ee439
fa9ac7e
397ce12
 
 
 
fa9ac7e
 
c5f5dc3
e16fc27
fa9ac7e
c8a1687
1f22b14
c5f5dc3
fa9ac7e
 
 
8b5fed9
5b7d0e6
c8a1687
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
fa9ac7e
c8a1687
fa9ac7e
c8a1687
1f22b14
fa9ac7e
 
 
 
8b5fed9
c8a1687
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
fa9ac7e
5b7d0e6
fa9ac7e
c8a1687
fa9ac7e
c8a1687
d88c550
c5f5dc3
 
 
 
8b5fed9
c8a1687
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
c5f5dc3
5b7d0e6
c5f5dc3
c8a1687
c5f5dc3
c8a1687
1f22b14
c8a1687
e16fc27
 
 
8b5fed9
c8a1687
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
e16fc27
5b7d0e6
e16fc27
c8a1687
e16fc27
397ce12
 
 
 
 
 
 
 
 
fa9ac7e
 
 
 
 
397ce12
fa9ac7e
 
 
397ce12
 
 
 
 
 
 
 
 
 
 
 
 
 
fa9ac7e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
import logging
import os

from slack_bolt import App

from buster.busterbot import Buster, BusterConfig

logger = logging.getLogger(__name__)
logging.basicConfig(level=logging.INFO)

# Set Slack channel IDs
MILA_CLUSTER_CHANNEL = "C04LR4H9KQA"
ORION_CHANNEL = "C04LYHGUYB0"
PYTORCH_CHANNEL = "C04MEK6N882"
HF_TRANSFORMERS_CHANNEL = "C04NJNCJWHE"

mila_doc_cfg = BusterConfig(
    documents_file="../data/document_embeddings_mila.tar.gz",
    unknown_prompt="This doesn't seem to be related to cluster usage.",
    embedding_model="text-embedding-ada-002",
    top_k=3,
    thresh=0.7,
    max_words=3000,
    response_format="slack",
    completer_cfg={
        "name": "ChatGPT",
        "text_before_prompt": (
            """You are a slack chatbot assistant answering technical questions about the mila cluster. """
            """Make sure to format your answers in Markdown format, including code block and snippets. """
            """Do not include any links to urls or hyperlinks in your answers. """
            """If you do not know the answer to a question, or if it is completely irrelevant to the library usage, simply reply with: """
            """'This doesn't seem to be related to the pytorch library.'\n"""
            """For example:\n"""
            """What is the meaning of life for pytorch?\n"""
            """This doesn't seem to be related to the pytorch library.\n"""
            """Now answer the following question:\n"""
        ),
        "text_before_documents": "Only use these documents as reference:\n",
        "completion_kwargs": {
            "model": "gpt-3.5-turbo",
        },
    },
)
mila_doc_chatbot = Buster(mila_doc_cfg)

orion_cfg = BusterConfig(
    documents_file="../data/document_embeddings_orion.tar.gz",
    unknown_prompt="This doesn't seem to be related to the orion library. I am not sure how to answer.",
    embedding_model="text-embedding-ada-002",
    top_k=3,
    thresh=0.7,
    max_words=3000,
    completer_cfg={
        "name": "ChatGPT",
        "text_before_prompt": (
            """You are a slack chatbot assistant answering technical questions about orion, a hyperparameter optimization library written in python. """
            """Make sure to format your answers in Markdown format, including code block and snippets. """
            """Do not include any links to urls or hyperlinks in your answers. """
            """If you do not know the answer to a question, or if it is completely irrelevant to the library usage, simply reply with: """
            """'This doesn't seem to be related to the pytorch library.'\n"""
            """For example:\n"""
            """What is the meaning of life for pytorch?\n"""
            """This doesn't seem to be related to the pytorch library.\n"""
            """Now answer the following question:\n"""
        ),
        "text_before_documents": "Only use these documents as reference:\n",
        "completion_kwargs": {
            "model": "gpt-3.5-turbo",
        },
    },
    response_format="slack",
)
orion_chatbot = Buster(orion_cfg)

pytorch_cfg = BusterConfig(
    documents_file="../data/document_embeddings_pytorch.tar.gz",
    unknown_prompt="This doesn't seem to be related to the pytorch library. I am not sure how to answer.",
    embedding_model="text-embedding-ada-002",
    top_k=3,
    thresh=0.7,
    max_words=3000,
    completer_cfg={
        "name": "ChatGPT",
        "text_before_prompt": (
            """You are a slack chatbot assistant answering technical questions about pytorch, a library to train neural networks written in python. """
            """Make sure to format your answers in Markdown format, including code block and snippets. """
            """Do not include any links to urls or hyperlinks in your answers. """
            """If you do not know the answer to a question, or if it is completely irrelevant to the library usage, simply reply with: """
            """'This doesn't seem to be related to the pytorch library.'\n"""
            """For example:\n"""
            """What is the meaning of life for pytorch?\n"""
            """This doesn't seem to be related to the pytorch library.\n"""
            """Now answer the following question:\n"""
        ),
        "text_before_documents": "Only use these documents as reference:\n",
        "completion_kwargs": {
            "model": "gpt-3.5-turbo",
        },
    },
    response_format="slack",
)
pytorch_chatbot = Buster(pytorch_cfg)

hf_transformers_cfg = BusterConfig(
    documents_file="../data/document_embeddings_huggingface.tar.gz",
    unknown_prompt="I'm sorry, but I am an AI language model trained to assist with questions related to the huggingface transformers library. I cannot answer that question as it is not relevant to the library or its usage. Is there anything else I can assist you with?",
    embedding_model="text-embedding-ada-002",
    top_k=3,
    thresh=0.7,
    max_words=3000,
    completer_cfg={
        "name": "ChatGPT",
        "text_before_prompt": (
            """You are a slack chatbot assistant answering technical questions about huggingface transformers, a library to train transformers in python. """
            """Make sure to format your answers in Markdown format, including code block and snippets. """
            """Do not include any links to urls or hyperlinks in your answers. """
            """If you do not know the answer to a question, or if it is completely irrelevant to the library usage, let the user know you cannot answer. """
            """For example:\n"""
            """What is the meaning of life for huggingface?\n"""
            """This doesn't seem to be related to the huggingface library.\n"""
            """I'm sorry, but I am an AI language model trained to assist with questions related to the huggingface transformers library. I cannot answer that question as it is not relevant to the library or its usage. Is there anything else I can assist you with?"""
            """"""
            """Now answer the following question:\n"""
        ),
        "text_before_documents": "Only use these documents as reference:\n",
        "completion_kwargs": {
            "model": "gpt-3.5-turbo",
        },
    },
    response_format="slack",
)
hf_transformers_chatbot = Buster(hf_transformers_cfg)

# TODO: eventually move this to a factory of sorts
# Put all the bots in a dict by channel
channel_id_to_bot = {
    MILA_CLUSTER_CHANNEL: mila_doc_chatbot,
    ORION_CHANNEL: orion_chatbot,
    PYTORCH_CHANNEL: pytorch_chatbot,
    HF_TRANSFORMERS_CHANNEL: hf_transformers_chatbot,
}

app = App(token=os.environ.get("SLACK_BOT_TOKEN"), signing_secret=os.environ.get("SLACK_SIGNING_SECRET"))


@app.event("app_mention")
def respond_to_question(event, say):
    logger.info(event)

    # user's text
    text = event["text"]
    channel_id = event["channel"]

    try:
        chatbot = channel_id_to_bot.get(channel_id)
        if chatbot:
            answer = chatbot.process_input(text)
        else:
            answer = "I was not yet implemented to support this channel."
    except ValueError as e:
        # log the error and return a generic response instead.
        import traceback

        logging.error(traceback.format_exc())
        answer = "Oops, something went wrong. Try again later!"

    # responds to the message in the thread
    thread_ts = event["event_ts"]

    say(text=answer, thread_ts=thread_ts)


@app.event("app_home_opened")
def update_home_tab(client, event, logger):
    try:
        # views.publish is the method that your app uses to push a view to the Home tab
        client.views_publish(
            # the user that opened your app's app home
            user_id=event["user"],
            # the view object that appears in the app home
            view={
                "type": "home",
                "callback_id": "home_view",
                # body of the view
                "blocks": [
                    {"type": "section", "text": {"type": "mrkdwn", "text": "*Hello, I'm _BusterBot_* :tada:"}},
                    {"type": "divider"},
                    {
                        "type": "section",
                        "text": {
                            "type": "mrkdwn",
                            "text": (
                                "I am a chatbot 🤖 designed to answer questions related to technical documentation.\n\n"
                                "I use OpenAI's GPT models to target which relevant sections of documentation are relevant and respond with.\n"
                                "I am open-sourced, and my code is available on github: https://github.com/jerpint/buster\n\n"
                                "For more information, contact either Jeremy or Hadrien from the AMLRT team.\n"
                            ),
                        },
                    },
                    # {
                    #     "type": "actions",
                    #     "elements": [{"type": "button", "text": {"type": "plain_text", "text": "Click me!"}}],
                    # },
                ],
            },
        )

    except Exception as e:
        logger.error(f"Error publishing home tab: {e}")


# Start your app
if __name__ == "__main__":
    app.start(port=int(os.environ.get("PORT", 3000)))