Spaces:

RollAI
/

ChatWithTranscriptDev

Running

App Files Files Community

AhmadMustafa committed on Dec 12, 2024

Commit

65a422d

1 Parent(s): 5c4bf91

add: js file for iframe

Browse files

Files changed (4) hide show

20240226t210135-transcript-diarized.txt +0 -0
app.py +41 -6
index.js +30 -0
step_take19AWS.json +0 -0

20240226t210135-transcript-diarized.txt DELETED Viewed

The diff for this file is too large to render. See raw diff

app.py CHANGED Viewed

@@ -1,7 +1,7 @@
 import json
 import os
 from dataclasses import dataclass
-from typing import Dict, List, Optional, Tuple
 import gradio as gr
 import requests
@@ -222,7 +222,7 @@ class TranscriptProcessor:
             response_text = completion.choices[0].message.content.strip()
             try:
                 corrected_mapping = json.loads(response_text)
-            except:
                 response_text = response_text[
                     response_text.find("{") : response_text.rfind("}") + 1
                 ]
@@ -340,7 +340,7 @@ Your job is to find out the timestamp of the best answer given by the interviewe
 The way to know if there are multiple takes to a question is to see in the transcript if the same text is repeated, If not then number of takes is 1.
 Question 1 should always be the introduction if the speaker has introduced themselves to find the best introduction time (Last timestamp is the best timestamp), Rest of questions should be in the order they were asked.
 Return format is:
-Call ID is: {{cid}}, Session ID is: {{rsid}}, Origin is: {{origin}}, Call Type is: {{ct}}
 1. Question: question
 Number of takes: number
 Best Answer timestamp: [Timestamp: start_time - end_time]({link_start}://{{origin}}/collab/{{cid}}/{{rsid}}?st={{start_time_in_sec}}&et={{end_time_in_sec}}"').
@@ -388,6 +388,27 @@ def chat(
     origin,
     ct,
 ) -> str:
     try:
         client = OpenAI()
@@ -398,6 +419,8 @@ def chat(
         prompt = f"""You are a helpful assistant analyzing transcripts and generating timestamps and URL. Call ID is {cid}, Session ID is {rsid}, origin is {origin}, Call Type is {ct}.
 Transcript:\n{transcript_processor.get_transcript()}
 If a user asks timestamps for a specific topic, find the start time and end time of that specific topic and return answer in the format:
 Answer format:
 Topic: Heading [Timestamp: start_time - end_time]({link_start}://{{origin}}/collab/{{cid}}/{{rsid}}?st={{start_time_in_sec}}&et={{end_time_in_sec}}"').
@@ -405,7 +428,6 @@ For Example:
 If the start time is 10:13 and end time is 10:18, the url will be:
 {link_start}://roll.ai/colab/1234aq_12314/51234151?st=613&et=618
 In the URL, make sure that after RSID there is ? and then rest of the fields are added via &.
 """
         messages = [{"role": "system", "content": prompt}]
@@ -421,9 +443,18 @@ In the URL, make sure that after RSID there is ? and then rest of the fields are
         completion = client.chat.completions.create(
             model="gpt-4o-mini",
             messages=messages,
         )
         response = completion.choices[0].message
         return response.content
@@ -462,7 +493,8 @@ def create_chat_interface():
         flex-grow: 1 !important;
     }
     """
-    with gr.Blocks(fill_height=True, fill_width=True, css=css) as demo:
         chatbot = gr.Chatbot(
             elem_id="chatbot_box",
             layout="bubble",
@@ -478,6 +510,8 @@ def create_chat_interface():
         origin_state = gr.State()
         ct_state = gr.State()
         turl_state = gr.State()
         def on_app_load(request: gr.Request):
             cid = request.query_params.get("cid", None)
@@ -532,6 +566,7 @@ def create_chat_interface():
                 chatbot_value = [
                     (None, initial_analysis)
                 ]  # initialized with initial analysis and assistant is None
                 return [
                     chatbot_value,
                     transcript_processor,
@@ -614,7 +649,7 @@ def main():
     try:
         setup_openai_key()
         demo = create_chat_interface()
-        demo.launch(share=True)
     except Exception as e:
         print(f"Error starting application: {str(e)}")
         raise

 import json
 import os
 from dataclasses import dataclass
+from typing import Dict, List
 import gradio as gr
 import requests
             response_text = completion.choices[0].message.content.strip()
             try:
                 corrected_mapping = json.loads(response_text)
+            except Exception:
                 response_text = response_text[
                     response_text.find("{") : response_text.rfind("}") + 1
                 ]
 The way to know if there are multiple takes to a question is to see in the transcript if the same text is repeated, If not then number of takes is 1.
 Question 1 should always be the introduction if the speaker has introduced themselves to find the best introduction time (Last timestamp is the best timestamp), Rest of questions should be in the order they were asked.
 Return format is:
+Call ID is: {{cid}}, Recording Session ID is: {{rsid}}, Origin is: {{origin}}, Call Type is: {{ct}}
 1. Question: question
 Number of takes: number
 Best Answer timestamp: [Timestamp: start_time - end_time]({link_start}://{{origin}}/collab/{{cid}}/{{rsid}}?st={{start_time_in_sec}}&et={{end_time_in_sec}}"').
     origin,
     ct,
 ) -> str:
+    tools = [
+        {
+            "type": "function",
+            "function": {
+                "name": "correct_speaker_name_with_url",
+                "description": "If a User provides a link to Agenda file, call the correct_speaker_name_with_url function to correct the speaker names based on the url, i.e if a user says 'Here is the Luma link for the event' and provides a link to the event, the function will correct the speaker names based on the event.",
+                "parameters": {
+                    "type": "object",
+                    "properties": {
+                        "url": {
+                            "type": "string",
+                            "description": "The url to the agenda.",
+                        },
+                    },
+                    "required": ["url"],
+                    "additionalProperties": False,
+                },
+            },
+        }
+    ]
     try:
         client = OpenAI()
         prompt = f"""You are a helpful assistant analyzing transcripts and generating timestamps and URL. Call ID is {cid}, Session ID is {rsid}, origin is {origin}, Call Type is {ct}.
 Transcript:\n{transcript_processor.get_transcript()}
 If a user asks timestamps for a specific topic, find the start time and end time of that specific topic and return answer in the format:
+If the user provides a link to the agenda, use the correct_speaker_name_with_url function to correct the speaker names based on the agenda.
 Answer format:
 Topic: Heading [Timestamp: start_time - end_time]({link_start}://{{origin}}/collab/{{cid}}/{{rsid}}?st={{start_time_in_sec}}&et={{end_time_in_sec}}"').
 If the start time is 10:13 and end time is 10:18, the url will be:
 {link_start}://roll.ai/colab/1234aq_12314/51234151?st=613&et=618
 In the URL, make sure that after RSID there is ? and then rest of the fields are added via &.
 """
         messages = [{"role": "system", "content": prompt}]
         completion = client.chat.completions.create(
             model="gpt-4o-mini",
             messages=messages,
+            tools=tools,
         )
         response = completion.choices[0].message
+        if response.function_call:
+            args = json.loads(response.function_call.arguments)
+            url = args.get("url", None)
+            if url:
+                transcript_processor.correct_speaker_mapping_with_agenda(url)
+                return "Speaker names corrected based on the agenda."
+            else:
+                return "No URL provided for correcting speaker names."
         return response.content
         flex-grow: 1 !important;
     }
     """
+    with gr.Blocks(fill_height=True, fill_width=True, css=css, js="index.js") as demo:
         chatbot = gr.Chatbot(
             elem_id="chatbot_box",
             layout="bubble",
         origin_state = gr.State()
         ct_state = gr.State()
         turl_state = gr.State()
+        iframe_html = "<iframe id='link-frame'></iframe>"
+        gr.HTML(value=iframe_html)  # Add iframe to the UI
         def on_app_load(request: gr.Request):
             cid = request.query_params.get("cid", None)
                 chatbot_value = [
                     (None, initial_analysis)
                 ]  # initialized with initial analysis and assistant is None
                 return [
                     chatbot_value,
                     transcript_processor,
     try:
         setup_openai_key()
         demo = create_chat_interface()
+        demo.launch(debug=True)
     except Exception as e:
         print(f"Error starting application: {str(e)}")
         raise

index.js ADDED Viewed

	@@ -0,0 +1,30 @@

+function createIframeHandler() { // Routes link clicks anywhere in the document into the #link-frame iframe.
+    let iframe = document.getElementById('link-frame'); // Reuse the iframe if the page already contains one.
+    if (!iframe) { // Otherwise build a fallback iframe and append it to <body>.
+        iframe = document.createElement('iframe');
+        iframe.id = 'link-frame';
+        iframe.style.position = 'absolute';
+        iframe.style.width = '1px';
+        iframe.style.height = '1px';
+        iframe.style.right = '-100px'; // Negative right/bottom offsets push the 1x1 frame past the edges of its containing block.
+        iframe.style.bottom = '-100px';
+        iframe.style.display = 'none'; // Fallback iframe starts hidden; the click handler below un-hides it.
+        document.body.appendChild(iframe);
+    }
+    document.addEventListener('click', function (event) { // NOTE(review): each call registers another listener; nothing here removes or de-duplicates it.
+        var link = event.target.closest('a'); // Nearest enclosing <a>, so clicks on elements nested inside a link match too.
+        if (link && link.href) { // Ignore clicks outside links and anchors whose href is empty.
+            try {
+                iframe.src = link.href; // Load the link target inside the iframe.
+                iframe.style.display = 'block'; // Reveal the iframe once a link has been clicked.
+                event.preventDefault(); // Cancel the browser's own navigation; not reached if an assignment above threw.
+                console.log('Opening link in iframe:', link.href);
+            } catch (error) { // Log the failure; no further recovery is attempted.
+                console.error('Failed to open link in iframe:', error);
+            }
+        }
+    });
+    return 'Iframe handler initialized'; // Status string handed back to the caller.
+}

step_take19AWS.json DELETED Viewed

The diff for this file is too large to render. See raw diff