Spaces:

GFHLabs
/

ChatWithTranscript

Running

App Files Community

AhmadMustafa committed on Dec 5, 2024

Commit

c7b90e4

1 Parent(s): deeeb78

rm unnecessary comments

Browse files

Files changed (1) hide show

app.py +4 -4

app.py CHANGED Viewed

@@ -5,6 +5,7 @@ from typing import Dict, List, Optional, Tuple
 import gradio as gr
 import requests
 from openai import OpenAI
 street_interview = False
@@ -30,7 +31,7 @@ class TranscriptProcessor:
         self.speaker_mapping = {}
         self._load_transcript()
         self._process_transcript()
-        self.map_speaker_ids_to_names()  # Map speaker IDs to names
     def _load_transcript(self) -> None:
         """Load the transcript JSON file."""
@@ -140,7 +141,7 @@ class TranscriptProcessor:
             for segment in self.segments:
                 spk_id = f"spk_{segment.speaker_id}"
                 speaker_name = self.speaker_mapping.get(spk_id, spk_id)
-                segment.speaker_name = speaker_name  # Store the speaker name
             # Recreate the formatted transcript with speaker names
             formatted_segments = []
@@ -160,7 +161,7 @@ class TranscriptProcessor:
     def correct_speaker_mapping_with_agenda(self, url: str) -> None:
         """Fetch agenda from a URL and correct the speaker mapping using OpenAI."""
         try:
-            # Fetch the HTML content from the URL
             response = requests.get(url)
             response.raise_for_status()
             html_content = response.text
@@ -201,7 +202,6 @@ class TranscriptProcessor:
                 "You should only update the name if the name sounds very similar, or there is a good spelling overlap/ The Speaker Introduction matches the description of the Talk from Agends. If the name is totally unrelated, keep the original name."
             )
-            # Use OpenAI API to get corrected mapping
             client = OpenAI()
             completion = client.chat.completions.create(

 import gradio as gr
 import requests
+from bs4 import BeautifulSoup
 from openai import OpenAI
 street_interview = False
         self.speaker_mapping = {}
         self._load_transcript()
         self._process_transcript()
+        self.map_speaker_ids_to_names()
     def _load_transcript(self) -> None:
         """Load the transcript JSON file."""
             for segment in self.segments:
                 spk_id = f"spk_{segment.speaker_id}"
                 speaker_name = self.speaker_mapping.get(spk_id, spk_id)
+                segment.speaker_name = speaker_name
             # Recreate the formatted transcript with speaker names
             formatted_segments = []
     def correct_speaker_mapping_with_agenda(self, url: str) -> None:
         """Fetch agenda from a URL and correct the speaker mapping using OpenAI."""
         try:
             response = requests.get(url)
             response.raise_for_status()
             html_content = response.text
                 "You should only update the name if the name sounds very similar, or there is a good spelling overlap/ The Speaker Introduction matches the description of the Talk from Agends. If the name is totally unrelated, keep the original name."
             )
             client = OpenAI()
             completion = client.chat.completions.create(