Woziii committed on
Commit
f4cc38c
·
verified ·
1 Parent(s): 3209254

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +10 -0
app.py CHANGED
@@ -178,6 +178,10 @@ def transcribe_and_diarize(file_path, task, progress=gr.Progress()):
178
  return "Transcription terminée!", transcription_result['text'], speaker_transcription
179
 
180
  def format_to_markdown(transcription_text, speaker_transcription, audio_duration=None, location=None, speaker_age=None, context=None, num_speakers=None, speaker_names=None):
 
 
 
 
181
  metadata = {
182
  "Date de traitement": datetime.now().strftime('%d/%m/%Y %H:%M'),
183
  "Durée de l'audio": f"{audio_duration}" if audio_duration else "[à remplir]",
@@ -199,15 +203,20 @@ def format_to_markdown(transcription_text, speaker_transcription, audio_duration
199
  elif isinstance(row, (list, tuple)) and len(row) == 2:
200
  custom_names[row[0]] = row[1]
201
 
 
 
202
  metadata_text = "\n".join([f"- **{key}** : '{value}'" for key, value in metadata.items()])
203
 
204
  try:
205
  if isinstance(speaker_transcription, str):
206
  speaker_transcription = parse_simplified_diarization(speaker_transcription)
207
 
 
 
208
  formatted_transcription = []
209
  for speaker, text in speaker_transcription:
210
  custom_name = custom_names.get(speaker, speaker)
 
211
  formatted_transcription.append(f"**{custom_name}**: {text}")
212
  transcription_text = "\n\n".join(formatted_transcription)
213
  except Exception as e:
@@ -223,6 +232,7 @@ def format_to_markdown(transcription_text, speaker_transcription, audio_duration
223
  ## Transcription
224
  {transcription_text}
225
  """
 
226
  return formatted_output
227
 
228
  def _return_yt_html_embed(yt_url):
 
178
  return "Transcription terminée!", transcription_result['text'], speaker_transcription
179
 
180
  def format_to_markdown(transcription_text, speaker_transcription, audio_duration=None, location=None, speaker_age=None, context=None, num_speakers=None, speaker_names=None):
181
+ print("Début de format_to_markdown")
182
+ print("speaker_names reçu :", speaker_names)
183
+ print("num_speakers reçu :", num_speakers)
184
+
185
  metadata = {
186
  "Date de traitement": datetime.now().strftime('%d/%m/%Y %H:%M'),
187
  "Durée de l'audio": f"{audio_duration}" if audio_duration else "[à remplir]",
 
203
  elif isinstance(row, (list, tuple)) and len(row) == 2:
204
  custom_names[row[0]] = row[1]
205
 
206
+ print("custom_names créé :", custom_names)
207
+
208
  metadata_text = "\n".join([f"- **{key}** : '{value}'" for key, value in metadata.items()])
209
 
210
  try:
211
  if isinstance(speaker_transcription, str):
212
  speaker_transcription = parse_simplified_diarization(speaker_transcription)
213
 
214
+ print("speaker_transcription après parsing :", speaker_transcription)
215
+
216
  formatted_transcription = []
217
  for speaker, text in speaker_transcription:
218
  custom_name = custom_names.get(speaker, speaker)
219
+ print(f"Utilisation du nom : {custom_name} pour le speaker : {speaker}")
220
  formatted_transcription.append(f"**{custom_name}**: {text}")
221
  transcription_text = "\n\n".join(formatted_transcription)
222
  except Exception as e:
 
232
  ## Transcription
233
  {transcription_text}
234
  """
235
+ print("Fin de format_to_markdown")
236
  return formatted_output
237
 
238
  def _return_yt_html_embed(yt_url):