Ahmed107 committed on
Commit
c796c98
1 Parent(s): d2828e6

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +11 -1
app.py CHANGED
@@ -87,7 +87,17 @@ def speaker_diarization():
87
  for turn, _, speaker in diarization.itertracks(yield_label=True):
88
  df = df.append({'start': turn.start, 'stop': turn.end, 'speaker': speaker}, ignore_index=True)
89
 
90
- df.to_csv('result.csv', index=False)
 
 
 
 
 
 
 
 
 
 
91
 
92
  def save_audio_chunks(data_path, new_df):
93
  # load the audio file
 
87
  for turn, _, speaker in diarization.itertracks(yield_label=True):
88
  df = df.append({'start': turn.start, 'stop': turn.end, 'speaker': speaker}, ignore_index=True)
89
 
90
+ # if the speaker is the same for 2 rows or more then merge them
91
+ new_df = pd.DataFrame(columns=['start', 'stop', 'speaker'])
92
+ for i in range(len(df)):
93
+ if i == 0:
94
+ new_df = new_df.append({'start': df['start'][i], 'stop': df['stop'][i], 'speaker': df['speaker'][i]}, ignore_index=True)
95
+ else:
96
+ if df['speaker'][i] == df['speaker'][i-1]:
97
+ new_df['stop'][len(new_df)-1] = df['stop'][i]
98
+ else:
99
+ new_df = new_df.append({'start': df['start'][i], 'stop': df['stop'][i], 'speaker': df['speaker'][i]}, ignore_index=True)
100
+ new_df.to_csv('result.csv', index=False)
101
 
102
  def save_audio_chunks(data_path, new_df):
103
  # load the audio file