"""Gradio demo that shows a fixed, two-speaker dialogue for any recording.

No real speech diarization is performed: the audio captured from the
microphone is ignored and a hard-coded transcript is returned so the
``gr.Dialogue`` output component can be exercised without a model.
"""

import gradio as gr

# Speaker labels offered by the Dialogue component.
speakers = [
    "Speaker 1",
    "Speaker 2",
]


def format_speaker(speaker: str, text: str) -> str:
    """Return one dialogue line rendered as ``"<speaker>: <text>"``."""
    return f"{speaker}: {text}"


def mock_diarization(audio: object) -> list[dict[str, str]]:
    """Return a canned transcript, ignoring the supplied audio.

    Args:
        audio: Value delivered by the ``gr.Audio`` input. It is never read.

    Returns:
        A new list of dialogue lines, each a dict with ``"speaker"`` and
        ``"text"`` keys, alternating between the two speakers.
    """
    return [
        {
            "speaker": "Speaker 1",
            "text": "Hello, how are you?",
        },
        {
            "speaker": "Speaker 2",
            "text": "I'm fine, thank you!",
        },
        {
            "speaker": "Speaker 1",
            "text": "What's your name?",
        },
        {
            "speaker": "Speaker 2",
            "text": "My name is John Doe.",
        },
        {
            "speaker": "Speaker 1",
            "text": "Nice to meet you!",
        },
        {
            "speaker": "Speaker 2",
            "text": "Nice to meet you!",
        },
    ]


# Microphone recording in, formatted dialogue out.
demo = gr.Interface(
    fn=mock_diarization,
    inputs=[gr.Audio(sources=["microphone"])],
    outputs=[gr.Dialogue(speakers=speakers, tags=None, formatter=format_speaker)],
    title="Mock Speech Diarization",
    description="Mock speech diarization",
)

if __name__ == "__main__":
    demo.launch()