import gradio as gr | |
speakers = [ | |
"Speaker 1", | |
"Speaker 2", | |
] | |
def format_speaker(speaker, text): | |
return f"{speaker}: {text}" | |
def mock_diarization(audio): | |
return [ | |
{ | |
"speaker": "Speaker 1", | |
"text": "Hello, how are you?", | |
}, | |
{ | |
"speaker": "Speaker 2", | |
"text": "I'm fine, thank you!", | |
}, | |
{ | |
"speaker": "Speaker 1", | |
"text": "What's your name?", | |
}, | |
{ | |
"speaker": "Speaker 2", | |
"text": "My name is John Doe.", | |
}, | |
{ | |
"speaker": "Speaker 1", | |
"text": "Nice to meet you!", | |
}, | |
{ | |
"speaker": "Speaker 2", | |
"text": "Nice to meet you!", | |
}, | |
] | |
demo = gr.Interface( | |
fn=mock_diarization, | |
inputs=[gr.Audio(sources=["microphone"])], | |
outputs=[gr.Dialogue(speakers=speakers, tags=None, formatter=format_speaker)], | |
title="Mock Speech Diarization", | |
description="Mock speech diarization", | |
) | |
if __name__ == "__main__": | |
demo.launch() | |