bluenevus commited on
Commit
b5dd7e3
·
verified ·
1 Parent(s): ad0756f

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -1
app.py CHANGED
@@ -87,7 +87,8 @@ def chunk_audio(audio_segment, chunk_size_ms=60000):
87
 
88
  def transcribe_audio_chunks(chunks):
89
  transcriptions = []
90
- for chunk in chunks:
 
91
  with tempfile.NamedTemporaryFile(suffix='.wav', delete=False) as temp_audio_file:
92
  chunk.export(temp_audio_file.name, format="wav")
93
  with open(temp_audio_file.name, 'rb') as audio_file:
@@ -204,9 +205,13 @@ def process_media(file_path, is_url=False):
204
  audio = AudioSegment.from_wav(wav_path)
205
  chunks = chunk_audio(audio)
206
 
 
 
207
  # Transcribe chunks
208
  transcription = transcribe_audio_chunks(chunks)
209
 
 
 
210
  # Diarization using OpenAI
211
  diarization_prompt = f"""
212
  The following is a transcription of a conversation. Please identify different speakers and label them as Speaker 1, Speaker 2, etc. Format the output as a series of speaker labels followed by their dialogue. Here's the transcription:
 
87
 
88
  def transcribe_audio_chunks(chunks):
89
  transcriptions = []
90
+ for i, chunk in enumerate(chunks):
91
+ logger.info(f"Transcribing chunk {i+1}/{len(chunks)}")
92
  with tempfile.NamedTemporaryFile(suffix='.wav', delete=False) as temp_audio_file:
93
  chunk.export(temp_audio_file.name, format="wav")
94
  with open(temp_audio_file.name, 'rb') as audio_file:
 
205
  audio = AudioSegment.from_wav(wav_path)
206
  chunks = chunk_audio(audio)
207
 
208
+ logger.info(f"Audio chunked into {len(chunks)} segments")
209
+
210
  # Transcribe chunks
211
  transcription = transcribe_audio_chunks(chunks)
212
 
213
+ logger.info(f"Transcription completed. Total length: {len(transcription)} characters")
214
+
215
  # Diarization using OpenAI
216
  diarization_prompt = f"""
217
  The following is a transcription of a conversation. Please identify different speakers and label them as Speaker 1, Speaker 2, etc. Format the output as a series of speaker labels followed by their dialogue. Here's the transcription: