Spaces:

UcsTurkey
/

flare

Paused

App Files Files Community

ciyidogan committed on Jul 8

Commit

15d3e9a

verified ·

1 Parent(s): b47c34d

Update stt/stt_deepgram.py

Browse files

Files changed (1) hide show

stt/stt_deepgram.py +49 -35

stt/stt_deepgram.py CHANGED Viewed

@@ -110,11 +110,12 @@ class DeepgramSTT(STTInterface):
             options = LiveOptions(
                 language="tr",
                 model="nova-2",
-                encoding="opus",
                 sample_rate=16000,
-                interim_results=True,  # ✅ Enable interim results
-                utterance_end_ms=1000,  # 1 second silence
                 punctuate=True,
             )
             log_info(f"🔧 Deepgram options: language=tr, model=nova-2, encoding=opus, interim_results=True")
@@ -167,44 +168,57 @@ class DeepgramSTT(STTInterface):
             return
         # Results handler - handles transcription results
-        def on_transcript(self, result, **kwargs):
             try:
-                log_info(f"📝 Deepgram Transcript event received")
-                # Extract transcription
-                channel = result.get("channel", {})
-                alternatives = channel.get("alternatives", [])
-                if alternatives and len(alternatives) > 0:
-                    transcript = alternatives[0].get("transcript", "")
-                    confidence = alternatives[0].get("confidence", 0.0)
-                    is_final = result.get("is_final", False)
-                    log_info(f"📝 Transcript: '{transcript}' (is_final: {is_final}, confidence: {confidence})")
-                    # Process both interim and final results for debugging
-                    if transcript.strip():  # Only process non-empty transcripts
-                        transcription_result = TranscriptionResult(
-                            text=transcript,
-                            is_final=is_final,
-                            confidence=confidence,
-                            timestamp=datetime.now().timestamp()
-                        )
-                        # Queue result
-                        try:
-                            self.responses_queue.put(transcription_result)
-                            if is_final:
-                                self.final_result_received = True
-                                log_info(f"🎯 FINAL RESULT queued: '{transcript}'")
-                            else:
-                                log_debug(f"📝 Interim result: '{transcript}'")
-                        except queue.Full:
-                            log_warning("⚠️ Response queue full")
             except Exception as e:
-                log_error(f"❌ Error in Transcript handler: {e}")
-                log_error(f"❌ Result data: {result}")
         # Speech started handler
         def on_speech_started(self, speech_started, **kwargs):

             options = LiveOptions(
                 language="tr",
                 model="nova-2",
+                encoding="linear16",  # ✅ Change from opus to linear16
                 sample_rate=16000,
+                interim_results=True,
+                utterance_end_ms=1000,
                 punctuate=True,
+                channels=1,
             )
             log_info(f"🔧 Deepgram options: language=tr, model=nova-2, encoding=opus, interim_results=True")
             return
         # Results handler - handles transcription results
+        def _on_transcript(self, *args, **kwargs):
+            """Handle transcript event - SDK calls this method directly"""
             try:
+                # SDK passes the result as second argument
+                result = args[1] if len(args) > 1 else kwargs.get("result")
+                if not result:
+                    log_warning("⚠️ No result in transcript event")
+                    return
+                # Access properties directly from the result object
+                is_final = result.is_final
+                # Get transcript from channel alternatives
+                if hasattr(result, 'channel') and result.channel:
+                    alternatives = result.channel.alternatives
+                    if alternatives and len(alternatives) > 0:
+                        transcript = alternatives[0].transcript
+                        confidence = alternatives[0].confidence
+                        # Log all transcripts for debugging
+                        log_debug(f"📝 Raw transcript: '{transcript}' (is_final: {is_final}, confidence: {confidence})")
+                        if transcript and transcript.strip():  # Only process non-empty transcripts
+                            transcription_result = TranscriptionResult(
+                                text=transcript,
+                                is_final=is_final,
+                                confidence=confidence,
+                                timestamp=datetime.now().timestamp()
+                            )
+                            # Queue result
+                            try:
+                                self.responses_queue.put(transcription_result)
+                                if is_final:
+                                    self.final_result_received = True
+                                    log_info(f"🎯 FINAL TRANSCRIPT: '{transcript}' (confidence: {confidence:.2f})")
+                                else:
+                                    log_info(f"📝 Interim transcript: '{transcript}'")
+                            except queue.Full:
+                                log_warning("⚠️ Response queue full")
+                        else:
+                            if is_final:
+                                log_warning(f"⚠️ Empty final transcript received")
             except Exception as e:
+                log_error(f"❌ Error processing transcript: {e}")
+                log_error(f"❌ Args: {args}")
+                log_error(f"❌ Kwargs: {kwargs}")
+                import traceback
+                log_error(f"❌ Traceback: {traceback.format_exc()}")
         # Speech started handler
         def on_speech_started(self, speech_started, **kwargs):