Spaces:

husseinelsaadi
/

Codingo

Paused

App Files Community

husseinelsaadi committed on Jul 27

Commit

330157f

1 Parent(s): 308d699

audio updated

Browse files

Files changed (2) hide show

backend/routes/interview_api.py +37 -53
backend/templates/interview.html +2 -1

backend/routes/interview_api.py CHANGED Viewed

@@ -77,64 +77,48 @@ def start_interview():
         logging.error(f"Error in start_interview: {e}")
         return jsonify({"error": "Internal server error"}), 500
 @interview_api.route("/transcribe_audio", methods=["POST"])
 @login_required
 def transcribe_audio():
-    """Transcribe uploaded audio with better error handling"""
     try:
-        audio_file = request.files.get("audio")
-        if not audio_file:
-            return jsonify({"error": "No audio file received."}), 400
-        # Check if file has content
-        audio_file.seek(0, 2)  # Seek to end
-        file_size = audio_file.tell()
-        audio_file.seek(0)  # Seek back to start
-        if file_size == 0:
-            logging.error("Received empty audio file")
-            return jsonify({"error": "Empty audio file received."}), 400
-        logging.info(f"Received audio file: {file_size} bytes")
-        # Use /tmp directory which is writable in Hugging Face Spaces
-        temp_dir = "/tmp/interview_temp"
-        os.makedirs(temp_dir, exist_ok=True)
-        # Keep original extension for better compatibility
-        original_filename = audio_file.filename or "recording.webm"
-        file_extension = os.path.splitext(original_filename)[1] or ".webm"
-        filename = f"user_audio_{uuid.uuid4().hex}{file_extension}"
-        path = os.path.join(temp_dir, filename)
-        # Save the file
-        audio_file.save(path)
-        # Verify file was saved
-        if not os.path.exists(path) or os.path.getsize(path) == 0:
-            logging.error(f"Failed to save audio file or file is empty: {path}")
-            return jsonify({"error": "Failed to save audio file."}), 500
-        logging.info(f"Audio file saved: {path} ({os.path.getsize(path)} bytes)")
-        # Transcribe the audio
-        transcript = whisper_stt(path)
-        # Clean up
-        try:
-            os.remove(path)
-        except Exception as e:
-            logging.warning(f"Could not remove temp file {path}: {e}")
-        if not transcript or not transcript.strip():
-            return jsonify({"error": "No speech detected in audio. Please try again."}), 400
-        return jsonify({"transcript": transcript})
     except Exception as e:
-        logging.error(f"Error in transcribe_audio: {e}")
-        return jsonify({"error": "Error processing audio. Please try again."}), 500
 @interview_api.route("/process_answer", methods=["POST"])
 @login_required

         logging.error(f"Error in start_interview: {e}")
         return jsonify({"error": "Internal server error"}), 500
+import subprocess
 @interview_api.route("/transcribe_audio", methods=["POST"])
 @login_required
 def transcribe_audio():
+    """Transcribe uploaded .webm audio using ffmpeg conversion and Faster-Whisper"""
+    audio_file = request.files.get("audio")
+    if not audio_file:
+        return jsonify({"error": "No audio file received."}), 400
+    temp_dir = "/tmp/interview_temp"
+    os.makedirs(temp_dir, exist_ok=True)
+    original_path = os.path.join(temp_dir, f"user_audio_{uuid.uuid4().hex}.webm")
+    wav_path = original_path.replace(".webm", ".wav")
+    audio_file.save(original_path)
+    # Convert to WAV using ffmpeg
     try:
+        subprocess.run(
+            ["ffmpeg", "-y", "-i", original_path, wav_path],
+            stdout=subprocess.DEVNULL,
+            stderr=subprocess.DEVNULL
+        )
     except Exception as e:
+        logging.error(f"FFmpeg conversion failed: {e}")
+        return jsonify({"error": "Failed to convert audio"}), 500
+    # Transcribe
+    transcript = whisper_stt(wav_path)
+    # Cleanup
+    try:
+        os.remove(original_path)
+        os.remove(wav_path)
+    except:
+        pass
+    if not transcript or not transcript.strip():
+        return jsonify({"error": "No speech detected in audio. Please try again."}), 400
+    return jsonify({"transcript": transcript})
 @interview_api.route("/process_answer", methods=["POST"])
 @login_required

backend/templates/interview.html CHANGED Viewed

@@ -757,7 +757,8 @@
                     console.log('Processing', this.audioChunks.length, 'audio chunks');
                     // Create blob from audio chunks
-                    const audioBlob = new Blob(this.audioChunks, { type: 'audio/webm' });
                     console.log('Created audio blob:', audioBlob.size, 'bytes');
                     if (audioBlob.size === 0) {

                     console.log('Processing', this.audioChunks.length, 'audio chunks');
                     // Create blob from audio chunks
+                    const audioBlob = new Blob(this.audioChunks, { type: 'audio/webm;codecs=opus' });
                     console.log('Created audio blob:', audioBlob.size, 'bytes');
                     if (audioBlob.size === 0) {