# backend/routes/interview_api.py
import os
import uuid
import json
import logging
from flask import Blueprint, request, jsonify, send_file, url_for, current_app
from flask_login import login_required, current_user
from backend.models.database import db, Job, Application
from backend.services.interview_engine import (
generate_first_question,
generate_next_question,
edge_tts_to_file_sync,
whisper_stt,
evaluate_answer
)
# Additional imports for report generation
from backend.models.database import Application
from backend.services.report_generator import generate_llm_interview_report, create_pdf_report
from flask import abort
interview_api = Blueprint("interview_api", __name__)
@interview_api.route("/start_interview", methods=["POST"])
@login_required
def start_interview():
    """Start a new interview for the current user.

    Expects a JSON body containing ``job_id``. Generates the first
    question from the candidate's stored profile and the selected job,
    and attempts (best-effort) a TTS audio rendition of that question.

    Returns:
        JSON with ``question`` and ``audio_url`` (``None`` when TTS
        generation fails), or an ``error`` payload with status 400/500.
    """
    try:
        data = request.get_json() or {}
        job_id = data.get("job_id")
        # Reject a missing job_id up front; previously it fell through to
        # Job.query.get_or_404(None) and produced a misleading 404.
        if job_id is None:
            return jsonify({"error": "job_id is required."}), 400
        # Validate the job and the user's application
        job = Job.query.get_or_404(job_id)
        application = Application.query.filter_by(
            user_id=current_user.id,
            job_id=job_id
        ).first()
        if not application or not application.extracted_features:
            return jsonify({"error": "No application/profile data found."}), 400
        # Parse the candidate's profile (stored as a JSON string column).
        try:
            profile = json.loads(application.extracted_features)
        except Exception as e:
            logging.error(f"Invalid profile JSON: {e}")
            return jsonify({"error": "Invalid profile JSON"}), 500
        # Generate the first question using the LLM; fall back to a
        # generic opener when generation yields nothing.
        question = generate_first_question(profile, job)
        if not question:
            question = "Tell me about yourself and why you're interested in this position."
        # Best-effort TTS: a failure here must not break the interview,
        # so the question is still returned with audio_url == None.
        audio_url = None
        try:
            audio_dir = "/tmp/audio"
            os.makedirs(audio_dir, exist_ok=True)
            filename = f"q_{uuid.uuid4().hex}.wav"
            audio_path = os.path.join(audio_dir, filename)
            audio_result = edge_tts_to_file_sync(question, audio_path)
            # Files under ~1 KB are treated as silent/corrupt TTS output.
            if audio_result and os.path.exists(audio_path) and os.path.getsize(audio_path) > 1000:
                audio_url = url_for("interview_api.get_audio", filename=filename)
                logging.info(f"Audio generated successfully: {audio_url}")
            else:
                logging.warning("Audio generation failed or file too small")
        except Exception as e:
            logging.error(f"Error generating TTS audio: {e}")
            audio_url = None
        return jsonify({
            "question": question,
            "audio_url": audio_url
        })
    except Exception as e:
        logging.error(f"Error in start_interview: {e}")
        return jsonify({"error": "Internal server error"}), 500
import subprocess
@interview_api.route("/transcribe_audio", methods=["POST"])
@login_required
def transcribe_audio():
    """Transcribe an uploaded .webm recording.

    The upload is converted to WAV with ffmpeg and transcribed with
    Faster-Whisper (``whisper_stt``). Temporary files are removed even
    when conversion or transcription fails.

    Returns:
        JSON with ``transcript`` on success, or an ``error`` payload
        with status 400/500.
    """
    audio_file = request.files.get("audio")
    if not audio_file:
        return jsonify({"error": "No audio file received."}), 400
    temp_dir = "/tmp/interview_temp"
    os.makedirs(temp_dir, exist_ok=True)
    original_path = os.path.join(temp_dir, f"user_audio_{uuid.uuid4().hex}.webm")
    wav_path = original_path.replace(".webm", ".wav")
    audio_file.save(original_path)
    try:
        # check=True surfaces ffmpeg failures; previously a non-zero exit
        # status was ignored and a missing WAV was passed to the transcriber.
        try:
            subprocess.run(
                ["ffmpeg", "-y", "-i", original_path, wav_path],
                stdout=subprocess.DEVNULL,
                stderr=subprocess.DEVNULL,
                check=True
            )
        except Exception as e:
            logging.error(f"FFmpeg conversion failed: {e}")
            return jsonify({"error": "Failed to convert audio"}), 500
        transcript = whisper_stt(wav_path)
    finally:
        # Best-effort cleanup of both temp files, even on early return.
        for path in (original_path, wav_path):
            try:
                os.remove(path)
            except OSError:
                pass
    if not transcript or not transcript.strip():
        return jsonify({"error": "No speech detected in audio. Please try again."}), 400
    return jsonify({"transcript": transcript})
# ----------------------------------------------------------------------------
# Interview report download
#
# Recruiters can download a PDF summarising a candidate's interview performance.
# This route performs several checks: it verifies that the current user has
# recruiter or admin privileges, ensures that the requested application exists
# and belongs to one of the recruiter's jobs, generates a textual report via
# the ``generate_llm_interview_report`` helper, converts it into a PDF, and
# finally sends the PDF as a file attachment. The heavy lifting is
# encapsulated in ``services/report_generator.py`` to keep this route
# lightweight.
@interview_api.route('/download_report/<int:application_id>', methods=['GET'])
@login_required
def download_report(application_id: int):
    """Generate and return a PDF report for a candidate's interview.

    ``application_id`` identifies the Application record representing a
    candidate's job application. Only recruiters (or admins) associated
    with the job are permitted to download the report.
    """
    application = Application.query.get_or_404(application_id)
    # Only recruiters and admins may ever access reports.
    role = current_user.role
    if role not in ('recruiter', 'admin'):
        return abort(403)
    # The application must be attached to an existing job.
    job = getattr(application, 'job', None)
    if job is None:
        return abort(404)
    # A plain recruiter must additionally own the job in question.
    if role != 'admin' and job.recruiter_id != current_user.id:
        return abort(403)
    try:
        # Build the textual report, render it to a PDF buffer and stream
        # it back. The heavy lifting (LLM report text + matplotlib-based
        # PDF rendering) lives in services/report_generator.py.
        report_text = generate_llm_interview_report(application)
        pdf_buffer = create_pdf_report(report_text)
        pdf_buffer.seek(0)
        safe_name = application.name.replace(' ', '_')
        return send_file(
            pdf_buffer,
            download_name=f"{safe_name}_interview_report.pdf",
            as_attachment=True,
            mimetype='application/pdf'
        )
    except Exception as exc:
        # Log the error for debugging; return a 500 to the client.
        logging.error(f"Error generating report for application {application_id}: {exc}")
        return jsonify({"error": "Failed to generate report"}), 500
def _persist_interview_log(job_id, question, answer, evaluation):
    """Best-effort: append one Q&A/evaluation entry to the user's interview_log."""
    try:
        application = Application.query.filter_by(
            user_id=current_user.id,
            job_id=job_id
        ).first()
        if not application:
            return
        log_data = []
        if application.interview_log:
            try:
                log_data = json.loads(application.interview_log)
            except Exception:
                # A corrupt log is discarded rather than blocking the answer.
                log_data = []
        log_data.append({
            "question": question,
            "answer": answer,
            "evaluation": evaluation
        })
        application.interview_log = json.dumps(log_data, ensure_ascii=False)
        db.session.commit()
    except Exception as log_err:
        logging.error(f"Error saving interview log: {log_err}")


def _total_questions_for(job_id, default=4):
    """Return the number of questions configured for a job, or *default*."""
    if job_id is None:
        return default
    try:
        job = Job.query.get(int(job_id))
        if job and job.num_questions and job.num_questions > 0:
            return job.num_questions
    except Exception:
        # If the lookup fails, keep the default.
        pass
    return default


def _question_audio_url(question_text):
    """Best-effort TTS for *question_text*; return a servable URL or None."""
    try:
        audio_dir = "/tmp/audio"
        os.makedirs(audio_dir, exist_ok=True)
        filename = f"q_{uuid.uuid4().hex}.wav"
        audio_path = os.path.join(audio_dir, filename)
        audio_result = edge_tts_to_file_sync(question_text, audio_path)
        # Files under ~1 KB are treated as silent/corrupt TTS output.
        if audio_result and os.path.exists(audio_path) and os.path.getsize(audio_path) > 1000:
            audio_url = url_for("interview_api.get_audio", filename=filename)
            logging.info(f"Next question audio generated: {audio_url}")
            return audio_url
    except Exception as e:
        logging.error(f"Error generating next question audio: {e}")
    return None


@interview_api.route("/process_answer", methods=["POST"])
@login_required
def process_answer():
    """
    Process a user's answer and return a follow-up question along with an
    evaluation. Always responds with JSON.

    Expects JSON fields: ``answer`` (required), ``questionIndex``,
    ``job_id``, ``current_question`` and ``conversation_history``.
    """
    try:
        data = request.get_json() or {}
        answer = data.get("answer", "").strip()
        question_idx = data.get("questionIndex", 0)
        # ``job_id`` is required to determine how many total questions are
        # expected for this interview. Without it we fall back to a
        # four-question interview (the _total_questions_for default).
        job_id = data.get("job_id")
        if not answer:
            return jsonify({"error": "No answer provided."}), 400
        # Get the current question for evaluation context.
        current_question = data.get("current_question", "Tell me about yourself")
        # Evaluate the answer, then persist the Q&A pair for reporting.
        evaluation_result = evaluate_answer(current_question, answer)
        _persist_interview_log(job_id, current_question, answer, evaluation_result)
        total_questions = _total_questions_for(job_id)
        # Check completion. ``question_idx`` is zero-based; the last index
        # corresponds to ``total_questions - 1``. When the current index
        # reaches or exceeds this value, the interview is complete.
        is_complete = question_idx >= (total_questions - 1)
        next_question_text = None
        audio_url = None
        if not is_complete:
            next_idx = question_idx + 1
            if next_idx == (total_questions - 1):
                # The final slot is always the fixed closing question.
                next_question_text = (
                    "What are your salary expectations? Are you looking for a full-time or part-time role, "
                    "and do you prefer remote or on-site work?"
                )
            else:
                # Generate a follow-up question with Qdrant/LLM context
                # (candidate profile + job + conversation so far).
                try:
                    job = Job.query.get(int(job_id)) if job_id else None
                    application = Application.query.filter_by(
                        user_id=current_user.id,
                        job_id=job_id
                    ).first()
                    profile = {}
                    if application and application.extracted_features:
                        profile = json.loads(application.extracted_features)
                    conversation_history = data.get("conversation_history", [])
                    next_question_text = generate_next_question(
                        profile,
                        job,
                        conversation_history,
                        answer
                    )
                except Exception as e:
                    logging.error(f"Error generating next question from Qdrant: {e}")
                    next_question_text = "Could you elaborate more on your last point?"
            audio_url = _question_audio_url(next_question_text)
        return jsonify({
            "success": True,
            "next_question": next_question_text,
            "audio_url": audio_url,
            "evaluation": evaluation_result,
            "is_complete": is_complete,
            "redirect_url": url_for("interview_api.interview_complete") if is_complete else None
        })
    except Exception as e:
        logging.error(f"Error in process_answer: {e}")
        return jsonify({"error": "Error processing answer. Please try again."}), 500
@interview_api.route("/audio/<string:filename>", methods=["GET"])
@login_required
def get_audio(filename: str):
    """Serve previously generated TTS audio from the /tmp/audio directory.

    Returns the WAV file with range-request support, or a JSON error
    with status 400/404/500.
    """
    try:
        # Sanitize filename to prevent directory traversal.
        safe_name = os.path.basename(filename)
        if not safe_name.endswith('.wav'):
            return jsonify({"error": "Invalid audio file format."}), 400
        audio_path = os.path.join("/tmp/audio", safe_name)
        if not os.path.exists(audio_path):
            logging.warning(f"Audio file not found: {audio_path}")
            return jsonify({"error": "Audio file not found."}), 404
        if os.path.getsize(audio_path) == 0:
            logging.warning(f"Audio file is empty: {audio_path}")
            return jsonify({"error": "Audio file is empty."}), 404
        return send_file(
            audio_path,
            mimetype="audio/wav",
            as_attachment=False,
            conditional=True  # Enable range requests for better audio streaming
        )
    except Exception as e:
        # Include the requested filename (the old message logged the
        # literal placeholder "(unknown)", making failures undebuggable).
        logging.error(f"Error serving audio file {filename}: {e}")
        return jsonify({"error": "Error serving audio file."}), 500
from flask import render_template
def _rating_to_score(score_text):
    """Map a textual/numeric evaluation rating to a value in [0.2, 1.0].

    Matching is substring based (mirroring the PDF report generation):
    e.g. any rating string containing "excellent", "5" or "10" maps to
    1.0. NOTE(review): substring matching is intentionally loose — a
    rating like "15" or "0.5" would also match; preserved as-is to stay
    consistent with the report generator.
    """
    text = str(score_text).lower()
    if ('excellent' in text) or ('5' in text) or ('10' in text):
        return 1.0
    if ('good' in text) or ('4' in text) or ('8' in text) or ('9' in text):
        return 0.8
    if ('satisfactory' in text) or ('medium' in text) or ('3' in text) or ('6' in text) or ('7' in text):
        return 0.6
    if ('needs improvement' in text) or ('poor' in text) or ('2' in text):
        return 0.4
    return 0.2


@interview_api.route("/interview/complete", methods=["GET"])
@login_required
def interview_complete():
    """
    Final interview completion page.

    Shows the candidate a percentage score and a high-level label
    ("Excellent", "Good", ...). The calculation mirrors the PDF report:
    the skills-match ratio contributes 40% of the final score and the
    average per-question evaluation rating contributes 60%. If no
    evaluation data is available, a neutral average of 0.5 is used.
    When anything fails, the template renders with None placeholders.
    """
    score = None
    feedback_summary = None
    try:
        # The completion route receives no job ID, so use the most recent
        # application for this user that actually has an interview_log.
        application = (
            Application.query
            .filter_by(user_id=current_user.id)
            .filter(Application.interview_log.isnot(None))
            .order_by(Application.id.desc())
            .first()
        )
        if application:
            # Candidate skills from the stored profile JSON; malformed or
            # missing data degrades to an empty list.
            try:
                candidate_features = json.loads(application.extracted_features) if application.extracted_features else {}
            except Exception:
                candidate_features = {}
            candidate_skills = candidate_features.get('skills', []) or []
            # Job skills from the related job record, same degradation.
            try:
                job_skills = json.loads(application.job.skills) if application.job and application.job.skills else []
            except Exception:
                job_skills = []
            # Skills-match ratio: case/whitespace-normalised overlap over
            # the job's skill set; 0.0 when the job lists no skills.
            candidate_set = {s.strip().lower() for s in candidate_skills}
            job_set = {s.strip().lower() for s in job_skills}
            ratio = (len(candidate_set & job_set) / len(job_set)) if job_set else 0.0
            # Per-question scores from the interview_log entries, each a
            # dict with "question"/"answer"/"evaluation" keys.
            qa_scores = []
            try:
                if application.interview_log:
                    try:
                        log_data = json.loads(application.interview_log)
                    except Exception:
                        log_data = []
                    for entry in log_data:
                        rating = entry.get('evaluation', {}).get('score', '')
                        qa_scores.append(_rating_to_score(rating))
            except Exception:
                qa_scores = []
            # Neutral 0.5 average when no scores exist, to avoid
            # penalising the candidate for missing data.
            qa_average = (sum(qa_scores) / len(qa_scores)) if qa_scores else 0.5
            # Weighted blend: skills match 40%, QA average 60%.
            overall = (ratio * 0.4) + (qa_average * 0.6)
            if overall >= 0.8:
                label = 'Excellent'
            elif overall >= 0.65:
                label = 'Good'
            elif overall >= 0.45:
                label = 'Satisfactory'
            else:
                label = 'Needs Improvement'
            # Whole-number percentage, e.g. 0.753 -> "75%".
            score = f"{overall * 100.0:.0f}%"
            feedback_summary = label
    except Exception as calc_err:
        # Fall back to None placeholders on any calculation error.
        logging.error(f"Error computing overall interview score: {calc_err}")
    return render_template(
        "closing.html",
        score=score,
        feedback_summary=feedback_summary
    )