husseinelsaadi committed
Commit 2ae57cb · 1 Parent(s): d8acd61

Initial commit for Hugging Face Space
.huggingface/spaces.yml ADDED
@@ -0,0 +1,4 @@
+sdk: static
+app_file: app.py
+python_version: "3.10"
+hardware: gpu
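For reference, Hugging Face Spaces normally reads this kind of configuration from the YAML front matter of the Space's README.md, and `sdk: static` declares a plain HTML Space, which would not execute `app_file: app.py`; whether a `.huggingface/spaces.yml` file and a `hardware` key are honored at all is worth verifying against the current Spaces docs. A quick local sanity check of the file (assumes PyYAML is installed):

    import yaml  # assumes PyYAML is available

    with open(".huggingface/spaces.yml") as f:
        cfg = yaml.safe_load(f)

    # 'static' Spaces serve HTML only; a Python app_file looks inconsistent here
    assert cfg["sdk"] in {"gradio", "streamlit", "docker", "static"}, cfg["sdk"]
    if cfg["sdk"] == "static" and str(cfg.get("app_file", "")).endswith(".py"):
        print(f"warning: a static Space will not run {cfg['app_file']}")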
.venv/bin/huggingface-cli ADDED
@@ -0,0 +1,10 @@
+#!/bin/sh
+'''exec' "/Users/husseinelsaadi/Documents/Data Science USAL/Spring 24-25/FYP - Codingo/Codingo/.venv/bin/python3.12" "$0" "$@"
+' '''
+# -*- coding: utf-8 -*-
+import re
+import sys
+from huggingface_hub.commands.huggingface_cli import main
+if __name__ == '__main__':
+    sys.argv[0] = re.sub(r'(-script\.pyw|\.exe)?$', '', sys.argv[0])
+    sys.exit(main())
.venv/bin/tiny-agents ADDED
@@ -0,0 +1,10 @@
+#!/bin/sh
+'''exec' "/Users/husseinelsaadi/Documents/Data Science USAL/Spring 24-25/FYP - Codingo/Codingo/.venv/bin/python3.12" "$0" "$@"
+' '''
+# -*- coding: utf-8 -*-
+import re
+import sys
+from huggingface_hub.inference._mcp.cli import app
+if __name__ == '__main__':
+    sys.argv[0] = re.sub(r'(-script\.pyw|\.exe)?$', '', sys.argv[0])
+    sys.exit(app())
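Both generated launchers rely on the standard sh/Python polyglot that pip writes for console scripts: sh parses `'''exec'` as the single word `exec` (two concatenated quoted strings) and replaces itself with the venv's interpreter running this same file, while Python sees lines 2-3 as one harmless triple-quoted string and continues with the real code. A minimal sketch of the same trick with a generic interpreter path:

    #!/bin/sh
    '''exec' "/usr/bin/env" "python3" "$0" "$@"
    ' '''
    # Only Python ever reaches this point; sh has already exec'd away.
    import sys
    print("running under", sys.executable)

Note also that these launchers hard-code an absolute macOS path, so they only work on the machine that created the venv; committing `.venv/` into a Space repository is usually unintentional.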
backend/app.py CHANGED
@@ -6,6 +6,9 @@ import sys
 import json
 from datetime import datetime
 
+from backend.routes.interview_api import interview_api
+app.register_blueprint(interview_api, url_prefix="/api")
+
 # Adjust sys.path for import flexibility
 current_dir = os.path.dirname(os.path.abspath(__file__))
 parent_dir = os.path.dirname(current_dir)
@@ -20,6 +23,7 @@ app.config['SQLALCHEMY_TRACK_MODIFICATIONS'] = False
 
 # Import and initialize DB
 from backend.models.database import db, Job, Application, init_db
+
 init_db(app)
 
 # Import models/routes AFTER initializing the DB
@@ -42,10 +46,12 @@ login_manager = LoginManager()
 login_manager.login_view = 'auth.login'
 login_manager.init_app(app)
 
+
 @login_manager.user_loader
 def load_user(user_id):
     return db.session.get(User, int(user_id))
 
+
 # Register auth blueprint
 app.register_blueprint(auth_bp)
 
@@ -73,41 +79,44 @@ def handle_resume_upload(file):
         return None, str(e), None
 
 
+
 # Routes
 @app.route('/')
 def index():
     return render_template('index.html')
 
+
 @app.route('/jobs')
 def jobs():
     all_jobs = Job.query.order_by(Job.date_posted.desc()).all()
     return render_template('jobs.html', jobs=all_jobs)
 
+
 @app.route('/job/<int:job_id>')
 def job_detail(job_id):
     job = Job.query.get_or_404(job_id)
     return render_template('job_detail.html', job=job)
 
+
 @app.route('/apply/<int:job_id>', methods=['GET', 'POST'])
 @login_required
 def apply(job_id):
     job = Job.query.get_or_404(job_id)
-    form = JobApplicationForm()
-    form.job_id.data = job_id
 
-    if form.validate_on_submit():
-        resume_file = form.resume.data
+    if request.method == 'POST':
+        file = request.files.get('resume')
+        features, error, _ = handle_resume_upload(file)
 
-        features, error, filename = handle_resume_upload(resume_file)
-        features_json = json.dumps(features or {})
+        if error or not features:
+            flash("Resume parsing failed. Please try again.", "danger")
+            return render_template('apply.html', job=job)
 
         application = Application(
             job_id=job_id,
-            name=form.name.data,
-            email=form.email.data,
-            resume_path=filename,
-            cover_letter=form.cover_letter.data,
-            extracted_features=features_json
+            user_id=current_user.id,
+            name=current_user.username,
+            email=current_user.email,
+            extracted_features=json.dumps(features)
         )
 
         db.session.add(application)
@@ -116,10 +125,20 @@ def apply(job_id):
         flash('Your application has been submitted successfully!', 'success')
         return redirect(url_for('jobs'))
 
-    return render_template('apply.html', form=form, job=job)
+    return render_template('apply.html', job=job)
+
+
+@app.route('/my_applications')
+@login_required
+def my_applications():
+    """View user's applications"""
+    applications = Application.query.filter_by(user_id=current_user.id).order_by(Application.date_applied.desc()).all()
+    return render_template('my_applications.html', applications=applications)
+
 
 @app.route('/parse_resume', methods=['POST'])
 def parse_resume():
+    """API endpoint for parsing resume and returning features"""
     file = request.files.get('resume')
     features, error, _ = handle_resume_upload(file)
 
@@ -136,14 +155,28 @@ def parse_resume():
         "email": features.get('email', ''),
         "mobile_number": features.get('mobile_number', ''),
         "skills": features.get('skills', []),
-        "experience": features.get('experience', [])
+        "experience": features.get('experience', []),
+        "education": features.get('education', []),
+        "summary": features.get('summary', '')
     }
     return response, 200
 
+@app.route("/interview/<int:job_id>")
+@login_required
+def interview_page(job_id):
+    job = Job.query.get_or_404(job_id)
+    application = Application.query.filter_by(user_id=current_user.id, job_id=job_id).first()
+
+    if not application or not application.extracted_features:
+        flash("Please apply for this job and upload your resume first.", "warning")
+        return redirect(url_for('job_detail', job_id=job_id))
+
+    cv_data = json.loads(application.extracted_features)
+    return render_template("interview.html", job=job, cv=cv_data)
 
 
 if __name__ == '__main__':
     print("Starting Codingo application...")
     with app.app_context():
         db.create_all()
-    app.run(debug=True, port=5001)
+    app.run(debug=True, port=5001)
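One thing to double-check in the first hunk: `app.register_blueprint(interview_api, url_prefix="/api")` is inserted right after the imports, before the Flask `app` object is created further down the file, so as written it would raise a NameError at import time; the registration presumably belongs after the app setup. Separately, the reworked `/parse_resume` endpoint can be exercised with a plain multipart POST; a hedged sketch (assumes the dev server from `app.run` above is running, that `requests` is installed, and a local sample file):

    import requests

    with open("sample_resume.pdf", "rb") as f:  # hypothetical test file
        resp = requests.post("http://localhost:5001/parse_resume", files={"resume": f})

    print(resp.status_code)
    print(resp.json())  # expects name, email, mobile_number, skills, experience, education, summary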
backend/form/AuthForms.py CHANGED
@@ -1,7 +1,8 @@
-
 from flask_wtf import FlaskForm
-from wtforms import StringField, PasswordField, SubmitField, SelectField
-from wtforms.validators import DataRequired, Email, EqualTo
+from flask_wtf.file import FileField, FileAllowed
+from wtforms import StringField, PasswordField, SubmitField, SelectField, TextAreaField, BooleanField, RadioField
+from wtforms.validators import DataRequired, Email, EqualTo, Length, Optional
+
 
 class LoginForm(FlaskForm):
     email = StringField('Email', validators=[DataRequired(), Email()])
@@ -9,9 +10,9 @@ class LoginForm(FlaskForm):
     submit = SubmitField('Login')
 
 class SignupForm(FlaskForm):
-    username = StringField('Username', validators=[DataRequired()])
+    username = StringField('Username', validators=[DataRequired(), Length(min=3, max=20)])
     email = StringField('Email', validators=[DataRequired(), Email()])
-    password = PasswordField('Password', validators=[DataRequired()])
+    password = PasswordField('Password', validators=[DataRequired(), Length(min=6)])
     confirm_password = PasswordField('Confirm Password', validators=[DataRequired(), EqualTo('password')])
-    role = SelectField('Role', choices=[('unemployed', 'Unemployed'), ('recruiter', 'Recruiter')])
+    role = SelectField('Role', choices=[('unemployed', 'Job Seeker'), ('recruiter', 'Recruiter')], default='unemployed')
     submit = SubmitField('Sign Up')
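The tightened SignupForm rules can be checked without a browser; a minimal sketch, assuming a throwaway app with CSRF disabled just for the test:

    from flask import Flask
    from backend.form.AuthForms import SignupForm

    app = Flask(__name__)
    app.config.update(SECRET_KEY="dev", WTF_CSRF_ENABLED=False)

    with app.test_request_context(method="POST", data={
        "username": "ab",                 # violates Length(min=3)
        "email": "user@example.com",
        "password": "secret1",
        "confirm_password": "secret1",
        "role": "unemployed",
    }):
        form = SignupForm()
        print(form.validate(), form.errors)  # expect False with a username length error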
backend/instance/codingo.db CHANGED
Binary files a/backend/instance/codingo.db and b/backend/instance/codingo.db differ
 
backend/models/database.py CHANGED
@@ -4,41 +4,52 @@ Database models for the Codingo application.
 
 from flask_sqlalchemy import SQLAlchemy
 from datetime import datetime
+import json
 
 db = SQLAlchemy()
 
 class Job(db.Model):
-    """Job model representing a job posting."""
+    __tablename__ = 'jobs'
+
     id = db.Column(db.Integer, primary_key=True)
-    title = db.Column(db.String(100), nullable=False)
-    company = db.Column(db.String(100), nullable=False)
-    location = db.Column(db.String(100), nullable=False)
+    role = db.Column(db.String(100), nullable=False)
     description = db.Column(db.Text, nullable=False)
-    requirements = db.Column(db.Text, nullable=False)
+    seniority = db.Column(db.String(50), nullable=False)
+    skills = db.Column(db.Text, nullable=False)  # JSON string
+    company = db.Column(db.String(100), nullable=False)
     date_posted = db.Column(db.DateTime, default=datetime.utcnow)
 
-    # Relationships
-    applications = db.relationship('Application', backref='job', lazy=True, cascade="all, delete-orphan")
+    recruiter_id = db.Column(db.Integer, db.ForeignKey('users.id'), nullable=True)
+    recruiter = db.relationship('User', backref='posted_jobs')
 
     def __repr__(self):
-        return f"Job('{self.title}', '{self.company}')"
-
+        return f"<Job {self.role} at {self.company}>"
 
 class Application(db.Model):
-    """Application model representing a job application."""
+    __tablename__ = 'applications'
+
     id = db.Column(db.Integer, primary_key=True)
-    job_id = db.Column(db.Integer, db.ForeignKey('job.id'), nullable=False)
+    job_id = db.Column(db.Integer, db.ForeignKey('jobs.id'), nullable=False)
+    user_id = db.Column(db.Integer, db.ForeignKey('users.id'), nullable=False)
+
     name = db.Column(db.String(100), nullable=False)
     email = db.Column(db.String(100), nullable=False)
-    resume_path = db.Column(db.String(255), nullable=False)
-    cover_letter = db.Column(db.Text, nullable=False)
-    extracted_features = db.Column(db.Text, nullable=True)  # JSON string of extracted features
-    status = db.Column(db.String(50), default='applied')  # applied, reviewed, shortlisted, rejected, hired
+    resume_path = db.Column(db.String(255), nullable=True)
+    cover_letter = db.Column(db.Text, nullable=True)
+    extracted_features = db.Column(db.Text, nullable=True)
+    status = db.Column(db.String(50), default='applied')
     date_applied = db.Column(db.DateTime, default=datetime.utcnow)
 
+    user = db.relationship('User', backref='applications')
+
     def __repr__(self):
         return f"Application('{self.name}', '{self.email}', Job ID: {self.job_id})"
 
+    def get_profile_data(self):
+        try:
+            return json.loads(self.extracted_features) if self.extracted_features else {}
+        except:
+            return {}
 
 # Initialize the database
 def init_db(app):
@@ -46,36 +57,38 @@ def init_db(app):
     db.init_app(app)
 
     with app.app_context():
+        from backend.models.user import User
         db.create_all()
 
         # Add sample data if jobs table is empty
         if Job.query.count() == 0:
             sample_jobs = [
-                {
-                    'title': 'Senior Python Developer',
-                    'company': 'TechCorp',
-                    'location': 'Remote',
-                    'description': 'We are looking for an experienced Python developer to join our team. You will be responsible for developing and maintaining our backend services.',
-                    'requirements': 'Strong Python skills, experience with Flask or Django, knowledge of SQL and NoSQL databases, 5+ years of experience.'
-                },
-                {
-                    'title': 'Data Scientist',
-                    'company': 'DataInsights',
-                    'location': 'New York, NY',
-                    'description': 'Join our data science team to develop machine learning models and extract insights from large datasets.',
-                    'requirements': 'Masters or PhD in Computer Science, Statistics or related field. Experience with Python, PyTorch, and scikit-learn.'
-                },
-                {
-                    'title': 'Frontend Developer',
-                    'company': 'WebSolutions',
-                    'location': 'San Francisco, CA',
-                    'description': 'Develop responsive and user-friendly web applications with modern JavaScript frameworks.',
-                    'requirements': 'Proficiency in HTML, CSS, JavaScript, and React.js. Experience with RESTful APIs and version control systems.'
-                }
+                Job(
+                    role='Senior Python Developer',
+                    description='Experienced developer needed for backend systems.',
+                    seniority='Senior',
+                    skills=json.dumps(['Python', 'Flask', 'SQL', 'AWS']),
+                    company='TechCorp'
+                ),
+                Job(
+                    role='Data Scientist',
+                    description='ML model development and statistical analysis.',
+                    seniority='Mid',
+                    skills=json.dumps(['Python', 'scikit-learn', 'Pandas', 'Spark']),
+                    company='DataInsights'
+                ),
+                Job(
+                    role='Frontend Developer',
+                    description='Modern web frontend development with React.',
+                    seniority='Junior',
+                    skills=json.dumps(['HTML', 'CSS', 'JavaScript', 'React']),
+                    company='WebSolutions'
+                ),
             ]
 
-            for job_data in sample_jobs:
-                job = Job(**job_data)
-                db.session.add(job)
+            for job in sample_jobs:
+                db.session.add(job)
 
-            db.session.commit()
+            db.session.commit()
+            print("Sample jobs added to database.")
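Because `skills` and `extracted_features` are stored as JSON strings, the new `get_profile_data` helper centralizes the decode. A small round-trip sketch (model construction only, no session needed):

    import json
    from backend.models.database import Job, Application

    job = Job(
        role="Backend Developer",
        description="Example posting",
        seniority="Mid",
        skills=json.dumps(["Python", "Flask"]),
        company="ExampleCo",
    )
    print(json.loads(job.skills))  # ['Python', 'Flask']

    application = Application(
        job_id=1, user_id=1, name="Jane", email="jane@example.com",
        extracted_features=json.dumps({"skills": ["SQL"]}),
    )
    print(application.get_profile_data())  # {'skills': ['SQL']}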
backend/models/user.py CHANGED
@@ -1,6 +1,7 @@
 from flask_login import UserMixin
 from werkzeug.security import generate_password_hash, check_password_hash
-from backend.models.database import db  # Use shared db instance only
+from backend.models.database import db  # Use the shared db object
+
 
 class User(UserMixin, db.Model):
     __tablename__ = 'user'
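Worth flagging: the new foreign keys in backend/models/database.py point at `users.id`, while this model still declares `__tablename__ = 'user'` (singular), so `db.create_all()` would fail to resolve those references if both are left as shown. A hypothetical reconciliation, not part of this commit:

    class User(UserMixin, db.Model):
        __tablename__ = 'users'  # matches db.ForeignKey('users.id') in database.py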
backend/routes/auth.py CHANGED
@@ -1,11 +1,42 @@
-from flask import Blueprint, render_template, redirect, url_for, flash, request
-from flask_login import login_user, logout_user, login_required
+from flask import Blueprint, render_template, redirect, url_for, flash, request, jsonify
+from flask_login import login_user, logout_user, login_required, current_user
+from werkzeug.utils import secure_filename
+import os
+import json
+from datetime import datetime
+
 from backend.form.AuthForms import LoginForm, SignupForm
 from backend.models.user import User
 from backend.models.database import db
 
 auth_bp = Blueprint('auth', __name__)
 
+
+def handle_resume_upload(file):
+    """
+    Save uploaded file temporarily, extract features, then clean up.
+    Returns (features_dict, error_message, filename)
+    """
+    if not file or file.filename == '':
+        return None, "No file uploaded", None
+
+    try:
+        # Get current directory for temp folder
+        current_dir = os.path.dirname(os.path.dirname(os.path.abspath(__file__)))
+        filename = secure_filename(file.filename)
+        filepath = os.path.join(current_dir, 'temp', filename)
+        os.makedirs(os.path.dirname(filepath), exist_ok=True)
+        file.save(filepath)
+
+        features = extract_resume_features(filepath)
+        os.remove(filepath)  # Clean up after parsing
+
+        return features, None, filename
+    except Exception as e:
+        print(f"Error in handle_resume_upload: {e}")
+        return None, str(e), None
+
+
 @auth_bp.route('/login', methods=['GET', 'POST'])
 def login():
     form = LoginForm()
@@ -18,6 +49,7 @@ def login():
         flash('Invalid credentials', 'danger')
     return render_template('login.html', form=form)
 
+
 @auth_bp.route('/signup', methods=['GET', 'POST'])
 def signup():
     form = SignupForm()
@@ -34,12 +66,17 @@ def signup():
         user.set_password(form.password.data)
         db.session.add(user)
         db.session.commit()
-        flash('Account created successfully!', 'success')
-        return redirect(url_for('auth.login'))
+
+        # Log the user in and redirect to profile completion
+        login_user(user)
+        flash('Account created successfully! Welcome to Codingo.', 'success')
+        return redirect(url_for('index'))
     return render_template('signup.html', form=form)
 
+
 @auth_bp.route('/logout')
 @login_required
 def logout():
     logout_user()
-    return redirect(url_for('auth.login'))
+    flash('You have been logged out successfully.', 'info')
+    return redirect(url_for('auth.login'))
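Note that `handle_resume_upload` here calls `extract_resume_features`, which this hunk never imports, so the helper would raise NameError on first use unless the import exists elsewhere in the file. A self-contained sketch of the same save/parse/clean-up pattern, with the parser stubbed out as an explicit assumption:

    import os
    import tempfile
    from werkzeug.utils import secure_filename

    def extract_resume_features(path):
        # stand-in for the real parser (hypothetical)
        return {"skills": [], "source": os.path.basename(path)}

    def parse_uploaded_resume(file):
        if not file or file.filename == '':
            return None, "No file uploaded", None
        filename = secure_filename(file.filename)
        suffix = os.path.splitext(filename)[1]
        tmp = tempfile.NamedTemporaryFile(suffix=suffix, delete=False)
        tmp.close()
        try:
            file.save(tmp.name)  # werkzeug FileStorage.save
            return extract_resume_features(tmp.name), None, filename
        finally:
            os.remove(tmp.name)  # always clean up the temp file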
backend/routes/interview_api.py ADDED
@@ -0,0 +1,93 @@
+import os
+import uuid
+import json
+
+from flask import Blueprint, request, jsonify, url_for
+from flask_login import login_required, current_user
+
+from backend.models.database import db, Job, Application
+from backend.services.interview_engine import (
+    generate_first_question,
+    edge_tts_to_file_sync,
+    whisper_stt
+)
+
+
+interview_api = Blueprint("interview_api", __name__)
+
+@interview_api.route("/api/start_interview", methods=["POST"])
+@login_required
+def start_interview():
+    data = request.get_json()
+    job_id = data.get("job_id")
+
+    job = Job.query.get_or_404(job_id)
+    application = Application.query.filter_by(user_id=current_user.id, job_id=job_id).first()
+
+    if not application or not application.extracted_features:
+        return jsonify({"error": "No application/profile data found."}), 400
+
+    try:
+        profile = json.loads(application.extracted_features)
+    except:
+        return jsonify({"error": "Invalid profile JSON"}), 500
+
+    question = generate_first_question(profile, job)
+
+    audio_filename = f"q_{uuid.uuid4().hex}.wav"
+    audio_path = os.path.join("static", "audio", audio_filename)
+    os.makedirs(os.path.dirname(audio_path), exist_ok=True)
+
+    edge_tts_to_file_sync(question, audio_path)
+
+    return jsonify({
+        "question": question,
+        "audio_url": url_for("static", filename=f"audio/{audio_filename}")
+    })
+
+@interview_api.route("/api/transcribe_audio", methods=["POST"])
+@login_required
+def transcribe_audio():
+    audio_file = request.files.get("audio")
+    if not audio_file:
+        return jsonify({"error": "No audio file received."}), 400
+
+    filename = f"user_audio_{uuid.uuid4().hex}.wav"
+    path = os.path.join("temp", filename)
+    os.makedirs("temp", exist_ok=True)
+    audio_file.save(path)
+
+    transcript = whisper_stt(path)
+    os.remove(path)
+
+    return jsonify({"transcript": transcript})
+
+@interview_api.route("/api/process_answer", methods=["POST"])
+@login_required
+def process_answer():
+    data = request.get_json()
+    answer = data.get("answer", "")
+    question_idx = data.get("questionIndex", 0)
+
+    # For now: just return a fake next question
+    fake_next_question = f"Follow-up question {question_idx + 2}: Why should we hire you?"
+    audio_filename = f"q_{uuid.uuid4().hex}.wav"
+    audio_path = os.path.join("static", "audio", audio_filename)
+    os.makedirs(os.path.dirname(audio_path), exist_ok=True)
+
+    edge_tts_to_file_sync(fake_next_question, audio_path)
+
+    return jsonify({
+        "success": True,
+        "nextQuestion": fake_next_question,
+        "audioUrl": url_for("static", filename=f"audio/{audio_filename}"),
+        "evaluation": {
+            "score": "medium",
+            "feedback": "Good answer, but be more specific."
+        },
+        "isComplete": question_idx >= 2,
+        "summary": []  # optional: you can fill this later
+    })
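Note the composition of prefixes: every route here already starts with `/api/...`, and the app.py hunk registers this blueprint with `url_prefix="/api"`; in Flask the two compose, so these views would be mounted at `/api/api/start_interview` and so on. A quick way to confirm what actually got mounted (assumes the app is importable as `backend.app`):

    from backend.app import app  # assumed import path

    for rule in app.url_map.iter_rules():
        print(rule.rule, sorted(rule.methods - {"HEAD", "OPTIONS"}))
    # look for /api/api/... entries if both prefixes are kept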
backend/services/interview_engine.py ADDED
@@ -0,0 +1,1958 @@
+import os
+import re
+import json
+import time
+import logging
+import traceback
+import requests
+import cohere
+import numpy as np
+from collections import defaultdict
+from textwrap import dedent
+from enum import Enum
+from dotenv import load_dotenv
+from inputimeout import inputimeout, TimeoutOccurred
+
+from langchain_groq import ChatGroq
+from langchain_community.embeddings import HuggingFaceEmbeddings
+from langchain_community.vectorstores import Qdrant
+from langchain.prompts import PromptTemplate
+from langchain.chains import LLMChain
+from langchain.retrievers import ContextualCompressionRetriever
+from langchain.retrievers.document_compressors import CohereRerank
+#from langchain_huggingface import HuggingFaceEndpoint
+
+# Import Qdrant client and models (adjust based on your environment)
+from qdrant_client import QdrantClient
+from qdrant_client.http import models
+from qdrant_client.http.models import (
+    VectorParams, Distance, Filter, FieldCondition, MatchValue, PointStruct, SearchRequest
+)
+
+from sklearn.feature_extraction.text import TfidfVectorizer
+from sklearn.neighbors import NearestNeighbors
+from transformers import AutoTokenizer, pipeline, BitsAndBytesConfig
+
+cohere_api_key = os.getenv("COHERE_API_KEY")
+chat_groq_api = os.getenv("GROQ_API_KEY")
+hf_api_key = os.getenv("HF_API_KEY")
+qdrant_api = os.getenv("QDRANT_API_KEY")
+qdrant_url = os.getenv("QDRANT_API_URL")
+
+print("GROQ API Key:", chat_groq_api)
+print("QDRANT API Key:", qdrant_api)
+print("QDRANT API URL:", qdrant_url)
+print("Cohere API Key:", cohere_api_key)
+
+qdrant_client = QdrantClient(
+    url="https://313b1ceb-057f-4b7b-89f5-7b19a213fe65.us-east-1-0.aws.cloud.qdrant.io:6333",
+    api_key="eyJhbGciOiJIUzI1NiIsInR5cCI6IkpXVCJ9.eyJhY2Nlc3MiOiJtIn0.w13SPZbljbSvt9Ch_0r034QhMFlmEr4ctXqLo2zhxm4",
+)
+
+print(qdrant_client.get_collections())
+
+class CustomChatGroq:
+    def __init__(self, temperature, model_name, api_key):
+        self.temperature = temperature
+        self.model_name = model_name
+        self.api_key = api_key
+        self.api_url = "https://api.groq.com/openai/v1/chat/completions"
+
+    def predict(self, prompt):
+        """Send a request to the Groq API and return the generated response."""
+        try:
+            headers = {
+                "Authorization": f"Bearer {self.api_key}",
+                "Content-Type": "application/json"
+            }
+
+            payload = {
+                "model": self.model_name,
+                "messages": [{"role": "system", "content": "You are an AI interviewer."},
+                             {"role": "user", "content": prompt}],
+                "temperature": self.temperature,
+                "max_tokens": 150
+            }
+
+            response = requests.post(self.api_url, headers=headers, json=payload, timeout=10)
+            response.raise_for_status()  # Raise an error for HTTP codes 4xx/5xx
+
+            data = response.json()
+
+            # Extract response text based on the Groq API response format
+            if "choices" in data and len(data["choices"]) > 0:
+                return data["choices"][0]["message"]["content"].strip()
+
+            logging.warning("Unexpected response structure from Groq API")
+            return "Interviewer: Could you tell me more about your relevant experience?"
+
+        except requests.exceptions.RequestException as e:
+            logging.error(f"ChatGroq API error: {e}")
+            return "Interviewer: Due to a system issue, let's move on to another question."
+
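`CustomChatGroq` is a thin `requests` wrapper over Groq's OpenAI-compatible chat endpoint; the langchain `ChatGroq` instance created just below is what the rest of the module actually uses. A usage sketch (needs GROQ_API_KEY in the environment):

    llm = CustomChatGroq(
        temperature=0.7,
        model_name="llama-3.3-70b-versatile",
        api_key=os.getenv("GROQ_API_KEY"),
    )
    print(llm.predict("Ask me one warm-up question about Python."))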
+groq_llm = ChatGroq(
+    temperature=0.7,
+    model_name="llama-3.3-70b-versatile",
+    api_key=chat_groq_api
+)
+
+from huggingface_hub import login
+
+HF_TOKEN = os.getenv("HF_TOKEN")
+
+if HF_TOKEN:
+    login(HF_TOKEN)
+else:
+    raise EnvironmentError("Missing HF_TOKEN environment variable.")
+
+# Load Mistral model
+from transformers import AutoTokenizer, AutoModelForCausalLM, pipeline
+import torch
+print(torch.cuda.is_available())
+
+MODEL_PATH = "mistralai/Mistral-7B-Instruct-v0.3"
+#MODEL_PATH = "tiiuae/falcon-rw-1b"
+
+bnb_config = BitsAndBytesConfig(
+    load_in_8bit=True,
+)
+
+mistral_tokenizer = AutoTokenizer.from_pretrained(MODEL_PATH, token=hf_api_key)
+
+judge_llm = AutoModelForCausalLM.from_pretrained(
+    MODEL_PATH,
+    quantization_config=bnb_config, torch_dtype=torch.float16,
+    device_map="auto",
+    token=hf_api_key
+)
+judge_llm.config.pad_token_id = judge_llm.config.eos_token_id
+
+print(judge_llm.hf_device_map)
+
+judge_pipeline = pipeline(
+    "text-generation",
+    model=judge_llm,
+    tokenizer=mistral_tokenizer,
+    max_new_tokens=128,
+    temperature=0.3,
+    top_p=0.9,
+    do_sample=True,  # Optional but recommended with temperature/top_p
+    repetition_penalty=1.1,
+)
+
+output = judge_pipeline("Q: What is Python?\nA:", max_new_tokens=128)[0]['generated_text']
+print(output)
+
+# embedding model
+from sentence_transformers import SentenceTransformer
+
+class LocalEmbeddings:
+    def __init__(self, model_name="all-MiniLM-L6-v2"):
+        self.model = SentenceTransformer(model_name)
+
+    def embed_query(self, text):
+        return self.model.encode(text).tolist()
+
+    def embed_documents(self, documents):
+        return self.model.encode(documents).tolist()
+
+
+embeddings = LocalEmbeddings()
+
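`LocalEmbeddings` mirrors the `embed_query`/`embed_documents` interface langchain expects from an embeddings object, backed by sentence-transformers. Usage sketch:

    vec = embeddings.embed_query("What is dependency injection?")
    print(len(vec))  # 384 for all-MiniLM-L6-v2, matching the Qdrant vector size used below

    doc_vecs = embeddings.embed_documents(["first answer", "second answer"])
    print(len(doc_vecs), len(doc_vecs[0]))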
+# import cohere
+qdrant_client = QdrantClient(url=qdrant_url, api_key=qdrant_api, check_compatibility=False)
+co = cohere.Client(api_key=cohere_api_key)
+
+class EvaluationScore(str, Enum):
+    POOR = "Poor"
+    MEDIUM = "Medium"
+    GOOD = "Good"
+    EXCELLENT = "Excellent"
+
+# Cohere Reranker
+class CohereReranker:
+    def __init__(self, client):
+        self.client = client
+
+    def compress_documents(self, documents, query):
+        if not documents:
+            return []
+        doc_texts = [doc.page_content for doc in documents]
+        try:
+            reranked = self.client.rerank(
+                query=query,
+                documents=doc_texts,
+                model="rerank-english-v2.0",
+                top_n=5
+            )
+            return [documents[result.index] for result in reranked.results]
+        except Exception as e:
+            logging.error(f"Error in CohereReranker.compress_documents: {e}")
+            return documents[:5]
+
+reranker = CohereReranker(co)
+
+def load_data_from_json(file_path):
+    """Load interview Q&A data from a JSON file."""
+    try:
+        with open(file_path, "r", encoding="utf-8") as f:
+            data = json.load(f)
+        job_role_buckets = defaultdict(list)
+        for idx, item in enumerate(data):
+            try:
+                job_role = item["Job Role"].lower().strip()
+                question = item["Questions"].strip()
+                answer = item["Answers"].strip()
+                job_role_buckets[job_role].append({"question": question, "answer": answer})
+            except KeyError as e:
+                logging.warning(f"Skipping item {idx}: missing key {e}")
+        return job_role_buckets  # note: this return was missing in an earlier revision
+    except Exception as e:
+        logging.error(f"Error loading data: {e}")
+        raise
+
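`load_data_from_json` expects a list of records with exactly the keys read above; records missing a key are skipped with a warning. An illustrative input layout (field names from the code, contents invented):

    sample = [
        {
            "Job Role": "Data Scientist",
            "Questions": "What is regularization?",
            "Answers": "A penalty on model complexity that reduces overfitting.",
        },
    ]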
+def verify_qdrant_collection(collection_name='interview_questions'):
+    """Verify if a Qdrant collection exists with the correct configuration."""
+    try:
+        collection_info = qdrant_client.get_collection(collection_name)
+        vector_size = collection_info.config.params.vectors.size
+        logging.info(f"Collection '{collection_name}' exists with vector size: {vector_size}")
+        return True
+    except Exception as e:
+        logging.warning(f"Collection '{collection_name}' not found: {e}")
+        return False
+
+
+def store_data_to_qdrant(data, collection_name='interview_questions', batch_size=100):
+    """Store interview data in the Qdrant vector database."""
+    try:
+        # Check if collection exists, otherwise create it
+        if not verify_qdrant_collection(collection_name):
+            try:
+                qdrant_client.create_collection(
+                    collection_name=collection_name,
+                    vectors_config=VectorParams(size=384, distance=Distance.COSINE)
+                )
+                logging.info(f"Created collection '{collection_name}'")
+            except Exception as e:
+                logging.error(f"Error creating collection: {e}\n{traceback.format_exc()}")
+                return False
+
+        points = []
+        point_id = 0
+        total_points = sum(len(qa_list) for qa_list in data.values())
+        processed = 0
+
+        for job_role, qa_list in data.items():
+            for entry in qa_list:
+                try:
+                    emb = embeddings.embed_query(entry["question"])
+                    print(f"Embedding shape: {len(emb)}")
+
+                    if not emb or len(emb) != 384:
+                        logging.warning(f"Skipping point {point_id} due to invalid embedding length: {len(emb)}")
+                        continue
+
+                    points.append(PointStruct(
+                        id=point_id,
+                        vector=emb,
+                        payload={
+                            "job_role": job_role,
+                            "question": entry["question"],
+                            "answer": entry["answer"]
+                        }
+                    ))
+                    point_id += 1
+                    processed += 1
+
+                    # Batch upload
+                    if len(points) >= batch_size:
+                        try:
+                            qdrant_client.upsert(collection_name=collection_name, points=points)
+                            logging.info(f"Stored {processed}/{total_points} points ({processed/total_points*100:.1f}%)")
+                        except Exception as upsert_err:
+                            logging.error(f"Error during upsert: {upsert_err}\n{traceback.format_exc()}")
+                        points = []
+
+                except Exception as embed_err:
+                    logging.error(f"Embedding error for point {point_id}: {embed_err}\n{traceback.format_exc()}")
+
+        # Final batch upload
+        if points:
+            try:
+                qdrant_client.upsert(collection_name=collection_name, points=points)
+                logging.info(f"Stored final batch of {len(points)} points")
+            except Exception as final_upsert_err:
+                logging.error(f"Error during final upsert: {final_upsert_err}\n{traceback.format_exc()}")
+
+        # Final verification
+        try:
+            count = qdrant_client.count(collection_name=collection_name, exact=True).count
+            print("Current count:", count)
+            logging.info(f"✅ Successfully stored {count} points in Qdrant")
+            if count != total_points:
+                logging.warning(f"Expected {total_points} points but stored {count}")
+        except Exception as count_err:
+            logging.error(f"Error verifying stored points: {count_err}\n{traceback.format_exc()}")
+
+        return True
+
+    except Exception as e:
+        logging.error(f"Error storing data to Qdrant: {e}\n{traceback.format_exc()}")
+        return False
+
+# to confirm that cosine similarity is used
+info = qdrant_client.get_collection("interview_questions")
+print(info.config.params.vectors.distance)
+
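Together, the two helpers above form the ingest pipeline; wiring them up looks roughly like this (the JSON path is hypothetical):

    data = load_data_from_json("data/interview_qa.json")  # hypothetical path
    if store_data_to_qdrant(data):
        print("ingest complete")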
+def extract_all_roles_from_qdrant(collection_name='interview_questions'):
+    """Extract all unique job roles from the Qdrant vector store."""
+    try:
+        all_roles = set()
+        scroll_offset = None
+
+        while True:
+            response = qdrant_client.scroll(
+                collection_name=collection_name,
+                limit=200,
+                offset=scroll_offset,
+                with_payload=True
+            )
+            points, next_page_offset = response
+
+            if not points:
+                break
+
+            for point in points:
+                role = point.payload.get("job_role", "").strip().lower()
+                if role:
+                    all_roles.add(role)
+
+            if not next_page_offset:
+                break
+
+            scroll_offset = next_page_offset
+
+        if not all_roles:
+            logging.warning("[Qdrant] No roles found in payloads.")
+        else:
+            logging.info(f"[Qdrant] Extracted {len(all_roles)} unique job roles.")
+
+        return list(all_roles)
+    except Exception as e:
+        logging.error(f"Error extracting roles from Qdrant: {e}")
+        return []
+
+from sklearn.metrics.pairwise import cosine_similarity
+
+def find_similar_roles(user_role, all_roles, top_k=3):
+    """
+    Find the most similar job roles to the given user_role using embeddings.
+    """
+    try:
+        # Clean inputs
+        user_role = user_role.strip().lower()
+        if not user_role or not all_roles or not isinstance(all_roles, list):
+            logging.warning("Invalid input for role similarity")
+            return []
+
+        # Embed user role
+        try:
+            user_embedding = embeddings.embed_query(user_role)
+            if user_embedding is None:
+                logging.error("User embedding is None")
+                return []
+        except Exception as e:
+            logging.error(f"Error embedding user role: {type(e).__name__}: {e}")
+            return []
+
+        # Embed all roles
+        try:
+            role_embeddings = []
+            valid_roles = []
+            for role in all_roles:
+                emb = embeddings.embed_query(role.lower())
+                if emb is not None:
+                    role_embeddings.append(emb)
+                    valid_roles.append(role)
+                else:
+                    logging.warning(f"Skipping role with no embedding: {role}")
+        except Exception as e:
+            logging.error(f"Error embedding all roles: {type(e).__name__}: {e}")
+            return []
+
+        if not role_embeddings:
+            logging.error("All role embeddings failed")
+            return []
+
+        # Compute similarities
+        similarities = cosine_similarity([user_embedding], role_embeddings)[0]
+        top_indices = np.argsort(similarities)[::-1][:top_k]
+
+        similar_roles = [valid_roles[i] for i in top_indices]
+        logging.debug(f"Similar roles to '{user_role}': {similar_roles}")
+        return similar_roles
+
+    except Exception as e:
+        logging.error(f"Error finding similar roles: {type(e).__name__}: {e}", exc_info=True)
+        return []
+
+# Retrieve ALL data related to the job role, not just top_k
+def get_role_questions(job_role):
+    try:
+        if not job_role:
+            logging.warning("Job role is empty.")
+            return []
+
+        filter_by_role = Filter(
+            must=[FieldCondition(
+                key="job_role",
+                match=MatchValue(value=job_role.lower())
+            )]
+        )
+
+        all_results = []
+        offset = None
+        while True:
+            results, next_page_offset = qdrant_client.scroll(
+                collection_name="interview_questions",
+                scroll_filter=filter_by_role,
+                with_payload=True,
+                with_vectors=False,
+                limit=100,  # batch size
+                offset=offset
+            )
+            all_results.extend(results)
+
+            if not next_page_offset:
+                break
+            offset = next_page_offset
+
+        parsed_results = [{
+            "question": r.payload.get("question"),
+            "answer": r.payload.get("answer"),
+            "job_role": r.payload.get("job_role")
+        } for r in all_results]
+
+        return parsed_results
+
+    except Exception as e:
+        logging.error(f"Error fetching role questions: {type(e).__name__}: {e}", exc_info=True)
+        return []
+
+def retrieve_interview_data(job_role, all_roles):
+    """
+    Retrieve all interview Q&A for a given job role.
+    Falls back to similar roles if no data is found.
+    Args:
+        job_role (str): Input job role (can be misspelled)
+        all_roles (list): Full list of available job roles
+    Returns:
+        list: List of QA dicts with keys: 'question', 'answer', 'job_role'
+    """
+    logging.basicConfig(level=logging.INFO)
+
+    job_role = job_role.strip().lower()
+    seen_questions = set()
+    final_results = []
+
+    # Step 1: Try exact match (fetch all questions for role)
+    logging.info(f"Trying to fetch all data for exact role: '{job_role}'")
+    exact_matches = get_role_questions(job_role)
+
+    for qa in exact_matches:
+        question = qa["question"]
+        if question and question not in seen_questions:
+            seen_questions.add(question)
+            final_results.append(qa)
+
+    if final_results:
+        logging.info(f"Found {len(final_results)} QA pairs for exact role '{job_role}'")
+        return final_results
+
+    logging.warning(f"No data found for role '{job_role}'. Trying similar roles...")
+
+    # Step 2: No matches; find similar roles
+    similar_roles = find_similar_roles(job_role, all_roles, top_k=3)
+
+    if not similar_roles:
+        logging.warning("No similar roles found.")
+        return []
+
+    logging.info(f"Found similar roles: {similar_roles}")
+
+    # Step 3: Retrieve data for each similar role (all questions)
+    for role in similar_roles:
+        logging.info(f"Fetching data for similar role: '{role}'")
+        role_qa = get_role_questions(role)
+
+        for qa in role_qa:
+            question = qa["question"]
+            if question and question not in seen_questions:
+                seen_questions.add(question)
+                final_results.append(qa)
+
+    logging.info(f"Retrieved total {len(final_results)} QA pairs from similar roles")
+    return final_results
+
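A typical retrieval flow combining the helpers above:

    all_roles = extract_all_roles_from_qdrant()
    qa_pairs = retrieve_interview_data("frontend developer", all_roles)
    print(f"retrieved {len(qa_pairs)} Q&A pairs")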
+import random
+
+def random_context_chunks(retrieved_data, k=3):
+    chunks = random.sample(retrieved_data, k)
+    return "\n\n".join([f"Q: {item['question']}\nA: {item['answer']}" for item in chunks])
+
+from typing import Dict
+
+def eval_question_quality(
+    question: str,
+    job_role: str,
+    seniority: str
+) -> Dict[str, str]:
+    """
+    Evaluate the quality of a generated interview question using the Groq LLM.
+    Returns a structured JSON with score, reasoning, and suggestions.
+    """
+    prompt = f"""
+You are a senior AI hiring expert evaluating the quality of an interview question for a {seniority} {job_role} role.
+
+Evaluate the question based on:
+- Relevance to the role and level
+- Clarity and conciseness
+- Depth of technical insight
+
+---
+Question: {question}
+---
+
+Respond only with a valid JSON like:
+{{
+  "Score": "Poor" | "Medium" | "Good" | "Excellent",
+  "Reasoning": "short justification",
+  "Improvements": ["tip1", "tip2"]
+}}
+"""
+
+    try:
+        start = time.time()
+        response = groq_llm.invoke(prompt)
+        print("⏱️ eval_question_quality duration:", round(time.time() - start, 2), "s")
+
+        # invoke() returns an AIMessage; use its text content before slicing out the JSON
+        output = response.content if hasattr(response, "content") else str(response)
+        start_idx = output.rfind("{")
+        end_idx = output.rfind("}") + 1
+        json_str = output[start_idx:end_idx]
+        result = json.loads(json_str)
+
+        if result.get("Score") in {"Poor", "Medium", "Good", "Excellent"}:
+            return result
+        else:
+            raise ValueError("Invalid Score value in model output")
+
+    except Exception as e:
+        print(f"⚠️ eval_question_quality fallback: {e}")
+        return {
+            "Score": "Poor",
+            "Reasoning": "Evaluation failed, using fallback.",
+            "Improvements": [
+                "Ensure the question is relevant and clear.",
+                "Avoid vague or overly generic phrasing.",
+                "Include role-specific context if needed."
+            ]
+        }
+
+def evaluate_answer(
+    question: str,
+    answer: str,
+    ref_answer: str,
+    job_role: str,
+    seniority: str,
+) -> Dict[str, str]:
+    """
+    Fast and structured answer evaluation using the Groq LLM (e.g. Mixtral or LLaMA 3).
+    """
+    from langchain_core.messages import AIMessage
+
+    prompt = f"""
+You are a technical interviewer evaluating a candidate for a {seniority} {job_role} role.
+
+Evaluate the response based on:
+- Technical correctness
+- Clarity
+- Relevance
+- Structure
+
+---
+Question: {question}
+Candidate Answer: {answer}
+Reference Answer: {ref_answer}
+---
+
+Respond ONLY with valid JSON in the following format:
+{{
+  "Score": "Poor" | "Medium" | "Good" | "Excellent",
+  "Reasoning": "short justification",
+  "Improvements": ["tip1", "tip2"]
+}}
+"""
+
+    try:
+        start = time.time()
+        raw = groq_llm.invoke(prompt)
+        print("⏱️ evaluate_answer duration:", round(time.time() - start, 2), "s")
+
+        if isinstance(raw, AIMessage):
+            output = raw.content
+        else:
+            output = str(raw)
+
+        print("🔍 Raw Groq Response:\n", output)
+
+        start_idx = output.rfind("{")
+        end_idx = output.rfind("}") + 1
+        json_str = output[start_idx:end_idx]
+
+        result = json.loads(json_str)
+        if result.get("Score") in {"Poor", "Medium", "Good", "Excellent"}:
+            return result
+        else:
+            raise ValueError("Invalid score value")
+
+    except Exception as e:
+        print(f"⚠️ evaluate_answer fallback: {e}")
+        return {
+            "Score": "Poor",
+            "Reasoning": "Failed to evaluate properly. Defaulted to Poor.",
+            "Improvements": [
+                "Be more specific",
+                "Add technical details",
+                "Structure the answer clearly"
+            ]
+        }
+
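Usage sketch for the evaluator (strings invented for illustration):

    verdict = evaluate_answer(
        question="What does a Python decorator do?",
        answer="It wraps a function to add behavior without changing its code.",
        ref_answer="A decorator is a callable that takes a function and returns a modified function.",
        job_role="Backend Developer",
        seniority="Junior",
    )
    print(verdict["Score"], "-", verdict["Reasoning"])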
+# Same, but using LLaMA 3.3 from Groq
+def generate_reference_answer(question, job_role, seniority):
+    """
+    Generates a high-quality reference answer using the Groq-hosted LLaMA model.
+    Args:
+        question (str): Interview question to answer.
+        job_role (str): Target job role (e.g., "Frontend Developer").
+        seniority (str): Experience level (e.g., "Mid-Level").
+    Returns:
+        str: Clean, generated reference answer or error message.
+    """
+    try:
+        # Clean, role-specific prompt
+        prompt = f"""You are a {seniority} {job_role}.
+Q: {question}
+A:"""
+
+        # Use the Groq-hosted model to generate the answer
+        ref_answer = groq_llm.predict(prompt)
+
+        if not ref_answer.strip():
+            return "Reference answer not generated."
+
+        return ref_answer.strip()
+
+    except Exception as e:
+        logging.error(f"Error generating reference answer: {e}", exc_info=True)
+        return "Unable to generate reference answer due to an error."
+
+
+def build_interview_prompt(conversation_history, user_response, context, job_role, skills, seniority,
+                           difficulty_adjustment=None, voice_label=None, face_label=None, effective_confidence=None):
+    """Build a prompt for generating the next interview question with adaptive difficulty and fairness logic."""
+
+    interview_template = """
+You are an AI interviewer conducting a real-time interview for a {job_role} position.
+Your objective is to thoroughly evaluate the candidate's suitability for the role using smart, structured, and adaptive questioning.
+---
+Interview Rules and Principles:
+- The **baseline difficulty** of questions must match the candidate's seniority level (e.g., junior, mid-level, senior).
+- Use your judgment to increase difficulty **slightly** if the candidate performs well, or simplify if they struggle, but never drop below the expected baseline for their level.
+- Avoid asking extremely difficult questions to junior candidates unless they have clearly demonstrated advanced knowledge.
+- Be fair: candidates for the same role should be evaluated within a consistent difficulty range.
+- Adapt your line of questioning gradually and logically based on the **overall flow**, not just the last answer.
+- Include real-world problem-solving scenarios to test how the candidate thinks and behaves practically.
+- You must **lead** the interview and make intelligent decisions about what to ask next.
+---
+Context Use:
+{context_instruction}
+Note:
+If no relevant context was retrieved or the previous answer is unclear, you must still generate a thoughtful interview question using your own knowledge. Do not skip generation. Avoid default or fallback responses; always try to generate a meaningful and fair next question.
+---
+Job Role: {job_role}
+Seniority Level: {seniority}
+Skills Focus: {skills}
+Difficulty Setting: {difficulty} (based on {difficulty_adjustment})
+---
+Recent Conversation History:
+{history}
+Candidate's Last Response:
+"{user_response}"
+Evaluation of Last Response:
+{response_evaluation}
+Voice Tone: {voice_label}
+---
+Important:
+If no relevant context was retrieved or the previous answer is unclear or off-topic,
+you must still generate a meaningful and fair interview question using your own knowledge and best practices.
+Do not skip question generation or fall back to default/filler responses.
+---
+Guidelines for Next Question:
+- If this is the beginning of the interview, start with a question about the candidate's background or experience.
+- Base the difficulty primarily on the seniority level, with light adjustment from recent performance.
+- Focus on core skills, real-world applications, and depth of reasoning.
+- Ask only one question. Be clear and concise.
+Generate the next interview question now:
+"""
+
+    # Calculate difficulty phrase
+    if difficulty_adjustment == "harder":
+        difficulty = f"slightly more challenging than typical for {seniority}"
+    elif difficulty_adjustment == "easier":
+        difficulty = f"slightly easier than typical for {seniority}"
+    else:
+        difficulty = f"appropriate for {seniority}"
+
+    # Choose context logic
+    if context.strip():
+        context_instruction = (
+            "Use both your own expertise and the provided context from relevant interview datasets. "
+            "You can either build on questions from the dataset or generate your own."
+        )
+        context = context.strip()
+    else:
+        context_instruction = (
+            "No specific context retrieved. Use your own knowledge and best practices to craft a question."
+        )
+        context = ""  # Let it be actually empty!
+
+    # Format conversation history (last 6 exchanges max)
+    recent_history = conversation_history[-6:] if len(conversation_history) > 6 else conversation_history
+    formatted_history = "\n".join([f"{msg['role'].capitalize()}: {msg['content']}" for msg in recent_history])
+
+    # Add evaluation summary if available
+    if conversation_history and conversation_history[-1].get("evaluation"):
+        eval_data = conversation_history[-1]["evaluation"][-1]
+        response_evaluation = f"""
+        - Score: {eval_data.get('Score', 'N/A')}
+        - Reasoning: {eval_data.get('Reasoning', 'N/A')}
+        - Improvements: {eval_data.get('Improvements', 'N/A')}
+        """
+    else:
+        response_evaluation = "No evaluation available yet."
+
+    # Fill the template
+    prompt = interview_template.format(
+        job_role=job_role,
+        seniority=seniority,
+        skills=skills,
+        difficulty=difficulty,
+        difficulty_adjustment=difficulty_adjustment if difficulty_adjustment else "default seniority",
+        context_instruction=context_instruction,
+        context=context,
+        history=formatted_history,
+        user_response=user_response,
+        response_evaluation=response_evaluation.strip(),
+        voice_label=voice_label or "unknown",
+    )
+
+    return prompt
+
803
+ def generate_llm_interview_report(
804
+ interview_state, logged_samples, job_role, seniority
805
+ ):
806
+ from collections import Counter
807
+
808
+ # Helper for converting score to 1–5
809
+ def score_label(label):
810
+ mapping = {
811
+ "confident": 5, "calm": 4, "neutral": 3, "nervous": 2, "anxious": 1, "unknown": 3
812
+ }
813
+ return mapping.get(label.lower(), 3)
814
+
815
+ def section_score(vals):
816
+ return round(sum(vals)/len(vals), 2) if vals else "N/A"
817
+
818
+ # Aggregate info
819
+ scores, voice_conf, face_conf, comm_scores = [], [], [], []
820
+ tech_details, comm_details, emotion_details, relevance_details, problem_details = [], [], [], [], []
821
+
822
+ for entry in logged_samples:
823
+ answer_eval = entry.get("answer_evaluation", {})
824
+ score = answer_eval.get("Score", "Not Evaluated")
825
+ reasoning = answer_eval.get("Reasoning", "")
826
+ if score.lower() in ["excellent", "good", "medium", "poor"]:
827
+ score_map = {"excellent": 5, "good": 4, "medium": 3, "poor": 2}
828
+ scores.append(score_map[score.lower()])
829
+ # Section details
830
+ tech_details.append(reasoning)
831
+ comm_details.append(reasoning)
832
+ # Emotions/confidence
833
+ voice_conf.append(score_label(entry.get("voice_label", "unknown")))
834
+ face_conf.append(score_label(entry.get("face_label", "unknown")))
835
+ # Communication estimate
836
+ if entry["user_answer"]:
837
+ length = len(entry["user_answer"].split())
838
+ comm_score = min(5, max(2, length // 30))
839
+ comm_scores.append(comm_score)
840
+
841
+ # Compute averages for sections
842
+ avg_problem = section_score(scores)
843
+ avg_tech = section_score(scores)
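+ # NOTE: both averages above reuse the same per-answer scores; separate
+ # problem-solving vs. technical-depth rubrics are not tracked yet.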
844
+ avg_comm = section_score(comm_scores)
845
+ avg_emotion = section_score([(v+f)/2 for v, f in zip(voice_conf, face_conf)])
846
+
847
+ # Compute decision heuristics
848
+ section_averages = [avg_problem, avg_tech, avg_comm, avg_emotion]
849
+ numeric_avgs = [v for v in section_averages if isinstance(v, (float, int))]
850
+ avg_overall = round(sum(numeric_avgs) / len(numeric_avgs), 2) if numeric_avgs else 0
851
+
852
+ # Hiring logic (you can customize thresholds)
853
+ if avg_overall >= 4.5:
854
+ verdict = "Strong Hire"
855
+ elif avg_overall >= 4.0:
856
+ verdict = "Hire"
857
+ elif avg_overall >= 3.0:
858
+ verdict = "Conditional Hire"
859
+ else:
860
+ verdict = "No Hire"
861
+
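+ # e.g. section averages [4, 4, 3, 4] -> overall 3.75 -> "Conditional Hire"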
862
+ # Build LLM report prompt
863
+ transcript = "\n\n".join([
864
+ f"Q: {e['generated_question']}\nA: {e['user_answer']}\nScore: {e.get('answer_evaluation',{}).get('Score','')}\nReasoning: {e.get('answer_evaluation',{}).get('Reasoning','')}"
865
+ for e in logged_samples
866
+ ])
867
+
868
+ prompt = f"""
869
+ You are a senior technical interviewer at a major tech company.
870
+ Write a structured, realistic hiring report for this {seniority} {job_role} interview, using these section scores (scale 1–5, with 5 best):
871
+ Section-wise Evaluation
872
+ 1. *Problem Solving & Critical Thinking*: {avg_problem}
873
+ 2. *Technical Depth & Knowledge*: {avg_tech}
874
+ 3. *Communication & Clarity*: {avg_comm}
875
+ 4. *Emotional Composure & Confidence*: {avg_emotion}
876
+ 5. *Role Relevance*: 5
877
+ *Transcript*
878
+ {transcript}
879
+ Your report should have the following sections:
880
+ 1. *Executive Summary* (realistic, hiring-committee style)
881
+ 2. *Section-wise Comments* (for each numbered category above, with short paragraph citing specifics)
882
+ 3. *Strengths & Weaknesses* (list at least 2 for each)
883
+ 4. *Final Verdict*: {verdict}
884
+ 5. *Recommendations* (2–3 for future improvement)
885
+ Use realistic language. If some sections are N/A or lower than others, comment honestly.
886
+ Interview Report:
887
+ """
888
+ # LLM call, or just return prompt for review
889
+ return groq_llm.predict(prompt)
890
+
891
+ def get_user_info():
892
+ """
893
+ Collects essential information from the candidate before starting the interview.
894
+ Returns a dictionary with keys: name, job_role, seniority, skills
895
+ """
896
+ import logging
897
+ logging.info("Collecting user information...")
898
+
899
+ print("Welcome to the AI Interview Simulator!")
900
+ print("Let’s set up your mock interview.\n")
901
+
902
+ # Get user name
903
+ name = input("What is your name? ").strip()
904
+ while not name:
905
+ print("Please enter your name.")
906
+ name = input("What is your name? ").strip()
907
+
908
+ # Get job role
909
+ job_role = input(f"Hi {name}, what job role are you preparing for? (e.g. Frontend Developer) ").strip()
910
+ while not job_role:
911
+ print("Please specify the job role.")
912
+ job_role = input("What job role are you preparing for? ").strip()
913
+
914
+ # Get seniority level
915
+ seniority_options = ["Entry-level", "Junior", "Mid-Level", "Senior", "Lead"]
916
+ print("\nSelect your experience level:")
917
+ for i, option in enumerate(seniority_options, 1):
918
+ print(f"{i}. {option}")
919
+
920
+ seniority_choice = None
921
+ while seniority_choice not in range(1, len(seniority_options)+1):
922
+ try:
923
+ seniority_choice = int(input("Enter the number corresponding to your level: "))
924
+ except ValueError:
925
+ print(f"Please enter a number between 1 and {len(seniority_options)}")
926
+
927
+ seniority = seniority_options[seniority_choice - 1]
928
+
929
+ # Get skills
930
+ skills_input = input(f"\nWhat are your top skills relevant to {job_role}? (Separate with commas): ")
931
+ skills = [skill.strip() for skill in skills_input.split(",") if skill.strip()]
932
+
933
+ while not skills:
934
+ print("Please enter at least one skill.")
935
+ skills_input = input("Your top skills (comma-separated): ")
936
+ skills = [skill.strip() for skill in skills_input.split(",") if skill.strip()]
937
+
938
+ # Confirm collected info
939
+ print("\n Interview Setup Complete!")
940
+ print(f"Name: {name}")
941
+ print(f"Job Role: {job_role}")
942
+ print(f"Experience Level: {seniority}")
943
+ print(f"Skills: {', '.join(skills)}")
944
+ print("\nStarting your mock interview...\n")
945
+
946
+ return {
947
+ "name": name,
948
+ "job_role": job_role,
949
+ "seniority": seniority,
950
+ "skills": skills
951
+ }
952
+
953
+ import threading
954
+
955
+ def wait_for_user_response(timeout=200):
956
+ """Wait for user input with timeout. Returns '' if no response."""
957
+ user_input = []
958
+
959
+ def get_input():
960
+ answer = input("Your Answer (within timeout): ").strip()
961
+ user_input.append(answer)
962
+
963
+ thread = threading.Thread(target=get_input, daemon=True)  # daemon so a never-answered input() cannot block interpreter exit
964
+ thread.start()
965
+ thread.join(timeout)
966
+
967
+ return user_input[0] if user_input else ""
968
+
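+ # Example: answer = wait_for_user_response(timeout=60)  # '' if the candidate stays silent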
969
+ import json
970
+ from datetime import datetime
971
+ from time import time
972
+ import random
973
+
974
+ def interview_loop(max_questions, timeout_seconds=300, collection_name="interview_questions", judge_pipeline=None, save_path="interview_log.json"):
975
+
976
+
977
+ user_info = get_user_info()
978
+ job_role = user_info['job_role']
979
+ seniority = user_info['seniority']
980
+ skills = user_info['skills']
981
+
982
+ all_roles = extract_all_roles_from_qdrant(collection_name=collection_name)
983
+ retrieved_data = retrieve_interview_data(job_role, all_roles)
984
+ context_data = random_context_chunks(retrieved_data, k=4)
985
+
986
+ conversation_history = []
987
+ interview_state = {
988
+ "questions": [],
989
+ "user_answer": [],
990
+ "job_role": job_role,
991
+ "seniority": seniority,
992
+ "start_time": time()
993
+ }
994
+
995
+ # Store log for evaluation
996
+ logged_samples = []
997
+
998
+ difficulty_adjustment = None
999
+
1000
+ for i in range(max_questions):
1001
+ last_user_response = conversation_history[-1]['content'] if conversation_history else ""
1002
+
1003
+ # Generate question prompt
1004
+ prompt = build_interview_prompt(
1005
+ conversation_history=conversation_history,
1006
+ user_response=last_user_response,
1007
+ context=context_data,
1008
+ job_role=job_role,
1009
+ skills=skills,
1010
+ seniority=seniority,
1011
+ difficulty_adjustment=difficulty_adjustment
1012
+ )
1013
+ question = groq_llm.predict(prompt)
1014
+ question_eval = eval_question_quality(question, job_role, seniority)
1015
+
1016
+ conversation_history.append({'role': "Interviewer", "content": question})
1017
+ print(f"Interviewer: Q{i + 1} : {question}")
1018
+
1019
+ # Wait for user answer
1020
+ start_time = time()
1021
+ user_answer = wait_for_user_response(timeout=timeout_seconds)
1022
+ response_time = time() - start_time
1023
+
1024
+ skipped = False
1025
+ answer_eval = None
1026
+ ref_answer = None
1027
+
1028
+ if not user_answer:
1029
+ print("No response received; moving to the next question.")
1030
+ user_answer = None
1031
+ skipped = True
1032
+ difficulty_adjustment = None  # "medium" is not a recognized adjustment; fall back to the seniority default
1033
+ else:
1034
+ conversation_history.append({"role": "Candidate", "content": user_answer})
1035
+
1036
+ ref_answer = generate_reference_answer(question, job_role, seniority)
1037
+ answer_eval = evaluate_answer(
1038
+ question=question,
1039
+ answer=user_answer,
1040
+ ref_answer=ref_answer,
1041
+ job_role=job_role,
1042
+ seniority=seniority,
1043
+ judge_pipeline=judge_pipeline
1044
+ )
1045
+
1046
+
1047
+ interview_state["user_answer"].append(user_answer)
1048
+ # Append inline evaluation for history, using top-level keys so that
1049
+ # build_interview_prompt can read Score/Reasoning from the last entry
1050
+ conversation_history[-1].setdefault('evaluation', []).append({
1051
+ "Score": answer_eval['Score'],
1052
+ "Reasoning": answer_eval['Reasoning'],
1053
+ "Improvements": answer_eval.get('Improvements', 'N/A')
1054
+ })
1055
+
1056
+ # Adjust difficulty
1057
+ score = answer_eval['Score'].lower()
1058
+ if score == "excellent":
1059
+ difficulty_adjustment = "harder"
1060
+ elif score in ['poor', 'medium']:
1061
+ difficulty_adjustment = "easier"
1062
+ else:
1063
+ difficulty_adjustment = None
1064
+
1065
+ # Store for local logging
1066
+ logged_samples.append({
1067
+ "job_role": job_role,
1068
+ "seniority": seniority,
1069
+ "skills": skills,
1070
+ "context": context_data,
1071
+ "prompt": prompt,
1072
+ "generated_question": question,
1073
+ "question_evaluation": question_eval,
1074
+ "user_answer": user_answer,
1075
+ "reference_answer": ref_answer,
1076
+ "answer_evaluation": answer_eval,
1077
+ "skipped": skipped
1078
+ })
1079
+
1080
+ # Store state
1081
+ interview_state['questions'].append({
1082
+ "question": question,
1083
+ "question_evaluation": question_eval,
1084
+ "user_answer": user_answer,
1085
+ "answer_evaluation": answer_eval,
1086
+ "skipped": skipped
1087
+ })
1088
+
1089
+ interview_state['end_time'] = time()
1090
+ report = generate_llm_interview_report(interview_state, logged_samples, job_role, seniority)
1091
+ print("Report : _____________________\n")
1092
+ print(report)
1093
+ print('______________________________________________')
1094
+
1095
+ # Save full interview logs to JSON
1096
+ timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
1097
+ filename = f"{save_path.replace('.json', '')}_{timestamp}.json"
1098
+ with open(filename, "w", encoding="utf-8") as f:
1099
+ json.dump(logged_samples, f, indent=2, ensure_ascii=False)
1100
+
1101
+ print(f" Interview log saved to {filename}")
1102
+ print("____________________________________\n")
1103
+
1104
+ print(f"interview state : {interview_state}")
1105
+ return interview_state, report
1106
+
1107
+ from sklearn.metrics import precision_score, recall_score, f1_score
1108
+ import numpy as np
1109
+ # Build the ground truth used to evaluate retrieval quality
1110
+
1111
+ def build_ground_truth(all_roles):
1112
+ gt = {}
1113
+ for role in all_roles:
1114
+ qa_list = get_role_questions(role)
1115
+ gt[role] = set(q["question"] for q in qa_list if q["question"])
1116
+ return gt
1117
+
1118
+
1119
+ def evaluate_retrieval(job_role, all_roles, k=10):
1120
+ """
1121
+ Evaluate retrieval quality using Precision@k, Recall@k, and F1@k.
1122
+ Args:
1123
+ job_role (str): The input job role to search for.
1124
+ all_roles (list): List of all available job roles in the system.
1125
+ k (int): Top-k retrieved questions to evaluate.
1126
+ Returns:
1127
+ dict: Evaluation metrics including precision, recall, and f1.
1128
+ """
1129
+
1130
+ # Step 1: Ground Truth (all exact questions stored for this role)
1131
+ ground_truth_qs = set(
1132
+ q["question"].strip()
1133
+ for q in get_role_questions(job_role)
1134
+ if q.get("question")
1135
+ )
1136
+
1137
+ if not ground_truth_qs:
1138
+ print(f"[!] No ground truth found for role: {job_role}")
1139
+ return {}
1140
+
1141
+ # Step 2: Retrieved Questions (may include fallback roles)
1142
+ retrieved_qas = retrieve_interview_data(job_role, all_roles)
1143
+ retrieved_qs = [q["question"].strip() for q in retrieved_qas if q.get("question")]
1144
+
1145
+ # Step 3: Take top-k retrieved (you can also do full if needed)
1146
+ retrieved_top_k = retrieved_qs[:k]
1147
+
1148
+ # Step 4: Binary relevance (1 if in ground truth, 0 if not)
1149
+ y_true = [1 if q in ground_truth_qs else 0 for q in retrieved_top_k]
1150
+ y_pred = [1] * len(y_true) # all retrieved are treated as predicted relevant
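+ # NOTE: with y_pred all ones there are no false negatives among the retrieved
+ # items, so recall@k here is 1 whenever any retrieved item is relevant; it does
+ # not measure coverage of the full ground truth.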
1151
+
1152
+ precision = precision_score(y_true, y_pred, zero_division=0)
1153
+ recall = recall_score(y_true, y_pred, zero_division=0)
1154
+ f1 = f1_score(y_true, y_pred, zero_division=0)
1155
+
1156
+ print(f" Retrieval Evaluation for role: '{job_role}' (Top-{k})")
1157
+ print(f"Precision@{k}: {precision:.2f}")
1158
+ print(f"Recall@{k}: {recall:.2f}")
1159
+ print(f"F1@{k}: {f1:.2f}")
1160
+ print(f"Relevant Retrieved: {sum(y_true)}/{len(y_true)}")
1161
+ print("–" * 40)
1162
+
1163
+ return {
1164
+ "job_role": job_role,
1165
+ "precision": precision,
1166
+ "recall": recall,
1167
+ "f1": f1,
1168
+ "relevant_retrieved": sum(y_true),
1169
+ "total_retrieved": len(y_true),
1170
+ "ground_truth_count": len(ground_truth_qs),
1171
+ }
1172
+
1173
+
1174
+ k_values = [5, 10, 20]
1175
+ all_roles = extract_all_roles_from_qdrant(collection_name="interview_questions")
1176
+
1177
+ results = []
1178
+
1179
+ for k in k_values:
1180
+ for role in all_roles:
1181
+ metrics = evaluate_retrieval(role, all_roles, k=k)
1182
+ if metrics: # only if we found ground truth
1183
+ metrics["k"] = k
1184
+ results.append(metrics)
1185
+
1186
+ import pandas as pd
1187
+
1188
+ df = pd.DataFrame(results)
1189
+ summary = df.groupby("k")[["precision", "recall", "f1"]].mean().round(3)
1190
+ print(summary)
1191
+
1192
+
1193
+ def extract_job_details(job_description):
1194
+ """Extract job details such as title, skills, experience level, and years of experience from the job description."""
1195
+ title_match = re.search(r"(?i)(?:seeking|hiring) a (.+?) to", job_description)
1196
+ job_title = title_match.group(1) if title_match else "Unknown"
1197
+
1198
+ skills_match = re.findall(r"(?i)(?:Proficiency in|Experience with|Knowledge of) (.+?)(?:,|\.| and| or)", job_description)
1199
+ skills = list(set([skill.strip() for skill in skills_match])) if skills_match else []
1200
+
1201
+ experience_match = re.search(r"(\d+)\+? years of experience", job_description)
1202
+ if experience_match:
1203
+ years_experience = int(experience_match.group(1))
1204
+ experience_level = "Senior" if years_experience >= 5 else "Mid" if years_experience >= 3 else "Junior"
1205
+ else:
1206
+ years_experience = None
1207
+ experience_level = "Unknown"
1208
+
1209
+ return {
1210
+ "job_title": job_title,
1211
+ "skills": skills,
1212
+ "experience_level": experience_level,
1213
+ "years_experience": years_experience
1214
+ }
1215
+
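+ # Quick sanity check (made-up job description, illustrative only):
+ # extract_job_details("We are seeking a Backend Engineer to join us. "
+ #                     "Proficiency in Python, and 5+ years of experience.")
+ # -> {'job_title': 'Backend Engineer', 'skills': ['Python'],
+ #     'experience_level': 'Senior', 'years_experience': 5}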
1216
+ import re
1217
+ from docx import Document
1218
+ import textract
1219
+ from PyPDF2 import PdfReader
1220
+
1221
+ JOB_TITLES = [
1222
+ "Accountant", "Data Scientist", "Machine Learning Engineer", "Software Engineer",
1223
+ "Developer", "Analyst", "Researcher", "Intern", "Consultant", "Manager",
1224
+ "Engineer", "Specialist", "Project Manager", "Product Manager", "Administrator",
1225
+ "Director", "Officer", "Assistant", "Coordinator", "Supervisor"
1226
+ ]
1227
+
1228
+ def clean_filename_name(filename):
1229
+ # Remove file extension
1230
+ base = re.sub(r"\.[^.]+$", "", filename)
1231
+ base = base.strip()
1232
+
1233
+ # Remove 'cv' or 'CV' words
1234
+ base_clean = re.sub(r"\bcv\b", "", base, flags=re.IGNORECASE).strip()
1235
+
1236
+ # If after removing CV it's empty, return None
1237
+ if not base_clean:
1238
+ return None
1239
+
1240
+ # If it contains any digit, return None (unreliable)
1241
+ if re.search(r"\d", base_clean):
1242
+ return None
1243
+
1244
+ # Replace underscores/dashes with spaces, capitalize
1245
+ base_clean = base_clean.replace("_", " ").replace("-", " ")
1246
+ return base_clean.title()
1247
+
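+ # e.g. "John Smith CV.pdf" -> "John Smith"; "cv_2024.pdf" -> None (contains digits)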
1248
+ def looks_like_job_title(line):
1249
+ for title in JOB_TITLES:
1250
+ pattern = r"\b" + re.escape(title.lower()) + r"\b"
1251
+ if re.search(pattern, line.lower()):
1252
+ return True
1253
+ return False
1254
+
1255
+ def extract_name_from_text(lines):
1256
+ # Try first 3 lines for a name, skipping job titles
1257
+ for i in range(min(3, len(lines))):
1258
+ line = lines[i].strip()
1259
+ if looks_like_job_title(line):
1260
+ return "unknown"
1261
+ if re.search(r"\d", line): # skip lines with digits
1262
+ continue
1263
+ if len(line.split()) > 4 or len(line) > 40: # too long or many words
1264
+ continue
1265
+ # If line has only uppercase words, it's probably not a name
1266
+ if line.isupper():
1267
+ continue
1268
+ # Passed checks, return title-cased line as name
1269
+ return line.title()
1270
+ return None
1271
+
1272
+ def extract_text_from_file(file_path):
1273
+ if file_path.endswith('.pdf'):
1274
+ reader = PdfReader(file_path)
1275
+ text = "\n".join(page.extract_text() or '' for page in reader.pages)
1276
+ elif file_path.endswith('.docx'):
1277
+ doc = Document(file_path)
1278
+ text = "\n".join([para.text for para in doc.paragraphs])
1279
+ else: # For .doc or fallback
1280
+ text = textract.process(file_path).decode('utf-8')
1281
+ return text.strip()
1282
+
1283
+ def extract_candidate_details(file_path):
1284
+ text = extract_text_from_file(file_path)
1285
+ lines = [line.strip() for line in text.splitlines() if line.strip()]
1286
+
1287
+ # Extract name
1288
+ filename = file_path.split("/")[-1] # just filename, no path
1289
+ name = clean_filename_name(filename)
1290
+ if not name:
1291
+ name = extract_name_from_text(lines)
1292
+ if not name:
1293
+ name = "Unknown"
1294
+
1295
+ # Extract skills (basic version)
1296
+ skills = []
1297
+ skills_section = re.search(r"Skills\s*[:\-]?\s*(.+)", text, re.IGNORECASE)
1298
+ if skills_section:
1299
+ raw_skills = skills_section.group(1)
1300
+ skills = [s.strip() for s in re.split(r",|\n|•|-", raw_skills) if s.strip()]
1301
+
1302
+ return {
1303
+ "name": name,
1304
+ "skills": skills
1305
+ }
1306
+
1307
+ # import gradio as gr
1308
+ # import time
1309
+ # import tempfile
1310
+ # import numpy as np
1311
+ # import scipy.io.wavfile as wavfile
1312
+ # import os
1313
+ # import json
1314
+ # from transformers import BarkModel, AutoProcessor
1315
+ # import torch, gc
1316
+ # import whisper
1317
+ # from transformers import Wav2Vec2Processor, Wav2Vec2ForSequenceClassification
1318
+ # import librosa
1319
+
1320
+ # import torch
1321
+ # print(torch.cuda.is_available()) # ✅ Tells you if GPU is available
1322
+ # torch.cuda.empty_cache()
1323
+ # gc.collect()
1324
+
1325
+
1326
+ # # Bark TTS
1327
+ # print("🔁 Loading Bark model...")
1328
+ # model_bark = BarkModel.from_pretrained("suno/bark").to("cuda" if torch.cuda.is_available() else "cpu")
1329
+ # print("✅ Bark model loaded")
1330
+ # print("🔁 Loading Bark processor...")
1331
+ # processor_bark = AutoProcessor.from_pretrained("suno/bark")
1332
+ # print("✅ Bark processor loaded")
1333
+ # bark_voice_preset = "v2/en_speaker_5"
1334
+
1335
+ # def bark_tts(text):
1336
+ # print(f"🔁 Synthesizing TTS for: {text}")
1337
+
1338
+ # # Process the text
1339
+ # inputs = processor_bark(text, return_tensors="pt", voice_preset=bark_voice_preset)
1340
+
1341
+ # # Move tensors to device
1342
+ # input_ids = inputs["input_ids"].to(model_bark.device)
1343
+
1344
+ # start = time.time()
1345
+
1346
+ # # Generate speech with only the required parameters
1347
+ # with torch.no_grad():
1348
+ # speech_values = model_bark.generate(
1349
+ # input_ids=input_ids,
1350
+ # do_sample=True,
1351
+ # fine_temperature=0.4,
1352
+ # coarse_temperature=0.8
1353
+ # )
1354
+
1355
+ # print(f"✅ Bark finished in {round(time.time() - start, 2)}s")
1356
+
1357
+ # # Convert to audio
1358
+ # speech = speech_values.cpu().numpy().squeeze()
1359
+ # speech = (speech * 32767).astype(np.int16)
1360
+
1361
+ # temp_wav = tempfile.NamedTemporaryFile(delete=False, suffix=".wav")
1362
+ # wavfile.write(temp_wav.name, 22050, speech)
1363
+
1364
+ # return temp_wav.name
1365
+
1366
+
1367
+
1368
+
1369
+
1370
+ # # Whisper STT
1371
+ # print("🔁 Loading Whisper model...")
1372
+ # whisper_model = whisper.load_model("base", device="cuda")
1373
+ # print("✅ Whisper model loaded")
1374
+ # def whisper_stt(audio_path):
1375
+ # if not audio_path or not os.path.exists(audio_path): return ""
1376
+ # result = whisper_model.transcribe(audio_path)
1377
+ # return result["text"]
1378
+
1379
+ # seniority_mapping = {
1380
+ # "Entry-level": 1, "Junior": 2, "Mid-Level": 3, "Senior": 4, "Lead": 5
1381
+ # }
1382
+
1383
+
1384
+ # # --- 2. Gradio App ---
1385
+
1386
+ # with gr.Blocks(theme=gr.themes.Soft()) as demo:
1387
+ # user_data = gr.State({})
1388
+ # interview_state = gr.State({})
1389
+ # missing_fields_state = gr.State([])
1390
+
1391
+ # # --- UI Layout ---
1392
+ # with gr.Column(visible=True) as user_info_section:
1393
+ # gr.Markdown("## Candidate Information")
1394
+ # cv_file = gr.File(label="Upload CV")
1395
+ # job_desc = gr.Textbox(label="Job Description")
1396
+ # start_btn = gr.Button("Continue", interactive=False)
1397
+
1398
+ # with gr.Column(visible=False) as missing_section:
1399
+ # gr.Markdown("## Missing Information")
1400
+ # name_in = gr.Textbox(label="Name", visible=False)
1401
+ # role_in = gr.Textbox(label="Job Role", visible=False)
1402
+ # seniority_in = gr.Dropdown(list(seniority_mapping.keys()), label="Seniority", visible=False)
1403
+ # skills_in = gr.Textbox(label="Skills", visible=False)
1404
+ # submit_btn = gr.Button("Submit", interactive=False)
1405
+
1406
+ # with gr.Column(visible=False) as interview_pre_section:
1407
+ # pre_interview_greeting_md = gr.Markdown()
1408
+ # start_interview_final_btn = gr.Button("Start Interview")
1409
+
1410
+ # with gr.Column(visible=False) as interview_section:
1411
+ # gr.Markdown("## Interview in Progress")
1412
+ # question_audio = gr.Audio(label="Listen", interactive=False, autoplay=True)
1413
+ # question_text = gr.Markdown()
1414
+ # user_audio_input = gr.Audio(sources=["microphone"], type="filepath", label="1. Record Audio Answer")
1415
+ # stt_transcript = gr.Textbox(label="Transcribed Answer (edit if needed)")
1416
+ # confirm_btn = gr.Button("Confirm Answer")
1417
+ # evaluation_display = gr.Markdown()
1418
+ # interview_summary = gr.Markdown(visible=False)
1419
+
1420
+ # # --- UI Logic ---
1421
+
1422
+ # def validate_start_btn(cv_file, job_desc):
1423
+ # return gr.update(interactive=(cv_file is not None and hasattr(cv_file, "name") and bool(job_desc and job_desc.strip())))
1424
+ # cv_file.change(validate_start_btn, [cv_file, job_desc], start_btn)
1425
+ # job_desc.change(validate_start_btn, [cv_file, job_desc], start_btn)
1426
+
1427
+ # def process_and_route_initial(cv_file, job_desc):
1428
+ # details = extract_candidate_details(cv_file.name)
1429
+ # job_info = extract_job_details(job_desc)
1430
+ # data = {
1431
+ # "name": details.get("name", "unknown"), "job_role": job_info.get("job_title", "unknown"),
1432
+ # "seniority": job_info.get("experience_level", "unknown"), "skills": job_info.get("skills", [])
1433
+ # }
1434
+ # missing = [k for k, v in data.items() if (isinstance(v, str) and v.lower() == "unknown") or not v]
1435
+ # if missing:
1436
+ # return data, missing, gr.update(visible=False), gr.update(visible=True), gr.update(visible=False)
1437
+ # else:
1438
+ # greeting = f"Hello {data['name']}, your profile is ready. Click 'Start Interview' when ready."
1439
+ # return data, missing, gr.update(visible=False), gr.update(visible=False), gr.update(visible=True, value=greeting)
1440
+ # start_btn.click(
1441
+ # process_and_route_initial,
1442
+ # [cv_file, job_desc],
1443
+ # [user_data, missing_fields_state, user_info_section, missing_section, pre_interview_greeting_md]
1444
+ # )
1445
+
1446
+ # def show_missing(missing):
1447
+ # if missing is None: missing = []
1448
+ # return gr.update(visible="name" in missing), gr.update(visible="job_role" in missing), gr.update(visible="seniority" in missing), gr.update(visible="skills" in missing)
1449
+ # missing_fields_state.change(show_missing, missing_fields_state, [name_in, role_in, seniority_in, skills_in])
1450
+
1451
+ # def validate_fields(name, role, seniority, skills, missing):
1452
+ # if not missing: return gr.update(interactive=False)
1453
+ # all_filled = all([(not ("name" in missing) or bool(name.strip())), (not ("job_role" in missing) or bool(role.strip())), (not ("seniority" in missing) or bool(seniority)), (not ("skills" in missing) or bool(skills.strip())),])
1454
+ # return gr.update(interactive=all_filled)
1455
+ # for inp in [name_in, role_in, seniority_in, skills_in]:
1456
+ # inp.change(validate_fields, [name_in, role_in, seniority_in, skills_in, missing_fields_state], submit_btn)
1457
+
1458
+ # def complete_manual(data, name, role, seniority, skills):
1459
+ # if data["name"].lower() == "unknown": data["name"] = name
1460
+ # if data["job_role"].lower() == "unknown": data["job_role"] = role
1461
+ # if data["seniority"].lower() == "unknown": data["seniority"] = seniority
1462
+ # if not data["skills"]: data["skills"] = [s.strip() for s in skills.split(",")]
1463
+ # greeting = f"Hello {data['name']}, your profile is ready. Click 'Start Interview' to begin."
1464
+ # return data, gr.update(visible=False), gr.update(visible=True), gr.update(value=greeting)
1465
+ # submit_btn.click(complete_manual, [user_data, name_in, role_in, seniority_in, skills_in], [user_data, missing_section, interview_pre_section, pre_interview_greeting_md])
1466
+
1467
+ # def start_interview(data):
1468
+ # # --- Advanced state with full logging ---
1469
+ # state = {
1470
+ # "questions": [], "answers": [], "face_labels": [], "voice_labels": [], "timings": [],
1471
+ # "question_evaluations": [], "answer_evaluations": [], "effective_confidences": [],
1472
+ # "conversation_history": [],
1473
+ # "difficulty_adjustment": None,
1474
+ # "question_idx": 0, "max_questions": 3, "q_start_time": time.time(),
1475
+ # "log": []
1476
+ # }
1477
+ # # --- Optionally: context retrieval here (currently just blank) ---
1478
+ # context = ""
1479
+ # prompt = build_interview_prompt(
1480
+ # conversation_history=[], user_response="", context=context, job_role=data["job_role"],
1481
+ # skills=data["skills"], seniority=data["seniority"], difficulty_adjustment=None,
1482
+ # voice_label="neutral", face_label="neutral"
1483
+ # )
1484
+ # #here the original one
1485
+ # # first_q = groq_llm.predict(prompt)
1486
+ # # # Evaluate Q for quality
1487
+ # # q_eval = eval_question_quality(first_q, data["job_role"], data["seniority"], None)
1488
+ # # state["questions"].append(first_q)
1489
+ # # state["question_evaluations"].append(q_eval)
1490
+
1491
+ # #here the testing one
1492
+ # first_q = groq_llm.predict(prompt)
1493
+ # q_eval = {
1494
+ # "Score": "N/A",
1495
+ # "Reasoning": "Skipped to reduce processing time",
1496
+ # "Improvements": []
1497
+ # }
1498
+ # state["questions"].append(first_q)
1499
+ # state["question_evaluations"].append(q_eval)
1500
+
1501
+
1502
+ # state["conversation_history"].append({'role': 'Interviewer', 'content': first_q})
1503
+ # start = time.perf_counter()
1504
+ # audio_path = bark_tts(first_q)
1505
+ # print("⏱️ Bark TTS took", time.perf_counter() - start, "seconds")
1506
+
1507
+ # # LOG
1508
+ # state["log"].append({"type": "question", "question": first_q, "question_eval": q_eval, "timestamp": time.time()})
1509
+ # return state, gr.update(visible=False), gr.update(visible=True), audio_path, f"*Question 1:* {first_q}"
1510
+ # start_interview_final_btn.click(start_interview, [user_data], [interview_state, interview_pre_section, interview_section, question_audio, question_text])
1511
+
1512
+ # def transcribe(audio_path):
1513
+ # return whisper_stt(audio_path)
1514
+ # user_audio_input.change(transcribe, user_audio_input, stt_transcript)
1515
+
1516
+ # def process_answer(transcript, audio_path, state, data):
1517
+ # if not transcript:
1518
+ # return state, gr.update(), gr.update(), gr.update(), gr.update(), gr.update(), gr.update()
1519
+
1520
+ # elapsed = round(time.time() - state.get("q_start_time", time.time()), 2)
1521
+ # state["timings"].append(elapsed)
1522
+ # state["answers"].append(transcript)
1523
+ # state["conversation_history"].append({'role': 'Candidate', 'content': transcript})
1524
+
1525
+ # # --- 1. Emotion analysis (simplified for testing) ---
1526
+ # voice_label = "neutral"
1527
+ # face_label = "neutral"
1528
+ # state["voice_labels"].append(voice_label)
1529
+ # state["face_labels"].append(face_label)
1530
+
1531
+ # # --- 2. Evaluate previous Q and Answer ---
1532
+ # last_q = state["questions"][-1]
1533
+ # q_eval = state["question_evaluations"][-1] # Already in state
1534
+ # ref_answer = generate_reference_answer(last_q, data["job_role"], data["seniority"])
1535
+ # answer_eval = evaluate_answer(last_q, transcript, ref_answer, data["job_role"], data["seniority"], None)
1536
+ # state["answer_evaluations"].append(answer_eval)
1537
+ # answer_score = answer_eval.get("Score", "medium") if answer_eval else "medium"
1538
+
1539
+ # # --- 3. Adaptive difficulty ---
1540
+ # if answer_score == "excellent":
1541
+ # state["difficulty_adjustment"] = "harder"
1542
+ # elif answer_score in ("medium", "poor"):
1543
+ # state["difficulty_adjustment"] = "easier"
1544
+ # else:
1545
+ # state["difficulty_adjustment"] = None
1546
+
1547
+ # # --- 4. Effective confidence (simplified) ---
1548
+ # eff_conf = {"effective_confidence": 0.6}
1549
+ # state["effective_confidences"].append(eff_conf)
1550
+
1551
+ # # --- LOG ---
1552
+ # state["log"].append({
1553
+ # "type": "answer",
1554
+ # "question": last_q,
1555
+ # "answer": transcript,
1556
+ # "answer_eval": answer_eval,
1557
+ # "ref_answer": ref_answer,
1558
+ # "face_label": face_label,
1559
+ # "voice_label": voice_label,
1560
+ # "effective_confidence": eff_conf,
1561
+ # "timing": elapsed,
1562
+ # "timestamp": time.time()
1563
+ # })
1564
+
1565
+ # # --- Next or End ---
1566
+ # qidx = state["question_idx"] + 1
1567
+ # if qidx >= state["max_questions"]:
1568
+ # # Save as JSON (optionally)
1569
+ # timestamp = time.strftime("%Y%m%d_%H%M%S")
1570
+ # log_file = f"interview_log_{timestamp}.json"
1571
+ # with open(log_file, "w", encoding="utf-8") as f:
1572
+ # json.dump(state["log"], f, indent=2, ensure_ascii=False)
1573
+ # # Report
1574
+ # summary = "# Interview Summary\n"
1575
+ # for i, q in enumerate(state["questions"]):
1576
+ # summary += (f"\n### Q{i + 1}: {q}\n"
1577
+ # f"- *Answer*: {state['answers'][i]}\n"
1578
+ # f"- *Q Eval*: {state['question_evaluations'][i]}\n"
1579
+ # f"- *A Eval*: {state['answer_evaluations'][i]}\n"
1580
+ # f"- *Time*: {state['timings'][i]}s\n")
1581
+ # summary += f"\n\n⏺ Full log saved as {log_file}."
1582
+ # return (state, gr.update(visible=True, value=summary), gr.update(value=None), gr.update(value=None), gr.update(value=None), gr.update(value=None), gr.update(visible=True, value=f"Last Detected — Face: {face_label}, Voice: {voice_label}"))
1583
+ # else:
1584
+ # # --- Build next prompt using adaptive difficulty ---
1585
+ # state["question_idx"] = qidx
1586
+ # state["q_start_time"] = time.time()
1587
+ # context = "" # You can add your context logic here
1588
+ # prompt = build_interview_prompt(
1589
+ # conversation_history=state["conversation_history"],
1590
+ # user_response=transcript,
1591
+ # context=context,
1592
+ # job_role=data["job_role"],
1593
+ # skills=data["skills"],
1594
+ # seniority=data["seniority"],
1595
+ # difficulty_adjustment=state["difficulty_adjustment"],
1596
+ # voice_label=voice_label,
1597
+ # )
1598
+ # next_q = groq_llm.predict(prompt)
1599
+ # # Evaluate Q quality
1600
+ # q_eval = eval_question_quality(next_q, data["job_role"], data["seniority"], None)
1601
+ # state["questions"].append(next_q)
1602
+ # state["question_evaluations"].append(q_eval)
1603
+ # state["conversation_history"].append({'role': 'Interviewer', 'content': next_q})
1604
+ # state["log"].append({"type": "question", "question": next_q, "question_eval": q_eval, "timestamp": time.time()})
1605
+ # audio_path = bark_tts(next_q)
1606
+ # # Display evaluations
1607
+ # eval_md = f"*Last Answer Eval:* {answer_eval}\n\n*Effective Confidence:* {eff_conf}"
1608
+ # return (
1609
+ # state, gr.update(visible=False), audio_path, f"*Question {qidx + 1}:* {next_q}",
1610
+ # gr.update(value=None), gr.update(value=None),
1611
+ # gr.update(visible=True, value=eval_md),
1612
+ # )
1613
+ # # Replace your confirm_btn.click with this:
1614
+ # confirm_btn.click(
1615
+ # process_answer,
1616
+ # [stt_transcript, user_audio_input, interview_state, user_data], # Added None for video_path
1617
+ # [interview_state, interview_summary, question_audio, question_text, user_audio_input, stt_transcript, evaluation_display]
1618
+ # ).then(
1619
+ # lambda: (gr.update(value=None), gr.update(value=None)), None, [user_audio_input, stt_transcript]
1620
+ # )
1621
+
1622
+ # demo.launch(debug=True)
1623
+ import gradio as gr
1624
+ import time
1625
+ import tempfile
1626
+ import numpy as np
1627
+ import scipy.io.wavfile as wavfile
1628
+ import os
1629
+ import json
1630
+ import edge_tts
1631
+ import torch, gc
1632
+ from faster_whisper import WhisperModel
1633
+ import asyncio
1634
+ import threading
1635
+ from concurrent.futures import ThreadPoolExecutor
1636
+
1637
+ print(torch.cuda.is_available())
1638
+ torch.cuda.empty_cache()
1639
+ gc.collect()
1640
+
1641
+ # Global variables for lazy loading
1642
+ faster_whisper_model = None
1643
+ tts_voice = "en-US-AriaNeural"
1644
+
1645
+
1646
+ # Thread pool for async operations
1647
+ executor = ThreadPoolExecutor(max_workers=2)
1648
+
1649
+ # Add after your imports
1650
+ if torch.cuda.is_available():
1651
+ print(f"🔥 CUDA Available: {torch.cuda.get_device_name(0)}")
1652
+ print(f"🔥 CUDA Memory: {torch.cuda.get_device_properties(0).total_memory / 1024**3:.1f} GB")
1653
+ # Set default device
1654
+ torch.cuda.set_device(0)
1655
+ else:
1656
+ print("⚠️ CUDA not available, using CPU")
1657
+
1658
+ def load_models_lazy():
1659
+ """Load models only when needed"""
1660
+ global faster_whisper_model
1661
+
1662
+ device = "cuda" if torch.cuda.is_available() else "cpu"
1663
+ print(f"🔁 Using device: {device}")
1664
+
1665
+ if faster_whisper_model is None:
1666
+ print("🔁 Loading Faster-Whisper model...")
1667
+ compute_type = "float16" if device == "cuda" else "int8"
1668
+ faster_whisper_model = WhisperModel("base", device=device, compute_type=compute_type)
1669
+ print(f"✅ Faster-Whisper model loaded on {device}")
1670
+
1671
+
1672
+ async def edge_tts_to_file(text, output_path="tts.wav", voice=tts_voice):
1673
+ communicate = edge_tts.Communicate(text, voice)
1674
+ await communicate.save(output_path)
1675
+ return output_path
1676
+
1677
+ def tts_async(text):
1678
+ # Create and drive the event loop inside the worker thread; sharing a
1679
+ # loop across threads (as before) is fragile.
1680
+ return executor.submit(lambda: asyncio.run(edge_tts_to_file(text)))
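+ # Example (illustrative): kick off TTS in the background, collect the wav later.
+ # future = tts_async("Tell me about yourself.")
+ # ...do other work...
+ # wav_path = future.result()  # blocks until edge-tts has written tts.wav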
1681
+
1682
+
1683
+
1684
+
1685
+ def whisper_stt(audio_path):
1686
+ """STT using Faster-Whisper"""
1687
+ if not audio_path or not os.path.exists(audio_path):
1688
+ return ""
1689
+
1690
+ load_models_lazy()
1691
+ print("🔁 Transcribing with Faster-Whisper")
1692
+
1693
+ segments, _ = faster_whisper_model.transcribe(audio_path)
1694
+ transcript = " ".join(segment.text for segment in segments)
1695
+ return transcript.strip()
1696
+
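+ # Example: whisper_stt("answer.wav") -> "I have five years of experience ..." (hypothetical output)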
1697
+
1698
+ seniority_mapping = {
1699
+ "Entry-level": 1, "Junior": 2, "Mid-Level": 3, "Senior": 4, "Lead": 5
1700
+ }
1701
+
1702
+ with gr.Blocks(theme=gr.themes.Soft()) as demo:
1703
+ user_data = gr.State({})
1704
+ interview_state = gr.State({})
1705
+ missing_fields_state = gr.State([])
1706
+ tts_future = gr.State(None) # Store async TTS future
1707
+
1708
+ with gr.Column(visible=True) as user_info_section:
1709
+ gr.Markdown("## Candidate Information")
1710
+ cv_file = gr.File(label="Upload CV")
1711
+ job_desc = gr.Textbox(label="Job Description")
1712
+ start_btn = gr.Button("Continue", interactive=False)
1713
+
1714
+ with gr.Column(visible=False) as missing_section:
1715
+ gr.Markdown("## Missing Information")
1716
+ name_in = gr.Textbox(label="Name", visible=False)
1717
+ role_in = gr.Textbox(label="Job Role", visible=False)
1718
+ seniority_in = gr.Dropdown(list(seniority_mapping.keys()), label="Seniority", visible=False)
1719
+ skills_in = gr.Textbox(label="Skills", visible=False)
1720
+ submit_btn = gr.Button("Submit", interactive=False)
1721
+
1722
+ with gr.Column(visible=False) as interview_pre_section:
1723
+ pre_interview_greeting_md = gr.Markdown()
1724
+ start_interview_final_btn = gr.Button("Start Interview")
1725
+ loading_status = gr.Markdown("", visible=False)
1726
+
1727
+ with gr.Column(visible=False) as interview_section:
1728
+ gr.Markdown("## Interview in Progress")
1729
+ question_audio = gr.Audio(label="Listen", interactive=False, autoplay=True)
1730
+ question_text = gr.Markdown()
1731
+ user_audio_input = gr.Audio(sources=["microphone"], type="filepath", label="1. Record Audio Answer")
1732
+ stt_transcript = gr.Textbox(label="Transcribed Answer (edit if needed)")
1733
+ confirm_btn = gr.Button("Confirm Answer")
1734
+ evaluation_display = gr.Markdown()
1735
+ interview_summary = gr.Markdown(visible=False)
1736
+
1737
+ def validate_start_btn(cv_file, job_desc):
1738
+ return gr.update(interactive=(cv_file is not None and hasattr(cv_file, "name") and bool(job_desc and job_desc.strip())))
1739
+
1740
+ cv_file.change(validate_start_btn, [cv_file, job_desc], start_btn)
1741
+ job_desc.change(validate_start_btn, [cv_file, job_desc], start_btn)
1742
+
1743
+ def process_and_route_initial(cv_file, job_desc):
1744
+ details = extract_candidate_details(cv_file.name)
1745
+ job_info = extract_job_details(job_desc)
1746
+ data = {
1747
+ "name": details.get("name", "unknown"),
1748
+ "job_role": job_info.get("job_title", "unknown"),
1749
+ "seniority": job_info.get("experience_level", "unknown"),
1750
+ "skills": job_info.get("skills", [])
1751
+ }
1752
+ missing = [k for k, v in data.items() if (isinstance(v, str) and v.lower() == "unknown") or not v]
1753
+ if missing:
1754
+ return data, missing, gr.update(visible=False), gr.update(visible=True), gr.update(visible=False)
1755
+ else:
1756
+ greeting = f"Hello {data['name']}, your profile is ready. Click 'Start Interview' when ready."
1757
+ return data, missing, gr.update(visible=False), gr.update(visible=False), gr.update(visible=True, value=greeting)
1758
+
1759
+ start_btn.click(process_and_route_initial, [cv_file, job_desc], [user_data, missing_fields_state, user_info_section, missing_section, pre_interview_greeting_md])
1760
+
1761
+ def show_missing(missing):
1762
+ if missing is None: missing = []
1763
+ return gr.update(visible="name" in missing), gr.update(visible="job_role" in missing), gr.update(visible="seniority" in missing), gr.update(visible="skills" in missing)
1764
+
1765
+ missing_fields_state.change(show_missing, missing_fields_state, [name_in, role_in, seniority_in, skills_in])
1766
+
1767
+ def validate_fields(name, role, seniority, skills, missing):
1768
+ if not missing: return gr.update(interactive=False)
1769
+ all_filled = all([(not ("name" in missing) or bool(name.strip())), (not ("job_role" in missing) or bool(role.strip())), (not ("seniority" in missing) or bool(seniority)), (not ("skills" in missing) or bool(skills.strip()))])
1770
+ return gr.update(interactive=all_filled)
1771
+
1772
+ for inp in [name_in, role_in, seniority_in, skills_in]:
1773
+ inp.change(validate_fields, [name_in, role_in, seniority_in, skills_in, missing_fields_state], submit_btn)
1774
+
1775
+ def complete_manual(data, name, role, seniority, skills):
1776
+ if data["name"].lower() == "unknown": data["name"] = name
1777
+ if data["job_role"].lower() == "unknown": data["job_role"] = role
1778
+ if data["seniority"].lower() == "unknown": data["seniority"] = seniority
1779
+ if not data["skills"]: data["skills"] = [s.strip() for s in skills.split(",")]
1780
+ greeting = f"Hello {data['name']}, your profile is ready. Click 'Start Interview' to begin."
1781
+ return data, gr.update(visible=False), gr.update(visible=True), gr.update(value=greeting)
1782
+
1783
+ submit_btn.click(complete_manual, [user_data, name_in, role_in, seniority_in, skills_in], [user_data, missing_section, interview_pre_section, pre_interview_greeting_md])
1784
+
1785
+ async def start_interview(data):
1786
+ # Initialize interview state
1787
+ state = {
1788
+ "questions": [],
1789
+ "answers": [],
1790
+ "timings": [],
1791
+ "question_evaluations": [],
1792
+ "answer_evaluations": [],
1793
+ "conversation_history": [],
1794
+ "difficulty_adjustment": None,
1795
+ "question_idx": 0,
1796
+ "max_questions": 3,
1797
+ "q_start_time": time.time(),
1798
+ "log": []
1799
+ }
1800
+
1801
+ # Build prompt for first question
1802
+ context = ""
1803
+ prompt = build_interview_prompt(
1804
+ conversation_history=[],
1805
+ user_response="",
1806
+ context=context,
1807
+ job_role=data["job_role"],
1808
+ skills=data["skills"],
1809
+ seniority=data["seniority"],
1810
+ difficulty_adjustment=None,
1811
+ voice_label="neutral"
1812
+ )
1813
+
1814
+ # Generate first question
1815
+ start = time.time()
1816
+ first_q = groq_llm.predict(prompt)
1817
+ print("⏱️ Groq LLM Response Time:", round(time.time() - start, 2), "seconds")
1818
+ q_eval = {
1819
+ "Score": "N/A",
1820
+ "Reasoning": "Skipped to reduce processing time",
1821
+ "Improvements": []
1822
+ }
1823
+
1824
+ state["questions"].append(first_q)
1825
+ state["question_evaluations"].append(q_eval)
1826
+ state["conversation_history"].append({'role': 'Interviewer', 'content': first_q})
1827
+
1828
+ # Generate audio with edge-tts (awaited so the first question has sound)
1829
+ start = time.perf_counter()
1830
+ cleaned_text = first_q.strip().replace("\n", " ")
1831
+ audio_path = await edge_tts_to_file(cleaned_text)
1832
+ print("⏱️ TTS (edge-tts) took", round(time.perf_counter() - start, 2), "seconds")
1833
+
1834
+ # Log question
1835
+ state["log"].append({
1836
+ "type": "question",
1837
+ "question": first_q,
1838
+ "question_eval": q_eval,
1839
+ "timestamp": time.time()
1840
+ })
1841
+
1842
+ return (
1843
+ state,
1844
+ gr.update(visible=False), # Hide interview_pre_section
1845
+ gr.update(visible=True), # Show interview_section
1846
+ audio_path, # Set audio
1847
+ f"*Question 1:* {first_q}" # Set question text
1848
+ )
1849
+
1850
+ # Hook into Gradio
1851
+ start_interview_final_btn.click(
1852
+ fn=start_interview,
1853
+ inputs=[user_data],
1854
+ outputs=[interview_state, interview_pre_section, interview_section, question_audio, question_text],
1855
+ concurrency_limit=1
1856
+ )
1857
+
1858
+
1859
+ def transcribe(audio_path):
1860
+ return whisper_stt(audio_path)
1861
+
1862
+ user_audio_input.change(transcribe, user_audio_input, stt_transcript)
1863
+
1864
+ async def process_answer(transcript, audio_path, state, data):
1865
+ func_start = time.time()
1866
+ if not transcript:
1867
+ return state, gr.update(), gr.update(), gr.update(), gr.update(), gr.update(), gr.update()
1868
+
1869
+ elapsed = round(time.time() - state.get("q_start_time", time.time()), 2)
1870
+ state["timings"].append(elapsed)
1871
+ state["answers"].append(transcript)
1872
+ state["conversation_history"].append({'role': 'Candidate', 'content': transcript})
1873
+
1874
+ last_q = state["questions"][-1]
1875
+ q_eval = state["question_evaluations"][-1]
1876
+ ref_answer = generate_reference_answer(last_q, data["job_role"], data["seniority"])
1877
+ answer_eval = await asyncio.get_event_loop().run_in_executor(
1878
+ executor,
1879
+ evaluate_answer,
1880
+ last_q, transcript, ref_answer, data["job_role"], data["seniority"]
1881
+ )
1882
+
1883
+ state["answer_evaluations"].append(answer_eval)
1884
+ answer_score = answer_eval.get("Score", "medium") if answer_eval else "medium"
1885
+
1886
+ if answer_score == "excellent":
1887
+ state["difficulty_adjustment"] = "harder"
1888
+ elif answer_score in ("medium", "poor"):
1889
+ state["difficulty_adjustment"] = "easier"
1890
+ else:
1891
+ state["difficulty_adjustment"] = None
1892
+
1893
+ state["log"].append({
1894
+ "type": "answer", "question": last_q, "answer": transcript,
1895
+ "answer_eval": answer_eval, "ref_answer": ref_answer,
1896
+ "timing": elapsed, "timestamp": time.time()
1897
+ })
1898
+
1899
+ qidx = state["question_idx"] + 1
1900
+ if qidx >= state["max_questions"]:
1901
+ timestamp = time.strftime("%Y%m%d_%H%M%S")
1902
+ log_file = f"interview_log_{timestamp}.json"
1903
+ with open(log_file, "w", encoding="utf-8") as f:
1904
+ json.dump(state["log"], f, indent=2, ensure_ascii=False)
1905
+ summary = "# Interview Summary\n"
1906
+ for i, q in enumerate(state["questions"]):
1907
+ summary += (f"\n### Q{i + 1}: {q}\n"
1908
+ f"- *Answer*: {state['answers'][i]}\n"
1909
+ f"- *Q Eval*: {state['question_evaluations'][i]}\n"
1910
+ f"- *A Eval*: {state['answer_evaluations'][i]}\n"
1911
+ f"- *Time*: {state['timings'][i]}s\n")
1912
+ summary += f"\n\n⏺ Full log saved as {log_file}."
1913
+ return state, gr.update(visible=True, value=summary), gr.update(value=None), gr.update(value=None), gr.update(value=None), gr.update(value=None), gr.update(visible=False)
1914
+ else:
1915
+ state["question_idx"] = qidx
1916
+ state["q_start_time"] = time.time()
1917
+ context = ""
1918
+ prompt = build_interview_prompt(
1919
+ conversation_history=state["conversation_history"],
1920
+ user_response=transcript, context=context,
1921
+ job_role=data["job_role"], skills=data["skills"],
1922
+ seniority=data["seniority"], difficulty_adjustment=state["difficulty_adjustment"],
1923
+ voice_label="neutral"
1924
+ )
1925
+ start = time.time()
1926
+ next_q = groq_llm.predict(prompt)
1927
+ print("⏱️ Groq LLM Response Time:", round(time.time() - start, 2), "seconds")
1928
+ start = time.time()
1929
+ q_eval_future = executor.submit(
1930
+ eval_question_quality,
1931
+ next_q, data["job_role"], data["seniority"]
1932
+ )
1933
+ q_eval = q_eval_future.result()
1934
+ print("⏱️ Evaluation time:", round(time.time() - start, 2), "seconds")
1935
+ state["questions"].append(next_q)
1936
+ state["question_evaluations"].append(q_eval)
1937
+ state["conversation_history"].append({'role': 'Interviewer', 'content': next_q})
1938
+ state["log"].append({"type": "question", "question": next_q, "question_eval": q_eval, "timestamp": time.time()})
1939
+
1940
+ audio_path = await edge_tts_to_file(next_q)
1941
+
1942
+
1943
+ eval_md = f"*Last Answer Eval:* {answer_eval}"
1944
+ print("✅ process_answer time:", round(time.time() - start, 2), "s")
1945
+ return state, gr.update(visible=False), audio_path, f"*Question {qidx + 1}:* {next_q}", gr.update(value=None), gr.update(value=None), gr.update(visible=True, value=eval_md)
1946
+
1947
+
1948
+ confirm_btn.click(
1949
+ fn=process_answer,
1950
+ inputs=[stt_transcript, user_audio_input, interview_state, user_data],
1951
+ outputs=[interview_state, interview_summary, question_audio, question_text, user_audio_input, stt_transcript,
1952
+ evaluation_display],
1953
+ concurrency_limit=1
1954
+ ).then(
1955
+ lambda: (gr.update(value=None), gr.update(value=None)), None, [user_audio_input, stt_transcript]
1956
+ )
1957
+
1958
+ demo.launch(debug=True)
backend/templates/apply.html CHANGED
@@ -24,87 +24,62 @@
24
 
25
  <div class="card">
26
  <div class="card-header">
27
- <h2>Complete Your Application</h2>
28
- <p>Upload your resume to auto-fill fields or complete the form manually</p>
29
  </div>
30
 
31
  <div class="card-body">
 
32
  <form method="POST" enctype="multipart/form-data">
33
- {{ form.hidden_tag() }}
34
- {{ form.job_id }}
35
-
36
  <div class="form-group">
37
  <label for="resume">Upload Resume</label>
38
- {{ form.resume(class="form-control", id="resume", required=True) }}
39
- </div>
40
-
41
- <div class="form-group">
42
- {{ form.name.label }}
43
- {{ form.name(class="form-control", id="name", placeholder="Enter your full name") }}
44
  </div>
45
 
46
- <div class="form-group">
47
- {{ form.email.label }}
48
- {{ form.email(class="form-control", id="email", placeholder="Enter your email address") }}
49
- </div>
50
-
51
- <div class="form-group">
52
- <label for="phone">Phone Number</label>
53
- <input type="text" id="phone" class="form-control" placeholder="Enter your phone number">
54
- </div>
55
-
56
- <div class="form-group">
57
- <label for="skills">Skills</label>
58
- <textarea id="skills" class="form-control"
59
- placeholder="Skills extracted from your resume..."></textarea>
60
- </div>
61
-
62
- <div class="form-group">
63
- <label for="experience">Previous Experience</label>
64
- <textarea id="experience" class="form-control"
65
- placeholder="Experience extracted from your resume..."></textarea>
66
- </div>
67
-
68
- <div class="form-group">
69
- {{ form.cover_letter.label }}
70
- {{ form.cover_letter(class="form-control", placeholder="Enter your cover letter here...") }}
71
- </div>
72
-
73
- <div style="display: flex; justify-content: space-between; align-items: center; margin-top: 2rem;">
74
- <a href="{{ url_for('job_detail', job_id=job.id) }}" class="btn btn-outline">Cancel</a>
75
- {{ form.submit(class="btn btn-primary") }}
76
  </div>
77
  </form>
78
 
 
 
 
79
  </div>
80
  </div>
81
  </section>
82
 
83
- <script src="https://code.jquery.com/jquery-3.6.0.min.js"></script>
84
- <script>
85
- $(document).ready(function () {
86
- $("#resume").on("change", function () {
87
- var formData = new FormData();
88
- formData.append("resume", $("#resume")[0].files[0]);
89
-
90
- $.ajax({
91
- url: "{{ url_for('parse_resume') }}",
92
- type: "POST",
93
- data: formData,
94
- processData: false,
95
- contentType: false,
96
- success: function (data) {
97
- $("#name").val(data.name);
98
- $("#email").val(data.email);
99
- $("#phone").val(data.mobile_number);
100
- $("#skills").val(data.skills.join(", "));
101
- $("#experience").val(data.experience.join("\n"));
102
- },
103
- error: function () {
104
- alert("Error parsing the resume. Please try again.");
105
- }
106
- });
107
- });
108
- });
109
- </script>
110
- {% endblock %}
 
 
 
 
 
 
 
 
24
 
25
  <div class="card">
26
  <div class="card-header">
27
+ <h2>Submit Your Application</h2>
28
+ <p>Please upload your resume (PDF, DOCX). Our system will extract your info automatically.</p>
29
  </div>
30
 
31
  <div class="card-body">
32
+ <!-- Application Form -->
33
  <form method="POST" enctype="multipart/form-data">
 
 
 
34
  <div class="form-group">
35
  <label for="resume">Upload Resume</label>
36
+ <input type="file" name="resume" id="resume" class="form-control" required accept=".pdf,.doc,.docx">
 
 
 
 
 
37
  </div>
38
 
39
+ <div class="application-actions" style="margin-top: 2rem;">
40
+ <button type="submit" class="btn btn-primary">Submit Application</button>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
41
  </div>
42
  </form>
43
 
44
+ <div style="margin-top: 1.5rem; text-align: center;">
45
+ <a href="{{ url_for('job_detail', job_id=job.id) }}" class="btn btn-outline">Back to Job Details</a>
46
+ </div>
47
  </div>
48
  </div>
49
  </section>
50
 
51
+ <style>
52
+ .form-group label {
53
+ font-weight: 600;
54
+ color: var(--primary);
55
+ margin-bottom: 0.5rem;
56
+ display: block;
57
+ }
58
+
59
+ .form-control {
60
+ width: 100%;
61
+ padding: 0.75rem;
62
+ font-size: 1rem;
63
+ border-radius: 6px;
64
+ border: 1px solid #ccc;
65
+ }
66
+
67
+ .application-actions {
68
+ text-align: center;
69
+ }
70
+
71
+ .btn-primary {
72
+ background: linear-gradient(135deg, var(--primary), var(--secondary));
73
+ color: white;
74
+ padding: 0.75rem 1.5rem;
75
+ font-weight: 500;
76
+ border: none;
77
+ border-radius: 6px;
78
+ cursor: pointer;
79
+ }
80
+
81
+ .btn-primary:hover {
82
+ opacity: 0.9;
83
+ }
84
+ </style>
85
+ {% endblock %}
backend/templates/interview.html ADDED
@@ -0,0 +1,833 @@
1
+ <!DOCTYPE html>
2
+ <html lang="en">
3
+ <head>
4
+ <meta charset="UTF-8">
5
+ <meta name="viewport" content="width=device-width, initial-scale=1.0">
6
+ <title>AI Interview - Interactive Session</title>
7
+ <style>
8
+ * {
9
+ margin: 0;
10
+ padding: 0;
11
+ box-sizing: border-box;
12
+ }
13
+
14
+ body {
15
+ font-family: 'Segoe UI', Tahoma, Geneva, Verdana, sans-serif;
16
+ background: linear-gradient(135deg, #667eea 0%, #764ba2 100%);
17
+ min-height: 100vh;
18
+ display: flex;
19
+ justify-content: center;
20
+     align-items: center;
+     padding: 20px;
+ }
+
+ .interview-container {
+     background: white;
+     border-radius: 20px;
+     box-shadow: 0 20px 60px rgba(0, 0, 0, 0.1);
+     width: 100%;
+     max-width: 800px;
+     min-height: 600px;
+     display: flex;
+     flex-direction: column;
+     overflow: hidden;
+ }
+
+ .header {
+     background: linear-gradient(45deg, #4CAF50, #45a049);
+     color: white;
+     padding: 20px;
+     text-align: center;
+     position: relative;
+ }
+
+ .header h1 {
+     font-size: 1.8rem;
+     margin-bottom: 5px;
+ }
+
+ .header p {
+     opacity: 0.9;
+     font-size: 0.9rem;
+ }
+
+ .chat-area {
+     flex: 1;
+     padding: 20px;
+     display: flex;
+     flex-direction: column;
+     gap: 20px;
+     max-height: 400px;
+     overflow-y: auto;
+ }
+
+ .ai-message {
+     display: flex;
+     align-items: flex-start;
+     gap: 15px;
+     animation: slideIn 0.5s ease-out;
+ }
+
+ .ai-avatar {
+     width: 60px;
+     height: 60px;
+     border-radius: 50%;
+     background: linear-gradient(45deg, #667eea, #764ba2);
+     display: flex;
+     align-items: center;
+     justify-content: center;
+     color: white;
+     font-weight: bold;
+     font-size: 1.2rem;
+     position: relative;
+     flex-shrink: 0;
+ }
+
+ .ai-avatar.talking {
+     animation: pulse 1.5s infinite;
+ }
+
+ .ai-avatar.talking::before {
+     content: '';
+     position: absolute;
+     width: 100%;
+     height: 100%;
+     border-radius: 50%;
+     background: rgba(102, 126, 234, 0.3);
+     animation: ripple 1.5s infinite;
+ }
+
+ .message-bubble {
+     background: #f8f9fa;
+     border-radius: 15px;
+     padding: 15px 20px;
+     max-width: 70%;
+     position: relative;
+ }
+
+ .message-bubble::before {
+     content: '';
+     position: absolute;
+     left: -10px;
+     top: 15px;
+     width: 0;
+     height: 0;
+     border-top: 10px solid transparent;
+     border-bottom: 10px solid transparent;
+     border-right: 10px solid #f8f9fa;
+ }
+
+ .user-message {
+     display: flex;
+     justify-content: flex-end;
+     animation: slideIn 0.5s ease-out;
+ }
+
+ .user-bubble {
+     background: linear-gradient(45deg, #4CAF50, #45a049);
+     color: white;
+     border-radius: 15px;
+     padding: 15px 20px;
+     max-width: 70%;
+     position: relative;
+ }
+
+ .user-bubble::before {
+     content: '';
+     position: absolute;
+     right: -10px;
+     top: 15px;
+     width: 0;
+     height: 0;
+     border-top: 10px solid transparent;
+     border-bottom: 10px solid transparent;
+     border-left: 10px solid #4CAF50;
+ }
+
+ .controls-area {
+     background: #f8f9fa;
+     padding: 20px;
+     border-top: 1px solid #e9ecef;
+ }
+
+ .recording-section {
+     display: flex;
+     flex-direction: column;
+     gap: 15px;
+ }
+
+ .mic-container {
+     display: flex;
+     justify-content: center;
+     align-items: center;
+     gap: 20px;
+ }
+
+ .mic-button {
+     width: 80px;
+     height: 80px;
+     border-radius: 50%;
+     border: none;
+     background: linear-gradient(45deg, #ff6b6b, #ee5a52);
+     color: white;
+     font-size: 1.8rem;
+     cursor: pointer;
+     transition: all 0.3s ease;
+     display: flex;
+     align-items: center;
+     justify-content: center;
+     position: relative;
+ }
+
+ .mic-button:hover {
+     transform: scale(1.05);
+     box-shadow: 0 8px 25px rgba(255, 107, 107, 0.3);
+ }
+
+ .mic-button.recording {
+     background: linear-gradient(45deg, #ff4757, #ff3742);
+     animation: recordPulse 1s infinite;
+ }
+
+ .mic-button.recording::before {
+     content: '';
+     position: absolute;
+     width: 100%;
+     height: 100%;
+     border-radius: 50%;
+     background: rgba(255, 71, 87, 0.3);
+     animation: ripple 1s infinite;
+ }
+
+ .recording-status {
+     font-size: 0.9rem;
+     color: #666;
+     text-align: center;
+ }
+
+ .transcript-area {
+     background: white;
+     border: 2px solid #e9ecef;
+     border-radius: 10px;
+     padding: 15px;
+     font-size: 0.9rem;
+     color: #333;
+     min-height: 60px;
+     max-height: 120px;
+     overflow-y: auto;
+     transition: border-color 0.3s ease;
+ }
+
+ .transcript-area:focus {
+     outline: none;
+     border-color: #4CAF50;
+ }
+
+ .action-buttons {
+     display: flex;
+     gap: 10px;
+     justify-content: center;
+     margin-top: 15px;
+ }
+
+ .btn {
+     padding: 12px 24px;
+     border: none;
+     border-radius: 8px;
+     cursor: pointer;
+     font-size: 1rem;
+     font-weight: 500;
+     transition: all 0.3s ease;
+     display: flex;
+     align-items: center;
+     gap: 8px;
+ }
+
+ .btn-primary {
+     background: linear-gradient(45deg, #4CAF50, #45a049);
+     color: white;
+ }
+
+ .btn-primary:hover {
+     transform: translateY(-2px);
+     box-shadow: 0 5px 15px rgba(76, 175, 80, 0.3);
+ }
+
+ .btn-secondary {
+     background: #6c757d;
+     color: white;
+ }
+
+ .btn-secondary:hover {
+     background: #545b62;
+     transform: translateY(-2px);
+ }
+
+ .btn:disabled {
+     opacity: 0.6;
+     cursor: not-allowed;
+     transform: none;
+ }
+
+ .question-counter {
+     position: absolute;
+     top: 15px;
+     right: 20px;
+     background: rgba(255, 255, 255, 0.2);
+     padding: 5px 12px;
+     border-radius: 20px;
+     font-size: 0.8rem;
+ }
+
+ .loading {
+     display: inline-block;
+     width: 20px;
+     height: 20px;
+     border: 3px solid rgba(255, 255, 255, 0.3);
+     border-radius: 50%;
+     border-top-color: white;
+     animation: spin 1s ease-in-out infinite;
+ }
+
+ .summary-panel {
+     display: none;
+     background: white;
+     border-radius: 15px;
+     padding: 30px;
+     margin: 20px;
+     box-shadow: 0 10px 30px rgba(0, 0, 0, 0.1);
+ }
+
+ .summary-panel h2 {
+     color: #333;
+     margin-bottom: 20px;
+     text-align: center;
+ }
+
+ .summary-item {
+     background: #f8f9fa;
+     border-radius: 10px;
+     padding: 15px;
+     margin-bottom: 15px;
+     border-left: 4px solid #4CAF50;
+ }
+
+ .summary-item h4 {
+     color: #333;
+     margin-bottom: 8px;
+ }
+
+ .summary-item p {
+     color: #666;
+     margin-bottom: 5px;
+     line-height: 1.4;
+ }
+
+ .evaluation-score {
+     display: inline-block;
+     background: #4CAF50;
+     color: white;
+     padding: 4px 8px;
+     border-radius: 15px;
+     font-size: 0.8rem;
+     font-weight: bold;
+ }
+
+ @keyframes slideIn {
+     from {
+         opacity: 0;
+         transform: translateY(20px);
+     }
+     to {
+         opacity: 1;
+         transform: translateY(0);
+     }
+ }
+
+ @keyframes pulse {
+     0%, 100% { transform: scale(1); }
+     50% { transform: scale(1.1); }
+ }
+
+ @keyframes ripple {
+     0% {
+         transform: scale(1);
+         opacity: 1;
+     }
+     100% {
+         transform: scale(1.4);
+         opacity: 0;
+     }
+ }
+
+ @keyframes recordPulse {
+     0%, 100% { transform: scale(1); }
+     50% { transform: scale(1.05); }
+ }
+
+ @keyframes spin {
+     to { transform: rotate(360deg); }
+ }
+
+ @media (max-width: 768px) {
+     .interview-container {
+         margin: 10px;
+         min-height: 90vh;
+     }
+
+     .mic-button {
+         width: 70px;
+         height: 70px;
+         font-size: 1.5rem;
+     }
+
+     .message-bubble, .user-bubble {
+         max-width: 85%;
+     }
+
+     .header h1 {
+         font-size: 1.5rem;
+     }
+ }
+
+ /* Hide default audio controls */
+ audio {
+     display: none;
+ }
+ </style>
+ </head>
+ <body>
+     <div class="interview-container">
+         <div class="header">
+             <div class="question-counter">
+                 Question <span id="currentQuestionNum">1</span> of <span id="totalQuestions">3</span>
+             </div>
+             <h1>🤖 AI Interview Assistant</h1>
+             <p>Answer thoughtfully and take your time</p>
+         </div>
+
+         <div class="chat-area" id="chatArea">
+             <div class="ai-message">
+                 <div class="ai-avatar" id="aiAvatar">AI</div>
+                 <div class="message-bubble">
+                     <div id="loadingMessage">
+                         <div class="loading"></div>
+                         <span style="margin-left: 10px;">Generating your first question...</span>
+                     </div>
+                 </div>
+             </div>
+         </div>
+
+         <div class="controls-area">
+             <div class="recording-section">
+                 <div class="mic-container">
+                     <button class="mic-button" id="micButton" disabled>
+                         <span id="micIcon">🎤</span>
+                     </button>
+                 </div>
+                 <div class="recording-status" id="recordingStatus">
+                     Click and hold the microphone to record your answer
+                 </div>
+
+                 <div class="transcript-area" id="transcriptArea" contenteditable="true" placeholder="Your transcribed answer will appear here...">
+                 </div>
+
+                 <div class="action-buttons">
+                     <button class="btn btn-primary" id="confirmButton" disabled>
+                         <span>Confirm Answer</span>
+                         <span id="confirmLoading" style="display: none;">
+                             <div class="loading" style="width: 16px; height: 16px; border-width: 2px;"></div>
+                         </span>
+                     </button>
+                     <button class="btn btn-secondary" id="retryRecording" style="display: none;">
+                         🔄 Re-record
+                     </button>
+                 </div>
+             </div>
+         </div>
+     </div>
+
+     <!-- Summary Panel (hidden initially). Kept as a sibling of the container,
+          not a child, so it can still be shown after the container is hidden. -->
+     <div class="summary-panel" id="summaryPanel">
+         <h2>📋 Interview Summary</h2>
+         <div id="summaryContent"></div>
+         <div style="text-align: center; margin-top: 30px;">
+             <button class="btn btn-primary" onclick="window.close()">
+                 Complete Interview
+             </button>
+         </div>
+     </div>
+
+     <!-- Hidden audio element for TTS playback -->
+     <audio id="ttsAudio" preload="auto"></audio>
+
+ <script>
+     const JOB_ID = {{ job.id }};
+     class AIInterviewer {
+         constructor() {
+             this.currentQuestionIndex = 0;
+             this.totalQuestions = 3;
+             this.isRecording = false;
+             this.mediaRecorder = null;
+             this.audioChunks = [];
+             this.interviewData = {
+                 questions: [],
+                 answers: [],
+                 evaluations: []
+             };
+
+             this.initializeElements();
+             this.initializeInterview();
+         }
+
+         initializeElements() {
+             this.chatArea = document.getElementById('chatArea');
+             this.micButton = document.getElementById('micButton');
+             this.micIcon = document.getElementById('micIcon');
+             this.recordingStatus = document.getElementById('recordingStatus');
+             this.transcriptArea = document.getElementById('transcriptArea');
+             this.confirmButton = document.getElementById('confirmButton');
+             this.confirmLoading = document.getElementById('confirmLoading');
+             this.retryButton = document.getElementById('retryRecording');
+             this.aiAvatar = document.getElementById('aiAvatar');
+             this.ttsAudio = document.getElementById('ttsAudio');
+             this.summaryPanel = document.getElementById('summaryPanel');
+             this.currentQuestionNum = document.getElementById('currentQuestionNum');
+             this.totalQuestionsSpan = document.getElementById('totalQuestions');
+
+             this.bindEvents();
+         }
+
+         bindEvents() {
+             this.micButton.addEventListener('mousedown', () => this.startRecording());
+             this.micButton.addEventListener('mouseup', () => this.stopRecording());
+             this.micButton.addEventListener('mouseleave', () => this.stopRecording());
+             this.micButton.addEventListener('touchstart', (e) => {
+                 e.preventDefault();
+                 this.startRecording();
+             });
+             this.micButton.addEventListener('touchend', (e) => {
+                 e.preventDefault();
+                 this.stopRecording();
+             });
+
+             this.confirmButton.addEventListener('click', () => this.submitAnswer());
+             this.retryButton.addEventListener('click', () => this.resetRecording());
+
+             this.transcriptArea.addEventListener('input', () => {
+                 const hasText = this.transcriptArea.textContent.trim().length > 0;
+                 this.confirmButton.disabled = !hasText;
+             });
+
+             this.ttsAudio.addEventListener('play', () => {
+                 this.aiAvatar.classList.add('talking');
+             });
+
+             this.ttsAudio.addEventListener('ended', () => {
+                 this.aiAvatar.classList.remove('talking');
+                 this.enableControls();
+             });
+
+             this.ttsAudio.addEventListener('error', (e) => {
+                 console.error('Audio playback error:', e);
+                 this.aiAvatar.classList.remove('talking');
+                 this.enableControls();
+             });
+         }
+
+         // Escape untrusted text (model output, user transcripts) before it is
+         // interpolated into innerHTML, so markup in an answer cannot inject HTML.
+         escapeHtml(text) {
+             const div = document.createElement('div');
+             div.textContent = text;
+             return div.innerHTML;
+         }
+
+         async initializeInterview() {
+             try {
+                 const response = await fetch('/api/start_interview', {
+                     method: 'POST',
+                     headers: {
+                         'Content-Type': 'application/json'
+                     },
+                     body: JSON.stringify({ job_id: JOB_ID })
+                 });
+
+                 const data = await response.json();
+                 if (data.success) {
+                     this.displayQuestion(data.question, data.audioUrl);
+                     this.interviewData.questions.push(data.question);
+                 } else {
+                     this.showError('Failed to start interview. Please try again.');
+                 }
+             } catch (error) {
+                 console.error('Error starting interview:', error);
+                 this.showError('Connection error. Please check your internet connection.');
+             }
+         }
+
+         displayQuestion(question, audioUrl = null) {
+             // Remove loading message
+             const loadingMsg = document.getElementById('loadingMessage');
+             if (loadingMsg) {
+                 loadingMsg.remove();
+             }
+
+             // Create question message
+             const messageDiv = document.createElement('div');
+             messageDiv.className = 'ai-message';
+             messageDiv.innerHTML = `
+                 <div class="ai-avatar talking">AI</div>
+                 <div class="message-bubble">
+                     <p>${this.escapeHtml(question)}</p>
+                 </div>
+             `;
+
+             this.chatArea.appendChild(messageDiv);
+             this.chatArea.scrollTop = this.chatArea.scrollHeight;
+
+             // Update question counter
+             this.currentQuestionNum.textContent = this.currentQuestionIndex + 1;
+
+             // Play audio if available
+             if (audioUrl) {
+                 this.playQuestionAudio(audioUrl);
+             } else {
+                 // Enable controls if no audio
+                 setTimeout(() => this.enableControls(), 1000);
+             }
+         }
+
+         playQuestionAudio(audioUrl) {
+             this.ttsAudio.src = audioUrl;
+             this.ttsAudio.play().catch(error => {
+                 console.error('Audio play error:', error);
+                 this.enableControls();
+             });
+         }
+
+         enableControls() {
+             this.micButton.disabled = false;
+             this.recordingStatus.textContent = 'Click and hold to record your answer';
+
+             // Remove talking animation from avatar
+             const avatars = this.chatArea.querySelectorAll('.ai-avatar');
+             avatars.forEach(avatar => avatar.classList.remove('talking'));
+         }
+
+         async startRecording() {
+             if (this.isRecording) return;
+
+             try {
+                 const stream = await navigator.mediaDevices.getUserMedia({ audio: true });
+                 this.mediaRecorder = new MediaRecorder(stream);
+                 this.audioChunks = [];
+
+                 this.mediaRecorder.ondataavailable = (event) => {
+                     this.audioChunks.push(event.data);
+                 };
+
+                 this.mediaRecorder.onstop = () => {
+                     this.processRecording();
+                     stream.getTracks().forEach(track => track.stop());
+                 };
+
+                 this.mediaRecorder.start();
+                 this.isRecording = true;
+
+                 // Update UI
+                 this.micButton.classList.add('recording');
+                 this.micIcon.textContent = '🔴';
+                 this.recordingStatus.textContent = 'Recording... Release to stop';
+
+             } catch (error) {
+                 console.error('Error starting recording:', error);
+                 this.recordingStatus.textContent = 'Microphone access denied. Please allow microphone access and try again.';
+             }
+         }
+
+         stopRecording() {
+             if (!this.isRecording || !this.mediaRecorder) return;
+
+             this.mediaRecorder.stop();
+             this.isRecording = false;
+
+             // Update UI
+             this.micButton.classList.remove('recording');
+             this.micIcon.textContent = '🎤';
+             this.recordingStatus.textContent = 'Processing audio...';
+         }
+
+         async processRecording() {
+             // NOTE: the .wav name is a label only. Most browsers record WebM/Opus
+             // regardless of the Blob type, so the backend should decode by
+             // content rather than trust the extension.
+             const audioBlob = new Blob(this.audioChunks, { type: 'audio/wav' });
+             const formData = new FormData();
+             formData.append('audio', audioBlob, 'recording.wav');
+
+             try {
+                 const response = await fetch('/api/transcribe', {
+                     method: 'POST',
+                     body: formData
+                 });
+
+                 const data = await response.json();
+                 if (data.success && data.transcript) {
+                     this.transcriptArea.textContent = data.transcript;
+                     this.confirmButton.disabled = false;
+                     this.retryButton.style.display = 'inline-flex';
+                     this.recordingStatus.textContent = 'Transcription complete. Review and confirm your answer.';
+                 } else {
+                     this.recordingStatus.textContent = 'Transcription failed. Please try recording again.';
+                 }
+             } catch (error) {
+                 console.error('Error processing recording:', error);
+                 this.recordingStatus.textContent = 'Error processing audio. Please try again.';
+             }
+         }
+
+         resetRecording() {
+             this.transcriptArea.textContent = '';
+             this.confirmButton.disabled = true;
+             this.retryButton.style.display = 'none';
+             this.recordingStatus.textContent = 'Click and hold to record your answer';
+         }
+
+         async submitAnswer() {
+             const answer = this.transcriptArea.textContent.trim();
+             if (!answer) return;
+
+             // Show loading state
+             this.confirmButton.disabled = true;
+             this.confirmLoading.style.display = 'inline-block';
+             this.confirmButton.querySelector('span').style.display = 'none';
+
+             // Add user message to chat
+             this.addUserMessage(answer);
+
+             try {
+                 const response = await fetch('/api/process_answer', {
+                     method: 'POST',
+                     headers: {
+                         'Content-Type': 'application/json'
+                     },
+                     body: JSON.stringify({
+                         answer: answer,
+                         questionIndex: this.currentQuestionIndex
+                     })
+                 });
+
+                 const data = await response.json();
+
+                 if (data.success) {
+                     this.interviewData.answers.push(answer);
+                     this.interviewData.evaluations.push(data.evaluation);
+
+                     if (data.isComplete) {
+                         this.showInterviewSummary(data.summary);
+                     } else {
+                         this.currentQuestionIndex++;
+                         this.displayQuestion(data.nextQuestion, data.audioUrl);
+                         this.interviewData.questions.push(data.nextQuestion);
+                         this.resetForNextQuestion();
+                     }
+                 } else {
+                     this.showError('Failed to process answer. Please try again.');
+                 }
+
+             } catch (error) {
+                 console.error('Error submitting answer:', error);
+                 this.showError('Connection error. Please try again.');
+             } finally {
+                 // Reset button state
+                 this.confirmLoading.style.display = 'none';
+                 this.confirmButton.querySelector('span').style.display = 'inline';
+             }
+         }
+
+         addUserMessage(message) {
+             const messageDiv = document.createElement('div');
+             messageDiv.className = 'user-message';
+             messageDiv.innerHTML = `
+                 <div class="user-bubble">
+                     <p>${this.escapeHtml(message)}</p>
+                 </div>
+             `;
+
+             this.chatArea.appendChild(messageDiv);
+             this.chatArea.scrollTop = this.chatArea.scrollHeight;
+         }
+
+         resetForNextQuestion() {
+             this.transcriptArea.textContent = '';
+             this.confirmButton.disabled = true;
+             this.retryButton.style.display = 'none';
+             this.recordingStatus.textContent = 'Wait for the next question...';
+             this.micButton.disabled = true;
+         }
+
+         showInterviewSummary(summaryData) {
+             const summaryContent = document.getElementById('summaryContent');
+             let summaryHtml = '';
+
+             this.interviewData.questions.forEach((question, index) => {
+                 const answer = this.interviewData.answers[index] || 'No answer provided';
+                 const evaluation = this.interviewData.evaluations[index] || {};
+
+                 summaryHtml += `
+                     <div class="summary-item">
+                         <h4>Question ${index + 1}:</h4>
+                         <p><strong>Q:</strong> ${this.escapeHtml(question)}</p>
+                         <p><strong>A:</strong> ${this.escapeHtml(answer)}</p>
+                         <p><strong>Score:</strong> <span class="evaluation-score">${evaluation.score || 'N/A'}</span></p>
+                         <p><strong>Feedback:</strong> ${this.escapeHtml(evaluation.feedback || 'No feedback provided')}</p>
+                     </div>
+                 `;
+             });
+
+             summaryContent.innerHTML = summaryHtml;
+
+             // Hide main interface and show summary
+             document.querySelector('.interview-container').style.display = 'none';
+             this.summaryPanel.style.display = 'block';
+         }
+
+         showError(message) {
+             this.recordingStatus.textContent = message;
+             this.recordingStatus.style.color = '#ff4757';
+             setTimeout(() => {
+                 this.recordingStatus.style.color = '#666';
+             }, 3000);
+         }
+     }
+
+     // Initialize the interview when page loads
+     document.addEventListener('DOMContentLoaded', () => {
+         new AIInterviewer();
+     });
+
+     // Add placeholder attribute support for contenteditable
+     document.addEventListener('DOMContentLoaded', function() {
+         const transcriptArea = document.getElementById('transcriptArea');
+         const placeholder = transcriptArea.getAttribute('placeholder');
+
+         function checkPlaceholder() {
+             if (transcriptArea.textContent.trim() === '') {
+                 transcriptArea.style.color = '#999';
+                 transcriptArea.textContent = placeholder;
+             } else if (transcriptArea.textContent === placeholder) {
+                 transcriptArea.style.color = '#333';
+                 transcriptArea.textContent = '';
+             }
+         }
+
+         transcriptArea.addEventListener('focus', function() {
+             if (transcriptArea.textContent === placeholder) {
+                 transcriptArea.textContent = '';
+                 transcriptArea.style.color = '#333';
+             }
+         });
+
+         transcriptArea.addEventListener('blur', function() {
+             if (transcriptArea.textContent.trim() === '') {
+                 transcriptArea.style.color = '#999';
+                 transcriptArea.textContent = placeholder;
+             }
+         });
+
+         // Initial check
+         checkPlaceholder();
+     });
+ </script>
+ </body>
+ </html>
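
Note: the script above encodes a JSON contract for three backend routes (/api/start_interview, /api/transcribe, /api/process_answer) that this commit does not include. Below is a minimal Flask sketch of that contract, inferred only from the template's fetch() calls; the blueprint name interview_api, the question list, and the placeholder transcription and evaluation are all invented for illustration and are not this project's actual implementation.

from flask import Blueprint, jsonify, request

interview_api = Blueprint('interview_api', __name__)

# Placeholder questions; the real app presumably generates these per job.
QUESTIONS = [
    "Tell me about yourself.",
    "Describe a challenging project you worked on.",
    "Why are you interested in this role?",
]

@interview_api.route('/api/start_interview', methods=['POST'])
def start_interview():
    job_id = request.get_json().get('job_id')  # sent by the template's fetch()
    return jsonify(success=True, question=QUESTIONS[0], audioUrl=None)

@interview_api.route('/api/transcribe', methods=['POST'])
def transcribe():
    audio = request.files.get('audio')  # 'recording.wav' from MediaRecorder
    if audio is None:
        return jsonify(success=False)
    transcript = "(transcription placeholder)"  # e.g. run a speech model here
    return jsonify(success=True, transcript=transcript)

@interview_api.route('/api/process_answer', methods=['POST'])
def process_answer():
    data = request.get_json()
    idx = data['questionIndex']
    evaluation = {'score': 'N/A', 'feedback': '(placeholder)'}  # e.g. LLM scoring
    done = idx + 1 >= len(QUESTIONS)
    return jsonify(
        success=True,
        evaluation=evaluation,
        isComplete=done,
        nextQuestion=None if done else QUESTIONS[idx + 1],
        audioUrl=None,
        summary={} if done else None,
    )

Registered alongside the existing blueprints (app.register_blueprint(interview_api)), this stub would let the template run end to end against placeholder data.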
backend/utils/luna_phase1.py ADDED
File without changes
instance/codingo.db DELETED
Binary file (24.6 kB)
 
requirements.txt CHANGED
@@ -10,3 +10,49 @@ pyresparser
  flask_sqlalchemy
  flask_wtf
  email-validator
+
+ # ------
+ # Core Scientific Stack
+ scipy==1.11.3
+ soundfile==0.12.1
+ sounddevice==0.4.6
+ opencv-python==4.7.0.72
+ moviepy==1.0.3
+ librosa==0.10.0.post2
+
+ # Hugging Face Transformers + Whisper
+ transformers==4.39.3
+ torch==2.1.2
+ sentencepiece==0.1.99
+ sentence-transformers==2.7.0
+ git+https://github.com/openai/whisper.git@c0d2f62
+
+ # LangChain stack
+ langchain==0.3.26
+ langchain_groq==0.3.6
+ langchain_community==0.3.27
+ #langchain_huggingface==0.2.0
+ llama-index==0.8.40
+ cohere==5.16.1
+
+ # Vector DB
+ qdrant-client==1.14.3
+
+ # PDF & DOCX parsing
+ PyPDF2==3.0.1
+ python-docx==1.2.0
+
+ # Audio / CLI
+ ffmpeg-python==0.2.0
+ #pyaudio==0.2.14
+ inputimeout==1.0.4
+ evaluate==0.4.5
+ pip==23.3.1
+ accelerate==0.29.3
+ huggingface_hub==0.20.3
+ textract==1.6.3
+ bitsandbytes
+ faster-whisper==0.10.0
+ edge-tts==6.1.2
+
+
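
Note: among the new pins, faster-whisper and edge-tts map directly onto the transcription and question-audio steps the interview template assumes. The sketch below shows one plausible way to wire them up; the model size ("base"), compute settings, voice name (en-US-AriaNeural), and file paths are assumptions for illustration, not values taken from this commit.

import asyncio

import edge_tts
from faster_whisper import WhisperModel

# faster-whisper: load once, reuse across requests (model size is an assumption)
model = WhisperModel("base", device="cpu", compute_type="int8")

def transcribe(path: str) -> str:
    """Transcribe an uploaded recording and join the segments into one string."""
    segments, _info = model.transcribe(path)
    return " ".join(seg.text.strip() for seg in segments)

async def synthesize(text: str, out_path: str = "question.mp3") -> str:
    """Render a question to an MP3 the template's <audio> element can play."""
    communicate = edge_tts.Communicate(text, voice="en-US-AriaNeural")
    await communicate.save(out_path)
    return out_path

if __name__ == "__main__":
    print(transcribe("recording.wav"))  # hypothetical local file
    asyncio.run(synthesize("Tell me about yourself."))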