# AI-Interviewer / rag.py
import os
import re
import json
import time
import random
import logging
import traceback
from collections import defaultdict
from enum import Enum
from typing import Dict
# --- .env for secrets ---
from dotenv import load_dotenv
# --- LangChain & Hugging Face---
# Note: Some of these imports might be from older versions of LangChain.
# Ensure your dependencies match.
from langchain_groq import ChatGroq as LangChainChatGroq # Renamed to avoid conflict
from langchain_community.embeddings import HuggingFaceEmbeddings
from langchain_community.vectorstores import Qdrant
from langchain.prompts import PromptTemplate
from langchain.chains import LLMChain
from langchain.retrievers import ContextualCompressionRetriever
from langchain.retrievers.document_compressors import CohereRerank
from huggingface_hub import login
# --- Qdrant Vector DB ---
from qdrant_client import QdrantClient
from qdrant_client.http.models import (
VectorParams, Distance, Filter, FieldCondition, MatchValue,
PointStruct
)
# --- Models, Embeddings, and Utilities ---
import cohere
from sentence_transformers import SentenceTransformer
import torch
from transformers import (
pipeline, AutoTokenizer, AutoModelForCausalLM, BitsAndBytesConfig
)
# --- Utility ---
import numpy as np
from sklearn.metrics.pairwise import cosine_similarity
from textwrap import dedent
import requests
from docx import Document
import textract
from PyPDF2 import PdfReader
# ==============================================================================
# 1. SCRIPT CONFIGURATION
# ==============================================================================
# Configure logging
logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
# --- Hugging Face Model for Local Evaluation ---
JUDGE_MODEL_NAME = "mistralai/Mistral-7B-Instruct-v0.3"
EMBEDDING_MODEL_NAME = "all-MiniLM-L6-v2"
QDRANT_COLLECTION_NAME = "interview_questions"
# ==============================================================================
# 2. API AND ENVIRONMENT HANDLING
# ==============================================================================
def handle_apis():
"""
Loads API keys from a .env file, validates them, and logs into Hugging Face.
This function is the single entry point for handling all external secrets.
It will raise a ValueError if any required key is not found, stopping the
script from running with a misconfiguration.
"""
load_dotenv()
logging.info("Attempting to load API keys from .env file...")
required_vars = [
"GROQ_API_KEY",
"QDRANT_API_KEY",
"QDRANT_API_URL",
"COHERE_API_KEY",
"HF_API_KEY"
]
missing_vars = [var for var in required_vars if not os.getenv(var)]
if missing_vars:
error_message = (
f"Error: Missing required environment variables: {', '.join(missing_vars)}. "
"Please create a .env file in the root directory with all necessary keys."
)
logging.critical(error_message)
raise ValueError(error_message)
logging.info("βœ… Successfully loaded and validated all required API keys.")
try:
hf_api_key = os.getenv("HF_API_KEY")
login(token=hf_api_key)
logging.info("βœ… Successfully logged into Hugging Face Hub.")
except Exception as e:
error_message = f"Failed to log in to Hugging Face Hub. Please check your HF_API_KEY. Error: {e}"
logging.critical(error_message)
raise RuntimeError(error_message)
# --- Run the API handler at the start of the script ---
handle_apis()
# ==============================================================================
# 3. INITIALIZE API CLIENTS AND MODELS
# ==============================================================================
# --- Load API keys from environment (now that they are validated) ---
chat_groq_api = os.getenv("GROQ_API_KEY")
qdrant_api = os.getenv("QDRANT_API_KEY")
qdrant_url = os.getenv("QDRANT_API_URL")
cohere_api_key = os.getenv("COHERE_API_KEY")
# --- Initialize API Clients ---
logging.info("Initializing API clients...")
qdrant_client = QdrantClient(url=qdrant_url, api_key=qdrant_api)
cohere_client = cohere.Client(api_key=cohere_api_key)
logging.info("βœ… API clients initialized.")
# --- Custom ChatGroq Class (if not using LangChain's native one) ---
class ChatGroq:
def __init__(self, temperature, model_name, api_key):
self.temperature = temperature
self.model_name = model_name
self.api_key = api_key
self.api_url = "https://api.groq.com/openai/v1/chat/completions"
def predict(self, prompt):
try:
headers = {"Authorization": f"Bearer {self.api_key}", "Content-Type": "application/json"}
payload = {
"model": self.model_name,
"messages": [{"role": "system", "content": "You are an AI interviewer."},
{"role": "user", "content": prompt}],
"temperature": self.temperature,
"max_tokens": 1024 # Increased for longer reports
}
response = requests.post(self.api_url, headers=headers, json=payload, timeout=20)
response.raise_for_status()
data = response.json()
if "choices" in data and len(data["choices"]) > 0:
return data["choices"][0]["message"]["content"].strip()
logging.warning("Unexpected response structure from Groq API")
return "Interviewer: Could you tell me more about your relevant experience?"
except requests.exceptions.RequestException as e:
logging.error(f"ChatGroq API error: {e}")
return "Interviewer: Due to a system issue, let's move on to another question."
groq_llm = ChatGroq(temperature=0.7, model_name="llama3-70b-8192", api_key=chat_groq_api)
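# Usage sketch for the wrapper above (the prompt here is only an example):
#   reply = groq_llm.predict("Ask one screening question for a senior ML engineer.")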
# --- Initialize Local Models (Embeddings and Judge LLM) ---
logging.info("Loading local models. This may take a while...")
# Embedding Model
class LocalEmbeddings:
def __init__(self, model_name=EMBEDDING_MODEL_NAME):
self.model = SentenceTransformer(model_name)
def embed_query(self, text):
return self.model.encode(text).tolist()
def embed_documents(self, documents):
return self.model.encode(documents).tolist()
embeddings = LocalEmbeddings()
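# Sanity-check sketch: embed_query returns a plain Python list whose length is the
# vector dimension (384 for all-MiniLM-L6-v2), which the Qdrant collection setup relies on.
#   assert len(embeddings.embed_query("probe")) == 384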
# Judge LLM (with quantization for lower memory usage)
bnb_config = BitsAndBytesConfig(
load_in_4bit=True,
bnb_4bit_compute_dtype=torch.float16,
bnb_4bit_use_double_quant=True,
bnb_4bit_quant_type="nf4"
)
# use_auth_token is deprecated; authentication is handled by the login() call in handle_apis()
mistral_tokenizer = AutoTokenizer.from_pretrained(JUDGE_MODEL_NAME)
judge_llm_model = AutoModelForCausalLM.from_pretrained(
JUDGE_MODEL_NAME,
quantization_config=bnb_config,
torch_dtype=torch.float16,
device_map="auto"
)
judge_pipeline = pipeline(
"text-generation",
model=judge_llm_model,
tokenizer=mistral_tokenizer,
max_new_tokens=512,
temperature=0.2,
top_p=0.95,
do_sample=True,
repetition_penalty=1.15,
)
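# Smoke-test sketch: the text-generation pipeline returns [{"generated_text": ...}],
# and return_full_text=False strips the echoed prompt from the output:
#   judge_pipeline("Briefly define overfitting:", return_full_text=False)[0]["generated_text"]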
logging.info("βœ… All models and clients are ready.")
# ==============================================================================
# 4. CORE APPLICATION LOGIC AND FUNCTIONS
# ==============================================================================
# NOTE: the function bodies below are minimal sketches reconstructed from their
# signatures and the imports above; treat them as illustrative defaults rather
# than canonical implementations.
class EvaluationScore(str, Enum):
POOR = "Poor"
MEDIUM = "Medium"
GOOD = "Good"
EXCELLENT = "Excellent"
class CohereReranker:
def __init__(self, client):
self.client = client
def compress_documents(self, documents, query):
        # Sketch: rerank LangChain Documents by query relevance via Cohere's rerank
        # endpoint (the model name is an assumption; adjust to your account's models).
        texts = [doc.page_content for doc in documents]
        response = self.client.rerank(
            query=query, documents=texts, top_n=min(5, len(texts)), model="rerank-english-v2.0"
        )
        return [documents[result.index] for result in response.results]
reranker = CohereReranker(cohere_client)
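# The LangChain imports above (Qdrant, HuggingFaceEmbeddings, ContextualCompressionRetriever,
# CohereRerank) are otherwise unused in this file. A minimal sketch of how they could be
# wired into a reranking retriever over the same collection (constructor arguments are
# assumptions about the pinned library versions):
def build_compression_retriever():
    vectorstore = Qdrant(
        client=qdrant_client,
        collection_name=QDRANT_COLLECTION_NAME,
        embeddings=HuggingFaceEmbeddings(model_name=EMBEDDING_MODEL_NAME),
    )
    return ContextualCompressionRetriever(
        base_compressor=CohereRerank(cohere_api_key=cohere_api_key),
        base_retriever=vectorstore.as_retriever(search_kwargs={"k": 10}),
    )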
def load_data_from_json(file_path):
    # Sketch: expects a JSON file holding a list of QA records.
    with open(file_path, "r", encoding="utf-8") as f:
        data = json.load(f)
    logging.info(f"Loaded {len(data)} records from {file_path}.")
    return data
def verify_qdrant_collection(collection_name=QDRANT_COLLECTION_NAME):
    # Sketch: get_collection raises when the collection is missing.
    try:
        qdrant_client.get_collection(collection_name)
        return True
    except Exception:
        logging.warning(f"Collection '{collection_name}' was not found.")
        return False
def store_data_to_qdrant(data, collection_name=QDRANT_COLLECTION_NAME, batch_size=100):
    # Sketch: (re)create the collection, then embed and upsert records in batches.
    # Assumes each record is a dict with a "question" field; the record itself becomes the payload.
    dim = len(embeddings.embed_query("dimension probe"))
    qdrant_client.recreate_collection(
        collection_name=collection_name,
        vectors_config=VectorParams(size=dim, distance=Distance.COSINE),
    )
    for start in range(0, len(data), batch_size):
        batch = data[start:start + batch_size]
        vectors = embeddings.embed_documents([item["question"] for item in batch])
        points = [
            PointStruct(id=start + i, vector=vec, payload=item)
            for i, (item, vec) in enumerate(zip(batch, vectors))
        ]
        qdrant_client.upsert(collection_name=collection_name, points=points)
    logging.info(f"✅ Stored {len(data)} points in '{collection_name}'.")
def find_similar_roles(user_role, all_roles, top_k=3):
    # Sketch: rank known roles by embedding cosine similarity to the user's role.
    role_vec = np.array([embeddings.embed_query(user_role)])
    all_vecs = np.array(embeddings.embed_documents(all_roles))
    sims = cosine_similarity(role_vec, all_vecs)[0]
    return [all_roles[i] for i in np.argsort(sims)[::-1][:top_k]]
def get_role_questions(job_role):
    # Sketch: fetch every stored QA payload whose role matches exactly
    # (the "job_role" payload key is an assumption).
    role_filter = Filter(must=[FieldCondition(key="job_role", match=MatchValue(value=job_role))])
    points, _ = qdrant_client.scroll(
        collection_name=QDRANT_COLLECTION_NAME,
        scroll_filter=role_filter,
        limit=100,
        with_payload=True,
    )
    return [point.payload for point in points]
def retrieve_interview_data(job_role, all_roles):
    # Sketch: exact role match first, then fall back to the most similar known role.
    if job_role in all_roles:
        return get_role_questions(job_role)
    similar = find_similar_roles(job_role, all_roles, top_k=1)
    if similar:
        logging.info(f"No exact match for '{job_role}'; using closest role '{similar[0]}'.")
        return get_role_questions(similar[0])
    return []
def random_context_chunks(retrieved_data, k=3):
    # Sketch: sample k QA pairs and join them into one context string.
    sample = random.sample(retrieved_data, min(k, len(retrieved_data)))
    return "\n\n".join(f"Q: {item['question']}\nA: {item['answer']}" for item in sample)
def eval_question_quality(question: str, job_role: str, seniority: str, judge_pipeline=judge_pipeline):
    # Sketch: ask the local judge model for a one-word grade on the EvaluationScore scale.
    prompt = dedent(f"""\
        Rate the following interview question for a {seniority} {job_role} candidate
        as exactly one word: Poor, Medium, Good, or Excellent.
        Question: {question}
        Rating:""")
    output = judge_pipeline(prompt, return_full_text=False)[0]["generated_text"]
    match = re.search(r"Poor|Medium|Good|Excellent", output)
    return match.group(0) if match else EvaluationScore.MEDIUM.value
def generate_reference_answer(question, job_role, seniority):
    # Sketch: have the Groq LLM draft a model answer to grade candidates against.
    prompt = (f"As an expert {seniority} {job_role}, give a concise, high-quality answer "
              f"to this interview question:\n{question}")
    return groq_llm.predict(prompt)
def evaluate_answer(question: str, answer: str, ref_answer: str, job_role: str, seniority: str, judge_pipeline=judge_pipeline):
    # Sketch: grade the candidate's answer against the reference on the same one-word scale.
    prompt = dedent(f"""\
        You are grading a {seniority} {job_role} candidate.
        Question: {question}
        Reference answer: {ref_answer}
        Candidate answer: {answer}
        Grade the candidate answer as exactly one word (Poor, Medium, Good, or Excellent):""")
    output = judge_pipeline(prompt, return_full_text=False)[0]["generated_text"]
    match = re.search(r"Poor|Medium|Good|Excellent", output)
    return match.group(0) if match else EvaluationScore.MEDIUM.value
def build_interview_prompt(conversation_history, user_response, context, job_role, skills, seniority, difficulty_adjustment=None):
    # Sketch: assemble the next-question prompt from history, retrieved context, and role info.
    difficulty_note = f"Adjust difficulty: {difficulty_adjustment}." if difficulty_adjustment else ""
    return dedent(f"""\
        You are interviewing a {seniority} candidate for a {job_role} role (skills: {skills}).
        Reference material:
        {context}
        Conversation so far:
        {conversation_history}
        Candidate's last response: {user_response}
        {difficulty_note}
        Ask the single best next interview question.""")
def generate_llm_interview_report(interview_state, job_role, seniority):
    # Sketch: summarize the transcript and scores into a structured hiring report via the Groq LLM.
    prompt = (f"Write a structured hiring report for a {seniority} {job_role} candidate, "
              f"based on this interview state:\n{json.dumps(interview_state, default=str)}")
    return groq_llm.predict(prompt)
def extract_candidate_details(file_path):
    # Sketch: return raw resume text from PDF, DOCX, or other formats via the imported
    # parsers; any structured parsing of the text is left to the caller.
    if file_path.lower().endswith(".pdf"):
        return "\n".join(page.extract_text() or "" for page in PdfReader(file_path).pages)
    if file_path.lower().endswith(".docx"):
        return "\n".join(paragraph.text for paragraph in Document(file_path).paragraphs)
    return textract.process(file_path).decode("utf-8")
def extract_job_details(job_description):
    # Sketch: use the Groq LLM to pull structured fields out of a free-text job description.
    prompt = ("Extract the job role, required skills, and seniority from this job description. "
              f"Reply only with JSON using keys 'job_role', 'skills', 'seniority'.\n\n{job_description}")
    try:
        return json.loads(groq_llm.predict(prompt))
    except json.JSONDecodeError:
        return {"job_role": None, "skills": [], "seniority": None}
def extract_all_roles_from_qdrant(collection_name=QDRANT_COLLECTION_NAME):
    # Sketch: scroll the whole collection and collect the distinct role names seen in payloads.
    if not verify_qdrant_collection(collection_name):
        return []
    roles, offset = set(), None
    while True:
        points, offset = qdrant_client.scroll(
            collection_name=collection_name, limit=256, offset=offset, with_payload=True
        )
        roles.update((point.payload or {}).get("job_role", "").lower() for point in points)
        if offset is None:
            break
    return sorted(role for role in roles if role)
# Example of how to run (for testing purposes)
if __name__ == '__main__':
logging.info("Starting a test run...")
try:
all_roles = extract_all_roles_from_qdrant()
if not all_roles:
logging.warning("No roles found in Qdrant. Using a default list for testing.")
all_roles = ['data scientist', 'machine learning engineer', 'software engineer']
job_role = "ml engineer" # intentionally misspelled
qa_pairs = retrieve_interview_data(job_role, all_roles)
if qa_pairs:
logging.info(f"Successfully retrieved {len(qa_pairs)} QA pairs for role '{job_role}'.")
# print("First QA pair:", qa_pairs[0])
else:
logging.error(f"Could not retrieve any QA pairs for role '{job_role}'.")
except Exception as e:
logging.critical(f"A critical error occurred during the test run: {e}", exc_info=True)