Spaces:

Tanmay09516
/

langchat-backend

Running

App Files Files Community

langchat-backend / app.py

Tanmay09516

Update app.py

0d02cc4 verified 9 months ago

raw

history blame

4.97 kB

	# app.py
	import os
	import warnings
	from dotenv import load_dotenv
	import gradio as gr
	from qdrant_search import QdrantSearch
	from langchain_groq import ChatGroq
	from nomic_embeddings import EmbeddingsModel

	from fastapi import FastAPI, HTTPException
	from fastapi.middleware.cors import CORSMiddleware
	from pydantic import BaseModel

	# Load environment variables
	load_dotenv()

	# Suppress FutureWarnings
	warnings.filterwarnings("ignore", category=FutureWarning)

	# Disable tokenizers parallelism
	os.environ["TOKENIZERS_PARALLELISM"] = "FALSE"

	# Initialize global variables
	collection_names = ["docs_v1_2", "docs_v2_2", "docs_v3_2"]
	limit = 5

	# Initialize the language model
	llm = ChatGroq(model="mixtral-8x7b-32768")

	# Initialize the embeddings model
	embeddings = EmbeddingsModel()

	# Initialize Qdrant search with necessary credentials
	search = QdrantSearch(
	qdrant_url=os.environ["QDRANT_CLOUD_URL"],
	api_key=os.environ["QDRANT_API_KEY"],
	embeddings=embeddings
	)

	def chat_function(question: str):
	"""
	Handles the chat functionality by processing the user's question,
	retrieving relevant documents, generating an answer, and returning sources.

	Args:
	question (str): The user's question.

	Returns:
	Tuple[str, str]: The generated answer and the sources used.
	"""
	query = question.strip()
	if not query:
	return "❌ Error: Query cannot be empty.", "No sources available."

	# Step 1: Retrieve relevant documents from Qdrant
	retrieved_docs = search.query_multiple_collections(query, collection_names, limit)

	if not retrieved_docs:
	return "⚠️ No relevant documents found for your query.", "No sources available."

	# Step 2: Prepare the context from retrieved documents
	context = "\n\n".join([doc['text'] for doc in retrieved_docs])

	# Step 3: Construct the prompt with context and question
	prompt = (
	"You are LangAssist, a knowledgeable assistant for the LangChain Python Library. "
	"Given the following context from the documentation, provide a helpful answer to the user's question.\n\n"
	"### Context:\n{context}\n\n"
	"### Question:\n{question}\n\n"
	"### Answer:"
	).format(context=context, question=query)

	# Step 4: Generate an answer using the language model
	try:
	answer = llm.invoke(prompt)
	except Exception as e:
	return f"⚠️ Error generating answer: {str(e)}", "No sources available."

	# Prepare sources
	sources = "\n\n".join([
	f"Source: {doc['source']}\nExcerpt: {doc['text']}"
	for doc in retrieved_docs
	])

	return answer.content.strip(), sources

	# Define Pydantic model for request
	class ChatRequest(BaseModel):
	question: str

	# Initialize FastAPI app
	app = FastAPI()

	# Define allowed origins
	origins = [
	"*", # Allow all origins; for production, specify your frontend domains
	# Example:
	# "http://localhost",
	# "http://localhost:3000",
	# "https://your-frontend-domain.com",
	]

	# Add CORS middleware
	app.add_middleware(
	CORSMiddleware,
	allow_origins=origins, # Allows all origins. Replace "*" with specific domains in production.
	allow_credentials=True,
	allow_methods=["*"], # Allows all HTTP methods.
	allow_headers=["*"], # Allows all headers.
	)

	# Define API endpoint
	@app.post("/api/chat")
	async def api_chat(request: ChatRequest):
	try:
	answer, sources = chat_function(request.question)
	return {"answer": answer, "sources": sources}
	except Exception as e:
	raise HTTPException(status_code=500, detail=str(e))

	# Create Gradio Interface
	with gr.Blocks() as demo:
	gr.Markdown("# 🗨️ LangAssist Chat")
	gr.Markdown("Ask questions about the LangChain Python Library and get answers based on the latest documentation.")

	with gr.Row():
	with gr.Column(scale=2):
	question_input = gr.Textbox(
	lines=2,
	placeholder="Type your question here...",
	label="Your Question"
	)
	submit_button = gr.Button("💬 Submit")
	with gr.Column(scale=3):
	answer_output = gr.Markdown("### Answer will appear here...")
	sources_output = gr.Markdown("### Sources will appear here...")

	submit_button.click(
	fn=chat_function,
	inputs=question_input,
	outputs=[answer_output, sources_output]
	)

	gr.Markdown("""
	---
	## 📡 API Endpoint

	You can access the API endpoint at `/api/chat`. For example, send a POST request to `http://localhost:8000/api/chat` with JSON body `{"question": "Your question here"}`.
	""")

	# Mount Gradio app on FastAPI
	app = gr.mount_gradio_app(app, demo, path="/gradio")

	# To run, use: uvicorn app:app --host 0.0.0.0 --port 8000
	if __name__ == "__main__":
	import uvicorn
	uvicorn.run(app, host="0.0.0.0", port=8000)