Spaces:

redfernstech
/

s

Runtime error

redfernstech committed on Dec 13, 2024

Commit

e8a4c92

verified ·

1 Parent(s): 73f703c

Upload 6 files

Files changed (6) hide show

Dockerfile ADDED Viewed

+# Use the official Python image as the base image
+FROM python:3.9-slim
+# Set the working directory; relative paths such as "audio/" resolve against it
+WORKDIR /app
+# Install system dependencies. ffmpeg is needed by openai-whisper, which
+# shells out to it to decode the uploaded audio.
+RUN apt-get update && apt-get install -y \
+    gcc \
+    libsndfile1 \
+    ffmpeg \
+    && rm -rf /var/lib/apt/lists/*
+# Install Python dependencies before copying the sources so this layer is
+# reused when only application code changes
+COPY backend/requirements.txt /app/backend/requirements.txt
+RUN pip install --no-cache-dir --upgrade pip \
+    && pip install --no-cache-dir -r /app/backend/requirements.txt
+# Copy the backend files into the container as the "backend" package:
+# app.py imports backend.whisper_utils, backend.gtts_utils and
+# backend.llm_utils, so the modules must live under /app/backend
+COPY backend/ /app/backend
+# Create the directory the API reads and writes audio files in
+RUN mkdir -p /app/audio
+# Expose the FastAPI server port
+EXPOSE 8000
+# Run the FastAPI app with uvicorn (no --reload: it is a development-only flag)
+CMD ["uvicorn", "backend.app:app", "--host", "0.0.0.0", "--port", "8000"]

app.py ADDED Viewed

+from fastapi import FastAPI, UploadFile
+from fastapi.responses import FileResponse
+from backend.whisper_utils import transcribe_audio
+from backend.gtts_utils import generate_speech
+from backend.llm_utils import get_llm_response
+import os
+# Application object; the route decorators in this module register on it
+app = FastAPI()
+@app.post("/transcribe/")
+async def transcribe(file: UploadFile):
+    file_path = f"audio/{file.filename}"
+    with open(file_path, "wb") as audio:
+        audio.write(await file.read())
+    text = transcribe_audio(file_path)
+    os.remove(file_path)  # Cleanup audio file
+    return {"transcription": text}
+@app.post("/response/")
+async def get_response(input_text: str):
+    llm_response = get_llm_response(input_text)
+    audio_path = generate_speech(llm_response)
+    return {"response": llm_response, "audio_url": audio_path}
+@app.get("/audio/{file_name}")
+async def serve_audio(file_name: str):
+    file_path = f"audio/{file_name}"
+    return FileResponse(file_path)

gtts_utils.py ADDED Viewed

+from gtts import gTTS
+import os
+import uuid
+def generate_speech(text: str) -> str:
+    file_name = f"{uuid.uuid4()}.mp3"
+    file_path = f"audio/{file_name}"
+    tts = gTTS(text)
+    tts.save(file_path)
+    return file_path

llm_utils.py ADDED Viewed

+from transformers import pipeline
+# Load the Hugging Face LLM once at import time so that every call to
+# get_llm_response() reuses the same text-generation pipeline (model "gpt2",
+# created with max_length=100).
+llm = pipeline("text-generation", model="gpt2", max_length=100)
+def get_llm_response(prompt: str) -> str:
+    response = llm(prompt)
+    return response[0]["generated_text"]

requirements.txt ADDED Viewed

+fastapi
+uvicorn
+# Needed by FastAPI to parse multipart form uploads (the UploadFile
+# parameter of the /transcribe/ route)
+python-multipart
+openai-whisper
+transformers
+gtts

whisper_utils.py ADDED Viewed

+import whisper
+# Load the Whisper "base" model once at import time; transcribe_audio()
+# reuses this instance on every call.
+model = whisper.load_model("base")
+def transcribe_audio(file_path: str) -> str:
+    result = model.transcribe(file_path)
+    return result["text"]