sachin
committed on
Commit
·
b244021
1
Parent(s):
a506b86
update path
Browse files
- src/server/main.py +12 -6
src/server/main.py
CHANGED
@@ -19,7 +19,7 @@ import requests
|
|
19 |
from logging_config import logger
|
20 |
from tts_config import SPEED, ResponseFormat, config as tts_config
|
21 |
from gemma_llm import LLMManager
|
22 |
-
from auth import get_api_key, settings as auth_settings
|
23 |
|
24 |
# Supported language codes
|
25 |
SUPPORTED_LANGUAGES = {
|
@@ -144,7 +144,9 @@ async def home():
|
|
144 |
return RedirectResponse(url="/docs")
|
145 |
|
146 |
@app.post("/v1/unload_all_models")
|
147 |
-
async def unload_all_models(
|
|
|
|
|
148 |
try:
|
149 |
logger.info("Starting to unload all models...")
|
150 |
llm_manager.unload()
|
@@ -155,7 +157,9 @@ async def unload_all_models(api_key: str = Depends(get_api_key)):
|
|
155 |
raise HTTPException(status_code=500, detail=f"Failed to unload models: {str(e)}")
|
156 |
|
157 |
@app.post("/v1/load_all_models")
|
158 |
-
async def load_all_models(
|
|
|
|
|
159 |
try:
|
160 |
logger.info("Starting to load all models...")
|
161 |
llm_manager.load()
|
@@ -184,7 +188,9 @@ async def translate(request: TranslationRequest):
|
|
184 |
|
185 |
@app.post("/v1/chat", response_model=ChatResponse)
|
186 |
@limiter.limit(settings.chat_rate_limit)
|
187 |
-
async def chat(request: Request, chat_request: ChatRequest,
|
|
|
|
|
188 |
if not chat_request.prompt:
|
189 |
raise HTTPException(status_code=400, detail="Prompt cannot be empty")
|
190 |
logger.info(f"Received prompt: {chat_request.prompt}, src_lang: {chat_request.src_lang}, tgt_lang: {chat_request.tgt_lang}")
|
@@ -230,7 +236,7 @@ async def visual_query(
|
|
230 |
query: str = Body(...),
|
231 |
src_lang: str = Query("kan_Knda", enum=list(SUPPORTED_LANGUAGES)),
|
232 |
tgt_lang: str = Query("kan_Knda", enum=list(SUPPORTED_LANGUAGES)),
|
233 |
-
api_key: str = Depends(get_api_key)
|
234 |
):
|
235 |
try:
|
236 |
image = Image.open(file.file)
|
@@ -280,7 +286,7 @@ async def chat_v2(
|
|
280 |
image: UploadFile = File(default=None),
|
281 |
src_lang: str = Form("kan_Knda"),
|
282 |
tgt_lang: str = Form("kan_Knda"),
|
283 |
-
api_key: str = Depends(get_api_key)
|
284 |
):
|
285 |
if not prompt:
|
286 |
raise HTTPException(status_code=400, detail="Prompt cannot be empty")
|
|
|
19 |
from logging_config import logger
|
20 |
from tts_config import SPEED, ResponseFormat, config as tts_config
|
21 |
from gemma_llm import LLMManager
|
22 |
+
#from auth import get_api_key, settings as auth_settings
|
23 |
|
24 |
# Supported language codes
|
25 |
SUPPORTED_LANGUAGES = {
|
|
|
144 |
return RedirectResponse(url="/docs")
|
145 |
|
146 |
@app.post("/v1/unload_all_models")
|
147 |
+
async def unload_all_models(
|
148 |
+
#api_key: str = Depends(get_api_key)
|
149 |
+
):
|
150 |
try:
|
151 |
logger.info("Starting to unload all models...")
|
152 |
llm_manager.unload()
|
|
|
157 |
raise HTTPException(status_code=500, detail=f"Failed to unload models: {str(e)}")
|
158 |
|
159 |
@app.post("/v1/load_all_models")
|
160 |
+
async def load_all_models(
|
161 |
+
#api_key: str = Depends(get_api_key)
|
162 |
+
):
|
163 |
try:
|
164 |
logger.info("Starting to load all models...")
|
165 |
llm_manager.load()
|
|
|
188 |
|
189 |
@app.post("/v1/chat", response_model=ChatResponse)
|
190 |
@limiter.limit(settings.chat_rate_limit)
|
191 |
+
async def chat(request: Request, chat_request: ChatRequest,
|
192 |
+
#api_key: str = Depends(get_api_key)
|
193 |
+
):
|
194 |
if not chat_request.prompt:
|
195 |
raise HTTPException(status_code=400, detail="Prompt cannot be empty")
|
196 |
logger.info(f"Received prompt: {chat_request.prompt}, src_lang: {chat_request.src_lang}, tgt_lang: {chat_request.tgt_lang}")
|
|
|
236 |
query: str = Body(...),
|
237 |
src_lang: str = Query("kan_Knda", enum=list(SUPPORTED_LANGUAGES)),
|
238 |
tgt_lang: str = Query("kan_Knda", enum=list(SUPPORTED_LANGUAGES)),
|
239 |
+
#api_key: str = Depends(get_api_key)
|
240 |
):
|
241 |
try:
|
242 |
image = Image.open(file.file)
|
|
|
286 |
image: UploadFile = File(default=None),
|
287 |
src_lang: str = Form("kan_Knda"),
|
288 |
tgt_lang: str = Form("kan_Knda"),
|
289 |
+
#api_key: str = Depends(get_api_key)
|
290 |
):
|
291 |
if not prompt:
|
292 |
raise HTTPException(status_code=400, detail="Prompt cannot be empty")
|