qwen2.5-VL-api

Running

danilohssantana committed on Feb 18

Commit

5dd1cbf

1 Parent(s): f245369

changing endpoint call

Files changed (2) hide show

main.py CHANGED Viewed

@@ -86,28 +86,26 @@ async def upload_and_encode_image(file: UploadFile = File(...)):
         raise HTTPException(status_code=400, detail=f"Invalid file: {e}")
 @app.get("/predict")
-def predict(image_url: str = Query(...), prompt: str = Query(...)):
     """
     Generates a description for an image using the Qwen-2-VL model.
     Args:
-        image_url (str): The URL of the image to describe.
         prompt (str): The text prompt to guide the model's response.
     Returns:
         str: The generated description of the image.
     """
-    image = encode_image(image_url)
     # Create the input message structure
     messages = [
         {
             "role": "user",
             "content": [
-                {"type": "image", "image": f"data:image;base64,{image}"},
-                {"type": "text", "text": prompt},
             ],
         }
     ]

         raise HTTPException(status_code=400, detail=f"Invalid file: {e}")
 @app.get("/predict")
+def predict(data: str = Query(...), prompt: str = Query(...)):
     """
     Generates a description for an image using the Qwen-2-VL model.
     Args:
+        data (any): The encoded image and the prompt to be used.
         prompt (str): The text prompt to guide the model's response.
     Returns:
         str: The generated description of the image.
     """
     # Create the input message structure
     messages = [
         {
             "role": "user",
             "content": [
+                {"type": "image", "image": f"data:image;base64,{data.image_base64}"},
+                {"type": "text", "text": data.prompt},
             ],
         }
     ]

model.py CHANGED Viewed

@@ -1,22 +1,37 @@
 import requests
-# curl -G "https://<uname>-<spacename>.hf.space/predict" \
-#      --data-urlencode "image_url=https://qianwen-res.oss-cn-beijing.aliyuncs.com/Qwen-VL/assets/demo.jpeg" \
-#      --data-urlencode "prompt=Describe this image."
-url = "https://danilohssantana-qwen2-5-vl-api.hf.space/predict"
-# Define the parameters
-params = {
-    "image_url": "https://cdn.britannica.com/35/238335-050-2CB2EB8A/Lionel-Messi-Argentina-Netherlands-World-Cup-Qatar-2022.jpg",
-    "prompt": "describe",
 }
-# Send the GET request
-response = requests.get(url, params=params)
-if response.status_code == 200:
-    print("Response:", response.json())
 else:
-    print("Error:", response.status_code, response.text)

 import requests
+# Define base URL for your Hugging Face Space
+BASE_URL = "https://danilohssantana-qwen2-5-vl-api.hf.space"
+# Image URL to be encoded
+image_url = "https://cdn.britannica.com/35/238335-050-2CB2EB8A/Lionel-Messi-Argentina-Netherlands-World-Cup-Qatar-2022.jpg"
+# Step 1: Download the image
+response = requests.get(image_url)
+if response.status_code != 200:
+    print("Error downloading image:", response.status_code, response.text)
+    exit()
+# Step 2: Send the image to the encode-image endpoint
+files = {"file": ("image.jpg", response.content, "image/jpeg")}
+encode_response = requests.post(f"{BASE_URL}/encode-image/", files=files)
+if encode_response.status_code != 200:
+    print("Error encoding image:", encode_response.status_code, encode_response.text)
+    exit()
+encoded_image = encode_response.json().get("encoded_image")
+# Step 3: Send the encoded image to the predict endpoint
+predict_payload = {
+    "image_base64": encoded_image,
+    "prompt": "describe the image",
 }
+predict_response = requests.get(f"{BASE_URL}/predict", params=predict_payload)
+# Step 4: Print the response
+if predict_response.status_code == 200:
+    print("Response:", predict_response.json())
 else:
+    print("Error:", predict_response.status_code, predict_response.text)