Spaces:

virendravaishnav
/

po-fetch-detail

Sleeping

virendravaishnav committed on Sep 13, 2024

Commit

a02d815

1 Parent(s): 5426c44

Updated with OCR model and Gradio integration

Files changed (1) hide show

app.py CHANGED Viewed

@@ -7,17 +7,22 @@ repo_id = "OpenGVLab/InternVL2-1B"
 # Load the tokenizer, processor, and model directly from the Hub
 tokenizer = AutoTokenizer.from_pretrained(repo_id, trust_remote_code=True)
 processor = AutoProcessor.from_pretrained(repo_id, trust_remote_code=True)
-model = AutoModel.from_pretrained(repo_id, trust_remote_code=True)
 # Move model to the appropriate device
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 model.to(device)
 def analyze_image(image):
-    img = image.convert("RGB")
-    inputs = processor(images=img, text="describe this image", return_tensors="pt").to(device)
-    outputs = model.generate(**inputs)
-    return tokenizer.decode(outputs[0], skip_special_tokens=True)
 demo = gr.Interface(
     fn=analyze_image,

 # Load the tokenizer, processor, and model directly from the Hub
 tokenizer = AutoTokenizer.from_pretrained(repo_id, trust_remote_code=True)
 processor = AutoProcessor.from_pretrained(repo_id, trust_remote_code=True)
+model = AutoModel.from_pretrained(
+    repo_id, trust_remote_code=True, torch_dtype=torch.float16
+)
 # Move model to the appropriate device
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 model.to(device)
 def analyze_image(image):
+    try:
+        img = image.convert("RGB")
+        inputs = processor(images=img, text="describe this image", return_tensors="pt").to(device)
+        outputs = model.generate(**inputs)
+        return tokenizer.decode(outputs[0], skip_special_tokens=True)
+    except Exception as e:
+        return f"An error occurred: {str(e)}"
 demo = gr.Interface(
     fn=analyze_image,