Spaces:

OmidSakaki
/

DocQA_Agent

Sleeping

OmidSakaki committed on Jul 2

Commit

dd4c7df

verified ·

1 Parent(s): abcd869

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -2,33 +2,41 @@ import gradio as gr
 import time
 import numpy as np
 from PIL import Image
-from paddleocr import PaddleOCR
 from transformers import TrOCRProcessor, VisionEncoderDecoderModel
-# Initialize models
-paddle_ocr = PaddleOCR(lang='fa', use_textline_orientation=True)
 trocr_processor = TrOCRProcessor.from_pretrained("microsoft/trocr-base-printed")
 trocr_model = VisionEncoderDecoderModel.from_pretrained("microsoft/trocr-base-printed")
 def run_paddleocr(image):
     """Run PaddleOCR on image"""
-    # Convert to numpy array if needed
     if isinstance(image, Image.Image):
         image = np.array(image)
-    result = paddle_ocr.ocr(image, cls=True)
-    text = ' '.join([line[1][0] for line in result[0]]) if result else ''
-    return text
 def run_trocr(image):
     """Run TrOCR on image"""
-    # Convert to PIL Image if needed
     if isinstance(image, np.ndarray):
         image = Image.fromarray(image)
-    pixel_values = trocr_processor(image, return_tensors="pt").pixel_values
-    generated_ids = trocr_model.generate(pixel_values)
-    return trocr_processor.batch_decode(generated_ids, skip_special_tokens=True)[0]
 def compare_models(image):
     """Compare PaddleOCR and TrOCR models"""

 import time
 import numpy as np
 from PIL import Image
+try:
+    from paddleocr import PaddleOCR
+    paddle_ocr = PaddleOCR(lang='fa', use_textline_orientation=True)
+except ImportError:
+    raise ImportError("لطفا ابتدا paddlepaddle و paddleocr را نصب کنید: pip install paddlepaddle paddleocr")
 from transformers import TrOCRProcessor, VisionEncoderDecoderModel
+# Initialize TrOCR
 trocr_processor = TrOCRProcessor.from_pretrained("microsoft/trocr-base-printed")
 trocr_model = VisionEncoderDecoderModel.from_pretrained("microsoft/trocr-base-printed")
 def run_paddleocr(image):
     """Run PaddleOCR on image"""
     if isinstance(image, Image.Image):
         image = np.array(image)
+    try:
+        result = paddle_ocr.ocr(image, cls=True)
+        return ' '.join([line[1][0] for line in result[0]]) if result else ''
+    except Exception as e:
+        return f"خطا در PaddleOCR: {str(e)}"
 def run_trocr(image):
     """Run TrOCR on image"""
     if isinstance(image, np.ndarray):
         image = Image.fromarray(image)
+    try:
+        pixel_values = trocr_processor(image, return_tensors="pt").pixel_values
+        generated_ids = trocr_model.generate(pixel_values)
+        return trocr_processor.batch_decode(generated_ids, skip_special_tokens=True)[0]
+    except Exception as e:
+        return f"خطا در TrOCR: {str(e)}"
 def compare_models(image):
     """Compare PaddleOCR and TrOCR models"""