Spaces:

OmidSakaki
/

DocQA_Agent

Sleeping

App Files Community

OmidSakaki committed on Jul 2

Commit

1f0a2e7

verified ·

1 Parent(s): 35b0235

Update app.py

Browse files

Files changed (1) hide show

app.py +26 -26

app.py CHANGED Viewed

@@ -8,7 +8,7 @@ from doctr.models import ocr_predictor
 # Initialize models
 models = {
-    "EasyOCR": easyocr.Reader(['en']),
     "TrOCR": {
         "processor": TrOCRProcessor.from_pretrained("microsoft/trocr-base-printed"),
         "model": VisionEncoderDecoderModel.from_pretrained("microsoft/trocr-base-printed")
@@ -17,24 +17,24 @@ models = {
 }
 def run_easyocr(image):
-    """Run EasyOCR on image"""
     try:
         result = models["EasyOCR"].readtext(np.array(image), detail=0)
         return ' '.join(result) if result else ''
     except Exception as e:
-        return f"Error: {str(e)}"
 def run_trocr(image):
-    """Run TrOCR on image"""
     try:
         pixel_values = models["TrOCR"]["processor"](image, return_tensors="pt").pixel_values
         generated_ids = models["TrOCR"]["model"].generate(pixel_values)
         return models["TrOCR"]["processor"].batch_decode(generated_ids, skip_special_tokens=True)[0]
     except Exception as e:
-        return f"Error: {str(e)}"
 def run_doctr(image):
-    """Run DocTR on image"""
     try:
         if isinstance(image, Image.Image):
             image = np.array(image)
@@ -42,10 +42,10 @@ def run_doctr(image):
         return ' '.join([word[0] for page in result.pages for block in page.blocks
                         for line in block.lines for word in line.words])
     except Exception as e:
-        return f"Error: {str(e)}"
 def compare_models(image):
-    """Compare all OCR models"""
     if isinstance(image, np.ndarray):
         image = Image.fromarray(image)
     image = image.convert("RGB")
@@ -53,7 +53,7 @@ def compare_models(image):
     results = {}
     times = {}
-    # Run all OCR models
     for name, func in [("EasyOCR", run_easyocr),
                       ("TrOCR", run_trocr),
                       ("DocTR", run_doctr)]:
@@ -61,14 +61,14 @@ def compare_models(image):
         results[name] = func(image)
         times[name] = time.time() - start
-    # Create comparison table
     table_rows = []
     for name in results:
         table_rows.append(f"""
         <tr>
             <td style="padding: 8px; border: 1px solid #ddd; text-align: center; font-weight: bold;">{name}</td>
-            <td style="padding: 8px; border: 1px solid #ddd;">{results[name]}</td>
-            <td style="padding: 8px; border: 1px solid #ddd; text-align: center;">{times[name]:.3f}s</td>
         </tr>
         """)
@@ -76,9 +76,9 @@ def compare_models(image):
     <div style="overflow-x: auto;">
     <table style="width:100%; border-collapse: collapse; margin: 15px 0; font-family: Arial, sans-serif;">
         <tr style="background-color: #4CAF50; color: white;">
-            <th style="padding: 12px; border: 1px solid #ddd; text-align: center;">Model</th>
-            <th style="padding: 12px; border: 1px solid #ddd; text-align: center;">Extracted Text</th>
-            <th style="padding: 12px; border: 1px solid #ddd; text-align: center;">Processing Time</th>
         </tr>
         {''.join(table_rows)}
     </table>
@@ -87,27 +87,27 @@ def compare_models(image):
     return comparison, results['EasyOCR'], results['TrOCR'], results['DocTR']
-# Create Gradio interface
-with gr.Blocks(title="English OCR Comparison", theme=gr.themes.Soft()) as demo:
     gr.Markdown("""
-    # 🚀 English OCR Model Comparison
-    Compare the performance of top OCR models for English text extraction
     """)
     with gr.Row():
         with gr.Column():
-            img_input = gr.Image(label="Upload Image", type="pil")
             gr.Examples(
-                examples=["sample1.jpg", "sample2.png"],
                 inputs=img_input,
-                label="Try these sample images"
             )
-            submit_btn = gr.Button("Compare Models", variant="primary")
         with gr.Column():
-            comparison = gr.HTML(label="Comparison Results")
-            with gr.Accordion("Detailed Results", open=False):
-                gr.Markdown("### Individual Model Outputs")
                 easy_output = gr.Textbox(label="EasyOCR")
                 trocr_output = gr.Textbox(label="TrOCR")
                 doctr_output = gr.Textbox(label="DocTR")

 # Initialize models
 models = {
+    "EasyOCR": easyocr.Reader(['fa']),  # تنظیم زبان فارسی
     "TrOCR": {
         "processor": TrOCRProcessor.from_pretrained("microsoft/trocr-base-printed"),
         "model": VisionEncoderDecoderModel.from_pretrained("microsoft/trocr-base-printed")
 }
 def run_easyocr(image):
+    """تابع پردازش تصویر با EasyOCR برای فارسی"""
     try:
         result = models["EasyOCR"].readtext(np.array(image), detail=0)
         return ' '.join(result) if result else ''
     except Exception as e:
+        return f"خطا: {str(e)}"
 def run_trocr(image):
+    """تابع پردازش تصویر با TrOCR برای فارسی"""
     try:
         pixel_values = models["TrOCR"]["processor"](image, return_tensors="pt").pixel_values
         generated_ids = models["TrOCR"]["model"].generate(pixel_values)
         return models["TrOCR"]["processor"].batch_decode(generated_ids, skip_special_tokens=True)[0]
     except Exception as e:
+        return f"خطا: {str(e)}"
 def run_doctr(image):
+    """تابع پردازش تصویر با DocTR برای فارسی"""
     try:
         if isinstance(image, Image.Image):
             image = np.array(image)
         return ' '.join([word[0] for page in result.pages for block in page.blocks
                         for line in block.lines for word in line.words])
     except Exception as e:
+        return f"خطا: {str(e)}"
 def compare_models(image):
+    """تابع اصلی مقایسه مدل‌ها"""
     if isinstance(image, np.ndarray):
         image = Image.fromarray(image)
     image = image.convert("RGB")
     results = {}
     times = {}
+    # اجرای تمام مدل‌های OCR
     for name, func in [("EasyOCR", run_easyocr),
                       ("TrOCR", run_trocr),
                       ("DocTR", run_doctr)]:
         results[name] = func(image)
         times[name] = time.time() - start
+    # ایجاد جدول مقایسه
     table_rows = []
     for name in results:
         table_rows.append(f"""
         <tr>
             <td style="padding: 8px; border: 1px solid #ddd; text-align: center; font-weight: bold;">{name}</td>
+            <td style="padding: 8px; border: 1px solid #ddd; text-align: right; direction: rtl;">{results[name]}</td>
+            <td style="padding: 8px; border: 1px solid #ddd; text-align: center;">{times[name]:.3f} ثانیه</td>
         </tr>
         """)
     <div style="overflow-x: auto;">
     <table style="width:100%; border-collapse: collapse; margin: 15px 0; font-family: Arial, sans-serif;">
         <tr style="background-color: #4CAF50; color: white;">
+            <th style="padding: 12px; border: 1px solid #ddd; text-align: center;">مدل</th>
+            <th style="padding: 12px; border: 1px solid #ddd; text-align: center;">متن استخراج شده</th>
+            <th style="padding: 12px; border: 1px solid #ddd; text-align: center;">زمان پردازش</th>
         </tr>
         {''.join(table_rows)}
     </table>
     return comparison, results['EasyOCR'], results['TrOCR'], results['DocTR']
+# رابط کاربری Gradio
+with gr.Blocks(title="مقایسه مدل‌های OCR فارسی", theme=gr.themes.Soft()) as demo:
     gr.Markdown("""
+    # 🚀 مقایسه مدل‌های تشخیص متن فارسی
+    مقایسه عملکرد مدل‌های مختلف OCR برای استخراج متن از تصاویر فارسی
     """)
     with gr.Row():
         with gr.Column():
+            img_input = gr.Image(label="تصویر ورودی", type="pil")
             gr.Examples(
+                examples=["sample_fa1.jpg", "sample_fa2.png"],
                 inputs=img_input,
+                label="تصاویر نمونه"
             )
+            submit_btn = gr.Button("مقایسه مدل‌ها", variant="primary")
         with gr.Column():
+            comparison = gr.HTML(label="نتایج مقایسه")
+            with gr.Accordion("نتایج تفکیکی", open=False):
+                gr.Markdown("### خروجی هر مدل")
                 easy_output = gr.Textbox(label="EasyOCR")
                 trocr_output = gr.Textbox(label="TrOCR")
                 doctr_output = gr.Textbox(label="DocTR")