Spaces:

OmidSakaki
/

DocQA_Agent

Sleeping

App Files Files Community

OmidSakaki committed on Jul 2

Commit

f774dbf

verified ·

1 Parent(s): 57fa964

Update app.py

Browse files

Files changed (1) hide show

app.py +22 -17

app.py CHANGED Viewed

@@ -2,9 +2,8 @@ import gradio as gr
 import easyocr
 import numpy as np
 from typing import Tuple
-from transformers import pipeline
-# --- 1. کلاس OCR برای استخراج متن از تصویر ---
 class OCRProcessor:
     def __init__(self):
         self.reader = easyocr.Reader(['fa'])
@@ -16,32 +15,39 @@ class OCRProcessor:
         except Exception as e:
             raise RuntimeError(f"خطا در پردازش OCR: {str(e)}")
-# --- 2. کلاس تصحیح متن با مدل زبانی ---
 class TextCorrector:
     def __init__(self):
-        # استفاده از مدل ParsBERT برای تصحیح متن فارسی
-        self.corrector = pipeline(
-            "text2text-generation",
-            model="persiannlp/parsbert-uncased",  # مدل زبانی فارسی
-            tokenizer="persiannlp/parsbert-uncased"
-        )
     def correct(self, text: str) -> str:
         if not text.strip():
             return text
         try:
-            corrected = self.corrector(
-                text,
                 max_length=512,
                 num_beams=5,
                 early_stopping=True
             )
-            return corrected[0]['generated_text']
         except Exception as e:
             print(f"خطا در تصحیح متن: {e}")
             return text
-# --- 3. پردازش کامل (OCR + تصحیح خودکار) ---
 def full_processing(image: np.ndarray) -> Tuple[str, str]:
     try:
         # استخراج متن از تصویر
@@ -55,10 +61,9 @@ def full_processing(image: np.ndarray) -> Tuple[str, str]:
         error_msg = f"خطا: {str(e)}"
         return error_msg, error_msg
-# --- 4. رابط کاربری Gradio ---
 with gr.Blocks(title="پایپلاین OCR + تصحیح خودکار متن فارسی") as app:
     gr.Markdown("""
-    # استخراج و تصحیح هوشمند متن فارسی از تصویر
     """)
     with gr.Row():
@@ -66,8 +71,8 @@ with gr.Blocks(title="پایپلاین OCR + تصحیح خودکار متن فا
             img_input = gr.Image(label="تصویر ورودی", type="numpy")
             process_btn = gr.Button("پردازش تصویر", variant="primary")
         with gr.Column():
-            raw_output = gr.Textbox(label="متن استخراج شده (خام)", lines=8, interactive=True)
-            corrected_output = gr.Textbox(label="متن تصحیح شده (هوشمند)", lines=10, interactive=True)
     process_btn.click(
         fn=full_processing,

 import easyocr
 import numpy as np
 from typing import Tuple
+from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
 class OCRProcessor:
     def __init__(self):
         self.reader = easyocr.Reader(['fa'])
         except Exception as e:
             raise RuntimeError(f"خطا در پردازش OCR: {str(e)}")
 class TextCorrector:
     """Rewrite OCR output with a Hugging Face seq2seq language model.

     The tokenizer and model are loaded once at construction time and reused
     for every call to :meth:`correct`.
     """

     # NOTE(review): the checkpoint name suggests a ParsiNLU question-answering
     # model rather than a text-correction model -- confirm it is the intended
     # checkpoint for this task.
     DEFAULT_MODEL_NAME = "persiannlp/mt5-small-parsinlu-arc-comqa-question"

     # Instruction prefix prepended to every input before tokenization.
     PROMPT_PREFIX = "اصلاح متن: "

     # Single token limit used both to truncate the input and to cap the
     # generated output, so the two values cannot drift apart.
     MAX_LENGTH = 512

     def __init__(self, model_name: str = DEFAULT_MODEL_NAME):
         """Load the tokenizer and the seq2seq model.

         Args:
             model_name: Checkpoint identifier passed to ``from_pretrained``.
                 Defaults to :attr:`DEFAULT_MODEL_NAME`.

         Raises:
             RuntimeError: If the tokenizer or the model cannot be loaded. The
                 original exception is chained as ``__cause__``.
         """
         try:
             self.tokenizer = AutoTokenizer.from_pretrained(model_name)
             self.model = AutoModelForSeq2SeqLM.from_pretrained(model_name)
         except Exception as e:
             # Chain the cause so the real loading failure stays in the traceback.
             raise RuntimeError(f"خطا در بارگذاری مدل زبانی: {str(e)}") from e

     def correct(self, text: str) -> str:
         """Return the model's rewrite of ``text``.

         This is a best-effort step: the input is returned unchanged when it is
         blank, when tokenization/generation/decoding raises, or when the model
         produces an empty result.

         Args:
             text: Raw text to rewrite. ``None`` is treated as empty input.

         Returns:
             The decoded model output, or the original text as a fallback
             (``""`` when ``text`` is ``None``).
         """
         if text is None:
             return ""
         if not text.strip():
             return text

         try:
             inputs = self.tokenizer(
                 self.PROMPT_PREFIX + text,
                 return_tensors="pt",
                 max_length=self.MAX_LENGTH,
                 truncation=True,
             )
             outputs = self.model.generate(
                 **inputs,
                 max_length=self.MAX_LENGTH,
                 num_beams=5,
                 early_stopping=True,
             )
             corrected = self.tokenizer.decode(outputs[0], skip_special_tokens=True)
         except Exception as e:
             # Deliberate best-effort: report the failure and keep the raw text.
             print(f"خطا در تصحیح متن: {e}")
             return text

         # An empty generation would discard the OCR text entirely; keep the
         # input instead, matching the fallback used on errors.
         if not corrected.strip():
             return text
         return corrected
 def full_processing(image: np.ndarray) -> Tuple[str, str]:
     try:
         # استخراج متن از تصویر
         error_msg = f"خطا: {str(e)}"
         return error_msg, error_msg
 with gr.Blocks(title="پایپلاین OCR + تصحیح خودکار متن فارسی") as app:
     gr.Markdown("""
+    # سیستم استخراج و تصحیح هوشمند متن فارسی
     """)
     with gr.Row():
             img_input = gr.Image(label="تصویر ورودی", type="numpy")
             process_btn = gr.Button("پردازش تصویر", variant="primary")
         with gr.Column():
+            raw_output = gr.Textbox(label="متن استخراج شده (خام)", lines=8)
+            corrected_output = gr.Textbox(label="متن تصحیح شده (هوشمند)", lines=10)
     process_btn.click(
         fn=full_processing,