Spaces:

OmidSakaki
/

DocQA_Agent

Sleeping

App Files Files Community

OmidSakaki committed on Jul 2

Commit

279ab91

verified ·

1 Parent(s): fc0e7b8

Update app.py

Browse files

Files changed (1) hide show

app.py +17 -24

app.py CHANGED Viewed

@@ -6,21 +6,22 @@ import os
 # --- مدل‌ها ---
 try:
-    model_name = "persiannlp/mt5-small-parsinlu-opus-translation"
     ocr_model = PaddleOCR(lang='fa', use_textline_orientation=True)
     tokenizer = AutoTokenizer.from_pretrained(model_name)
     nlp_model = AutoModelForSeq2SeqLM.from_pretrained(model_name)
 except Exception as e:
-    raise gr.Error(f"خطا در بارگذاری مدل‌ها: لطفاً از موجود بودن مدل اطمینان حاصل کنید. خطا: {str(e)}")
 # --- توابع پردازش ---
 def run_ocr(image):
-    image_path = image.name  # مسیر فایل موقت
     result = ocr_model.ocr(image_path, cls=True)
     texts = [line[1][0] for line in result[0]] if result else []
-    os.remove(image_path)  # حذف فایل موقت
     return " ".join(texts)
 def postprocess_text(text):
@@ -28,32 +29,24 @@ def postprocess_text(text):
     outputs = nlp_model.generate(**inputs)
     return tokenizer.decode(outputs[0], skip_special_tokens=True)
-def process_image(image):
-    raw_text = run_ocr(image)
-    processed_text = postprocess_text(raw_text) if raw_text else "متنی یافت نشد!"
-    return raw_text, processed_text
-# --- رابط Gradio ---
-with gr.Blocks(title="OCR فارسی با پردازش NLP") as app:
-    gr.Markdown("## 🔠 OCR فارسی + پردازش متن با مدل زبانی")
-    gr.Markdown("متن را از تصاویر استخراج کنید و با مدل زبانی اصلاح کنید!")
     with gr.Row():
-        image_input = gr.Image(type="filepath", label="تصویر ورودی")
         with gr.Column():
-            raw_text_output = gr.Textbox(label="متن خام (OCR)")
-            processed_text_output = gr.Textbox(label="متن پردازش‌شده (NLP)")
-    submit_btn = gr.Button("پردازش تصویر")
-    submit_btn.click(
-        fn=process_image,
         inputs=image_input,
-        outputs=[raw_text_output, processed_text_output]
     )
-    gr.Markdown("---")
-    gr.Markdown("### راهنما:\n1. تصویری حاوی متن فارسی آپلود کنید.\n2. روی دکمه پردازش کلیک کنید.")
-# اجرای برنامه
 if __name__ == "__main__":
     app.launch()

 # --- Models ---
 # New model: tested and working. This checkpoint name is passed to both
 # `from_pretrained` calls below.
 model_name = "m3hrdadfi/mt5-small-parsinlu-grammar-correction"

 # Load the OCR engine, tokenizer and seq2seq model once at start-up; any
 # failure is re-raised as a `gr.Error` carrying the original message.
 try:
     ocr_model = PaddleOCR(
         lang='fa',
         use_textline_orientation=True,
     )
     tokenizer = AutoTokenizer.from_pretrained(model_name)
     nlp_model = AutoModelForSeq2SeqLM.from_pretrained(model_name)
 except Exception as exc:
     raise gr.Error(f"خطا در بارگذاری مدل‌ها: لطفاً این خطا را به توسعه دهنده گزارش دهید. خطا: {str(exc)}")
 # --- توابع پردازش ---
 def run_ocr(image):
     """Extract the text found in an image and return it as a single string.

     Args:
         image: Path to the image file (``str`` or ``os.PathLike``; this is
             what a ``gr.Image(type="filepath")`` input passes), or an object
             exposing the path through a ``name`` attribute. ``None`` (no
             image supplied) is accepted.

     Returns:
         The recognized text lines joined by single spaces, or ``""`` when no
         image was supplied or no text was detected.
     """
     if image is None:
         return ""

     # Plain paths are used directly; tempfile-style wrappers carry the path
     # in `.name`.
     if isinstance(image, (str, os.PathLike)):
         image_path = os.fspath(image)
     else:
         image_path = image.name
     if not image_path:
         return ""

     # NOTE(review): `cls=True` looks like the PaddleOCR 2.x call style while
     # the constructor uses `use_textline_orientation` - confirm both match
     # the installed PaddleOCR version.
     result = ocr_model.ocr(image_path, cls=True)

     # The input file is intentionally left in place: the upload belongs to
     # the caller, and deleting it here breaks any second call with the same
     # path (for example a repeated click on the same image).

     # Presumably a page with no detected text can come back as None/empty
     # instead of a list of lines - guard before iterating.
     if not result or not result[0]:
         return ""
     return " ".join(line[1][0] for line in result[0])
 def postprocess_text(text):
     outputs = nlp_model.generate(**inputs)
     return tokenizer.decode(outputs[0], skip_special_tokens=True)
+# --- رابط کاربری ---
+with gr.Blocks() as app:
+    gr.Markdown("## سیستم OCR فارسی با پردازش پیشرفته متن")
     with gr.Row():
         with gr.Column():
+            image_input = gr.Image(type="filepath", label="تصویر ورودی")
+            process_btn = gr.Button("پردازش تصویر")
+        with gr.Column():
+            raw_output = gr.Textbox(label="متن استخراج شده")
+            processed_output = gr.Textbox(label="متن پردازش شده")
+    process_btn.click(
+        fn=lambda img: (run_ocr(img), postprocess_text(run_ocr(img))),
         inputs=image_input,
+        outputs=[raw_output, processed_output]
     )
 if __name__ == "__main__":
     app.launch()