SuperSl6's picture
Update app.py
a827e42 verified
raw
history blame
1.07 kB
from transformers import pipeline, AutoTokenizer
import gradio as gr
# Load tokenizer with use_fast=False
tokenizer = AutoTokenizer.from_pretrained("SuperSl6/Arabic-Text-Correction", use_fast=False)
model = pipeline(
"text2text-generation",
model="SuperSl6/Arabic-Text-Correction",
tokenizer=tokenizer
)
def correct_text(input_text):
result = model(
input_text,
max_length=50, # Limit output length
no_repeat_ngram_size=2, # Prevent repeating bigrams
repetition_penalty=1.5, # Penalize repetitions
num_return_sequences=1 # Return a single output
)[0]['generated_text']
return result
# Gradio Interface
interface = gr.Interface(
fn=correct_text,
inputs=gr.Textbox(lines=3, placeholder="أدخل النص العربي هنا..."),
outputs=gr.Textbox(),
live=True,
title="تصحيح النص العربي",
description="أداة لتصحيح النصوص العربية باستخدام نموذج SuperSl6/Arabic-Text-Correction."
)
interface.launch()