Spaces:

G4EducFse
/

MonCorrecteurFrancais

Runtime error

TheOnlyHatem committed on Feb 17

Commit

405c6a7

verified ·

1 Parent(s): d6347df

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,28 +1,30 @@
 import gradio as gr
-from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
 import torch
-# Utilisation du modèle sdadas/byt5-text-correction
-model_name = "sdadas/byt5-text-correction"
-tokenizer = AutoTokenizer.from_pretrained(model_name)
-model = AutoModelForSeq2SeqLM.from_pretrained(model_name)
 device = "cuda" if torch.cuda.is_available() else "cpu"
 model.to(device)
 def correction_grammaticale(texte):
-    # Pour le français, on ajoute le préfixe "<fr>" devant le texte
-    input_text = "<fr> " + texte
-    input_ids = tokenizer.encode(input_text, return_tensors="pt").to(device)
     outputs = model.generate(
-        input_ids,
         max_length=512,
         num_beams=4,
         early_stopping=True
     )
     correction = tokenizer.decode(outputs[0], skip_special_tokens=True)
     return correction
@@ -30,7 +32,7 @@ demo = gr.Interface(
     fn=correction_grammaticale,
     inputs=gr.Textbox(label="Texte à corriger"),
     outputs=gr.Textbox(label="Texte corrigé"),
-    title="Correcteur de Texte Français"
 )
 if __name__ == "__main__":

 import gradio as gr
 import torch
+from transformers import MBartForConditionalGeneration, MBartTokenizer
+# Remplace par ton repo exact si besoin :
+model_name = "alice/mini/mBART_french_correction"
+# Chargement du tokenizer et du modèle
+tokenizer = MBartTokenizer.from_pretrained(model_name)
+model = MBartForConditionalGeneration.from_pretrained(model_name)
 device = "cuda" if torch.cuda.is_available() else "cpu"
 model.to(device)
 def correction_grammaticale(texte):
+    # Tokenisation
+    inputs = tokenizer(texte, return_tensors="pt", max_length=512, truncation=True).to(device)
+    # Génération
     outputs = model.generate(
+        **inputs,
         max_length=512,
         num_beams=4,
         early_stopping=True
     )
+    # Décodage
     correction = tokenizer.decode(outputs[0], skip_special_tokens=True)
     return correction
     fn=correction_grammaticale,
     inputs=gr.Textbox(label="Texte à corriger"),
     outputs=gr.Textbox(label="Texte corrigé"),
+    title="Correcteur MBART Français"
 )
 if __name__ == "__main__":