Spaces:

gryan-galario
/

manga-ocr-demo

Running

gryan-galario committed on Mar 27, 2022

Commit

ff3e8f8

1 Parent(s): 5bdac5f

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,5 +1,41 @@
 import gradio as gr
-from transformers import pipeline
-pipe = pipeline(model="kha-white/manga-ocr-base")
-gr.Interface.from_pipeline(pipe, title="Manga OCR", description="Japanese Character Recognization from Mangas", allow_flagging="never").launch(inbrowser=True)

 import gradio as gr
+import re
+import jaconv
+import requests
+import torch
+from PIL import Image
+from transformers import AutoTokenizer, AutoModel, AutoFeatureExtractor
+tokenizer = AutoTokenizer.from_pretrained("kha-white/manga-ocr-base")
+model = AutoModel.from_pretrained("kha-white/manga-ocr-base")
+feature_extractor = AutoFeatureExtractor.from_pretrained("kha-white/manga-ocr-base")
+def post_process(text):
+  text = ''.join(text.split())
+  text = text.replace('…', '...')
+  text = re.sub('[・.]{2,}', lambda x: (x.end() - x.start()) * '.', text)
+  text = jaconv.h2z(text, ascii=True, digit=True)
+  return text
+def manga_ocr(img):
+  img = Image.open(img)
+  img = img.convert('L').convert('RGB')
+  pixel_values = self.feature_extractor(img, return_tensors="pt").pixel_values
+  output = model.generate(pixel_values)[0]
+  text = tokenizer.decode(ouput, skip_special_tokens=True)
+  text = post_process(text)
+  return text
+iface = gr.Interface(
+    fn=infer,
+    inputs=[gr.inputs.Image(label="Input", type="pil")],
+    outputs="text",
+    layout="horizontal",
+    theme="huggingface",
+    title="Manga OCR",
+    description="Japanese Character Recognization from Mangas",
+    allow_flagging='never',
+)
+iface.launch(inbrowser=True)