Spaces:

baudm
/

PARSeq-OCR

Running

Upload 3.gif

by nctuan - opened Jul 31, 2022

←

Files changed (4) hide show

3.gif ADDED Viewed

README.md CHANGED Viewed

@@ -4,7 +4,7 @@ emoji: 📚
 colorFrom: red
 colorTo: purple
 sdk: gradio
-sdk_version: 4.36.1
 python_version: 3.9.13
 app_file: app.py
 pinned: false

 colorFrom: red
 colorTo: purple
 sdk: gradio
+sdk_version: 3.1.0
 python_version: 3.9.13
 app_file: app.py
 pinned: false

app.py CHANGED Viewed

@@ -37,16 +37,14 @@ class App:
     def _get_model(self, name):
         if name in self._model_cache:
             return self._model_cache[name]
-        model = torch.hub.load('baudm/parseq', name, pretrained=True, trust_repo=True).eval()
         self._model_cache[name] = model
         return model
-    @torch.inference_mode()
     def __call__(self, model_name, image):
         if image is None:
             return '', []
-        if isinstance(image, dict):  # Extract image from ImageEditor output
-            image = image['composite']
         model = self._get_model(model_name)
         image = self._preprocess(image.convert('RGB')).unsqueeze(0)
         # Greedy decoding
@@ -81,11 +79,11 @@ def main():
         model_name = gr.Radio(app.models, value=app.models[0], label='The STR model to use')
         with gr.Tabs():
             with gr.TabItem('Image Upload'):
-                image_upload = gr.Image(type='pil', sources=['upload'], label='Image')
                 gr.Examples(glob.glob('demo_images/*.*'), inputs=image_upload)
                 read_upload = gr.Button('Read Text')
             with gr.TabItem('Canvas Sketch'):
-                image_canvas = gr.ImageEditor(type='pil', sources=[], label='Sketch', image_mode='RGB', layers=False, canvas_size=(768, 192))
                 read_canvas = gr.Button('Read Text')
         output = gr.Textbox(max_lines=1, label='Model output')

     def _get_model(self, name):
         if name in self._model_cache:
             return self._model_cache[name]
+        model = torch.hub.load('baudm/parseq', name, pretrained=True).eval()
+        model.freeze()
         self._model_cache[name] = model
         return model
     def __call__(self, model_name, image):
         if image is None:
             return '', []
         model = self._get_model(model_name)
         image = self._preprocess(image.convert('RGB')).unsqueeze(0)
         # Greedy decoding
         model_name = gr.Radio(app.models, value=app.models[0], label='The STR model to use')
         with gr.Tabs():
             with gr.TabItem('Image Upload'):
+                image_upload = gr.Image(type='pil', source='upload', label='Image')
                 gr.Examples(glob.glob('demo_images/*.*'), inputs=image_upload)
                 read_upload = gr.Button('Read Text')
             with gr.TabItem('Canvas Sketch'):
+                image_canvas = gr.Image(type='pil', source='canvas', label='Sketch')
                 read_canvas = gr.Button('Read Text')
         output = gr.Textbox(max_lines=1, label='Model output')

requirements.txt CHANGED Viewed

@@ -1,8 +1,8 @@
---extra-index-url https://download.pytorch.org/whl/cpu
-gradio ~=4.36.0
-torch >=2.0.0
-torchvision >=0.15.0
-pytorch-lightning ~=2.2.0
-timm ~=0.9.16
 nltk

+Gradio
+torch
+torchtext
+torchvision
+torchmetrics==0.6.2
+timm==0.4.12
 nltk
+git+https://github.com/baudm/parseq.git