prithivMLmods committed on
Commit
75bd5b2
·
verified ·
1 Parent(s): 2f849e9

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -7
app.py CHANGED
@@ -89,10 +89,8 @@ model_i = Qwen2_5_VLForConditionalGeneration.from_pretrained(
89
  MODEL_ID_I, trust_remote_code=True, torch_dtype=torch.float16
90
  ).to(device).eval()
91
 
92
- #-----------------------------------------#
93
-
94
- # Load RolmOCR
95
- MODEL_ID_J = "reducto/RolmOCR"
96
  processor_j = AutoProcessor.from_pretrained(
97
  MODEL_ID_J,
98
  trust_remote_code=True
@@ -102,7 +100,6 @@ model_j = Qwen2_5_VLForConditionalGeneration.from_pretrained(
102
  trust_remote_code=True,
103
  torch_dtype=torch.float16
104
  ).to(device).eval()
105
- #-----------------------------------------#
106
 
107
  # --- Utility Functions ---
108
  def layoutjson2md(layout_data: List[Dict]) -> str:
@@ -154,7 +151,7 @@ def process_document_stream(model_name: str, task_choice: str, image: Image.Imag
154
  elif model_name == "Nanonets-OCR-s": processor, model = processor_c, model_c
155
  elif model_name == "MonkeyOCR-Recognition": processor, model = processor_g, model_g
156
  elif model_name == "olmOCR-7B-0725": processor, model = processor_i, model_i
157
- elif model_name == "RolmOCR": processor, model = processor_j, model_j
158
  else:
159
  yield "Invalid model selected.", "Invalid model selected.", None
160
  return
@@ -224,7 +221,7 @@ def create_gradio_interface():
224
  "olmOCR-7B-0725",
225
  "Nanonets-OCR-s",
226
  "Megalodon-OCR-Sync-0713",
227
- "RolmOCR"
228
  ],
229
  label="Select Model", value="Nanonets-OCR-s"
230
  )
 
89
  MODEL_ID_I, trust_remote_code=True, torch_dtype=torch.float16
90
  ).to(device).eval()
91
 
92
+ # Load typhoon-ocr-3b
93
+ MODEL_ID_J = "scb10x/typhoon-ocr-3b"
 
 
94
  processor_j = AutoProcessor.from_pretrained(
95
  MODEL_ID_J,
96
  trust_remote_code=True
 
100
  trust_remote_code=True,
101
  torch_dtype=torch.float16
102
  ).to(device).eval()
 
103
 
104
  # --- Utility Functions ---
105
  def layoutjson2md(layout_data: List[Dict]) -> str:
 
151
  elif model_name == "Nanonets-OCR-s": processor, model = processor_c, model_c
152
  elif model_name == "MonkeyOCR-Recognition": processor, model = processor_g, model_g
153
  elif model_name == "olmOCR-7B-0725": processor, model = processor_i, model_i
154
+ elif model_name == "typhoon-ocr-3b": processor, model = processor_j, model_j
155
  else:
156
  yield "Invalid model selected.", "Invalid model selected.", None
157
  return
 
221
  "olmOCR-7B-0725",
222
  "Nanonets-OCR-s",
223
  "Megalodon-OCR-Sync-0713",
224
+ "typhoon-ocr-3b"
225
  ],
226
  label="Select Model", value="Nanonets-OCR-s"
227
  )