bokesyo commited on
Commit
9dbc707
·
verified ·
1 Parent(s): 4061826

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +11 -1
app.py CHANGED
@@ -184,9 +184,19 @@ model.to(device)
184
 
185
 
186
  with gr.Blocks() as app:
187
- gr.Markdown("# Memex: OCR-free Visual Document Retrieval @RhapsodyAI")
 
 
 
 
 
 
 
 
 
188
 
189
  gr.Markdown("- We open-sourced our model at [RhapsodyAI/minicpm-visual-embedding-v0](https://huggingface.co/RhapsodyAI/minicpm-visual-embedding-v0)")
 
190
  gr.Markdown("- Currently we support PDF document with less than 50 pages, PDF over 50 pages will reach GPU time limit.")
191
 
192
  with gr.Row():
 
184
 
185
 
186
  with gr.Blocks() as app:
187
+ gr.Markdown("# Memex: OCR-free Visual Document Embedding Model as Your Personal Librarian")
188
+ gr.Markdown("""The model only takes images as document-side inputs and produce vectors representing document pages. Memex is trained with over 200k query-visual document pairs, including textual document, visual document, arxiv figures, plots, charts, industry documents, textbooks, ebooks, and openly-available PDFs, etc. Its performance is on a par with our ablation text embedding model on text-oriented documents, and an advantages on visually-intensive documents.
189
+
190
+ Our model is capable of:
191
+
192
+ - Help you read a long visually-intensive or text-oriented PDF document and find the pages that answer your question.
193
+
194
+ - Help you build a personal library and retireve book pages from a large collection of books.
195
+
196
+ - It works like human: read and comprehend with vision and remember multimodal information in hippocampus.""")
197
 
198
  gr.Markdown("- We open-sourced our model at [RhapsodyAI/minicpm-visual-embedding-v0](https://huggingface.co/RhapsodyAI/minicpm-visual-embedding-v0)")
199
+
200
  gr.Markdown("- Currently we support PDF document with less than 50 pages, PDF over 50 pages will reach GPU time limit.")
201
 
202
  with gr.Row():