Spaces:
Running
on
Zero
Running
on
Zero
Update app.py
Browse files
app.py
CHANGED
@@ -184,9 +184,19 @@ model.to(device)
|
|
184 |
|
185 |
|
186 |
with gr.Blocks() as app:
|
187 |
-
gr.Markdown("# Memex: OCR-free Visual Document
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
188 |
|
189 |
gr.Markdown("- We open-sourced our model at [RhapsodyAI/minicpm-visual-embedding-v0](https://huggingface.co/RhapsodyAI/minicpm-visual-embedding-v0)")
|
|
|
190 |
gr.Markdown("- Currently we support PDF document with less than 50 pages, PDF over 50 pages will reach GPU time limit.")
|
191 |
|
192 |
with gr.Row():
|
|
|
184 |
|
185 |
|
186 |
with gr.Blocks() as app:
|
187 |
+
gr.Markdown("# Memex: OCR-free Visual Document Embedding Model as Your Personal Librarian")
|
188 |
+
gr.Markdown("""The model only takes images as document-side inputs and produce vectors representing document pages. Memex is trained with over 200k query-visual document pairs, including textual document, visual document, arxiv figures, plots, charts, industry documents, textbooks, ebooks, and openly-available PDFs, etc. Its performance is on a par with our ablation text embedding model on text-oriented documents, and an advantages on visually-intensive documents.
|
189 |
+
|
190 |
+
Our model is capable of:
|
191 |
+
|
192 |
+
- Help you read a long visually-intensive or text-oriented PDF document and find the pages that answer your question.
|
193 |
+
|
194 |
+
- Help you build a personal library and retireve book pages from a large collection of books.
|
195 |
+
|
196 |
+
- It works like human: read and comprehend with vision and remember multimodal information in hippocampus.""")
|
197 |
|
198 |
gr.Markdown("- We open-sourced our model at [RhapsodyAI/minicpm-visual-embedding-v0](https://huggingface.co/RhapsodyAI/minicpm-visual-embedding-v0)")
|
199 |
+
|
200 |
gr.Markdown("- Currently we support PDF document with less than 50 pages, PDF over 50 pages will reach GPU time limit.")
|
201 |
|
202 |
with gr.Row():
|