Update app1.py
Browse files
app1.py
CHANGED
@@ -2,6 +2,7 @@ import time
|
|
2 |
import os
|
3 |
import gradio as gr
|
4 |
from langchain.document_loaders import PyPDFLoader
|
|
|
5 |
|
6 |
ABS_PATH = os.path.dirname(os.path.abspath(__file__))
|
7 |
DB_DIR = os.path.join(ABS_PATH, "db")
|
@@ -13,8 +14,13 @@ async()=>{
|
|
13 |
"""
|
14 |
|
15 |
def get_documents():
|
16 |
-
return PyPDFLoader("doc1.pdf"
|
17 |
-
|
|
|
|
|
|
|
|
|
|
|
18 |
|
19 |
def extract_pdfs(x, request: gr.Request, progress=gr.Progress()):
|
20 |
progress(0, desc="Test", unit = "Files")
|
|
|
2 |
import os
|
3 |
import gradio as gr
|
4 |
from langchain.document_loaders import PyPDFLoader
|
5 |
+
#from langchain.document_loaders import PyMuPDFLoader
|
6 |
|
7 |
ABS_PATH = os.path.dirname(os.path.abspath(__file__))
|
8 |
DB_DIR = os.path.join(ABS_PATH, "db")
|
|
|
14 |
"""
|
15 |
|
16 |
def get_documents():
|
17 |
+
return PyPDFLoader("doc1.pdf").load()
|
18 |
+
"""
|
19 |
+
loader = PyMuPDFLoader(
|
20 |
+
"example.pdf", extract_images=True,
|
21 |
+
)
|
22 |
+
docs = loader.load()
|
23 |
+
"""
|
24 |
|
25 |
def extract_pdfs(x, request: gr.Request, progress=gr.Progress()):
|
26 |
progress(0, desc="Test", unit = "Files")
|