dammy committed on
Commit
b4c7950
·
1 Parent(s): 5d050f0

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +13 -2
app.py CHANGED
@@ -4,8 +4,9 @@ from langchain.text_splitter import CharacterTextSplitter
4
 
5
 
6
  def extract_text(pdf_file):
 
7
  # Load a document
8
- loader = PDFMinerLoader("cereal.pdf")
9
  doc = loader.load()
10
 
11
  text_splitter = CharacterTextSplitter(chunk_size=1000, chunk_overlap=0)
@@ -15,9 +16,19 @@ def extract_text(pdf_file):
15
 
16
  return texts[0]
17
 
 
 
 
 
 
 
 
 
 
 
18
  iface = gr.Interface(
19
  fn=extract_text,
20
- inputs=gr.File(type="file", label="Upload PDF"),
21
  outputs="text"
22
  )
23
 
 
4
 
5
 
6
  def extract_text(pdf_file):
7
+
8
  # Load a document
9
+ loader = PDFMinerLoader(pdf_file)
10
  doc = loader.load()
11
 
12
  text_splitter = CharacterTextSplitter(chunk_size=1000, chunk_overlap=0)
 
16
 
17
  return texts[0]
18
 
19
+
20
+ # def upload_file(file):
21
+ # return file.name
22
+
23
+ # with gr.Blocks() as demo:
24
+ # file_output = gr.File()
25
+ # upload_button = gr.UploadButton("Click to Upload a File", file_types="file")
26
+ # upload_button.upload(upload_file, upload_button, file_output)
27
+
28
+
29
  iface = gr.Interface(
30
  fn=extract_text,
31
+ inputs=gr.File(type="filepath", label="Upload PDF"),
32
  outputs="text"
33
  )
34