peterciank committed on
Commit
709eae1
·
verified ·
1 Parent(s): 7010bf6

Update pages/Phase1.py

Browse files
Files changed (1) hide show
  1. pages/Phase1.py +8 -1
pages/Phase1.py CHANGED
@@ -2,6 +2,7 @@ import streamlit as st
2
  from huggingface_hub import InferenceClient
3
  import fitz # PyMuPDF
4
  import os
 
5
 
6
  st.title("ChatGPT-like Chatbot")
7
 
@@ -33,11 +34,17 @@ def reset_conversation():
33
  return None
34
 
35
  def read_pdf(file):
36
- pdf_document = fitz.open(file)
 
 
 
 
37
  text = ""
38
  for page_num in range(len(pdf_document)):
39
  page = pdf_document[page_num]
40
  text += page.get_text()
 
 
41
  return text
42
 
43
  models = [key for key in model_links.keys()]
 
2
  from huggingface_hub import InferenceClient
3
  import fitz # PyMuPDF
4
  import os
5
+ import tempfile
6
 
7
  st.title("ChatGPT-like Chatbot")
8
 
 
34
  return None
35
 
36
  def read_pdf(file):
37
+ with tempfile.NamedTemporaryFile(delete=False, suffix=".pdf") as tmp_file:
38
+ tmp_file.write(file.read())
39
+ tmp_file_path = tmp_file.name
40
+
41
+ pdf_document = fitz.open(tmp_file_path)
42
  text = ""
43
  for page_num in range(len(pdf_document)):
44
  page = pdf_document[page_num]
45
  text += page.get_text()
46
+
47
+ os.remove(tmp_file_path)
48
  return text
49
 
50
  models = [key for key in model_links.keys()]