rajsecrets0 commited on
Commit
9087ae6
·
verified ·
1 Parent(s): 3b1070b

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +12 -11
app.py CHANGED
@@ -3,7 +3,7 @@ import base64
3
  import requests
4
  from PIL import Image
5
  from io import BytesIO
6
- from pdf2image import convert_from_bytes
7
 
8
  # Configuration - Replace with your API key
9
  GEMINI_API_KEY = st.secrets["GEMINI_API_KEY"]
@@ -34,13 +34,13 @@ def encode_file(uploaded_file):
34
  file_bytes = uploaded_file.getvalue()
35
 
36
  if uploaded_file.type == "application/pdf":
37
- # Specify the path to poppler binaries
38
- poppler_path = "/usr/bin" # Adjust this path if necessary
39
- images = convert_from_bytes(file_bytes, first_page=1, last_page=1, poppler_path=poppler_path)
40
- if not images:
41
- raise ValueError("Failed to convert PDF to image")
42
  img_byte_arr = BytesIO()
43
- images[0].save(img_byte_arr, format='JPEG')
44
  return base64.b64encode(img_byte_arr.getvalue()).decode('utf-8')
45
 
46
  return base64.b64encode(file_bytes).decode('utf-8')
@@ -89,10 +89,11 @@ def process_document():
89
 
90
  # Generate preview
91
  if uploaded_file.type == "application/pdf":
92
- # Specify the path to poppler binaries
93
- poppler_path = "/usr/bin" # Adjust this path if necessary
94
- images = convert_from_bytes(uploaded_file.getvalue(), first_page=1, last_page=1, poppler_path=poppler_path)
95
- st.session_state.doc_preview = images[0]
 
96
  else:
97
  st.session_state.doc_preview = Image.open(uploaded_file)
98
 
 
3
  import requests
4
  from PIL import Image
5
  from io import BytesIO
6
+ import fitz # PyMuPDF
7
 
8
  # Configuration - Replace with your API key
9
  GEMINI_API_KEY = st.secrets["GEMINI_API_KEY"]
 
34
  file_bytes = uploaded_file.getvalue()
35
 
36
  if uploaded_file.type == "application/pdf":
37
+ # Convert PDF to image using PyMuPDF
38
+ pdf = fitz.open(stream=BytesIO(file_bytes))
39
+ page = pdf[0] # Get the first page
40
+ pix = page.get_pixmap()
41
+ img = Image.frombytes("RGB", [pix.width, pix.height], pix.samples)
42
  img_byte_arr = BytesIO()
43
+ img.save(img_byte_arr, format='JPEG')
44
  return base64.b64encode(img_byte_arr.getvalue()).decode('utf-8')
45
 
46
  return base64.b64encode(file_bytes).decode('utf-8')
 
89
 
90
  # Generate preview
91
  if uploaded_file.type == "application/pdf":
92
+ pdf = fitz.open(stream=BytesIO(uploaded_file.getvalue()))
93
+ page = pdf[0] # Get the first page
94
+ pix = page.get_pixmap()
95
+ img = Image.frombytes("RGB", [pix.width, pix.height], pix.samples)
96
+ st.session_state.doc_preview = img
97
  else:
98
  st.session_state.doc_preview = Image.open(uploaded_file)
99