richardkimsm89 committed on
Commit
e174db6
·
verified ·
1 Parent(s): 96281e3

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +52 -5
app.py CHANGED
@@ -1,7 +1,43 @@
1
- # Inference
2
-
3
  import gradio as gr
4
  from huggingface_hub import InferenceClient
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5
 
6
  model_text = "meta-llama/Llama-3.2-3B-Instruct"
7
  model_vision = "meta-llama/Llama-3.2-11B-Vision-Instruct"
@@ -11,12 +47,22 @@ client = InferenceClient()
11
  def fn_text(
12
  prompt,
13
  history,
14
- system_prompt,
 
15
  max_tokens,
16
  temperature,
17
  top_p,
18
  ):
19
- messages = [{"role": "system", "content": [{"type": "text", "text": system_prompt}]}]
 
 
 
 
 
 
 
 
 
20
  history.append(messages[0])
21
 
22
  messages.append({"role": "user", "content": [{"type": "text", "text": prompt}]})
@@ -40,7 +86,8 @@ app_text = gr.ChatInterface(
40
  fn = fn_text,
41
  type = "messages",
42
  additional_inputs = [
43
- gr.Textbox(value="You are a helpful assistant.", label="System Prompt"),
 
44
  gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max Tokens"),
45
  gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
46
  gr.Slider(minimum=0.1, maximum=1.0, value=0.95, step=0.05, label="Top-P"),
 
 
 
1
  import gradio as gr
2
  from huggingface_hub import InferenceClient
3
+ import pytesseract
4
+ from PIL import Image
5
+ from pypdf import PdfReader
6
+ import ocrmypdf
7
+ import os
8
+
9
+ # Image to Text
10
+
11
+ def fn_image_to_text(input_image):
12
+ return pytesseract.image_to_string(Image.open(input_image))
13
+
14
+ # PDF to Text
15
+
16
+ def fn_pdf_to_text(input_pdf):
17
+ reader = PdfReader(input_pdf)
18
+
19
+ output_pdf = ""
20
+ for page in reader.pages:
21
+ output_pdf+=page.extract_text()
22
+
23
+ image_count = 0
24
+ for page in reader.pages:
25
+ image_count += len(page.images)
26
+
27
+ if image_count > 0 and len(output_pdf) < 1000:
28
+ input_pdf_ocr = input_pdf.replace(".pdf", " - OCR.pdf")
29
+ ocrmypdf.ocr(input_pdf, input_pdf_ocr, force_ocr=True)
30
+
31
+ reader = PdfReader(input_pdf_ocr)
32
+ output_pdf = ""
33
+ for page in reader.pages:
34
+ output_pdf+=page.extract_text()
35
+
36
+ os.remove(input_pdf_ocr)
37
+
38
+ return output_pdf
39
+
40
+ # Inference
41
 
42
  model_text = "meta-llama/Llama-3.2-3B-Instruct"
43
  model_vision = "meta-llama/Llama-3.2-11B-Vision-Instruct"
 
47
  def fn_text(
48
  prompt,
49
  history,
50
+ input,
51
+ #system_prompt,
52
  max_tokens,
53
  temperature,
54
  top_p,
55
  ):
56
+ if input:
57
+ if os.path.splitext(input)[1].lower() in [".png", ".jpg", ".jpeg"]:
58
+ output = fn_image_to_text(input)
59
+ if os.path.splitext(input)[1].lower() == ".pdf":
60
+ output = fn_pdf_to_text(input)
61
+ else:
62
+ output = ""
63
+
64
+ messages = [{"role": "system", "content": [{"type": "text", "text": output}]}]
65
+ #messages = [{"role": "system", "content": [{"type": "text", "text": system_prompt}]}]
66
  history.append(messages[0])
67
 
68
  messages.append({"role": "user", "content": [{"type": "text", "text": prompt}]})
 
86
  fn = fn_text,
87
  type = "messages",
88
  additional_inputs = [
89
+ gr.File(type="filepath", label="Input"),
90
+ #gr.Textbox(value="You are a helpful assistant.", label="System Prompt"),
91
  gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max Tokens"),
92
  gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
93
  gr.Slider(minimum=0.1, maximum=1.0, value=0.95, step=0.05, label="Top-P"),