Spaces:

Rathapoom
/

Llama-3-Typhoon-1.5X-70B-instruct-awq-Modztest

Build error

Rathapoom committed on Aug 1, 2024

Commit

87cdd83

verified ·

1 Parent(s): 09ec353

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -3,8 +3,7 @@ import torch
 from transformers import AutoTokenizer, AutoModelForCausalLM
 from PyPDF2 import PdfReader
 import gradio as gr
-from datasets import Dataset, load_from_disk, save_to_disk
-import faiss
 # Extract text from PDF
 def extract_text_from_pdf(pdf_path):
@@ -21,15 +20,16 @@ tokenizer = AutoTokenizer.from_pretrained(model_name)
 model = AutoModelForCausalLM.from_pretrained(model_name)
 # Extract text from the provided PDF
-pdf_text = extract_text_from_pdf("TOPF 2564.pdf")  # Updated path
 passages = [{"title": "", "text": line} for line in pdf_text.split('\n') if line.strip()]
 # Create a Dataset
 dataset = Dataset.from_list(passages)
 # Save the dataset and create an index in the current working directory
-dataset_path = "./rag_document_dataset"
-index_path = "./rag_document_index"
 # Ensure the directory exists
 os.makedirs(dataset_path, exist_ok=True)

 from transformers import AutoTokenizer, AutoModelForCausalLM
 from PyPDF2 import PdfReader
 import gradio as gr
+from datasets import Dataset, load_from_disk
 # Extract text from PDF
 def extract_text_from_pdf(pdf_path):
 model = AutoModelForCausalLM.from_pretrained(model_name)
 # Extract text from the provided PDF
+pdf_path = "/home/user/app/TOPF 2564.pdf"  # Ensure this path is correct
+pdf_text = extract_text_from_pdf(pdf_path)
 passages = [{"title": "", "text": line} for line in pdf_text.split('\n') if line.strip()]
 # Create a Dataset
 dataset = Dataset.from_list(passages)
 # Save the dataset and create an index in the current working directory
+dataset_path = "/home/user/app/rag_document_dataset"
+index_path = "/home/user/app/rag_document_index"
 # Ensure the directory exists
 os.makedirs(dataset_path, exist_ok=True)