Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -9,6 +9,7 @@ import os
|
|
9 |
os.environ['OPENAI_API_KEY'] = os.environ['OPEN_API_KEY']
|
10 |
st.title("Contracts Multiple File Search ")
|
11 |
import pandas as pd
|
|
|
12 |
|
13 |
from langchain.retrievers import BM25Retriever, EnsembleRetriever
|
14 |
from langchain.schema import Document
|
@@ -19,7 +20,7 @@ from FlagEmbedding import FlagReranker
|
|
19 |
reranker = FlagReranker('BAAI/bge-reranker-base')
|
20 |
import spacy
|
21 |
# Load the English model from SpaCy
|
22 |
-
nlp = spacy.load("
|
23 |
|
24 |
def util_upload_file_and_return_list_docs(uploaded_files):
|
25 |
#util_del_cwd()
|
@@ -180,7 +181,7 @@ def util_openai_extract_clause(example_prompt, page_content):
|
|
180 |
openai.api_key = os.environ['OPENAI_API_KEY']
|
181 |
content = example_prompt
|
182 |
content = content + "\n Answer precisely; do not add anything extra, and try to locate the answer in the below context \n context: "
|
183 |
-
return_value = openai.ChatCompletion.create(model="gpt-
|
184 |
return(str(return_value['choices'][0]['message']['content']))
|
185 |
|
186 |
|
@@ -188,7 +189,7 @@ def util_openai_hyde(example_prompt):
|
|
188 |
import openai
|
189 |
openai.api_key = os.environ['OPENAI_API_KEY']
|
190 |
content = example_prompt
|
191 |
-
return_value = openai.ChatCompletion.create(model="gpt-
|
192 |
{"role": "system", "content": "You are a legal contract lawyer. generate a summary from below text " + "\n"},
|
193 |
{"role": "user", "content": example_prompt + "\n"},
|
194 |
|
@@ -216,7 +217,7 @@ def util_openai_modify_prompt(example_prompt, page_content):
|
|
216 |
openai.api_key = os.environ['OPENAI_API_KEY']
|
217 |
my_prompt = """Expand the original Query to show exact resuls for extraction\n
|
218 |
Query: """ + example_prompt # + """\nDocument: """ + page_content + """ """
|
219 |
-
return_value = openai.ChatCompletion.create(model="gpt-
|
220 |
return(str(return_value['choices'][0]['message']['content']))
|
221 |
|
222 |
# def create_bm25_page_rank(page_list_retrieve, page_query):
|
@@ -273,6 +274,7 @@ with st.form("my_form"):
|
|
273 |
ensemble_retriever = EnsembleRetriever(retrievers=[bm25_retriever, chroma_retriever],weights=[0.25, 0.75])
|
274 |
passage_nodes = ensemble_retriever.get_relevant_documents(single_example_passage)
|
275 |
print('len(passage_nodes):', len(passage_nodes))
|
|
|
276 |
df = util_get_list_pageno_and_contents(single_example_passage,passage_documents,passage_nodes)
|
277 |
st.write(df)
|
278 |
# print('len(page_list_retrieve):', len(page_list_retrieve))
|
|
|
9 |
os.environ['OPENAI_API_KEY'] = os.environ['OPEN_API_KEY']
|
10 |
st.title("Contracts Multiple File Search ")
|
11 |
import pandas as pd
|
12 |
+
import time
|
13 |
|
14 |
from langchain.retrievers import BM25Retriever, EnsembleRetriever
|
15 |
from langchain.schema import Document
|
|
|
20 |
reranker = FlagReranker('BAAI/bge-reranker-base')
|
21 |
import spacy
|
22 |
# Load the English model from SpaCy
|
23 |
+
nlp = spacy.load("en_core_web_sm")
|
24 |
|
25 |
def util_upload_file_and_return_list_docs(uploaded_files):
|
26 |
#util_del_cwd()
|
|
|
181 |
openai.api_key = os.environ['OPENAI_API_KEY']
|
182 |
content = example_prompt
|
183 |
content = content + "\n Answer precisely; do not add anything extra, and try to locate the answer in the below context \n context: "
|
184 |
+
return_value = openai.ChatCompletion.create(model="gpt-4o-mini",temperature=0.0001,messages=[{"role": "user", "content": content + "\n" + page_content},])
|
185 |
return(str(return_value['choices'][0]['message']['content']))
|
186 |
|
187 |
|
|
|
189 |
import openai
|
190 |
openai.api_key = os.environ['OPENAI_API_KEY']
|
191 |
content = example_prompt
|
192 |
+
return_value = openai.ChatCompletion.create(model="gpt-4o-mini",temperature=0.0001,messages=[
|
193 |
{"role": "system", "content": "You are a legal contract lawyer. generate a summary from below text " + "\n"},
|
194 |
{"role": "user", "content": example_prompt + "\n"},
|
195 |
|
|
|
217 |
openai.api_key = os.environ['OPENAI_API_KEY']
|
218 |
my_prompt = """Expand the original Query to show exact resuls for extraction\n
|
219 |
Query: """ + example_prompt # + """\nDocument: """ + page_content + """ """
|
220 |
+
return_value = openai.ChatCompletion.create(model="gpt-4o-mini",temperature=0.0001,messages=[{"role": "user", "content": my_prompt},])
|
221 |
return(str(return_value['choices'][0]['message']['content']))
|
222 |
|
223 |
# def create_bm25_page_rank(page_list_retrieve, page_query):
|
|
|
274 |
ensemble_retriever = EnsembleRetriever(retrievers=[bm25_retriever, chroma_retriever],weights=[0.25, 0.75])
|
275 |
passage_nodes = ensemble_retriever.get_relevant_documents(single_example_passage)
|
276 |
print('len(passage_nodes):', len(passage_nodes))
|
277 |
+
time.sleep(5)
|
278 |
df = util_get_list_pageno_and_contents(single_example_passage,passage_documents,passage_nodes)
|
279 |
st.write(df)
|
280 |
# print('len(page_list_retrieve):', len(page_list_retrieve))
|