sango07 commited on
Commit
5f6d030
·
verified ·
1 Parent(s): cb05a4f

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +187 -0
app.py ADDED
@@ -0,0 +1,187 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import streamlit as st
2
+ import pandas as pd
3
+ import os
4
+ import sqlite3
5
+ from langchain_community.utilities.sql_database import SQLDatabase
6
+ from langchain.chains import create_sql_query_chain
7
+ from langchain_openai import AzureChatOpenAI
8
+ from langchain_community.tools.sql_database.tool import QuerySQLDataBaseTool
9
+ from operator import itemgetter
10
+ from langchain_core.output_parsers import StrOutputParser
11
+ from langchain_core.prompts import PromptTemplate
12
+ from langchain_core.runnables import RunnablePassthrough
13
+ from ydata_profiling import ProfileReport
14
+ import streamlit.components.v1 as components
15
+ import tempfile
16
+ from langchain_openai import ChatOpenAI
17
+
18
+ # Enhanced Page Configuration
19
+ st.set_page_config(
20
+ page_title="Chat with Excel/CSV",
21
+ page_icon=":bar_chart:",
22
+ layout="centered",
23
+ initial_sidebar_state="expanded"
24
+ )
25
+
26
+ # Custom CSS for styling
27
+ st.markdown(
28
+ """
29
+ <style>
30
+ /* Main Layout */
31
+ .main {background-color: white;}
32
+
33
+ /* Sidebar Styling */
34
+ .sidebar .sidebar-content {
35
+ background-color: #F1F5F9;
36
+ color: black;
37
+ }
38
+ .sidebar .sidebar-content .stButton>button, .sidebar .sidebar-content h1, .sidebar .sidebar-content h2 {
39
+ color: #1A202C;
40
+ }
41
+
42
+ /* Gradient Text for Main Greeting */
43
+ .greeting-text {
44
+ font-size: 3em;
45
+ color: transparent;
46
+ background-image: linear-gradient(90deg, #3b82f6, #ec4899);
47
+ -webkit-background-clip: text;
48
+ font-weight: 600;
49
+ text-align: center;
50
+ }
51
+
52
+ /* Chat Input Styling */
53
+ .stTextInput > div > input {
54
+ background-color: #F1F5F9;
55
+ color: #1A202C;
56
+ border-radius: 8px;
57
+ padding: 10px;
58
+ margin-top: 10px;
59
+ width: 100%;
60
+ }
61
+
62
+ /* Button Styling */
63
+ .stButton > button {
64
+ background-color: #3b82f6;
65
+ color: white;
66
+ border: none;
67
+ border-radius: 5px;
68
+ padding: 0.5em 1em;
69
+ font-size: 1em;
70
+ font-weight: 600;
71
+ }
72
+ </style>
73
+ """,
74
+ unsafe_allow_html=True
75
+ )
76
+
77
+ # Function to handle Q&A option
78
+ def code_for_option_1(api_key):
79
+ st.write('<div class="greeting-text">Hello, User!</div>', unsafe_allow_html=True)
80
+ st.sidebar.info("Ask any question about the uploaded Excel or CSV data.")
81
+ st.sidebar.image("https://miro.medium.com/v2/resize:fit:786/format:webp/1*qUFgGhSERoWAa08MV6AVCQ.jpeg", use_column_width=True)
82
+
83
+ uploaded_file = st.file_uploader("Upload Excel or CSV file:", type=["xlsx", "csv"])
84
+
85
+ if uploaded_file is not None:
86
+ # Use temporary file for uploaded content
87
+ with tempfile.NamedTemporaryFile(delete=False) as tmp_file:
88
+ tmp_file.write(uploaded_file.read())
89
+ tmp_file_path = tmp_file.name
90
+
91
+ # Load Excel or CSV file
92
+ if uploaded_file.name.endswith(".xlsx"):
93
+ df = pd.read_excel(tmp_file_path)
94
+ elif uploaded_file.name.endswith(".csv"):
95
+ df = pd.read_csv(tmp_file_path)
96
+
97
+ st.write("### Uploaded Data:")
98
+ st.dataframe(df.head(len(df)))
99
+
100
+ question = st.text_input("Ask a question:")
101
+ submit = st.button("Ask")
102
+
103
+ if submit:
104
+ st.subheader("Answer:")
105
+ st.write("Please wait, answer is generating...")
106
+
107
+ # Initialize OpenAI chat model using the provided API key
108
+ llm_1 = ChatOpenAI(model="gpt-3.5-turbo", temperature=0, openai_api_key=api_key)
109
+
110
+ with sqlite3.connect(f"{uploaded_file.name}.db") as conn:
111
+ df.to_sql(f"{uploaded_file.name}s", conn, if_exists="replace")
112
+ db = SQLDatabase.from_uri(f"sqlite:///{uploaded_file.name}.db")
113
+ generate_query = create_sql_query_chain(llm_1, db)
114
+ execute_query = QuerySQLDataBaseTool(db=db)
115
+
116
+ answer_prompt = PromptTemplate.from_template(
117
+ """Given the following user question, SQL query, and SQL result, answer the question.
118
+
119
+ Question: {question}
120
+ SQL Query: {query}
121
+ SQL Result: {result}
122
+ Answer: """
123
+ )
124
+
125
+ rephrase_answer = answer_prompt | llm_1 | StrOutputParser()
126
+ chain = (
127
+ RunnablePassthrough.assign(query=generate_query)
128
+ .assign(result=itemgetter("query") | execute_query)
129
+ | rephrase_answer
130
+ )
131
+
132
+ response = chain.invoke({"question": question})
133
+ st.subheader(response)
134
+
135
+ # Function to handle EDA option
136
+ def code_for_option_2():
137
+ st.sidebar.image("https://miro.medium.com/v2/resize:fit:702/1*Ra02AqsQlC0KV229EvM98g.png", use_column_width=True)
138
+ st.sidebar.info("Explore insights from the uploaded data.")
139
+
140
+ uploaded_file = st.file_uploader("Upload Excel or CSV file:", type=["xlsx", "csv"])
141
+
142
+ if uploaded_file is not None:
143
+ with tempfile.NamedTemporaryFile(delete=False) as tmp_file:
144
+ tmp_file.write(uploaded_file.read())
145
+ tmp_file_path = tmp_file.name
146
+
147
+ # Load Excel or CSV file
148
+ if uploaded_file.name.endswith(".xlsx"):
149
+ df = pd.read_excel(tmp_file_path)
150
+ elif uploaded_file.name.endswith(".csv"):
151
+ df = pd.read_csv(tmp_file_path)
152
+
153
+ st.write("### Uploaded Data:")
154
+ st.dataframe(df.head(len(df)))
155
+
156
+ st.subheader("Exploratory Data Analysis (EDA):")
157
+ st.write("Please wait, reports are generating...")
158
+ response = ProfileReport(df)
159
+
160
+ response.to_file("data_profile_report.html")
161
+ with open("data_profile_report.html", "r", encoding="utf-8") as f:
162
+ data = f.read()
163
+
164
+ components.html(data, width=800, height=600, scrolling=True)
165
+
166
+ # Main UI layout
167
+ def main():
168
+ st.sidebar.image("https://hashstudioz.com/blog/wp-content/uploads/2023/09/ezgif.com-gif-maker-2.webp", use_column_width=True)
169
+ st.title("DocTalk : Chat with Excel/CSV")
170
+ st.sidebar.title("Options")
171
+ selected_option = st.sidebar.radio("Select an option:", ("Chat with Excel/CSV", "EDA"))
172
+
173
+ # Take user API key input
174
+ api_key = st.sidebar.text_input("Enter OpenAI API Key:", type="password")
175
+
176
+ if api_key:
177
+ if selected_option == "Chat with Excel/CSV":
178
+ code_for_option_1(api_key)
179
+ elif selected_option == "EDA":
180
+ code_for_option_2()
181
+ else:
182
+ st.write("Please select an option.")
183
+ else:
184
+ st.sidebar.warning("Please enter your OpenAI API key to proceed.")
185
+
186
+ if __name__ == "__main__":
187
+ main()