Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -175,54 +175,6 @@ if st.session_state.df is None:
|
|
175 |
except Exception as e:
|
176 |
st.error(f"Error loading the file: {e}")
|
177 |
|
178 |
-
# Select
|
179 |
-
elif uploading_way == "select":
|
180 |
-
selected = st.selectbox("Select Dataset", ["Select", "Titanic Dataset","Iris Dataset", "Wine Dataset",
|
181 |
-
"Diabetes Dataset", "Digits Dataset",
|
182 |
-
"Olivetti Faces Dataset", "California Housing Dataset",
|
183 |
-
"Covid-19 Dataset"])
|
184 |
-
|
185 |
-
|
186 |
-
if selected == "Iris Dataset":
|
187 |
-
from sklearn.datasets import load_iris
|
188 |
-
iris = load_iris()
|
189 |
-
df = pd.DataFrame(iris.data, columns=iris.feature_names)
|
190 |
-
df['target'] = iris.target
|
191 |
-
st.session_state.df = df
|
192 |
-
|
193 |
-
elif selected == "Wine Dataset":
|
194 |
-
from sklearn.datasets import load_wine
|
195 |
-
wine = load_wine()
|
196 |
-
df = pd.DataFrame(wine.data, columns=wine.feature_names)
|
197 |
-
df['target'] = wine.target
|
198 |
-
st.session_state.df = df
|
199 |
-
|
200 |
-
|
201 |
-
elif selected == "Digits Dataset":
|
202 |
-
from sklearn.datasets import load_digits
|
203 |
-
digits = load_digits()
|
204 |
-
df = pd.DataFrame(digits.data, columns=digits.feature_names)
|
205 |
-
df['target'] = digits.target
|
206 |
-
st.session_state.df = df
|
207 |
-
|
208 |
-
elif selected == "Olivetti Faces Dataset":
|
209 |
-
from sklearn.datasets import fetch_olivetti_faces
|
210 |
-
olivetti = fetch_olivetti_faces()
|
211 |
-
df = pd.DataFrame(olivetti.data)
|
212 |
-
df['target'] = olivetti.target
|
213 |
-
st.session_state.df = df
|
214 |
-
|
215 |
-
elif selected == "California Housing Dataset":
|
216 |
-
from sklearn.datasets import fetch_california_housing
|
217 |
-
california = fetch_california_housing()
|
218 |
-
df = pd.DataFrame(california.data, columns=california.feature_names)
|
219 |
-
df['target'] = california.target
|
220 |
-
st.session_state.df = df
|
221 |
-
|
222 |
-
elif selected == "Covid-19 Dataset":
|
223 |
-
df = load_data("https://raw.githubusercontent.com/owid/covid-19-data/master/public/data/owid-covid-data.csv")
|
224 |
-
st.session_state.df = df
|
225 |
-
|
226 |
# URL
|
227 |
elif uploading_way == "url":
|
228 |
url = st.text_input("Enter URL")
|
@@ -530,21 +482,17 @@ df.drop(columns={col_to_delete}, inplace=True)
|
|
530 |
new_line()
|
531 |
if st.checkbox("Show Word Cloud", value=False):
|
532 |
text_col = st.selectbox("Select Text Column for Word Cloud", options=df.select_dtypes(include=[np.object]).columns.tolist())
|
533 |
-
text_data = ' '.join(df[text_col].dropna())
|
534 |
-
|
535 |
-
|
536 |
-
|
537 |
-
|
538 |
-
|
539 |
-
|
|
|
|
|
|
|
540 |
|
541 |
-
new_line()
|
542 |
-
if st.checkbox("Show Text Statistics", value=False):
|
543 |
-
text_col = st.selectbox("Select Text Column for Statistics", options=df.select_dtypes(include=[np.object]).columns.tolist())
|
544 |
-
text_stats = df[text_col].dropna().apply(lambda x: {'length': len(x), 'word_count': len(x.split())})
|
545 |
-
text_stats_df = pd.DataFrame(list(text_stats))
|
546 |
-
st.write(text_stats_df.describe())
|
547 |
-
new_line()
|
548 |
|
549 |
|
550 |
new_line()
|
|
|
175 |
except Exception as e:
|
176 |
st.error(f"Error loading the file: {e}")
|
177 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
178 |
# URL
|
179 |
elif uploading_way == "url":
|
180 |
url = st.text_input("Enter URL")
|
|
|
482 |
new_line()
|
483 |
if st.checkbox("Show Word Cloud", value=False):
|
484 |
text_col = st.selectbox("Select Text Column for Word Cloud", options=df.select_dtypes(include=[np.object]).columns.tolist())
|
485 |
+
text_data = ' '.join(df[text_col].dropna()).strip() # Collect and strip the text data
|
486 |
+
|
487 |
+
if text_data: # Check if there is any text data
|
488 |
+
wordcloud = WordCloud(width=800, height=400).generate(text_data)
|
489 |
+
fig, ax = plt.subplots()
|
490 |
+
ax.imshow(wordcloud, interpolation='bilinear')
|
491 |
+
ax.axis('off')
|
492 |
+
st.pyplot(fig)
|
493 |
+
else:
|
494 |
+
st.write("No words available to create a word cloud.")
|
495 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
496 |
|
497 |
|
498 |
new_line()
|