Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -175,54 +175,6 @@ if st.session_state.df is None:
|
|
| 175 |
except Exception as e:
|
| 176 |
st.error(f"Error loading the file: {e}")
|
| 177 |
|
| 178 |
-
# Select
|
| 179 |
-
elif uploading_way == "select":
|
| 180 |
-
selected = st.selectbox("Select Dataset", ["Select", "Titanic Dataset","Iris Dataset", "Wine Dataset",
|
| 181 |
-
"Diabetes Dataset", "Digits Dataset",
|
| 182 |
-
"Olivetti Faces Dataset", "California Housing Dataset",
|
| 183 |
-
"Covid-19 Dataset"])
|
| 184 |
-
|
| 185 |
-
|
| 186 |
-
if selected == "Iris Dataset":
|
| 187 |
-
from sklearn.datasets import load_iris
|
| 188 |
-
iris = load_iris()
|
| 189 |
-
df = pd.DataFrame(iris.data, columns=iris.feature_names)
|
| 190 |
-
df['target'] = iris.target
|
| 191 |
-
st.session_state.df = df
|
| 192 |
-
|
| 193 |
-
elif selected == "Wine Dataset":
|
| 194 |
-
from sklearn.datasets import load_wine
|
| 195 |
-
wine = load_wine()
|
| 196 |
-
df = pd.DataFrame(wine.data, columns=wine.feature_names)
|
| 197 |
-
df['target'] = wine.target
|
| 198 |
-
st.session_state.df = df
|
| 199 |
-
|
| 200 |
-
|
| 201 |
-
elif selected == "Digits Dataset":
|
| 202 |
-
from sklearn.datasets import load_digits
|
| 203 |
-
digits = load_digits()
|
| 204 |
-
df = pd.DataFrame(digits.data, columns=digits.feature_names)
|
| 205 |
-
df['target'] = digits.target
|
| 206 |
-
st.session_state.df = df
|
| 207 |
-
|
| 208 |
-
elif selected == "Olivetti Faces Dataset":
|
| 209 |
-
from sklearn.datasets import fetch_olivetti_faces
|
| 210 |
-
olivetti = fetch_olivetti_faces()
|
| 211 |
-
df = pd.DataFrame(olivetti.data)
|
| 212 |
-
df['target'] = olivetti.target
|
| 213 |
-
st.session_state.df = df
|
| 214 |
-
|
| 215 |
-
elif selected == "California Housing Dataset":
|
| 216 |
-
from sklearn.datasets import fetch_california_housing
|
| 217 |
-
california = fetch_california_housing()
|
| 218 |
-
df = pd.DataFrame(california.data, columns=california.feature_names)
|
| 219 |
-
df['target'] = california.target
|
| 220 |
-
st.session_state.df = df
|
| 221 |
-
|
| 222 |
-
elif selected == "Covid-19 Dataset":
|
| 223 |
-
df = load_data("https://raw.githubusercontent.com/owid/covid-19-data/master/public/data/owid-covid-data.csv")
|
| 224 |
-
st.session_state.df = df
|
| 225 |
-
|
| 226 |
# URL
|
| 227 |
elif uploading_way == "url":
|
| 228 |
url = st.text_input("Enter URL")
|
|
@@ -530,21 +482,17 @@ df.drop(columns={col_to_delete}, inplace=True)
|
|
| 530 |
new_line()
|
| 531 |
if st.checkbox("Show Word Cloud", value=False):
|
| 532 |
text_col = st.selectbox("Select Text Column for Word Cloud", options=df.select_dtypes(include=[np.object]).columns.tolist())
|
| 533 |
-
text_data = ' '.join(df[text_col].dropna())
|
| 534 |
-
|
| 535 |
-
|
| 536 |
-
|
| 537 |
-
|
| 538 |
-
|
| 539 |
-
|
|
|
|
|
|
|
|
|
|
| 540 |
|
| 541 |
-
new_line()
|
| 542 |
-
if st.checkbox("Show Text Statistics", value=False):
|
| 543 |
-
text_col = st.selectbox("Select Text Column for Statistics", options=df.select_dtypes(include=[np.object]).columns.tolist())
|
| 544 |
-
text_stats = df[text_col].dropna().apply(lambda x: {'length': len(x), 'word_count': len(x.split())})
|
| 545 |
-
text_stats_df = pd.DataFrame(list(text_stats))
|
| 546 |
-
st.write(text_stats_df.describe())
|
| 547 |
-
new_line()
|
| 548 |
|
| 549 |
|
| 550 |
new_line()
|
|
|
|
| 175 |
except Exception as e:
|
| 176 |
st.error(f"Error loading the file: {e}")
|
| 177 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 178 |
# URL
|
| 179 |
elif uploading_way == "url":
|
| 180 |
url = st.text_input("Enter URL")
|
|
|
|
| 482 |
new_line()
|
| 483 |
if st.checkbox("Show Word Cloud", value=False):
|
| 484 |
text_col = st.selectbox("Select Text Column for Word Cloud", options=df.select_dtypes(include=[np.object]).columns.tolist())
|
| 485 |
+
text_data = ' '.join(df[text_col].dropna()).strip() # Collect and strip the text data
|
| 486 |
+
|
| 487 |
+
if text_data: # Check if there is any text data
|
| 488 |
+
wordcloud = WordCloud(width=800, height=400).generate(text_data)
|
| 489 |
+
fig, ax = plt.subplots()
|
| 490 |
+
ax.imshow(wordcloud, interpolation='bilinear')
|
| 491 |
+
ax.axis('off')
|
| 492 |
+
st.pyplot(fig)
|
| 493 |
+
else:
|
| 494 |
+
st.write("No words available to create a word cloud.")
|
| 495 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 496 |
|
| 497 |
|
| 498 |
new_line()
|