Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -3,7 +3,8 @@ import streamlit as st
|
|
| 3 |
from difflib import SequenceMatcher
|
| 4 |
from sklearn.feature_extraction.text import TfidfVectorizer
|
| 5 |
from sklearn.metrics.pairwise import cosine_similarity
|
| 6 |
-
from Levenshtein import distance as
|
|
|
|
| 7 |
|
| 8 |
|
| 9 |
ms = st.session_state
|
|
@@ -98,7 +99,13 @@ def find_similar_texts(df1, df2, column_name, threshold=0.3):
|
|
| 98 |
|
| 99 |
return similar_texts, exact_matches
|
| 100 |
|
| 101 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 102 |
|
| 103 |
|
| 104 |
def main():
|
|
@@ -154,6 +161,19 @@ def main():
|
|
| 154 |
st.write(f"____________________")
|
| 155 |
st.write()
|
| 156 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 157 |
|
| 158 |
if __name__ == "__main__":
|
| 159 |
main()
|
|
|
|
| 3 |
from difflib import SequenceMatcher
|
| 4 |
from sklearn.feature_extraction.text import TfidfVectorizer
|
| 5 |
from sklearn.metrics.pairwise import cosine_similarity
|
| 6 |
+
from Levenshtein import distance as
|
| 7 |
+
import matplotlib.pyplot as plt
|
| 8 |
|
| 9 |
|
| 10 |
ms = st.session_state
|
|
|
|
| 99 |
|
| 100 |
return similar_texts, exact_matches
|
| 101 |
|
| 102 |
+
def plot_correlation(df, column):
    """Render a scatter plot of ``df[column]`` against ``df.index`` in Streamlit.

    Args:
        df: Table-like object exposing ``.index`` and ``df[column]``
            (presumably a pandas DataFrame -- confirm against the caller).
        column: Name of the column whose values are plotted on the y-axis.

    Returns:
        None. The figure is drawn into the Streamlit app as a side effect.
    """
    # Build an explicit Figure/Axes pair instead of drawing on pyplot's
    # implicit global figure: calling ``st.pyplot()`` with no argument is
    # deprecated by Streamlit and is not safe when several sessions render
    # concurrently.
    fig, ax = plt.subplots(figsize=(8, 6))
    try:
        ax.scatter(df.index, df[column])
        ax.set_xlabel("Index")
        ax.set_ylabel(column)
        ax.set_title(f"Correlation Plot of {column}")
        st.pyplot(fig)
    finally:
        # Streamlit reruns the script on every interaction; close the figure
        # so pyplot's registry does not accumulate one figure per rerun.
        plt.close(fig)
|
| 109 |
|
| 110 |
|
| 111 |
def main():
|
|
|
|
| 161 |
st.write(f"____________________")
|
| 162 |
st.write()
|
| 163 |
|
| 164 |
+
# Calculate correlation
|
| 165 |
+
if warehouse_df[warehouse_column].dtype != "object" and industry_df[industry_column].dtype != "object":
|
| 166 |
+
correlation = warehouse_df[warehouse_column].corr(industry_df[industry_column])
|
| 167 |
+
st.header("Correlation")
|
| 168 |
+
st.write(f"The correlation between {warehouse_column} in warehouse item stocks and {industry_column} in industry item stocks is: {correlation}")
|
| 169 |
+
|
| 170 |
+
# Show correlation plot for each dataset
|
| 171 |
+
if st.button("Show for each dataset"):
|
| 172 |
+
st.subheader("Correlation Plot for Warehouse Dataset")
|
| 173 |
+
plot_correlation(warehouse_df, warehouse_column)
|
| 174 |
+
|
| 175 |
+
st.subheader("Correlation Plot for Industry Dataset")
|
| 176 |
+
plot_correlation(industry_df, industry_column)
|
| 177 |
|
| 178 |
if __name__ == "__main__":
|
| 179 |
main()
|