Update app.py
Browse files
app.py
CHANGED
|
@@ -8,6 +8,9 @@ import matplotlib.pyplot as plt
|
|
| 8 |
from collections import defaultdict, Counter
|
| 9 |
import base64
|
| 10 |
from sklearn.manifold import MDS
|
|
|
|
|
|
|
|
|
|
| 11 |
import networkx as nx
|
| 12 |
|
| 13 |
# Set page configuration
|
|
@@ -437,7 +440,7 @@ if uploaded_file is not None:
|
|
| 437 |
# Feature Extraction
|
| 438 |
all_words = set(word for folio in folio_word_map for word in folio_word_map[folio])
|
| 439 |
word_freq_matrix = pd.DataFrame(index=folio_word_map.keys(), columns=list(all_words), data=0) # Convert set to list
|
| 440 |
-
|
| 441 |
for folio, word_counter in folio_word_map.items():
|
| 442 |
for word, count in word_counter.items():
|
| 443 |
word_freq_matrix.loc[folio, word] = count
|
|
|
|
| 8 |
from collections import defaultdict, Counter
|
| 9 |
import base64
|
| 10 |
from sklearn.manifold import MDS
|
| 11 |
+
from sklearn.decomposition import PCA
|
| 12 |
+
from sklearn.manifold import TSNE
|
| 13 |
+
from sklearn.cluster import KMeans
|
| 14 |
import networkx as nx
|
| 15 |
|
| 16 |
# Set page configuration
|
|
|
|
| 440 |
# Feature Extraction
|
| 441 |
all_words = set(word for folio in folio_word_map for word in folio_word_map[folio])
|
| 442 |
word_freq_matrix = pd.DataFrame(index=folio_word_map.keys(), columns=list(all_words), data=0) # Convert set to list
|
| 443 |
+
|
| 444 |
for folio, word_counter in folio_word_map.items():
|
| 445 |
for word, count in word_counter.items():
|
| 446 |
word_freq_matrix.loc[folio, word] = count
|