Milad Alshomary
committed on
Commit
·
59c04b5
1
Parent(s):
edc6c74
updates
Browse files
- precompute_caches.py +4 -4
- utils/interp_space_utils.py +1 -1
precompute_caches.py
CHANGED
|
@@ -28,9 +28,9 @@ def precompute_all_caches(
|
|
| 28 |
|
| 29 |
if models_to_test is None:
|
| 30 |
models_to_test = [
|
| 31 |
-
'gabrielloiseau/LUAR-MUD-sentence-transformers',
|
| 32 |
-
'gabrielloiseau/LUAR-CRUD-sentence-transformers',
|
| 33 |
-
'miladalsh/light-luar',
|
| 34 |
'AnnaWegmann/Style-Embedding'
|
| 35 |
]
|
| 36 |
|
|
@@ -194,7 +194,7 @@ from utils.visualizations import visualize_clusters_plotly
|
|
| 194 |
|
| 195 |
if __name__ == "__main__":
|
| 196 |
# Test with a small subset first
|
| 197 |
-
instances=[i for i in range(
|
| 198 |
cache_stats = precompute_all_caches(
|
| 199 |
models_to_test=[
|
| 200 |
'gabrielloiseau/LUAR-MUD-sentence-transformers'
|
|
|
|
| 28 |
|
| 29 |
if models_to_test is None:
|
| 30 |
models_to_test = [
|
| 31 |
+
# 'gabrielloiseau/LUAR-MUD-sentence-transformers',
|
| 32 |
+
# 'gabrielloiseau/LUAR-CRUD-sentence-transformers',
|
| 33 |
+
# 'miladalsh/light-luar',
|
| 34 |
'AnnaWegmann/Style-Embedding'
|
| 35 |
]
|
| 36 |
|
|
|
|
| 194 |
|
| 195 |
if __name__ == "__main__":
|
| 196 |
# Test with a small subset first
|
| 197 |
+
instances=[i for i in range(10)] # First 10 instances for testing
|
| 198 |
cache_stats = precompute_all_caches(
|
| 199 |
models_to_test=[
|
| 200 |
'gabrielloiseau/LUAR-MUD-sentence-transformers'
|
utils/interp_space_utils.py
CHANGED
|
@@ -544,7 +544,7 @@ def compute_clusters_style_representation_3(
|
|
| 544 |
background_corpus_df: pd.DataFrame,
|
| 545 |
cluster_ids: List[Any],
|
| 546 |
cluster_label_clm_name: str = 'authorID',
|
| 547 |
-
max_num_feats: int =
|
| 548 |
max_num_documents_per_author=1,
|
| 549 |
max_num_authors=10,
|
| 550 |
max_authors_for_span_extraction=4,
|
|
|
|
| 544 |
background_corpus_df: pd.DataFrame,
|
| 545 |
cluster_ids: List[Any],
|
| 546 |
cluster_label_clm_name: str = 'authorID',
|
| 547 |
+
max_num_feats: int = 25,
|
| 548 |
max_num_documents_per_author=1,
|
| 549 |
max_num_authors=10,
|
| 550 |
max_authors_for_span_extraction=4,
|