Spaces:
Sleeping
Sleeping
Update src/streamlit_app.py
Browse files- src/streamlit_app.py +6 -1
src/streamlit_app.py
CHANGED
|
@@ -221,7 +221,12 @@ def get_clusters_from_r_matrix(r_matrix):
|
|
| 221 |
# Using default parameters for min_cluster_size and min_samples
|
| 222 |
# These might need tuning based on data characteristics and desired cluster granularity
|
| 223 |
# allow_single_cluster=True prevents an error if all points form one cluster
|
| 224 |
-
clusterer = hdbscan.HDBSCAN(
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 225 |
|
| 226 |
# Fit the model directly to the DataFrame values
|
| 227 |
# HDBSCAN fit expects a numpy array or similar structure
|
|
|
|
| 221 |
# min_cluster_size scales with the data: sqrt(len(r_matrix)), but never below 3; min_samples=None keeps the library default
|
| 222 |
# These might need tuning based on data characteristics and desired cluster granularity
|
| 223 |
# allow_single_cluster=True lets HDBSCAN return a single cluster when all points group together (by default it will not produce a one-cluster result)
|
| 224 |
+
clusterer = hdbscan.HDBSCAN(
|
| 225 |
+
metric=hamming_distance_with_nan,
|
| 226 |
+
allow_single_cluster=True,
|
| 227 |
+
min_cluster_size=max(int(np.sqrt(len(r_matrix))), 3),
|
| 228 |
+
min_samples=None,
|
| 229 |
+
)
|
| 230 |
|
| 231 |
# Fit the model directly to the DataFrame values
|
| 232 |
# HDBSCAN fit expects a numpy array or similar structure
|