Spaces:
Sleeping
Sleeping
# Offline pipeline script: load a document corpus, clean it, embed it, fit a
# clustering model on the embeddings, and save that model.
# All helpers are project-local modules; their exact contracts are not visible
# from this script, so the notes below describe only how they are used here.
from data_loader import load_documents
from preprocess import clean_text
from embedder import embed_documents
from fuzzy_cluster import build_gmm_clusters, save_gmm_model

# Step 1: read the raw corpus from the hard-coded dataset directory.
# `labels` is returned by the loader but is not used by any later step here.
print("Loading dataset...")
docs, labels = load_documents("data/20_newsgroups")

# Step 2: normalise each document individually before embedding.
print("Cleaning documents...")
docs = [clean_text(d) for d in docs]

# Step 3: turn the cleaned documents into embeddings in a single call.
print("Generating embeddings...")
embeddings = embed_documents(docs)

# Step 4: fit the clustering model. The helper returns the fitted model and a
# second object exposing `.shape` (printed below).
# NOTE(review): presumably a Gaussian mixture with per-document membership
# probabilities, judging by the helper names -- confirm in fuzzy_cluster.
print("Building fuzzy clusters...")
gmm, cluster_probs = build_gmm_clusters(embeddings)

# Step 5: save the fitted model; the destination is chosen by the helper.
print("Saving clustering model...")
save_gmm_model(gmm)

print("Cluster probabilities shape:", cluster_probs.shape)
print("Fuzzy clustering completed.")