diff --git "a/data/pr_scope_clusters.json" "b/data/pr_scope_clusters.json" --- "a/data/pr_scope_clusters.json" +++ "b/data/pr_scope_clusters.json" @@ -1 +1,4178 @@ -[] +[ + { + "authors": [ + "DogWala", + "aarushisingh04", + "cyyever", + "excepshenal", + "vasanthrpjan1-boop", + "winglian" + ], + "average_similarity": 0.426, + "cluster_id": "pr-scope-43636-10", + "kind": "pr_scope", + "last_activity_at": "2026-04-09T15:32:29Z", + "outside_window_prs": [ + { + "additions": 11, + "author": "abigailtech", + "changed_files": 1, + "created_at": "2026-01-30T21:53:43Z", + "deletions": 0, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/43636/files", + "html_url": "https://github.com/huggingface/transformers/pull/43636", + "merged": false, + "number": 43636, + "state": "open", + "title": "Add _metrics dict to Trainer for custom metric logging", + "updated_at": "2026-03-13T22:22:03Z" + }, + { + "additions": 13, + "author": "abigailtech", + "changed_files": 1, + "created_at": "2026-01-31T17:51:42Z", + "deletions": 5, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/43651/files", + "html_url": "https://github.com/huggingface/transformers/pull/43651", + "merged": false, + "number": 43651, + "state": "open", + "title": "Add _loss_is_scaled_for_ga to allow custom trainers to control gradient accumulation loss scaling", + "updated_at": "2026-03-13T22:28:27Z" + }, + { + "additions": 13, + "author": "abigailtech", + "changed_files": 1, + "created_at": "2026-01-31T21:34:03Z", + "deletions": 12, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/43663/files", + "html_url": "https://github.com/huggingface/transformers/pull/43663", + "merged": false, + "number": 43663, + "state": "open", + "title": "Add _get_signature_columns method to allow custom trainers to override column filtering", + "updated_at": "2026-02-03T13:32:17Z" + } + ], + "pairwise": [ + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.86, + "left_pr_number": 44189, + "right_pr_number": 45067, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.776, + "size_similarity": 0.16 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.464, + "left_pr_number": 43663, + "right_pr_number": 45067, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.625, + "size_similarity": 1.0 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.418, + "left_pr_number": 43651, + "right_pr_number": 43663, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.55, + "size_similarity": 0.72 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.378, + "left_pr_number": 43651, + "right_pr_number": 45067, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.522, + "size_similarity": 0.72 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.414, + "left_pr_number": 43663, + "right_pr_number": 44123, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.508, + "size_similarity": 0.455 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.28, + "left_pr_number": 44257, + "right_pr_number": 44660, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.496, + "size_similarity": 1.0 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.374, + "left_pr_number": 44123, + "right_pr_number": 45067, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.48, + "size_similarity": 0.455 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.409, + "left_pr_number": 43663, + "right_pr_number": 44660, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.472, + "size_similarity": 0.24 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.315, + "left_pr_number": 44189, + "right_pr_number": 44660, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.47, + "size_similarity": 0.667 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.35, + "left_pr_number": 43636, + "right_pr_number": 43663, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.461, + "size_similarity": 0.44 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.395, + "left_pr_number": 43663, + "right_pr_number": 44189, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.451, + "size_similarity": 0.16 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.263, + "left_pr_number": 44189, + "right_pr_number": 45055, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.447, + "size_similarity": 0.75 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.37, + "left_pr_number": 44660, + "right_pr_number": 45067, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.445, + "size_similarity": 0.24 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.284, + "left_pr_number": 43636, + "right_pr_number": 43651, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.441, + "size_similarity": 0.611 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.27, + "left_pr_number": 44189, + "right_pr_number": 44257, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.439, + "size_similarity": 0.667 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.316, + "left_pr_number": 43636, + "right_pr_number": 45067, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.437, + "size_similarity": 0.44 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.336, + "left_pr_number": 43651, + "right_pr_number": 44123, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.435, + "size_similarity": 0.327 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.333, + "left_pr_number": 43651, + "right_pr_number": 44660, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.433, + "size_similarity": 0.333 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.351, + "left_pr_number": 43663, + "right_pr_number": 44257, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.432, + "size_similarity": 0.24 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.278, + "left_pr_number": 43636, + "right_pr_number": 44660, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.427, + "size_similarity": 0.545 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.273, + "left_pr_number": 44660, + "right_pr_number": 45055, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.416, + "size_similarity": 0.5 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.321, + "left_pr_number": 43651, + "right_pr_number": 44189, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.408, + "size_similarity": 0.222 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.342, + "left_pr_number": 43663, + "right_pr_number": 45055, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.408, + "size_similarity": 0.12 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.317, + "left_pr_number": 44257, + "right_pr_number": 45067, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.408, + "size_similarity": 0.24 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.286, + "left_pr_number": 43651, + "right_pr_number": 44257, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.4, + "size_similarity": 0.333 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.239, + "left_pr_number": 43636, + "right_pr_number": 44257, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.399, + "size_similarity": 0.545 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.33, + "left_pr_number": 44123, + "right_pr_number": 44660, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.397, + "size_similarity": 0.109 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.269, + "left_pr_number": 43636, + "right_pr_number": 44189, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.393, + "size_similarity": 0.364 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.203, + "left_pr_number": 45055, + "right_pr_number": 45273, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.392, + "size_similarity": 0.667 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.235, + "left_pr_number": 44189, + "right_pr_number": 45273, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.389, + "size_similarity": 0.5 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.234, + "left_pr_number": 44257, + "right_pr_number": 45055, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.389, + "size_similarity": 0.5 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.309, + "left_pr_number": 45055, + "right_pr_number": 45067, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.385, + "size_similarity": 0.12 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.318, + "left_pr_number": 44123, + "right_pr_number": 44189, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.384, + "size_similarity": 0.073 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.282, + "left_pr_number": 43636, + "right_pr_number": 44123, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.377, + "size_similarity": 0.2 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.305, + "left_pr_number": 43663, + "right_pr_number": 45273, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.376, + "size_similarity": 0.08 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.278, + "left_pr_number": 43651, + "right_pr_number": 45055, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.37, + "size_similarity": 0.167 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.243, + "left_pr_number": 44660, + "right_pr_number": 45273, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.37, + "size_similarity": 0.333 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.283, + "left_pr_number": 44123, + "right_pr_number": 44257, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.364, + "size_similarity": 0.109 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.276, + "left_pr_number": 45067, + "right_pr_number": 45273, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.355, + "size_similarity": 0.08 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.233, + "left_pr_number": 43636, + "right_pr_number": 45055, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.354, + "size_similarity": 0.273 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.276, + "left_pr_number": 44123, + "right_pr_number": 45055, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.351, + "size_similarity": 0.055 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.209, + "left_pr_number": 44257, + "right_pr_number": 45273, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.346, + "size_similarity": 0.333 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.248, + "left_pr_number": 43651, + "right_pr_number": 45273, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.34, + "size_similarity": 0.111 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.246, + "left_pr_number": 44123, + "right_pr_number": 45273, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.328, + "size_similarity": 0.036 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.208, + "left_pr_number": 43636, + "right_pr_number": 45273, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.323, + "size_similarity": 0.182 + } + ], + "pr_count": 10, + "pr_numbers": [ + 43636, + 43651, + 43663, + 44123, + 44189, + 44257, + 44660, + 45055, + 45067, + 45273 + ], + "recent_pr_count": 7, + "recent_pr_numbers": [ + 44123, + 44189, + 44257, + 44660, + 45055, + 45067, + 45273 + ], + "representative_pr_number": 45067, + "representative_title": "feat: trainer resume_from_checkpoint support hub downloads (#43375)", + "representative_url": "https://github.com/huggingface/transformers/pull/45067", + "shared_directories": [], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "summary": "10 open PRs share weighted file overlap around `src/transformers/trainer.py`; representative PR #45067.", + "title": "Scope: feat: trainer resume_from_checkpoint support hub downloads (#43375)" + }, + { + "authors": [ + "UsamaKenway", + "jIab-b", + "rudybear", + "sirzechs66" + ], + "average_similarity": 0.664, + "cluster_id": "pr-scope-44070-4", + "kind": "pr_scope", + "last_activity_at": "2026-04-15T13:54:59Z", + "outside_window_prs": [], + "pairwise": [ + { + "breadth_similarity": 1.0, + "concentration_similarity": 0.932, + "content_similarity": 0.893, + "left_pr_number": 44070, + "right_pr_number": 45296, + "shared_directories": [ + "src/transformers/integrations", + "tests/quantization/ggml", + "src/transformers", + "tests/quantization", + "src", + "tests" + ], + "shared_filenames": [ + "src/transformers/integrations/ggml.py", + "src/transformers/modeling_gguf_pytorch_utils.py", + "tests/quantization/ggml/test_ggml.py" + ], + "similarity": 0.877, + "size_similarity": 0.702 + }, + { + "breadth_similarity": 0.75, + "concentration_similarity": 0.775, + "content_similarity": 0.613, + "left_pr_number": 44070, + "right_pr_number": 45118, + "shared_directories": [ + "src/transformers/integrations", + "tests/quantization/ggml", + "src/transformers", + "tests/quantization", + "src", + "tests" + ], + "shared_filenames": [ + "src/transformers/integrations/ggml.py", + "src/transformers/modeling_gguf_pytorch_utils.py", + "tests/quantization/ggml/test_ggml.py" + ], + "similarity": 0.65, + "size_similarity": 0.717 + }, + { + "breadth_similarity": 0.5, + "concentration_similarity": 0.959, + "content_similarity": 0.666, + "left_pr_number": 45118, + "right_pr_number": 45283, + "shared_directories": [ + "src/transformers/integrations", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/integrations/ggml.py", + "src/transformers/modeling_gguf_pytorch_utils.py" + ], + "similarity": 0.646, + "size_similarity": 0.549 + }, + { + "breadth_similarity": 0.75, + "concentration_similarity": 0.707, + "content_similarity": 0.552, + "left_pr_number": 45118, + "right_pr_number": 45296, + "shared_directories": [ + "src/transformers/integrations", + "tests/quantization/ggml", + "src/transformers", + "tests/quantization", + "src", + "tests" + ], + "shared_filenames": [ + "src/transformers/integrations/ggml.py", + "src/transformers/modeling_gguf_pytorch_utils.py", + "tests/quantization/ggml/test_ggml.py" + ], + "similarity": 0.643, + "size_similarity": 0.979 + }, + { + "breadth_similarity": 0.667, + "concentration_similarity": 0.733, + "content_similarity": 0.666, + "left_pr_number": 44070, + "right_pr_number": 45283, + "shared_directories": [ + "src/transformers/integrations", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/integrations/ggml.py", + "src/transformers/modeling_gguf_pytorch_utils.py" + ], + "similarity": 0.628, + "size_similarity": 0.393 + }, + { + "breadth_similarity": 0.667, + "concentration_similarity": 0.665, + "content_similarity": 0.51, + "left_pr_number": 45283, + "right_pr_number": 45296, + "shared_directories": [ + "src/transformers/integrations", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/integrations/ggml.py", + "src/transformers/modeling_gguf_pytorch_utils.py" + ], + "similarity": 0.541, + "size_similarity": 0.56 + } + ], + "pr_count": 4, + "pr_numbers": [ + 44070, + 45118, + 45283, + 45296 + ], + "recent_pr_count": 4, + "recent_pr_numbers": [ + 44070, + 45118, + 45283, + 45296 + ], + "representative_pr_number": 44070, + "representative_title": "Add GGUF loading support for Qwen3-Next (qwen3_next) architecture", + "representative_url": "https://github.com/huggingface/transformers/pull/44070", + "shared_directories": [ + "src/transformers/integrations", + "tests/quantization/ggml", + "tests/quantization", + "tests" + ], + "shared_filenames": [ + "src/transformers/integrations/ggml.py", + "src/transformers/modeling_gguf_pytorch_utils.py", + "tests/quantization/ggml/test_ggml.py" + ], + "summary": "4 open PRs share weighted file overlap around `src/transformers/integrations/ggml.py`, `src/transformers/modeling_gguf_pytorch_utils.py`, `tests/quantization/ggml/test_ggml.py`; representative PR #44070.", + "title": "Scope: Add GGUF loading support for Qwen3-Next (qwen3_next) architecture" + }, + { + "authors": [ + "itazap", + "mohdfaour03", + "tomaarsen", + "yonigozlan" + ], + "average_similarity": 0.548, + "cluster_id": "pr-scope-45078-4", + "kind": "pr_scope", + "last_activity_at": "2026-04-15T13:59:35Z", + "outside_window_prs": [], + "pairwise": [ + { + "breadth_similarity": 1.0, + "concentration_similarity": 0.835, + "content_similarity": 0.872, + "left_pr_number": 45317, + "right_pr_number": 45444, + "shared_directories": [ + "tests/models/auto", + "src/transformers", + "tests/models", + "src", + "tests" + ], + "shared_filenames": [ + "src/transformers/tokenization_utils_tokenizers.py", + "tests/models/auto/test_tokenization_auto.py" + ], + "similarity": 0.81, + "size_similarity": 0.386 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 0.605, + "content_similarity": 0.45, + "left_pr_number": 45078, + "right_pr_number": 45444, + "shared_directories": [ + "tests/models/auto", + "src/transformers", + "tests/models", + "src", + "tests" + ], + "shared_filenames": [ + "tests/models/auto/test_tokenization_auto.py" + ], + "similarity": 0.535, + "size_similarity": 0.6 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 0.798, + "content_similarity": 0.442, + "left_pr_number": 45078, + "right_pr_number": 45293, + "shared_directories": [ + "src/transformers/models/auto", + "src/transformers/models", + "tests/models/auto", + "src/transformers", + "tests/models", + "src", + "tests" + ], + "shared_filenames": [ + "src/transformers/models/auto/tokenization_auto.py", + "tests/models/auto/test_tokenization_auto.py" + ], + "similarity": 0.521, + "size_similarity": 0.476 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 0.77, + "content_similarity": 0.385, + "left_pr_number": 45078, + "right_pr_number": 45317, + "shared_directories": [ + "tests/models/auto", + "src/transformers", + "tests/models", + "src", + "tests" + ], + "shared_filenames": [ + "tests/models/auto/test_tokenization_auto.py" + ], + "similarity": 0.505, + "size_similarity": 0.643 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 0.972, + "content_similarity": 0.333, + "left_pr_number": 45293, + "right_pr_number": 45317, + "shared_directories": [ + "tests/models/auto", + "src/transformers", + "tests/models", + "src", + "tests" + ], + "shared_filenames": [ + "tests/models/auto/test_tokenization_auto.py" + ], + "similarity": 0.493, + "size_similarity": 0.741 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 0.807, + "content_similarity": 0.341, + "left_pr_number": 45293, + "right_pr_number": 45444, + "shared_directories": [ + "tests/models/auto", + "src/transformers", + "tests/models", + "src", + "tests" + ], + "shared_filenames": [ + "tests/models/auto/test_tokenization_auto.py" + ], + "similarity": 0.422, + "size_similarity": 0.286 + } + ], + "pr_count": 4, + "pr_numbers": [ + 45078, + 45293, + 45317, + 45444 + ], + "recent_pr_count": 4, + "recent_pr_numbers": [ + 45078, + 45293, + 45317, + 45444 + ], + "representative_pr_number": 45317, + "representative_title": "Fix AttributeError in _patch_mistral_regex when fix_mistral_regex=True ", + "representative_url": "https://github.com/huggingface/transformers/pull/45317", + "shared_directories": [ + "tests/models/auto", + "tests/models", + "tests", + "src/transformers/models/auto", + "src/transformers/models" + ], + "shared_filenames": [ + "tests/models/auto/test_tokenization_auto.py", + "src/transformers/tokenization_utils_tokenizers.py", + "src/transformers/models/auto/tokenization_auto.py" + ], + "summary": "4 open PRs share weighted file overlap around `tests/models/auto/test_tokenization_auto.py`, `src/transformers/tokenization_utils_tokenizers.py`, `src/transformers/models/auto/tokenization_auto.py`; representative PR #45317.", + "title": "Scope: Fix AttributeError in _patch_mistral_regex when fix_mistral_regex=True " + }, + { + "authors": [ + "Charly21r", + "albertorkive", + "jesperschlegel", + "zucchini-nlp" + ], + "average_similarity": 0.465, + "cluster_id": "pr-scope-45294-4", + "kind": "pr_scope", + "last_activity_at": "2026-04-15T16:13:05Z", + "outside_window_prs": [], + "pairwise": [ + { + "breadth_similarity": 1.0, + "concentration_similarity": 0.989, + "content_similarity": 0.842, + "left_pr_number": 45294, + "right_pr_number": 45438, + "shared_directories": [ + "docs/source/en/model_doc", + "src/transformers/models/auto", + "src/transformers/models/gemma4", + "docs/source/en", + "src/transformers/models", + "tests/models/gemma4", + "docs/source", + "src/transformers", + "tests/models", + "docs" + ], + "shared_filenames": [ + "docs/source/en/model_doc/gemma4.md", + "src/transformers/models/auto/modeling_auto.py", + "src/transformers/models/gemma4/modeling_gemma4.py", + "src/transformers/models/gemma4/modular_gemma4.py", + "tests/models/gemma4/test_modeling_gemma4.py" + ], + "similarity": 0.802, + "size_similarity": 0.42 + }, + { + "breadth_similarity": 0.757, + "concentration_similarity": 0.405, + "content_similarity": 0.394, + "left_pr_number": 45438, + "right_pr_number": 45454, + "shared_directories": [ + "src/transformers/models/gemma4", + "src/transformers/models", + "tests/models/gemma4", + "src/transformers", + "tests/models", + "src", + "tests" + ], + "shared_filenames": [ + "src/transformers/models/gemma4/modeling_gemma4.py", + "src/transformers/models/gemma4/modular_gemma4.py", + "tests/models/gemma4/test_modeling_gemma4.py" + ], + "similarity": 0.469, + "size_similarity": 0.647 + }, + { + "breadth_similarity": 0.757, + "concentration_similarity": 0.416, + "content_similarity": 0.338, + "left_pr_number": 45294, + "right_pr_number": 45454, + "shared_directories": [ + "src/transformers/models/gemma4", + "src/transformers/models", + "tests/models/gemma4", + "src/transformers", + "tests/models", + "src", + "tests" + ], + "shared_filenames": [ + "src/transformers/models/gemma4/modeling_gemma4.py", + "src/transformers/models/gemma4/modular_gemma4.py", + "tests/models/gemma4/test_modeling_gemma4.py" + ], + "similarity": 0.431, + "size_similarity": 0.649 + }, + { + "breadth_similarity": 0.65, + "concentration_similarity": 0.961, + "content_similarity": 0.307, + "left_pr_number": 45294, + "right_pr_number": 45388, + "shared_directories": [ + "src/transformers/models/gemma4", + "src/transformers/models", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/models/gemma4/modeling_gemma4.py", + "src/transformers/models/gemma4/modular_gemma4.py" + ], + "similarity": 0.423, + "size_similarity": 0.633 + }, + { + "breadth_similarity": 0.65, + "concentration_similarity": 0.972, + "content_similarity": 0.347, + "left_pr_number": 45388, + "right_pr_number": 45438, + "shared_directories": [ + "src/transformers/models/gemma4", + "src/transformers/models", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/models/gemma4/modeling_gemma4.py", + "src/transformers/models/gemma4/modular_gemma4.py" + ], + "similarity": 0.397, + "size_similarity": 0.266 + }, + { + "breadth_similarity": 0.486, + "concentration_similarity": 0.377, + "content_similarity": 0.201, + "left_pr_number": 45388, + "right_pr_number": 45454, + "shared_directories": [ + "src/transformers/models/gemma4", + "src/transformers/models", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/models/gemma4/modeling_gemma4.py", + "src/transformers/models/gemma4/modular_gemma4.py" + ], + "similarity": 0.27, + "size_similarity": 0.411 + } + ], + "pr_count": 4, + "pr_numbers": [ + 45294, + 45388, + 45438, + 45454 + ], + "recent_pr_count": 4, + "recent_pr_numbers": [ + 45294, + 45388, + 45438, + 45454 + ], + "representative_pr_number": 45438, + "representative_title": "Add Gemma4ForSequenceClassification", + "representative_url": "https://github.com/huggingface/transformers/pull/45438", + "shared_directories": [ + "src/transformers/models/gemma4", + "src/transformers/models", + "tests/models/gemma4", + "tests/models", + "tests", + "docs/source/en/model_doc", + "src/transformers/models/auto", + "docs/source/en" + ], + "shared_filenames": [ + "src/transformers/models/gemma4/modeling_gemma4.py", + "src/transformers/models/gemma4/modular_gemma4.py", + "tests/models/gemma4/test_modeling_gemma4.py", + "docs/source/en/model_doc/gemma4.md", + "src/transformers/models/auto/modeling_auto.py" + ], + "summary": "4 open PRs share weighted file overlap around `src/transformers/models/gemma4/modeling_gemma4.py`, `src/transformers/models/gemma4/modular_gemma4.py`, `tests/models/gemma4/test_modeling_gemma4.py`; representative PR #45438.", + "title": "Scope: Add Gemma4ForSequenceClassification" + }, + { + "authors": [ + "IvanFan-Van", + "dacorvo", + "ruben-aghayan" + ], + "average_similarity": 0.406, + "cluster_id": "pr-scope-34667-5", + "kind": "pr_scope", + "last_activity_at": "2026-04-14T20:04:30Z", + "outside_window_prs": [ + { + "additions": 10, + "author": "andrewqianpublic", + "changed_files": 1, + "created_at": "2024-11-09T06:18:31Z", + "deletions": 1, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/34667/files", + "html_url": "https://github.com/huggingface/transformers/pull/34667", + "merged": false, + "number": 34667, + "state": "open", + "title": "Clear unused allocated GPU memory when available GPU memory is low. ", + "updated_at": "2026-03-06T07:28:06Z" + }, + { + "additions": 23, + "author": "bonpiedlaroute", + "changed_files": 1, + "created_at": "2025-07-25T21:27:34Z", + "deletions": 0, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/39683/files", + "html_url": "https://github.com/huggingface/transformers/pull/39683", + "merged": false, + "number": 39683, + "state": "open", + "title": "Fix issue #39191 respect accelerate config to disable torch.dynamo compilation", + "updated_at": "2026-01-27T12:42:58Z" + } + ], + "pairwise": [ + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.46, + "left_pr_number": 34667, + "right_pr_number": 39683, + "shared_directories": [ + "src/transformers/generation", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/generation/utils.py" + ], + "similarity": 0.544, + "size_similarity": 0.478 + }, + { + "breadth_similarity": 0.5, + "concentration_similarity": 0.562, + "content_similarity": 0.56, + "left_pr_number": 34667, + "right_pr_number": 45389, + "shared_directories": [ + "src/transformers/generation", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/generation/utils.py" + ], + "similarity": 0.522, + "size_similarity": 0.344 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.372, + "left_pr_number": 34667, + "right_pr_number": 44872, + "shared_directories": [ + "src/transformers/generation", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/generation/utils.py" + ], + "similarity": 0.451, + "size_similarity": 0.273 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.27, + "left_pr_number": 44757, + "right_pr_number": 44872, + "shared_directories": [ + "src/transformers/generation", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/generation/utils.py" + ], + "similarity": 0.439, + "size_similarity": 0.667 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.371, + "left_pr_number": 39683, + "right_pr_number": 44872, + "shared_directories": [ + "src/transformers/generation", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/generation/utils.py" + ], + "similarity": 0.429, + "size_similarity": 0.13 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.335, + "left_pr_number": 34667, + "right_pr_number": 44757, + "shared_directories": [ + "src/transformers/generation", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/generation/utils.py" + ], + "similarity": 0.412, + "size_similarity": 0.182 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.334, + "left_pr_number": 39683, + "right_pr_number": 44757, + "shared_directories": [ + "src/transformers/generation", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/generation/utils.py" + ], + "similarity": 0.397, + "size_similarity": 0.087 + }, + { + "breadth_similarity": 0.5, + "concentration_similarity": 0.562, + "content_similarity": 0.284, + "left_pr_number": 39683, + "right_pr_number": 45389, + "shared_directories": [ + "src/transformers/generation", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/generation/utils.py" + ], + "similarity": 0.385, + "size_similarity": 0.719 + }, + { + "breadth_similarity": 0.5, + "concentration_similarity": 0.562, + "content_similarity": 0.23, + "left_pr_number": 44872, + "right_pr_number": 45389, + "shared_directories": [ + "src/transformers/generation", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/generation/utils.py" + ], + "similarity": 0.253, + "size_similarity": 0.094 + }, + { + "breadth_similarity": 0.5, + "concentration_similarity": 0.562, + "content_similarity": 0.207, + "left_pr_number": 44757, + "right_pr_number": 45389, + "shared_directories": [ + "src/transformers/generation", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/generation/utils.py" + ], + "similarity": 0.232, + "size_similarity": 0.062 + } + ], + "pr_count": 5, + "pr_numbers": [ + 34667, + 39683, + 44757, + 44872, + 45389 + ], + "recent_pr_count": 3, + "recent_pr_numbers": [ + 44757, + 44872, + 45389 + ], + "representative_pr_number": 34667, + "representative_title": "Clear unused allocated GPU memory when available GPU memory is low. ", + "representative_url": "https://github.com/huggingface/transformers/pull/34667", + "shared_directories": [ + "src/transformers/generation" + ], + "shared_filenames": [ + "src/transformers/generation/utils.py" + ], + "summary": "5 open PRs share weighted file overlap around `src/transformers/generation/utils.py`; representative PR #34667.", + "title": "Scope: Clear unused allocated GPU memory when available GPU memory is low. " + }, + { + "authors": [ + "IlyasMoutawwakil", + "andylizf", + "zucchini-nlp" + ], + "average_similarity": 0.448, + "cluster_id": "pr-scope-41992-4", + "kind": "pr_scope", + "last_activity_at": "2026-04-15T14:22:15Z", + "outside_window_prs": [ + { + "additions": 5038, + "author": "IlyasMoutawwakil", + "changed_files": 82, + "created_at": "2025-11-03T14:20:21Z", + "deletions": 2192, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/41992/files", + "html_url": "https://github.com/huggingface/transformers/pull/41992", + "merged": false, + "number": 41992, + "state": "open", + "title": "[PoC] HF exporters", + "updated_at": "2026-04-13T08:41:05Z" + } + ], + "pairwise": [ + { + "breadth_similarity": 0.544, + "concentration_similarity": 0.954, + "content_similarity": 0.64, + "left_pr_number": 44157, + "right_pr_number": 45396, + "shared_directories": [ + "src/transformers/models/ernie4_5_vl_moe", + "src/transformers/models/glm4v", + "src/transformers/models/glm4v_moe", + "src/transformers/models/glm_ocr", + "src/transformers/models/paddleocr_vl", + "src/transformers/models/qwen2_5_omni", + "src/transformers/models/qwen2_5_vl", + "src/transformers/models/qwen2_vl", + "src/transformers/models/qwen3_5", + "src/transformers/models/qwen3_5_moe" + ], + "shared_filenames": [ + "src/transformers/models/ernie4_5_vl_moe/modeling_ernie4_5_vl_moe.py", + "src/transformers/models/ernie4_5_vl_moe/modular_ernie4_5_vl_moe.py", + "src/transformers/models/glm4v/modeling_glm4v.py", + "src/transformers/models/glm4v/modular_glm4v.py", + "src/transformers/models/glm4v_moe/modeling_glm4v_moe.py", + "src/transformers/models/glm_ocr/modeling_glm_ocr.py", + "src/transformers/models/glm_ocr/modular_glm_ocr.py", + "src/transformers/models/paddleocr_vl/modeling_paddleocr_vl.py", + "src/transformers/models/paddleocr_vl/modular_paddleocr_vl.py", + "src/transformers/models/qwen2_5_omni/modeling_qwen2_5_omni.py" + ], + "similarity": 0.6, + "size_similarity": 0.334 + }, + { + "breadth_similarity": 0.896, + "concentration_similarity": 0.919, + "content_similarity": 0.588, + "left_pr_number": 44157, + "right_pr_number": 44973, + "shared_directories": [ + "src/transformers/models/ernie4_5_vl_moe", + "src/transformers/models/glm4v", + "src/transformers/models/glm4v_moe", + "src/transformers/models/glm_ocr", + "src/transformers/models/paddleocr_vl", + "src/transformers/models/qwen2_5_omni", + "src/transformers/models/qwen2_5_vl", + "src/transformers/models/qwen2_vl", + "src/transformers/models/qwen3_5", + "src/transformers/models/qwen3_5_moe" + ], + "shared_filenames": [ + "src/transformers/models/ernie4_5_vl_moe/modeling_ernie4_5_vl_moe.py", + "src/transformers/models/glm4v/modeling_glm4v.py", + "src/transformers/models/glm4v_moe/modeling_glm4v_moe.py", + "src/transformers/models/glm_ocr/modeling_glm_ocr.py", + "src/transformers/models/glm_ocr/modular_glm_ocr.py", + "src/transformers/models/paddleocr_vl/modeling_paddleocr_vl.py", + "src/transformers/models/qwen2_5_omni/modeling_qwen2_5_omni.py", + "src/transformers/models/qwen2_5_omni/modular_qwen2_5_omni.py", + "src/transformers/models/qwen2_5_vl/modeling_qwen2_5_vl.py", + "src/transformers/models/qwen2_vl/modeling_qwen2_vl.py" + ], + "similarity": 0.551, + "size_similarity": 0.029 + }, + { + "breadth_similarity": 0.544, + "concentration_similarity": 0.831, + "content_similarity": 0.473, + "left_pr_number": 41992, + "right_pr_number": 45396, + "shared_directories": [ + "src/transformers/models/ernie4_5_vl_moe", + "src/transformers/models/esm", + "src/transformers/models/glm46v", + "src/transformers/models/glm4v", + "src/transformers/models/glm4v_moe", + "src/transformers/models/glm_image", + "src/transformers/models/glm_ocr", + "src/transformers/models/paddleocr_vl", + "src/transformers/models/qwen2_5_omni", + "src/transformers/models/qwen2_5_vl" + ], + "shared_filenames": [ + "src/transformers/models/ernie4_5_vl_moe/modeling_ernie4_5_vl_moe.py", + "src/transformers/models/ernie4_5_vl_moe/modular_ernie4_5_vl_moe.py", + "src/transformers/models/esm/configuration_esm.py", + "src/transformers/models/glm46v/modeling_glm46v.py", + "src/transformers/models/glm4v/modeling_glm4v.py", + "src/transformers/models/glm4v/modular_glm4v.py", + "src/transformers/models/glm4v_moe/modeling_glm4v_moe.py", + "src/transformers/models/glm_image/modeling_glm_image.py", + "src/transformers/models/glm_image/modular_glm_image.py", + "src/transformers/models/glm_ocr/modeling_glm_ocr.py" + ], + "similarity": 0.521, + "size_similarity": 0.631 + }, + { + "breadth_similarity": 0.489, + "concentration_similarity": 0.965, + "content_similarity": 0.41, + "left_pr_number": 44973, + "right_pr_number": 45396, + "shared_directories": [ + "src/transformers/models/ernie4_5_vl_moe", + "src/transformers/models/glm4v", + "src/transformers/models/glm4v_moe", + "src/transformers/models/glm_image", + "src/transformers/models/glm_ocr", + "src/transformers/models/paddleocr_vl", + "src/transformers/models/qwen2_5_omni", + "src/transformers/models/qwen2_5_vl", + "src/transformers/models/qwen2_vl", + "src/transformers/models/qwen3_5" + ], + "shared_filenames": [ + "src/transformers/models/ernie4_5_vl_moe/modeling_ernie4_5_vl_moe.py", + "src/transformers/models/glm4v/modeling_glm4v.py", + "src/transformers/models/glm4v_moe/modeling_glm4v_moe.py", + "src/transformers/models/glm_image/modeling_glm_image.py", + "src/transformers/models/glm_image/modular_glm_image.py", + "src/transformers/models/glm_ocr/modeling_glm_ocr.py", + "src/transformers/models/glm_ocr/modular_glm_ocr.py", + "src/transformers/models/paddleocr_vl/modeling_paddleocr_vl.py", + "src/transformers/models/qwen2_5_omni/modeling_qwen2_5_omni.py", + "src/transformers/models/qwen2_5_omni/modular_qwen2_5_omni.py" + ], + "similarity": 0.386, + "size_similarity": 0.01 + }, + { + "breadth_similarity": 0.296, + "concentration_similarity": 0.785, + "content_similarity": 0.392, + "left_pr_number": 41992, + "right_pr_number": 44157, + "shared_directories": [ + "src/transformers/models/ernie4_5_vl_moe", + "src/transformers/models/glm4v", + "src/transformers/models/glm4v_moe", + "src/transformers/models/glm_ocr", + "src/transformers/models/paddleocr_vl", + "src/transformers/models/qwen2_5_omni", + "src/transformers/models/qwen2_5_vl", + "src/transformers/models/qwen2_vl", + "src/transformers/models/qwen3_5", + "src/transformers/models/qwen3_5_moe" + ], + "shared_filenames": [ + "src/transformers/models/ernie4_5_vl_moe/modeling_ernie4_5_vl_moe.py", + "src/transformers/models/ernie4_5_vl_moe/modular_ernie4_5_vl_moe.py", + "src/transformers/models/glm4v/modeling_glm4v.py", + "src/transformers/models/glm4v/modular_glm4v.py", + "src/transformers/models/glm4v_moe/modeling_glm4v_moe.py", + "src/transformers/models/glm_ocr/modeling_glm_ocr.py", + "src/transformers/models/glm_ocr/modular_glm_ocr.py", + "src/transformers/models/paddleocr_vl/modeling_paddleocr_vl.py", + "src/transformers/models/paddleocr_vl/modular_paddleocr_vl.py", + "src/transformers/models/qwen2_5_omni/modeling_qwen2_5_omni.py" + ], + "similarity": 0.375, + "size_similarity": 0.211 + }, + { + "breadth_similarity": 0.266, + "concentration_similarity": 0.866, + "content_similarity": 0.262, + "left_pr_number": 41992, + "right_pr_number": 44973, + "shared_directories": [ + "src/transformers/models/ernie4_5_vl_moe", + "src/transformers/models/glm4v", + "src/transformers/models/glm4v_moe", + "src/transformers/models/glm_image", + "src/transformers/models/glm_ocr", + "src/transformers/models/paddleocr_vl", + "src/transformers/models/qwen2_5_omni", + "src/transformers/models/qwen2_5_vl", + "src/transformers/models/qwen2_vl", + "src/transformers/models/qwen3_5" + ], + "shared_filenames": [ + "src/transformers/models/ernie4_5_vl_moe/modeling_ernie4_5_vl_moe.py", + "src/transformers/models/glm4v/modeling_glm4v.py", + "src/transformers/models/glm4v_moe/modeling_glm4v_moe.py", + "src/transformers/models/glm_image/modeling_glm_image.py", + "src/transformers/models/glm_image/modular_glm_image.py", + "src/transformers/models/glm_ocr/modeling_glm_ocr.py", + "src/transformers/models/glm_ocr/modular_glm_ocr.py", + "src/transformers/models/paddleocr_vl/modeling_paddleocr_vl.py", + "src/transformers/models/qwen2_5_omni/modeling_qwen2_5_omni.py", + "src/transformers/models/qwen2_5_omni/modular_qwen2_5_omni.py" + ], + "similarity": 0.254, + "size_similarity": 0.006 + } + ], + "pr_count": 4, + "pr_numbers": [ + 41992, + 44157, + 44973, + 45396 + ], + "recent_pr_count": 3, + "recent_pr_numbers": [ + 44157, + 44973, + 45396 + ], + "representative_pr_number": 44157, + "representative_title": "Use correct mask for packed inputs in Qwen-VL ", + "representative_url": "https://github.com/huggingface/transformers/pull/44157", + "shared_directories": [ + "src/transformers/models/glm_ocr", + "src/transformers/models/glm4v", + "src/transformers/models/paddleocr_vl", + "src/transformers/models/qwen3_5_moe", + "src/transformers/models/video_llama_3", + "src/transformers/models/glm4v_moe", + "src/transformers/models/qwen2_vl", + "src/transformers/models/qwen2_5_omni" + ], + "shared_filenames": [ + "src/transformers/models/glm_ocr/modular_glm_ocr.py", + "src/transformers/models/glm4v/modeling_glm4v.py", + "src/transformers/models/glm_ocr/modeling_glm_ocr.py", + "src/transformers/models/paddleocr_vl/modeling_paddleocr_vl.py", + "src/transformers/models/qwen3_5_moe/modeling_qwen3_5_moe.py", + "src/transformers/models/qwen3_vl/modeling_qwen3_vl.py", + "src/transformers/models/video_llama_3/modeling_video_llama_3.py", + "src/transformers/models/video_llama_3/modular_video_llama_3.py" + ], + "summary": "4 open PRs share weighted file overlap around `src/transformers/models/glm_ocr/modular_glm_ocr.py`, `src/transformers/models/glm4v/modeling_glm4v.py`, `src/transformers/models/glm_ocr/modeling_glm_ocr.py`; representative PR #44157.", + "title": "Scope: Use correct mask for packed inputs in Qwen-VL " + }, + { + "authors": [ + "Jay-IIT", + "Zephyr-Blessed", + "chandan11248" + ], + "average_similarity": 0.941, + "cluster_id": "pr-scope-44066-3", + "kind": "pr_scope", + "last_activity_at": "2026-03-19T18:12:59Z", + "outside_window_prs": [], + "pairwise": [ + { + "breadth_similarity": 1.0, + "concentration_similarity": 0.957, + "content_similarity": 0.967, + "left_pr_number": 44066, + "right_pr_number": 44722, + "shared_directories": [ + "src/transformers/models/codegen", + "src/transformers/models/gptj", + "src/transformers/models", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/models/codegen/modeling_codegen.py", + "src/transformers/models/gptj/modeling_gptj.py" + ], + "similarity": 0.969, + "size_similarity": 0.959 + }, + { + "breadth_similarity": 0.5, + "concentration_similarity": 0.986, + "content_similarity": 0.988, + "left_pr_number": 44085, + "right_pr_number": 44722, + "shared_directories": [ + "src/transformers/models/gptj", + "src/transformers/models", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/models/gptj/modeling_gptj.py" + ], + "similarity": 0.938, + "size_similarity": 0.98 + }, + { + "breadth_similarity": 0.5, + "concentration_similarity": 0.944, + "content_similarity": 0.963, + "left_pr_number": 44066, + "right_pr_number": 44085, + "shared_directories": [ + "src/transformers/models/gptj", + "src/transformers/models", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/models/gptj/modeling_gptj.py" + ], + "similarity": 0.918, + "size_similarity": 0.979 + } + ], + "pr_count": 3, + "pr_numbers": [ + 44066, + 44085, + 44722 + ], + "recent_pr_count": 3, + "recent_pr_numbers": [ + 44066, + 44085, + 44722 + ], + "representative_pr_number": 44722, + "representative_title": "Refactor gptj output tracing to use standardized decorators", + "representative_url": "https://github.com/huggingface/transformers/pull/44722", + "shared_directories": [ + "src/transformers/models/gptj", + "src/transformers/models", + "src/transformers/models/codegen" + ], + "shared_filenames": [ + "src/transformers/models/gptj/modeling_gptj.py", + "src/transformers/models/codegen/modeling_codegen.py" + ], + "summary": "3 open PRs share weighted file overlap around `src/transformers/models/gptj/modeling_gptj.py`, `src/transformers/models/codegen/modeling_codegen.py`; representative PR #44722.", + "title": "Scope: Refactor gptj output tracing to use standardized decorators" + }, + { + "authors": [ + "JokeYoonic", + "akashadsare", + "lakprigan" + ], + "average_similarity": 0.571, + "cluster_id": "pr-scope-44015-3", + "kind": "pr_scope", + "last_activity_at": "2026-03-18T17:16:49Z", + "outside_window_prs": [], + "pairwise": [ + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.754, + "left_pr_number": 44059, + "right_pr_number": 44676, + "shared_directories": [ + "src/transformers/models/gpt2", + "src/transformers/models", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/models/gpt2/modeling_gpt2.py" + ], + "similarity": 0.687, + "size_similarity": 0.062 + }, + { + "breadth_similarity": 0.333, + "concentration_similarity": 0.488, + "content_similarity": 0.673, + "left_pr_number": 44015, + "right_pr_number": 44059, + "shared_directories": [ + "src/transformers/models/gpt2", + "src/transformers/models", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/models/gpt2/modeling_gpt2.py" + ], + "similarity": 0.61, + "size_similarity": 0.543 + }, + { + "breadth_similarity": 0.333, + "concentration_similarity": 0.488, + "content_similarity": 0.506, + "left_pr_number": 44015, + "right_pr_number": 44676, + "shared_directories": [ + "src/transformers/models/gpt2", + "src/transformers/models", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/models/gpt2/modeling_gpt2.py" + ], + "similarity": 0.417, + "size_similarity": 0.034 + } + ], + "pr_count": 3, + "pr_numbers": [ + 44015, + 44059, + 44676 + ], + "recent_pr_count": 3, + "recent_pr_numbers": [ + 44015, + 44059, + 44676 + ], + "representative_pr_number": 44059, + "representative_title": "[GPT2] Refactor output tracing to use capture_outputs/can_return_tuple decorators", + "representative_url": "https://github.com/huggingface/transformers/pull/44059", + "shared_directories": [ + "src/transformers/models/gpt2", + "src/transformers/models" + ], + "shared_filenames": [ + "src/transformers/models/gpt2/modeling_gpt2.py" + ], + "summary": "3 open PRs share weighted file overlap around `src/transformers/models/gpt2/modeling_gpt2.py`; representative PR #44059.", + "title": "Scope: [GPT2] Refactor output tracing to use capture_outputs/can_return_tuple decorators" + }, + { + "authors": [ + "3outeille", + "Cyrilvallez", + "yonigozlan" + ], + "average_similarity": 0.445, + "cluster_id": "pr-scope-44974-3", + "kind": "pr_scope", + "last_activity_at": "2026-04-15T16:32:23Z", + "outside_window_prs": [], + "pairwise": [ + { + "breadth_similarity": 0.633, + "concentration_similarity": 0.959, + "content_similarity": 0.594, + "left_pr_number": 44974, + "right_pr_number": 45448, + "shared_directories": [ + "src/transformers", + "tests/utils", + "src", + "tests" + ], + "shared_filenames": [ + "src/transformers/core_model_loading.py", + "tests/utils/test_core_model_loading.py" + ], + "similarity": 0.595, + "size_similarity": 0.455 + }, + { + "breadth_similarity": 0.667, + "concentration_similarity": 0.657, + "content_similarity": 0.314, + "left_pr_number": 44974, + "right_pr_number": 45421, + "shared_directories": [ + "src/transformers", + "src", + "tests" + ], + "shared_filenames": [ + "src/transformers/core_model_loading.py" + ], + "similarity": 0.43, + "size_similarity": 0.735 + }, + { + "breadth_similarity": 0.417, + "concentration_similarity": 0.616, + "content_similarity": 0.206, + "left_pr_number": 45421, + "right_pr_number": 45448, + "shared_directories": [ + "src/transformers", + "src", + "tests" + ], + "shared_filenames": [ + "src/transformers/core_model_loading.py" + ], + "similarity": 0.309, + "size_similarity": 0.619 + } + ], + "pr_count": 3, + "pr_numbers": [ + 44974, + 45421, + 45448 + ], + "recent_pr_count": 3, + "recent_pr_numbers": [ + 44974, + 45421, + 45448 + ], + "representative_pr_number": 44974, + "representative_title": "Refactor core_model_loading to support FSDP shard-on-read loading", + "representative_url": "https://github.com/huggingface/transformers/pull/44974", + "shared_directories": [ + "tests", + "tests/utils" + ], + "shared_filenames": [ + "src/transformers/core_model_loading.py", + "tests/utils/test_core_model_loading.py" + ], + "summary": "3 open PRs share weighted file overlap around `src/transformers/core_model_loading.py`, `tests/utils/test_core_model_loading.py`; representative PR #44974.", + "title": "Scope: Refactor core_model_loading to support FSDP shard-on-read loading" + }, + { + "authors": [ + "AkshajKashyap", + "roycho96", + "saslifat-gif" + ], + "average_similarity": 0.396, + "cluster_id": "pr-scope-44889-3", + "kind": "pr_scope", + "last_activity_at": "2026-04-15T06:11:00Z", + "outside_window_prs": [], + "pairwise": [ + { + "breadth_similarity": 1.0, + "concentration_similarity": 0.927, + "content_similarity": 0.424, + "left_pr_number": 44889, + "right_pr_number": 45402, + "shared_directories": [ + "tests/trainer/distributed", + "src/transformers", + "tests/trainer", + "src", + "tests" + ], + "shared_filenames": [ + "tests/trainer/distributed/test_trainer_distributed_deepspeed.py" + ], + "similarity": 0.506, + "size_similarity": 0.421 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 0.812, + "content_similarity": 0.169, + "left_pr_number": 44889, + "right_pr_number": 44981, + "shared_directories": [ + "src/transformers", + "tests/trainer", + "src", + "tests" + ], + "shared_filenames": [ + "src/transformers/trainer.py" + ], + "similarity": 0.408, + "size_similarity": 0.991 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 0.885, + "content_similarity": 0.097, + "left_pr_number": 44981, + "right_pr_number": 45402, + "shared_directories": [ + "src/transformers", + "tests/trainer", + "src", + "tests" + ], + "shared_filenames": [], + "similarity": 0.275, + "size_similarity": 0.417 + } + ], + "pr_count": 3, + "pr_numbers": [ + 44889, + 44981, + 45402 + ], + "recent_pr_count": 3, + "recent_pr_numbers": [ + 44889, + 44981, + 45402 + ], + "representative_pr_number": 44889, + "representative_title": "[DeepSpeed] Fix evaluate()/predict() before train()", + "representative_url": "https://github.com/huggingface/transformers/pull/44889", + "shared_directories": [ + "tests/trainer", + "tests", + "tests/trainer/distributed" + ], + "shared_filenames": [ + "tests/trainer/distributed/test_trainer_distributed_deepspeed.py", + "src/transformers/trainer.py" + ], + "summary": "3 open PRs share weighted file overlap around `tests/trainer/distributed/test_trainer_distributed_deepspeed.py`, `src/transformers/trainer.py`; representative PR #44889.", + "title": "Scope: [DeepSpeed] Fix evaluate()/predict() before train()" + }, + { + "authors": [ + "SunMarc", + "rain-1" + ], + "average_similarity": 0.499, + "cluster_id": "pr-scope-43656-5", + "kind": "pr_scope", + "last_activity_at": "2026-04-15T15:16:40Z", + "outside_window_prs": [ + { + "additions": 9, + "author": "jonathan-fulton", + "changed_files": 1, + "created_at": "2026-01-31T18:54:19Z", + "deletions": 9, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/43656/files", + "html_url": "https://github.com/huggingface/transformers/pull/43656", + "merged": false, + "number": 43656, + "state": "open", + "title": "Fix TypeAdapter NameError in transformers CLI", + "updated_at": "2026-03-01T12:00:57Z" + }, + { + "additions": 79, + "author": "pragnyanramtha", + "changed_files": 1, + "created_at": "2026-02-08T11:28:31Z", + "deletions": 70, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/43836/files", + "html_url": "https://github.com/huggingface/transformers/pull/43836", + "merged": false, + "number": 43836, + "state": "open", + "title": "fix: wrapped TypeAdpater in string literals (for now)", + "updated_at": "2026-02-17T04:46:27Z" + }, + { + "additions": 3, + "author": "Mr-Neutr0n", + "changed_files": 1, + "created_at": "2026-02-08T13:01:19Z", + "deletions": 1, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/43842/files", + "html_url": "https://github.com/huggingface/transformers/pull/43842", + "merged": false, + "number": 43842, + "state": "open", + "title": "fix(cli): Fix TypeAdapter NameError when pydantic is not installed", + "updated_at": "2026-02-08T16:08:04Z" + } + ], + "pairwise": [ + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.734, + "left_pr_number": 43656, + "right_pr_number": 43836, + "shared_directories": [ + "src/transformers/cli", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/cli/serve.py" + ], + "similarity": 0.682, + "size_similarity": 0.121 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.65, + "left_pr_number": 43836, + "right_pr_number": 43842, + "shared_directories": [ + "src/transformers/cli", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/cli/serve.py" + ], + "similarity": 0.609, + "size_similarity": 0.027 + }, + { + "breadth_similarity": 0.5, + "concentration_similarity": 0.802, + "content_similarity": 0.645, + "left_pr_number": 43836, + "right_pr_number": 44682, + "shared_directories": [ + "src/transformers/cli", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/cli/serve.py" + ], + "similarity": 0.602, + "size_similarity": 0.398 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.579, + "left_pr_number": 43656, + "right_pr_number": 43842, + "shared_directories": [ + "src/transformers/cli", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/cli/serve.py" + ], + "similarity": 0.589, + "size_similarity": 0.222 + }, + { + "breadth_similarity": 0.667, + "concentration_similarity": 0.752, + "content_similarity": 0.405, + "left_pr_number": 44558, + "right_pr_number": 44682, + "shared_directories": [ + "src/transformers/cli", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/cli/serve.py" + ], + "similarity": 0.535, + "size_similarity": 0.984 + }, + { + "breadth_similarity": 0.333, + "concentration_similarity": 0.554, + "content_similarity": 0.491, + "left_pr_number": 43836, + "right_pr_number": 44558, + "shared_directories": [ + "src/transformers/cli", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/cli/serve.py" + ], + "similarity": 0.465, + "size_similarity": 0.405 + }, + { + "breadth_similarity": 0.5, + "concentration_similarity": 0.802, + "content_similarity": 0.488, + "left_pr_number": 43656, + "right_pr_number": 44682, + "shared_directories": [ + "src/transformers/cli", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/cli/serve.py" + ], + "similarity": 0.439, + "size_similarity": 0.048 + }, + { + "breadth_similarity": 0.5, + "concentration_similarity": 0.802, + "content_similarity": 0.449, + "left_pr_number": 43842, + "right_pr_number": 44682, + "shared_directories": [ + "src/transformers/cli", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/cli/serve.py" + ], + "similarity": 0.406, + "size_similarity": 0.011 + }, + { + "breadth_similarity": 0.333, + "concentration_similarity": 0.554, + "content_similarity": 0.409, + "left_pr_number": 43656, + "right_pr_number": 44558, + "shared_directories": [ + "src/transformers/cli", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/cli/serve.py" + ], + "similarity": 0.355, + "size_similarity": 0.049 + }, + { + "breadth_similarity": 0.333, + "concentration_similarity": 0.554, + "content_similarity": 0.345, + "left_pr_number": 43842, + "right_pr_number": 44558, + "shared_directories": [ + "src/transformers/cli", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/cli/serve.py" + ], + "similarity": 0.304, + "size_similarity": 0.011 + } + ], + "pr_count": 5, + "pr_numbers": [ + 43656, + 43836, + 43842, + 44558, + 44682 + ], + "recent_pr_count": 2, + "recent_pr_numbers": [ + 44558, + 44682 + ], + "representative_pr_number": 43836, + "representative_title": "fix: wrapped TypeAdpater in string literals (for now)", + "representative_url": "https://github.com/huggingface/transformers/pull/43836", + "shared_directories": [ + "src/transformers/cli" + ], + "shared_filenames": [ + "src/transformers/cli/serve.py" + ], + "summary": "5 open PRs share weighted file overlap around `src/transformers/cli/serve.py`; representative PR #43836.", + "title": "Scope: fix: wrapped TypeAdpater in string literals (for now)" + }, + { + "authors": [ + "Sid-V5", + "pdwi2020" + ], + "average_similarity": 0.525, + "cluster_id": "pr-scope-43997-3", + "kind": "pr_scope", + "last_activity_at": "2026-02-19T15:49:49Z", + "outside_window_prs": [ + { + "additions": 12, + "author": "karthiksuki", + "changed_files": 1, + "created_at": "2026-02-14T19:57:54Z", + "deletions": 45, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/43997/files", + "html_url": "https://github.com/huggingface/transformers/pull/43997", + "merged": false, + "number": 43997, + "state": "open", + "title": "Migrate RegNet to standardized output tracing", + "updated_at": "2026-02-14T20:10:22Z" + } + ], + "pairwise": [ + { + "breadth_similarity": 0.333, + "concentration_similarity": 0.548, + "content_similarity": 0.695, + "left_pr_number": 44007, + "right_pr_number": 44019, + "shared_directories": [ + "src/transformers/models/resnet", + "src/transformers/models", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/models/resnet/modeling_resnet.py" + ], + "similarity": 0.688, + "size_similarity": 0.94 + }, + { + "breadth_similarity": 0.333, + "concentration_similarity": 0.548, + "content_similarity": 0.653, + "left_pr_number": 43997, + "right_pr_number": 44007, + "shared_directories": [ + "src/transformers/models/regnet", + "src/transformers/models", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/models/regnet/modeling_regnet.py" + ], + "similarity": 0.619, + "size_similarity": 0.679 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.013, + "left_pr_number": 43997, + "right_pr_number": 44019, + "shared_directories": [ + "src/transformers/models", + "src/transformers", + "src" + ], + "shared_filenames": [], + "similarity": 0.267, + "size_similarity": 0.722 + } + ], + "pr_count": 3, + "pr_numbers": [ + 43997, + 44007, + 44019 + ], + "recent_pr_count": 2, + "recent_pr_numbers": [ + 44007, + 44019 + ], + "representative_pr_number": 44007, + "representative_title": "[ResNet] Refactor output tracing to decorator-based interface", + "representative_url": "https://github.com/huggingface/transformers/pull/44007", + "shared_directories": [ + "src/transformers/models", + "src/transformers/models/regnet", + "src/transformers/models/resnet" + ], + "shared_filenames": [ + "src/transformers/models/regnet/modeling_regnet.py", + "src/transformers/models/resnet/modeling_resnet.py" + ], + "summary": "3 open PRs share weighted file overlap around `src/transformers/models/regnet/modeling_regnet.py`, `src/transformers/models/resnet/modeling_resnet.py`; representative PR #44007.", + "title": "Scope: [ResNet] Refactor output tracing to decorator-based interface" + }, + { + "authors": [ + "himani27301", + "hongping-zh" + ], + "average_similarity": 0.373, + "cluster_id": "pr-scope-33686-3", + "kind": "pr_scope", + "last_activity_at": "2026-03-25T11:53:49Z", + "outside_window_prs": [ + { + "additions": 15, + "author": "maxwbuckley", + "changed_files": 1, + "created_at": "2024-09-24T20:28:02Z", + "deletions": 7, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/33686/files", + "html_url": "https://github.com/huggingface/transformers/pull/33686", + "merged": false, + "number": 33686, + "state": "open", + "title": "Updating Chameleon Image handling documentation", + "updated_at": "2026-04-07T05:09:42Z" + } + ], + "pairwise": [ + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.139, + "left_pr_number": 33686, + "right_pr_number": 44550, + "shared_directories": [ + "docs/source/en/model_doc", + "docs/source/en", + "docs/source", + "docs" + ], + "shared_filenames": [], + "similarity": 0.397, + "size_similarity": 1.0 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.106, + "left_pr_number": 44407, + "right_pr_number": 44550, + "shared_directories": [ + "docs/source/en", + "docs/source", + "docs" + ], + "shared_filenames": [], + "similarity": 0.367, + "size_similarity": 0.957 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.089, + "left_pr_number": 33686, + "right_pr_number": 44407, + "shared_directories": [ + "docs/source/en", + "docs/source", + "docs" + ], + "shared_filenames": [], + "similarity": 0.356, + "size_similarity": 0.957 + } + ], + "pr_count": 3, + "pr_numbers": [ + 33686, + 44407, + 44550 + ], + "recent_pr_count": 2, + "recent_pr_numbers": [ + 44407, + 44550 + ], + "representative_pr_number": 44550, + "representative_title": "Improve clarity and grammar in Auto Classes documentation", + "representative_url": "https://github.com/huggingface/transformers/pull/44550", + "shared_directories": [ + "docs/source/en", + "docs/source", + "docs", + "docs/source/en/model_doc" + ], + "shared_filenames": [], + "summary": "3 open PRs cluster in `docs/source/en`, `docs/source`, `docs` with similar change breadth; representative PR #44550.", + "title": "Scope: Improve clarity and grammar in Auto Classes documentation" + }, + { + "authors": [ + "mtthw13", + "yashbora9" + ], + "average_similarity": 0.989, + "cluster_id": "pr-scope-44018-2", + "kind": "pr_scope", + "last_activity_at": "2026-02-18T08:30:32Z", + "outside_window_prs": [], + "pairwise": [ + { + "breadth_similarity": 1.0, + "concentration_similarity": 0.999, + "content_similarity": 0.998, + "left_pr_number": 44018, + "right_pr_number": 44068, + "shared_directories": [ + "src/transformers/models/gpt_neo", + "src/transformers/models", + "tests/models/gpt_neo", + "src/transformers", + "tests/models", + "src", + "tests" + ], + "shared_filenames": [ + "src/transformers/models/gpt_neo/modeling_gpt_neo.py", + "tests/models/gpt_neo/test_modeling_gpt_neo.py" + ], + "similarity": 0.989, + "size_similarity": 0.932 + } + ], + "pr_count": 2, + "pr_numbers": [ + 44018, + 44068 + ], + "recent_pr_count": 2, + "recent_pr_numbers": [ + 44018, + 44068 + ], + "representative_pr_number": 44018, + "representative_title": "Refactor GPT-Neo output tracing to use capture_outputs/can_return_tuple", + "representative_url": "https://github.com/huggingface/transformers/pull/44018", + "shared_directories": [ + "src/transformers/models/gpt_neo", + "tests/models/gpt_neo", + "src/transformers/models", + "tests/models", + "tests" + ], + "shared_filenames": [ + "src/transformers/models/gpt_neo/modeling_gpt_neo.py", + "tests/models/gpt_neo/test_modeling_gpt_neo.py" + ], + "summary": "2 open PRs share weighted file overlap around `src/transformers/models/gpt_neo/modeling_gpt_neo.py`, `tests/models/gpt_neo/test_modeling_gpt_neo.py`; representative PR #44018.", + "title": "Scope: Refactor GPT-Neo output tracing to use capture_outputs/can_return_tuple" + }, + { + "authors": [ + "Qubitium", + "remi-or" + ], + "average_similarity": 0.648, + "cluster_id": "pr-scope-45274-2", + "kind": "pr_scope", + "last_activity_at": "2026-04-15T01:41:00Z", + "outside_window_prs": [], + "pairwise": [ + { + "breadth_similarity": 0.607, + "concentration_similarity": 0.781, + "content_similarity": 0.63, + "left_pr_number": 45274, + "right_pr_number": 45323, + "shared_directories": [ + "src/transformers/generation/continuous_batching", + "src/transformers/generation", + "src/transformers", + "tests/generation", + "src", + "tests" + ], + "shared_filenames": [ + "src/transformers/generation/continuous_batching/continuous_api.py", + "src/transformers/generation/continuous_batching/input_outputs.py", + "src/transformers/generation/continuous_batching/utils.py", + "tests/generation/test_continuous_batching.py" + ], + "similarity": 0.648, + "size_similarity": 0.713 + } + ], + "pr_count": 2, + "pr_numbers": [ + 45274, + 45323 + ], + "recent_pr_count": 2, + "recent_pr_numbers": [ + 45274, + 45323 + ], + "representative_pr_number": 45274, + "representative_title": "Fix CB Accuracy Regression under FA2", + "representative_url": "https://github.com/huggingface/transformers/pull/45274", + "shared_directories": [ + "src/transformers/generation/continuous_batching", + "src/transformers/generation", + "tests/generation", + "tests" + ], + "shared_filenames": [ + "src/transformers/generation/continuous_batching/continuous_api.py", + "src/transformers/generation/continuous_batching/input_outputs.py", + "src/transformers/generation/continuous_batching/utils.py", + "tests/generation/test_continuous_batching.py" + ], + "summary": "2 open PRs share weighted file overlap around `src/transformers/generation/continuous_batching/continuous_api.py`, `src/transformers/generation/continuous_batching/input_outputs.py`, `src/transformers/generation/continuous_batching/utils.py`; representative PR #45274.", + "title": "Scope: Fix CB Accuracy Regression under FA2" + }, + { + "authors": [ + "aman-coder03", + "dtiourine" + ], + "average_similarity": 0.55, + "cluster_id": "pr-scope-44101-2", + "kind": "pr_scope", + "last_activity_at": "2026-02-19T08:08:33Z", + "outside_window_prs": [], + "pairwise": [ + { + "breadth_similarity": 0.5, + "concentration_similarity": 0.507, + "content_similarity": 0.61, + "left_pr_number": 44101, + "right_pr_number": 44116, + "shared_directories": [ + "src/transformers/models/flaubert", + "src/transformers/models", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/models/flaubert/modeling_flaubert.py" + ], + "similarity": 0.55, + "size_similarity": 0.319 + } + ], + "pr_count": 2, + "pr_numbers": [ + 44101, + 44116 + ], + "recent_pr_count": 2, + "recent_pr_numbers": [ + 44101, + 44116 + ], + "representative_pr_number": 44101, + "representative_title": "[XLM] Refactor output tracing to align with capture_outputs standardized architecture", + "representative_url": "https://github.com/huggingface/transformers/pull/44101", + "shared_directories": [ + "src/transformers/models/flaubert", + "src/transformers/models" + ], + "shared_filenames": [ + "src/transformers/models/flaubert/modeling_flaubert.py" + ], + "summary": "2 open PRs share weighted file overlap around `src/transformers/models/flaubert/modeling_flaubert.py`; representative PR #44101.", + "title": "Scope: [XLM] Refactor output tracing to align with capture_outputs standardized architecture" + }, + { + "authors": [ + "ArthurZucker", + "FaizanImran-blip" + ], + "average_similarity": 0.505, + "cluster_id": "pr-scope-45056-2", + "kind": "pr_scope", + "last_activity_at": "2026-03-31T10:44:40Z", + "outside_window_prs": [], + "pairwise": [ + { + "breadth_similarity": 0.875, + "concentration_similarity": 0.724, + "content_similarity": 0.401, + "left_pr_number": 45056, + "right_pr_number": 45128, + "shared_directories": [ + "src/transformers/utils", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/utils/auto_docstring.py" + ], + "similarity": 0.505, + "size_similarity": 0.669 + } + ], + "pr_count": 2, + "pr_numbers": [ + 45056, + 45128 + ], + "recent_pr_count": 2, + "recent_pr_numbers": [ + 45056, + 45128 + ], + "representative_pr_number": 45056, + "representative_title": "[`auto_docstring`] needs to be only run on __doc__ ", + "representative_url": "https://github.com/huggingface/transformers/pull/45056", + "shared_directories": [ + "src/transformers/utils" + ], + "shared_filenames": [ + "src/transformers/utils/auto_docstring.py" + ], + "summary": "2 open PRs share weighted file overlap around `src/transformers/utils/auto_docstring.py`; representative PR #45056.", + "title": "Scope: [`auto_docstring`] needs to be only run on __doc__ " + }, + { + "authors": [ + "qgallouedec", + "umbilnm" + ], + "average_similarity": 0.501, + "cluster_id": "pr-scope-44543-2", + "kind": "pr_scope", + "last_activity_at": "2026-04-14T16:08:31Z", + "outside_window_prs": [], + "pairwise": [ + { + "breadth_similarity": 0.75, + "concentration_similarity": 0.802, + "content_similarity": 0.48, + "left_pr_number": 44543, + "right_pr_number": 45422, + "shared_directories": [ + "src/transformers", + "src", + "tests" + ], + "shared_filenames": [ + "src/transformers/processing_utils.py", + "tests/test_processing_common.py" + ], + "similarity": 0.501, + "size_similarity": 0.331 + } + ], + "pr_count": 2, + "pr_numbers": [ + 44543, + 45422 + ], + "recent_pr_count": 2, + "recent_pr_numbers": [ + 44543, + 45422 + ], + "representative_pr_number": 44543, + "representative_title": "Fix assistant_masks for multimodal inputs in apply_chat_template", + "representative_url": "https://github.com/huggingface/transformers/pull/44543", + "shared_directories": [ + "tests" + ], + "shared_filenames": [ + "tests/test_processing_common.py", + "src/transformers/processing_utils.py" + ], + "summary": "2 open PRs share weighted file overlap around `tests/test_processing_common.py`, `src/transformers/processing_utils.py`; representative PR #44543.", + "title": "Scope: Fix assistant_masks for multimodal inputs in apply_chat_template" + }, + { + "authors": [ + "eladsegal" + ], + "average_similarity": 0.495, + "cluster_id": "pr-scope-45332-2", + "kind": "pr_scope", + "last_activity_at": "2026-04-15T04:50:09Z", + "outside_window_prs": [], + "pairwise": [ + { + "breadth_similarity": 0.479, + "concentration_similarity": 0.945, + "content_similarity": 0.526, + "left_pr_number": 45332, + "right_pr_number": 45333, + "shared_directories": [ + "src/transformers/heterogeneity", + "src/transformers", + "tests/heterogeneity", + "src", + "tests" + ], + "shared_filenames": [ + "src/transformers/configuration_utils.py", + "src/transformers/heterogeneity/__init__.py", + "src/transformers/heterogeneity/configuration_utils.py", + "tests/heterogeneity/__init__.py", + "tests/heterogeneity/test_configuration_utils.py" + ], + "similarity": 0.495, + "size_similarity": 0.215 + } + ], + "pr_count": 2, + "pr_numbers": [ + 45332, + 45333 + ], + "recent_pr_count": 2, + "recent_pr_numbers": [ + 45332, + 45333 + ], + "representative_pr_number": 45332, + "representative_title": "Add heterogeneous model support (per-layer config and modeling)", + "representative_url": "https://github.com/huggingface/transformers/pull/45332", + "shared_directories": [ + "src/transformers/heterogeneity", + "tests/heterogeneity", + "tests" + ], + "shared_filenames": [ + "src/transformers/heterogeneity/__init__.py", + "src/transformers/heterogeneity/configuration_utils.py", + "tests/heterogeneity/__init__.py", + "tests/heterogeneity/test_configuration_utils.py", + "src/transformers/configuration_utils.py" + ], + "summary": "2 open PRs share weighted file overlap around `src/transformers/heterogeneity/__init__.py`, `src/transformers/heterogeneity/configuration_utils.py`, `tests/heterogeneity/__init__.py`; representative PR #45332.", + "title": "Scope: Add heterogeneous model support (per-layer config and modeling)" + }, + { + "authors": [ + "MaybeSam05", + "NielsRogge" + ], + "average_similarity": 0.411, + "cluster_id": "pr-scope-44385-2", + "kind": "pr_scope", + "last_activity_at": "2026-03-12T10:33:43Z", + "outside_window_prs": [], + "pairwise": [ + { + "breadth_similarity": 0.667, + "concentration_similarity": 1.0, + "content_similarity": 0.341, + "left_pr_number": 44385, + "right_pr_number": 44615, + "shared_directories": [ + "src/transformers/utils", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/utils/import_utils.py" + ], + "similarity": 0.411, + "size_similarity": 0.371 + } + ], + "pr_count": 2, + "pr_numbers": [ + 44385, + 44615 + ], + "recent_pr_count": 2, + "recent_pr_numbers": [ + 44385, + 44615 + ], + "representative_pr_number": 44385, + "representative_title": "Fix make check-repo", + "representative_url": "https://github.com/huggingface/transformers/pull/44385", + "shared_directories": [ + "src/transformers/utils" + ], + "shared_filenames": [ + "src/transformers/utils/import_utils.py" + ], + "summary": "2 open PRs share weighted file overlap around `src/transformers/utils/import_utils.py`; representative PR #44385.", + "title": "Scope: Fix make check-repo" + }, + { + "authors": [ + "AmineDiro", + "sywangyi" + ], + "average_similarity": 0.409, + "cluster_id": "pr-scope-45279-2", + "kind": "pr_scope", + "last_activity_at": "2026-04-15T14:57:41Z", + "outside_window_prs": [], + "pairwise": [ + { + "breadth_similarity": 0.667, + "concentration_similarity": 0.911, + "content_similarity": 0.319, + "left_pr_number": 45279, + "right_pr_number": 45436, + "shared_directories": [ + "src/transformers/integrations", + "src/transformers/models", + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/integrations/tensor_parallel.py" + ], + "similarity": 0.409, + "size_similarity": 0.49 + } + ], + "pr_count": 2, + "pr_numbers": [ + 45279, + 45436 + ], + "recent_pr_count": 2, + "recent_pr_numbers": [ + 45279, + 45436 + ], + "representative_pr_number": 45279, + "representative_title": "add expert parallelism for gemma-4-26B-A4B-it", + "representative_url": "https://github.com/huggingface/transformers/pull/45279", + "shared_directories": [ + "src/transformers/integrations", + "src/transformers/models" + ], + "shared_filenames": [ + "src/transformers/integrations/tensor_parallel.py" + ], + "summary": "2 open PRs share weighted file overlap around `src/transformers/integrations/tensor_parallel.py`; representative PR #45279.", + "title": "Scope: add expert parallelism for gemma-4-26B-A4B-it" + }, + { + "authors": [ + "itazap", + "knQzx" + ], + "average_similarity": 0.402, + "cluster_id": "pr-scope-44606-2", + "kind": "pr_scope", + "last_activity_at": "2026-03-28T16:37:49Z", + "outside_window_prs": [], + "pairwise": [ + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.312, + "left_pr_number": 44606, + "right_pr_number": 45086, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/tokenization_utils_tokenizers.py" + ], + "similarity": 0.402, + "size_similarity": 0.222 + } + ], + "pr_count": 2, + "pr_numbers": [ + 44606, + 45086 + ], + "recent_pr_count": 2, + "recent_pr_numbers": [ + 44606, + 45086 + ], + "representative_pr_number": 44606, + "representative_title": "optionally override tokenizer class with serialized tokenizer ", + "representative_url": "https://github.com/huggingface/transformers/pull/44606", + "shared_directories": [], + "shared_filenames": [ + "src/transformers/tokenization_utils_tokenizers.py" + ], + "summary": "2 open PRs share weighted file overlap around `src/transformers/tokenization_utils_tokenizers.py`; representative PR #44606.", + "title": "Scope: optionally override tokenizer class with serialized tokenizer " + }, + { + "authors": [ + "SunMarc", + "qgallouedec" + ], + "average_similarity": 0.391, + "cluster_id": "pr-scope-45443-2", + "kind": "pr_scope", + "last_activity_at": "2026-04-15T20:42:24Z", + "outside_window_prs": [], + "pairwise": [ + { + "breadth_similarity": 0.533, + "concentration_similarity": 0.637, + "content_similarity": 0.41, + "left_pr_number": 45443, + "right_pr_number": 45463, + "shared_directories": [ + "src/transformers/cli/serving", + "src/transformers/cli", + "src/transformers", + "tests/cli", + "src", + "tests" + ], + "shared_filenames": [ + "src/transformers/cli/serving/utils.py", + "tests/cli/test_serve.py" + ], + "similarity": 0.391, + "size_similarity": 0.122 + } + ], + "pr_count": 2, + "pr_numbers": [ + 45443, + 45463 + ], + "recent_pr_count": 2, + "recent_pr_numbers": [ + 45443, + 45463 + ], + "representative_pr_number": 45443, + "representative_title": "Raise 400 on model mismatch when `transformers serve` is pinned", + "representative_url": "https://github.com/huggingface/transformers/pull/45443", + "shared_directories": [ + "src/transformers/cli/serving", + "src/transformers/cli", + "tests/cli", + "tests" + ], + "shared_filenames": [ + "src/transformers/cli/serving/utils.py", + "tests/cli/test_serve.py" + ], + "summary": "2 open PRs share weighted file overlap around `src/transformers/cli/serving/utils.py`, `tests/cli/test_serve.py`; representative PR #45443.", + "title": "Scope: Raise 400 on model mismatch when `transformers serve` is pinned" + }, + { + "authors": [ + "dagecko" + ], + "average_similarity": 0.529, + "cluster_id": "pr-scope-42975-3", + "kind": "pr_scope", + "last_activity_at": "2026-03-27T22:20:56Z", + "outside_window_prs": [ + { + "additions": 228, + "author": "salmanmkc", + "changed_files": 33, + "created_at": "2025-12-20T23:37:58Z", + "deletions": 228, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/42975/files", + "html_url": "https://github.com/huggingface/transformers/pull/42975", + "merged": false, + "number": 42975, + "state": "open", + "title": "Upgrade GitHub Actions for Node 24 compatibility", + "updated_at": "2026-01-25T00:07:56Z" + }, + { + "additions": 23, + "author": "salmanmkc", + "changed_files": 7, + "created_at": "2025-12-20T23:38:07Z", + "deletions": 23, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/42976/files", + "html_url": "https://github.com/huggingface/transformers/pull/42976", + "merged": false, + "number": 42976, + "state": "open", + "title": "Upgrade GitHub Actions to latest versions", + "updated_at": "2026-01-25T00:07:18Z" + } + ], + "pairwise": [ + { + "breadth_similarity": 0.833, + "concentration_similarity": 1.0, + "content_similarity": 0.626, + "left_pr_number": 42975, + "right_pr_number": 45077, + "shared_directories": [ + ".github/workflows", + ".github" + ], + "shared_filenames": [ + ".github/workflows/benchmark.yml", + ".github/workflows/build-ci-docker-images.yml", + ".github/workflows/build-docker-images.yml", + ".github/workflows/build-nightly-ci-docker-images.yml", + ".github/workflows/build-past-ci-docker-images.yml", + ".github/workflows/check_tiny_models.yml", + ".github/workflows/model_jobs.yml", + ".github/workflows/release-conda.yml", + ".github/workflows/release.yml", + ".github/workflows/trufflehog.yml" + ], + "similarity": 0.681, + "size_similarity": 0.731 + }, + { + "breadth_similarity": 0.659, + "concentration_similarity": 1.0, + "content_similarity": 0.522, + "left_pr_number": 42976, + "right_pr_number": 45077, + "shared_directories": [ + ".github/workflows", + ".github" + ], + "shared_filenames": [ + ".github/workflows/build-ci-docker-images.yml", + ".github/workflows/build-docker-images.yml", + ".github/workflows/build-nightly-ci-docker-images.yml", + ".github/workflows/build-past-ci-docker-images.yml", + ".github/workflows/release-conda.yml" + ], + "similarity": 0.492, + "size_similarity": 0.074 + }, + { + "breadth_similarity": 0.606, + "concentration_similarity": 1.0, + "content_similarity": 0.412, + "left_pr_number": 42975, + "right_pr_number": 42976, + "shared_directories": [ + ".github/workflows", + ".github" + ], + "shared_filenames": [ + ".github/workflows/build-ci-docker-images.yml", + ".github/workflows/build-docker-images.yml", + ".github/workflows/build-nightly-ci-docker-images.yml", + ".github/workflows/build-past-ci-docker-images.yml", + ".github/workflows/check_failed_tests.yml", + ".github/workflows/new_model_pr_merged_notification.yml", + ".github/workflows/release-conda.yml" + ], + "similarity": 0.414, + "size_similarity": 0.101 + } + ], + "pr_count": 3, + "pr_numbers": [ + 42975, + 42976, + 45077 + ], + "recent_pr_count": 1, + "recent_pr_numbers": [ + 45077 + ], + "representative_pr_number": 45077, + "representative_title": "fix: pin 50 unpinned actions to commit SHA, extract 1 secret to env var", + "representative_url": "https://github.com/huggingface/transformers/pull/45077", + "shared_directories": [ + ".github/workflows", + ".github" + ], + "shared_filenames": [ + ".github/workflows/build-ci-docker-images.yml", + ".github/workflows/build-docker-images.yml", + ".github/workflows/build-nightly-ci-docker-images.yml", + ".github/workflows/build-past-ci-docker-images.yml", + ".github/workflows/release-conda.yml", + ".github/workflows/benchmark.yml", + ".github/workflows/check_failed_tests.yml", + ".github/workflows/check_tiny_models.yml" + ], + "summary": "3 open PRs share weighted file overlap around `.github/workflows/build-ci-docker-images.yml`, `.github/workflows/build-docker-images.yml`, `.github/workflows/build-nightly-ci-docker-images.yml`; representative PR #45077.", + "title": "Scope: fix: pin 50 unpinned actions to commit SHA, extract 1 secret to env var" + }, + { + "authors": [ + "mvanhorn" + ], + "average_similarity": 0.467, + "cluster_id": "pr-scope-41097-3", + "kind": "pr_scope", + "last_activity_at": "2026-03-09T16:08:29Z", + "outside_window_prs": [ + { + "additions": 11, + "author": "cyyever", + "changed_files": 1, + "created_at": "2025-09-23T10:51:04Z", + "deletions": 14, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/41097/files", + "html_url": "https://github.com/huggingface/transformers/pull/41097", + "merged": false, + "number": 41097, + "state": "open", + "title": "Delay and probably avoid unnecessary graph breaks in _upad_input of modeling_flash_attention_utils.py", + "updated_at": "2026-02-11T12:31:59Z" + }, + { + "additions": 15, + "author": "MekkCyber", + "changed_files": 1, + "created_at": "2026-01-28T10:41:55Z", + "deletions": 0, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/43549/files", + "html_url": "https://github.com/huggingface/transformers/pull/43549", + "merged": false, + "number": 43549, + "state": "open", + "title": "[kernels] exception handling for fa kernels", + "updated_at": "2026-01-28T14:52:46Z" + } + ], + "pairwise": [ + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.446, + "left_pr_number": 41097, + "right_pr_number": 43549, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/modeling_flash_attention_utils.py" + ], + "similarity": 0.552, + "size_similarity": 0.6 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.358, + "left_pr_number": 43549, + "right_pr_number": 44547, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/modeling_flash_attention_utils.py" + ], + "similarity": 0.441, + "size_similarity": 0.267 + }, + { + "breadth_similarity": 1.0, + "concentration_similarity": 1.0, + "content_similarity": 0.334, + "left_pr_number": 41097, + "right_pr_number": 44547, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/modeling_flash_attention_utils.py" + ], + "similarity": 0.408, + "size_similarity": 0.16 + } + ], + "pr_count": 3, + "pr_numbers": [ + 41097, + 43549, + 44547 + ], + "recent_pr_count": 1, + "recent_pr_numbers": [ + 44547 + ], + "representative_pr_number": 43549, + "representative_title": "[kernels] exception handling for fa kernels", + "representative_url": "https://github.com/huggingface/transformers/pull/43549", + "shared_directories": [], + "shared_filenames": [ + "src/transformers/modeling_flash_attention_utils.py" + ], + "summary": "3 open PRs share weighted file overlap around `src/transformers/modeling_flash_attention_utils.py`; representative PR #43549.", + "title": "Scope: [kernels] exception handling for fa kernels" + }, + { + "authors": [ + "zucchini-nlp" + ], + "average_similarity": 0.925, + "cluster_id": "pr-scope-40962-2", + "kind": "pr_scope", + "last_activity_at": "2026-04-02T12:55:56Z", + "outside_window_prs": [ + { + "additions": 5927, + "author": "AkshatSh", + "changed_files": 21, + "created_at": "2025-09-18T07:05:39Z", + "deletions": 2, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/40962/files", + "html_url": "https://github.com/huggingface/transformers/pull/40962", + "merged": false, + "number": 40962, + "state": "open", + "title": "perceptron: Isaac-0.1 implementation", + "updated_at": "2026-04-14T14:58:41Z" + } + ], + "pairwise": [ + { + "breadth_similarity": 1.0, + "concentration_similarity": 0.832, + "content_similarity": 0.943, + "left_pr_number": 40962, + "right_pr_number": 45186, + "shared_directories": [ + "docs/source/en/model_doc", + "src/transformers/models/auto", + "src/transformers/models/isaac", + "docs/source/en", + "src/transformers/models", + "tests/models/isaac", + "docs/source", + "src/transformers", + "tests/models", + "tests/utils" + ], + "shared_filenames": [ + "docs/source/en/_toctree.yml", + "docs/source/en/model_doc/isaac.md", + "src/transformers/conversion_mapping.py", + "src/transformers/modeling_utils.py", + "src/transformers/models/__init__.py", + "src/transformers/models/auto/configuration_auto.py", + "src/transformers/models/auto/image_processing_auto.py", + "src/transformers/models/auto/modeling_auto.py", + "src/transformers/models/auto/processing_auto.py", + "src/transformers/models/isaac/__init__.py" + ], + "similarity": 0.925, + "size_similarity": 0.818 + } + ], + "pr_count": 2, + "pr_numbers": [ + 40962, + 45186 + ], + "recent_pr_count": 1, + "recent_pr_numbers": [ + 45186 + ], + "representative_pr_number": 40962, + "representative_title": "perceptron: Isaac-0.1 implementation", + "representative_url": "https://github.com/huggingface/transformers/pull/40962", + "shared_directories": [ + "src/transformers/models/isaac", + "docs/source/en/model_doc", + "src/transformers/models/auto", + "tests/models/isaac", + "docs/source/en", + "src/transformers/models", + "tests/utils", + "docs/source" + ], + "shared_filenames": [ + "docs/source/en/model_doc/isaac.md", + "src/transformers/models/isaac/__init__.py", + "src/transformers/models/isaac/configuration_isaac.py", + "src/transformers/models/isaac/image_processing_isaac.py", + "src/transformers/models/isaac/modeling_isaac.py", + "src/transformers/models/isaac/modular_isaac.py", + "src/transformers/models/isaac/processing_isaac.py", + "tests/models/isaac/__init__.py" + ], + "summary": "2 open PRs share weighted file overlap around `docs/source/en/model_doc/isaac.md`, `src/transformers/models/isaac/__init__.py`, `src/transformers/models/isaac/configuration_isaac.py`; representative PR #40962.", + "title": "Scope: perceptron: Isaac-0.1 implementation" + }, + { + "authors": [ + "NielsRogge" + ], + "average_similarity": 0.761, + "cluster_id": "pr-scope-36895-2", + "kind": "pr_scope", + "last_activity_at": "2026-03-05T16:00:53Z", + "outside_window_prs": [ + { + "additions": 5464, + "author": "sbucaille", + "changed_files": 22, + "created_at": "2025-03-21T22:28:16Z", + "deletions": 46, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/36895/files", + "html_url": "https://github.com/huggingface/transformers/pull/36895", + "merged": false, + "number": 36895, + "state": "open", + "title": "Add RF-DETR", + "updated_at": "2026-04-13T23:57:11Z" + } + ], + "pairwise": [ + { + "breadth_similarity": 0.886, + "concentration_similarity": 0.93, + "content_similarity": 0.721, + "left_pr_number": 36895, + "right_pr_number": 44375, + "shared_directories": [ + "docs/source/en/model_doc", + "src/transformers/models/auto", + "src/transformers/models/rf_detr", + "docs/source/en", + "src/transformers/loss", + "src/transformers/models", + "tests/models/rf_detr", + "docs/source", + "src/transformers", + "tests/models" + ], + "shared_filenames": [ + "docs/source/en/_toctree.yml", + "docs/source/en/model_doc/rf_detr.md", + "src/transformers/loss/loss_lw_detr.py", + "src/transformers/loss/loss_utils.py", + "src/transformers/models/__init__.py", + "src/transformers/models/auto/configuration_auto.py", + "src/transformers/models/auto/image_processing_auto.py", + "src/transformers/models/auto/modeling_auto.py", + "src/transformers/models/rf_detr/__init__.py", + "src/transformers/models/rf_detr/configuration_rf_detr.py" + ], + "similarity": 0.761, + "size_similarity": 0.806 + } + ], + "pr_count": 2, + "pr_numbers": [ + 36895, + 44375 + ], + "recent_pr_count": 1, + "recent_pr_numbers": [ + 44375 + ], + "representative_pr_number": 36895, + "representative_title": "Add RF-DETR", + "representative_url": "https://github.com/huggingface/transformers/pull/36895", + "shared_directories": [ + "src/transformers/models/rf_detr", + "docs/source/en/model_doc", + "src/transformers/models/auto", + "tests/models/rf_detr", + "src/transformers/loss", + "docs/source/en", + "src/transformers/models", + "docs/source" + ], + "shared_filenames": [ + "docs/source/en/model_doc/rf_detr.md", + "src/transformers/loss/loss_lw_detr.py", + "src/transformers/models/rf_detr/__init__.py", + "src/transformers/models/rf_detr/configuration_rf_detr.py", + "src/transformers/models/rf_detr/modeling_rf_detr.py", + "src/transformers/models/rf_detr/modular_rf_detr.py", + "tests/models/rf_detr/__init__.py", + "tests/models/rf_detr/test_modeling_rf_detr.py" + ], + "summary": "2 open PRs share weighted file overlap around `docs/source/en/model_doc/rf_detr.md`, `src/transformers/loss/loss_lw_detr.py`, `src/transformers/models/rf_detr/__init__.py`; representative PR #36895.", + "title": "Scope: Add RF-DETR" + }, + { + "authors": [ + "casinca" + ], + "average_similarity": 0.68, + "cluster_id": "pr-scope-43020-2", + "kind": "pr_scope", + "last_activity_at": "2026-04-15T18:35:49Z", + "outside_window_prs": [ + { + "additions": 1172, + "author": "Aznix07", + "changed_files": 9, + "created_at": "2025-12-23T13:02:30Z", + "deletions": 0, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/43020/files", + "html_url": "https://github.com/huggingface/transformers/pull/43020", + "merged": false, + "number": 43020, + "state": "open", + "title": "Add mimo v2 flash", + "updated_at": "2026-03-03T09:16:22Z" + } + ], + "pairwise": [ + { + "breadth_similarity": 0.661, + "concentration_similarity": 0.9, + "content_similarity": 0.696, + "left_pr_number": 43020, + "right_pr_number": 45144, + "shared_directories": [ + "src/transformers/models/auto", + "src/transformers/models/mimo_v2_flash", + "src/transformers/models", + "tests/models/mimo_v2_flash", + "src/transformers", + "tests/models", + "src", + "tests" + ], + "shared_filenames": [ + "src/transformers/models/__init__.py", + "src/transformers/models/auto/configuration_auto.py", + "src/transformers/models/auto/modeling_auto.py", + "src/transformers/models/mimo_v2_flash/__init__.py", + "src/transformers/models/mimo_v2_flash/configuration_mimo_v2_flash.py", + "src/transformers/models/mimo_v2_flash/modular_mimo_v2_flash.py", + "tests/models/mimo_v2_flash/__init__.py", + "tests/models/mimo_v2_flash/test_modeling_mimo_v2_flash.py" + ], + "similarity": 0.68, + "size_similarity": 0.545 + } + ], + "pr_count": 2, + "pr_numbers": [ + 43020, + 45144 + ], + "recent_pr_count": 1, + "recent_pr_numbers": [ + 45144 + ], + "representative_pr_number": 43020, + "representative_title": "Add mimo v2 flash", + "representative_url": "https://github.com/huggingface/transformers/pull/43020", + "shared_directories": [ + "src/transformers/models/mimo_v2_flash", + "src/transformers/models/auto", + "tests/models/mimo_v2_flash", + "src/transformers/models", + "tests/models", + "tests" + ], + "shared_filenames": [ + "src/transformers/models/mimo_v2_flash/__init__.py", + "src/transformers/models/mimo_v2_flash/configuration_mimo_v2_flash.py", + "src/transformers/models/mimo_v2_flash/modular_mimo_v2_flash.py", + "tests/models/mimo_v2_flash/__init__.py", + "tests/models/mimo_v2_flash/test_modeling_mimo_v2_flash.py", + "src/transformers/models/__init__.py", + "src/transformers/models/auto/configuration_auto.py", + "src/transformers/models/auto/modeling_auto.py" + ], + "summary": "2 open PRs share weighted file overlap around `src/transformers/models/mimo_v2_flash/__init__.py`, `src/transformers/models/mimo_v2_flash/configuration_mimo_v2_flash.py`, `src/transformers/models/mimo_v2_flash/modular_mimo_v2_flash.py`; representative PR #43020.", + "title": "Scope: Add mimo v2 flash" + }, + { + "authors": [ + "GitGlimpse895" + ], + "average_similarity": 0.543, + "cluster_id": "pr-scope-43085-2", + "kind": "pr_scope", + "last_activity_at": "2026-04-14T03:23:23Z", + "outside_window_prs": [ + { + "additions": 519, + "author": "AmitMY", + "changed_files": 5, + "created_at": "2026-01-03T09:42:33Z", + "deletions": 2, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/43085/files", + "html_url": "https://github.com/huggingface/transformers/pull/43085", + "merged": false, + "number": 43085, + "state": "open", + "title": "Add async_stopping_criteria flag to reduce GPU-CPU syncs during generation", + "updated_at": "2026-02-09T17:16:29Z" + } + ], + "pairwise": [ + { + "breadth_similarity": 0.7, + "concentration_similarity": 0.608, + "content_similarity": 0.621, + "left_pr_number": 43085, + "right_pr_number": 45384, + "shared_directories": [ + "src/transformers/generation", + "src/transformers", + "tests/generation", + "src", + "tests" + ], + "shared_filenames": [ + "src/transformers/generation/stopping_criteria.py", + "tests/generation/test_stopping_criteria.py" + ], + "similarity": 0.543, + "size_similarity": 0.048 + } + ], + "pr_count": 2, + "pr_numbers": [ + 43085, + 45384 + ], + "recent_pr_count": 1, + "recent_pr_numbers": [ + 45384 + ], + "representative_pr_number": 43085, + "representative_title": "Add async_stopping_criteria flag to reduce GPU-CPU syncs during generation", + "representative_url": "https://github.com/huggingface/transformers/pull/43085", + "shared_directories": [ + "src/transformers/generation", + "tests/generation", + "tests" + ], + "shared_filenames": [ + "src/transformers/generation/stopping_criteria.py", + "tests/generation/test_stopping_criteria.py" + ], + "summary": "2 open PRs share weighted file overlap around `src/transformers/generation/stopping_criteria.py`, `tests/generation/test_stopping_criteria.py`; representative PR #43085.", + "title": "Scope: Add async_stopping_criteria flag to reduce GPU-CPU syncs during generation" + }, + { + "authors": [ + "songyuc" + ], + "average_similarity": 0.469, + "cluster_id": "pr-scope-43665-2", + "kind": "pr_scope", + "last_activity_at": "2026-04-12T15:05:10Z", + "outside_window_prs": [ + { + "additions": 9, + "author": "ydshieh2", + "changed_files": 2, + "created_at": "2026-01-31T21:50:43Z", + "deletions": 0, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/43665/files", + "html_url": "https://github.com/huggingface/transformers/pull/43665", + "merged": false, + "number": 43665, + "state": "open", + "title": "fix", + "updated_at": "2026-03-24T14:42:35Z" + } + ], + "pairwise": [ + { + "breadth_similarity": 1.0, + "concentration_similarity": 0.822, + "content_similarity": 0.34, + "left_pr_number": 43665, + "right_pr_number": 45385, + "shared_directories": [ + "tests/models/clip", + "tests/models", + "tests" + ], + "shared_filenames": [ + "tests/models/clip/test_modeling_clip.py" + ], + "similarity": 0.469, + "size_similarity": 0.6 + } + ], + "pr_count": 2, + "pr_numbers": [ + 43665, + 45385 + ], + "recent_pr_count": 1, + "recent_pr_numbers": [ + 45385 + ], + "representative_pr_number": 43665, + "representative_title": "fix", + "representative_url": "https://github.com/huggingface/transformers/pull/43665", + "shared_directories": [ + "tests/models/clip", + "tests/models", + "tests" + ], + "shared_filenames": [ + "tests/models/clip/test_modeling_clip.py" + ], + "summary": "2 open PRs share weighted file overlap around `tests/models/clip/test_modeling_clip.py`; representative PR #43665.", + "title": "Scope: fix" + }, + { + "authors": [ + "harshaljanjani" + ], + "average_similarity": 0.46, + "cluster_id": "pr-scope-41356-2", + "kind": "pr_scope", + "last_activity_at": "2026-04-15T17:06:41Z", + "outside_window_prs": [ + { + "additions": 512, + "author": "Vinayaktoor", + "changed_files": 10, + "created_at": "2025-10-05T21:35:01Z", + "deletions": 0, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/41356/files", + "html_url": "https://github.com/huggingface/transformers/pull/41356", + "merged": false, + "number": 41356, + "state": "open", + "title": "Add DEIMv2 model, image processor, and basic tests", + "updated_at": "2026-02-09T17:25:26Z" + } + ], + "pairwise": [ + { + "breadth_similarity": 0.5, + "concentration_similarity": 0.96, + "content_similarity": 0.499, + "left_pr_number": 41356, + "right_pr_number": 44339, + "shared_directories": [ + "docs/source/en/model_doc", + "src/transformers/models/deimv2", + "docs/source/en", + "src/transformers/models", + "tests/models/deimv2", + "docs/source", + "src/transformers", + "tests/models", + "docs", + "src" + ], + "shared_filenames": [ + "docs/source/en/model_doc/deimv2.md", + "src/transformers/models/deimv2/__init__.py", + "src/transformers/models/deimv2/configuration_deimv2.py", + "src/transformers/models/deimv2/modeling_deimv2.py", + "tests/models/deimv2/__init__.py", + "tests/models/deimv2/test_modeling_deimv2.py" + ], + "similarity": 0.46, + "size_similarity": 0.082 + } + ], + "pr_count": 2, + "pr_numbers": [ + 41356, + 44339 + ], + "recent_pr_count": 1, + "recent_pr_numbers": [ + 44339 + ], + "representative_pr_number": 41356, + "representative_title": "Add DEIMv2 model, image processor, and basic tests", + "representative_url": "https://github.com/huggingface/transformers/pull/41356", + "shared_directories": [ + "src/transformers/models/deimv2", + "docs/source/en/model_doc", + "tests/models/deimv2", + "docs/source/en", + "src/transformers/models", + "docs/source", + "tests/models", + "docs" + ], + "shared_filenames": [ + "docs/source/en/model_doc/deimv2.md", + "src/transformers/models/deimv2/__init__.py", + "src/transformers/models/deimv2/configuration_deimv2.py", + "src/transformers/models/deimv2/modeling_deimv2.py", + "tests/models/deimv2/__init__.py", + "tests/models/deimv2/test_modeling_deimv2.py" + ], + "summary": "2 open PRs share weighted file overlap around `docs/source/en/model_doc/deimv2.md`, `src/transformers/models/deimv2/__init__.py`, `src/transformers/models/deimv2/configuration_deimv2.py`; representative PR #41356.", + "title": "Scope: Add DEIMv2 model, image processor, and basic tests" + }, + { + "authors": [ + "ezylopx5" + ], + "average_similarity": 0.432, + "cluster_id": "pr-scope-42112-2", + "kind": "pr_scope", + "last_activity_at": "2026-04-15T13:36:39Z", + "outside_window_prs": [ + { + "additions": 721, + "author": "AndresAlgaba", + "changed_files": 8, + "created_at": "2025-11-09T10:17:17Z", + "deletions": 6, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/42112/files", + "html_url": "https://github.com/huggingface/transformers/pull/42112", + "merged": false, + "number": 42112, + "state": "open", + "title": "Add max_thinking_tokens for reasoning models (issue #42111)", + "updated_at": "2026-02-02T10:51:15Z" + } + ], + "pairwise": [ + { + "breadth_similarity": 0.458, + "concentration_similarity": 0.969, + "content_similarity": 0.478, + "left_pr_number": 42112, + "right_pr_number": 45413, + "shared_directories": [ + "src/transformers/generation", + "src/transformers", + "tests/generation", + "src", + "tests" + ], + "shared_filenames": [ + "src/transformers/generation/logits_process.py", + "tests/generation/test_logits_process.py" + ], + "similarity": 0.432, + "size_similarity": 0.019 + } + ], + "pr_count": 2, + "pr_numbers": [ + 42112, + 45413 + ], + "recent_pr_count": 1, + "recent_pr_numbers": [ + 45413 + ], + "representative_pr_number": 42112, + "representative_title": "Add max_thinking_tokens for reasoning models (issue #42111)", + "representative_url": "https://github.com/huggingface/transformers/pull/42112", + "shared_directories": [ + "src/transformers/generation", + "tests/generation", + "tests" + ], + "shared_filenames": [ + "src/transformers/generation/logits_process.py", + "tests/generation/test_logits_process.py" + ], + "summary": "2 open PRs share weighted file overlap around `src/transformers/generation/logits_process.py`, `tests/generation/test_logits_process.py`; representative PR #42112.", + "title": "Scope: Add max_thinking_tokens for reasoning models (issue #42111)" + }, + { + "authors": [ + "pdufour" + ], + "average_similarity": 0.416, + "cluster_id": "pr-scope-40755-2", + "kind": "pr_scope", + "last_activity_at": "2026-04-10T23:37:52Z", + "outside_window_prs": [ + { + "additions": 1911, + "author": "kashif", + "changed_files": 5, + "created_at": "2025-09-08T13:05:54Z", + "deletions": 0, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/40755/files", + "html_url": "https://github.com/huggingface/transformers/pull/40755", + "merged": false, + "number": 40755, + "state": "open", + "title": "[TimesFM] Add support for forecasting with covariates", + "updated_at": "2026-03-06T08:29:28Z" + } + ], + "pairwise": [ + { + "breadth_similarity": 1.0, + "concentration_similarity": 0.901, + "content_similarity": 0.342, + "left_pr_number": 40755, + "right_pr_number": 45233, + "shared_directories": [ + "src/transformers/models/timesfm", + "src/transformers/models", + "src/transformers", + "tests/models", + "src", + "tests" + ], + "shared_filenames": [ + "src/transformers/models/timesfm/modeling_timesfm.py", + "src/transformers/models/timesfm/modular_timesfm.py" + ], + "similarity": 0.416, + "size_similarity": 0.211 + } + ], + "pr_count": 2, + "pr_numbers": [ + 40755, + 45233 + ], + "recent_pr_count": 1, + "recent_pr_numbers": [ + 45233 + ], + "representative_pr_number": 40755, + "representative_title": "[TimesFM] Add support for forecasting with covariates", + "representative_url": "https://github.com/huggingface/transformers/pull/40755", + "shared_directories": [ + "src/transformers/models/timesfm", + "src/transformers/models", + "tests/models", + "tests" + ], + "shared_filenames": [ + "src/transformers/models/timesfm/modeling_timesfm.py", + "src/transformers/models/timesfm/modular_timesfm.py" + ], + "summary": "2 open PRs share weighted file overlap around `src/transformers/models/timesfm/modeling_timesfm.py`, `src/transformers/models/timesfm/modular_timesfm.py`; representative PR #40755.", + "title": "Scope: [TimesFM] Add support for forecasting with covariates" + }, + { + "authors": [ + "UsamaKenway" + ], + "average_similarity": 0.388, + "cluster_id": "pr-scope-43757-2", + "kind": "pr_scope", + "last_activity_at": "2026-04-15T11:58:05Z", + "outside_window_prs": [ + { + "additions": 15, + "author": "TheSanjBot", + "changed_files": 2, + "created_at": "2026-02-05T07:56:19Z", + "deletions": 0, + "draft": false, + "files_url": "https://github.com/huggingface/transformers/pull/43757/files", + "html_url": "https://github.com/huggingface/transformers/pull/43757", + "merged": false, + "number": 43757, + "state": "open", + "title": "Avoid hard failure for gpt-oss GGUF architecture by falling back to g\u2026", + "updated_at": "2026-02-05T17:42:11Z" + } + ], + "pairwise": [ + { + "breadth_similarity": 0.75, + "concentration_similarity": 0.533, + "content_similarity": 0.315, + "left_pr_number": 43757, + "right_pr_number": 45386, + "shared_directories": [ + "src/transformers", + "src" + ], + "shared_filenames": [ + "src/transformers/modeling_gguf_pytorch_utils.py" + ], + "similarity": 0.388, + "size_similarity": 0.441 + } + ], + "pr_count": 2, + "pr_numbers": [ + 43757, + 45386 + ], + "recent_pr_count": 1, + "recent_pr_numbers": [ + 45386 + ], + "representative_pr_number": 43757, + "representative_title": "Avoid hard failure for gpt-oss GGUF architecture by falling back to g\u2026", + "representative_url": "https://github.com/huggingface/transformers/pull/43757", + "shared_directories": [], + "shared_filenames": [ + "src/transformers/modeling_gguf_pytorch_utils.py" + ], + "summary": "2 open PRs share weighted file overlap around `src/transformers/modeling_gguf_pytorch_utils.py`; representative PR #43757.", + "title": "Scope: Avoid hard failure for gpt-oss GGUF architecture by falling back to g\u2026" + } +]