[ { "authors": [ "DogWala", "abigailtech", "cyyever", "excepshenal", "winglian" ], "average_similarity": 0.454, "cluster_id": "pr-scope-43636-7", "kind": "pr_scope", "last_activity_at": "2026-03-13T22:28:27Z", "outside_window_prs": [], "pairwise": [ { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.483, "left_pr_number": 43663, "right_pr_number": 44123, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "similarity": 0.592, "size_similarity": 0.694 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.423, "left_pr_number": 43651, "right_pr_number": 43663, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "similarity": 0.554, "size_similarity": 0.72 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.292, "left_pr_number": 44257, "right_pr_number": 44660, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "similarity": 0.504, "size_similarity": 1.0 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.394, "left_pr_number": 43651, "right_pr_number": 44123, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "similarity": 0.501, "size_similarity": 0.5 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.415, "left_pr_number": 43663, "right_pr_number": 44660, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "similarity": 0.476, "size_similarity": 0.24 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.365, "left_pr_number": 43636, "right_pr_number": 43663, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "similarity": 0.471, "size_similarity": 0.44 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.308, "left_pr_number": 44189, "right_pr_number": 44660, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "similarity": 0.466, "size_similarity": 0.667 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.297, "left_pr_number": 43636, "right_pr_number": 43651, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "similarity": 0.45, "size_similarity": 0.611 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.386, "left_pr_number": 44123, "right_pr_number": 44660, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "similarity": 0.445, "size_similarity": 0.167 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.386, "left_pr_number": 43663, "right_pr_number": 44189, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "similarity": 0.444, "size_similarity": 0.16 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.365, "left_pr_number": 43663, "right_pr_number": 44257, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "similarity": 0.442, "size_similarity": 0.24 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.272, "left_pr_number": 44189, "right_pr_number": 44257, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "similarity": 0.44, "size_similarity": 0.667 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.338, "left_pr_number": 43651, "right_pr_number": 44660, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "similarity": 0.437, "size_similarity": 0.333 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.291, "left_pr_number": 43636, "right_pr_number": 44660, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "similarity": 0.436, "size_similarity": 0.545 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.339, "left_pr_number": 43636, "right_pr_number": 44123, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "similarity": 0.433, "size_similarity": 0.306 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.359, "left_pr_number": 44123, "right_pr_number": 44189, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "similarity": 0.418, "size_similarity": 0.111 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.34, "left_pr_number": 44123, "right_pr_number": 44257, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "similarity": 0.413, "size_similarity": 0.167 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.257, "left_pr_number": 43636, "right_pr_number": 44257, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "similarity": 0.411, "size_similarity": 0.545 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.298, "left_pr_number": 43651, "right_pr_number": 44257, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "similarity": 0.408, "size_similarity": 0.333 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.315, "left_pr_number": 43651, "right_pr_number": 44189, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "similarity": 0.404, "size_similarity": 0.222 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.271, "left_pr_number": 43636, "right_pr_number": 44189, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "similarity": 0.394, "size_similarity": 0.364 } ], "pr_count": 7, "pr_numbers": [ 43636, 43651, 43663, 44123, 44189, 44257, 44660 ], "recent_pr_count": 7, "recent_pr_numbers": [ 43636, 43651, 43663, 44123, 44189, 44257, 44660 ], "representative_pr_number": 43663, "representative_title": "Add _get_signature_columns method to allow custom trainers to override column filtering", "representative_url": "https://github.com/huggingface/transformers/pull/43663", "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "summary": "7 open PRs share weighted file overlap around `src/transformers/trainer.py`; representative PR #43663.", "title": "Scope: Add _get_signature_columns method to allow custom trainers to override column filtering" }, { "authors": [ "Mr-Neutr0n", "SunMarc", "jonathan-fulton", "pragnyanramtha", "rain-1", "tarekziade" ], "average_similarity": 0.485, "cluster_id": "pr-scope-43656-6", "kind": "pr_scope", "last_activity_at": "2026-03-23T07:30:41Z", "outside_window_prs": [], "pairwise": [ { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.746, "left_pr_number": 43656, "right_pr_number": 43836, "shared_directories": [ "src/transformers/cli", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/cli/serve.py" ], "similarity": 0.69, "size_similarity": 0.121 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.649, "left_pr_number": 43836, "right_pr_number": 43842, "shared_directories": [ "src/transformers/cli", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/cli/serve.py" ], "similarity": 0.608, "size_similarity": 0.027 }, { "breadth_similarity": 0.5, "concentration_similarity": 0.802, "content_similarity": 0.638, "left_pr_number": 43836, "right_pr_number": 44682, "shared_directories": [ "src/transformers/cli", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/cli/serve.py" ], "similarity": 0.596, "size_similarity": 0.398 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.574, "left_pr_number": 43656, "right_pr_number": 43842, "shared_directories": [ "src/transformers/cli", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/cli/serve.py" ], "similarity": 0.585, "size_similarity": 0.222 }, { "breadth_similarity": 0.35, "concentration_similarity": 0.994, "content_similarity": 0.525, "left_pr_number": 44566, "right_pr_number": 44682, "shared_directories": [ "src/transformers/cli", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/cli/serve.py" ], "similarity": 0.568, "size_similarity": 0.773 }, { "breadth_similarity": 0.667, "concentration_similarity": 0.752, "content_similarity": 0.384, "left_pr_number": 44558, "right_pr_number": 44682, "shared_directories": [ "src/transformers/cli", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/cli/serve.py" ], "similarity": 0.52, "size_similarity": 0.984 }, { "breadth_similarity": 0.175, "concentration_similarity": 0.796, "content_similarity": 0.524, "left_pr_number": 43836, "right_pr_number": 44566, "shared_directories": [ "src/transformers/cli", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/cli/serve.py" ], "similarity": 0.502, "size_similarity": 0.516 }, { "breadth_similarity": 0.525, "concentration_similarity": 0.759, "content_similarity": 0.412, "left_pr_number": 44558, "right_pr_number": 44566, "shared_directories": [ "src/transformers/cli", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/cli/serve.py" ], "similarity": 0.497, "size_similarity": 0.785 }, { "breadth_similarity": 0.5, "concentration_similarity": 0.802, "content_similarity": 0.483, "left_pr_number": 43656, "right_pr_number": 44682, "shared_directories": [ "src/transformers/cli", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/cli/serve.py" ], "similarity": 0.436, "size_similarity": 0.048 }, { "breadth_similarity": 0.333, "concentration_similarity": 0.554, "content_similarity": 0.44, "left_pr_number": 43836, "right_pr_number": 44558, "shared_directories": [ "src/transformers/cli", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/cli/serve.py" ], "similarity": 0.43, "size_similarity": 0.405 }, { "breadth_similarity": 0.175, "concentration_similarity": 0.796, "content_similarity": 0.503, "left_pr_number": 43842, "right_pr_number": 44566, "shared_directories": [ "src/transformers/cli", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/cli/serve.py" ], "similarity": 0.412, "size_similarity": 0.014 }, { "breadth_similarity": 0.175, "concentration_similarity": 0.796, "content_similarity": 0.491, "left_pr_number": 43656, "right_pr_number": 44566, "shared_directories": [ "src/transformers/cli", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/cli/serve.py" ], "similarity": 0.411, "size_similarity": 0.062 }, { "breadth_similarity": 0.5, "concentration_similarity": 0.802, "content_similarity": 0.454, "left_pr_number": 43842, "right_pr_number": 44682, "shared_directories": [ "src/transformers/cli", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/cli/serve.py" ], "similarity": 0.409, "size_similarity": 0.011 }, { "breadth_similarity": 0.333, "concentration_similarity": 0.554, "content_similarity": 0.342, "left_pr_number": 43656, "right_pr_number": 44558, "shared_directories": [ "src/transformers/cli", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/cli/serve.py" ], "similarity": 0.307, "size_similarity": 0.049 }, { "breadth_similarity": 0.333, "concentration_similarity": 0.554, "content_similarity": 0.338, "left_pr_number": 43842, "right_pr_number": 44558, "shared_directories": [ "src/transformers/cli", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/cli/serve.py" ], "similarity": 0.299, "size_similarity": 0.011 } ], "pr_count": 6, "pr_numbers": [ 43656, 43836, 43842, 44558, 44566, 44682 ], "recent_pr_count": 6, "recent_pr_numbers": [ 43656, 43836, 43842, 44558, 44566, 44682 ], "representative_pr_number": 43836, "representative_title": "fix: wrapped TypeAdpater in string literals (for now)", "representative_url": "https://github.com/huggingface/transformers/pull/43836", "shared_directories": [ "src/transformers/cli", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/cli/serve.py" ], "summary": "6 open PRs share weighted file overlap around `src/transformers/cli/serve.py`; representative PR #43836.", "title": "Scope: fix: wrapped TypeAdpater in string literals (for now)" }, { "authors": [ "Jay-IIT", "Zephyr-Blessed", "chandan11248" ], "average_similarity": 0.942, "cluster_id": "pr-scope-44066-3", "kind": "pr_scope", "last_activity_at": "2026-03-19T18:12:59Z", "outside_window_prs": [], "pairwise": [ { "breadth_similarity": 1.0, "concentration_similarity": 0.957, "content_similarity": 0.968, "left_pr_number": 44066, "right_pr_number": 44722, "shared_directories": [ "src/transformers/models/codegen", "src/transformers/models/gptj", "src/transformers/models", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/models/codegen/modeling_codegen.py", "src/transformers/models/gptj/modeling_gptj.py" ], "similarity": 0.969, "size_similarity": 0.959 }, { "breadth_similarity": 0.5, "concentration_similarity": 0.986, "content_similarity": 0.988, "left_pr_number": 44085, "right_pr_number": 44722, "shared_directories": [ "src/transformers/models/gptj", "src/transformers/models", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/models/gptj/modeling_gptj.py" ], "similarity": 0.938, "size_similarity": 0.98 }, { "breadth_similarity": 0.5, "concentration_similarity": 0.944, "content_similarity": 0.963, "left_pr_number": 44066, "right_pr_number": 44085, "shared_directories": [ "src/transformers/models/gptj", "src/transformers/models", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/models/gptj/modeling_gptj.py" ], "similarity": 0.918, "size_similarity": 0.979 } ], "pr_count": 3, "pr_numbers": [ 44066, 44085, 44722 ], "recent_pr_count": 3, "recent_pr_numbers": [ 44066, 44085, 44722 ], "representative_pr_number": 44722, "representative_title": "Refactor gptj output tracing to use standardized decorators", "representative_url": "https://github.com/huggingface/transformers/pull/44722", "shared_directories": [ "src/transformers/models/gptj", "src/transformers/models", "src/transformers", "src", "src/transformers/models/codegen" ], "shared_filenames": [ "src/transformers/models/gptj/modeling_gptj.py", "src/transformers/models/codegen/modeling_codegen.py" ], "summary": "3 open PRs share weighted file overlap around `src/transformers/models/gptj/modeling_gptj.py`, `src/transformers/models/codegen/modeling_codegen.py`; representative PR #44722.", "title": "Scope: Refactor gptj output tracing to use standardized decorators" }, { "authors": [ "JokeYoonic", "akashadsare", "lakprigan" ], "average_similarity": 0.574, "cluster_id": "pr-scope-44015-3", "kind": "pr_scope", "last_activity_at": "2026-03-18T17:16:49Z", "outside_window_prs": [], "pairwise": [ { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.76, "left_pr_number": 44059, "right_pr_number": 44676, "shared_directories": [ "src/transformers/models/gpt2", "src/transformers/models", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/models/gpt2/modeling_gpt2.py" ], "similarity": 0.691, "size_similarity": 0.062 }, { "breadth_similarity": 0.333, "concentration_similarity": 0.488, "content_similarity": 0.674, "left_pr_number": 44015, "right_pr_number": 44059, "shared_directories": [ "src/transformers/models/gpt2", "src/transformers/models", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/models/gpt2/modeling_gpt2.py" ], "similarity": 0.611, "size_similarity": 0.543 }, { "breadth_similarity": 0.333, "concentration_similarity": 0.488, "content_similarity": 0.511, "left_pr_number": 44015, "right_pr_number": 44676, "shared_directories": [ "src/transformers/models/gpt2", "src/transformers/models", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/models/gpt2/modeling_gpt2.py" ], "similarity": 0.421, "size_similarity": 0.034 } ], "pr_count": 3, "pr_numbers": [ 44015, 44059, 44676 ], "recent_pr_count": 3, "recent_pr_numbers": [ 44015, 44059, 44676 ], "representative_pr_number": 44059, "representative_title": "[GPT2] Refactor output tracing to use capture_outputs/can_return_tuple decorators", "representative_url": "https://github.com/huggingface/transformers/pull/44059", "shared_directories": [ "src/transformers/models/gpt2", "src/transformers/models", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/models/gpt2/modeling_gpt2.py" ], "summary": "3 open PRs share weighted file overlap around `src/transformers/models/gpt2/modeling_gpt2.py`; representative PR #44059.", "title": "Scope: [GPT2] Refactor output tracing to use capture_outputs/can_return_tuple decorators" }, { "authors": [ "Sid-V5", "karthiksuki", "pdwi2020" ], "average_similarity": 0.53, "cluster_id": "pr-scope-43997-3", "kind": "pr_scope", "last_activity_at": "2026-02-19T15:49:49Z", "outside_window_prs": [], "pairwise": [ { "breadth_similarity": 0.333, "concentration_similarity": 0.548, "content_similarity": 0.71, "left_pr_number": 44007, "right_pr_number": 44019, "shared_directories": [ "src/transformers/models/resnet", "src/transformers/models", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/models/resnet/modeling_resnet.py" ], "similarity": 0.699, "size_similarity": 0.94 }, { "breadth_similarity": 0.333, "concentration_similarity": 0.548, "content_similarity": 0.647, "left_pr_number": 43997, "right_pr_number": 44007, "shared_directories": [ "src/transformers/models/regnet", "src/transformers/models", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/models/regnet/modeling_regnet.py" ], "similarity": 0.616, "size_similarity": 0.679 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.025, "left_pr_number": 43997, "right_pr_number": 44019, "shared_directories": [ "src/transformers/models", "src/transformers", "src" ], "shared_filenames": [], "similarity": 0.276, "size_similarity": 0.722 } ], "pr_count": 3, "pr_numbers": [ 43997, 44007, 44019 ], "recent_pr_count": 3, "recent_pr_numbers": [ 43997, 44007, 44019 ], "representative_pr_number": 44007, "representative_title": "[ResNet] Refactor output tracing to decorator-based interface", "representative_url": "https://github.com/huggingface/transformers/pull/44007", "shared_directories": [ "src/transformers/models", "src/transformers", "src", "src/transformers/models/regnet", "src/transformers/models/resnet" ], "shared_filenames": [ "src/transformers/models/regnet/modeling_regnet.py", "src/transformers/models/resnet/modeling_resnet.py" ], "summary": "3 open PRs share weighted file overlap around `src/transformers/models/regnet/modeling_regnet.py`, `src/transformers/models/resnet/modeling_resnet.py`; representative PR #44007.", "title": "Scope: [ResNet] Refactor output tracing to decorator-based interface" }, { "authors": [ "hf-security-analysis[bot]", "ydshieh" ], "average_similarity": 0.494, "cluster_id": "pr-scope-43532-3", "kind": "pr_scope", "last_activity_at": "2026-03-11T15:49:09Z", "outside_window_prs": [], "pairwise": [ { "breadth_similarity": 0.208, "concentration_similarity": 0.605, "content_similarity": 0.548, "left_pr_number": 43532, "right_pr_number": 44599, "shared_directories": [ ".github/workflows", ".github" ], "shared_filenames": [ ".github/workflows/self-comment-ci.yml" ], "similarity": 0.543, "size_similarity": 0.726 }, { "breadth_similarity": 0.875, "concentration_similarity": 0.893, "content_similarity": 0.445, "left_pr_number": 43532, "right_pr_number": 43649, "shared_directories": [ "tests/models/vit", ".github/workflows", "tests/models", ".github", "tests", "utils" ], "shared_filenames": [ ".github/workflows/self-comment-ci.yml", ".github/workflows/self-scheduled.yml", "tests/models/vit/test_modeling_vit.py", "utils/notification_service.py" ], "similarity": 0.503, "size_similarity": 0.395 }, { "breadth_similarity": 0.188, "concentration_similarity": 0.498, "content_similarity": 0.442, "left_pr_number": 43649, "right_pr_number": 44599, "shared_directories": [ ".github/workflows", ".github" ], "shared_filenames": [ ".github/workflows/self-comment-ci.yml" ], "similarity": 0.435, "size_similarity": 0.545 } ], "pr_count": 3, "pr_numbers": [ 43532, 43649, 44599 ], "recent_pr_count": 3, "recent_pr_numbers": [ 43532, 43649, 44599 ], "representative_pr_number": 43532, "representative_title": "[don't merge] Show diff", "representative_url": "https://github.com/huggingface/transformers/pull/43532", "shared_directories": [ ".github/workflows", ".github", "tests/models/vit", "tests/models", "utils", "tests" ], "shared_filenames": [ ".github/workflows/self-comment-ci.yml", "utils/notification_service.py", ".github/workflows/self-scheduled.yml", "tests/models/vit/test_modeling_vit.py" ], "summary": "3 open PRs share weighted file overlap around `.github/workflows/self-comment-ci.yml`, `utils/notification_service.py`, `.github/workflows/self-scheduled.yml`; representative PR #43532.", "title": "Scope: [don't merge] Show diff" }, { "authors": [ "stevhliu" ], "average_similarity": 0.368, "cluster_id": "pr-scope-44290-3", "kind": "pr_scope", "last_activity_at": "2026-03-23T09:09:32Z", "outside_window_prs": [], "pairwise": [ { "breadth_similarity": 0.75, "concentration_similarity": 0.998, "content_similarity": 0.229, "left_pr_number": 44342, "right_pr_number": 44799, "shared_directories": [ "docs/source/en", "docs/source", "docs" ], "shared_filenames": [ "docs/source/en/_toctree.yml", "docs/source/en/perf_train_gpu_one.md" ], "similarity": 0.388, "size_similarity": 0.683 }, { "breadth_similarity": 0.833, "concentration_similarity": 1.0, "content_similarity": 0.147, "left_pr_number": 44290, "right_pr_number": 44342, "shared_directories": [ "docs/source/en", "docs/source", "docs" ], "shared_filenames": [ "docs/source/en/_toctree.yml", "docs/source/en/perf_train_gpu_one.md" ], "similarity": 0.372, "size_similarity": 0.904 }, { "breadth_similarity": 0.583, "concentration_similarity": 0.998, "content_similarity": 0.175, "left_pr_number": 44290, "right_pr_number": 44799, "shared_directories": [ "docs/source/en", "docs/source", "docs" ], "shared_filenames": [ "docs/source/en/_toctree.yml", "docs/source/en/perf_train_gpu_one.md" ], "similarity": 0.344, "size_similarity": 0.756 } ], "pr_count": 3, "pr_numbers": [ 44290, 44342, 44799 ], "recent_pr_count": 3, "recent_pr_numbers": [ 44290, 44342, 44799 ], "representative_pr_number": 44342, "representative_title": "[docs] training performance", "representative_url": "https://github.com/huggingface/transformers/pull/44342", "shared_directories": [ "docs/source/en", "docs/source", "docs" ], "shared_filenames": [ "docs/source/en/perf_train_gpu_one.md", "docs/source/en/_toctree.yml" ], "summary": "3 open PRs share weighted file overlap around `docs/source/en/perf_train_gpu_one.md`, `docs/source/en/_toctree.yml`; representative PR #44342.", "title": "Scope: [docs] training performance" }, { "authors": [ "IvanFan-Van", "dacorvo" ], "average_similarity": 0.46, "cluster_id": "pr-scope-34667-4", "kind": "pr_scope", "last_activity_at": "2026-03-20T05:45:46Z", "outside_window_prs": [ { "additions": 10, "author": "andrewqianpublic", "changed_files": 1, "created_at": "2024-11-09T06:18:31Z", "deletions": 1, "draft": false, "files_url": "https://github.com/huggingface/transformers/pull/34667/files", "html_url": "https://github.com/huggingface/transformers/pull/34667", "merged": false, "number": 34667, "state": "open", "title": "Clear unused allocated GPU memory when available GPU memory is low. ", "updated_at": "2026-03-06T07:28:06Z" }, { "additions": 23, "author": "bonpiedlaroute", "changed_files": 1, "created_at": "2025-07-25T21:27:34Z", "deletions": 0, "draft": false, "files_url": "https://github.com/huggingface/transformers/pull/39683/files", "html_url": "https://github.com/huggingface/transformers/pull/39683", "merged": false, "number": 39683, "state": "open", "title": "Fix issue #39191 respect accelerate config to disable torch.dynamo compilation", "updated_at": "2026-01-27T12:42:58Z" } ], "pairwise": [ { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.458, "left_pr_number": 34667, "right_pr_number": 39683, "shared_directories": [ "src/transformers/generation", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/generation/utils.py" ], "similarity": 0.542, "size_similarity": 0.478 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.308, "left_pr_number": 44757, "right_pr_number": 44872, "shared_directories": [ "src/transformers/generation", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/generation/utils.py" ], "similarity": 0.465, "size_similarity": 0.667 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.387, "left_pr_number": 34667, "right_pr_number": 44872, "shared_directories": [ "src/transformers/generation", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/generation/utils.py" ], "similarity": 0.462, "size_similarity": 0.273 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.382, "left_pr_number": 39683, "right_pr_number": 44872, "shared_directories": [ "src/transformers/generation", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/generation/utils.py" ], "similarity": 0.437, "size_similarity": 0.13 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.368, "left_pr_number": 34667, "right_pr_number": 44757, "shared_directories": [ "src/transformers/generation", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/generation/utils.py" ], "similarity": 0.435, "size_similarity": 0.182 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.364, "left_pr_number": 39683, "right_pr_number": 44757, "shared_directories": [ "src/transformers/generation", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/generation/utils.py" ], "similarity": 0.418, "size_similarity": 0.087 } ], "pr_count": 4, "pr_numbers": [ 34667, 39683, 44757, 44872 ], "recent_pr_count": 2, "recent_pr_numbers": [ 44757, 44872 ], "representative_pr_number": 34667, "representative_title": "Clear unused allocated GPU memory when available GPU memory is low. ", "representative_url": "https://github.com/huggingface/transformers/pull/34667", "shared_directories": [ "src/transformers/generation", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/generation/utils.py" ], "summary": "4 open PRs share weighted file overlap around `src/transformers/generation/utils.py`; representative PR #34667.", "title": "Scope: Clear unused allocated GPU memory when available GPU memory is low. " }, { "authors": [ "itazap", "vaibhav-research" ], "average_similarity": 0.545, "cluster_id": "pr-scope-43422-3", "kind": "pr_scope", "last_activity_at": "2026-03-17T16:03:19Z", "outside_window_prs": [ { "additions": 34, "author": "harshaljanjani", "changed_files": 2, "created_at": "2026-01-22T18:34:36Z", "deletions": 1, "draft": false, "files_url": "https://github.com/huggingface/transformers/pull/43422/files", "html_url": "https://github.com/huggingface/transformers/pull/43422", "merged": false, "number": 43422, "state": "open", "title": "feat(tokenizer): Update post-processor when special tokens are modified in TokenizersBackend", "updated_at": "2026-02-23T10:07:58Z" } ], "pairwise": [ { "breadth_similarity": 0.5, "concentration_similarity": 0.971, "content_similarity": 0.676, "left_pr_number": 43422, "right_pr_number": 44606, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/tokenization_utils_tokenizers.py" ], "similarity": 0.688, "size_similarity": 0.771 }, { "breadth_similarity": 0.75, "concentration_similarity": 1.0, "content_similarity": 0.507, "left_pr_number": 43603, "right_pr_number": 44606, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/tokenization_utils_tokenizers.py" ], "similarity": 0.502, "size_similarity": 0.148 }, { "breadth_similarity": 0.75, "concentration_similarity": 0.971, "content_similarity": 0.436, "left_pr_number": 43422, "right_pr_number": 43603, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/tokenization_utils_tokenizers.py" ], "similarity": 0.446, "size_similarity": 0.114 } ], "pr_count": 3, "pr_numbers": [ 43422, 43603, 44606 ], "recent_pr_count": 2, "recent_pr_numbers": [ 43603, 44606 ], "representative_pr_number": 44606, "representative_title": "optionally override tokenizer class with serialized tokenizer ", "representative_url": "https://github.com/huggingface/transformers/pull/44606", "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/tokenization_utils_tokenizers.py" ], "summary": "3 open PRs share weighted file overlap around `src/transformers/tokenization_utils_tokenizers.py`; representative PR #44606.", "title": "Scope: optionally override tokenizer class with serialized tokenizer " }, { "authors": [ "MekkCyber", "mvanhorn" ], "average_similarity": 0.471, "cluster_id": "pr-scope-41097-3", "kind": "pr_scope", "last_activity_at": "2026-03-09T16:08:29Z", "outside_window_prs": [ { "additions": 11, "author": "cyyever", "changed_files": 1, "created_at": "2025-09-23T10:51:04Z", "deletions": 14, "draft": false, "files_url": "https://github.com/huggingface/transformers/pull/41097/files", "html_url": "https://github.com/huggingface/transformers/pull/41097", "merged": false, "number": 41097, "state": "open", "title": "Delay and probably avoid unnecessary graph breaks in _upad_input of modeling_flash_attention_utils.py", "updated_at": "2026-02-11T12:31:59Z" } ], "pairwise": [ { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.452, "left_pr_number": 41097, "right_pr_number": 43549, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/modeling_flash_attention_utils.py" ], "similarity": 0.556, "size_similarity": 0.6 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.363, "left_pr_number": 43549, "right_pr_number": 44547, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/modeling_flash_attention_utils.py" ], "similarity": 0.444, "size_similarity": 0.267 }, { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.339, "left_pr_number": 41097, "right_pr_number": 44547, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/modeling_flash_attention_utils.py" ], "similarity": 0.412, "size_similarity": 0.16 } ], "pr_count": 3, "pr_numbers": [ 41097, 43549, 44547 ], "recent_pr_count": 2, "recent_pr_numbers": [ 43549, 44547 ], "representative_pr_number": 43549, "representative_title": "[kernels] exception handling for fa kernels", "representative_url": "https://github.com/huggingface/transformers/pull/43549", "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/modeling_flash_attention_utils.py" ], "summary": "3 open PRs share weighted file overlap around `src/transformers/modeling_flash_attention_utils.py`; representative PR #43549.", "title": "Scope: [kernels] exception handling for fa kernels" }, { "authors": [ "mtthw13", "yashbora9" ], "average_similarity": 0.989, "cluster_id": "pr-scope-44018-2", "kind": "pr_scope", "last_activity_at": "2026-02-18T08:30:32Z", "outside_window_prs": [], "pairwise": [ { "breadth_similarity": 1.0, "concentration_similarity": 0.999, "content_similarity": 0.998, "left_pr_number": 44018, "right_pr_number": 44068, "shared_directories": [ "src/transformers/models/gpt_neo", "src/transformers/models", "tests/models/gpt_neo", "src/transformers", "tests/models", "src", "tests" ], "shared_filenames": [ "src/transformers/models/gpt_neo/modeling_gpt_neo.py", "tests/models/gpt_neo/test_modeling_gpt_neo.py" ], "similarity": 0.989, "size_similarity": 0.932 } ], "pr_count": 2, "pr_numbers": [ 44018, 44068 ], "recent_pr_count": 2, "recent_pr_numbers": [ 44018, 44068 ], "representative_pr_number": 44018, "representative_title": "Refactor GPT-Neo output tracing to use capture_outputs/can_return_tuple", "representative_url": "https://github.com/huggingface/transformers/pull/44018", "shared_directories": [ "src/transformers/models/gpt_neo", "tests/models/gpt_neo", "src/transformers/models", "tests/models", "src/transformers", "tests", "src" ], "shared_filenames": [ "src/transformers/models/gpt_neo/modeling_gpt_neo.py", "tests/models/gpt_neo/test_modeling_gpt_neo.py" ], "summary": "2 open PRs share weighted file overlap around `src/transformers/models/gpt_neo/modeling_gpt_neo.py`, `tests/models/gpt_neo/test_modeling_gpt_neo.py`; representative PR #44018.", "title": "Scope: Refactor GPT-Neo output tracing to use capture_outputs/can_return_tuple" }, { "authors": [ "lashahub" ], "average_similarity": 0.831, "cluster_id": "pr-scope-43538-2", "kind": "pr_scope", "last_activity_at": "2026-03-25T17:19:57Z", "outside_window_prs": [], "pairwise": [ { "breadth_similarity": 0.862, "concentration_similarity": 0.865, "content_similarity": 0.842, "left_pr_number": 43538, "right_pr_number": 44830, "shared_directories": [ "docs/source/en/model_doc", "src/transformers/models/audioflamingo3", "src/transformers/models/auto", "src/transformers/models/glmasr", "src/transformers/models/musicflamingo", "docs/source/en", "src/transformers/models", "tests/fixtures/audioflamingo3", "tests/fixtures/musicflamingo", "tests/models/audioflamingo3" ], "shared_filenames": [ "docs/source/en/_toctree.yml", "docs/source/en/model_doc/audioflamingo3.md", "docs/source/en/model_doc/musicflamingo.md", "docs/source/en/model_doc/vibevoice_acoustic_tokenizer.md", "src/transformers/models/__init__.py", "src/transformers/models/audioflamingo3/configuration_audioflamingo3.py", "src/transformers/models/audioflamingo3/modeling_audioflamingo3.py", "src/transformers/models/audioflamingo3/modular_audioflamingo3.py", "src/transformers/models/audioflamingo3/processing_audioflamingo3.py", "src/transformers/models/auto/configuration_auto.py" ], "similarity": 0.831, "size_similarity": 0.748 } ], "pr_count": 2, "pr_numbers": [ 43538, 44830 ], "recent_pr_count": 2, "recent_pr_numbers": [ 43538, 44830 ], "representative_pr_number": 43538, "representative_title": "Add Music Flamingo", "representative_url": "https://github.com/huggingface/transformers/pull/43538", "shared_directories": [ "src/transformers/models/musicflamingo", "src/transformers/models/glmasr", "src/transformers/models/audioflamingo3", "docs/source/en/model_doc", "src/transformers/models/auto", "tests/fixtures/audioflamingo3", "tests/fixtures/musicflamingo", "tests/models/audioflamingo3" ], "shared_filenames": [ "docs/source/en/model_doc/audioflamingo3.md", "docs/source/en/model_doc/musicflamingo.md", "src/transformers/models/audioflamingo3/configuration_audioflamingo3.py", "src/transformers/models/glmasr/processing_glmasr.py", "src/transformers/models/musicflamingo/__init__.py", "src/transformers/models/musicflamingo/configuration_musicflamingo.py", "src/transformers/models/musicflamingo/convert_musicflamingo_to_hf.py", "src/transformers/models/musicflamingo/modeling_musicflamingo.py" ], "summary": "2 open PRs share weighted file overlap around `docs/source/en/model_doc/audioflamingo3.md`, `docs/source/en/model_doc/musicflamingo.md`, `src/transformers/models/audioflamingo3/configuration_audioflamingo3.py`; representative PR #43538.", "title": "Scope: Add Music Flamingo" }, { "authors": [ "ITcarrot", "Mr-Neutr0n" ], "average_similarity": 0.819, "cluster_id": "pr-scope-43543-2", "kind": "pr_scope", "last_activity_at": "2026-02-05T18:14:28Z", "outside_window_prs": [], "pairwise": [ { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.913, "left_pr_number": 43543, "right_pr_number": 43775, "shared_directories": [ "src/transformers/models/dbrx", "src/transformers/models/ernie4_5_moe", "src/transformers/models/ernie4_5_vl_moe", "src/transformers/models/flex_olmo", "src/transformers/models/glm4v_moe", "src/transformers/models/gpt_oss", "src/transformers/models/granitemoe", "src/transformers/models/granitemoehybrid", "src/transformers/models/granitemoeshared", "src/transformers/models/jamba" ], "shared_filenames": [ "src/transformers/models/dbrx/modeling_dbrx.py", "src/transformers/models/ernie4_5_moe/modeling_ernie4_5_moe.py", "src/transformers/models/ernie4_5_vl_moe/modeling_ernie4_5_vl_moe.py", "src/transformers/models/flex_olmo/modeling_flex_olmo.py", "src/transformers/models/glm4v_moe/modeling_glm4v_moe.py", "src/transformers/models/gpt_oss/modeling_gpt_oss.py", "src/transformers/models/granitemoe/modeling_granitemoe.py", "src/transformers/models/granitemoehybrid/modeling_granitemoehybrid.py", "src/transformers/models/granitemoeshared/modeling_granitemoeshared.py", "src/transformers/models/jamba/modeling_jamba.py" ], "similarity": 0.819, "size_similarity": 0.2 } ], "pr_count": 2, "pr_numbers": [ 43543, 43775 ], "recent_pr_count": 2, "recent_pr_numbers": [ 43543, 43775 ], "representative_pr_number": 43543, "representative_title": "Fix fp16 underflow in MoE load balancing loss by enforcing fp32 softmax", "representative_url": "https://github.com/huggingface/transformers/pull/43543", "shared_directories": [ "src/transformers/models/dbrx", "src/transformers/models/ernie4_5_moe", "src/transformers/models/jetmoe", "src/transformers/models/minimax_m2", "src/transformers/models/phimoe", "src/transformers/models/flex_olmo", "src/transformers/models/mixtral", "src/transformers/models/qwen3_moe" ], "shared_filenames": [ "src/transformers/models/dbrx/modeling_dbrx.py", "src/transformers/models/ernie4_5_moe/modeling_ernie4_5_moe.py", "src/transformers/models/jetmoe/modeling_jetmoe.py", "src/transformers/models/minimax_m2/modeling_minimax_m2.py", "src/transformers/models/mixtral/modeling_mixtral.py", "src/transformers/models/phimoe/modeling_phimoe.py", "src/transformers/models/flex_olmo/modeling_flex_olmo.py", "src/transformers/models/gpt_oss/modeling_gpt_oss.py" ], "summary": "2 open PRs share weighted file overlap around `src/transformers/models/dbrx/modeling_dbrx.py`, `src/transformers/models/ernie4_5_moe/modeling_ernie4_5_moe.py`, `src/transformers/models/jetmoe/modeling_jetmoe.py`; representative PR #43543.", "title": "Scope: Fix fp16 underflow in MoE load balancing loss by enforcing fp32 softmax" }, { "authors": [ "surya10602", "thecaptain789" ], "average_similarity": 0.661, "cluster_id": "pr-scope-43779-2", "kind": "pr_scope", "last_activity_at": "2026-02-09T09:44:45Z", "outside_window_prs": [], "pairwise": [ { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.677, "left_pr_number": 43779, "right_pr_number": 43816, "shared_directories": [ "src/transformers/integrations", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/integrations/integration_utils.py" ], "similarity": 0.661, "size_similarity": 0.25 } ], "pr_count": 2, "pr_numbers": [ 43779, 43816 ], "recent_pr_count": 2, "recent_pr_numbers": [ 43779, 43816 ], "representative_pr_number": 43779, "representative_title": "SwanLab: Add support for id and resume arguments in SwanLabCallback", "representative_url": "https://github.com/huggingface/transformers/pull/43779", "shared_directories": [ "src/transformers/integrations", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/integrations/integration_utils.py" ], "summary": "2 open PRs share weighted file overlap around `src/transformers/integrations/integration_utils.py`; representative PR #43779.", "title": "Scope: SwanLab: Add support for id and resume arguments in SwanLabCallback" }, { "authors": [ "Cyrilvallez", "xenova" ], "average_similarity": 0.592, "cluster_id": "pr-scope-44763-2", "kind": "pr_scope", "last_activity_at": "2026-03-23T15:14:13Z", "outside_window_prs": [], "pairwise": [ { "breadth_similarity": 0.833, "concentration_similarity": 1.0, "content_similarity": 0.459, "left_pr_number": 44763, "right_pr_number": 44888, "shared_directories": [ "src/transformers/models/nemotron_h", "src/transformers/models", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/models/nemotron_h/modeling_nemotron_h.py", "src/transformers/models/nemotron_h/modular_nemotron_h.py" ], "similarity": 0.592, "size_similarity": 0.917 } ], "pr_count": 2, "pr_numbers": [ 44763, 44888 ], "recent_pr_count": 2, "recent_pr_numbers": [ 44763, 44888 ], "representative_pr_number": 44763, "representative_title": "[nemotron_h] Add support for MLP mixers", "representative_url": "https://github.com/huggingface/transformers/pull/44763", "shared_directories": [ "src/transformers/models/nemotron_h", "src/transformers/models", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/models/nemotron_h/modular_nemotron_h.py", "src/transformers/models/nemotron_h/modeling_nemotron_h.py" ], "summary": "2 open PRs share weighted file overlap around `src/transformers/models/nemotron_h/modular_nemotron_h.py`, `src/transformers/models/nemotron_h/modeling_nemotron_h.py`; representative PR #44763.", "title": "Scope: [nemotron_h] Add support for MLP mixers" }, { "authors": [ "andylizf", "zucchini-nlp" ], "average_similarity": 0.555, "cluster_id": "pr-scope-44157-2", "kind": "pr_scope", "last_activity_at": "2026-03-25T14:12:50Z", "outside_window_prs": [], "pairwise": [ { "breadth_similarity": 0.896, "concentration_similarity": 0.919, "content_similarity": 0.594, "left_pr_number": 44157, "right_pr_number": 44973, "shared_directories": [ "src/transformers/models/ernie4_5_vl_moe", "src/transformers/models/glm4v", "src/transformers/models/glm4v_moe", "src/transformers/models/glm_ocr", "src/transformers/models/paddleocr_vl", "src/transformers/models/qwen2_5_omni", "src/transformers/models/qwen2_5_vl", "src/transformers/models/qwen2_vl", "src/transformers/models/qwen3_5", "src/transformers/models/qwen3_5_moe" ], "shared_filenames": [ "src/transformers/models/ernie4_5_vl_moe/modeling_ernie4_5_vl_moe.py", "src/transformers/models/glm4v/modeling_glm4v.py", "src/transformers/models/glm4v_moe/modeling_glm4v_moe.py", "src/transformers/models/glm_ocr/modeling_glm_ocr.py", "src/transformers/models/glm_ocr/modular_glm_ocr.py", "src/transformers/models/paddleocr_vl/modeling_paddleocr_vl.py", "src/transformers/models/qwen2_5_omni/modeling_qwen2_5_omni.py", "src/transformers/models/qwen2_5_omni/modular_qwen2_5_omni.py", "src/transformers/models/qwen2_5_vl/modeling_qwen2_5_vl.py", "src/transformers/models/qwen2_vl/modeling_qwen2_vl.py" ], "similarity": 0.555, "size_similarity": 0.029 } ], "pr_count": 2, "pr_numbers": [ 44157, 44973 ], "recent_pr_count": 2, "recent_pr_numbers": [ 44157, 44973 ], "representative_pr_number": 44157, "representative_title": "Use correct mask for packed inputs in Qwen-VL ", "representative_url": "https://github.com/huggingface/transformers/pull/44157", "shared_directories": [ "src/transformers/models/glm_ocr", "src/transformers/models/video_llama_3", "src/transformers/models/glm4v", "src/transformers/models/glm4v_moe", "src/transformers/models/qwen2_5_omni", "src/transformers/models/qwen2_vl", "src/transformers/models/qwen3_5_moe", "src/transformers/models/paddleocr_vl" ], "shared_filenames": [ "src/transformers/models/glm_ocr/modular_glm_ocr.py", "src/transformers/models/video_llama_3/modular_video_llama_3.py", "src/transformers/models/glm4v/modeling_glm4v.py", "src/transformers/models/glm_ocr/modeling_glm_ocr.py", "src/transformers/models/qwen3_vl/modeling_qwen3_vl.py", "src/transformers/models/video_llama_3/modeling_video_llama_3.py", "src/transformers/models/paddleocr_vl/modeling_paddleocr_vl.py", "src/transformers/models/qwen2_5_omni/modeling_qwen2_5_omni.py" ], "summary": "2 open PRs share weighted file overlap around `src/transformers/models/glm_ocr/modular_glm_ocr.py`, `src/transformers/models/video_llama_3/modular_video_llama_3.py`, `src/transformers/models/glm4v/modeling_glm4v.py`; representative PR #44157.", "title": "Scope: Use correct mask for packed inputs in Qwen-VL " }, { "authors": [ "aman-coder03", "dtiourine" ], "average_similarity": 0.553, "cluster_id": "pr-scope-44101-2", "kind": "pr_scope", "last_activity_at": "2026-02-19T08:08:33Z", "outside_window_prs": [], "pairwise": [ { "breadth_similarity": 0.5, "concentration_similarity": 0.507, "content_similarity": 0.614, "left_pr_number": 44101, "right_pr_number": 44116, "shared_directories": [ "src/transformers/models/flaubert", "src/transformers/models", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/models/flaubert/modeling_flaubert.py" ], "similarity": 0.553, "size_similarity": 0.319 } ], "pr_count": 2, "pr_numbers": [ 44101, 44116 ], "recent_pr_count": 2, "recent_pr_numbers": [ 44101, 44116 ], "representative_pr_number": 44101, "representative_title": "[XLM] Refactor output tracing to align with capture_outputs standardized architecture", "representative_url": "https://github.com/huggingface/transformers/pull/44101", "shared_directories": [ "src/transformers/models/flaubert", "src/transformers/models", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/models/flaubert/modeling_flaubert.py" ], "summary": "2 open PRs share weighted file overlap around `src/transformers/models/flaubert/modeling_flaubert.py`; representative PR #44101.", "title": "Scope: [XLM] Refactor output tracing to align with capture_outputs standardized architecture" }, { "authors": [ "Sai-Suraj-27", "nulone" ], "average_similarity": 0.543, "cluster_id": "pr-scope-43833-2", "kind": "pr_scope", "last_activity_at": "2026-03-25T19:31:09Z", "outside_window_prs": [], "pairwise": [ { "breadth_similarity": 1.0, "concentration_similarity": 1.0, "content_similarity": 0.409, "left_pr_number": 43833, "right_pr_number": 45001, "shared_directories": [ "src/transformers/integrations", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/integrations/moe.py" ], "similarity": 0.543, "size_similarity": 0.714 } ], "pr_count": 2, "pr_numbers": [ 43833, 45001 ], "recent_pr_count": 2, "recent_pr_numbers": [ 43833, 45001 ], "representative_pr_number": 43833, "representative_title": "fix: ensure dtype consistency in grouped_mm under autocast", "representative_url": "https://github.com/huggingface/transformers/pull/43833", "shared_directories": [ "src/transformers/integrations", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/integrations/moe.py" ], "summary": "2 open PRs share weighted file overlap around `src/transformers/integrations/moe.py`; representative PR #43833.", "title": "Scope: fix: ensure dtype consistency in grouped_mm under autocast" }, { "authors": [ "kulkarni-rohan", "zucchini-nlp" ], "average_similarity": 0.466, "cluster_id": "pr-scope-44713-2", "kind": "pr_scope", "last_activity_at": "2026-03-25T18:53:51Z", "outside_window_prs": [], "pairwise": [ { "breadth_similarity": 0.196, "concentration_similarity": 0.377, "content_similarity": 0.54, "left_pr_number": 44713, "right_pr_number": 45000, "shared_directories": [ "src/transformers/models/colqwen2", "src/transformers/models", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/models/colqwen2/modeling_colqwen2.py", "src/transformers/models/colqwen2/modular_colqwen2.py" ], "similarity": 0.466, "size_similarity": 0.331 } ], "pr_count": 2, "pr_numbers": [ 44713, 45000 ], "recent_pr_count": 2, "recent_pr_numbers": [ 44713, 45000 ], "representative_pr_number": 44713, "representative_title": "[ColQwen2] Refactor output tracing (issue #43979)", "representative_url": "https://github.com/huggingface/transformers/pull/44713", "shared_directories": [ "src/transformers/models/colqwen2", "src/transformers/models", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/models/colqwen2/modeling_colqwen2.py", "src/transformers/models/colqwen2/modular_colqwen2.py" ], "summary": "2 open PRs share weighted file overlap around `src/transformers/models/colqwen2/modeling_colqwen2.py`, `src/transformers/models/colqwen2/modular_colqwen2.py`; representative PR #44713.", "title": "Scope: [ColQwen2] Refactor output tracing (issue #43979)" }, { "authors": [ "MaybeSam05", "NielsRogge" ], "average_similarity": 0.433, "cluster_id": "pr-scope-44385-2", "kind": "pr_scope", "last_activity_at": "2026-03-12T10:33:43Z", "outside_window_prs": [], "pairwise": [ { "breadth_similarity": 0.667, "concentration_similarity": 1.0, "content_similarity": 0.372, "left_pr_number": 44385, "right_pr_number": 44615, "shared_directories": [ "src/transformers/utils", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/utils/import_utils.py" ], "similarity": 0.433, "size_similarity": 0.371 } ], "pr_count": 2, "pr_numbers": [ 44385, 44615 ], "recent_pr_count": 2, "recent_pr_numbers": [ 44385, 44615 ], "representative_pr_number": 44385, "representative_title": "Fix make check-repo", "representative_url": "https://github.com/huggingface/transformers/pull/44385", "shared_directories": [ "src/transformers/utils", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/utils/import_utils.py" ], "summary": "2 open PRs share weighted file overlap around `src/transformers/utils/import_utils.py`; representative PR #44385.", "title": "Scope: Fix make check-repo" }, { "authors": [ "AkshajKashyap", "roycho96" ], "average_similarity": 0.412, "cluster_id": "pr-scope-44889-2", "kind": "pr_scope", "last_activity_at": "2026-03-25T02:39:15Z", "outside_window_prs": [], "pairwise": [ { "breadth_similarity": 1.0, "concentration_similarity": 0.812, "content_similarity": 0.176, "left_pr_number": 44889, "right_pr_number": 44981, "shared_directories": [ "src/transformers", "tests/trainer", "src", "tests" ], "shared_filenames": [ "src/transformers/trainer.py" ], "similarity": 0.412, "size_similarity": 0.991 } ], "pr_count": 2, "pr_numbers": [ 44889, 44981 ], "recent_pr_count": 2, "recent_pr_numbers": [ 44889, 44981 ], "representative_pr_number": 44889, "representative_title": "[DeepSpeed] Fix evaluate()/predict() before train()", "representative_url": "https://github.com/huggingface/transformers/pull/44889", "shared_directories": [ "tests/trainer", "src/transformers", "tests", "src" ], "shared_filenames": [ "src/transformers/trainer.py" ], "summary": "2 open PRs share weighted file overlap around `src/transformers/trainer.py`; representative PR #44889.", "title": "Scope: [DeepSpeed] Fix evaluate()/predict() before train()" }, { "authors": [ "tarekziade", "zucchini-nlp" ], "average_similarity": 0.412, "cluster_id": "pr-scope-43587-2", "kind": "pr_scope", "last_activity_at": "2026-03-25T16:52:04Z", "outside_window_prs": [], "pairwise": [ { "breadth_similarity": 0.8, "concentration_similarity": 0.849, "content_similarity": 0.245, "left_pr_number": 43587, "right_pr_number": 44992, "shared_directories": [ "utils" ], "shared_filenames": [ "utils/check_docstrings.py" ], "similarity": 0.412, "size_similarity": 0.787 } ], "pr_count": 2, "pr_numbers": [ 43587, 44992 ], "recent_pr_count": 2, "recent_pr_numbers": [ 43587, 44992 ], "representative_pr_number": 43587, "representative_title": "[WIP] Check docstring runs on modular files", "representative_url": "https://github.com/huggingface/transformers/pull/43587", "shared_directories": [ "utils" ], "shared_filenames": [ "utils/check_docstrings.py" ], "summary": "2 open PRs share weighted file overlap around `utils/check_docstrings.py`; representative PR #43587.", "title": "Scope: [WIP] Check docstring runs on modular files" }, { "authors": [ "Charly21r", "khushali9" ], "average_similarity": 0.409, "cluster_id": "pr-scope-44146-2", "kind": "pr_scope", "last_activity_at": "2026-03-25T15:02:57Z", "outside_window_prs": [], "pairwise": [ { "breadth_similarity": 0.75, "concentration_similarity": 0.898, "content_similarity": 0.284, "left_pr_number": 44146, "right_pr_number": 44949, "shared_directories": [ "src/transformers", "tests/trainer", "src", "tests" ], "shared_filenames": [ "tests/trainer/test_trainer_callback.py" ], "similarity": 0.409, "size_similarity": 0.605 } ], "pr_count": 2, "pr_numbers": [ 44146, 44949 ], "recent_pr_count": 2, "recent_pr_numbers": [ 44146, 44949 ], "representative_pr_number": 44146, "representative_title": "Ensure final evaluation runs with step-based evaluation strategy", "representative_url": "https://github.com/huggingface/transformers/pull/44146", "shared_directories": [ "tests/trainer", "src/transformers", "tests", "src" ], "shared_filenames": [ "tests/trainer/test_trainer_callback.py" ], "summary": "2 open PRs share weighted file overlap around `tests/trainer/test_trainer_callback.py`; representative PR #44146.", "title": "Scope: Ensure final evaluation runs with step-based evaluation strategy" }, { "authors": [ "kashif", "qgallouedec" ], "average_similarity": 0.406, "cluster_id": "pr-scope-44425-2", "kind": "pr_scope", "last_activity_at": "2026-03-20T16:28:43Z", "outside_window_prs": [], "pairwise": [ { "breadth_similarity": 0.196, "concentration_similarity": 0.618, "content_similarity": 0.507, "left_pr_number": 44425, "right_pr_number": 44891, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer_callback.py" ], "similarity": 0.406, "size_similarity": 0.004 } ], "pr_count": 2, "pr_numbers": [ 44425, 44891 ], "recent_pr_count": 2, "recent_pr_numbers": [ 44425, 44891 ], "representative_pr_number": 44425, "representative_title": "Fix conditional check for float formatting", "representative_url": "https://github.com/huggingface/transformers/pull/44425", "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/trainer_callback.py" ], "summary": "2 open PRs share weighted file overlap around `src/transformers/trainer_callback.py`; representative PR #44425.", "title": "Scope: Fix conditional check for float formatting" }, { "authors": [ "ArthurZucker", "ydshieh" ], "average_similarity": 0.382, "cluster_id": "pr-scope-44128-2", "kind": "pr_scope", "last_activity_at": "2026-03-25T13:54:10Z", "outside_window_prs": [], "pairwise": [ { "breadth_similarity": 1.0, "concentration_similarity": 0.955, "content_similarity": 0.142, "left_pr_number": 44128, "right_pr_number": 44965, "shared_directories": [ ".github/workflows", ".github" ], "shared_filenames": [], "similarity": 0.382, "size_similarity": 0.899 } ], "pr_count": 2, "pr_numbers": [ 44128, 44965 ], "recent_pr_count": 2, "recent_pr_numbers": [ 44128, 44965 ], "representative_pr_number": 44128, "representative_title": "update release workflow", "representative_url": "https://github.com/huggingface/transformers/pull/44128", "shared_directories": [ ".github/workflows", ".github" ], "shared_filenames": [], "summary": "2 open PRs cluster in `.github/workflows`, `.github` with similar change breadth; representative PR #44128.", "title": "Scope: update release workflow" }, { "authors": [ "XingyuHu109" ], "average_similarity": 0.865, "cluster_id": "pr-scope-41251-2", "kind": "pr_scope", "last_activity_at": "2026-03-12T16:02:46Z", "outside_window_prs": [ { "additions": 1704, "author": "ArthurZucker", "changed_files": 14, "created_at": "2025-10-01T12:41:21Z", "deletions": 1, "draft": false, "files_url": "https://github.com/huggingface/transformers/pull/41251/files", "html_url": "https://github.com/huggingface/transformers/pull/41251", "merged": false, "number": 41251, "state": "open", "title": "Add deepseek 3.2 exp", "updated_at": "2026-03-25T17:02:59Z" } ], "pairwise": [ { "breadth_similarity": 0.743, "concentration_similarity": 0.977, "content_similarity": 0.906, "left_pr_number": 41251, "right_pr_number": 44481, "shared_directories": [ "docs/source/en/model_doc", "src/transformers/models/auto", "src/transformers/models/deepseek_v32", "docs/source/en", "src/transformers/integrations", "src/transformers/models", "tests/models/deepseek_v32", "docs/source", "src/transformers", "tests/models" ], "shared_filenames": [ "docs/source/en/_toctree.yml", "docs/source/en/model_doc/deepseek_v32.md", "src/transformers/conversion_mapping.py", "src/transformers/models/__init__.py", "src/transformers/models/auto/configuration_auto.py", "src/transformers/models/auto/modeling_auto.py", "src/transformers/models/deepseek_v32/__init__.py", "src/transformers/models/deepseek_v32/configuration_deepseek_v32.py", "src/transformers/models/deepseek_v32/modeling_deepseek_v32.py", "src/transformers/models/deepseek_v32/modular_deepseek_v32.py" ], "similarity": 0.865, "size_similarity": 0.716 } ], "pr_count": 2, "pr_numbers": [ 41251, 44481 ], "recent_pr_count": 1, "recent_pr_numbers": [ 44481 ], "representative_pr_number": 41251, "representative_title": "Add deepseek 3.2 exp", "representative_url": "https://github.com/huggingface/transformers/pull/41251", "shared_directories": [ "src/transformers/models/deepseek_v32", "docs/source/en/model_doc", "src/transformers/models/auto", "tests/models/deepseek_v32", "src/transformers/integrations", "docs/source/en", "src/transformers/models", "docs/source" ], "shared_filenames": [ "docs/source/en/model_doc/deepseek_v32.md", "src/transformers/models/deepseek_v32/__init__.py", "src/transformers/models/deepseek_v32/configuration_deepseek_v32.py", "src/transformers/models/deepseek_v32/modeling_deepseek_v32.py", "src/transformers/models/deepseek_v32/modular_deepseek_v32.py", "tests/models/deepseek_v32/__init__.py", "tests/models/deepseek_v32/test_modeling_deepseek_v32.py", "src/transformers/conversion_mapping.py" ], "summary": "2 open PRs share weighted file overlap around `docs/source/en/model_doc/deepseek_v32.md`, `src/transformers/models/deepseek_v32/__init__.py`, `src/transformers/models/deepseek_v32/configuration_deepseek_v32.py`; representative PR #41251.", "title": "Scope: Add deepseek 3.2 exp" }, { "authors": [ "NielsRogge" ], "average_similarity": 0.726, "cluster_id": "pr-scope-36895-2", "kind": "pr_scope", "last_activity_at": "2026-03-05T16:00:53Z", "outside_window_prs": [ { "additions": 5599, "author": "sbucaille", "changed_files": 20, "created_at": "2025-03-21T22:28:16Z", "deletions": 17, "draft": false, "files_url": "https://github.com/huggingface/transformers/pull/36895/files", "html_url": "https://github.com/huggingface/transformers/pull/36895", "merged": false, "number": 36895, "state": "open", "title": "Add RF-DETR", "updated_at": "2026-03-24T13:39:48Z" } ], "pairwise": [ { "breadth_similarity": 0.926, "concentration_similarity": 0.931, "content_similarity": 0.662, "left_pr_number": 36895, "right_pr_number": 44375, "shared_directories": [ "docs/source/en/model_doc", "src/transformers/models/auto", "src/transformers/models/rf_detr", "docs/source/en", "src/transformers/loss", "src/transformers/models", "tests/models/rf_detr", "docs/source", "src/transformers", "tests/models" ], "shared_filenames": [ "docs/source/en/_toctree.yml", "docs/source/en/model_doc/rf_detr.md", "src/transformers/loss/loss_lw_detr.py", "src/transformers/loss/loss_utils.py", "src/transformers/models/__init__.py", "src/transformers/models/auto/configuration_auto.py", "src/transformers/models/auto/image_processing_auto.py", "src/transformers/models/auto/modeling_auto.py", "src/transformers/models/rf_detr/__init__.py", "src/transformers/models/rf_detr/configuration_rf_detr.py" ], "similarity": 0.726, "size_similarity": 0.822 } ], "pr_count": 2, "pr_numbers": [ 36895, 44375 ], "recent_pr_count": 1, "recent_pr_numbers": [ 44375 ], "representative_pr_number": 36895, "representative_title": "Add RF-DETR", "representative_url": "https://github.com/huggingface/transformers/pull/36895", "shared_directories": [ "src/transformers/models/rf_detr", "docs/source/en/model_doc", "src/transformers/models/auto", "tests/models/rf_detr", "src/transformers/loss", "docs/source/en", "src/transformers/models", "docs/source" ], "shared_filenames": [ "docs/source/en/model_doc/rf_detr.md", "src/transformers/loss/loss_lw_detr.py", "src/transformers/models/rf_detr/__init__.py", "src/transformers/models/rf_detr/configuration_rf_detr.py", "src/transformers/models/rf_detr/modeling_rf_detr.py", "src/transformers/models/rf_detr/modular_rf_detr.py", "tests/models/rf_detr/__init__.py", "tests/models/rf_detr/test_modeling_rf_detr.py" ], "summary": "2 open PRs share weighted file overlap around `docs/source/en/model_doc/rf_detr.md`, `src/transformers/loss/loss_lw_detr.py`, `src/transformers/models/rf_detr/__init__.py`; representative PR #36895.", "title": "Scope: Add RF-DETR" }, { "authors": [ "antznette1" ], "average_similarity": 0.693, "cluster_id": "pr-scope-41441-2", "kind": "pr_scope", "last_activity_at": "2026-01-26T15:29:00Z", "outside_window_prs": [ { "additions": 6, "author": "cyyever", "changed_files": 1, "created_at": "2025-10-08T10:41:51Z", "deletions": 3, "draft": false, "files_url": "https://github.com/huggingface/transformers/pull/41441/files", "html_url": "https://github.com/huggingface/transformers/pull/41441", "merged": false, "number": 41441, "state": "open", "title": "Enhance the handling of Union types in HfArgumentParser", "updated_at": "2026-02-11T12:33:03Z" } ], "pairwise": [ { "breadth_similarity": 0.5, "concentration_similarity": 0.75, "content_similarity": 0.768, "left_pr_number": 41441, "right_pr_number": 43469, "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/hf_argparser.py" ], "similarity": 0.693, "size_similarity": 0.45 } ], "pr_count": 2, "pr_numbers": [ 41441, 43469 ], "recent_pr_count": 1, "recent_pr_numbers": [ 43469 ], "representative_pr_number": 41441, "representative_title": "Enhance the handling of Union types in HfArgumentParser", "representative_url": "https://github.com/huggingface/transformers/pull/41441", "shared_directories": [ "src/transformers", "src" ], "shared_filenames": [ "src/transformers/hf_argparser.py" ], "summary": "2 open PRs share weighted file overlap around `src/transformers/hf_argparser.py`; representative PR #41441.", "title": "Scope: Enhance the handling of Union types in HfArgumentParser" }, { "authors": [ "IlyasMoutawwakil" ], "average_similarity": 0.607, "cluster_id": "pr-scope-43349-2", "kind": "pr_scope", "last_activity_at": "2026-03-24T13:39:07Z", "outside_window_prs": [ { "additions": 1, "author": "readleyj", "changed_files": 1, "created_at": "2026-01-19T09:54:48Z", "deletions": 6, "draft": false, "files_url": "https://github.com/huggingface/transformers/pull/43349/files", "html_url": "https://github.com/huggingface/transformers/pull/43349", "merged": false, "number": 43349, "state": "open", "title": "Remove unnecessary device synchronizations from finegrained FP8 matmul", "updated_at": "2026-01-27T12:40:12Z" } ], "pairwise": [ { "breadth_similarity": 0.292, "concentration_similarity": 0.98, "content_similarity": 0.752, "left_pr_number": 43349, "right_pr_number": 44832, "shared_directories": [ "src/transformers/integrations", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/integrations/finegrained_fp8.py" ], "similarity": 0.607, "size_similarity": 0.02 } ], "pr_count": 2, "pr_numbers": [ 43349, 44832 ], "recent_pr_count": 1, "recent_pr_numbers": [ 44832 ], "representative_pr_number": 43349, "representative_title": "Remove unnecessary device synchronizations from finegrained FP8 matmul", "representative_url": "https://github.com/huggingface/transformers/pull/43349", "shared_directories": [ "src/transformers/integrations", "src/transformers", "src" ], "shared_filenames": [ "src/transformers/integrations/finegrained_fp8.py" ], "summary": "2 open PRs share weighted file overlap around `src/transformers/integrations/finegrained_fp8.py`; representative PR #43349.", "title": "Scope: Remove unnecessary device synchronizations from finegrained FP8 matmul" }, { "authors": [ "harshaljanjani" ], "average_similarity": 0.464, "cluster_id": "pr-scope-41356-2", "kind": "pr_scope", "last_activity_at": "2026-03-24T13:42:36Z", "outside_window_prs": [ { "additions": 512, "author": "Vinayaktoor", "changed_files": 10, "created_at": "2025-10-05T21:35:01Z", "deletions": 0, "draft": false, "files_url": "https://github.com/huggingface/transformers/pull/41356/files", "html_url": "https://github.com/huggingface/transformers/pull/41356", "merged": false, "number": 41356, "state": "open", "title": "Add DEIMv2 model, image processor, and basic tests", "updated_at": "2026-02-09T17:25:26Z" } ], "pairwise": [ { "breadth_similarity": 0.5, "concentration_similarity": 0.951, "content_similarity": 0.506, "left_pr_number": 41356, "right_pr_number": 44339, "shared_directories": [ "docs/source/en/model_doc", "src/transformers/models/deimv2", "docs/source/en", "src/transformers/models", "tests/models/deimv2", "docs/source", "src/transformers", "tests/models", "docs", "src" ], "shared_filenames": [ "docs/source/en/model_doc/deimv2.md", "src/transformers/models/deimv2/__init__.py", "src/transformers/models/deimv2/configuration_deimv2.py", "src/transformers/models/deimv2/modeling_deimv2.py", "tests/models/deimv2/__init__.py", "tests/models/deimv2/test_modeling_deimv2.py" ], "similarity": 0.464, "size_similarity": 0.084 } ], "pr_count": 2, "pr_numbers": [ 41356, 44339 ], "recent_pr_count": 1, "recent_pr_numbers": [ 44339 ], "representative_pr_number": 41356, "representative_title": "Add DEIMv2 model, image processor, and basic tests", "representative_url": "https://github.com/huggingface/transformers/pull/41356", "shared_directories": [ "src/transformers/models/deimv2", "docs/source/en/model_doc", "tests/models/deimv2", "docs/source/en", "src/transformers/models", "docs/source", "tests/models", "src/transformers" ], "shared_filenames": [ "docs/source/en/model_doc/deimv2.md", "src/transformers/models/deimv2/__init__.py", "src/transformers/models/deimv2/configuration_deimv2.py", "src/transformers/models/deimv2/modeling_deimv2.py", "tests/models/deimv2/__init__.py", "tests/models/deimv2/test_modeling_deimv2.py" ], "summary": "2 open PRs share weighted file overlap around `docs/source/en/model_doc/deimv2.md`, `src/transformers/models/deimv2/__init__.py`, `src/transformers/models/deimv2/configuration_deimv2.py`; representative PR #41356.", "title": "Scope: Add DEIMv2 model, image processor, and basic tests" } ]