Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
42 changes: 34 additions & 8 deletions .github/workflows/agents-auto-label.yml
Original file line number Diff line number Diff line change
Expand Up @@ -106,7 +106,10 @@ jobs:
sys.exit(0)

# Build vector store
label_records = [LabelRecord(name=l['name'], description=l['description']) for l in labels]
label_records = [
LabelRecord(name=l['name'], description=l['description'])
for l in labels
]
store = build_label_vector_store(label_records)

if store is None:
Expand All @@ -128,6 +131,16 @@ jobs:
auto_apply = [m for m in matches if m.score >= auto_threshold]
suggestions = [m for m in matches if suggest_threshold <= m.score < auto_threshold]

# IMPORTANT: Only auto-apply the BEST matching label, not all above threshold
# This prevents over-labeling issues with multiple labels like bug+enhancement
if auto_apply:
best_match = auto_apply[0] # matches are already sorted by score descending
auto_apply = [best_match]
# Move other high-confidence matches to suggestions
for m in matches[1:]:
if m.score >= auto_threshold and m not in suggestions:
suggestions.insert(0, m)
Comment on lines 131 to +142
Copy link

Copilot AI Jan 10, 2026

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

The logic to move other high-confidence matches to suggestions has two weaknesses. The guard m not in suggestions is dead code: suggestions only contains matches with scores below auto_threshold (line 132), while this loop only considers matches with scores >= auto_threshold, so the condition is always true and no duplicates are actually possible. Additionally, iterating over matches[1:] and re-checking m.score >= auto_threshold is redundant, since the original auto_apply list already contained exactly the matches above the threshold — and calling suggestions.insert(0, m) once per match prepends them in reverse score order.

Suggested change
auto_apply = [m for m in matches if m.score >= auto_threshold]
suggestions = [m for m in matches if suggest_threshold <= m.score < auto_threshold]
# IMPORTANT: Only auto-apply the BEST matching label, not all above threshold
# This prevents over-labeling issues with multiple labels like bug+enhancement
if auto_apply:
best_match = auto_apply[0] # matches are already sorted by score descending
auto_apply = [best_match]
# Move other high-confidence matches to suggestions
for m in matches[1:]:
if m.score >= auto_threshold and m not in suggestions:
suggestions.insert(0, m)
auto_apply_full = [m for m in matches if m.score >= auto_threshold]
auto_apply = list(auto_apply_full)
suggestions = [m for m in matches if suggest_threshold <= m.score < auto_threshold]
# IMPORTANT: Only auto-apply the BEST matching label, not all above threshold
# This prevents over-labeling issues with multiple labels like bug+enhancement
if auto_apply:
best_match = auto_apply[0] # matches are already sorted by score descending
# Keep only the best match for auto-apply
auto_apply = [best_match]
# Move other high-confidence matches (remaining auto_apply) to suggestions
other_high = auto_apply_full[1:] if 'auto_apply_full' in locals() else []
for m in reversed(other_high):
suggestions.insert(0, m)

Copilot uses AI. Check for mistakes.

print(f"Auto-apply labels ({auto_threshold}+ confidence):")
for m in auto_apply:
print(f" - {m.label.name}: {m.score:.2%}")
Expand All @@ -139,13 +152,20 @@ jobs:
# Output results
with open(os.environ['GITHUB_OUTPUT'], 'a') as f:
f.write('has_suggestions=true\n')
f.write(f'auto_apply_labels={json.dumps([m.label.name for m in auto_apply])}\n')
f.write(f'suggested_labels={json.dumps([{"name": m.label.name, "score": f"{m.score:.0%}"} for m in suggestions])}\n')
auto_json = json.dumps([m.label.name for m in auto_apply])
f.write(f'auto_apply_labels={auto_json}\n')
sugg_data = [
{"name": m.label.name, "score": f"{m.score:.0%}"}
for m in suggestions
]
f.write(f'suggested_labels={json.dumps(sugg_data)}\n')

PYTHON_SCRIPT

- name: Apply high-confidence labels
if: steps.match.outputs.has_suggestions == 'true' && steps.match.outputs.auto_apply_labels != '[]'
if: |
steps.match.outputs.has_suggestions == 'true' &&
steps.match.outputs.auto_apply_labels != '[]'
uses: actions/github-script@v8
with:
script: |
Expand Down Expand Up @@ -182,7 +202,9 @@ jobs:
core.info(`Applied labels: ${newLabels.join(', ')}`);

- name: Post suggestion comment
if: steps.match.outputs.has_suggestions == 'true' && steps.match.outputs.suggested_labels != '[]'
if: |
steps.match.outputs.has_suggestions == 'true' &&
steps.match.outputs.suggested_labels != '[]'
uses: actions/github-script@v8
with:
script: |
Expand All @@ -199,15 +221,19 @@ jobs:
.map(l => `- \`${l.name}\` (${l.score} confidence)`)
.join('\n');

let body = `### 🏷️ Label Suggestions\n\nBased on the issue content, these labels might be relevant:\n\n${suggestions}\n\n`;
let body = `### 🏷️ Label Suggestions\n\n`;
body += `Based on the issue content, these labels might be relevant:\n\n`;
body += `${suggestions}\n\n`;

if (autoApplied.length > 0) {
body += `**Auto-applied:** ${autoApplied.map(l => `\`${l}\``).join(', ')}\n\n`;
const applied = autoApplied.map(l => `\`${l}\``).join(', ');
body += `**Auto-applied:** ${applied}\n\n`;
}

body += `<details>\n<summary>How to use these suggestions</summary>\n\n`;
body += `- Click the label name in the sidebar to add it\n`;
body += `- Or use the GitHub CLI: \`gh issue edit ${context.issue.number} --add-label "label-name"\`\n`;
const editCmd = `gh issue edit ${context.issue.number} --add-label "label-name"`;
body += `- Or use the GitHub CLI: \`${editCmd}\`\n`;
body += `</details>\n\n`;
body += `---\n*Auto-generated by label matcher*`;

Expand Down
29 changes: 26 additions & 3 deletions .github/workflows/agents-dedup.yml
Original file line number Diff line number Diff line change
Expand Up @@ -14,8 +14,9 @@ permissions:

env:
# Similarity threshold for flagging duplicates (0.0-1.0)
# 0.85 = very similar, reduces false positives
SIMILARITY_THRESHOLD: "0.85"
# 0.92 = very high similarity required, reduces false positives from
# issues in the same domain/feature area that share vocabulary
SIMILARITY_THRESHOLD: "0.92"

jobs:
dedup:
Expand Down Expand Up @@ -122,9 +123,31 @@ jobs:
new_body = os.environ.get('NEW_ISSUE_BODY', '')
query = f'{new_title}\n\n{new_body}'

threshold = float(os.environ.get('SIMILARITY_THRESHOLD', '0.85'))
threshold = float(os.environ.get('SIMILARITY_THRESHOLD', '0.92'))
matches = find_similar_issues(store, query, threshold=threshold, k=3)

# Additional filter: require title similarity for true duplicates
# This reduces false positives from issues in the same domain/feature area
# that share vocabulary but are different tasks
filtered_matches = []
new_title_lower = new_title.lower().strip()
for m in matches:
match_title_lower = m.issue.title.lower().strip()
# Check for significant title overlap
title_words_new = set(new_title_lower.split())
title_words_match = set(match_title_lower.split())
shared_words = title_words_new.intersection(title_words_match)
# Require at least 40% of words to overlap for a duplicate flag
max_words = max(len(title_words_new), len(title_words_match), 1)
overlap_ratio = len(shared_words) / max_words
Comment on lines +140 to +142
Copy link

Copilot AI Jan 10, 2026

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

The overlap ratio calculation uses the maximum of the two title lengths as the denominator, but this may not accurately represent the degree of overlap between titles. Consider using the minimum length instead, or a Jaccard similarity metric (intersection over union).

For example, if a new issue has title "Add caching" (2 words) and an existing issue has "Add PUT endpoint to update manager caching layer optimization" (9 words), and they share "Add" and "caching" (2 words), the current calculation gives 2/9 ≈ 22% overlap, which would miss this as a duplicate even if the body content is similar. Using min would give 2/2 = 100% overlap, which better reflects that all words in the shorter title are present in the longer one.

Suggested change
# Require at least 40% of words to overlap for a duplicate flag
max_words = max(len(title_words_new), len(title_words_match), 1)
overlap_ratio = len(shared_words) / max_words
# Require at least 40% of words in the shorter title to overlap for a duplicate flag
min_words = max(min(len(title_words_new), len(title_words_match)), 1)
overlap_ratio = len(shared_words) / min_words

Copilot uses AI. Check for mistakes.
if m.score >= 0.95 or overlap_ratio >= 0.4:
filtered_matches.append(m)
print(f' Match #{m.issue.number}: {m.score:.0%}, overlap={overlap_ratio:.0%}')
else:
print(f' Skip #{m.issue.number}: {m.score:.0%}, overlap={overlap_ratio:.0%}')

matches = filtered_matches

if not matches:
print('No duplicates found above threshold')
with open(os.environ['GITHUB_OUTPUT'], 'a') as f:
Expand Down
Loading
Loading