beads/cmd/bd/duplicates_test.go

package main

import (
	"context"
	"testing"

	"github.com/steveyegge/beads/internal/types"
)

func TestFindDuplicateGroups(t *testing.T) {
	tests := []struct {
		name           string
		issues         []*types.Issue
		expectedGroups int
	}{
		{
			name: "no duplicates",
			issues: []*types.Issue{
				{ID: "bd-1", Title: "Task 1", Status: types.StatusOpen},
				{ID: "bd-2", Title: "Task 2", Status: types.StatusOpen},
			},
			expectedGroups: 0,
		},
		{
			name: "simple duplicate",
			issues: []*types.Issue{
				{ID: "bd-1", Title: "Task 1", Status: types.StatusOpen},
				{ID: "bd-2", Title: "Task 1", Status: types.StatusOpen},
			},
			expectedGroups: 1,
		},
		{
			name: "duplicate with different status ignored",
			issues: []*types.Issue{
				{ID: "bd-1", Title: "Task 1", Status: types.StatusOpen},
				{ID: "bd-2", Title: "Task 1", Status: types.StatusClosed},
			},
			expectedGroups: 0,
		},
		{
			name: "multiple duplicates",
			issues: []*types.Issue{
				{ID: "bd-1", Title: "Task 1", Status: types.StatusOpen},
				{ID: "bd-2", Title: "Task 1", Status: types.StatusOpen},
				{ID: "bd-3", Title: "Task 2", Status: types.StatusOpen},
				{ID: "bd-4", Title: "Task 2", Status: types.StatusOpen},
			},
			expectedGroups: 2,
		},
		{
			name: "different descriptions are duplicates if title matches",
			issues: []*types.Issue{
				{ID: "bd-1", Title: "Task 1", Description: "Desc 1", Status: types.StatusOpen},
				{ID: "bd-2", Title: "Task 1", Description: "Desc 2", Status: types.StatusOpen},
			},
			expectedGroups: 0, // Different descriptions = not duplicates
		},
		{
			name: "exact content match",
			issues: []*types.Issue{
				{ID: "bd-1", Title: "Task 1", Description: "Desc 1", Design: "Design 1", AcceptanceCriteria: "AC 1", Status: types.StatusOpen},
				{ID: "bd-2", Title: "Task 1", Description: "Desc 1", Design: "Design 1", AcceptanceCriteria: "AC 1", Status: types.StatusOpen},
			},
			expectedGroups: 1,
		},
		{
			name: "three-way duplicate",
			issues: []*types.Issue{
				{ID: "bd-1", Title: "Task 1", Status: types.StatusOpen},
				{ID: "bd-2", Title: "Task 1", Status: types.StatusOpen},
				{ID: "bd-3", Title: "Task 1", Status: types.StatusOpen},
			},
			expectedGroups: 1,
		},
	}

	for _, tt := range tests {
		t.Run(tt.name, func(t *testing.T) {
			groups := findDuplicateGroups(tt.issues)
			if len(groups) != tt.expectedGroups {
				t.Errorf("findDuplicateGroups() returned %d groups, want %d", len(groups), tt.expectedGroups)
			}
		})
	}
}

func TestChooseMergeTarget(t *testing.T) {
	tests := []struct {
		name             string
		group            []*types.Issue
		refCounts        map[string]int
		structuralScores map[string]*issueScore
		wantID           string
	}{
		{
			name: "choose by reference count when no structural data",
			group: []*types.Issue{
				{ID: "bd-2", Title: "Task"},
				{ID: "bd-1", Title: "Task"},
			},
			refCounts: map[string]int{
				"bd-1": 5,
				"bd-2": 0,
			},
			structuralScores: map[string]*issueScore{},
			wantID:           "bd-1",
		},
		{
			name: "choose by lexicographic order if same references",
			group: []*types.Issue{
				{ID: "bd-2", Title: "Task"},
				{ID: "bd-1", Title: "Task"},
			},
			refCounts: map[string]int{
				"bd-1": 0,
				"bd-2": 0,
			},
			structuralScores: map[string]*issueScore{},
			wantID:           "bd-1",
		},
		{
			name: "prefer higher references even with larger ID",
			group: []*types.Issue{
				{ID: "bd-1", Title: "Task"},
				{ID: "bd-100", Title: "Task"},
			},
			refCounts: map[string]int{
				"bd-1":   1,
				"bd-100": 10,
			},
			structuralScores: map[string]*issueScore{},
			wantID:           "bd-100",
		},
		{
			name: "prefer dependents over text references (GH#1022)",
			group: []*types.Issue{
				{ID: "HONEY-s2g1", Title: "P1 / Foundations"}, // Has 17 children
				{ID: "HONEY-d0mw", Title: "P1 / Foundations"}, // Empty shell
			},
			refCounts: map[string]int{
				"HONEY-s2g1": 0,
				"HONEY-d0mw": 0,
			},
			structuralScores: map[string]*issueScore{
				"HONEY-s2g1": {dependentCount: 17, dependsOnCount: 2, textRefs: 0},
				"HONEY-d0mw": {dependentCount: 0, dependsOnCount: 0, textRefs: 0},
			},
			wantID: "HONEY-s2g1", // Should keep the one with children
		},
		{
			name: "dependents beat text references",
			group: []*types.Issue{
				{ID: "bd-1", Title: "Task"}, // Has text refs but no deps
				{ID: "bd-2", Title: "Task"}, // Has deps but no text refs
			},
			refCounts: map[string]int{
				"bd-1": 100, // Lots of text references
				"bd-2": 0,
			},
			structuralScores: map[string]*issueScore{
				"bd-1": {dependentCount: 0, dependsOnCount: 0, textRefs: 100},
				"bd-2": {dependentCount: 5, dependsOnCount: 0, textRefs: 0}, // 5 children/dependents
			},
			wantID: "bd-2", // Dependents take priority
		},
		{
			name: "dependsOnCount included in weight calculation (GH#1022)",
			group: []*types.Issue{
				{ID: "bd-1", Title: "Task"}, // Has dependencies (depends on others)
				{ID: "bd-2", Title: "Task"}, // Empty shell
			},
			refCounts: map[string]int{
				"bd-1": 0,
				"bd-2": 0,
			},
			structuralScores: map[string]*issueScore{
				"bd-1": {dependentCount: 0, dependsOnCount: 3, textRefs: 0}, // Depends on 3 other issues
				"bd-2": {dependentCount: 0, dependsOnCount: 0, textRefs: 0}, // Empty shell
			},
			wantID: "bd-1", // Issue with dependencies should be kept over empty shell
		},
		{
			name: "weight combines dependents and dependencies (GH#1022)",
			group: []*types.Issue{
				{ID: "bd-1", Title: "Task"}, // Has only dependents (children)
				{ID: "bd-2", Title: "Task"}, // Has both dependents and dependencies
			},
			refCounts: map[string]int{
				"bd-1": 0,
				"bd-2": 0,
			},
			structuralScores: map[string]*issueScore{
				"bd-1": {dependentCount: 5, dependsOnCount: 0, textRefs: 0}, // Weight = 5
				"bd-2": {dependentCount: 3, dependsOnCount: 4, textRefs: 0}, // Weight = 7
			},
			wantID: "bd-2", // Higher combined weight wins
		},
	}

	for _, tt := range tests {
		t.Run(tt.name, func(t *testing.T) {
			target := chooseMergeTarget(tt.group, tt.refCounts, tt.structuralScores)
			if target.ID != tt.wantID {
				t.Errorf("chooseMergeTarget() = %v, want %v", target.ID, tt.wantID)
			}
		})
	}
}

func TestCountReferences(t *testing.T) {
	issues := []*types.Issue{
		{
			ID:          "bd-1",
			Description: "See bd-2 for details",
			Notes:       "Related to bd-3",
		},
		{
			ID:          "bd-2",
			Description: "Mentioned bd-1 twice: bd-1",
		},
		{
			ID:    "bd-3",
			Notes: "Nothing to see here",
		},
	}

	counts := countReferences(issues)

	expectedCounts := map[string]int{
		"bd-1": 2, // Referenced twice in bd-2
		"bd-2": 1, // Referenced once in bd-1
		"bd-3": 1, // Referenced once in bd-1
	}

	for id, expectedCount := range expectedCounts {
		if counts[id] != expectedCount {
			t.Errorf("countReferences()[%s] = %d, want %d", id, counts[id], expectedCount)
		}
	}
}

func TestDuplicateGroupsWithDifferentStatuses(t *testing.T) {
	issues := []*types.Issue{
		{ID: "bd-1", Title: "Task 1", Status: types.StatusOpen},
		{ID: "bd-2", Title: "Task 1", Status: types.StatusClosed},
		{ID: "bd-3", Title: "Task 1", Status: types.StatusOpen},
	}

	groups := findDuplicateGroups(issues)

	// Should have 1 group with bd-1 and bd-3 (both open)
	if len(groups) != 1 {
		t.Fatalf("Expected 1 group, got %d", len(groups))
	}

	if len(groups[0]) != 2 {
		t.Fatalf("Expected 2 issues in group, got %d", len(groups[0]))
	}

	// Verify bd-2 (closed) is not in the group
	for _, issue := range groups[0] {
		if issue.ID == "bd-2" {
			t.Errorf("bd-2 (closed) should not be in group with open issues")
		}
	}
}

func TestDuplicatesIntegration(t *testing.T) {
	tmpDir := t.TempDir()
	testStore := newTestStore(t, tmpDir+"/.beads/beads.db")
	ctx := context.Background()

	// Create duplicate issues (let DB assign IDs)
	issues := []*types.Issue{
		{
			Title:       "Fix authentication bug",
			Description: "Users can't login",
			Status:      types.StatusOpen,
			Priority:    1,
			IssueType:   types.TypeBug,
		},
		{
			Title:       "Fix authentication bug",
			Description: "Users can't login",
			Status:      types.StatusOpen,
			Priority:    1,
			IssueType:   types.TypeBug,
		},
		{
			Title:       "Different task",
			Description: "Different description",
			Status:      types.StatusOpen,
			Priority:    2,
			IssueType:   types.TypeTask,
		},
	}

	for _, issue := range issues {
		if err := testStore.CreateIssue(ctx, issue, "test"); err != nil {
			t.Fatalf("CreateIssue failed: %v", err)
		}
	}

	// Fetch all issues
	allIssues, err := testStore.SearchIssues(ctx, "", types.IssueFilter{})
	if err != nil {
		t.Fatalf("SearchIssues failed: %v", err)
	}

	// Find duplicates
	groups := findDuplicateGroups(allIssues)

	if len(groups) != 1 {
		t.Fatalf("Expected 1 duplicate group, got %d", len(groups))
	}

	if len(groups[0]) != 2 {
		t.Fatalf("Expected 2 issues in group, got %d", len(groups[0]))
	}

	// Verify the duplicate group contains the two issues with "Fix authentication bug"
	dupCount := 0
	for _, issue := range groups[0] {
		if issue.Title == "Fix authentication bug" {
			dupCount++
		}
	}

	if dupCount != 2 {
		t.Errorf("Expected duplicate group to contain 2 'Fix authentication bug' issues, got %d", dupCount)
	}
}

func TestPerformMerge(t *testing.T) {
	tmpDir := t.TempDir()
	testStore := newTestStore(t, tmpDir+"/.beads/beads.db")
	ctx := context.Background()

	// Set up global state needed by performMerge
	oldStore := store
	oldRootCtx := rootCtx
	oldActor := actor
	store = testStore
	rootCtx = ctx
	actor = "test-user"
	defer func() {
		store = oldStore
		rootCtx = oldRootCtx
		actor = oldActor
	}()

	// Create duplicate issues
	target := &types.Issue{
		Title:       "Main issue",
		Description: "This is the target",
		Status:      types.StatusOpen,
		Priority:    1,
		IssueType:   types.TypeTask,
	}
	source1 := &types.Issue{
		Title:       "Main issue",
		Description: "This is the target",
		Status:      types.StatusOpen,
		Priority:    1,
		IssueType:   types.TypeTask,
	}
	source2 := &types.Issue{
		Title:       "Main issue",
		Description: "This is the target",
		Status:      types.StatusOpen,
		Priority:    1,
		IssueType:   types.TypeTask,
	}

	for _, issue := range []*types.Issue{target, source1, source2} {
		if err := testStore.CreateIssue(ctx, issue, "test"); err != nil {
			t.Fatalf("CreateIssue failed: %v", err)
		}
	}

	// Perform the merge
	result := performMerge(target.ID, []string{source1.ID, source2.ID})

	// Verify result structure
	closedIDs := result["closed"].([]string)
	linkedIDs := result["linked"].([]string)
	errors := result["errors"].([]string)

	if len(closedIDs) != 2 {
		t.Errorf("Expected 2 closed issues, got %d", len(closedIDs))
	}
	if len(linkedIDs) != 2 {
		t.Errorf("Expected 2 linked issues, got %d", len(linkedIDs))
	}
	if len(errors) != 0 {
		t.Errorf("Expected 0 errors, got %d: %v", len(errors), errors)
	}

	// Verify source issues are closed
	for _, sourceID := range []string{source1.ID, source2.ID} {
		issue, err := testStore.GetIssue(ctx, sourceID)
		if err != nil {
			t.Fatalf("GetIssue(%s) failed: %v", sourceID, err)
		}
		if issue.Status != types.StatusClosed {
			t.Errorf("Issue %s should be closed, got status %s", sourceID, issue.Status)
		}
	}

	// Verify target is still open
	targetIssue, err := testStore.GetIssue(ctx, target.ID)
	if err != nil {
		t.Fatalf("GetIssue(%s) failed: %v", target.ID, err)
	}
	if targetIssue.Status != types.StatusOpen {
		t.Errorf("Target issue should still be open, got status %s", targetIssue.Status)
	}

	// Verify dependencies were created (GetDependencies returns issues this depends on)
	for _, sourceID := range []string{source1.ID, source2.ID} {
		deps, err := testStore.GetDependencies(ctx, sourceID)
		if err != nil {
			t.Fatalf("GetDependencies(%s) failed: %v", sourceID, err)
		}
		found := false
		for _, dep := range deps {
			if dep.ID == target.ID {
				found = true
				break
			}
		}
		if !found {
			t.Errorf("Expected dependency from %s to %s", sourceID, target.ID)
		}
	}
}