Add storage cache eviction policy to daemon (bd-145)

Implemented TTL-based and LRU cache eviction for daemon storage connections:

- Add StorageCacheEntry with lastAccess timestamp tracking
- Cleanup goroutine runs every 5 minutes to evict stale entries
- TTL-based eviction: remove entries idle >30min (configurable)
- LRU eviction: enforce max cache size (default: 50 repos)
- Configurable via BEADS_DAEMON_MAX_CACHE_SIZE and BEADS_DAEMON_CACHE_TTL
- Proper cleanup on server shutdown
- Update lastAccess on cache hits
- Comprehensive tests for eviction logic

Fixes memory leaks and file descriptor exhaustion for multi-repo users.

Amp-Thread-ID: https://ampcode.com/threads/T-1148d8b3-b8a8-45fc-af9c-b5be14c4834d
Co-authored-by: Amp <amp@ampcode.com>
This commit is contained in:
Steve Yegge
2025-10-18 13:17:07 -07:00
parent 491cb82489
commit 259e994522
3 changed files with 460 additions and 32 deletions

View File

@@ -49,7 +49,7 @@
{"id":"bd-142","title":"Add 'bd stale' command to show orphaned claims and dead executors","description":"Need visibility into orphaned claims - issues stuck in_progress with execution_state but executor is dead/stopped. Add command to show: 1) All issues with execution_state where executor status=stopped or last_heartbeat \u003e threshold, 2) Executor instance details (when died, how long claimed), 3) Option to auto-release them. Makes manual recovery easier until auto-cleanup (bd-140) is implemented.","design":"Query: SELECT i.*, ei.status, ei.last_heartbeat FROM issues i JOIN issue_execution_state ies ON i.id = ies.issue_id JOIN executor_instances ei ON ies.executor_instance_id = ei.instance_id WHERE ei.status='stopped' OR ei.last_heartbeat \u003c NOW() - threshold. Add --release flag to auto-release all found issues.","acceptance_criteria":"bd stale shows orphaned claims, bd stale --release cleans them up","status":"closed","priority":1,"issue_type":"feature","created_at":"2025-10-18T00:25:16.530937-07:00","updated_at":"2025-10-18T09:57:28.141701-07:00","closed_at":"2025-10-18T02:09:12.529064-07:00"} {"id":"bd-142","title":"Add 'bd stale' command to show orphaned claims and dead executors","description":"Need visibility into orphaned claims - issues stuck in_progress with execution_state but executor is dead/stopped. Add command to show: 1) All issues with execution_state where executor status=stopped or last_heartbeat \u003e threshold, 2) Executor instance details (when died, how long claimed), 3) Option to auto-release them. Makes manual recovery easier until auto-cleanup (bd-140) is implemented.","design":"Query: SELECT i.*, ei.status, ei.last_heartbeat FROM issues i JOIN issue_execution_state ies ON i.id = ies.issue_id JOIN executor_instances ei ON ies.executor_instance_id = ei.instance_id WHERE ei.status='stopped' OR ei.last_heartbeat \u003c NOW() - threshold. 
Add --release flag to auto-release all found issues.","acceptance_criteria":"bd stale shows orphaned claims, bd stale --release cleans them up","status":"closed","priority":1,"issue_type":"feature","created_at":"2025-10-18T00:25:16.530937-07:00","updated_at":"2025-10-18T09:57:28.141701-07:00","closed_at":"2025-10-18T02:09:12.529064-07:00"}
{"id":"bd-143","title":"Bias ready work towards recent issues before oldest-first","description":"Currently 'bd ready' shows oldest issues first (by created_at). This can bury recently discovered work that might be more relevant. Propose a hybrid approach: show issues from the past 1-2 days first (sorted by priority), then fall back to oldest-first for older issues. This keeps fresh discoveries visible while still surfacing old forgotten work.","status":"closed","priority":2,"issue_type":"feature","created_at":"2025-10-18T09:31:15.036495-07:00","updated_at":"2025-10-18T09:57:28.105887-07:00","closed_at":"2025-10-18T09:35:55.084891-07:00"} {"id":"bd-143","title":"Bias ready work towards recent issues before oldest-first","description":"Currently 'bd ready' shows oldest issues first (by created_at). This can bury recently discovered work that might be more relevant. Propose a hybrid approach: show issues from the past 1-2 days first (sorted by priority), then fall back to oldest-first for older issues. This keeps fresh discoveries visible while still surfacing old forgotten work.","status":"closed","priority":2,"issue_type":"feature","created_at":"2025-10-18T09:31:15.036495-07:00","updated_at":"2025-10-18T09:57:28.105887-07:00","closed_at":"2025-10-18T09:35:55.084891-07:00"}
{"id":"bd-144","title":"Fix nil pointer dereference in renumber command","description":"The 'bd renumber' command crashes with a nil pointer dereference at renumber.go:52 because store is nil. The command doesn't properly handle daemon/direct mode initialization like other commands do. Error occurs on both --dry-run and --force modes.","status":"closed","priority":1,"issue_type":"bug","created_at":"2025-10-18T09:54:31.59912-07:00","updated_at":"2025-10-18T09:57:28.106373-07:00","closed_at":"2025-10-18T09:56:49.88701-07:00"} {"id":"bd-144","title":"Fix nil pointer dereference in renumber command","description":"The 'bd renumber' command crashes with a nil pointer dereference at renumber.go:52 because store is nil. The command doesn't properly handle daemon/direct mode initialization like other commands do. Error occurs on both --dry-run and --force modes.","status":"closed","priority":1,"issue_type":"bug","created_at":"2025-10-18T09:54:31.59912-07:00","updated_at":"2025-10-18T09:57:28.106373-07:00","closed_at":"2025-10-18T09:56:49.88701-07:00"}
{"id":"bd-145","title":"Add storage cache eviction policy to daemon","description":"Daemon caches DB connections forever in storageCache map (server.go:29). For users with 50+ repos, this causes memory leaks and file descriptor exhaustion.\n\nNeed LRU cache with:\n- Max size limit (default: 50 repos)\n- TTL-based eviction (default: 30min idle)\n- Periodic cleanup goroutine\n\nLocation: internal/rpc/server.go:29-40","design":"Add StorageCacheEntry struct with lastAccess timestamp.\n\nImplement evictStaleStorage() method that runs every 5 minutes to close connections idle \u003e30min.\n\nAdd max cache size enforcement (LRU eviction when full).\n\nMake limits configurable via env vars:\n- BEADS_DAEMON_MAX_CACHE_SIZE (default: 50)\n- BEADS_DAEMON_CACHE_TTL (default: 30m)","acceptance_criteria":"- Cache evicts entries after 30min idle\n- Cache respects max size limit\n- Cleanup goroutine runs periodically\n- Evicted storage connections are properly closed\n- No resource leaks under sustained load\n- Unit tests for eviction logic","status":"open","priority":0,"issue_type":"feature","created_at":"2025-10-18T13:05:46.174245-07:00","updated_at":"2025-10-18T13:05:46.174245-07:00","dependencies":[{"issue_id":"bd-145","depends_on_id":"bd-155","type":"parent-child","created_at":"2025-10-18T13:07:49.077954-07:00","created_by":"daemon"}]} {"id":"bd-145","title":"Add storage cache eviction policy to daemon","description":"Daemon caches DB connections forever in storageCache map (server.go:29). 
For users with 50+ repos, this causes memory leaks and file descriptor exhaustion.\n\nNeed LRU cache with:\n- Max size limit (default: 50 repos)\n- TTL-based eviction (default: 30min idle)\n- Periodic cleanup goroutine\n\nLocation: internal/rpc/server.go:29-40","design":"Add StorageCacheEntry struct with lastAccess timestamp.\n\nImplement evictStaleStorage() method that runs every 5 minutes to close connections idle \u003e30min.\n\nAdd max cache size enforcement (LRU eviction when full).\n\nMake limits configurable via env vars:\n- BEADS_DAEMON_MAX_CACHE_SIZE (default: 50)\n- BEADS_DAEMON_CACHE_TTL (default: 30m)","acceptance_criteria":"- Cache evicts entries after 30min idle\n- Cache respects max size limit\n- Cleanup goroutine runs periodically\n- Evicted storage connections are properly closed\n- No resource leaks under sustained load\n- Unit tests for eviction logic","status":"in_progress","priority":0,"issue_type":"feature","created_at":"2025-10-18T13:05:46.174245-07:00","updated_at":"2025-10-18T13:13:08.805418-07:00","dependencies":[{"issue_id":"bd-145","depends_on_id":"bd-155","type":"parent-child","created_at":"2025-10-18T13:07:49.077954-07:00","created_by":"daemon"}]}
{"id":"bd-146","title":"Add daemon health check endpoint and probes","description":"Auto-start only checks socket existence, not daemon responsiveness. Daemon can be running but unresponsive (deadlock, hung DB). Users work in degraded direct mode without knowing why.\n\nNeed health check RPC operation that:\n- Tests DB connectivity (1s timeout)\n- Returns uptime, status, metrics\n- Used by auto-start before connecting\n- Enables monitoring/alerting\n\nLocation: internal/rpc/server.go, cmd/bd/main.go:100-108","design":"Add OpHealth RPC operation to protocol.\n\nhandleHealth() implementation:\n- Quick DB ping with 1s timeout\n- Return status, uptime, version\n- Include basic metrics (connections, cache size)\n\nUpdate TryConnect() to call Health() after socket connection:\n- If health check fails, close connection and return nil\n- Enables transparent failover to direct mode\n\nAdd 'bd daemon --health' CLI command for monitoring.","acceptance_criteria":"- Health check RPC endpoint works\n- Returns structured health status\n- Client uses health check before operations\n- bd daemon --health command exists\n- Unhealthy daemon triggers auto-restart or fallback\n- Health check completes in \u003c2 seconds","status":"open","priority":0,"issue_type":"feature","created_at":"2025-10-18T13:05:58.647592-07:00","updated_at":"2025-10-18T13:05:58.647592-07:00","dependencies":[{"issue_id":"bd-146","depends_on_id":"bd-155","type":"parent-child","created_at":"2025-10-18T13:07:49.093618-07:00","created_by":"daemon"}]} {"id":"bd-146","title":"Add daemon health check endpoint and probes","description":"Auto-start only checks socket existence, not daemon responsiveness. Daemon can be running but unresponsive (deadlock, hung DB). 
Users work in degraded direct mode without knowing why.\n\nNeed health check RPC operation that:\n- Tests DB connectivity (1s timeout)\n- Returns uptime, status, metrics\n- Used by auto-start before connecting\n- Enables monitoring/alerting\n\nLocation: internal/rpc/server.go, cmd/bd/main.go:100-108","design":"Add OpHealth RPC operation to protocol.\n\nhandleHealth() implementation:\n- Quick DB ping with 1s timeout\n- Return status, uptime, version\n- Include basic metrics (connections, cache size)\n\nUpdate TryConnect() to call Health() after socket connection:\n- If health check fails, close connection and return nil\n- Enables transparent failover to direct mode\n\nAdd 'bd daemon --health' CLI command for monitoring.","acceptance_criteria":"- Health check RPC endpoint works\n- Returns structured health status\n- Client uses health check before operations\n- bd daemon --health command exists\n- Unhealthy daemon triggers auto-restart or fallback\n- Health check completes in \u003c2 seconds","status":"open","priority":0,"issue_type":"feature","created_at":"2025-10-18T13:05:58.647592-07:00","updated_at":"2025-10-18T13:05:58.647592-07:00","dependencies":[{"issue_id":"bd-146","depends_on_id":"bd-155","type":"parent-child","created_at":"2025-10-18T13:07:49.093618-07:00","created_by":"daemon"}]}
{"id":"bd-147","title":"Add stale socket and crash recovery for daemon","description":"When daemon crashes (panic, OOM, signal), socket file remains and blocks new daemon start. Users must manually remove .beads/bd.sock.\n\nProblems:\n- Socket file remains after crash\n- PID file remains (isDaemonRunning false positive)\n- No automatic recovery\n- Users get 'daemon already running' error\n\nLocation: cmd/bd/daemon.go, cmd/bd/main.go:221-311","design":"Improve stale detection in tryAutoStartDaemon():\n\n1. If socket exists, try to connect\n2. If connection fails → stale socket, remove it\n3. Also remove PID file and lock files\n4. Retry daemon start\n\nAdd self-healing to daemon startup:\n- On startup, check for stale PID files\n- If PID in file doesn't exist, remove and continue\n- Use exclusive file lock to prevent races\n\nOptional: Add crash recovery watchdog that restarts daemon on exit.","acceptance_criteria":"- Stale sockets are automatically detected and removed\n- Auto-start recovers from daemon crashes\n- No manual intervention needed for crash recovery\n- PID file management is robust\n- Lock files prevent multiple daemon instances\n- Tests for crash recovery scenarios","status":"open","priority":0,"issue_type":"bug","created_at":"2025-10-18T13:06:10.116917-07:00","updated_at":"2025-10-18T13:06:10.116917-07:00","dependencies":[{"issue_id":"bd-147","depends_on_id":"bd-155","type":"parent-child","created_at":"2025-10-18T13:07:49.108099-07:00","created_by":"daemon"}]} {"id":"bd-147","title":"Add stale socket and crash recovery for daemon","description":"When daemon crashes (panic, OOM, signal), socket file remains and blocks new daemon start. 
Users must manually remove .beads/bd.sock.\n\nProblems:\n- Socket file remains after crash\n- PID file remains (isDaemonRunning false positive)\n- No automatic recovery\n- Users get 'daemon already running' error\n\nLocation: cmd/bd/daemon.go, cmd/bd/main.go:221-311","design":"Improve stale detection in tryAutoStartDaemon():\n\n1. If socket exists, try to connect\n2. If connection fails → stale socket, remove it\n3. Also remove PID file and lock files\n4. Retry daemon start\n\nAdd self-healing to daemon startup:\n- On startup, check for stale PID files\n- If PID in file doesn't exist, remove and continue\n- Use exclusive file lock to prevent races\n\nOptional: Add crash recovery watchdog that restarts daemon on exit.","acceptance_criteria":"- Stale sockets are automatically detected and removed\n- Auto-start recovers from daemon crashes\n- No manual intervention needed for crash recovery\n- PID file management is robust\n- Lock files prevent multiple daemon instances\n- Tests for crash recovery scenarios","status":"open","priority":0,"issue_type":"bug","created_at":"2025-10-18T13:06:10.116917-07:00","updated_at":"2025-10-18T13:06:10.116917-07:00","dependencies":[{"issue_id":"bd-147","depends_on_id":"bd-155","type":"parent-child","created_at":"2025-10-18T13:07:49.108099-07:00","created_by":"daemon"}]}
{"id":"bd-148","title":"Add lifecycle management for beads-mcp processes","description":"MCP server processes accumulate without cleanup. Each tool invocation spawns a new Python process that lingers after Claude disconnects.\n\nObserved: 6+ beads-mcp processes running simultaneously.\n\nProblems:\n- No parent-child relationship tracking\n- No cleanup on MCP client disconnect\n- Processes leak over days of use\n- Could accumulate hundreds of processes\n\nLocation: integrations/beads-mcp/src/beads_mcp/server.py","design":"Add proper cleanup handlers to MCP server:\n\n1. Register atexit handler to close daemon connections\n2. Handle SIGTERM/SIGINT for graceful shutdown\n3. Close daemon client in cleanup()\n4. Remove any temp files\n\nOptional improvements:\n- Track active connections to daemon\n- Implement connection pooling\n- Add process timeout/TTL\n- Log lifecycle events for debugging\n\nExample:\nimport atexit\nimport signal\n\ndef cleanup():\n # Close daemon connections\n # Remove temp files\n pass\n\natexit.register(cleanup)\nsignal.signal(signal.SIGTERM, lambda s, f: cleanup())","acceptance_criteria":"- MCP processes clean up on exit\n- Daemon connections are properly closed\n- No process leaks after repeated use\n- Signal handlers work correctly\n- Cleanup runs on normal and abnormal exit\n- Test with multiple concurrent MCP invocations","status":"open","priority":0,"issue_type":"bug","created_at":"2025-10-18T13:06:22.030027-07:00","updated_at":"2025-10-18T13:06:22.030027-07:00","dependencies":[{"issue_id":"bd-148","depends_on_id":"bd-155","type":"parent-child","created_at":"2025-10-18T13:07:49.121494-07:00","created_by":"daemon"}]} {"id":"bd-148","title":"Add lifecycle management for beads-mcp processes","description":"MCP server processes accumulate without cleanup. 
Each tool invocation spawns a new Python process that lingers after Claude disconnects.\n\nObserved: 6+ beads-mcp processes running simultaneously.\n\nProblems:\n- No parent-child relationship tracking\n- No cleanup on MCP client disconnect\n- Processes leak over days of use\n- Could accumulate hundreds of processes\n\nLocation: integrations/beads-mcp/src/beads_mcp/server.py","design":"Add proper cleanup handlers to MCP server:\n\n1. Register atexit handler to close daemon connections\n2. Handle SIGTERM/SIGINT for graceful shutdown\n3. Close daemon client in cleanup()\n4. Remove any temp files\n\nOptional improvements:\n- Track active connections to daemon\n- Implement connection pooling\n- Add process timeout/TTL\n- Log lifecycle events for debugging\n\nExample:\nimport atexit\nimport signal\n\ndef cleanup():\n # Close daemon connections\n # Remove temp files\n pass\n\natexit.register(cleanup)\nsignal.signal(signal.SIGTERM, lambda s, f: cleanup())","acceptance_criteria":"- MCP processes clean up on exit\n- Daemon connections are properly closed\n- No process leaks after repeated use\n- Signal handlers work correctly\n- Cleanup runs on normal and abnormal exit\n- Test with multiple concurrent MCP invocations","status":"open","priority":0,"issue_type":"bug","created_at":"2025-10-18T13:06:22.030027-07:00","updated_at":"2025-10-18T13:06:22.030027-07:00","dependencies":[{"issue_id":"bd-148","depends_on_id":"bd-155","type":"parent-child","created_at":"2025-10-18T13:07:49.121494-07:00","created_by":"daemon"}]}

View File

@@ -18,24 +18,54 @@ import (
"github.com/steveyegge/beads/internal/types" "github.com/steveyegge/beads/internal/types"
) )
// StorageCacheEntry holds a cached storage with metadata for eviction
type StorageCacheEntry struct {
	store      storage.Storage // open storage connection for one repo path
	lastAccess time.Time       // refreshed on each cache hit; drives TTL and LRU eviction
}
// Server represents the RPC server that runs in the daemon
type Server struct {
	socketPath   string
	storage      storage.Storage // Default storage (for backward compat)
	listener     net.Listener
	mu           sync.RWMutex // guards shutdown
	shutdown     bool
	shutdownChan chan struct{} // closed in Stop to end the cleanup goroutine

	// Per-request storage routing with eviction support
	storageCache  map[string]*StorageCacheEntry // path -> entry
	cacheMu       sync.RWMutex                  // guards storageCache
	maxCacheSize  int           // LRU limit; BEADS_DAEMON_MAX_CACHE_SIZE (default 50)
	cacheTTL      time.Duration // idle-eviction threshold; BEADS_DAEMON_CACHE_TTL (default 30m)
	cleanupTicker *time.Ticker  // periodic eviction ticker (nil until cleanup loop starts)
}
// NewServer creates a new RPC server // NewServer creates a new RPC server
func NewServer(socketPath string, store storage.Storage) *Server { func NewServer(socketPath string, store storage.Storage) *Server {
// Parse config from env vars
maxCacheSize := 50 // default
if env := os.Getenv("BEADS_DAEMON_MAX_CACHE_SIZE"); env != "" {
// Parse as integer
var size int
if _, err := fmt.Sscanf(env, "%d", &size); err == nil && size > 0 {
maxCacheSize = size
}
}
cacheTTL := 30 * time.Minute // default
if env := os.Getenv("BEADS_DAEMON_CACHE_TTL"); env != "" {
if ttl, err := time.ParseDuration(env); err == nil {
cacheTTL = ttl
}
}
return &Server{ return &Server{
socketPath: socketPath, socketPath: socketPath,
storage: store, storage: store,
storageCache: make(map[string]storage.Storage), storageCache: make(map[string]*StorageCacheEntry),
maxCacheSize: maxCacheSize,
cacheTTL: cacheTTL,
shutdownChan: make(chan struct{}),
} }
} }
@@ -62,6 +92,7 @@ func (s *Server) Start(ctx context.Context) error {
} }
go s.handleSignals() go s.handleSignals()
go s.runCleanupLoop()
for { for {
conn, err := s.listener.Accept() conn, err := s.listener.Accept()
@@ -85,6 +116,23 @@ func (s *Server) Stop() error {
s.shutdown = true s.shutdown = true
s.mu.Unlock() s.mu.Unlock()
// Signal cleanup goroutine to stop
close(s.shutdownChan)
if s.cleanupTicker != nil {
s.cleanupTicker.Stop()
}
// Close all cached storage connections
s.cacheMu.Lock()
for _, entry := range s.storageCache {
if err := entry.store.Close(); err != nil {
fmt.Fprintf(os.Stderr, "Warning: failed to close storage: %v\n", err)
}
}
s.storageCache = make(map[string]*StorageCacheEntry)
s.cacheMu.Unlock()
if s.listener != nil { if s.listener != nil {
if err := s.listener.Close(); err != nil { if err := s.listener.Close(); err != nil {
return fmt.Errorf("failed to close listener: %w", err) return fmt.Errorf("failed to close listener: %w", err)
@@ -122,6 +170,76 @@ func (s *Server) handleSignals() {
s.Stop() s.Stop()
} }
// runCleanupLoop periodically evicts stale storage connections until the
// server shuts down. It is started as a goroutine from Start.
func (s *Server) runCleanupLoop() {
	// Use a local ticker instead of publishing it on s.cleanupTicker:
	// this goroutine runs concurrently with Stop(), which read the field
	// without holding a lock — a data race. The loop already terminates
	// via shutdownChan, and the deferred Stop releases the ticker, so the
	// shared field (nil-guarded in Stop) is not needed.
	ticker := time.NewTicker(5 * time.Minute)
	defer ticker.Stop()

	for {
		select {
		case <-ticker.C:
			s.evictStaleStorage()
		case <-s.shutdownChan:
			// Stop was called; exit so the daemon can shut down cleanly.
			return
		}
	}
}
// evictStaleStorage removes idle connections and enforces cache size limits.
// TTL-expired entries are dropped first; if the cache still exceeds
// maxCacheSize, the least-recently-used entries are evicted until it fits.
// Evicted connections are closed asynchronously, outside the cache lock.
func (s *Server) evictStaleStorage() {
	now := time.Now()
	var toClose []storage.Storage

	s.cacheMu.Lock()
	defer s.cacheMu.Unlock()

	// First pass: evict TTL-expired entries.
	for path, entry := range s.storageCache {
		if now.Sub(entry.lastAccess) > s.cacheTTL {
			toClose = append(toClose, entry.store)
			delete(s.storageCache, path)
		}
	}

	// Second pass: enforce max cache size with LRU eviction. Repeatedly
	// scan for the entry with the oldest lastAccess and drop it. This is
	// O(k*n) for k evictions, replacing the previous O(n^2) bubble sort;
	// in practice only a few entries are over the limit at a time.
	for len(s.storageCache) > s.maxCacheSize {
		oldestPath := ""
		var oldestTime time.Time
		first := true
		for path, entry := range s.storageCache {
			if first || entry.lastAccess.Before(oldestTime) {
				oldestPath = path
				oldestTime = entry.lastAccess
				first = false
			}
		}
		toClose = append(toClose, s.storageCache[oldestPath].store)
		delete(s.storageCache, oldestPath)
	}

	// Close connections outside of lock to avoid blocking other requests
	// on potentially slow Close() operations.
	go func() {
		for _, store := range toClose {
			if err := store.Close(); err != nil {
				fmt.Fprintf(os.Stderr, "Warning: failed to close evicted storage: %v\n", err)
			}
		}
	}()
}
func (s *Server) handleConnection(conn net.Conn) { func (s *Server) handleConnection(conn net.Conn) {
defer conn.Close() defer conn.Close()
@@ -712,11 +830,13 @@ func (s *Server) getStorageForRequest(req *Request) (storage.Storage, error) {
} }
// Check cache first // Check cache first
s.cacheMu.RLock() s.cacheMu.Lock()
cached, ok := s.storageCache[req.Cwd] defer s.cacheMu.Unlock()
s.cacheMu.RUnlock()
if ok { if entry, ok := s.storageCache[req.Cwd]; ok {
return cached, nil // Update last access time
entry.lastAccess = time.Now()
return entry.store, nil
} }
// Find database for this cwd // Find database for this cwd
@@ -731,10 +851,11 @@ func (s *Server) getStorageForRequest(req *Request) (storage.Storage, error) {
return nil, fmt.Errorf("failed to open database at %s: %w", dbPath, err) return nil, fmt.Errorf("failed to open database at %s: %w", dbPath, err)
} }
// Cache it // Cache it with current timestamp
s.cacheMu.Lock() s.storageCache[req.Cwd] = &StorageCacheEntry{
s.storageCache[req.Cwd] = store store: store,
s.cacheMu.Unlock() lastAccess: time.Now(),
}
return store, nil return store, nil
} }
@@ -784,9 +905,9 @@ func (s *Server) handleReposList(_ *Request) Response {
defer s.cacheMu.RUnlock() defer s.cacheMu.RUnlock()
repos := make([]RepoInfo, 0, len(s.storageCache)) repos := make([]RepoInfo, 0, len(s.storageCache))
for path, store := range s.storageCache { for path, entry := range s.storageCache {
ctx, cancel := context.WithTimeout(context.Background(), 2*time.Second) ctx, cancel := context.WithTimeout(context.Background(), 2*time.Second)
stats, err := store.GetStatistics(ctx) stats, err := entry.store.GetStatistics(ctx)
cancel() cancel()
if err != nil { if err != nil {
continue continue
@@ -795,7 +916,7 @@ func (s *Server) handleReposList(_ *Request) Response {
// Extract prefix from a sample issue // Extract prefix from a sample issue
filter := types.IssueFilter{Limit: 1} filter := types.IssueFilter{Limit: 1}
ctx2, cancel2 := context.WithTimeout(context.Background(), 1*time.Second) ctx2, cancel2 := context.WithTimeout(context.Background(), 1*time.Second)
issues, err := store.SearchIssues(ctx2, "", filter) issues, err := entry.store.SearchIssues(ctx2, "", filter)
cancel2() cancel2()
prefix := "" prefix := ""
if err == nil && len(issues) > 0 && len(issues[0].ID) > 0 { if err == nil && len(issues) > 0 && len(issues[0].ID) > 0 {
@@ -813,7 +934,7 @@ func (s *Server) handleReposList(_ *Request) Response {
Path: path, Path: path,
Prefix: prefix, Prefix: prefix,
IssueCount: stats.TotalIssues, IssueCount: stats.TotalIssues,
LastAccess: "active", LastAccess: entry.lastAccess.Format(time.RFC3339),
}) })
} }
@@ -839,7 +960,7 @@ func (s *Server) handleReposReady(req *Request) Response {
if args.GroupByRepo { if args.GroupByRepo {
result := make([]RepoReadyWork, 0, len(s.storageCache)) result := make([]RepoReadyWork, 0, len(s.storageCache))
for path, store := range s.storageCache { for path, entry := range s.storageCache {
filter := types.WorkFilter{ filter := types.WorkFilter{
Status: types.StatusOpen, Status: types.StatusOpen,
Limit: args.Limit, Limit: args.Limit,
@@ -852,7 +973,7 @@ func (s *Server) handleReposReady(req *Request) Response {
} }
ctx, cancel := context.WithTimeout(context.Background(), 2*time.Second) ctx, cancel := context.WithTimeout(context.Background(), 2*time.Second)
issues, err := store.GetReadyWork(ctx, filter) issues, err := entry.store.GetReadyWork(ctx, filter)
cancel() cancel()
if err != nil || len(issues) == 0 { if err != nil || len(issues) == 0 {
continue continue
@@ -873,7 +994,7 @@ func (s *Server) handleReposReady(req *Request) Response {
// Flat list of all ready issues across all repos // Flat list of all ready issues across all repos
allIssues := make([]ReposReadyIssue, 0) allIssues := make([]ReposReadyIssue, 0)
for path, store := range s.storageCache { for path, entry := range s.storageCache {
filter := types.WorkFilter{ filter := types.WorkFilter{
Status: types.StatusOpen, Status: types.StatusOpen,
Limit: args.Limit, Limit: args.Limit,
@@ -886,7 +1007,7 @@ func (s *Server) handleReposReady(req *Request) Response {
} }
ctx, cancel := context.WithTimeout(context.Background(), 2*time.Second) ctx, cancel := context.WithTimeout(context.Background(), 2*time.Second)
issues, err := store.GetReadyWork(ctx, filter) issues, err := entry.store.GetReadyWork(ctx, filter)
cancel() cancel()
if err != nil { if err != nil {
continue continue
@@ -916,9 +1037,9 @@ func (s *Server) handleReposStats(_ *Request) Response {
perRepo := make(map[string]types.Statistics) perRepo := make(map[string]types.Statistics)
errors := make(map[string]string) errors := make(map[string]string)
for path, store := range s.storageCache { for path, entry := range s.storageCache {
ctx, cancel := context.WithTimeout(context.Background(), 2*time.Second) ctx, cancel := context.WithTimeout(context.Background(), 2*time.Second)
stats, err := store.GetStatistics(ctx) stats, err := entry.store.GetStatistics(ctx)
cancel() cancel()
if err != nil { if err != nil {
errors[path] = err.Error() errors[path] = err.Error()
@@ -957,10 +1078,10 @@ func (s *Server) handleReposClearCache(_ *Request) Response {
// to avoid holding lock during potentially slow Close() operations // to avoid holding lock during potentially slow Close() operations
s.cacheMu.Lock() s.cacheMu.Lock()
stores := make([]storage.Storage, 0, len(s.storageCache)) stores := make([]storage.Storage, 0, len(s.storageCache))
for _, store := range s.storageCache { for _, entry := range s.storageCache {
stores = append(stores, store) stores = append(stores, entry.store)
} }
s.storageCache = make(map[string]storage.Storage) s.storageCache = make(map[string]*StorageCacheEntry)
s.cacheMu.Unlock() s.cacheMu.Unlock()
// Close all storage connections without holding lock // Close all storage connections without holding lock

View File

@@ -0,0 +1,307 @@
package rpc
import (
"os"
"path/filepath"
"testing"
"time"
"github.com/steveyegge/beads/internal/storage/sqlite"
)
// TestStorageCacheEviction_TTL verifies that entries idle longer than
// cacheTTL are removed by evictStaleStorage.
func TestStorageCacheEviction_TTL(t *testing.T) {
	tmpDir := t.TempDir()

	// Create main DB backing the server's default storage.
	mainDB := filepath.Join(tmpDir, "main.db")
	mainStore, err := sqlite.New(mainDB)
	if err != nil {
		t.Fatal(err)
	}
	defer mainStore.Close()

	// Create server with short TTL for testing.
	socketPath := filepath.Join(tmpDir, "test.sock")
	server := NewServer(socketPath, mainStore)
	server.cacheTTL = 100 * time.Millisecond
	defer server.Stop()

	// Create two test repo databases (checking MkdirAll errors so a
	// filesystem failure doesn't surface as a confusing sqlite error).
	repos := []string{"repo1", "repo2"}
	for _, repo := range repos {
		dbPath := filepath.Join(tmpDir, repo, ".beads", "issues.db")
		if err := os.MkdirAll(filepath.Dir(dbPath), 0755); err != nil {
			t.Fatal(err)
		}
		store, err := sqlite.New(dbPath)
		if err != nil {
			t.Fatal(err)
		}
		store.Close()
	}

	// Access both repos to populate cache.
	for _, repo := range repos {
		req := &Request{Cwd: filepath.Join(tmpDir, repo)}
		if _, err := server.getStorageForRequest(req); err != nil {
			t.Fatal(err)
		}
	}

	// Verify both are cached.
	server.cacheMu.RLock()
	cacheSize := len(server.storageCache)
	server.cacheMu.RUnlock()
	if cacheSize != 2 {
		t.Fatalf("expected 2 cached entries, got %d", cacheSize)
	}

	// Wait for TTL to expire, then run eviction.
	time.Sleep(150 * time.Millisecond)
	server.evictStaleStorage()

	// Verify both entries were evicted.
	server.cacheMu.RLock()
	cacheSize = len(server.storageCache)
	server.cacheMu.RUnlock()
	if cacheSize != 0 {
		t.Fatalf("expected 0 cached entries after TTL eviction, got %d", cacheSize)
	}
}
// TestStorageCacheEviction_LRU verifies that evictStaleStorage enforces
// maxCacheSize by evicting the least-recently-used entries first.
func TestStorageCacheEviction_LRU(t *testing.T) {
	tmpDir := t.TempDir()

	// Create main DB backing the server's default storage.
	mainDB := filepath.Join(tmpDir, "main.db")
	mainStore, err := sqlite.New(mainDB)
	if err != nil {
		t.Fatal(err)
	}
	defer mainStore.Close()

	// Small cache with a long TTL so only LRU eviction can fire.
	socketPath := filepath.Join(tmpDir, "test.sock")
	server := NewServer(socketPath, mainStore)
	server.maxCacheSize = 2 // Only keep 2 entries
	server.cacheTTL = 1 * time.Hour
	defer server.Stop()

	// Create three test repo databases, checking MkdirAll errors.
	repos := []string{"repo1", "repo2", "repo3"}
	for _, repo := range repos {
		dbPath := filepath.Join(tmpDir, repo, ".beads", "issues.db")
		if err := os.MkdirAll(filepath.Dir(dbPath), 0755); err != nil {
			t.Fatal(err)
		}
		store, err := sqlite.New(dbPath)
		if err != nil {
			t.Fatal(err)
		}
		store.Close()
	}

	// Access repos 1 and 2, sleeping between accesses so their
	// lastAccess timestamps differ (repo1 becomes the oldest).
	req1 := &Request{Cwd: filepath.Join(tmpDir, "repo1")}
	if _, err := server.getStorageForRequest(req1); err != nil {
		t.Fatal(err)
	}
	time.Sleep(10 * time.Millisecond)
	req2 := &Request{Cwd: filepath.Join(tmpDir, "repo2")}
	if _, err := server.getStorageForRequest(req2); err != nil {
		t.Fatal(err)
	}

	// Verify 2 entries cached.
	server.cacheMu.RLock()
	cacheSize := len(server.storageCache)
	server.cacheMu.RUnlock()
	if cacheSize != 2 {
		t.Fatalf("expected 2 cached entries, got %d", cacheSize)
	}

	// Access repo 3 so the cache exceeds maxCacheSize, then run eviction
	// explicitly to enforce the limit (eviction is not triggered by the
	// access itself; the cleanup loop does it periodically in production).
	req3 := &Request{Cwd: filepath.Join(tmpDir, "repo3")}
	if _, err := server.getStorageForRequest(req3); err != nil {
		t.Fatal(err)
	}
	server.evictStaleStorage()

	// Should be back to 2 entries, with repo1 (oldest) evicted.
	server.cacheMu.RLock()
	cacheSize = len(server.storageCache)
	_, hasRepo1 := server.storageCache[filepath.Join(tmpDir, "repo1")]
	_, hasRepo2 := server.storageCache[filepath.Join(tmpDir, "repo2")]
	_, hasRepo3 := server.storageCache[filepath.Join(tmpDir, "repo3")]
	server.cacheMu.RUnlock()

	if cacheSize != 2 {
		t.Fatalf("expected 2 cached entries after LRU eviction, got %d", cacheSize)
	}
	if hasRepo1 {
		t.Error("repo1 should have been evicted (oldest)")
	}
	if !hasRepo2 {
		t.Error("repo2 should still be cached")
	}
	if !hasRepo3 {
		t.Error("repo3 should be cached")
	}
}
// TestStorageCacheEviction_LastAccessUpdate verifies that a cache hit in
// getStorageForRequest refreshes the entry's lastAccess timestamp.
func TestStorageCacheEviction_LastAccessUpdate(t *testing.T) {
	tmpDir := t.TempDir()

	// Create main DB backing the server's default storage.
	mainDB := filepath.Join(tmpDir, "main.db")
	mainStore, err := sqlite.New(mainDB)
	if err != nil {
		t.Fatal(err)
	}
	defer mainStore.Close()

	// Create server.
	socketPath := filepath.Join(tmpDir, "test.sock")
	server := NewServer(socketPath, mainStore)
	defer server.Stop()

	// Create test database, checking MkdirAll errors.
	dbPath := filepath.Join(tmpDir, "repo1", ".beads", "issues.db")
	if err := os.MkdirAll(filepath.Dir(dbPath), 0755); err != nil {
		t.Fatal(err)
	}
	store, err := sqlite.New(dbPath)
	if err != nil {
		t.Fatal(err)
	}
	store.Close()

	// First access populates the cache.
	req := &Request{Cwd: filepath.Join(tmpDir, "repo1")}
	if _, err = server.getStorageForRequest(req); err != nil {
		t.Fatal(err)
	}

	// Get initial lastAccess time. Fail cleanly (rather than panicking on
	// a nil entry) if the repo was never cached.
	server.cacheMu.RLock()
	entry, ok := server.storageCache[filepath.Join(tmpDir, "repo1")]
	if !ok {
		server.cacheMu.RUnlock()
		t.Fatal("expected repo1 to be cached after first access")
	}
	initialTime := entry.lastAccess
	server.cacheMu.RUnlock()

	// Wait a bit so the timestamps can differ.
	time.Sleep(50 * time.Millisecond)

	// Access again (cache hit).
	if _, err = server.getStorageForRequest(req); err != nil {
		t.Fatal(err)
	}

	// Verify lastAccess was updated.
	server.cacheMu.RLock()
	entry, ok = server.storageCache[filepath.Join(tmpDir, "repo1")]
	if !ok {
		server.cacheMu.RUnlock()
		t.Fatal("expected repo1 to still be cached after second access")
	}
	updatedTime := entry.lastAccess
	server.cacheMu.RUnlock()

	if !updatedTime.After(initialTime) {
		t.Errorf("lastAccess should be updated on cache hit, initial: %v, updated: %v", initialTime, updatedTime)
	}
}
// TestStorageCacheEviction_EnvVars verifies that NewServer reads cache
// limits from BEADS_DAEMON_MAX_CACHE_SIZE and BEADS_DAEMON_CACHE_TTL.
func TestStorageCacheEviction_EnvVars(t *testing.T) {
	tmpDir := t.TempDir()

	// Create main DB backing the server's default storage.
	mainDB := filepath.Join(tmpDir, "main.db")
	mainStore, err := sqlite.New(mainDB)
	if err != nil {
		t.Fatal(err)
	}
	defer mainStore.Close()

	// t.Setenv restores any pre-existing values when the test finishes
	// (the previous os.Setenv + defer os.Unsetenv pair silently dropped
	// values the environment already had, polluting later tests).
	t.Setenv("BEADS_DAEMON_MAX_CACHE_SIZE", "100")
	t.Setenv("BEADS_DAEMON_CACHE_TTL", "1h30m")

	// Create server.
	socketPath := filepath.Join(tmpDir, "test.sock")
	server := NewServer(socketPath, mainStore)
	defer server.Stop()

	// Verify config was parsed.
	if server.maxCacheSize != 100 {
		t.Errorf("expected maxCacheSize=100, got %d", server.maxCacheSize)
	}
	expectedTTL := 90 * time.Minute
	if server.cacheTTL != expectedTTL {
		t.Errorf("expected cacheTTL=%v, got %v", expectedTTL, server.cacheTTL)
	}
}
// TestStorageCacheEviction_CleanupOnStop ensures Stop closes and clears
// every cached storage connection.
func TestStorageCacheEviction_CleanupOnStop(t *testing.T) {
	tmpDir := t.TempDir()

	// Main DB backing the server's default storage.
	mainDB := filepath.Join(tmpDir, "main.db")
	mainStore, err := sqlite.New(mainDB)
	if err != nil {
		t.Fatal(err)
	}
	defer mainStore.Close()

	server := NewServer(filepath.Join(tmpDir, "test.sock"), mainStore)

	// Prepare a repo database and pull it into the cache.
	dbPath := filepath.Join(tmpDir, "repo1", ".beads", "issues.db")
	os.MkdirAll(filepath.Dir(dbPath), 0755)
	repoStore, err := sqlite.New(dbPath)
	if err != nil {
		t.Fatal(err)
	}
	repoStore.Close()

	if _, err = server.getStorageForRequest(&Request{Cwd: filepath.Join(tmpDir, "repo1")}); err != nil {
		t.Fatal(err)
	}

	// Helper to read the cache size under the read lock.
	cachedCount := func() int {
		server.cacheMu.RLock()
		defer server.cacheMu.RUnlock()
		return len(server.storageCache)
	}

	if n := cachedCount(); n != 1 {
		t.Fatalf("expected 1 cached entry, got %d", n)
	}

	// Stop the server; it should close and clear the cache.
	if err := server.Stop(); err != nil {
		t.Fatal(err)
	}

	if n := cachedCount(); n != 0 {
		t.Errorf("expected cache to be cleared on stop, got %d entries", n)
	}
}