Refactors all agent startup paths (witness, refinery, crew, polecat) to use a consistent Manager interface with Start(), Stop(), IsRunning(), and SessionName() methods. Includes: - Witness manager with GUPP propulsion nudge for startup - Refinery manager for engineer sessions - Crew manager for worker agents - Session/polecat manager updates - claude_settings_check doctor check for settings validation - Settings management consolidated from rig/manager.go - Settings location moved outside source repos to prevent conflicts 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>
475 lines
15 KiB
Go
475 lines
15 KiB
Go
// Package session provides polecat session lifecycle management.
|
|
package session
|
|
|
|
import (
|
|
"errors"
|
|
"fmt"
|
|
"os"
|
|
"os/exec"
|
|
"path/filepath"
|
|
"strings"
|
|
"time"
|
|
|
|
"github.com/steveyegge/gastown/internal/claude"
|
|
"github.com/steveyegge/gastown/internal/config"
|
|
"github.com/steveyegge/gastown/internal/constants"
|
|
"github.com/steveyegge/gastown/internal/rig"
|
|
"github.com/steveyegge/gastown/internal/tmux"
|
|
)
|
|
|
|
// debugSession logs non-fatal errors during session startup when GT_DEBUG_SESSION=1.
|
|
// These errors are intentionally suppressed because they don't prevent session operation,
|
|
// but logging them helps diagnose issues when needed.
|
|
func debugSession(context string, err error) {
|
|
if os.Getenv("GT_DEBUG_SESSION") != "" && err != nil {
|
|
fmt.Fprintf(os.Stderr, "[session-debug] %s: %v\n", context, err)
|
|
}
|
|
}
|
|
|
|
// Common errors
|
|
var (
|
|
ErrSessionRunning = errors.New("session already running")
|
|
ErrSessionNotFound = errors.New("session not found")
|
|
ErrPolecatNotFound = errors.New("polecat not found")
|
|
)
|
|
|
|
// Manager handles polecat session lifecycle.
|
|
type Manager struct {
|
|
tmux *tmux.Tmux
|
|
rig *rig.Rig
|
|
}
|
|
|
|
// NewManager creates a new session manager for a rig.
|
|
func NewManager(t *tmux.Tmux, r *rig.Rig) *Manager {
|
|
return &Manager{
|
|
tmux: t,
|
|
rig: r,
|
|
}
|
|
}
|
|
|
|
// StartOptions configures session startup.
|
|
type StartOptions struct {
|
|
// WorkDir overrides the default working directory (polecat clone dir).
|
|
WorkDir string
|
|
|
|
// Issue is an optional issue ID to work on.
|
|
Issue string
|
|
|
|
// Command overrides the default "claude" command.
|
|
Command string
|
|
|
|
// Account specifies the account handle to use (overrides default).
|
|
Account string
|
|
|
|
// ClaudeConfigDir is resolved CLAUDE_CONFIG_DIR for the account.
|
|
// If set, this is injected as an environment variable.
|
|
ClaudeConfigDir string
|
|
}
|
|
|
|
// Info contains information about a running session.
|
|
type Info struct {
|
|
// Polecat is the polecat name.
|
|
Polecat string `json:"polecat"`
|
|
|
|
// SessionID is the tmux session identifier.
|
|
SessionID string `json:"session_id"`
|
|
|
|
// Running indicates if the session is currently active.
|
|
Running bool `json:"running"`
|
|
|
|
// RigName is the rig this session belongs to.
|
|
RigName string `json:"rig_name"`
|
|
|
|
// Attached indicates if someone is attached to the session.
|
|
Attached bool `json:"attached,omitempty"`
|
|
|
|
// Created is when the session was created.
|
|
Created time.Time `json:"created,omitempty"`
|
|
|
|
// Windows is the number of tmux windows.
|
|
Windows int `json:"windows,omitempty"`
|
|
|
|
// LastActivity is when the session last had activity.
|
|
LastActivity time.Time `json:"last_activity,omitempty"`
|
|
}
|
|
|
|
// SessionName generates the tmux session name for a polecat.
|
|
func (m *Manager) SessionName(polecat string) string {
|
|
return fmt.Sprintf("gt-%s-%s", m.rig.Name, polecat)
|
|
}
|
|
|
|
// polecatDir returns the working directory for a polecat.
|
|
func (m *Manager) polecatDir(polecat string) string {
|
|
return filepath.Join(m.rig.Path, "polecats", polecat)
|
|
}
|
|
|
|
// hasPolecat checks if the polecat exists in this rig.
|
|
func (m *Manager) hasPolecat(polecat string) bool {
|
|
// Check filesystem directly to handle newly-created polecats
|
|
polecatPath := m.polecatDir(polecat)
|
|
info, err := os.Stat(polecatPath)
|
|
if err != nil {
|
|
return false
|
|
}
|
|
return info.IsDir()
|
|
}
|
|
|
|
// Start creates and starts a new session for a polecat.
|
|
func (m *Manager) Start(polecat string, opts StartOptions) error {
|
|
if !m.hasPolecat(polecat) {
|
|
return fmt.Errorf("%w: %s", ErrPolecatNotFound, polecat)
|
|
}
|
|
|
|
sessionID := m.SessionName(polecat)
|
|
|
|
// Check if session already exists
|
|
running, err := m.tmux.HasSession(sessionID)
|
|
if err != nil {
|
|
return fmt.Errorf("checking session: %w", err)
|
|
}
|
|
if running {
|
|
return fmt.Errorf("%w: %s", ErrSessionRunning, sessionID)
|
|
}
|
|
|
|
// Determine working directory
|
|
workDir := opts.WorkDir
|
|
if workDir == "" {
|
|
workDir = m.polecatDir(polecat)
|
|
}
|
|
|
|
// Ensure Claude settings exist in polecats/ (not polecats/<name>/) so we don't
|
|
// write into the source repo. Claude walks up the tree to find settings.
|
|
// All polecats share the same settings file.
|
|
polecatsDir := filepath.Join(m.rig.Path, "polecats")
|
|
if err := claude.EnsureSettingsForRole(polecatsDir, "polecat"); err != nil {
|
|
return fmt.Errorf("ensuring Claude settings: %w", err)
|
|
}
|
|
|
|
// Create session
|
|
if err := m.tmux.NewSession(sessionID, workDir); err != nil {
|
|
return fmt.Errorf("creating session: %w", err)
|
|
}
|
|
|
|
// Set environment (non-fatal: session works without these)
|
|
debugSession("SetEnvironment GT_RIG", m.tmux.SetEnvironment(sessionID, "GT_RIG", m.rig.Name))
|
|
debugSession("SetEnvironment GT_POLECAT", m.tmux.SetEnvironment(sessionID, "GT_POLECAT", polecat))
|
|
|
|
// Set CLAUDE_CONFIG_DIR for account selection (non-fatal)
|
|
if opts.ClaudeConfigDir != "" {
|
|
debugSession("SetEnvironment CLAUDE_CONFIG_DIR", m.tmux.SetEnvironment(sessionID, "CLAUDE_CONFIG_DIR", opts.ClaudeConfigDir))
|
|
}
|
|
|
|
// CRITICAL: Set beads environment for worktree polecats (non-fatal: session works without)
|
|
// Polecats need access to TOWN-level beads (parent of rig) for hooks and convoys.
|
|
// Town beads use hq- prefix and store hooks, mail, and cross-rig coordination.
|
|
// BEADS_NO_DAEMON=1 prevents daemon from committing to wrong branch.
|
|
// Using town-level beads ensures gt prime and bd commands can find hooked work.
|
|
townRoot := filepath.Dir(m.rig.Path) // Town root is parent of rig directory
|
|
beadsDir := filepath.Join(townRoot, ".beads")
|
|
debugSession("SetEnvironment BEADS_DIR", m.tmux.SetEnvironment(sessionID, "BEADS_DIR", beadsDir))
|
|
debugSession("SetEnvironment BEADS_NO_DAEMON", m.tmux.SetEnvironment(sessionID, "BEADS_NO_DAEMON", "1"))
|
|
debugSession("SetEnvironment BEADS_AGENT_NAME", m.tmux.SetEnvironment(sessionID, "BEADS_AGENT_NAME", fmt.Sprintf("%s/%s", m.rig.Name, polecat)))
|
|
|
|
// Hook the issue to the polecat if provided via --issue flag
|
|
if opts.Issue != "" {
|
|
agentID := fmt.Sprintf("%s/polecats/%s", m.rig.Name, polecat)
|
|
if err := m.hookIssue(opts.Issue, agentID, workDir); err != nil {
|
|
// Non-fatal - warn but continue (session can still start)
|
|
fmt.Printf("Warning: could not hook issue %s: %v\n", opts.Issue, err)
|
|
}
|
|
}
|
|
|
|
// Apply theme (non-fatal: theming failure doesn't affect operation)
|
|
theme := tmux.AssignTheme(m.rig.Name)
|
|
debugSession("ConfigureGasTownSession", m.tmux.ConfigureGasTownSession(sessionID, theme, m.rig.Name, polecat, "polecat"))
|
|
|
|
// Set pane-died hook for crash detection (non-fatal)
|
|
agentID := fmt.Sprintf("%s/%s", m.rig.Name, polecat)
|
|
debugSession("SetPaneDiedHook", m.tmux.SetPaneDiedHook(sessionID, agentID))
|
|
|
|
// Send initial command with env vars exported inline
|
|
// NOTE: tmux SetEnvironment only affects NEW panes, not the current shell.
|
|
// We must export GT_ROLE, GT_RIG, GT_POLECAT inline for Claude to detect identity.
|
|
command := opts.Command
|
|
if command == "" {
|
|
// Polecats run with full permissions - Gas Town is for grownups
|
|
// Export env vars inline so Claude's role detection works
|
|
command = config.BuildPolecatStartupCommand(m.rig.Name, polecat, m.rig.Path, "")
|
|
}
|
|
if err := m.tmux.SendKeys(sessionID, command); err != nil {
|
|
return fmt.Errorf("sending command: %w", err)
|
|
}
|
|
|
|
// Wait for Claude to start (non-fatal: session continues even if this times out)
|
|
debugSession("WaitForCommand", m.tmux.WaitForCommand(sessionID, constants.SupportedShells, constants.ClaudeStartTimeout))
|
|
|
|
// Accept bypass permissions warning dialog if it appears.
|
|
// When Claude starts with --dangerously-skip-permissions, it shows a warning that
|
|
// requires pressing Down to select "Yes, I accept" and Enter to confirm.
|
|
// This is needed for automated polecat startup.
|
|
debugSession("AcceptBypassPermissionsWarning", m.tmux.AcceptBypassPermissionsWarning(sessionID))
|
|
|
|
// Wait for Claude to be fully ready at the prompt (not just started)
|
|
// PRAGMATIC APPROACH: Use fixed delay rather than detection.
|
|
// WaitForClaudeReady has false positives (detects > in various contexts).
|
|
// Claude startup takes ~5-8 seconds on typical machines.
|
|
// Reduced from 10s to 8s since AcceptBypassPermissionsWarning already adds ~1.2s.
|
|
time.Sleep(8 * time.Second)
|
|
|
|
// Inject startup nudge for predecessor discovery via /resume
|
|
// This becomes the session title in Claude Code's session picker
|
|
address := fmt.Sprintf("%s/polecats/%s", m.rig.Name, polecat)
|
|
debugSession("StartupNudge", StartupNudge(m.tmux, sessionID, StartupNudgeConfig{
|
|
Recipient: address,
|
|
Sender: "witness",
|
|
Topic: "assigned",
|
|
MolID: opts.Issue,
|
|
}))
|
|
|
|
// GUPP: Gas Town Universal Propulsion Principle
|
|
// Send the propulsion nudge to trigger autonomous work execution.
|
|
// The beacon alone is just metadata - this nudge is the actual instruction
|
|
// that triggers Claude to check the hook and begin work.
|
|
// Wait for beacon to be fully processed (needs to be separate prompt)
|
|
time.Sleep(2 * time.Second)
|
|
debugSession("NudgeSession PropulsionNudge", m.tmux.NudgeSession(sessionID, PropulsionNudge()))
|
|
|
|
return nil
|
|
}
|
|
|
|
// Stop terminates a polecat session.
|
|
// If force is true, skips graceful shutdown and kills immediately.
|
|
func (m *Manager) Stop(polecat string, force bool) error {
|
|
sessionID := m.SessionName(polecat)
|
|
|
|
// Check if session exists
|
|
running, err := m.tmux.HasSession(sessionID)
|
|
if err != nil {
|
|
return fmt.Errorf("checking session: %w", err)
|
|
}
|
|
if !running {
|
|
return ErrSessionNotFound
|
|
}
|
|
|
|
// Sync beads before shutdown to preserve any changes
|
|
// Run in the polecat's worktree directory
|
|
if !force {
|
|
polecatDir := m.polecatDir(polecat)
|
|
if err := m.syncBeads(polecatDir); err != nil {
|
|
// Non-fatal - log and continue with shutdown
|
|
fmt.Printf("Warning: beads sync failed: %v\n", err)
|
|
}
|
|
}
|
|
|
|
// Try graceful shutdown first (unless forced, best-effort interrupt)
|
|
if !force {
|
|
_ = m.tmux.SendKeysRaw(sessionID, "C-c")
|
|
time.Sleep(100 * time.Millisecond)
|
|
}
|
|
|
|
// Kill the session
|
|
if err := m.tmux.KillSession(sessionID); err != nil {
|
|
return fmt.Errorf("killing session: %w", err)
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|
|
// syncBeads runs bd sync in the given directory.
|
|
func (m *Manager) syncBeads(workDir string) error {
|
|
cmd := exec.Command("bd", "sync")
|
|
cmd.Dir = workDir
|
|
return cmd.Run()
|
|
}
|
|
|
|
// IsRunning checks if a polecat session is active.
|
|
func (m *Manager) IsRunning(polecat string) (bool, error) {
|
|
sessionID := m.SessionName(polecat)
|
|
return m.tmux.HasSession(sessionID)
|
|
}
|
|
|
|
// Status returns detailed status for a polecat session.
|
|
func (m *Manager) Status(polecat string) (*Info, error) {
|
|
sessionID := m.SessionName(polecat)
|
|
|
|
running, err := m.tmux.HasSession(sessionID)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("checking session: %w", err)
|
|
}
|
|
|
|
info := &Info{
|
|
Polecat: polecat,
|
|
SessionID: sessionID,
|
|
Running: running,
|
|
RigName: m.rig.Name,
|
|
}
|
|
|
|
if !running {
|
|
return info, nil
|
|
}
|
|
|
|
// Get detailed session info
|
|
tmuxInfo, err := m.tmux.GetSessionInfo(sessionID)
|
|
if err != nil {
|
|
// Non-fatal - return basic info
|
|
return info, nil
|
|
}
|
|
|
|
info.Attached = tmuxInfo.Attached
|
|
info.Windows = tmuxInfo.Windows
|
|
|
|
// Parse created time from tmux format (e.g., "Thu Dec 19 10:30:00 2025")
|
|
if tmuxInfo.Created != "" {
|
|
// Try common tmux date formats
|
|
formats := []string{
|
|
"Mon Jan 2 15:04:05 2006",
|
|
"Mon Jan _2 15:04:05 2006",
|
|
time.ANSIC,
|
|
time.UnixDate,
|
|
}
|
|
for _, format := range formats {
|
|
if t, err := time.Parse(format, tmuxInfo.Created); err == nil {
|
|
info.Created = t
|
|
break
|
|
}
|
|
}
|
|
}
|
|
|
|
// Parse activity time (unix timestamp from tmux)
|
|
if tmuxInfo.Activity != "" {
|
|
var activityUnix int64
|
|
if _, err := fmt.Sscanf(tmuxInfo.Activity, "%d", &activityUnix); err == nil && activityUnix > 0 {
|
|
info.LastActivity = time.Unix(activityUnix, 0)
|
|
}
|
|
}
|
|
|
|
return info, nil
|
|
}
|
|
|
|
// List returns information about all sessions for this rig.
|
|
func (m *Manager) List() ([]Info, error) {
|
|
sessions, err := m.tmux.ListSessions()
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
prefix := fmt.Sprintf("gt-%s-", m.rig.Name)
|
|
var infos []Info
|
|
|
|
for _, sessionID := range sessions {
|
|
if !strings.HasPrefix(sessionID, prefix) {
|
|
continue
|
|
}
|
|
|
|
polecat := strings.TrimPrefix(sessionID, prefix)
|
|
infos = append(infos, Info{
|
|
Polecat: polecat,
|
|
SessionID: sessionID,
|
|
Running: true,
|
|
RigName: m.rig.Name,
|
|
})
|
|
}
|
|
|
|
return infos, nil
|
|
}
|
|
|
|
// Attach attaches to a polecat session.
|
|
func (m *Manager) Attach(polecat string) error {
|
|
sessionID := m.SessionName(polecat)
|
|
|
|
running, err := m.tmux.HasSession(sessionID)
|
|
if err != nil {
|
|
return fmt.Errorf("checking session: %w", err)
|
|
}
|
|
if !running {
|
|
return ErrSessionNotFound
|
|
}
|
|
|
|
return m.tmux.AttachSession(sessionID)
|
|
}
|
|
|
|
// Capture returns the recent output from a polecat session.
|
|
func (m *Manager) Capture(polecat string, lines int) (string, error) {
|
|
sessionID := m.SessionName(polecat)
|
|
|
|
running, err := m.tmux.HasSession(sessionID)
|
|
if err != nil {
|
|
return "", fmt.Errorf("checking session: %w", err)
|
|
}
|
|
if !running {
|
|
return "", ErrSessionNotFound
|
|
}
|
|
|
|
return m.tmux.CapturePane(sessionID, lines)
|
|
}
|
|
|
|
// CaptureSession returns the recent output from a session by raw session ID.
|
|
// Use this for crew workers or other non-polecat sessions where the session
|
|
// name doesn't follow the standard gt-{rig}-{polecat} pattern.
|
|
func (m *Manager) CaptureSession(sessionID string, lines int) (string, error) {
|
|
running, err := m.tmux.HasSession(sessionID)
|
|
if err != nil {
|
|
return "", fmt.Errorf("checking session: %w", err)
|
|
}
|
|
if !running {
|
|
return "", ErrSessionNotFound
|
|
}
|
|
|
|
return m.tmux.CapturePane(sessionID, lines)
|
|
}
|
|
|
|
// Inject sends a message to a polecat session.
|
|
// Uses a longer debounce delay for large messages to ensure paste completes.
|
|
func (m *Manager) Inject(polecat, message string) error {
|
|
sessionID := m.SessionName(polecat)
|
|
|
|
running, err := m.tmux.HasSession(sessionID)
|
|
if err != nil {
|
|
return fmt.Errorf("checking session: %w", err)
|
|
}
|
|
if !running {
|
|
return ErrSessionNotFound
|
|
}
|
|
|
|
// Use longer debounce for large messages (spawn context can be 1KB+)
|
|
// Claude needs time to process paste before Enter is sent
|
|
// Scale delay based on message size: 200ms base + 100ms per KB
|
|
debounceMs := 200 + (len(message)/1024)*100
|
|
if debounceMs > 1500 {
|
|
debounceMs = 1500 // Cap at 1.5s for large pastes
|
|
}
|
|
|
|
return m.tmux.SendKeysDebounced(sessionID, message, debounceMs)
|
|
}
|
|
|
|
// StopAll terminates all sessions for this rig.
|
|
func (m *Manager) StopAll(force bool) error {
|
|
infos, err := m.List()
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
var lastErr error
|
|
for _, info := range infos {
|
|
if err := m.Stop(info.Polecat, force); err != nil {
|
|
lastErr = err
|
|
}
|
|
}
|
|
|
|
return lastErr
|
|
}
|
|
|
|
// hookIssue pins an issue to a polecat's hook using bd update.
|
|
// This makes the work visible via 'gt hook' when the session starts.
|
|
func (m *Manager) hookIssue(issueID, agentID, workDir string) error {
|
|
// Use bd update to set status=hooked and assign to the polecat
|
|
cmd := exec.Command("bd", "update", issueID, "--status=hooked", "--assignee="+agentID) //nolint:gosec // G204: bd is a trusted internal tool
|
|
cmd.Dir = workDir
|
|
cmd.Stderr = os.Stderr
|
|
if err := cmd.Run(); err != nil {
|
|
return fmt.Errorf("bd update failed: %w", err)
|
|
}
|
|
fmt.Printf("✓ Hooked issue %s to %s\n", issueID, agentID)
|
|
return nil
|
|
}
|