# heretek-openclaw-core/litellm_config.yaml

# ==============================================================================
# Heretek OpenClaw — LiteLLM Configuration v2.1
# ==============================================================================
# Configuration: AMD GPU + MiniMax Primary + z.ai Failover
# Passthrough Endpoints: Per-agent virtual models
#
# Each agent has a virtual model endpoint (agent/steward, agent/alpha, etc.)
# Users can reassign models via LiteLLM WebUI without changing openclaw.json
#
# DEFAULT MODEL: MiniMax MiniMax-M2.7 (via LiteLLM Gateway)
# FAILOVER: z.ai GLM-5.1 (Coding API)
#
# This file is mounted to the LiteLLM container at /app/config.yaml
# Version: 2.1.0
# Last Updated: 2026-03-31
#
# PROVIDER TEMPLATES: Additional provider configurations are available in:
#   - config/providers/openai.yaml
#   - config/providers/anthropic.yaml
#   - config/providers/google.yaml
#   - config/providers/ollama.yaml
#   - config/providers/azure-openai.yaml
#   - config/providers/xai.yaml
#   - config/providers/combined-example.yaml
# ==============================================================================

model_list:
  # --- MiniMax deployments --------------------------------------------------
  # Both entries take their API key and base URL from the MINIMAX_*
  # environment variables. M2.7 is the primary model.
  - model_name: minimax/MiniMax-M2.7
    model_info:
      description: 'MiniMax MiniMax-M2.7 - Primary model for all agents'
      input_cost_per_token: 0.0000001
      output_cost_per_token: 0.0000004
      max_tokens: 128000
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # Older MiniMax release, kept as the legacy fallback.
  - model_name: minimax/MiniMax-M2.5
    model_info:
      description: 'MiniMax MiniMax-M2.5 - Legacy fallback'
      max_tokens: 128000
    litellm_params:
      model: minimax/MiniMax-M2.5
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # --- z.ai failover deployments --------------------------------------------
  # Each entry uses the `openai/` model prefix together with the ZAI_* API key
  # and base URL environment variables.
  - model_name: zai/glm-5-1
    model_info:
      description: 'z.ai GLM-5.1 - Coding API failover'
      max_tokens: 128000
    litellm_params:
      model: openai/glm-5-1
      api_base: os.environ/ZAI_API_BASE
      api_key: os.environ/ZAI_API_KEY

  # Previous GLM generation, kept as the legacy failover.
  - model_name: zai/glm-5
    model_info:
      description: 'z.ai GLM-5 - Legacy failover'
      max_tokens: 128000
    litellm_params:
      model: openai/glm-5
      api_base: os.environ/ZAI_API_BASE
      api_key: os.environ/ZAI_API_KEY

  # Alternative failover target.
  - model_name: zai/glm-4
    model_info:
      description: 'z.ai GLM-4 - Alternative failover'
      max_tokens: 128000
    litellm_params:
      model: openai/glm-4
      api_base: os.environ/ZAI_API_BASE
      api_key: os.environ/ZAI_API_KEY

  # ==========================================================================
  # AGENT PASSTHROUGH ENDPOINTS (Virtual Models)
  # ==========================================================================
  # Each agent has a virtual model that defaults to MiniMax MiniMax-M2.7
  # (agent/coder is the exception and defaults to z.ai GLM-5.1)
  # Users can reassign these via LiteLLM WebUI without changing openclaw.json
  # ==========================================================================

  # steward | orchestrator | manages the collective workflow
  - model_name: agent/steward
    model_info:
      agent_id: steward
      agent_role: orchestrator
      description: 'Steward Agent - Orchestrator role'
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # alpha | triad | primary deliberator
  - model_name: agent/alpha
    model_info:
      agent_id: alpha
      agent_role: triad
      description: 'Alpha Agent - Triad role'
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # beta | triad | secondary deliberator
  - model_name: agent/beta
    model_info:
      agent_id: beta
      agent_role: triad
      description: 'Beta Agent - Triad role'
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # charlie | triad | final deliberator
  - model_name: agent/charlie
    model_info:
      agent_id: charlie
      agent_role: triad
      description: 'Charlie Agent - Triad role'
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # examiner | interrogator | challenges decisions
  - model_name: agent/examiner
    model_info:
      agent_id: examiner
      agent_role: interrogator
      description: 'Examiner Agent - Interrogator role'
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # explorer | scout | scans for opportunities
  - model_name: agent/explorer
    model_info:
      agent_id: explorer
      agent_role: scout
      description: 'Explorer Agent - Scout role'
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # sentinel | guardian | security and monitoring
  - model_name: agent/sentinel
    model_info:
      agent_id: sentinel
      agent_role: guardian
      description: 'Sentinel Agent - Guardian role'
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # Coder (Artisan) - Code generation and review
  # Defaults to z.ai GLM-5.1 instead of MiniMax. The route below matches the
  # `zai/glm-5-1` deployment entry (`openai/glm-5-1` plus the ZAI_* key and
  # base URL) so every z.ai target in this file is addressed the same way,
  # rather than pointing litellm_params.model at the `zai/glm-5-1` alias name.
  - model_name: agent/coder
    litellm_params:
      model: openai/glm-5-1
      api_key: os.environ/ZAI_API_KEY
      api_base: os.environ/ZAI_API_BASE
    model_info:
      description: "Coder Agent - Artisan role (GLM-5.1 via z.ai passthrough)"
      agent_role: artisan
      agent_id: coder

  # dreamer | visionary | creative speculation, future planning
  - model_name: agent/dreamer
    model_info:
      agent_id: dreamer
      agent_role: visionary
      description: 'Dreamer Agent - Visionary role'
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # empath | diplomat | emotional intelligence, user rapport
  - model_name: agent/empath
    model_info:
      agent_id: empath
      agent_role: diplomat
      description: 'Empath Agent - Diplomat role'
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # historian | archivist | memory keeper, context preservation
  - model_name: agent/historian
    model_info:
      agent_id: historian
      agent_role: archivist
      description: 'Historian Agent - Archivist role'
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # arbiter | adjudicator | decision maker, conflict resolver
  - model_name: agent/arbiter
    model_info:
      agent_id: arbiter
      agent_role: adjudicator
      description: 'Arbiter Agent - Adjudicator role'
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # catalyst | accelerator | process optimization, workflow acceleration
  - model_name: agent/catalyst
    model_info:
      agent_id: catalyst
      agent_role: accelerator
      description: 'Catalyst Agent - Accelerator role'
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # chronos | timekeeper | time management, scheduling
  - model_name: agent/chronos
    model_info:
      agent_id: chronos
      agent_role: timekeeper
      description: 'Chronos Agent - Timekeeper role'
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # coordinator | integrator | cross-agent coordination
  - model_name: agent/coordinator
    model_info:
      agent_id: coordinator
      agent_role: integrator
      description: 'Coordinator Agent - Integrator role'
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # echo | communicator | external communications, broadcasts
  - model_name: agent/echo
    model_info:
      agent_id: echo
      agent_role: communicator
      description: 'Echo Agent - Communicator role'
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # habit-forge | optimizer | habit formation, pattern tracking
  - model_name: agent/habit-forge
    model_info:
      agent_id: habit-forge
      agent_role: optimizer
      description: 'Habit Forge Agent - Optimizer role'
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # metis | strategist | strategic planning, tactical analysis
  - model_name: agent/metis
    model_info:
      agent_id: metis
      agent_role: strategist
      description: 'Metis Agent - Strategist role'
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # nexus | connector | system integration, API management
  - model_name: agent/nexus
    model_info:
      agent_id: nexus
      agent_role: connector
      description: 'Nexus Agent - Connector role'
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # perceiver | sensor | data interpretation, pattern extraction
  - model_name: agent/perceiver
    model_info:
      agent_id: perceiver
      agent_role: sensor
      description: 'Perceiver Agent - Sensor role'
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # prism | analyzer | multi-perspective analysis
  - model_name: agent/prism
    model_info:
      agent_id: prism
      agent_role: analyzer
      description: 'Prism Agent - Analyzer role'
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # sentinel-prime | commander | lead security agent, threat coordination
  - model_name: agent/sentinel-prime
    model_info:
      agent_id: sentinel-prime
      agent_role: commander
      description: 'Sentinel Prime Agent - Commander role'
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_base: os.environ/MINIMAX_API_BASE
      api_key: os.environ/MINIMAX_API_KEY

  # --- Local embedding model (Ollama, AMD GPU) ------------------------------
  # Exposed as `ollama/nomic-embed-text`; served by the Ollama instance at
  # http://ollama:11434 using the nomic-embed-text-v2-moe model.
  - model_name: ollama/nomic-embed-text
    model_info:
      mode: embedding
      embedding_dim: 768
      description: 'Nomic Embed Text v2 MoE - 768 dimensions'
    litellm_params:
      api_base: http://ollama:11434
      model: ollama/nomic-embed-text-v2-moe

  # ==========================================================================
  # MODEL ALIASES (Convenience)
  # ==========================================================================
  # `default` and `fast` both resolve to MiniMax MiniMax-M2.7.
  - model_name: default
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_key: os.environ/MINIMAX_API_KEY
      api_base: os.environ/MINIMAX_API_BASE

  - model_name: fast
    litellm_params:
      model: minimax/MiniMax-M2.7
      api_key: os.environ/MINIMAX_API_KEY
      api_base: os.environ/MINIMAX_API_BASE

  # `failover` resolves to z.ai GLM-5.1. It uses the same route as the
  # `zai/glm-5-1` deployment entry (`openai/glm-5-1` plus the ZAI_* key and
  # base URL) instead of pointing litellm_params.model at that alias name, so
  # all z.ai targets in this file are addressed consistently.
  - model_name: failover
    litellm_params:
      model: openai/glm-5-1
      api_key: os.environ/ZAI_API_KEY
      api_base: os.environ/ZAI_API_BASE

# ==============================================================================
# LiteLLM Settings
# ==============================================================================
litellm_settings:
  # Model used when a request does not specify one.
  default_model: minimax/MiniMax-M2.7

  # Verbose logging is off; unsupported request parameters are dropped.
  set_verbose: false
  drop_params: true

  # Per-request timeout, in seconds.
  request_timeout: 300

  # Retry policy.
  num_retries: 3
  retry_after: 2

  # Response cache, pointed at the URL in REDIS_URL.
  cache: true
  cache_params:
    redis_url: os.environ/REDIS_URL
    ttl: 3600

  # Logging callbacks. Only success callbacks are registered.
  success_callback:
    - prometheus
    - langfuse
    - log_cost
  failure_callback: []
  callbacks: []

# ==============================================================================
# General Settings
# ==============================================================================
general_settings:
  # Environment identifier and log level.
  environment: heretek-openclaw
  log_level: INFO

  # Secrets, all read from the environment: the master key authenticates API
  # calls and the salt key is used for encryption.
  master_key: os.environ/LITELLM_MASTER_KEY
  salt_key: os.environ/LITELLM_SALT_KEY

  # Backing stores (database and Redis connection URLs).
  database_url: os.environ/DATABASE_URL
  redis_url: os.environ/REDIS_URL

  # Web UI.
  ui: true
  ui_access_mode: admin

  # Proxy batching.
  proxy_batch_write_at: 60

# ==============================================================================
# A2A (Agent-to-Agent) Protocol Settings
# ==============================================================================
a2a_settings:
  # Master switch for the A2A protocol.
  enabled: true

  # Agent timeout and session TTL are in seconds; sessions are persisted in
  # redis.
  agent_timeout: 300
  session_ttl: 86400
  session_persistence: redis

  # Standard A2A endpoints.
  agent_endpoint_format: '/v1/agents/{agent_name}'
  send_message_endpoint: '/v1/agents/{agent_name}/send'
  receive_message_endpoint: '/v1/agents/{agent_name}/receive'
  health_check_endpoint: '/health'
  health_check_timeout: 10

  # Task handoff between agents.
  task_handoff_endpoint: '/v1/agents/{agent_name}/tasks'
  task_status_endpoint: '/v1/agents/{agent_name}/tasks/{task_id}/status'
  task_handoff:
    enabled: true
    timeout_seconds: 60
    context_preservation: full

  # Streaming responses.
  streaming_endpoint: '/v1/agents/{agent_name}/stream'
  streaming:
    enabled: true
    chunk_size: 1024

  # Agent discovery.
  agent_cards_endpoint: '/v1/agents/.well-known'
  discover_endpoint: '/v1/agents/discover'
  agent_discovery:
    enabled: true
    heartbeat_interval: 30
    stale_agent_timeout: 120

# ==============================================================================
# Router Settings
# ==============================================================================
router_settings:
  # How requests are spread across deployments.
  routing_strategy: simple-shuffle

  # Default rate limit.
  enable_rate_limiting: true
  default_limit_period: 60
  default_limit_requests: 60

  # Periodic model health checks.
  model_health_check:
    enabled: true
    timeout: 10
    check_interval: 30
    recovery_wait: 30
    unhealthy_threshold: 2

  # Fallback order, highest priority first: MiniMax models, then z.ai.
  priority_fallback:
    enabled: true
    fallback_order:
      - minimax/MiniMax-M2.7
      - minimax/MiniMax-M2.5
      - zai/glm-5-1
      - zai/glm-5

# ==============================================================================
# Fallback Models (Priority-Ordered)
# ==============================================================================
fallback_models:
  # Tier 1 - MiniMax (primary provider)
  - minimax/MiniMax-M2.7
  - minimax/MiniMax-M2.5
  # Tier 2 - z.ai Coding API
  - zai/glm-5-1
  - zai/glm-5

# ==============================================================================
# Per-Agent Model Mappings
# ==============================================================================
# This section defines per-agent model configurations that override the default
# model assignments. Each agent can have a primary model, fallback model, and
# a chain of additional fallbacks for high availability.
#
# For detailed configuration files, see: config/agents/<agent>-models.yaml
# ==============================================================================

agent_model_mappings:
  # NOTE: `arbiter` is configured once, further down in this mapping.
  # An earlier `arbiter` entry (Anthropic primary with an OpenAI fallback
  # chain) was removed from this position. YAML mappings must not contain
  # duplicate keys: strict loaders reject the file, and last-key-wins loaders
  # were already discarding that entry in favour of the later one, so the
  # effective arbiter settings are unchanged.

  # coder - code generation and review
  coder:
    primary: anthropic/claude-3-5-sonnet
    fallback: openai/gpt-4o
    fallback_chain:
      - openai/gpt-4-turbo
      - anthropic/claude-3-5-haiku
      - openai/gpt-4o-mini
    temperature: 0.7
    max_tokens: 8192
    budget_daily_usd: 50.00
    api_key_env: ANTHROPIC_API_KEY

  # steward - orchestrator
  steward:
    primary: minimax/MiniMax-M2.7
    fallback: zai/glm-5-1
    temperature: 0.7
    max_tokens: 8192
    budget_daily_usd: 20.00

  # alpha - triad deliberator
  alpha:
    primary: minimax/MiniMax-M2.7
    fallback: anthropic/claude-3-5-sonnet
    temperature: 0.7
    max_tokens: 8192
    budget_daily_usd: 15.00

  # beta - triad deliberator
  beta:
    primary: minimax/MiniMax-M2.7
    fallback: openai/gpt-4o
    temperature: 0.7
    max_tokens: 8192
    budget_daily_usd: 15.00

  # charlie - triad deliberator
  charlie:
    primary: minimax/MiniMax-M2.7
    fallback: anthropic/claude-3-5-haiku
    temperature: 0.7
    max_tokens: 8192
    budget_daily_usd: 15.00

  # examiner - interrogator / challenger
  examiner:
    primary: anthropic/claude-3-5-sonnet
    fallback: openai/gpt-4-turbo
    temperature: 0.4
    max_tokens: 4096
    budget_daily_usd: 20.00

  # explorer - scout / opportunity finder
  explorer:
    primary: minimax/MiniMax-M2.7
    fallback: openai/gpt-4o-mini
    temperature: 0.8
    max_tokens: 4096
    budget_daily_usd: 10.00

  # sentinel - guardian / security
  sentinel:
    primary: minimax/MiniMax-M2.7
    fallback: anthropic/claude-3-haiku
    temperature: 0.3
    max_tokens: 4096
    budget_daily_usd: 10.00

  # dreamer - visionary / creative
  dreamer:
    primary: openai/gpt-4-turbo
    fallback: anthropic/claude-3-5-sonnet
    temperature: 0.9
    max_tokens: 8192
    budget_daily_usd: 15.00

  # empath - diplomat / emotional intelligence
  empath:
    primary: anthropic/claude-3-5-sonnet
    fallback: openai/gpt-4o
    temperature: 0.8
    max_tokens: 4096
    budget_daily_usd: 10.00

  # historian - archivist / memory keeper
  historian:
    primary: minimax/MiniMax-M2.7
    fallback: openai/gpt-4o
    temperature: 0.3
    max_tokens: 8192
    budget_daily_usd: 10.00

  # arbiter - adjudicator / decision maker
  arbiter:
    primary: minimax/MiniMax-M2.7
    fallback: anthropic/claude-3-5-sonnet
    temperature: 0.5
    max_tokens: 8192
    budget_daily_usd: 25.00

  # catalyst - accelerator / process optimization
  catalyst:
    primary: minimax/MiniMax-M2.7
    fallback: openai/gpt-4o-mini
    temperature: 0.7
    max_tokens: 4096
    budget_daily_usd: 10.00

  # chronos - timekeeper / schedule management
  chronos:
    primary: minimax/MiniMax-M2.7
    fallback: openai/gpt-4o
    temperature: 0.5
    max_tokens: 4096
    budget_daily_usd: 10.00

  # coordinator - integrator / cross-agent coordination
  coordinator:
    primary: minimax/MiniMax-M2.7
    fallback: openai/gpt-4o
    temperature: 0.6
    max_tokens: 4096
    budget_daily_usd: 15.00

  # echo - communicator / external communications
  echo:
    primary: minimax/MiniMax-M2.7
    fallback: openai/gpt-4o-mini
    temperature: 0.7
    max_tokens: 4096
    budget_daily_usd: 10.00

  # habit-forge - optimizer / habit formation
  habit-forge:
    primary: minimax/MiniMax-M2.7
    fallback: openai/gpt-4o-mini
    temperature: 0.6
    max_tokens: 4096
    budget_daily_usd: 10.00

  # metis - strategist / strategic planning
  metis:
    primary: minimax/MiniMax-M2.7
    fallback: anthropic/claude-3-5-sonnet
    temperature: 0.7
    max_tokens: 8192
    budget_daily_usd: 20.00

  # nexus - connector / system integration
  nexus:
    primary: minimax/MiniMax-M2.7
    fallback: openai/gpt-4o
    temperature: 0.5
    max_tokens: 4096
    budget_daily_usd: 15.00

  # perceiver - sensor / data interpretation
  perceiver:
    primary: minimax/MiniMax-M2.7
    fallback: openai/gpt-4o
    temperature: 0.6
    max_tokens: 4096
    budget_daily_usd: 15.00

  # prism - analyzer / multi-perspective analysis
  prism:
    primary: minimax/MiniMax-M2.7
    fallback: anthropic/claude-3-5-sonnet
    temperature: 0.7
    max_tokens: 8192
    budget_daily_usd: 15.00

  # sentinel-prime - commander / security coordination
  sentinel-prime:
    primary: minimax/MiniMax-M2.7
    fallback: anthropic/claude-3-haiku
    temperature: 0.3
    max_tokens: 4096
    budget_daily_usd: 15.00

# ==============================================================================
# Budget & Rate Limits (Per Agent)
# ==============================================================================
budget_settings:
  enabled: true

  # Global budget, and the threshold at which an alert is raised.
  global_budget: 5000000
  alert_threshold: 0.8

  # Daily token budget for each agent endpoint.
  agent_budgets:
    # 1,000,000 tokens
    agent/steward: 1000000
    agent/coder: 1000000
    # 800,000 tokens
    agent/arbiter: 800000
    # 500,000 tokens
    agent/alpha: 500000
    agent/beta: 500000
    agent/charlie: 500000
    agent/dreamer: 500000
    agent/historian: 500000
    agent/metis: 500000
    agent/sentinel-prime: 500000
    # 400,000 tokens
    agent/empath: 400000
    agent/catalyst: 400000
    agent/coordinator: 400000
    agent/nexus: 400000
    agent/perceiver: 400000
    agent/prism: 400000
    # 300,000 tokens
    agent/examiner: 300000
    agent/explorer: 300000
    agent/sentinel: 300000
    agent/chronos: 300000
    agent/echo: 300000
    agent/habit-forge: 300000

# ==============================================================================
# Observability Settings
# ==============================================================================
observability:
  # --- Prometheus metrics ---------------------------------------------------
  # Served from the main LiteLLM port at /metrics. Metrics available:
  #   litellm_cost_dollars_total{model, agent}
  #   litellm_tokens_total{model, type=input/output}
  #   litellm_request_count_total{model, status}
  #   litellm_request_latency_seconds{model}
  #   litellm_deployment_failure_responses{model}
  prometheus:
    enabled: true
    port: 4000

  # --- Langfuse tracing (LLM observability) ---------------------------------
  # Traces all LLM calls with costs, latencies, and user sessions.
  # Dashboard: http://localhost:3000
  langfuse:
    enabled: true
    host: os.environ/LANGFUSE_HOST
    public_key: os.environ/LANGFUSE_PUBLIC_KEY
    secret_key: os.environ/LANGFUSE_SECRET_KEY

  # --- OpenTelemetry (distributed tracing) ----------------------------------
  # Exporter type is one of: otlp, jaeger, zipkin.
  opentelemetry:
    enabled: true
    exporter: os.environ/OTEL_EXPORTER_TYPE
    endpoint: os.environ/OTEL_EXPORTER_OTLP_ENDPOINT

  # --- LiteLLM WebUI (built-in admin dashboard) -----------------------------
  # Available at http://localhost:4000/ui. Provides cost tracking per
  # model/key/user, token usage analytics, budget management and alerts, key
  # management, and spend reports. Admin access mode requires master key
  # authentication.
  ui:
    enabled: true
    access_mode: admin

  # --- Cost tracking and budget alerts --------------------------------------
  # Spend is tracked per agent passthrough endpoint. Thresholds are fractions
  # of the budget: 0.8 (80%) is a warning, 1.0 (100%) means budget exceeded.
  cost_tracking:
    enabled: true
    track_agent_costs: true
    alert_threshold_warning: 0.8
    alert_threshold_critical: 1.0

  # --- Slack / webhook alerts (optional) ------------------------------------
  # Alert channel for budget warnings, failures, etc. Disabled here.
  slack:
    enabled: false
    webhook_url: os.environ/SLACK_WEBHOOK_URL

  # --- Health dashboard integration -----------------------------------------
  # Endpoints exposed for external dashboards:
  #   GET /metrics      (Prometheus format)
  #   GET /spend        (JSON spend data)
  #   GET /budget/list  (budget statuses)
  # The Heretek OpenClaw Health Dashboard collects metrics every 30 seconds.
  health_dashboard:
    enabled: true