# compose/build/honcho/config.toml

# Honcho Configuration
# Pre-configured for self-hosted deployment with Ollama embeddings.
# Mount this file at /app/config.toml in the Honcho container.
#
# Environment variables override these values at runtime
# (e.g. DB_CONNECTION_URI, DERIVER_*).

# Application-wide settings.
[app]
LOG_LEVEL = "INFO"
NAMESPACE = "honcho"
# NOTE(review): presumably the maximum number of observers allowed per
# session — confirm against Honcho's settings reference.
SESSION_OBSERVERS_LIMIT = 10
# NOTE(review): presumably the token ceiling for context-retrieval
# responses — confirm.
GET_CONTEXT_MAX_TOKENS = 16384
# Message embedding is switched on. Presumably this uses the backend
# configured in the [embedding] table — confirm.
EMBED_MESSAGES = true

# Database settings. No connection string is stored in this file.
[db]
# Connection URI is set via environment variable DB_CONNECTION_URI
SCHEMA = "public"
# Connection-pool tuning.
# NOTE(review): these names mirror SQLAlchemy's engine pool options
# (pool_size, max_overflow, pool_timeout, pool_recycle, pool_pre_ping,
# pool_use_lifo). If that mapping holds, POOL_TIMEOUT and POOL_RECYCLE are
# in seconds — confirm before tuning.
POOL_SIZE = 10
MAX_OVERFLOW = 20
POOL_TIMEOUT = 30
POOL_RECYCLE = 300
POOL_PRE_PING = true
POOL_USE_LIFO = true
# Presumably controls SQL statement logging; left off here.
SQL_DEBUG = false

[auth]
# Authentication is turned off in this configuration.
# NOTE(review): presumably this leaves the API usable by anything that can
# reach the container — confirm the deployment is only exposed on a
# trusted network, or enable auth.
USE_AUTH = false

[llm]
# NOTE(review): presumably the output-token budget used when a feature
# does not set its own limit — confirm.
DEFAULT_MAX_TOKENS = 4096

# Embedding backend: nomic-embed-text, reached on the `ollama` host through
# the "openai" transport at its /v1 base URL.
[embedding]
# Must match the embedding model's output size. nomic-embed-text is
# documented as 768-dimensional — re-check if the model is changed.
VECTOR_DIMENSIONS = 768
# NOTE(review): the per-request budget below (2048) is smaller than the
# per-input budget (8192). Confirm this is intended, e.g. to stay within
# the context window Ollama is running the model with.
MAX_INPUT_TOKENS = 8192
MAX_TOKENS_PER_REQUEST = 2048

[embedding.model_config]
transport = "openai"
model = "nomic-embed-text:latest"
# Ollama does not require an API key, but the environment variable named
# by api_key_env must still be set to a non-empty string.
overrides.base_url = "http://ollama:11434/v1"
overrides.api_key_env = "LLM_OPENAI_API_KEY"

# Deriver settings. The deriver is disabled in this file; DERIVER_*
# environment variables can override these values at runtime.
[deriver]
ENABLED = false
WORKERS = 1
POLLING_SLEEP_INTERVAL_SECONDS = 1.0
STALE_SESSION_TIMEOUT_MINUTES = 5
DEDUPLICATE = true
LOG_OBSERVATIONS = false

# Model used by the deriver, reached on the `ollama` host through the
# "openai" transport.
[deriver.model_config]
transport = "openai"
model = "qwen3.6:27b-q4_K_M"
# Ollama does not require an API key, but the environment variable named
# by api_key_env must still be set to a non-empty string.
overrides.base_url = "http://ollama:11434/v1"
overrides.api_key_env = "LLM_OPENAI_API_KEY"

# Summary settings. Summarization is disabled in this file; the model
# configuration below is kept alongside the toggle.
[summary]
ENABLED = false

# Model used for summaries, reached on the `ollama` host through the
# "openai" transport.
[summary.model_config]
transport = "openai"
model = "qwen3.6:27b-q4_K_M"
# Ollama does not require an API key, but the environment variable named
# by api_key_env must still be set to a non-empty string.
overrides.base_url = "http://ollama:11434/v1"
overrides.api_key_env = "LLM_OPENAI_API_KEY"

[dream]
# The dream feature is disabled in this configuration.
ENABLED = false

[dialectic]
# Token budgets for the dialectic feature.
# NOTE(review): presumably these cap the generated response and the prompt
# context respectively — confirm against Honcho's settings reference.
MAX_OUTPUT_TOKENS = 4096
MAX_INPUT_TOKENS = 16384

[cache]
# Caching is disabled in this configuration.
ENABLED = false

[vector_store]
# Selects pgvector as the vector store.
# NOTE(review): presumably this keeps embeddings in the same PostgreSQL
# database configured under [db] — confirm.
TYPE = "pgvector"

[metrics]
# Metrics are disabled in this configuration.
ENABLED = false

[telemetry]
# Telemetry is disabled in this configuration.
ENABLED = false

[sentry]
# Sentry integration is disabled in this configuration.
ENABLED = false