feat: configure Honcho LLM via OpenCode Go, clean up compose.yml
This commit is contained in:
@@ -29,7 +29,7 @@ URL = "redis://honcho-redis:6379/0"
|
||||
[llm]
|
||||
DEFAULT_MAX_TOKENS = 4096
|
||||
|
||||
# Embeddings via Ollama (nomic-embed-text recommended on this system)
|
||||
# Embeddings via local Ollama (nomic-embed-text)
|
||||
[embedding]
|
||||
VECTOR_DIMENSIONS = 768
|
||||
MAX_INPUT_TOKENS = 8192
|
||||
@@ -40,6 +40,7 @@ model = "nomic-embed-text"
|
||||
base_url = "http://ollama:11434/v1"
|
||||
|
||||
# --- Deriver (user representation builder) ---
|
||||
# Uses DeepSeek V3 Flash via OpenCode Go
|
||||
[deriver]
|
||||
ENABLED = true
|
||||
WORKERS = 1
|
||||
@@ -48,10 +49,11 @@ FLUSH_ENABLED = true
|
||||
|
||||
[deriver.model_config]
|
||||
transport = "openai"
|
||||
model = "hermes-3"
|
||||
base_url = "http://ollama:11434/v1"
|
||||
model = "deepseek/deepseek-v3-flash"
|
||||
base_url = "https://opencode.ai/zen/go/v1"
|
||||
|
||||
# --- Dialectic ---
|
||||
# All levels use DeepSeek V3 Flash via OpenCode Go
|
||||
[dialectic]
|
||||
MAX_INPUT_TOKENS = 4096
|
||||
SESSION_HISTORY_MAX_TOKENS = 8192
|
||||
@@ -61,36 +63,36 @@ MAX_TOOL_ITERATIONS = 1
|
||||
MAX_OUTPUT_TOKENS = 512
|
||||
[dialectic.levels.minimal.model_config]
|
||||
transport = "openai"
|
||||
model = "hermes-3"
|
||||
base_url = "http://ollama:11434/v1"
|
||||
model = "deepseek/deepseek-v3-flash"
|
||||
base_url = "https://opencode.ai/zen/go/v1"
|
||||
|
||||
[dialectic.levels.low]
|
||||
MAX_TOOL_ITERATIONS = 3
|
||||
[dialectic.levels.low.model_config]
|
||||
transport = "openai"
|
||||
model = "hermes-3"
|
||||
base_url = "http://ollama:11434/v1"
|
||||
model = "deepseek/deepseek-v3-flash"
|
||||
base_url = "https://opencode.ai/zen/go/v1"
|
||||
|
||||
[dialectic.levels.medium]
|
||||
MAX_TOOL_ITERATIONS = 2
|
||||
[dialectic.levels.medium.model_config]
|
||||
transport = "openai"
|
||||
model = "hermes-3"
|
||||
base_url = "http://ollama:11434/v1"
|
||||
model = "deepseek/deepseek-v3-flash"
|
||||
base_url = "https://opencode.ai/zen/go/v1"
|
||||
|
||||
[dialectic.levels.high]
|
||||
MAX_TOOL_ITERATIONS = 4
|
||||
[dialectic.levels.high.model_config]
|
||||
transport = "openai"
|
||||
model = "hermes-3"
|
||||
base_url = "http://ollama:11434/v1"
|
||||
model = "deepseek/deepseek-v3-flash"
|
||||
base_url = "https://opencode.ai/zen/go/v1"
|
||||
|
||||
[dialectic.levels.max]
|
||||
MAX_TOOL_ITERATIONS = 10
|
||||
[dialectic.levels.max.model_config]
|
||||
transport = "openai"
|
||||
model = "hermes-3"
|
||||
base_url = "http://ollama:11434/v1"
|
||||
model = "deepseek/deepseek-v3-flash"
|
||||
base_url = "https://opencode.ai/zen/go/v1"
|
||||
|
||||
# --- Summary ---
|
||||
[summary]
|
||||
@@ -100,8 +102,8 @@ MESSAGES_PER_LONG_SUMMARY = 60
|
||||
|
||||
[summary.model_config]
|
||||
transport = "openai"
|
||||
model = "hermes-3"
|
||||
base_url = "http://ollama:11434/v1"
|
||||
model = "deepseek/deepseek-v3-flash"
|
||||
base_url = "https://opencode.ai/zen/go/v1"
|
||||
|
||||
# --- Dream ---
|
||||
[dream]
|
||||
|
||||
Reference in New Issue
Block a user