feat: configure Honcho LLM via OpenCode Go, clean up compose.yml
Some checks failed
Build Hermes agent / build (pull_request) Has been cancelled
Build ollama (gfx906) / build (pull_request) Has been cancelled

This commit is contained in:
2026-05-22 22:07:53 -04:00
parent 70e687a343
commit 58b5355780
2 changed files with 18 additions and 20 deletions

View File

@@ -32,7 +32,7 @@ services:
- default - default
container_name: hermes container_name: hermes
entrypoint: ["/bin/bash", "-c", entrypoint: ["/bin/bash", "-c",
"bash /opt/data/hermes-tools/install.sh && bash /opt/data/hermes-tools/run-multi-gateways.sh && exec /usr/bin/tini -g -- /opt/hermes/docker/entrypoint.sh \"$@\"", "bash /opt/data/hermes-tools/install.sh && exec /usr/bin/tini -g -- /opt/hermes/docker/entrypoint.sh \"$@\"",
"hermes-entrypoint"] "hermes-entrypoint"]
restart: always restart: always
# Gateway run enables the internal API server on port 8642 # Gateway run enables the internal API server on port 8642
@@ -40,10 +40,6 @@ services:
environment: environment:
- OLLAMA_HOST=http://ollama:11434 - OLLAMA_HOST=http://ollama:11434
- HERMES_DASHBOARD=1 - HERMES_DASHBOARD=1
# Multi-profile: comma-separated list of profiles to run as gateways.
# The entrypoint reads this and starts one gateway per profile.
# Add profiles here when they exist on disk (e.g. default,researcher,writer)
- HERMES_PROFILES=ashley,claire,finn,matt,paul
- API_SERVER_ENABLED=true - API_SERVER_ENABLED=true
- API_SERVER_PORT=8642 - API_SERVER_PORT=8642
- API_SERVER_HOST=0.0.0.0 - API_SERVER_HOST=0.0.0.0

View File

@@ -29,7 +29,7 @@ URL = "redis://honcho-redis:6379/0"
[llm] [llm]
DEFAULT_MAX_TOKENS = 4096 DEFAULT_MAX_TOKENS = 4096
# Embeddings via Ollama (nomic-embed-text recommended on this system) # Embeddings via local Ollama (nomic-embed-text)
[embedding] [embedding]
VECTOR_DIMENSIONS = 768 VECTOR_DIMENSIONS = 768
MAX_INPUT_TOKENS = 8192 MAX_INPUT_TOKENS = 8192
@@ -40,6 +40,7 @@ model = "nomic-embed-text"
base_url = "http://ollama:11434/v1" base_url = "http://ollama:11434/v1"
# --- Deriver (user representation builder) --- # --- Deriver (user representation builder) ---
# Uses DeepSeek V3 Flash via OpenCode Go
[deriver] [deriver]
ENABLED = true ENABLED = true
WORKERS = 1 WORKERS = 1
@@ -48,10 +49,11 @@ FLUSH_ENABLED = true
[deriver.model_config] [deriver.model_config]
transport = "openai" transport = "openai"
model = "hermes-3" model = "deepseek/deepseek-v3-flash"
base_url = "http://ollama:11434/v1" base_url = "https://opencode.ai/zen/go/v1"
# --- Dialectic --- # --- Dialectic ---
# All levels use DeepSeek V3 Flash via OpenCode Go
[dialectic] [dialectic]
MAX_INPUT_TOKENS = 4096 MAX_INPUT_TOKENS = 4096
SESSION_HISTORY_MAX_TOKENS = 8192 SESSION_HISTORY_MAX_TOKENS = 8192
@@ -61,36 +63,36 @@ MAX_TOOL_ITERATIONS = 1
MAX_OUTPUT_TOKENS = 512 MAX_OUTPUT_TOKENS = 512
[dialectic.levels.minimal.model_config] [dialectic.levels.minimal.model_config]
transport = "openai" transport = "openai"
model = "hermes-3" model = "deepseek/deepseek-v3-flash"
base_url = "http://ollama:11434/v1" base_url = "https://opencode.ai/zen/go/v1"
[dialectic.levels.low] [dialectic.levels.low]
MAX_TOOL_ITERATIONS = 3 MAX_TOOL_ITERATIONS = 3
[dialectic.levels.low.model_config] [dialectic.levels.low.model_config]
transport = "openai" transport = "openai"
model = "hermes-3" model = "deepseek/deepseek-v3-flash"
base_url = "http://ollama:11434/v1" base_url = "https://opencode.ai/zen/go/v1"
[dialectic.levels.medium] [dialectic.levels.medium]
MAX_TOOL_ITERATIONS = 2 MAX_TOOL_ITERATIONS = 2
[dialectic.levels.medium.model_config] [dialectic.levels.medium.model_config]
transport = "openai" transport = "openai"
model = "hermes-3" model = "deepseek/deepseek-v3-flash"
base_url = "http://ollama:11434/v1" base_url = "https://opencode.ai/zen/go/v1"
[dialectic.levels.high] [dialectic.levels.high]
MAX_TOOL_ITERATIONS = 4 MAX_TOOL_ITERATIONS = 4
[dialectic.levels.high.model_config] [dialectic.levels.high.model_config]
transport = "openai" transport = "openai"
model = "hermes-3" model = "deepseek/deepseek-v3-flash"
base_url = "http://ollama:11434/v1" base_url = "https://opencode.ai/zen/go/v1"
[dialectic.levels.max] [dialectic.levels.max]
MAX_TOOL_ITERATIONS = 10 MAX_TOOL_ITERATIONS = 10
[dialectic.levels.max.model_config] [dialectic.levels.max.model_config]
transport = "openai" transport = "openai"
model = "hermes-3" model = "deepseek/deepseek-v3-flash"
base_url = "http://ollama:11434/v1" base_url = "https://opencode.ai/zen/go/v1"
# --- Summary --- # --- Summary ---
[summary] [summary]
@@ -100,8 +102,8 @@ MESSAGES_PER_LONG_SUMMARY = 60
[summary.model_config] [summary.model_config]
transport = "openai" transport = "openai"
model = "hermes-3" model = "deepseek/deepseek-v3-flash"
base_url = "http://ollama:11434/v1" base_url = "https://opencode.ai/zen/go/v1"
# --- Dream --- # --- Dream ---
[dream] [dream]