fix: honcho embedding config - fix base_url nesting, switch to bge-m3, add deriver to CMD
This commit is contained in:
@@ -71,4 +71,4 @@ COPY honcho-nginx.conf /etc/nginx/conf.d/default.conf
|
|||||||
|
|
||||||
EXPOSE 80
|
EXPOSE 80
|
||||||
|
|
||||||
CMD ["sh", "-c", "nginx -g 'daemon off;' & fastapi run --host 127.0.0.1 --port 8000 src/main.py"]
|
CMD ["sh", "-c", "nginx -g 'daemon off;' & fastapi run --host 127.0.0.1 --port 8000 src/main.py & python3 -m src.deriver & wait -n"]
|
||||||
|
|||||||
@@ -29,15 +29,15 @@ URL = "redis://honcho-redis:6379/0"
|
|||||||
[llm]
|
[llm]
|
||||||
DEFAULT_MAX_TOKENS = 4096
|
DEFAULT_MAX_TOKENS = 4096
|
||||||
|
|
||||||
# Embeddings via Ollama
|
# Embeddings via Ollama — bge-m3 produces 1024-dimensional vectors, matching VECTOR_DIMENSIONS below
|
||||||
[embedding]
|
[embedding]
|
||||||
VECTOR_DIMENSIONS = 1024
|
VECTOR_DIMENSIONS = 1024
|
||||||
MAX_INPUT_TOKENS = 8192
|
MAX_INPUT_TOKENS = 8192
|
||||||
|
|
||||||
[embedding.model_config]
|
[embedding.model_config]
|
||||||
transport = "openai"
|
transport = "openai"
|
||||||
model = "nomic-embed-text"
|
model = "bge-m3"
|
||||||
base_url = "http://ollama:11434/v1"
|
overrides = {base_url = "http://ollama:11434/v1", api_key = "ollama"}
|
||||||
|
|
||||||
# --- Deriver ---
|
# --- Deriver ---
|
||||||
[deriver]
|
[deriver]
|
||||||
@@ -47,10 +47,9 @@ POLLING_SLEEP_INTERVAL_SECONDS = 5.0
|
|||||||
FLUSH_ENABLED = true
|
FLUSH_ENABLED = true
|
||||||
|
|
||||||
[deriver.model_config]
|
[deriver.model_config]
|
||||||
|
overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
|
||||||
transport = "openai"
|
transport = "openai"
|
||||||
model = "deepseek-v4-flash"
|
model = "deepseek-v4-flash"
|
||||||
base_url = "https://opencode.ai/zen/go/v1"
|
|
||||||
api_key_env = "HONCHO_OPENAI_API_KEY"
|
|
||||||
|
|
||||||
# --- Dialectic ---
|
# --- Dialectic ---
|
||||||
[dialectic]
|
[dialectic]
|
||||||
@@ -61,42 +60,37 @@ SESSION_HISTORY_MAX_TOKENS = 8192
|
|||||||
MAX_TOOL_ITERATIONS = 1
|
MAX_TOOL_ITERATIONS = 1
|
||||||
MAX_OUTPUT_TOKENS = 512
|
MAX_OUTPUT_TOKENS = 512
|
||||||
[dialectic.levels.minimal.model_config]
|
[dialectic.levels.minimal.model_config]
|
||||||
|
overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
|
||||||
transport = "openai"
|
transport = "openai"
|
||||||
model = "deepseek-v4-flash"
|
model = "deepseek-v4-flash"
|
||||||
base_url = "https://opencode.ai/zen/go/v1"
|
|
||||||
api_key_env = "HONCHO_OPENAI_API_KEY"
|
|
||||||
|
|
||||||
[dialectic.levels.low]
|
[dialectic.levels.low]
|
||||||
MAX_TOOL_ITERATIONS = 3
|
MAX_TOOL_ITERATIONS = 3
|
||||||
[dialectic.levels.low.model_config]
|
[dialectic.levels.low.model_config]
|
||||||
|
overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
|
||||||
transport = "openai"
|
transport = "openai"
|
||||||
model = "deepseek-v4-flash"
|
model = "deepseek-v4-flash"
|
||||||
base_url = "https://opencode.ai/zen/go/v1"
|
|
||||||
api_key_env = "HONCHO_OPENAI_API_KEY"
|
|
||||||
|
|
||||||
[dialectic.levels.medium]
|
[dialectic.levels.medium]
|
||||||
MAX_TOOL_ITERATIONS = 2
|
MAX_TOOL_ITERATIONS = 2
|
||||||
[dialectic.levels.medium.model_config]
|
[dialectic.levels.medium.model_config]
|
||||||
|
overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
|
||||||
transport = "openai"
|
transport = "openai"
|
||||||
model = "deepseek-v4-flash"
|
model = "deepseek-v4-flash"
|
||||||
base_url = "https://opencode.ai/zen/go/v1"
|
|
||||||
api_key_env = "HONCHO_OPENAI_API_KEY"
|
|
||||||
|
|
||||||
[dialectic.levels.high]
|
[dialectic.levels.high]
|
||||||
MAX_TOOL_ITERATIONS = 4
|
MAX_TOOL_ITERATIONS = 4
|
||||||
[dialectic.levels.high.model_config]
|
[dialectic.levels.high.model_config]
|
||||||
|
overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
|
||||||
transport = "openai"
|
transport = "openai"
|
||||||
model = "deepseek-v4-flash"
|
model = "deepseek-v4-flash"
|
||||||
base_url = "https://opencode.ai/zen/go/v1"
|
|
||||||
api_key_env = "HONCHO_OPENAI_API_KEY"
|
|
||||||
|
|
||||||
[dialectic.levels.max]
|
[dialectic.levels.max]
|
||||||
MAX_TOOL_ITERATIONS = 10
|
MAX_TOOL_ITERATIONS = 10
|
||||||
[dialectic.levels.max.model_config]
|
[dialectic.levels.max.model_config]
|
||||||
|
overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
|
||||||
transport = "openai"
|
transport = "openai"
|
||||||
model = "deepseek-v4-flash"
|
model = "deepseek-v4-flash"
|
||||||
base_url = "https://opencode.ai/zen/go/v1"
|
|
||||||
api_key_env = "HONCHO_OPENAI_API_KEY"
|
|
||||||
|
|
||||||
# --- Summary ---
|
# --- Summary ---
|
||||||
[summary]
|
[summary]
|
||||||
@@ -105,10 +99,9 @@ MESSAGES_PER_SHORT_SUMMARY = 20
|
|||||||
MESSAGES_PER_LONG_SUMMARY = 60
|
MESSAGES_PER_LONG_SUMMARY = 60
|
||||||
|
|
||||||
[summary.model_config]
|
[summary.model_config]
|
||||||
|
overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
|
||||||
transport = "openai"
|
transport = "openai"
|
||||||
model = "deepseek-v4-flash"
|
model = "deepseek-v4-flash"
|
||||||
base_url = "https://opencode.ai/zen/go/v1"
|
|
||||||
api_key_env = "HONCHO_OPENAI_API_KEY"
|
|
||||||
|
|
||||||
# --- Dream ---
|
# --- Dream ---
|
||||||
[dream]
|
[dream]
|
||||||
@@ -121,4 +114,4 @@ ENABLED = true
|
|||||||
# --- Vector Store ---
|
# --- Vector Store ---
|
||||||
[vector_store]
|
[vector_store]
|
||||||
TYPE = "pgvector"
|
TYPE = "pgvector"
|
||||||
DIMENSIONS = 1024
|
# DIMENSIONS is deprecated and intentionally omitted — VECTOR_DIMENSIONS under [embedding] is authoritative
|
||||||
|
|||||||
Reference in New Issue
Block a user