Compare commits
19 Commits
08778db685
...
feat/honch
| Author | SHA1 | Date | |
|---|---|---|---|
| b185d43d67 | |||
| efaf3550b9 | |||
| 1460085718 | |||
| 6069ebd6a4 | |||
| 5dd6e9a442 | |||
| 54e3868f94 | |||
| 68009f05c1 | |||
| 87e546beae | |||
| b4a0e4449d | |||
| 9635ed8e7e | |||
| 2e8e0b4561 | |||
| 945d4e43a5 | |||
| 14eba26b6b | |||
| 6774af7c13 | |||
| c9a3386138 | |||
| 51018024e9 | |||
| c9b9f63a34 | |||
| 6641071d8f | |||
| 63b6cd3461 |
@@ -1,4 +1,3 @@
|
|||||||
version: "3.8"
|
|
||||||
services:
|
services:
|
||||||
|
|
||||||
# webui:
|
# webui:
|
||||||
@@ -162,25 +161,31 @@ services:
|
|||||||
- "26"
|
- "26"
|
||||||
|
|
||||||
# --- Honcho + OpenConcho combiné: API + Web UI nginx/FastAPI ---
|
# --- Honcho + OpenConcho combiné: API + Web UI nginx/FastAPI ---
|
||||||
honcho-ui:
|
honcho:
|
||||||
build: ./honcho
|
build:
|
||||||
|
context: ./honcho
|
||||||
|
ssh:
|
||||||
|
- default
|
||||||
container_name: honcho
|
container_name: honcho
|
||||||
restart: unless-stopped
|
restart: unless-stopped
|
||||||
environment:
|
environment:
|
||||||
- DB_CONNECTION_URI=postgresql+psycopg://honcho:honcho_pass@honcho-db:5432/honcho
|
- DB_CONNECTION_URI=postgresql+psycopg://honcho:honcho_pass@honcho-db:5432/honcho
|
||||||
- CACHE_URL=redis://honcho-redis:6379/0
|
- CACHE_URL=redis://honcho-redis:6379/0
|
||||||
- CACHE_ENABLED=true
|
- CACHE_ENABLED=true
|
||||||
- EMBEDDING_VECTOR_DIMENSIONS=1536
|
- EMBEDDING_VECTOR_DIMENSIONS=1024
|
||||||
- AUTH_USE_AUTH=true
|
- AUTH_USE_AUTH=true
|
||||||
- AUTH_JWT_SECRET=${AUTH_JWT_SECRET}
|
- AUTH_JWT_SECRET=${HONCHO_AUTH_JWT_SECRET}
|
||||||
- OPENAI_API_KEY=${OPENAI_API_KEY}
|
# Needed by deriver/dream to make LLM calls (api_key_env = "HONCHO_OPENAI_API_KEY" in config.toml)
|
||||||
|
- HONCHO_OPENAI_API_KEY=${HONCHO_OPENAI_API_KEY}
|
||||||
volumes:
|
volumes:
|
||||||
- /mnt/HoardingCow_docker_data/Honcho/data:/app/data
|
- honcho_data:/app/data
|
||||||
|
- /mnt/HoardingCow_docker_data/Honcho/config.toml:/app/config.toml:ro
|
||||||
networks:
|
networks:
|
||||||
- ai_backend
|
- ai_backend
|
||||||
- ai_net
|
- ai_net
|
||||||
labels:
|
labels:
|
||||||
- "traefik.enable=true"
|
- "traefik.enable=true"
|
||||||
|
- "traefik.docker.network=ai_net"
|
||||||
|
|
||||||
# Router for HTTP + redirect to HTTPS
|
# Router for HTTP + redirect to HTTPS
|
||||||
- "traefik.http.routers.honcho-http.rule=Host(`honcho.lazyworkhorse.net`)"
|
- "traefik.http.routers.honcho-http.rule=Host(`honcho.lazyworkhorse.net`)"
|
||||||
@@ -248,6 +253,11 @@ networks:
|
|||||||
ai_backend:
|
ai_backend:
|
||||||
driver: bridge
|
driver: bridge
|
||||||
name: ai_backend
|
name: ai_backend
|
||||||
|
|
||||||
|
volumes:
|
||||||
|
honcho_data:
|
||||||
|
external: true
|
||||||
|
name: honcho_data
|
||||||
|
|
||||||
# llama_cpp_devstral:
|
# llama_cpp_devstral:
|
||||||
# image: ghcr.io/ggml-org/llama.cpp:server-rocm
|
# image: ghcr.io/ggml-org/llama.cpp:server-rocm
|
||||||
|
|||||||
@@ -2,14 +2,15 @@
|
|||||||
FROM python:3.13-slim-bookworm AS honcho-builder
|
FROM python:3.13-slim-bookworm AS honcho-builder
|
||||||
|
|
||||||
RUN apt-get update && \
|
RUN apt-get update && \
|
||||||
apt-get install -y --no-install-recommends git && \
|
apt-get install -y --no-install-recommends git openssh-client && \
|
||||||
rm -rf /var/lib/apt/lists/*
|
rm -rf /var/lib/apt/lists/*
|
||||||
|
|
||||||
COPY --from=ghcr.io/astral-sh/uv:0.9.24 /uv /bin/uv
|
COPY --from=ghcr.io/astral-sh/uv:0.9.24 /uv /bin/uv
|
||||||
|
|
||||||
ARG HONCHO_REPO=https://github.com/plastic-labs/honcho
|
ARG HONCHO_REPO=ssh://git@code.lazyworkhorse.net:2222/Hermes/honcho.git
|
||||||
ARG HONCHO_REF=main
|
ARG HONCHO_REF=main
|
||||||
RUN git clone --depth 1 --branch ${HONCHO_REF} ${HONCHO_REPO} /app
|
RUN mkdir -p -m 0700 ~/.ssh && ssh-keyscan -p 2222 code.lazyworkhorse.net >> ~/.ssh/known_hosts 2>/dev/null
|
||||||
|
RUN --mount=type=ssh git clone --depth 1 --branch ${HONCHO_REF} ${HONCHO_REPO} /app
|
||||||
|
|
||||||
WORKDIR /app
|
WORKDIR /app
|
||||||
|
|
||||||
@@ -29,8 +30,8 @@ RUN corepack enable && corepack prepare pnpm@latest --activate
|
|||||||
WORKDIR /app
|
WORKDIR /app
|
||||||
RUN apt-get update && apt-get install -y git && rm -rf /var/lib/apt/lists/*
|
RUN apt-get update && apt-get install -y git && rm -rf /var/lib/apt/lists/*
|
||||||
|
|
||||||
ARG OPENCONCHO_SHA=e490d911fcb27ee193558fd9a28856cde2057665
|
ARG OPENCONCHO_SHA=3b5c3293fc18d768dbe85285264a8d66c896bd81
|
||||||
RUN git clone --depth 1 https://github.com/offendingcommit/openconcho.git /app && \
|
RUN --mount=type=ssh git clone --depth 1 ssh://git@code.lazyworkhorse.net:2222/gortium/openconcho.git /app && \
|
||||||
git -C /app fetch --depth 1 origin ${OPENCONCHO_SHA} && \
|
git -C /app fetch --depth 1 origin ${OPENCONCHO_SHA} && \
|
||||||
git -C /app checkout ${OPENCONCHO_SHA}
|
git -C /app checkout ${OPENCONCHO_SHA}
|
||||||
|
|
||||||
@@ -71,4 +72,4 @@ COPY honcho-nginx.conf /etc/nginx/conf.d/default.conf
|
|||||||
|
|
||||||
EXPOSE 80
|
EXPOSE 80
|
||||||
|
|
||||||
CMD ["sh", "-c", "nginx -g 'daemon off;' & fastapi run --host 127.0.0.1 --port 8000 src/main.py"]
|
CMD ["bash", "-c", "nginx -g 'daemon off;' & fastapi run --host 127.0.0.1 --port 8000 src/main.py & python3 -m src.deriver & wait -n"]
|
||||||
|
|||||||
@@ -29,15 +29,15 @@ URL = "redis://honcho-redis:6379/0"
|
|||||||
[llm]
|
[llm]
|
||||||
DEFAULT_MAX_TOKENS = 4096
|
DEFAULT_MAX_TOKENS = 4096
|
||||||
|
|
||||||
# Embeddings via Ollama
|
# Embeddings via Ollama — bge-m3 provides 1024-dim
|
||||||
[embedding]
|
[embedding]
|
||||||
VECTOR_DIMENSIONS = 1024
|
VECTOR_DIMENSIONS = 1024
|
||||||
MAX_INPUT_TOKENS = 8192
|
MAX_INPUT_TOKENS = 8192
|
||||||
|
|
||||||
[embedding.model_config]
|
[embedding.model_config]
|
||||||
transport = "openai"
|
transport = "openai"
|
||||||
model = "nomic-embed-text"
|
model = "bge-m3"
|
||||||
base_url = "http://ollama:11434/v1"
|
overrides = {base_url = "http://ollama:11434/v1", api_key = "ollama"}
|
||||||
|
|
||||||
# --- Deriver ---
|
# --- Deriver ---
|
||||||
[deriver]
|
[deriver]
|
||||||
@@ -47,10 +47,9 @@ POLLING_SLEEP_INTERVAL_SECONDS = 5.0
|
|||||||
FLUSH_ENABLED = true
|
FLUSH_ENABLED = true
|
||||||
|
|
||||||
[deriver.model_config]
|
[deriver.model_config]
|
||||||
|
overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
|
||||||
transport = "openai"
|
transport = "openai"
|
||||||
model = "deepseek-v4-flash"
|
model = "deepseek-v4-flash"
|
||||||
base_url = "https://opencode.ai/zen/go/v1"
|
|
||||||
api_key_env = "HONCHO_OPENAI_API_KEY"
|
|
||||||
|
|
||||||
# --- Dialectic ---
|
# --- Dialectic ---
|
||||||
[dialectic]
|
[dialectic]
|
||||||
@@ -61,42 +60,37 @@ SESSION_HISTORY_MAX_TOKENS = 8192
|
|||||||
MAX_TOOL_ITERATIONS = 1
|
MAX_TOOL_ITERATIONS = 1
|
||||||
MAX_OUTPUT_TOKENS = 512
|
MAX_OUTPUT_TOKENS = 512
|
||||||
[dialectic.levels.minimal.model_config]
|
[dialectic.levels.minimal.model_config]
|
||||||
|
overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
|
||||||
transport = "openai"
|
transport = "openai"
|
||||||
model = "deepseek-v4-flash"
|
model = "deepseek-v4-flash"
|
||||||
base_url = "https://opencode.ai/zen/go/v1"
|
|
||||||
api_key_env = "HONCHO_OPENAI_API_KEY"
|
|
||||||
|
|
||||||
[dialectic.levels.low]
|
[dialectic.levels.low]
|
||||||
MAX_TOOL_ITERATIONS = 3
|
MAX_TOOL_ITERATIONS = 3
|
||||||
[dialectic.levels.low.model_config]
|
[dialectic.levels.low.model_config]
|
||||||
|
overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
|
||||||
transport = "openai"
|
transport = "openai"
|
||||||
model = "deepseek-v4-flash"
|
model = "deepseek-v4-flash"
|
||||||
base_url = "https://opencode.ai/zen/go/v1"
|
|
||||||
api_key_env = "HONCHO_OPENAI_API_KEY"
|
|
||||||
|
|
||||||
[dialectic.levels.medium]
|
[dialectic.levels.medium]
|
||||||
MAX_TOOL_ITERATIONS = 2
|
MAX_TOOL_ITERATIONS = 2
|
||||||
[dialectic.levels.medium.model_config]
|
[dialectic.levels.medium.model_config]
|
||||||
|
overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
|
||||||
transport = "openai"
|
transport = "openai"
|
||||||
model = "deepseek-v4-flash"
|
model = "deepseek-v4-flash"
|
||||||
base_url = "https://opencode.ai/zen/go/v1"
|
|
||||||
api_key_env = "HONCHO_OPENAI_API_KEY"
|
|
||||||
|
|
||||||
[dialectic.levels.high]
|
[dialectic.levels.high]
|
||||||
MAX_TOOL_ITERATIONS = 4
|
MAX_TOOL_ITERATIONS = 4
|
||||||
[dialectic.levels.high.model_config]
|
[dialectic.levels.high.model_config]
|
||||||
|
overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
|
||||||
transport = "openai"
|
transport = "openai"
|
||||||
model = "deepseek-v4-flash"
|
model = "deepseek-v4-flash"
|
||||||
base_url = "https://opencode.ai/zen/go/v1"
|
|
||||||
api_key_env = "HONCHO_OPENAI_API_KEY"
|
|
||||||
|
|
||||||
[dialectic.levels.max]
|
[dialectic.levels.max]
|
||||||
MAX_TOOL_ITERATIONS = 10
|
MAX_TOOL_ITERATIONS = 10
|
||||||
[dialectic.levels.max.model_config]
|
[dialectic.levels.max.model_config]
|
||||||
|
overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
|
||||||
transport = "openai"
|
transport = "openai"
|
||||||
model = "deepseek-v4-flash"
|
model = "deepseek-v4-flash"
|
||||||
base_url = "https://opencode.ai/zen/go/v1"
|
|
||||||
api_key_env = "HONCHO_OPENAI_API_KEY"
|
|
||||||
|
|
||||||
# --- Summary ---
|
# --- Summary ---
|
||||||
[summary]
|
[summary]
|
||||||
@@ -105,14 +99,28 @@ MESSAGES_PER_SHORT_SUMMARY = 20
|
|||||||
MESSAGES_PER_LONG_SUMMARY = 60
|
MESSAGES_PER_LONG_SUMMARY = 60
|
||||||
|
|
||||||
[summary.model_config]
|
[summary.model_config]
|
||||||
|
overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
|
||||||
transport = "openai"
|
transport = "openai"
|
||||||
model = "deepseek-v4-flash"
|
model = "deepseek-v4-flash"
|
||||||
base_url = "https://opencode.ai/zen/go/v1"
|
|
||||||
api_key_env = "HONCHO_OPENAI_API_KEY"
|
|
||||||
|
|
||||||
# --- Dream ---
|
# --- Dream ---
|
||||||
[dream]
|
[dream]
|
||||||
ENABLED = false
|
ENABLED = true
|
||||||
|
|
||||||
|
[dream.model_config]
|
||||||
|
overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
|
||||||
|
transport = "openai"
|
||||||
|
model = "deepseek-v4-flash"
|
||||||
|
|
||||||
|
[dream.deduction_model_config]
|
||||||
|
overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
|
||||||
|
transport = "openai"
|
||||||
|
model = "deepseek-v4-flash"
|
||||||
|
|
||||||
|
[dream.induction_model_config]
|
||||||
|
overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
|
||||||
|
transport = "openai"
|
||||||
|
model = "deepseek-v4-flash"
|
||||||
|
|
||||||
# --- Peer Card ---
|
# --- Peer Card ---
|
||||||
[peer_card]
|
[peer_card]
|
||||||
@@ -121,4 +129,4 @@ ENABLED = true
|
|||||||
# --- Vector Store ---
|
# --- Vector Store ---
|
||||||
[vector_store]
|
[vector_store]
|
||||||
TYPE = "pgvector"
|
TYPE = "pgvector"
|
||||||
DIMENSIONS = 1024
|
# DIMENSIONS is deprecated — EMBEDDING.VECTOR_DIMENSIONS is authoritative
|
||||||
|
|||||||
Reference in New Issue
Block a user