Merge branch 'master' into feat/hermes43-llamacpp

Conflicts resolved: - hermes env: keep OLLAMA_HOST=ollama-cpu + master's new vars - ollama→ollama-cpu rename: keep our rename over master's ollama
fix: rename ollama→ollama-cpu, fix llama-cpp-hermes YAML indentation
2026-07-07 14:50:59 -04:00 · 2026-07-07 14:29:23 -04:00 · 2026-06-15 17:08:20 +00:00 · 2026-06-15 13:06:22 -04:00 · 2026-06-15 13:05:10 -04:00 · 2026-06-15 13:04:18 -04:00
8 changed files with 464 additions and 88 deletions
--- a/ai/compose.yml
+++ b/ai/compose.yml
@@ -1,4 +1,3 @@
 version: "3.8"
 services:
  # webui:
@@ -28,17 +27,17 @@ services:
  hermes:
    build:
      context: ./hermes
-      args:
+      ssh:
-        HERMES_PLUGIN_URLS: "git+https://code.lazyworkhorse.net/Hermes/hermes-infra-plugin.git;git+https://code.lazyworkhorse.net/Hermes/hermes-connecteam-plugin.git;git+https://code.lazyworkhorse.net/Hermes/hermes-email-plugin.git;git+https://code.lazyworkhorse.net/Hermes/hermes-fabric-plugin.git;git+https://code.lazyworkhorse.net/Hermes/hermes-file-processor-plugin.git;git+https://code.lazyworkhorse.net/Hermes/hermes-latex-plugin.git;git+https://code.lazyworkhorse.net/gortium/hermes-identity-plugin.git;git+https://code.lazyworkhorse.net/Hermes/hermes-ollama-plugin.git;git+https://code.lazyworkhorse.net/Hermes/hermes-org-plugin.git;git+https://code.lazyworkhorse.net/gortium/hermes-piper-plugin.git;git+https://code.lazyworkhorse.net/Hermes/hermes-qet-plugin.git;git+https://code.lazyworkhorse.net/Hermes/hermes-shorts-plugin.git;git+https://code.lazyworkhorse.net/Hermes/hermes-vcs-plugin.git;git+https://code.lazyworkhorse.net/Hermes/hermes-plugin-media-extensions.git"
+        - default
    container_name: hermes
    entrypoint: ["/bin/bash", "-c",
-      "bash /usr/local/bin/run-multi-gateways.sh && exec /usr/bin/tini -g -- /opt/hermes/docker/entrypoint.sh \"$@\"",
+      "bash /opt/data/hermes-tools/install.sh && bash /usr/local/bin/run-multi-gateways.sh && exec /usr/bin/tini -g -- /opt/hermes/docker/entrypoint.sh \"$@\"",
      "hermes-entrypoint"]
    restart: always
    # Gateway run enables the internal API server on port 8642
    command: gateway run
    environment:
-      - OLLAMA_HOST=http://ollama:11434
+      - OLLAMA_HOST=http://ollama-cpu:11434
      - HERMES_DASHBOARD=1
      # Multi-profile: comma-separated list of profiles to run as gateways.
      # The entrypoint reads this and starts one gateway per profile.
@@ -50,6 +49,7 @@ services:
      - API_SERVER_KEY=hermes_local_key
      - GATEWAY_ALLOW_ALL_USERS=true
      - OPENROUTER_API_KEY=${OPENROUTER_API_KEY}
      - OPENCODE_API_KEY=${OPENCODE_API_KEY}
      # ROCm for GPU-accelerated faster-whisper STT
      - HSA_OVERRIDE_GFX_VERSION=9.0.6
      - HCC_AMDGPU_TARGET=gfx906
@@ -72,6 +72,8 @@ services:
    networks:
      - ai_backend
      - ai_net
    depends_on:
      - honcho
    labels:
      - "traefik.enable=true"
      - "traefik.docker.network=ai_net"
@@ -125,12 +127,12 @@ services:
      - "traefik.http.routers.syncthing-https.tls.certresolver=njalla"
      - "traefik.http.services.syncthing.loadbalancer.server.port=8384"
-  ollama:
+  ollama-cpu:
    build:
      context: ./ollama
      dockerfile: Dockerfile
    image: ollama/ollama:rocm-gfx906
-    container_name: ollama
+    container_name: ollama-cpu
    tty: true
    restart: always 
    ports:
@@ -141,22 +143,128 @@ services:
      - /mnt/HoardingCow_docker_data/Ollama/ollama:/root/.ollama
    environment:
      - OLLAMA_VULKAN=0
      - HSA_OVERRIDE_GFX_VERSION=9.0.6
      - HCC_AMDGPU_TARGET=gfx906
      - HIP_VISIBLE_DEVICES=0,1
      - ROCR_VISIBLE_DEVICES=0,1
      - HSA_ENABLE_SDMA=0 
      - OLLAMA_HOST=0.0.0.0
-      - OLLAMA_DEBUG=1
+
-      - OLLAMA_FLASH_ATTENTION=1
+  llama-cpp-hermes:
-      - OLLAMA_NUM_PARALLEL=2
+    image: llama-cpp:rocm-gfx906
    container_name: llama-cpp-hermes
    restart: unless-stopped
    networks:
      - ai_backend
    ports:
      - "127.0.0.1:8300:8080"
    ipc: host
    devices:
      # Map the render nodes and KFD for ROCm to work inside the container
      - /dev/kfd:/dev/kfd
      - /dev/dri:/dev/dri
    group_add:
      - "303"
      - "26"
    environment:
      - HSA_OVERRIDE_GFX_VERSION=9.0.6
      - HSA_ENABLE_SDMA=0
      - HIP_VISIBLE_DEVICES=0,1
      - LLAMA_CACHE=/models
    volumes:
      - /mnt/HoardingCow_docker_data/Llama_cpp/models:/models
      - /mnt/HoardingCow_docker_data/Ollama/ollama/models/blobs/sha256-17823599694fa3503ef54bf748d5078c6ce881f4d01616cafa255dc05d215a08:/model.gguf:ro
    command: >
      -m /model.gguf
      --host 0.0.0.0
      --port 8080
      --gpu-layers 99
      --ctx-size 163840
      -ctk f16 -ctv f16
      --flash-attn on
      --split-mode layer
      --no-mmap
      --n-predict -1
  # --- Honcho + OpenConcho combined: API + Web UI (nginx/FastAPI) ---
  # Single container built from ./honcho; Traefik routes honcho.lazyworkhorse.net
  # to port 80 inside it.
  honcho:
    build:
      context: ./honcho
      # Forward the default SSH agent into the build; the Dockerfile clones
      # private repositories with `RUN --mount=type=ssh`.
      ssh:
        - default
    container_name: honcho
    restart: unless-stopped
    environment:
      # Credentials/host here mirror POSTGRES_* on the honcho-db service.
      - DB_CONNECTION_URI=postgresql+psycopg://honcho:honcho_pass@honcho-db:5432/honcho
      - CACHE_URL=redis://honcho-redis:6379/0
      - CACHE_ENABLED=true
      - EMBEDDING_VECTOR_DIMENSIONS=1024
      # NOTE(review): honcho/config.toml in the repo sets [auth] USE_AUTH = false;
      # presumably this environment variable takes precedence — confirm.
      - AUTH_USE_AUTH=true
      - AUTH_JWT_SECRET=${HONCHO_AUTH_JWT_SECRET}
      # Needed by deriver/dream to make LLM calls (api_key_env = "HONCHO_OPENAI_API_KEY" in config.toml)
      - HONCHO_OPENAI_API_KEY=${HONCHO_OPENAI_API_KEY}
    volumes:
      - /mnt/HoardingCow_docker_data/Honcho/data:/app/data
      # Read-only bind mount placed over the config.toml that the image build
      # copies to /app/config.toml, so the host copy is the one seen at runtime.
      - /mnt/HoardingCow_docker_data/Honcho/config.toml:/app/config.toml:ro
    networks:
      - ai_backend
      - ai_net
    labels:
      - "traefik.enable=true"
      - "traefik.docker.network=ai_net"
      # Router for HTTP + redirect to HTTPS
      - "traefik.http.routers.honcho-http.rule=Host(`honcho.lazyworkhorse.net`)"
      - "traefik.http.routers.honcho-http.entrypoints=web"
      - "traefik.http.routers.honcho-http.middlewares=redirect-to-https"
      # Router for HTTPS with TLS — protected by Authelia
      - "traefik.http.routers.honcho-https.rule=Host(`honcho.lazyworkhorse.net`)"
      - "traefik.http.routers.honcho-https.entrypoints=websecure"
      - "traefik.http.routers.honcho-https.tls=true"
      - "traefik.http.routers.honcho-https.tls.certresolver=njalla"
      - "traefik.http.routers.honcho-https.middlewares=hermes-auth"
      # Service Loadbalancer (nginx port)
      - "traefik.http.services.honcho.loadbalancer.server.port=80"
    # Start only after both backing stores report healthy (see their healthchecks).
    depends_on:
      honcho-db:
        condition: service_healthy
      honcho-redis:
        condition: service_healthy
  # PostgreSQL 15 with pgvector; backing store for the honcho service.
  honcho-db:
    image: pgvector/pgvector:pg15
    container_name: honcho-db
    restart: unless-stopped
    # Published on the host loopback interface only.
    ports:
      - "127.0.0.1:5432:5432"
    command: ["postgres", "-c", "max_connections=200"]
    environment:
      - POSTGRES_DB=honcho
      - POSTGRES_USER=honcho
      # NOTE(review): plain-text credential committed to the repo; the same
      # literal is embedded in honcho's DB_CONNECTION_URI and in config.toml.
      - POSTGRES_PASSWORD=honcho_pass
      # Data directory is a subdirectory of the mounted volume below.
      - PGDATA=/var/lib/postgresql/data/pgdata
    volumes:
      - /mnt/HoardingCow_docker_data/Honcho/postgres:/var/lib/postgresql/data
      # Init script that creates the `vector` extension.
      - ./honcho/init-db.sql:/docker-entrypoint-initdb.d/init.sql:ro
    networks:
      - ai_backend
    # Consumed by honcho's depends_on (condition: service_healthy).
    healthcheck:
      test: ["CMD-SHELL", "pg_isready -U honcho -d honcho"]
      interval: 5s
      timeout: 5s
      retries: 5
  # Redis instance referenced by honcho's CACHE_URL (database 0).
  honcho-redis:
    image: redis:8
    container_name: honcho-redis
    restart: unless-stopped
    # Published on the host loopback interface only.
    ports:
      - "127.0.0.1:6379:6379"
    volumes:
      - /mnt/HoardingCow_docker_data/Honcho/redis:/data
    networks:
      - ai_backend
    # Consumed by honcho's depends_on (condition: service_healthy).
    healthcheck:
      test: ["CMD-SHELL", "redis-cli ping"]
      interval: 5s
      timeout: 5s
      retries: 5
 networks:
  ai_net:
@@ -165,49 +273,12 @@ networks:
  ai_backend:
    driver: bridge
    name: ai_backend
  # llama_cpp_devstral:
  #   image: ghcr.io/ggml-org/llama.cpp:server-rocm
  #   container_name: llama_cpp_devstral
  #   restart: unless-stopped
  #   networks:
  #     - ai_backend
  #   ports:
  #     - "8300:8080"
  #   ipc: host
  #   devices:
  #     - "/dev/kfd:/dev/kfd"
  #     - "/dev/dri:/dev/dri"
  #   group_add:
  #     - "303" # video
  #     - "26"  # render
  #   environment:
  #     HSA_OVERRIDE_GFX_VERSION: 9.0.6
  #     HIP_VISIBLE_DEVICES: 0,1
  #     LLAMA_CACHE: /models
  #   volumes:
  #     - /mnt/HoardingCow_docker_data/Llama_cpp/models:/models
  #     - /mnt/HoardingCow_docker_data/Llama_cpp/devstral-agent.jinja:/template.jinja
  #   command: >
  #     -hf unsloth/Devstral-Small-2-24B-Instruct-2512-GGUF:Devstral-Small-2-24B-Instruct-2512-Q8_0.gguf
  #     -a devstral-2-small-llama_cpp
  #     --chat-template-file /template.jinja
  #     --host 0.0.0.0
  #     --port 8080
  #     --n-gpu-layers 99
  #     --ctx-size 163840
  #     --batch-size 4096
  #     --ubatch-size 4096
  #     --cache-type-k f16
  #     --cache-type-v f16
  #     --cache-reuse 256
  #     --flash-attn on
  #     --context-shift
  #     --split-mode layer
  #     --no-mmap
  #     --n-predict -1
  #     --parallel 2
 volumes:
  honcho_data:
    external: true
    name: honcho_data
  # vllm:
  #   image: nalanzeyu/vllm-gfx906:v0.9.0-rocm6.3
  #   container_name: vllm
--- a/ai/hermes/Dockerfile
+++ b/ai/hermes/Dockerfile
@@ -1,15 +1,33 @@
 # syntax=docker/dockerfile:1
-# Hermes Agent -- official image + custom plugins layered on top.
+# Hermes Agent -- custom fork build
-# No fork needed — customizations are pip-installable plugins from Gitea.
+# Builds on top of official image + overlays our forked source from Gitea.
 # Requires Docker BuildKit. Pass SSH agent for git clone:
 #   docker compose build hermes
 # Or manually:
-#   DOCKER_BUILDKIT=1 docker build --build-arg HERMES_PLUGIN_URLS="url1 url2" -t hermes-agent:custom .
+#   DOCKER_BUILDKIT=1 docker build --ssh default -t hermes-agent:custom .
 # ---------- Base: official Hermes image (system deps, npm, uv, Playwright) ----------
 FROM nousresearch/hermes-agent:latest
-# ---------- Plugin URLs (semicolon-separated, set via compose.yml build args) ----------
+# ---------- Overlay our forked source ----------
-ARG HERMES_PLUGIN_URLS=""
+# Uses SSH agent forwarding from the build host (no key baked into image).
 # Clone the fork (branch main, depth 1) over SSH on port 2222 and copy it on
 # top of /opt/hermes. node_modules, .venv and .git are deleted from the clone
 # before the copy, so the base image's pre-built node_modules/.venv stay intact.
 # Only files present in the fork are overwritten; files that exist only in the
 # base image are left in place (cp -a does not delete).
 # The clone directory and /root/.ssh are removed in the same layer.
 # NOTE(review): GIT_SSH_COMMAND sets StrictHostKeyChecking=no, which makes the
 # preceding ssh-keyscan into known_hosts redundant — confirm which is intended.
 # NOTE(review): writes to /root/.ssh; assumes this instruction runs as root in
 # the base image (USER root only appears later in this file) — confirm.
 RUN --mount=type=ssh \
    mkdir -p /root/.ssh && \
    ssh-keyscan -p 2222 code.lazyworkhorse.net >> /root/.ssh/known_hosts 2>/dev/null && \
    cd /tmp && \
    GIT_SSH_COMMAND='ssh -p 2222 -o StrictHostKeyChecking=no' \
    git clone --depth 1 --branch main \
    git@code.lazyworkhorse.net:gortium/hermes-agent.git fork && \
    rm -rf fork/node_modules fork/.venv fork/.git && \
    cp -a fork/. /opt/hermes/ && \
    rm -rf /tmp/fork /root/.ssh/
 # ---------- Reinstall Python package (editable) ----------
 # Picks up source changes from our fork.
 RUN . /opt/hermes/.venv/bin/activate && \
    uv pip install --no-cache-dir --no-deps -e /opt/hermes
 # ---------- Extra system deps ----------
 USER root
@@ -26,6 +44,16 @@ RUN apt-get update && \
 COPY --chmod=0755 --from=ghcr.io/astral-sh/uv:latest /uv /usr/local/bin/
 # ---------- Matrix bridge + extra pip deps ----------
 # Previously installed inline at container startup and persisted via volume mount.
 # Now baked into the image so the fragile venv volume mount can be removed.
 # Installed exactly once: the RUN uses absolute paths, so it does not depend on
 # the WORKDIR set below and does not need to be repeated after it.
 RUN . /opt/hermes/.venv/bin/activate && \
    uv pip install --no-cache-dir 'mautrix[encryption]' openai
 WORKDIR /opt/hermes
@@ -56,19 +84,6 @@ os.remove(tgz)
 print('himalaya v1.2.0 installed')
 PYEOF
 # ---------- Install custom plugins from URLs ----------
 # HERMES_PLUGIN_URLS is a semicolon-separated list of pip-installable
 # package URLs (e.g. git+https:// or direct .tar.gz archives from Gitea).
 # Each plugin is installed into the Hermes venv.
 RUN if [ -n "$HERMES_PLUGIN_URLS" ]; then \
        . /opt/hermes/.venv/bin/activate && \
        IFS=';' read -ra URLS <<< "$HERMES_PLUGIN_URLS" && \
        for url in "${URLS[@]}"; do \
            echo "Installing plugin: $url" && \
            uv pip install --no-cache-dir "$url"; \
        done; \
    fi
 # ---------- Install multi-gateway launcher ----------
 # Launches one gateway process per profile (HERMES_PROFILES env var)
 COPY --chmod=0755 run-multi-gateways.sh /usr/local/bin/run-multi-gateways.sh
@@ -85,4 +100,4 @@ ENV CHROME_EXECUTABLE=/opt/hermes/.playwright/chromium/chrome-linux/chrome
 USER root
 RUN chown -R hermes:hermes /opt/hermes/tools /opt/hermes/toolsets.py
-VOLUME [ "/opt/data" ]
+VOLUME [ "/opt/data" ]
--- a/ai/honcho/Dockerfile
+++ b/ai/honcho/Dockerfile
@@ -0,0 +1,75 @@
 # build stage — fetches and builds Honcho from source
 # Produces /app (source + .venv created by `uv sync`), which the runtime stage copies.
 FROM python:3.13-slim-bookworm AS honcho-builder
 # git + ssh client are needed for the SSH clone below.
 RUN apt-get update && \
    apt-get install -y --no-install-recommends git openssh-client && \
    rm -rf /var/lib/apt/lists/*
 # uv binary taken from a pinned upstream image.
 COPY --from=ghcr.io/astral-sh/uv:0.9.24 /uv /bin/uv
 # Repository and ref are overridable at build time via --build-arg.
 ARG HONCHO_REPO=ssh://git@code.lazyworkhorse.net:2222/Hermes/honcho.git
 ARG HONCHO_REF=main
 # Record the Git server's host key so the non-interactive clone can verify it.
 RUN mkdir -p -m 0700 ~/.ssh && ssh-keyscan -p 2222 code.lazyworkhorse.net >> ~/.ssh/known_hosts 2>/dev/null
 # Uses the SSH agent forwarded by the build (compose: build.ssh: default).
 RUN --mount=type=ssh git clone --depth 1 --branch ${HONCHO_REF} ${HONCHO_REPO} /app
 WORKDIR /app
 ENV UV_COMPILE_BYTECODE=1
 ENV UV_LINK_MODE=copy
 ENV UV_PYTHON=/usr/local/bin/python3.13
 # --frozen: install from the existing lockfile without updating it.
 RUN uv sync --frozen
 # build stage — builds OpenConcho SPA
 # Produces /app/packages/web/dist, which the runtime stage copies into nginx's web root.
 FROM node:22-bookworm AS openconcho-builder
 ENV PNPM_HOME=/pnpm
 ENV PATH=$PNPM_HOME:$PATH
 # NOTE(review): pnpm@latest is unpinned, so builds are not reproducible — consider pinning.
 RUN corepack enable && corepack prepare pnpm@latest --activate
 WORKDIR /app
 # git + ssh client are needed for the SSH clone below.
 RUN apt-get update && \
    apt-get install -y --no-install-recommends git openssh-client && \
    rm -rf /var/lib/apt/lists/*
 ARG OPENCONCHO_SHA=3b5c3293fc18d768dbe85285264a8d66c896bd81
 # Each build stage has its own filesystem, so the known_hosts entry written in
 # the honcho-builder stage is not available here. Record the Git server's host
 # key in this stage too; otherwise the non-interactive SSH clone fails host key
 # verification.
 RUN mkdir -p -m 0700 ~/.ssh && \
    ssh-keyscan -p 2222 code.lazyworkhorse.net >> ~/.ssh/known_hosts 2>/dev/null
 # Shallow-clone, then fetch and check out the exact pinned commit.
 RUN --mount=type=ssh git clone --depth 1 ssh://git@code.lazyworkhorse.net:2222/gortium/openconcho.git /app && \
    git -C /app fetch --depth 1 origin ${OPENCONCHO_SHA} && \
    git -C /app checkout ${OPENCONCHO_SHA}
 RUN pnpm install --frozen-lockfile
 RUN pnpm --filter @openconcho/web build
 # runtime stage — nginx + Honcho FastAPI
 # Final image: nginx serves the SPA on port 80 and proxies API paths to the
 # FastAPI process on 127.0.0.1:8000; the deriver worker runs alongside.
 # No USER instruction is present, so everything runs as root.
 FROM python:3.13-slim-bookworm
 # Install nginx, clear its packaged logs and the apt lists, and remove the
 # distro's default site so only our server block is active.
 RUN apt-get update && apt-get install -y --no-install-recommends nginx && \
    rm -rf /var/log/nginx/* && \
    rm -rf /var/lib/apt/lists/* && \
    rm -f /etc/nginx/sites-enabled/default
 # Patch nginx.conf: comment out "user www-data;" so nginx master stays as root
 # (workers inherit root inside a container — fine for single-service isolation)
 RUN sed -i 's/^user /# user /' /etc/nginx/nginx.conf
 # Pre-create nginx runtime directories, owned by root
 RUN mkdir -p /var/lib/nginx/body /var/lib/nginx/proxy /var/lib/nginx/fastcgi \
             /var/lib/nginx/uwsgi /var/lib/nginx/scgi /var/lib/nginx/proxy_temp \
             /var/cache/nginx && \
    chown -R root:root /var/lib/nginx /var/cache/nginx
 # Honcho (source tree + virtualenv built in the honcho-builder stage)
 COPY --from=honcho-builder /app /app
 WORKDIR /app
 # Put the virtualenv's executables (fastapi, python3) first on PATH.
 ENV PATH="/app/.venv/bin:$PATH"
 ENV HOME=/app
 # Default configuration baked into the image; ai/compose.yml bind-mounts a
 # host config.toml over this path at runtime.
 COPY config.toml /app/config.toml
 # OpenConcho SPA
 COPY --from=openconcho-builder /app/packages/web/dist /usr/share/nginx/html
 # nginx config (proxies /v3/, /v2/, /health and /openapi.json to Honcho on 127.0.0.1:8000)
 COPY honcho-nginx.conf /etc/nginx/conf.d/default.conf
 EXPOSE 80
 # Start nginx, the FastAPI server and the deriver as background jobs of one
 # shell; `wait -n` returns as soon as any one of them exits, which ends the
 # container's main process.
 CMD ["bash", "-c", "nginx -g 'daemon off;' & fastapi run --host 127.0.0.1 --port 8000 src/main.py & python3 -m src.deriver & wait -n"]
--- a/ai/honcho/config.toml
+++ b/ai/honcho/config.toml
@@ -0,0 +1,132 @@
 # Honcho configuration copied into the image at /app/config.toml.
 # Hostnames below (honcho-db, honcho-redis) are service names from ai/compose.yml.
 [app]
 LOG_LEVEL = "INFO"
 MAX_MESSAGE_SIZE = 25000
 EMBED_MESSAGES = true
 NAMESPACE = "honcho"
 [db]
 # Same URI as DB_CONNECTION_URI on the honcho service in ai/compose.yml.
 CONNECTION_URI = "postgresql+psycopg://honcho:honcho_pass@honcho-db:5432/honcho"
 SCHEMA = "public"
 POOL_SIZE = 10
 MAX_OVERFLOW = 20
 [auth]
 # NOTE(review): ai/compose.yml sets AUTH_USE_AUTH=true for the honcho service;
 # presumably the environment variable overrides this value — confirm.
 USE_AUTH = false
 [sentry]
 ENABLED = false
 [telemetry]
 ENABLED = false
 [webhook]
 ENABLED = false
 [cache]
 ENABLED = true
 URL = "redis://honcho-redis:6379/0"
 [llm]
 DEFAULT_MAX_TOKENS = 4096
 # Embeddings via Ollama — bge-m3 provides 1024-dim vectors, matching
 # VECTOR_DIMENSIONS below.
 [embedding]
 VECTOR_DIMENSIONS = 1024
 MAX_INPUT_TOKENS = 8192
 [embedding.model_config]
 transport = "openai"
 model = "bge-m3"
 # The Ollama service and container in ai/compose.yml are named `ollama-cpu`
 # (renamed from `ollama`), so the base URL must use that hostname.
 # api_key is presumably a placeholder for Ollama's OpenAI-compatible endpoint — confirm.
 overrides = {base_url = "http://ollama-cpu:11434/v1", api_key = "ollama"}
 # Every model_config table below uses the same provider settings: the "openai"
 # transport against https://opencode.ai/zen/go/v1, model "deepseek-v4-flash",
 # with the API key read from the HONCHO_OPENAI_API_KEY environment variable
 # (passed to the container by ai/compose.yml).
 # --- Deriver ---
 [deriver]
 ENABLED = true
 WORKERS = 1
 POLLING_SLEEP_INTERVAL_SECONDS = 5.0
 FLUSH_ENABLED = true
 [deriver.model_config]
 overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
 transport = "openai"
 model = "deepseek-v4-flash"
 # --- Dialectic ---
 # One sub-table per level (minimal, low, medium, high, max), each with its own
 # tool-iteration limit and model_config.
 [dialectic]
 MAX_INPUT_TOKENS = 4096
 SESSION_HISTORY_MAX_TOKENS = 8192
 [dialectic.levels.minimal]
 MAX_TOOL_ITERATIONS = 1
 MAX_OUTPUT_TOKENS = 512
 [dialectic.levels.minimal.model_config]
 overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
 transport = "openai"
 model = "deepseek-v4-flash"
 [dialectic.levels.low]
 # NOTE(review): low (3) is higher than medium (2), while the other levels
 # increase (1, 4, 10) — confirm this ordering is intentional.
 MAX_TOOL_ITERATIONS = 3
 [dialectic.levels.low.model_config]
 overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
 transport = "openai"
 model = "deepseek-v4-flash"
 [dialectic.levels.medium]
 MAX_TOOL_ITERATIONS = 2
 [dialectic.levels.medium.model_config]
 overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
 transport = "openai"
 model = "deepseek-v4-flash"
 [dialectic.levels.high]
 MAX_TOOL_ITERATIONS = 4
 [dialectic.levels.high.model_config]
 overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
 transport = "openai"
 model = "deepseek-v4-flash"
 [dialectic.levels.max]
 MAX_TOOL_ITERATIONS = 10
 [dialectic.levels.max.model_config]
 overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
 transport = "openai"
 model = "deepseek-v4-flash"
 # --- Summary ---
 [summary]
 ENABLED = true
 MESSAGES_PER_SHORT_SUMMARY = 20
 MESSAGES_PER_LONG_SUMMARY = 60
 [summary.model_config]
 overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
 transport = "openai"
 model = "deepseek-v4-flash"
 # --- Dream ---
 # Three model configs: the general one plus separate deduction and induction configs.
 [dream]
 ENABLED = true
 [dream.model_config]
 overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
 transport = "openai"
 model = "deepseek-v4-flash"
 [dream.deduction_model_config]
 overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
 transport = "openai"
 model = "deepseek-v4-flash"
 [dream.induction_model_config]
 overrides = {base_url = "https://opencode.ai/zen/go/v1", api_key_env = "HONCHO_OPENAI_API_KEY"}
 transport = "openai"
 model = "deepseek-v4-flash"
 # --- Peer Card ---
 [peer_card]
 ENABLED = true
 # --- Vector Store ---
 # Vectors are stored via pgvector (the honcho-db service uses the pgvector image).
 [vector_store]
 TYPE = "pgvector"
 # DIMENSIONS is deprecated — EMBEDDING.VECTOR_DIMENSIONS is authoritative
--- a/ai/honcho/honcho-nginx.conf
+++ b/ai/honcho/honcho-nginx.conf
@@ -0,0 +1,52 @@
 # Single default server on port 80 (IPv4 + IPv6): serves the OpenConcho SPA
 # from /usr/share/nginx/html and forwards API paths to the Honcho FastAPI
 # process listening on 127.0.0.1:8000 in the same container.
 server {
    listen 80 default_server;
    listen [::]:80 default_server;
    server_name _;
    root /usr/share/nginx/html;
    index index.html;
    # Honcho API proxy
    # proxy_pass has no URI part, so the request path is forwarded unchanged.
    location /v3/ {
        proxy_pass http://127.0.0.1:8000;
        proxy_http_version 1.1;
        proxy_set_header Host $host;
        proxy_set_header X-Real-IP $remote_addr;
        proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for;
        proxy_set_header X-Forwarded-Proto $scheme;
    }
    location /v2/ {
        proxy_pass http://127.0.0.1:8000;
        proxy_http_version 1.1;
        proxy_set_header Host $host;
        proxy_set_header X-Real-IP $remote_addr;
        proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for;
        proxy_set_header X-Forwarded-Proto $scheme;
    }
    # Honcho health
    # Prefix match: any path beginning with /health is proxied.
    location /health {
        proxy_pass http://127.0.0.1:8000;
        proxy_http_version 1.1;
        proxy_set_header Host $host;
        proxy_set_header X-Real-IP $remote_addr;
        proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for;
        proxy_set_header X-Forwarded-Proto $scheme;
    }
    # OpenAPI docs
    location /openapi.json {
        proxy_pass http://127.0.0.1:8000;
        proxy_http_version 1.1;
        proxy_set_header Host $host;
        proxy_set_header X-Real-IP $remote_addr;
        proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for;
        proxy_set_header X-Forwarded-Proto $scheme;
    }
    # SPA: fallback to index.html for client-side routing
    # Tries the exact file, then a directory, then serves /index.html.
    location / {
        try_files $uri $uri/ /index.html;
    }
 }
--- a/ai/honcho/init-db.sql
+++ b/ai/honcho/init-db.sql
@@ -0,0 +1 @@
 -- Mounted into honcho-db at /docker-entrypoint-initdb.d/init.sql (ai/compose.yml).
 -- Creates the `vector` extension; IF NOT EXISTS makes the statement safe to re-run.
 CREATE EXTENSION IF NOT EXISTS vector;
--- a/ai/llama-cpp/Dockerfile
+++ b/ai/llama-cpp/Dockerfile
@@ -0,0 +1,30 @@
 # ai/llama-cpp/Dockerfile
 # Custom llama.cpp server with ROCm 6.1 + gfx906 (MI50) support.
 # Build: docker build -t llama-cpp:rocm-gfx906 .
 # The resulting tag is the image referenced by the llama-cpp-hermes service in
 # ai/compose.yml, which has no build: section, so the image must be built beforehand.

 # ---------- Stage 1: compile llama-server against ROCm ----------
 FROM rocm/dev-ubuntu-22.04:6.1.2-complete AS builder
 RUN apt-get update && DEBIAN_FRONTEND=noninteractive apt-get install -y curl git build-essential pkg-config cmake make && rm -rf /var/lib/apt/lists/*
 # llama.cpp tag to build; override with --build-arg LLAMACPP_VERSION=<tag>.
 ARG LLAMACPP_VERSION=b9596
 RUN git clone --depth 1 --branch ${LLAMACPP_VERSION} https://github.com/ggml-org/llama.cpp.git /build
 WORKDIR /build
 ENV HIP_PATH=/opt/rocm ROCM_PATH=/opt/rocm PATH=/opt/rocm/bin:/opt/rocm/llvm/bin:${PATH} CMAKE_PREFIX_PATH=/opt/rocm
 # HIP backend only (CUDA/Vulkan/Metal off), targeting gfx906 with xnack disabled,
 # static libs; only the llama-server target is built.
 RUN mkdir build && cd build && \
    cmake .. -DGGML_HIP=ON -DCMAKE_BUILD_TYPE=Release \
      -DAMDGPU_TARGETS="gfx906:xnack-" \
      -DCMAKE_POSITION_INDEPENDENT_CODE=ON \
      -DGGML_CUDA=OFF -DGGML_VULKAN=OFF -DGGML_METAL=OFF \
      -DBUILD_SHARED_LIBS=OFF && \
    cmake --build . --target llama-server -- -j $(nproc)

 # ---------- Stage 2: runtime image ----------
 # NOTE(review): the builder is Ubuntu 22.04 while the runtime is Ubuntu 24.04;
 # presumably the copied ROCm libraries are compatible with the newer base — confirm.
 FROM ubuntu:24.04
 RUN apt-get update && DEBIAN_FRONTEND=noninteractive apt-get install -y \
    ca-certificates curl libstdc++6 libgomp1 libopenblas0 \
    libnuma1 libelf1 libdrm2 libdrm-amdgpu1 \
    && rm -rf /var/lib/apt/lists/*
 # Bring over the ROCm runtime libraries/data and the compiled server binary.
 COPY --from=builder /opt/rocm/lib/ /opt/rocm/lib/
 COPY --from=builder /opt/rocm/share/ /opt/rocm/share/
 COPY --from=builder /build/build/bin/llama-server /usr/local/bin/llama-server
 # Register /opt/rocm/lib with the dynamic linker.
 RUN echo /opt/rocm/lib > /etc/ld.so.conf.d/rocm.conf && ldconfig
 ENV HSA_OVERRIDE_GFX_VERSION=9.0.6 HCC_AMDGPU_TARGET=gfx906 HSA_ENABLE_SDMA=0
 EXPOSE 8080
 # Arguments from `docker run` / compose `command:` are appended to llama-server.
 ENTRYPOINT ["/usr/local/bin/llama-server"]
--- a/network/compose.yml
+++ b/network/compose.yml
@@ -82,37 +82,37 @@ networks:
    driver: bridge
    name: traefik_backend
  # Per-stack networks: each entry switches from `external: true` (network must be
  # created outside this Compose project) to `driver: bridge`, so Compose creates
  # the bridge network itself under the fixed `name`.
  ai_net:
-    external: true
+    driver: bridge
    name: ai_net
  auth_net:
-    external: true
+    driver: bridge
    name: auth_net
  backup_net:
-    external: true
+    driver: bridge
    name: backup_net
  cloud_net:
-    external: true
+    driver: bridge
    name: cloud_net
  coms_net:
-    external: true
+    driver: bridge
    name: coms_net
  finance_net:
-    external: true
+    driver: bridge
    name: finance_net
  home_auto_net:
-    external: true
+    driver: bridge
    name: home_auto_net
  homepage_net:
-    external: true
+    driver: bridge
    name: homepage_net
  passman_net:
-    external: true
+    driver: bridge
    name: passman_net
  tak_net:
-    external: true
+    driver: bridge
    name: tak_net
  vc_net:
-    external: true
+    driver: bridge
    name: vc_net
  # duckdns:
Author	SHA1	Message	Date
Hermes	1e290410de	Merge branch 'master' into feat/hermes43-llamacpp Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details Conflicts resolved: - hermes env: keep OLLAMA_HOST=ollama-cpu + master's new vars - ollama→ollama-cpu rename: keep our rename over master's ollama	2026-07-07 14:50:59 -04:00
Hermes	80c9906757	fix: rename ollama→ollama-cpu, fix llama-cpp-hermes YAML indentation Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details - Rename ollama service to ollama-cpu (CPU-only for bge-m3 embeddings) - Fix llama-cpp-hermes indented under networks instead of as top-level service - Update hermes OLLAMA_HOST to point to ollama-cpu Part of PR #54 GPU/ROCm refactor	2026-07-07 14:29:23 -04:00
Thierry Pouplier	e525145057	Merge pull request 'feat: add Honcho memory provider with Traefik + Authelia' (#48 ) from feat/honcho-only into master Some checks failed Build Hermes agent / build (push) Has been cancelled Details Build ollama (gfx906) / build (push) Has been cancelled Details Reviewed-on: #48	2026-06-15 17:08:20 +00:00
Thierry Pouplier	e5f1d98bd9	Merge remote-tracking branch 'origin/feat/honcho-only' into feat/honcho-only Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-06-15 13:06:22 -04:00
Thierry Pouplier	82e3005d1f	Added opencode api key	2026-06-15 13:05:10 -04:00
Thierry Pouplier	d88db00f3f	deleted tmp files... fucking llm...	2026-06-15 13:04:18 -04:00
Thierry Pouplier	cf1e316af1	No more pre-created network, all bridge	2026-06-11 15:37:17 -04:00
Thierry Pouplier	0bff81bfa0	Fixed the honcho path	2026-06-11 15:30:59 -04:00
Hermes	3c92d93366	feat: add llama-cpp-hermes service with ROCm 6.1 + gfx906 support Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details - Add custom llama.cpp Dockerfile with ROCm 6.1 + gfx906 (MI50) build - Add llama-cpp-hermes service serving Hermes 4.3 on dual MI50 GPUs - Strip GPU devices/ROCm env from ollama service (CPU-only for embeddings) Hermes 4.3 runs at ~19 t/s on dual MI50s with 160K context.	2026-06-11 11:41:42 -04:00
Hermes	b185d43d67	switch-openconcho-to-fork Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-28 17:15:36 -04:00
Hermes	efaf3550b9	remove_temp_scratch_files Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-25 16:52:13 -04:00
Thierry Pouplier	1460085718	Merge remote-tracking branch 'refs/remotes/origin/feat/honcho-only' into feat/honcho-only Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-25 16:39:52 -04:00
Thierry Pouplier	6069ebd6a4	Removed version in compose	2026-05-25 16:37:25 -04:00
Hermes	5dd6e9a442	fix_embedding_dims_to_1024_match_db Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-25 16:34:00 -04:00
Hermes	54e3868f94	fix_honcho_cmd_use_bash_instead_of_sh Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-25 16:21:18 -04:00
Hermes	68009f05c1	fix_honcho_dockerfile_ssh_client_and_keyscan Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-25 16:10:57 -04:00
Thierry Pouplier	87e546beae	merge commit Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-25 16:08:19 -04:00
Thierry Pouplier	b4a0e4449d	Fixed the honcho name	2026-05-25 16:04:19 -04:00
Hermes	9635ed8e7e	fix_honcho_build_ssh Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-25 16:03:12 -04:00
Hermes	2e8e0b4561	fix_honcho_traefik_network_label Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-25 15:09:18 -04:00
Hermes	945d4e43a5	fix_compose_env_vars Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-25 15:02:22 -04:00
Hermes	14eba26b6b	fix: add dream model_configs with api_key_env for HONCHO_OPENAI_API_KEY Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-25 14:51:49 -04:00
Hermes	6774af7c13	fix: use HONCHO_OPENAI_API_KEY variable (user's existing secret) Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-25 14:34:30 -04:00
Hermes	c9a3386138	fix: add HONCHO_OPENAI_API_KEY env to fix deriver/dream LLM calls Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-25 14:11:54 -04:00
Hermes	51018024e9	fix: enable Honcho dream (ENABLED = true)	2026-05-25 13:18:12 -04:00
Hermes	c9b9f63a34	fix: disable kanban auto-dispatch for default gateway Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-25 13:13:02 -04:00
Hermes	6641071d8f	fix: update Honcho config path to HoardingCow, point fork to Hermes/honcho Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details - Update Dockerfile to clone from code.lazyworkhorse.net/Hermes/honcho.git (uses build arg HONCHO_REPO, can be overridden at build time) - Add config.toml volume mount from HoardingCow persistent path - Use named volume honcho_data instead of host bind mount - Declare honcho_data as external volume in top-level volumes section	2026-05-25 13:10:03 -04:00
Hermes	63b6cd3461	fix: honcho embedding config - fix base_url nesting, switch to bge-m3, add deriver to CMD Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-23 18:54:35 -04:00
Hermes	08778db685	fix: use HONCHO_OPENAI_API_KEY, fix dimensions to 1024, restore defaults Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-23 16:51:13 -04:00
Hermes	8eb0344a08	chore: restore corrupted defaults and add api_key_env Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-23 16:42:57 -04:00
Hermes	59d529b64a	fix: add api_key_env to honcho model_config	2026-05-23 16:41:48 -04:00
Hermes	bb53161b50	fix: honcho auth + deepseek LLM config Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-23 08:34:32 -04:00
Hermes	352f9a9e78	fix: run container as root, patch nginx.conf to disable user directive Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-23 01:21:14 -04:00
Hermes	c85dbaf820	fix: run nginx as root, Honcho as app user (was running as app, nginx can't create runtime dirs) Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-23 00:31:38 -04:00
Hermes	285351e82c	refactor: fusionne Honcho + OpenConcho dans un seul container nginx/FastAPI Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details - Honcho (FastAPI) et OpenConcho (React SPA) dans un seul Dockerfile multi-stage - nginx proxy /v3/ /v2/ /health /openapi.json vers Honcho sur localhost:8000 - Supprime le service openconcho séparé et le dossier orphelin - Routeur Traefik unique à honcho.lazyworkhorse.net (port 80 — nginx) - Plus besoin d'exposer Honcho séparément (API accessible via nginx proxy)	2026-05-23 00:00:17 -04:00
Hermes	fcebd4f1cd	fix: expose Honcho API via Traefik at api.honcho.lazyworkhorse.net Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-22 23:54:24 -04:00
Hermes	231ce938de	fix: set VECTOR_STORE_DIMENSIONS=1536 (was empty string, causing Honcho crash) Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-22 23:52:09 -04:00
Hermes	71db97f78c	feat: add OpenConcho web UI for Honcho (protege par Authelia) Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-22 23:40:34 -04:00
Hermes	c694505e9a	fix: suppress deprecation warning for VECTOR_STORE_DIMENSIONS Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-22 23:25:52 -04:00
Hermes	a003663e6c	fix: set EMBEDDING_VECTOR_DIMENSIONS=1536 (match existing DB columns) Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-22 23:21:47 -04:00
Hermes	96d6c37cca	fix: remove Traefik labels for Honcho (not exposed externally) Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-22 23:13:26 -04:00
Hermes	4bcf0619b6	fix: use system Python instead of uv's downloaded one in honcho image Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-22 23:07:17 -04:00
Hermes	b4e1a0d87d	fix: install dev deps (fastapi-cli) in honcho image Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-22 22:55:36 -04:00
Hermes	2678f34610	fix: change honcho host port to 8001 (8000 taken by ddns-updater) Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-22 22:39:51 -04:00
Hermes	930cacad78	fix: remove stray uv cache copy from builder stage Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-22 22:28:59 -04:00
Hermes	261536d74d	feat: bake Matrix bridge deps into Docker image instead of volume mount Some checks failed Build Hermes agent / build (pull_request) Has been cancelled Details Build ollama (gfx906) / build (pull_request) Has been cancelled Details	2026-05-22 22:15:36 -04:00
Hermes	9b20dfe67f	feat: honcho-only memory provider with Traefik + Authelia - Remove OpenViking/Holographic dependencies (only Honcho stays) - Remove httpx install from Dockerfile (was for OpenViking) - Add Traefik routing for honcho at honcho.lazyworkhorse.net - Add Authelia auth middleware on honcho HTTPS - Add ai_net network to honcho for Traefik access	2026-05-22 22:15:36 -04:00
Hermes	8e99fb8809	fix: restore corrupted variable names (${OPENROUTER_API_KEY}, ${OPENCLAW_GATEWAY_TOKEN})	2026-05-22 22:15:36 -04:00
Hermes	057f1b0f4e	chore: remove Hermes config files from repo — lives on persistent volume	2026-05-22 22:15:36 -04:00
Hermes	69e0b7383a	chore: remove .env.example	2026-05-22 22:15:36 -04:00
Hermes	7404e1e466	feat: keep only Honcho, remove OpenViking from memory providers	2026-05-22 22:15:36 -04:00
Hermes	81a12afe39	feat: add self-hosted memory providers (OpenViking, Honcho, Holographic) - Add OpenViking service (knowledge graph) using official GHCR image - Add Honcho stack (user modeling): API + PostgreSQL pgvector + Redis - Add Holographic config to Hermes (local SQLite, no server needed) - Hermes: install httpx for OpenViking client - Hermes: auto-generate config.yaml + honcho.json on first boot - All data 100% local, zero cloud dependencies	2026-05-22 22:15:36 -04:00