Compare commits
2 Commits
feat/honch
...
1ec22ff3fc
| Author | SHA1 | Date | |
|---|---|---|---|
| 1ec22ff3fc | |||
| b1dbdb9f2d |
31
AGENTS.md
Normal file
31
AGENTS.md
Normal file
@@ -0,0 +1,31 @@
|
||||
# AGENTS.md
|
||||
|
||||
Development conventions for the compose repository (Docker Compose stacks).
|
||||
|
||||
## Build & Deploy
|
||||
|
||||
- The ai stack is managed via `systemctl restart ai_stack.service` on the NixOS host
|
||||
- Compose files are built from the git repo; apply via `nh os switch` or `systemctl restart ai_stack.service`
|
||||
- Never `docker compose up -d` directly — it bypasses the systemd env file and breaks secrets
|
||||
|
||||
## Hermes Workers
|
||||
|
||||
- Paperclip Hermes workers are added via `ai/scripts/provision-hermes-worker.sh`
|
||||
- The script appends only — never deletes or modifies existing content
|
||||
- Workers are CPU-only containers on the `ai_backend` network with no GPU passthrough
|
||||
|
||||
## Workflow
|
||||
|
||||
- New feature → clean branch from `origin/master` → push → PR on Gitea
|
||||
- Branch naming: `feat/description` (features), `fix/description` (bugs/docs)
|
||||
- Always branch from `origin/master`, never from another feature branch
|
||||
- Submodule changes (when this repo is consumed as a submodule): commit the submodule update in the parent repo
|
||||
- PR title should describe the change; body should explain motivation + summary
|
||||
- After PR merge, delete the feature branch
|
||||
|
||||
## YAML Conventions
|
||||
|
||||
- Use `x-*` extension fields for reusable anchors
|
||||
- Comment out inactive services rather than deleting them
|
||||
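- Write environment variables in dictionary format (`KEY: value`) so anchored defaults can be merged with `<<:`; the merge is shallow, so a service that declares its own `environment:` must merge the environment anchor inside that block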
|
||||
- List format (`- KEY=value`) works for standalone services but cannot be combined with anchors (`<<:` only merges mappings, not sequences)
|
||||
230
ai/compose.yml
230
ai/compose.yml
@@ -1,4 +1,35 @@
|
||||
version: "3.8"
|
||||
|
||||
# ── Hermes Worker Template ──────────────────────────────────
# Used by paperclip-worker-* Hermes containers via YAML anchor.
# Each worker = one isolated Hermes agent for a Paperclip employee.
# Override at service level: container_name, volumes, and the per-worker
# environment entries API_SERVER_PORT, API_SERVER_KEY, DISCORD_BOT_TOKEN.
#
# IMPORTANT: `<<: *hermes-worker` is a SHALLOW merge. A service that declares
# its own `environment:` key replaces the whole mapping below instead of
# extending it, so it must merge the shared values back in explicitly:
#
#   environment:
#     <<: *hermes-worker-env
#     API_SERVER_PORT: "8651"
#
# Workers have NO GPU — they use OpenCode Go or remote providers.
x-hermes-worker: &hermes-worker
  build:
    context: ./hermes
    ssh:
      - default
  # Run the tools installer from the data volume, then hand over to the
  # image entrypoint under tini; "hermes-entrypoint" becomes $0 so that
  # "$@" carries the service `command`.
  entrypoint: ["/bin/bash", "-c",
    "bash /opt/data/hermes-tools/install.sh && exec /usr/bin/tini -g -- /opt/hermes/docker/entrypoint.sh \"$@\"",
    "hermes-entrypoint"]
  command: gateway run
  restart: always
  # Shared defaults; anchored separately so workers can merge them into
  # their own `environment:` block (see note above).
  environment: &hermes-worker-env
    API_SERVER_ENABLED: "true"
    API_SERVER_HOST: "0.0.0.0"
    OLLAMA_HOST: "http://ollama:11434"
    OPENROUTER_API_KEY: ${OPENROUTER_API_KEY}
    # Each worker needs its own OpenCode Go API key in .env
    OPENCODE_GO_API_KEY: ${OPENCODE_GO_API_KEY}
    GATEWAY_ALLOW_ALL_USERS: "true"
    TZ: "America/Montreal"
  networks:
    ai_backend:
  # NO devices — workers are CPU-only, no GPU passthrough
# ─────────────────────────────────────────────────────────────
|
||||
|
||||
services:
|
||||
|
||||
# webui:
|
||||
@@ -44,7 +75,7 @@ services:
|
||||
- API_SERVER_HOST=0.0.0.0
|
||||
- API_SERVER_KEY=hermes_local_key
|
||||
- GATEWAY_ALLOW_ALL_USERS=true
|
||||
- OPENROUTER_API_KEY=${OPEN...KEY}
|
||||
- OPENROUTER_API_KEY=${OPENROUTER_API_KEY}
|
||||
# ROCm for GPU-accelerated faster-whisper STT
|
||||
- HSA_OVERRIDE_GFX_VERSION=9.0.6
|
||||
- HCC_AMDGPU_TARGET=gfx906
|
||||
@@ -54,10 +85,6 @@ services:
|
||||
- TZ=America/Montreal
|
||||
volumes:
|
||||
- /mnt/HoardingCow_docker_data/Hermes/data:/opt/data
|
||||
# Syncthing-shared org files — read-only view of user's agenda
|
||||
- /mnt/HoardingCow_docker_data/Syncthing/telos-ro:/opt/data/telos-ro:ro
|
||||
# Syncthing-shared inbox — write tasks here, they sync to user's laptop
|
||||
- /mnt/HoardingCow_docker_data/Syncthing/telos-rw:/opt/data/telos-rw:rw
|
||||
devices:
|
||||
- /dev/kfd:/dev/kfd
|
||||
- /dev/dri:/dev/dri
|
||||
@@ -67,35 +94,6 @@ services:
|
||||
networks:
|
||||
- ai_backend
|
||||
|
||||
syncthing:
|
||||
image: syncthing/syncthing:latest
|
||||
container_name: syncthing
|
||||
hostname: syncthing
|
||||
restart: always
|
||||
ports:
|
||||
- "8384:8384"
|
||||
- "22000:22000"
|
||||
- "21027:21027/udp"
|
||||
environment:
|
||||
- TZ=America/Montreal
|
||||
volumes:
|
||||
- /mnt/HoardingCow_docker_data/Syncthing/config:/var/syncthing/config
|
||||
- /mnt/HoardingCow_docker_data/Syncthing/telos-ro:/telos-ro
|
||||
- /mnt/HoardingCow_docker_data/Syncthing/telos-rw:/telos-rw
|
||||
networks:
|
||||
- ai_backend
|
||||
- ai_net
|
||||
labels:
|
||||
- "traefik.enable=true"
|
||||
- "traefik.http.routers.syncthing-http.rule=Host(`syncthing.lazyworkhorse.net`)"
|
||||
- "traefik.http.routers.syncthing-http.entrypoints=web"
|
||||
- "traefik.http.routers.syncthing-http.middlewares=redirect-to-https"
|
||||
- "traefik.http.routers.syncthing-https.rule=Host(`syncthing.lazyworkhorse.net`)"
|
||||
- "traefik.http.routers.syncthing-https.entrypoints=websecure"
|
||||
- "traefik.http.routers.syncthing-https.tls=true"
|
||||
- "traefik.http.routers.syncthing-https.tls.certresolver=njalla"
|
||||
- "traefik.http.services.syncthing.loadbalancer.server.port=8384"
|
||||
|
||||
ollama:
|
||||
build:
|
||||
context: ./ollama
|
||||
@@ -129,149 +127,23 @@ services:
|
||||
- "303"
|
||||
- "26"
|
||||
|
||||
paperclip-db:
|
||||
image: postgres:17-alpine
|
||||
container_name: paperclip-db
|
||||
restart: always
|
||||
environment:
|
||||
POSTGRES_USER: paperclip
|
||||
POSTGRES_PASSWORD: ${PAPERCLIP_DB_PASSWORD:?PAPERCLIP_DB_PASSWORD must be set}
|
||||
POSTGRES_DB: paperclip
|
||||
healthcheck:
|
||||
test: ["CMD-SHELL", "pg_isready -U paperclip -d paperclip"]
|
||||
interval: 5s
|
||||
timeout: 5s
|
||||
retries: 10
|
||||
volumes:
|
||||
- /mnt/HoardingCow_docker_data/Paperclip/pgdata:/var/lib/postgresql/data
|
||||
networks:
|
||||
- ai_backend
|
||||
# ── Paperclip Worker Hermes Agents ──────────────────────────
|
||||
# Each worker is an isolated Hermes agent for a Paperclip employee.
|
||||
# Add new workers with: ./scripts/provision-hermes-worker.sh <name> <discord_bot_token_var>  (the env var NAME, not the token itself)
|
||||
# The API server key and port are generated automatically.
|
||||
# Workers are CPU-only — they use OpenCode Go or remote providers.
|
||||
|
||||
paperclip:
|
||||
image: ghcr.io/paperclipai/paperclip:v2026.517.0
|
||||
container_name: paperclip
|
||||
restart: always
|
||||
ports:
|
||||
- "127.0.0.1:3100:3100"
|
||||
environment:
|
||||
- HOST=0.0.0.0
|
||||
- PORT=3100
|
||||
- SERVE_UI=true
|
||||
- DATABASE_URL=postgres://paperclip:***@paperclip-db:5432/paperclip
|
||||
- BETTER_AUTH_SECRET=${PAPE...CRET must be set}
|
||||
- PAPERCLIP_PUBLIC_URL=https://paperclip.lazyworkhorse.net
|
||||
- PAPERCLIP_DEPLOYMENT_MODE=authenticated
|
||||
- PAPERCLIP_DEPLOYMENT_EXPOSURE=private
|
||||
volumes:
|
||||
- /mnt/HoardingCow_docker_data/Paperclip/data:/paperclip
|
||||
depends_on:
|
||||
paperclip-db:
|
||||
condition: service_healthy
|
||||
networks:
|
||||
- ai_net
|
||||
- ai_backend
|
||||
labels:
|
||||
- "traefik.enable=true"
|
||||
- "traefik.docker.network=ai_net"
|
||||
|
||||
- "traefik.http.routers.paperclip-http.rule=Host(`paperclip.lazyworkhorse.net`)"
|
||||
- "traefik.http.routers.paperclip-http.entrypoints=web"
|
||||
- "traefik.http.routers.paperclip-http.middlewares=redirect-to-https"
|
||||
|
||||
- "traefik.http.routers.paperclip-https.rule=Host(`paperclip.lazyworkhorse.net`)"
|
||||
- "traefik.http.routers.paperclip-https.entrypoints=websecure"
|
||||
- "traefik.http.routers.paperclip-https.tls=true"
|
||||
- "traefik.http.routers.paperclip-https.tls.certresolver=njalla"
|
||||
|
||||
- "traefik.http.services.paperclip.loadbalancer.server.port=3100"
|
||||
|
||||
# ---------------------------------------------------------------------------
|
||||
# Honcho — Memory infrastructure for stateful AI agents
|
||||
# Self-hosted memory server with pgvector for embedding storage.
|
||||
# Defaults to Ollama for embeddings; configure LLM provider for full deriver
|
||||
# and summarization support.
|
||||
#
|
||||
# API port: 8000
|
||||
# Web: https://honcho.lazyworkhorse.net
|
||||
# Docs: https://github.com/plastic-labs/honcho
|
||||
# ---------------------------------------------------------------------------
|
||||
|
||||
honcho-db:
|
||||
image: pgvector/pgvector:pg17-trixie
|
||||
container_name: honcho-db
|
||||
restart: unless-stopped
|
||||
environment:
|
||||
POSTGRES_DB: honcho
|
||||
POSTGRES_USER: honcho
|
||||
POSTGRES_PASSWORD: ${HONCHO_DB_PASSWORD:?HONCHO_DB_PASSWORD must be set}
|
||||
healthcheck:
|
||||
test: ["CMD-SHELL", "pg_isready -U honcho -d honcho"]
|
||||
interval: 5s
|
||||
timeout: 5s
|
||||
retries: 10
|
||||
volumes:
|
||||
- /mnt/HoardingCow_docker_data/Honcho/pgdata:/var/lib/postgresql/data
|
||||
- ./honcho/init.sql:/docker-entrypoint-initdb.d/init.sql
|
||||
networks:
|
||||
- ai_backend
|
||||
|
||||
honcho:
|
||||
build:
|
||||
context: ./honcho
|
||||
dockerfile: Dockerfile
|
||||
container_name: honcho
|
||||
restart: unless-stopped
|
||||
ports:
|
||||
- "127.0.0.1:8000:8000"
|
||||
depends_on:
|
||||
honcho-db:
|
||||
condition: service_healthy
|
||||
environment:
|
||||
DB_CONNECTION_URI: postgresql+psycopg://honcho:${HONCHO_DB_PASSWORD:?HONCHO_DB_PASSWORD must be set}@honcho-db:5432/honcho
|
||||
LOG_LEVEL: INFO
|
||||
LLM_OPENAI_API_KEY: ${LLM_OPENAI_API_KEY:-ollama}
|
||||
volumes:
|
||||
- /mnt/HoardingCow_docker_data/Honcho/config.toml:/app/config.toml
|
||||
networks:
|
||||
- ai_backend
|
||||
- ai_net
|
||||
labels:
|
||||
- "traefik.enable=true"
|
||||
- "traefik.docker.network=ai_net"
|
||||
|
||||
- "traefik.http.routers.honcho-http.rule=Host(`honcho.lazyworkhorse.net`)"
|
||||
- "traefik.http.routers.honcho-http.entrypoints=web"
|
||||
- "traefik.http.routers.honcho-http.middlewares=redirect-to-https"
|
||||
|
||||
- "traefik.http.routers.honcho-https.rule=Host(`honcho.lazyworkhorse.net`)"
|
||||
- "traefik.http.routers.honcho-https.entrypoints=websecure"
|
||||
- "traefik.http.routers.honcho-https.tls=true"
|
||||
- "traefik.http.routers.honcho-https.tls.certresolver=njalla"
|
||||
|
||||
- "traefik.http.services.honcho.loadbalancer.server.port=8000"
|
||||
|
||||
holographic-memory:
|
||||
build:
|
||||
context: ./holographic-memory
|
||||
image: holographic-memory:latest
|
||||
container_name: holographic-memory
|
||||
restart: unless-stopped
|
||||
ports:
|
||||
- "127.0.0.1:8100:8100"
|
||||
environment:
|
||||
- HOLOGRAPHIC_DB_PATH=/data/holographic/memory_store.db
|
||||
- HOLOGRAPHIC_PORT=8100
|
||||
- HOLOGRAPHIC_DEFAULT_TRUST=0.5
|
||||
volumes:
|
||||
- /mnt/HoardingCow_docker_data/HolographicMemory:/data/holographic
|
||||
networks:
|
||||
- ai_backend
|
||||
healthcheck:
|
||||
test: ["CMD", "python3", "-c", "import urllib.request; urllib.request.urlopen('http://127.0.0.1:8100/health')"]
|
||||
interval: 30s
|
||||
timeout: 5s
|
||||
retries: 3
|
||||
start_period: 10s
|
||||
# ── Worker Template (commented — uncomment + configure to activate) ──
|
||||
# hermes-worker-1:
|
||||
# <<: *hermes-worker
|
||||
# container_name: hermes-worker-1
|
||||
# environment:
|
||||
# API_SERVER_PORT: "8651"
|
||||
# API_SERVER_KEY: "generated-by-provision-script"
|
||||
# DISCORD_BOT_TOKEN: ${WORKER_1_DISCORD_BOT_TOKEN}
|
||||
# volumes:
|
||||
# - /mnt/HoardingCow_docker_data/Hermes/worker-1:/opt/data
|
||||
# ─────────────────────────────────────────────────────────────
|
||||
|
||||
networks:
|
||||
ai_net:
|
||||
@@ -424,8 +296,8 @@ networks:
|
||||
# - /home/gortium/infra:/data/workspace/infra
|
||||
# environment:
|
||||
# - TZ=America/Toronto
|
||||
# - OPENCLAW_GATEWAY_TOKEN=${OPEN...KEN}
|
||||
# - OPENROUTER_API_KEY=${OPEN...KEY}
|
||||
# - OPENCLAW_GATEWAY_TOKEN=${OPENCLAW_GATEWAY_TOKEN}
|
||||
# - OPENROUTER_API_KEY=${OPENROUTER_API_KEY}
|
||||
# # Point to the sidecar browser
|
||||
# - BROWSER_CDP_URL=http://openclaw-browser:9222
|
||||
# - BROWSER_EVALUATE_ENABLED=true
|
||||
@@ -470,7 +342,7 @@ networks:
|
||||
# - PGID=1000
|
||||
# - PUBLIC_KEY_FILE=/config/ssh/authorized_keys
|
||||
# - SUDO_ACCESS=false
|
||||
# - PASSWORD_ACCESS=***
|
||||
# - PASSWORD_ACCESS=false
|
||||
# volumes:
|
||||
# - /mnt/HoardingCow_docker_data/openclaw/ssh-config:/config
|
||||
# - /home/gortium/infra:/data/workspace/infra:ro
|
||||
|
||||
@@ -79,26 +79,6 @@ PYEOF
|
||||
COPY --chmod=0755 himalaya-ro.sh /usr/local/bin/himalaya-ro
|
||||
|
||||
|
||||
# ---------- Install 7-Zip (7zz) for CHM extraction ----------
|
||||
RUN /opt/hermes/.venv/bin/python3 /dev/stdin << 'PYEOF'
|
||||
import urllib.request, tarfile, os, shutil, subprocess
|
||||
url = 'https://github.com/ip7z/7zip/releases/download/26.01/7z2601-linux-x64.tar.xz'
|
||||
xz = '/tmp/7z2601-linux-x64.tar.xz'
|
||||
urllib.request.urlretrieve(url, xz)
|
||||
os.makedirs('/tmp/7z', exist_ok=True)
|
||||
with tarfile.open(xz, 'r:xz') as t:
|
||||
t.extractall('/tmp/7z')
|
||||
shutil.move('/tmp/7z/7zz', '/usr/local/bin/7zz')
|
||||
os.chmod('/usr/local/bin/7zz', 0o755)
|
||||
shutil.rmtree('/tmp/7z', ignore_errors=True)
|
||||
os.remove(xz)
|
||||
# Verify
|
||||
result = subprocess.run(['/usr/local/bin/7zz'], capture_output=True, text=True)
|
||||
assert result.returncode == 0, f'7zz verify failed: {result.stderr}'
|
||||
print('7-Zip 26.01 installed successfully')
|
||||
PYEOF
|
||||
|
||||
|
||||
# ---------- Runtime ----------
|
||||
USER hermes
|
||||
ENV HERMES_HOME=/opt/data
|
||||
|
||||
@@ -1,72 +0,0 @@
|
||||
# Honcho — Memory infrastructure for stateful AI agents
|
||||
# Builds the Honcho FastAPI server from the official GitHub repository.
|
||||
#
|
||||
# Usage:
|
||||
# docker compose build honcho
|
||||
# docker compose up honcho
|
||||
#
|
||||
# Reference: https://github.com/plastic-labs/honcho
|
||||
|
||||
# ---------------------------------------------------------------------------
|
||||
# Stage 1 — clone source & install dependencies
|
||||
# ---------------------------------------------------------------------------
|
||||
FROM python:3.13-slim-bookworm AS builder
|
||||
|
||||
RUN apt-get update && apt-get install -y git && rm -rf /var/lib/apt/lists/*
|
||||
|
||||
COPY --from=ghcr.io/astral-sh/uv:0.9.24 /uv /bin/uv
|
||||
|
||||
WORKDIR /src
|
||||
RUN git clone --depth 1 --branch main https://github.com/plastic-labs/honcho.git .
|
||||
|
||||
ENV UV_COMPILE_BYTECODE=1
|
||||
ENV UV_LINK_MODE=copy
|
||||
|
||||
# Install project dependencies (frozen from lockfile, no dev)
|
||||
RUN --mount=type=cache,target=/root/.cache/uv \
|
||||
uv sync --frozen --no-install-project --no-group dev
|
||||
|
||||
# ---------------------------------------------------------------------------
|
||||
# Stage 2 — runtime image
|
||||
# ---------------------------------------------------------------------------
|
||||
FROM python:3.13-slim-bookworm AS runtime
|
||||
|
||||
COPY --from=ghcr.io/astral-sh/uv:0.9.24 /uv /bin/uv
|
||||
|
||||
RUN apt-get update && \
|
||||
apt-get install -y --no-install-recommends ca-certificates && \
|
||||
rm -rf /var/lib/apt/lists/*
|
||||
|
||||
WORKDIR /app
|
||||
|
||||
ENV UV_COMPILE_BYTECODE=1
|
||||
ENV UV_LINK_MODE=copy
|
||||
ENV PYTHONDONTWRITEBYTECODE=1
|
||||
ENV PYTHONUNBUFFERED=1
|
||||
ENV PATH="/app/.venv/bin:$PATH"
|
||||
ENV HOME=/app
|
||||
ENV UV_CACHE_DIR=/tmp/uv-cache
|
||||
|
||||
# Copy the dependency layer from the builder
|
||||
COPY --from=builder /src/uv.lock /src/pyproject.toml /app/
|
||||
RUN --mount=type=cache,target=/root/.cache/uv \
|
||||
uv sync --frozen --no-group dev
|
||||
|
||||
# Copy application source and config
|
||||
COPY --from=builder /src/src/ /app/src/
|
||||
COPY --from=builder /src/migrations/ /app/migrations/
|
||||
COPY --from=builder /src/scripts/ /app/scripts/
|
||||
COPY --from=builder /src/docker/ /app/docker/
|
||||
COPY --from=builder /src/alembic.ini /app/alembic.ini
|
||||
|
||||
# Create non-root user
|
||||
RUN addgroup --system app && \
|
||||
adduser --system --ingroup app app && \
|
||||
mkdir -p /tmp/uv-cache && \
|
||||
chown -R app:app /app /tmp/uv-cache
|
||||
|
||||
USER app
|
||||
EXPOSE 8000
|
||||
|
||||
# The entrypoint.sh script runs database migrations then starts the FastAPI server
|
||||
ENTRYPOINT ["sh", "docker/entrypoint.sh"]
|
||||
@@ -1 +0,0 @@
|
||||
CREATE EXTENSION IF NOT EXISTS vector;
|
||||
135
ai/scripts/provision-hermes-worker.sh
Executable file
135
ai/scripts/provision-hermes-worker.sh
Executable file
@@ -0,0 +1,135 @@
|
||||
#!/usr/bin/env bash
set -euo pipefail

# ── Hermes Worker Provisioner ──────────────────────────────
# Adds a new Paperclip Hermes worker to the ai compose stack.
#
# Usage:
#   ./provision-hermes-worker.sh <name> <discord_bot_token_var>
#
# Arguments:
#   name                   Compose service / container name
#                          (letters, digits, "_" and "-").
#   discord_bot_token_var  NAME of the environment variable that holds the
#                          Discord bot token — never the token itself. It is
#                          written into compose.yml as ${VAR}.
#
# Example:
#   ./provision-hermes-worker.sh worker-1 WORKER_1_DISCORD_BOT_TOKEN
#
# The script only ADDS a service block (inserted right before the
# top-level "networks:" key) — it never modifies or removes existing
# content, even commented lines.
#
# Post-provision steps (manual):
#   1. Add secrets to agenix .env file
#   2. systemctl restart ai_stack.service
#   3. Configure Paperclip agent
# ─────────────────────────────────────────────────────────────

# Print an error and abort.
die() {
  echo "❌ $*" >&2
  exit 1
}

NAME="${1:?Usage: $0 <name> <discord_bot_token_var>}"
TOKEN_VAR="${2:?Usage: $0 <name> <discord_bot_token_var>}"

# ── Paths ───────────────────────────────────────────────────
SCRIPT_DIR="$(cd "$(dirname "$0")" && pwd)"
COMPOSE_DIR="$(cd "$SCRIPT_DIR/.." && pwd)"
COMPOSE_FILE="${COMPOSE_DIR}/compose.yml"

# Each Hermes worker gets its own volume on the NFS HoardingCow
VOLUME_BASE="/mnt/HoardingCow_docker_data/Hermes"
VOLUME_DIR="${VOLUME_BASE}/${NAME}"

# The Hermes container runs as UID 10000 (hermes user from Dockerfile)
HERMES_UID=10000

# Name of the anchor on the template's `environment:` mapping (if present).
ENV_ANCHOR_NAME="hermes-worker-env"

# ── Validation ──────────────────────────────────────────────
if ! [ -f "$COMPOSE_FILE" ]; then
  die "compose.yml not found at $COMPOSE_FILE"
fi

# NAME ends up in YAML, a host path, a hostname and a grep pattern, so
# restrict it to characters that are safe in all four.
if ! [[ "$NAME" =~ ^[A-Za-z0-9][A-Za-z0-9_-]*$ ]]; then
  die "Invalid worker name '${NAME}' — use letters, digits, '_' and '-' only"
fi

# Guards against pasting the actual token: it would be committed to
# compose.yml as "${<token>}".
if ! [[ "$TOKEN_VAR" =~ ^[A-Za-z_][A-Za-z0-9_]*$ ]]; then
  die "'<discord_bot_token_var>' must be an environment variable NAME, not the token value"
fi

if grep -q "^  ${NAME}:" "$COMPOSE_FILE"; then
  die "Service '${NAME}' already exists in ${COMPOSE_FILE}"
fi

# The new service is inserted in front of the top-level networks: key;
# without it there is no insertion point.
if ! grep -q '^networks:' "$COMPOSE_FILE"; then
  die "No top-level 'networks:' key in ${COMPOSE_FILE} — cannot locate insertion point"
fi

# ── Generate unique API key ─────────────────────────────────
# Used by Paperclip to authenticate against this worker's
# Hermes API server (/v1/chat/completions)
API_KEY="pc_worker_$(openssl rand -hex 16)"

# ── Find next available API port ────────────────────────────
# Workers get sequential ports starting at 8650.
# Scans compose.yml for existing API_SERVER_PORT values and picks the
# next one. The pattern is anchored to the start of the line so that
# commented-out examples (e.g. the "# API_SERVER_PORT" line of the
# worker template) do not consume a port.
BASE_PORT=8650
MAX_PORT=0
while IFS= read -r port; do
  if [ -n "$port" ] && [ "$port" -gt "$MAX_PORT" ]; then
    MAX_PORT="$port"
  fi
done < <(sed -nE 's/^[[:space:]]*API_SERVER_PORT:[[:space:]]*"([0-9]+)".*/\1/p' "$COMPOSE_FILE" 2>/dev/null)

# 10# forces base 10 so a value with a leading zero is not read as octal.
NEW_PORT=$((10#$MAX_PORT + 1))
if [ "$NEW_PORT" -lt "$BASE_PORT" ]; then
  NEW_PORT=$BASE_PORT
fi

# ── Shared environment ──────────────────────────────────────
# `<<: *hermes-worker` is a shallow merge: the worker's own environment:
# mapping replaces the template's. Merge the template environment back in
# when the template exposes an anchor for it.
ENV_ANCHOR=""
if grep -Eq "^[[:space:]]*environment:[[:space:]]*&${ENV_ANCHOR_NAME}([[:space:]]|\$)" "$COMPOSE_FILE"; then
  ENV_ANCHOR="$ENV_ANCHOR_NAME"
else
  echo "⚠ No '&${ENV_ANCHOR_NAME}' anchor in compose.yml — the worker's environment block" >&2
  echo "  will REPLACE the template environment (YAML '<<' merges are shallow)." >&2
fi

# ── Create volume directory (on NFS) ────────────────────────
echo "📁 Creating volume directory: ${VOLUME_DIR}"
mkdir -p "$VOLUME_DIR"

# Hermes container runs as UID 10000 — set ownership so the
# container can write its config, sessions, skills.
# Best effort: changing ownership usually requires root.
chown -R "${HERMES_UID}:${HERMES_UID}" "$VOLUME_DIR" 2>/dev/null || \
  echo "⚠ Could not chown ${VOLUME_DIR} — run with sudo if needed"

# 755: owner has full access, everyone else may read/traverse
# (handy when debugging from the host).
chmod 755 "$VOLUME_DIR" 2>/dev/null || true

# ── Insert service into compose.yml ─────────────────────────
echo "📝 Appending service '${NAME}' to compose.yml ..."

TMPFILE="$(mktemp)"
trap 'rm -f "$TMPFILE"' EXIT

# Insert the new worker block once, just before the top-level networks:
# section; awk exits non-zero if nothing was inserted.
if ! awk -v name="$NAME" \
         -v port="$NEW_PORT" \
         -v api_key="$API_KEY" \
         -v token_var="$TOKEN_VAR" \
         -v volume_dir="$VOLUME_DIR" \
         -v env_anchor="$ENV_ANCHOR" \
  '
  /^networks:/ && !inserted {
    print ""
    print "  " name ":"
    print "    <<: *hermes-worker"
    print "    container_name: " name
    print "    environment:"
    if (env_anchor != "") {
      print "      <<: *" env_anchor
    }
    print "      API_SERVER_PORT: \"" port "\""
    print "      API_SERVER_KEY: \"" api_key "\""
    print "      DISCORD_BOT_TOKEN: ${" token_var "}"
    print "    volumes:"
    print "      - " volume_dir ":/opt/data"
    print ""
    inserted = 1
  }
  { print }
  END { exit inserted ? 0 : 1 }
  ' "$COMPOSE_FILE" > "$TMPFILE"; then
  die "Failed to insert service '${NAME}' — ${COMPOSE_FILE} left unchanged"
fi

# Write through the existing file instead of mv-ing the temp file over it:
# mktemp creates a 0600 file, and mv would replace compose.yml's mode,
# owner and inode with the temp file's.
cat "$TMPFILE" > "$COMPOSE_FILE"

# ── Done ────────────────────────────────────────────────────
echo ""
echo "✅ Worker '${NAME}' provisioned successfully"
echo ""
echo "────────────────────────────────────────────"
echo "  NEXT STEPS"
echo "────────────────────────────────────────────"
echo ""
echo "1. Add secrets to the agenix .env stack file:"
echo ""
echo "   # ${NAME}"
echo "   ${TOKEN_VAR}=<paste-discord-bot-token-here>"
echo ""
echo "2. Restart the AI stack:"
echo ""
echo "   systemctl restart ai_stack.service"
echo ""
echo "3. In Paperclip, create an agent with HTTP adapter:"
echo ""
echo "   Endpoint: http://${NAME}:${NEW_PORT}/v1/chat/completions"
echo "   API Key:  ${API_KEY}"
echo ""
echo "────────────────────────────────────────────"
|
||||
@@ -1,93 +0,0 @@
|
||||
# Honcho Configuration
|
||||
# Pre-configured for self-hosted deployment with Ollama embeddings.
|
||||
# Mount this file at /app/config.toml in the Honcho container.
|
||||
#
|
||||
# Environment variables override these values at runtime
|
||||
# (e.g. DB_CONNECTION_URI, DERIVER_*).
|
||||
|
||||
[app]
|
||||
LOG_LEVEL = "INFO"
|
||||
NAMESPACE = "honcho"
|
||||
SESSION_OBSERVERS_LIMIT = 10
|
||||
GET_CONTEXT_MAX_TOKENS = 16384
|
||||
EMBED_MESSAGES = true
|
||||
|
||||
[db]
|
||||
# Connection URI is set via environment variable DB_CONNECTION_URI
|
||||
SCHEMA = "public"
|
||||
POOL_SIZE = 10
|
||||
MAX_OVERFLOW = 20
|
||||
POOL_TIMEOUT = 30
|
||||
POOL_RECYCLE = 300
|
||||
POOL_PRE_PING = true
|
||||
POOL_USE_LIFO = true
|
||||
SQL_DEBUG = false
|
||||
|
||||
[auth]
|
||||
USE_AUTH = false
|
||||
|
||||
[llm]
|
||||
DEFAULT_MAX_TOKENS = 4096
|
||||
|
||||
[embedding]
|
||||
VECTOR_DIMENSIONS = 768
|
||||
MAX_INPUT_TOKENS = 8192
|
||||
MAX_TOKENS_PER_REQUEST = 2048
|
||||
|
||||
[embedding.model_config]
|
||||
transport = "openai"
|
||||
model = "nomic-embed-text:latest"
|
||||
|
||||
[embedding.model_config.overrides]
|
||||
base_url = "http://ollama:11434/v1"
|
||||
# Ollama does not require an API key; env var must be set to non-empty string
|
||||
api_key_env = "LLM_OPENAI_API_KEY"
|
||||
|
||||
[deriver]
|
||||
ENABLED = false
|
||||
WORKERS = 1
|
||||
POLLING_SLEEP_INTERVAL_SECONDS = 1.0
|
||||
STALE_SESSION_TIMEOUT_MINUTES = 5
|
||||
DEDUPLICATE = true
|
||||
LOG_OBSERVATIONS = false
|
||||
|
||||
[deriver.model_config]
|
||||
transport = "openai"
|
||||
model = "qwen3.6:27b-q4_K_M"
|
||||
|
||||
[deriver.model_config.overrides]
|
||||
base_url = "http://ollama:11434/v1"
|
||||
api_key_env = "LLM_OPENAI_API_KEY"
|
||||
|
||||
[summary]
|
||||
ENABLED = false
|
||||
|
||||
[summary.model_config]
|
||||
transport = "openai"
|
||||
model = "qwen3.6:27b-q4_K_M"
|
||||
|
||||
[summary.model_config.overrides]
|
||||
base_url = "http://ollama:11434/v1"
|
||||
api_key_env = "LLM_OPENAI_API_KEY"
|
||||
|
||||
[dream]
|
||||
ENABLED = false
|
||||
|
||||
[dialectic]
|
||||
MAX_OUTPUT_TOKENS = 4096
|
||||
MAX_INPUT_TOKENS = 16384
|
||||
|
||||
[cache]
|
||||
ENABLED = false
|
||||
|
||||
[vector_store]
|
||||
TYPE = "pgvector"
|
||||
|
||||
[metrics]
|
||||
ENABLED = false
|
||||
|
||||
[telemetry]
|
||||
ENABLED = false
|
||||
|
||||
[sentry]
|
||||
ENABLED = false
|
||||
31
env/.env.example.honcho
vendored
31
env/.env.example.honcho
vendored
@@ -1,31 +0,0 @@
|
||||
# Honcho Environment Variables
|
||||
# Copy this file to your .env (at the compose root or docker-compose working directory)
|
||||
# and fill in the secrets.
|
||||
#
|
||||
# cp env/.env.example.honcho .env
|
||||
#
|
||||
# Then reference it from compose.yml:
|
||||
# env_file:
|
||||
# - path: .env
|
||||
# required: true
|
||||
|
||||
# ---------------------------------------------------------------------------
|
||||
# Database
|
||||
# ---------------------------------------------------------------------------
|
||||
# PostgreSQL connection string for Honcho.
|
||||
# The password must match HONCHO_DB_PASSWORD below.
|
||||
HONCHO_DB_PASSWORD=change_me_to_a_strong_random_password
|
||||
|
||||
# ---------------------------------------------------------------------------
|
||||
# LLM Provider
|
||||
# ---------------------------------------------------------------------------
|
||||
# Ollama does not require a real API key, but the env var must be set to a
|
||||
# non-empty string for the OpenAI-compatible client to connect.
|
||||
LLM_OPENAI_API_KEY=ollama
|
||||
|
||||
# ---------------------------------------------------------------------------
|
||||
# Honcho Server
|
||||
# ---------------------------------------------------------------------------
|
||||
# Honcho will pick up DB_CONNECTION_URI from the compose environment.
|
||||
# You can override additional settings here if needed.
|
||||
# LOG_LEVEL=INFO
|
||||
@@ -8,10 +8,13 @@ services:
|
||||
- USER_GID=1000
|
||||
- GITEA__server__ROOT_URL=https://code.lazyworkhorse.net
|
||||
- GITEA__actions__ENABLED=true
|
||||
- GITEA__actions__DEFAULT_ACTIONS_URL=off
|
||||
- SSH_PORT=2222
|
||||
- SSH_LISTEN_PORT=2222
|
||||
# Enable Gitea Actions (act_runner required on host)
|
||||
- GITEA__actions__ENABLED=true
|
||||
# Don't fetch actions from GitHub (offline mode + local only)
|
||||
- GITEA__actions__DEFAULT_ACTIONS_URL=off
|
||||
volumes:
|
||||
- /mnt/HoardingCow_docker_data/Gitea:/data
|
||||
networks:
|
||||
|
||||
Reference in New Issue
Block a user