- Rename ai/ to hermes/ (Hermes agent service)
- Move ai/ollama/ to ollama/ (top-level, Ollama ROCm/gfx906 service)
- Add ollama/compose.yml for standalone ollama deployment
- Update hermes/compose.yml: remove ollama service (now in ollama/)
- Update Makefile SERVICES list: ai -> hermes, add ollama
- Bump ollama version from v0.13.5 to v0.23.2
39 lines
945 B
YAML
39 lines
945 B
YAML
# Compose definition for the Hermes agent service.
# No Ollama service is defined in this file; Hermes is pointed at
# http://ollama:11434 (presumably resolved over the shared external
# `ai_backend` network -- confirm against the ollama compose file).
#
# NOTE(review): the top-level `version` key is obsolete under the Compose
# Specification and only produces a warning on Docker Compose v2; it is kept
# here so legacy docker-compose v1 still accepts the file.
version: "3.8"

services:
  hermes:
    build: ./
    container_name: hermes
    restart: always
    # Gateway run enables the internal API server on port 8642
    command: gateway run
    environment:
      - OLLAMA_HOST=http://ollama:11434
      - API_SERVER_ENABLED=true
      - API_SERVER_PORT=8642
      - API_SERVER_HOST=0.0.0.0
      # Overridable from the host environment / .env file; falls back to the
      # previous hard-coded value when API_SERVER_KEY is unset or empty.
      - "API_SERVER_KEY=${API_SERVER_KEY:-hermes_local_key}"
      - GATEWAY_ALLOW_ALL_USERS=true
      # Passed through from the host environment / .env file.
      - "OPENROUTER_API_KEY=${OPENROUTER_API_KEY}"
      # ROCm for GPU-accelerated faster-whisper STT
      - HSA_OVERRIDE_GFX_VERSION=9.0.6
      - HCC_AMDGPU_TARGET=gfx906
      - HIP_VISIBLE_DEVICES=0,1
      - ROCR_VISIBLE_DEVICES=0,1
      - HSA_ENABLE_SDMA=0
    volumes:
      - /mnt/HoardingCow_docker_data/Hermes/data:/opt/data
    # GPU device nodes exposed to the container for ROCm.
    devices:
      - /dev/kfd:/dev/kfd
      - /dev/dri:/dev/dri
    # Supplementary group IDs, quoted so they stay strings.
    # NOTE(review): presumably the host's render/video GIDs that own the
    # device nodes above -- verify on the target host.
    group_add:
      - "303"
      - "26"
    networks:
      - ai_backend

networks:
  # Pre-existing network: Compose attaches to it and does not create it.
  ai_backend:
    external: true
    name: ai_backend