refactor: split ai/ into hermes/ and ollama/ directories
- Rename ai/ to hermes/ (Hermes agent service)
- Move ai/ollama/ to ollama/ (top-level, Ollama ROCm/gfx906 service)
- Add ollama/compose.yml for standalone Ollama deployment
- Update hermes/compose.yml: remove ollama service (now in ollama/)
- Update Makefile SERVICES list: ai -> hermes, add ollama
- Bump Ollama version from v0.13.5 to v0.23.2
This commit is contained in:
38
hermes/compose.yml
Normal file
38
hermes/compose.yml
Normal file
@@ -0,0 +1,38 @@
|
||||
# Compose definition for the Hermes agent service.
#
# No Ollama service is defined in this file; Hermes is pointed at
# http://ollama:11434 (see OLLAMA_HOST) and joins the pre-existing external
# network "ai_backend" — presumably the Ollama container is attached to the
# same network under the name "ollama"; verify against ollama/compose.yml.
#
# `version` is retained for legacy docker-compose v1; Compose v2 treats the
# key as obsolete and ignores it.
version: "3.8"

services:
  hermes:
    build: ./
    container_name: hermes
    restart: always
    # Gateway run enables the internal API server on port 8642
    command: gateway run
    environment:
      - OLLAMA_HOST=http://ollama:11434
      - API_SERVER_ENABLED=true
      - API_SERVER_PORT=8642
      # No `ports:` mapping is declared, so the API is not published on the
      # host by this file even though it binds to all interfaces.
      - API_SERVER_HOST=0.0.0.0
      # Can be overridden from the host environment or a .env file; falls back
      # to the previous hard-coded value when API_SERVER_KEY is unset or empty.
      - API_SERVER_KEY=${API_SERVER_KEY:-hermes_local_key}
      - GATEWAY_ALLOW_ALL_USERS=true
      # NOTE(review): the variable name was truncated in the source
      # ("${OPEN...KEY}"); reconstructed as OPENROUTER_API_KEY — confirm.
      - OPENROUTER_API_KEY=${OPENROUTER_API_KEY}
      # ROCm for GPU-accelerated faster-whisper STT
      - HSA_OVERRIDE_GFX_VERSION=9.0.6
      - HCC_AMDGPU_TARGET=gfx906
      - HIP_VISIBLE_DEVICES=0,1
      - ROCR_VISIBLE_DEVICES=0,1
      - HSA_ENABLE_SDMA=0
    volumes:
      - /mnt/HoardingCow_docker_data/Hermes/data:/opt/data
    devices:
      # AMD GPU compute (kfd) and render (dri) device nodes.
      - /dev/kfd:/dev/kfd
      - /dev/dri:/dev/dri
    group_add:
      # Numeric host GIDs, quoted so they stay strings.
      # NOTE(review): presumably the host's render/video groups — confirm.
      - "303"
      - "26"
    networks:
      - ai_backend

networks:
  ai_backend:
    # external: the network must already exist; Compose will not create it.
    external: true
    name: ai_backend
|
||||
Reference in New Issue
Block a user