refactor: split ai/ into hermes/ and ollama/ directories

- Rename ai/ to hermes/ (Hermes agent service)
- Move ai/ollama/ to ollama/ (top-level, Ollama ROCm/gfx906 service)
- Add ollama/compose.yml for standalone ollama deployment
- Update hermes/compose.yml: remove ollama service (now in ollama/)
- Update Makefile SERVICES list: ai -> hermes, add ollama
- Bump ollama version from v0.13.5 to v0.23.2
2026-05-09 21:44:46 -04:00
parent ef58155897
commit 781d98046b
8 changed files with 92 additions and 312 deletions
--- a/ollama/compose.yml
+++ b/ollama/compose.yml
@@ -0,0 +1,41 @@
+version: "3.8"  # NOTE(review): obsolete under the Compose Specification; Compose v2 ignores it
+
+services:
+  ollama:  # the only service declared in this compose file
+    build:
+      context: ./  # build context is the directory holding this compose file
+      dockerfile: Dockerfile
+    image: ollama/ollama:rocm-gfx906  # name:tag for the image built from the Dockerfile above
+    container_name: ollama
+    privileged: true  # NOTE(review): broad grant; devices + group_add below may suffice - confirm
+    tty: true
+    restart: always
+    ports:
+      - "127.0.0.1:11434:11434"  # published on the host loopback interface only
+    networks:
+      - ai_backend  # declared as an external network at the bottom of this file
+    volumes:
+      - /mnt/HoardingCow_docker_data/Ollama/ollama:/root/.ollama  # host dir -> /root/.ollama
+    environment:
+      - OLLAMA_VULKAN=0
+      - OLLAMA_HOST=0.0.0.0  # in-container bind address; host exposure is limited by ports above
+      - OLLAMA_DEBUG=1  # NOTE(review): presumably verbose logging - confirm it is wanted long-term
+      - OLLAMA_FLASH_ATTENTION=0
+      - OLLAMA_NUM_PARALLEL=2
+      # ROCm / gfx906 configuration
+      - HSA_OVERRIDE_GFX_VERSION=9.0.6
+      - HCC_AMDGPU_TARGET=gfx906
+      - HIP_VISIBLE_DEVICES=0,1  # device indices 0 and 1; same list as ROCR_VISIBLE_DEVICES
+      - ROCR_VISIBLE_DEVICES=0,1
+      - HSA_ENABLE_SDMA=0
+    devices:
+      - /dev/kfd:/dev/kfd  # host device nodes passed through at the same paths
+      - /dev/dri:/dev/dri
+    group_add:
+      - "303"  # NOTE(review): numeric GIDs, presumably host render/video groups - verify on host
+      - "26"
+
+networks:
+  ai_backend:
+    external: true  # not created by this file; the network must already exist
+    name: ai_backend