Initial fleet ansible config - 2026-05-21T14:00:49-04:00

2026-05-21 14:00:49 -04:00
commit cea2a0ff15
8 changed files with 287 additions and 0 deletions
--- a/host_vars/artemis.yml
+++ b/host_vars/artemis.yml
@@ -0,0 +1,31 @@
+---
+# Artemis (AI Foreman) — host vars for the control node; no NVIDIA GPU (has_gpu: false)
+node_type: foreman
+has_gpu: false
+
+# Artemis-specific packages (monitoring and control tooling)
+extra_packages:
+  - nvtop                    # GPU monitoring (reports AMD iGPU info if available)
+  - nethogs                  # Per-process network monitoring
+  - iotop                    # Per-process I/O monitoring
+  - lm-sensors               # Temperature/fan monitoring
+  - stress-ng                # Load testing
+  - cockpit                  # Web-based system management
+
+# Services to manage (packages only, not auto-started) — NOTE(review): enabled is true below; confirm intent
+managed_services:
+  - name: hermes-gateway
+    enabled: true
+  - name: hermes-dashboard
+    enabled: true
+
+# Ollama models for Artemis (CPU inference, so small models only)
+ollama_models:
+  - gemma3:4b                # Small enough for CPU
+  - phi4-mini:latest         # Tiny, fast (NOTE: ":latest" is an unpinned tag)
+
+# Hermes configuration: upstream provider, model ID, and context length
+hermes_config:
+  provider: openrouter
+  model: openai/gpt-4o-mini
+  context_length: 128000
--- a/host_vars/bones.yml
+++ b/host_vars/bones.yml
@@ -0,0 +1,27 @@
+---
+# Bones (Mark XLI) — host vars for the headless, CPU-only node (has_gpu: false)
+node_type: headless
+has_gpu: false
+
+# Headless essentials (hardware health and tuning tools)
+extra_packages:
+  - cpufrequtils              # CPU frequency management
+  - lm-sensors               # Temperature monitoring
+  - smartmontools             # Disk health monitoring
+  - hdparm                    # Disk performance tuning
+  - netdata                   # Lightweight monitoring (optional)
+
+# Services managed on Bones
+managed_services:
+  - name: jarvis              # Paperclip + Ollama + PostgreSQL stack
+    enabled: true
+  - name: ollama              # CPU inference only
+    enabled: true
+
+# Ollama models for Bones (CPU inference, very small models only)
+ollama_models:
+  - gemma3:1b                # Ultra-tiny for CPU
+
+# Node-specific vars (storage description, JVM heap) — NOTE(review): consumer of jvm_heap is not shown here
+bones_storage: "256GB SSD"
+jvm_heap: "512m"
--- a/host_vars/hulkbuster.yml
+++ b/host_vars/hulkbuster.yml
@@ -0,0 +1,32 @@
+---
+# Mark44 (Hulkbuster) — host vars for the heavy GPU compute node
+node_type: gpu_heavy
+has_gpu: true
+gpu_type: nvidia
+gpu_model: "RTX 4070"
+vram_mb: 12282
+
+# GPU-side tooling only; drivers are not listed here (Mark44 uses the proprietary NVIDIA package)
+extra_packages:
+  - nvtop                     # GPU monitoring
+  - nethogs                   # Network per-process monitoring
+  - iotop                     # I/O per-process monitoring
+
+# Ollama models — largest VRAM headroom in the fleet, so the big models go here
+ollama_models:
+  - gemma4:e4b               # Already pulled — keep it
+  - qwen2.5-coder:14b        # Primary coding model
+  - qwen2.5:14b             # General purpose large model
+
+# Services managed on Mark44
+managed_services:
+  - name: ollama
+    enabled: true
+  - name: open-webui
+    enabled: true
+  - name: hermes-gateway
+    enabled: true
+
+# Service ports: Ollama (standard port) and Open WebUI
+ollama_port: 11434
+open_webui_port: 8080
--- a/host_vars/mark5.yml
+++ b/host_vars/mark5.yml
@@ -0,0 +1,30 @@
+---
+# Mark5 (Suitcase) — host vars for the mobile/light GPU node (laptop)
+node_type: gpu_light
+has_gpu: true
+gpu_type: nvidia
+gpu_model: "RTX 4060 Laptop"
+vram_mb: 8188
+
+# Laptop-specific packages (GPU monitoring plus power management)
+extra_packages:
+  - nvtop                     # GPU monitoring
+  - powertop                  # Power management analysis
+  - tlp                       # Laptop power management
+  - htop                      # Also in the baseline set; listed to ensure it is present
+
+# Ollama models — limited VRAM, so smaller models only
+ollama_models:
+  - qwen2.5-coder:7b         # Small coding model
+  - gemma3:4b                # Tiny, fast
+  - llama3.1:8b              # Balanced
+
+# Services managed on Mark5
+managed_services:
+  - name: ollama
+    enabled: true
+  - name: hermes-gateway
+    enabled: true
+
+# Port used for Ollama on this node
+ollama_port: 11434
--- a/host_vars/nebuchadnezzar.yml
+++ b/host_vars/nebuchadnezzar.yml
@@ -0,0 +1,28 @@
+---
+# Neo (Nebuchadnezzar) — host vars for the services node
+# Runs Nextcloud AIO + Vaultwarden ONLY. OS: Debian.
+node_type: services
+has_gpu: false
+
+# Services-specific packages (container runtime, auth helper, TLS, scheduling)
+extra_packages:
+  - docker.io                # Nextcloud AIO is container-based
+  - docker-compose           # Compose for multi-service stacks
+  - apache2-utils            # htpasswd for Vaultwarden basic auth
+  - certbot                  # Let's Encrypt automation
+  - cron                     # Ensure cron is present
+
+# Services managed on Neo
+managed_services:
+  - name: nextcloud-aio
+    enabled: true
+  - name: vaultwarden
+    enabled: true
+
+# Ollama models: none — not an inference node (explicit empty list, not null)
+ollama_models: []
+
+# Neo-specific vars — NOTE(review): nextcloud_aio (underscore) here vs nextcloud-aio (hyphen) above; confirm
+neo_services:
+  - nextcloud_aio
+  - vaultwarden