---
# Mark44 (Hulkbuster) — Heavy GPU compute node
node_type: gpu_heavy
has_gpu: true
gpu_type: nvidia
gpu_model: "RTX 4070"
vram_mb: 12282

# GPU-specific packages
extra_packages:
  - nvidia-driver  # NVIDIA driver (if not already installed via proprietary)
  - cuda-toolkit  # CUDA toolkit for ML workloads
  - nvtop  # GPU monitoring (better than nvidia-smi for live view)
  - nethogs  # Network per-process monitoring
  - iotop  # I/O per-process monitoring

# Ollama models — largest VRAM headroom, can run big models
ollama_models:
  - gemma4:e4b  # Already pulled — keep it
  - qwen2.5-coder:14b  # Primary coding model
  - qwen2.5:14b  # General purpose large model
  - mistral:7b  # Fallback fast model

# Services (one mapping per service: its name and whether it is enabled)
managed_services:
  - name: ollama
    enabled: true
  - name: open-webui
    enabled: true
  - name: hermes-gateway
    enabled: true

# Service ports (the Ollama value is the standard port)
ollama_port: 11434
open_webui_port: 8080

# Hermes auto-update offset (minutes from hour mark)
hermes_update_offset: 10