Add AI stack

2025-12-27 12:43:54 -05:00
parent 2b5d5d9df2
commit 57ef5a13b1
4 changed files with 118 additions and 0 deletions
--- a/stacks/ai/ai-backend.hcl
+++ b/stacks/ai/ai-backend.hcl
--- a/stacks/ai/ai-backend.nomad
+++ b/stacks/ai/ai-backend.nomad
@@ -0,0 +1,65 @@
 # Ollama inference backend: a single instance pinned to the eGPU host and
 # published on the fixed host port 11434 so the frontends can reach it.
 job "ai-backend" {
  datacenters = ["Homelab-PTECH-DC"]
  region      = "home"
  type        = "service"
  group "ollama-group" {
    count = 1
    # Pin to P52 Laptop (eGPU Host)
    constraint {
      attribute = "${meta.device}"
      value     = "p52-laptop"
    }
    network {
      # Static host port: clients address the API as <host>:11434.
      port "api" { static = 11434 }
    }
    task "ollama" {
      driver = "podman"
      env {
        # Bind the API to every interface inside the container.
        OLLAMA_HOST    = "0.0.0.0"
        # NOTE(review): "*" accepts requests from any origin; tighten this if
        # the port is ever reachable from outside the trusted network.
        OLLAMA_ORIGINS = "*"
        # CRITICAL FOR 6900XT:
        # Forces ROCm to use the gfx1030 (10.3.0) target for this card.
        HSA_OVERRIDE_GFX_VERSION = "10.3.0"
      }
      config {
        # ROCm build of Ollama. The default `latest` tag does not bundle the
        # ROCm libraries, so the AMD GPU would go unused and inference would
        # fall back to the CPU.
        image = "docker.io/ollama/ollama:rocm"
        ports = ["api"]
        # Required for hardware access
        privileged = true
        volumes = [
          # Persist downloaded models across restarts.
          "/opt/homelab/ollama:/root/.ollama",
          # Pass the graphics hardware (ROCm compute + DRM render nodes) to the container.
          "/dev/kfd:/dev/kfd",
          "/dev/dri:/dev/dri"
        ]
      }
      service {
        name = "ollama"
        port = "api"
        # HTTP liveness probe against the API root.
        check {
          type     = "http"
          path     = "/"
          interval = "20s"
          timeout  = "2s"
        }
      }
      resources {
        cpu    = 2000
        memory = 8192 # 8GB System RAM (The GPU has its own VRAM)
      }
    }
  }
 }
--- a/stacks/ai/ai-frontend.hcl
+++ b/stacks/ai/ai-frontend.hcl
--- a/stacks/ai/ai-frontend.nomad
+++ b/stacks/ai/ai-frontend.nomad
@@ -0,0 +1,53 @@
 # Web frontends for the Ollama backend: Open WebUI and LobeChat, each in its
 # own group with a dynamically assigned host port and a Traefik-enabled service.
 job "ai-frontend" {
  datacenters = ["Homelab-PTECH-DC"]
  region      = "home"
  type        = "service"
  group "openwebui" {
    count = 1
    network {
      # Dynamic host port mapped to the container's port 8080.
      port "http" { to = 8080 }
    }
    service {
      name = "openwebui"
      port = "http"
      tags = ["traefik.enable=true"]
    }
    task "server" {
      driver = "podman"
      env {
        # Reach the backend through its Consul service name on the static API port.
        OLLAMA_BASE_URL = "http://ollama.service.consul:11434"
      }
      config {
        image = "ghcr.io/open-webui/open-webui:main"
        ports = ["http"]
        # Persist application data across restarts.
        volumes = ["/opt/homelab/openwebui:/app/backend/data"]
      }
      # HCL has no ';' separator and a single-line block may hold only one
      # argument, so the resources must be written in multi-line form.
      resources {
        cpu    = 1000
        memory = 1024
      }
    }
  }
  group "lobechat" {
    count = 1
    network {
      # Dynamic host port mapped to the container's port 3210.
      port "http" { to = 3210 }
    }
    service {
      name = "lobechat"
      port = "http"
      tags = ["traefik.enable=true"]
    }
    task "server" {
      driver = "podman"
      env {
        # Reach the backend through its Consul service name on the static API port.
        OLLAMA_PROXY_URL = "http://ollama.service.consul:11434"
      }
      # ACCESS_CODE is a credential and must not be committed in plaintext.
      # It is read from a Nomad Variable and exported as an environment
      # variable. Create it before running the job (requires Nomad 1.4+):
      #   nomad var put nomad/jobs/ai-frontend lobechat_access_code=<secret>
      # The task will not start until the variable exists.
      template {
        destination = "secrets/lobechat.env"
        env         = true
        data        = <<-EOH
          ACCESS_CODE={{ with nomadVar "nomad/jobs/ai-frontend" }}{{ .lobechat_access_code }}{{ end }}
        EOH
      }
      config {
        image = "docker.io/lobehub/lobe-chat"
        ports = ["http"]
      }
      # Multi-line form for the same reason as above: ';' is not valid HCL.
      resources {
        cpu    = 500
        memory = 512
      }
    }
  }
 }