Repository: perrymanuk/hashi-homelab
Branch: master
Commit: c1705ab65354
Files: 180
Total size: 450.4 KB

Directory structure:
gitextract_ikark14b/

├── .bootstrap.mk
├── .gitattributes
├── .github/
│   └── workflows/
│       ├── build-gcp-dns-updater.yaml
│       ├── nomad.yaml
│       ├── update-kideo.yaml
│       ├── update-minecraftmath.yaml
│       ├── update-radbot-dev.yaml
│       └── update-radbot.yaml
├── .gitignore
├── LICENSE
├── Makefile
├── README.md
├── ansible/
│   ├── configs/
│   │   ├── consul.hcl.j2
│   │   ├── consul.service
│   │   ├── docker-daemon.json.j2
│   │   ├── nomad.hcl.j2
│   │   └── nomad.service
│   ├── playbook.yml
│   └── zsh.yml
├── docker_images/
│   ├── gcp-dns-updater/
│   │   ├── Dockerfile
│   │   ├── README.md
│   │   ├── requirements.txt
│   │   └── update_dns.py
│   └── update-metadata/
│       ├── Dockerfile
│       ├── README.md
│       ├── requirements.txt
│       └── update_job_metadata.py
├── envrc
├── nomad_jobs/
│   ├── TEMPLATE-volume.hcl
│   ├── TEMPLATE.job
│   ├── ai-ml/
│   │   ├── cognee/
│   │   │   └── nomad.job
│   │   ├── crawl4ai/
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   ├── litellm/
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   ├── manyfold/
│   │   │   ├── 3dprints-volume.hcl
│   │   │   ├── nomad.job
│   │   │   ├── prints_volume.hcl
│   │   │   └── volume.hcl
│   │   ├── ollama/
│   │   │   └── nomad.job
│   │   ├── open-webui/
│   │   │   └── nomad.job
│   │   ├── paperless-ai/
│   │   │   └── nomad.job
│   │   ├── pgvector-client/
│   │   │   └── nomad.job
│   │   └── radbot/
│   │       ├── nomad-dev.job
│   │       └── nomad.job
│   ├── core-infra/
│   │   ├── coredns/
│   │   │   ├── README.md
│   │   │   └── nomad.job
│   │   ├── github-runner/
│   │   │   └── nomad.job
│   │   ├── haproxy/
│   │   │   └── nomad.job
│   │   ├── iscsi-csi-plugin/
│   │   │   ├── controller.job
│   │   │   └── node.job
│   │   ├── keepalived/
│   │   │   ├── TODO.md
│   │   │   └── nomad.job
│   │   ├── nfs-csi-plugin/
│   │   │   ├── controller.job
│   │   │   └── nodes.job
│   │   ├── pihole/
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   ├── smtp/
│   │   │   └── nomad.job
│   │   ├── tailscale/
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   ├── tailscale-este/
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   ├── traefik/
│   │   │   ├── config/
│   │   │   │   ├── consul-catalog.yml
│   │   │   │   ├── consul.yml
│   │   │   │   ├── traefik.toml
│   │   │   │   ├── traefik.toml.new
│   │   │   │   └── traefik.toml.test
│   │   │   └── nomad.job
│   │   ├── traefik-forward-auth/
│   │   │   └── nomad.job
│   │   └── vault/
│   │       └── secrets_template.yaml
│   ├── gaming/
│   │   ├── minecraft-1.21/
│   │   │   └── nomad.job
│   │   ├── minecraft-avaritia/
│   │   │   └── nomad.job
│   │   ├── minecraft-axiom/
│   │   │   └── nomad.job
│   │   ├── minecraft-fiskheroes/
│   │   │   └── nomad.job
│   │   └── minecraft-forge/
│   │       └── nomad.job
│   ├── media-stack/
│   │   ├── audioserve/
│   │   │   └── nomad.job
│   │   ├── flaresolverr/
│   │   │   └── nomad.job
│   │   ├── jackett/
│   │   │   └── nomad.job
│   │   ├── lazylibrarian/
│   │   │   └── nomad.job
│   │   ├── lidarr/
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   ├── lidify/
│   │   │   └── nomad.job
│   │   ├── maintainerr/
│   │   │   └── nomad.job
│   │   ├── mediasage/
│   │   │   └── nomad.job
│   │   ├── multi-scrobbler/
│   │   │   └── nomad.job
│   │   ├── navidrome/
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   ├── ombi/
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   ├── overseerr/
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   ├── plex/
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   ├── prowlarr/
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   ├── qbittorrent/
│   │   │   └── nomad.job
│   │   ├── radarr/
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   ├── requestrr/
│   │   │   └── nomad.job
│   │   ├── sabnzbd/
│   │   │   └── nomad.job
│   │   ├── sickchill/
│   │   │   └── nomad.job
│   │   ├── sonarr/
│   │   │   └── nomad.job
│   │   ├── synclounge/
│   │   │   └── nomad.job
│   │   ├── tautulli/
│   │   │   └── nomad.job
│   │   └── tdarr/
│   │       ├── nomad.job
│   │       └── volume.hcl
│   ├── misc/
│   │   ├── adb/
│   │   │   └── nomad.job
│   │   ├── gcp-dns-updater/
│   │   │   ├── Dockerfile
│   │   │   ├── README.md
│   │   │   ├── nomad.job
│   │   │   ├── requirements.txt
│   │   │   └── update_dns.py
│   │   ├── gitea/
│   │   │   └── nomad.job
│   │   ├── linuxgsm/
│   │   │   └── nomad.job
│   │   ├── murmur/
│   │   │   └── nomad.job
│   │   ├── octoprint/
│   │   │   └── nomad.job
│   │   └── uploader/
│   │       └── nomad.job
│   ├── observability/
│   │   ├── alertmanager/
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   ├── blackbox-exporter/
│   │   │   └── nomad.job
│   │   ├── grafana/
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   ├── loki/
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   ├── oom-test/
│   │   │   └── nomad.job
│   │   ├── prometheus/
│   │   │   ├── README.md
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   ├── telegraf/
│   │   │   └── nomad.job
│   │   ├── truenas-graphite-exporter/
│   │   │   └── nomad.job
│   │   └── vector/
│   │       └── nomad.job
│   ├── personal-cloud/
│   │   ├── actualbudget/
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   ├── bitwarden/
│   │   │   └── nomad.job
│   │   ├── nextcloud/
│   │   │   └── nomad.job
│   │   ├── ntfy/
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   ├── paperless/
│   │   │   └── nomad.job
│   │   └── radicale/
│   │       └── nomad.job
│   ├── security/
│   │   ├── suricata/
│   │   │   └── nomad.job
│   │   ├── suricata-update/
│   │   │   └── nomad.job
│   │   ├── wazuh-agent/
│   │   │   └── nomad.job
│   │   └── wazuh-server/
│   │       ├── nomad.job
│   │       ├── volume-dashboard.hcl
│   │       ├── volume-indexer.hcl
│   │       └── volume-manager.hcl
│   ├── smart-home/
│   │   ├── deconz/
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   ├── home-assistant/
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   ├── mqtt/
│   │   │   └── nomad.job
│   │   ├── owntracks-recorder/
│   │   │   └── nomad.job
│   │   └── zigbee2mqtt/
│   │       └── nomad.job
│   ├── storage-backends/
│   │   ├── docker-registry/
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   ├── mariadb/
│   │   │   └── nomad.job
│   │   ├── neo4j/
│   │   │   ├── nomad.job
│   │   │   ├── setup.job
│   │   │   └── volume.hcl
│   │   ├── pgvector/
│   │   │   ├── nomad.job
│   │   │   └── pgvector-setup.job
│   │   ├── postgres/
│   │   │   ├── nomad.job
│   │   │   └── postgres-setup.job
│   │   ├── qdrant/
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   ├── redis/
│   │   │   ├── nomad.job
│   │   │   └── volume.hcl
│   │   └── volumes/
│   │       └── nfs-example.hcl
│   ├── system/
│   │   └── docker-cleanup/
│   │       └── nomad.job
│   └── web-apps/
│       ├── alertmanager-dashboard/
│       │   └── nomad.job
│       ├── firecrawl/
│       │   └── nomad.job
│       ├── heimdall/
│       │   └── nomad.job
│       ├── homepage/
│       │   └── nomad.job
│       ├── kideo/
│       │   └── nomad.job
│       ├── minecraftmath/
│       │   └── nomad.job
│       ├── wordpress/
│       │   └── nomad.job
│       └── www/
│           ├── Dockerfile
│           └── nomad.job
├── renovate.json
└── services/
    └── beefcake.json

================================================
FILE CONTENTS
================================================

================================================
FILE: .bootstrap.mk
================================================
export VERSION_TAG=$(shell git rev-parse --short HEAD)
export JOB_NAME=$(shell basename $PWD)

dash-split = $(word $2,$(subst -, ,$1))
dash-1 = $(call dash-split,$*,1)
dash-2 = $(call dash-split,$*,2)

help:##............Show this help.
	@echo ""
	@fgrep -h "##" $(MAKEFILE_LIST) | fgrep -v fgrep | sed -e 's/\\$$//' | sed -e 's/##//' | sed 's/^/    /'
	@echo ""
	@echo ""


================================================
FILE: .gitattributes
================================================
*.job linguist-language=HCL


================================================
FILE: .github/workflows/build-gcp-dns-updater.yaml
================================================
# .github/workflows/build-gcp-dns-updater.yaml
name: Build GCP DNS Updater Image

on:
  push:
    branches:
      - main
    paths:
      - 'docker_images/gcp-dns-updater/**'
  workflow_dispatch:

jobs:
  build-and-push:
    runs-on: ubuntu-latest
    permissions:
      contents: read
      packages: write # Required for pushing to GitHub Packages if used, good practice anyway

    steps:
      - name: Checkout Code
        uses: actions/checkout@v6

      - name: Set up Docker Buildx
        uses: docker/setup-buildx-action@v4

      - name: Login to Docker Registry
        uses: docker/login-action@v4
        with:
          registry: docker.${{ secrets.NOMAD_VAR_tld }}
          username: ${{ secrets.DOCKER_REGISTRY_USER }}
          password: ${{ secrets.DOCKER_REGISTRY_PASSWORD }}

      - name: Build Image using Makefile
        env:
          NOMAD_VAR_tld: ${{ secrets.NOMAD_VAR_tld }}
        run: make build-gcp-dns-updater

      - name: Push Image
        run: docker push docker.${{ secrets.NOMAD_VAR_tld }}/gcp-dns-updater:latest


================================================
FILE: .github/workflows/nomad.yaml
================================================
on:
  push:
    branches:
      - master

jobs:
  # JOB to run change detection
  changes:
    runs-on: ubuntu-latest
    permissions:
      pull-requests: read
    outputs:
      jobs: ${{ steps.filter.outputs.nomadjobs_files }}
      volumes: ${{ steps.filter_volumes.outputs.volumes_files }}
    steps:
    - name: 'Checkout'
      uses: 'actions/checkout@v6'

    - uses: dorny/paths-filter@v4
      id: filter_volumes
      with:
        list-files: 'json'
        filters: |
          volumes:
            - 'nomad_jobs/**/volume.hcl'
            - 'nomad_jobs/**/*-volume.hcl'

    - uses: dorny/paths-filter@v4
      id: filter
      with:
        list-files: 'json'
        filters: |
          nomadjobs:
            # Updated paths based on directory restructure
            - 'nomad_jobs/media-stack/plex/*.job'
            - 'nomad_jobs/media-stack/radarr/*.job'
            - 'nomad_jobs/media-stack/lidarr/*.job'
            - 'nomad_jobs/media-stack/overseerr/*.job'
            - 'nomad_jobs/storage-backends/postgres/*.job'
            - 'nomad_jobs/storage-backends/redis/*.job'
            - 'nomad_jobs/storage-backends/pgvector/*.job'
            - 'nomad_jobs/core-infra/coredns/*.job'
            - 'nomad_jobs/storage-backends/iscsi-csi-plugin/*.job'
            - 'nomad_jobs/media-stack/sabnzbd/*.job'
            - 'nomad_jobs/media-stack/qbittorrent/*.job'
            - 'nomad_jobs/media-stack/prowlarr/*.job'
            - 'nomad_jobs/media-stack/tdarr/*.job'
            - 'nomad_jobs/core-infra/smtp/*.job'
            - 'nomad_jobs/ai-ml/ollama/*.job'
            - 'nomad_jobs/ai-ml/open-webui/*.job'
            - 'nomad_jobs/misc/gcp-dns-updater/*.job'
            - 'nomad_jobs/core-infra/tailscale-este/*.job'
            - 'nomad_jobs/core-infra/traefik/*.job'
            - 'nomad_jobs/core-infra/iscsi-csi-plugin/*.job'
            - 'nomad_jobs/observability/alertmanager/*.job'
            - 'nomad_jobs/observability/prometheus/*.job'
            - 'nomad_jobs/ai-ml/radbot/*.job'
            - 'nomad_jobs/personal-cloud/ntfy/*.job'
            - 'nomad_jobs/web-apps/homepage/*.job'
            - 'nomad_jobs/media-stack/multi-scrobbler/*.job'
            - 'nomad_jobs/media-stack/lidify/*.job'
            - 'nomad_jobs/media-stack/mediasage/*.job'
            - 'nomad_jobs/core-infra/netboot-xyz/*.job'
            - 'nomad_jobs/web-apps/kideo/*.job'
            - 'nomad_jobs/web-apps/minecraftmath/*.job'

  add_volumes:
    runs-on: ubuntu-latest
    needs: changes
    if: needs.changes.outputs.volumes != '[]'
    continue-on-error: true
    strategy:
      matrix:
        job: ${{ fromJSON(needs.changes.outputs.volumes ) }}

    steps:
    - name: 'Checkout'
      uses: 'actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd' # v6

    - name: Connect to Tailscale
      uses: tailscale/github-action@v4
      with:
        oauth-client-id: ${{ secrets.TAILSCALE_OAUTH_CLIENT_ID }}
        oauth-secret: ${{ secrets.TAILSCALE_OAUTH_SECRET }}
        tags: tag:github-actions
        args: --accept-dns=true

    - name: Setup Nomad
      uses: hashicorp/setup-nomad@v1.0.0
      with:
        version: "1.10.4"

    - name: deploy
      shell: bash
      run: |
        # Extract volume ID from the HCL file
        VOLUME_ID=$(grep '^id' ${{ matrix.job }} | head -1 | sed 's/.*= *"\(.*\)"/\1/')
        # Skip if volume already exists
        if nomad volume status "$VOLUME_ID" > /dev/null 2>&1; then
          echo "Volume '$VOLUME_ID' already exists, skipping creation"
        else
          echo "Creating volume '$VOLUME_ID'"
          nomad volume create ${{ matrix.job }}
        fi
      env:
        NOMAD_ADDR: '${{ secrets.NOMAD_ADDR }}'

  deploy_jobs:
    runs-on: ubuntu-latest
    needs: changes
    if: needs.changes.outputs.jobs != '[]'
    continue-on-error: true
    strategy:
      matrix:
        job: ${{ fromJSON(needs.changes.outputs.jobs ) }}

    steps:
    - name: 'Checkout'
      uses: 'actions/checkout@de0fac2e4500dabe0009e67214ff5f5447ce83dd' # v6

    - name: Connect to Tailscale
      uses: tailscale/github-action@v4
      with:
        oauth-client-id: ${{ secrets.TAILSCALE_OAUTH_CLIENT_ID }}
        oauth-secret: ${{ secrets.TAILSCALE_OAUTH_SECRET }}
        tags: tag:github-actions
        args: --accept-dns=true

    - name: Setup Nomad
      uses: hashicorp/setup-nomad@v1.0.0
      with:
        version: "1.10.4"

    - name: deploy
      shell: bash
      run: |
        nomad job run ${{ matrix.job }} # Removed -var flags
      env:
        NOMAD_ADDR: '${{ secrets.NOMAD_ADDR }}'
        NOMAD_VAR_region: 'home'
        NOMAD_VAR_tld: '${{ secrets.NOMAD_VAR_tld }}' # Corrected case
        NOMAD_VAR_shared_dir: '/home/shared/'
        NOMAD_VAR_downloads_dir: '/home/sabnzbd/downloads'
        NOMAD_VAR_music_dir: '/home/media/Music'
        NOMAD_VAR_movies_dir: '/home/media/Movies'
        NOMAD_VAR_books_dir: '/home/media/Books'
        NOMAD_VAR_tv_dir: '/home/media/TV'
        NOMAD_VAR_media_dir: '/home/media'
        NOMAD_VAR_hass_key: '${{ secrets.NOMAD_VAR_hass_key }}' # Corrected case
        NOMAD_VAR_hass_ip: '${{ secrets.NOMAD_VAR_hass_ip }}'
        NOMAD_VAR_github_pat: ${{ secrets.NOMAD_VAR_github_pat }} # Corrected case
        NOMAD_VAR_datacenters_all: '["dc1", "public"]'
        NOMAD_VAR_datacenters_dc1: '["dc1"]'
        NOMAD_VAR_datacenters_public: '["public"]'
        NOMAD_VAR_tailscale_auth: '${{ secrets.NOMAD_VAR_tailscale_auth }}' # Corrected case
        NOMAD_VAR_tailscale_auth_este: '${{ secrets.NOMAD_VAR_tailscale_auth_este }}' # Corrected case
        NOMAD_VAR_oauth_client_id: '${{ secrets.NOMAD_VAR_oauth_client_id }}' # Corrected case
        NOMAD_VAR_oauth_client_secret: '${{ secrets.NOMAD_VAR_oauth_client_secret }}' # Corrected case
        NOMAD_VAR_oauth_secret: '${{ secrets.NOMAD_VAR_oauth_secret }}' # Corrected case
        NOMAD_VAR_oauth_emails: '${{ secrets.NOMAD_VAR_oauth_emails }}' # Corrected case
        NOMAD_VAR_ssh_id: '${{ secrets.NOMAD_VAR_ssh_id }}' # Corrected case
        NOMAD_VAR_truenas_api_key: '${{ secrets.NOMAD_VAR_truenas_api_key }}' # Corrected case
        NOMAD_VAR_gh_access_token: '${{ secrets.NOMAD_VAR_gh_access_token }}' # Corrected case
        NOMAD_VAR_ollama_data_dir: '/home/shared/ollama'
        NOMAD_VAR_ollama_base_url: 'http://ollama.service.consul:11434'
        NOMAD_VAR_webui_secret_key: '${{ secrets.NOMAD_VAR_webui_secret_key }}' # Corrected case
        NOMAD_VAR_datacenter: 'dc1'
        NOMAD_VAR_dns_server_ip: '192.168.50.2'
        # Added missing variables
        NOMAD_VAR_aws_access_key: ${{ secrets.NOMAD_VAR_aws_access_key }}
        NOMAD_VAR_aws_secret_key: ${{ secrets.NOMAD_VAR_aws_secret_key }}
        NOMAD_VAR_bedrock_aws_region: ${{ secrets.NOMAD_VAR_bedrock_aws_region }}
        NOMAD_VAR_gcp_dns_admin: ${{ secrets.NOMAD_VAR_gcp_dns_admin }}
        NOMAD_VAR_gemini_api_key: ${{ secrets.NOMAD_VAR_gemini_api_key }}
        NOMAD_VAR_litellm_master_key: ${{ secrets.NOMAD_VAR_litellm_master_key }}
        NOMAD_VAR_manyfold_secret_key: ${{ secrets.NOMAD_VAR_manyfold_secret_key }}
        NOMAD_VAR_postgres_pass: ${{ secrets.NOMAD_VAR_postgres_pass }}
        NOMAD_VAR_truenas_iscsi_pass: ${{ secrets.NOMAD_VAR_truenas_iscsi_pass }}
        # Added gcp_project_id
        NOMAD_VAR_gcp_project_id: ${{ secrets.NOMAD_VAR_gcp_project_id }}
        # GitHub PAT is now stored securely in secrets
        NOMAD_VAR_truenass_iscsi_pass: ${{ secrets.NOMAD_VAR_truenass_iscsi_pass }} # Note potential typo in name
        NOMAD_VAR_dns_zone: ${{ secrets.NOMAD_VAR_dns_zone }}
        NOMAD_VAR_ingress_ip: ${{ secrets.NOMAD_VAR_ingress_ip }}
        NOMAD_VAR_radbot_credential_key: ${{ secrets.NOMAD_VAR_radbot_credential_key }}
        NOMAD_VAR_radbot_admin_token: ${{ secrets.NOMAD_VAR_radbot_admin_token }}
        NOMAD_VAR_radbot_mcp_token: ${{ secrets.NOMAD_VAR_radbot_mcp_token }}
        NOMAD_VAR_mullvad_wireguard_key: ${{ secrets.NOMAD_VAR_mullvad_wireguard_key }}
        NOMAD_VAR_mullvad_wireguard_addr: ${{ secrets.NOMAD_VAR_mullvad_wireguard_addr }}
        NOMAD_VAR_sonarr_api_key: ${{ secrets.NOMAD_VAR_sonarr_api_key }}
        NOMAD_VAR_radarr_api_key: ${{ secrets.NOMAD_VAR_radarr_api_key }}
        NOMAD_VAR_curseforge_api_key: ${{ secrets.NOMAD_VAR_curseforge_api_key }}
        NOMAD_VAR_pgvector_pass: ${{ secrets.NOMAD_VAR_pgvector_pass }}
        NOMAD_VAR_pgvector_admin_password: ${{ secrets.NOMAD_VAR_pgvector_admin_password }}
        NOMAD_VAR_postgres_admin_password: ${{ secrets.NOMAD_VAR_postgres_admin_password }}
        NOMAD_VAR_litellm_crawl4ai_key: ${{ secrets.NOMAD_VAR_litellm_crawl4ai_key }}
        NOMAD_VAR_litellm_salt_key: ${{ secrets.NOMAD_VAR_litellm_salt_key }}
        NOMAD_VAR_wazuh_api_password: ${{ secrets.NOMAD_VAR_wazuh_api_password }}
        NOMAD_VAR_wazuh_dashboard_password: ${{ secrets.NOMAD_VAR_wazuh_dashboard_password }}
        NOMAD_VAR_wazuh_indexer_password: ${{ secrets.NOMAD_VAR_wazuh_indexer_password }}
        NOMAD_VAR_otr_pass: ${{ secrets.NOMAD_VAR_otr_pass }}
        NOMAD_VAR_plex_token: ${{ secrets.NOMAD_VAR_plex_token }}
        NOMAD_VAR_listenbrainz_token: ${{ secrets.NOMAD_VAR_listenbrainz_token }}
        NOMAD_VAR_listenbrainz_username: ${{ secrets.NOMAD_VAR_listenbrainz_username }}
        NOMAD_VAR_lastfm_api_key: ${{ secrets.NOMAD_VAR_lastfm_api_key }}
        NOMAD_VAR_lastfm_api_secret: ${{ secrets.NOMAD_VAR_lastfm_api_secret }}
        NOMAD_VAR_lidarr_api_key: ${{ secrets.NOMAD_VAR_lidarr_api_key }}
        NOMAD_VAR_kideo_jwt_secret: ${{ secrets.NOMAD_VAR_kideo_jwt_secret }}
        NOMAD_VAR_kideo_youtube_cookies: ${{ secrets.NOMAD_VAR_kideo_youtube_cookies }}
        NOMAD_VAR_kideo_curiositystream_user: ${{ secrets.NOMAD_VAR_kideo_curiositystream_user }}
        NOMAD_VAR_kideo_curiositystream_pass: ${{ secrets.NOMAD_VAR_kideo_curiositystream_pass }}
        NOMAD_VAR_minecraftmath_jwt_secret: ${{ secrets.NOMAD_VAR_minecraftmath_jwt_secret }}


================================================
FILE: .github/workflows/update-kideo.yaml
================================================
name: Update kideo image tag

on:
  repository_dispatch:
    types: [update-kideo]

jobs:
  update-and-deploy:
    runs-on: ubuntu-latest
    steps:
      - name: Checkout
        uses: actions/checkout@v6
        with:
          token: ${{ secrets.ACTIONS_PAT }}

      - name: Update image tag in Nomad job
        run: |
          TAG="${{ github.event.client_payload.tag }}"
          sed -i "s|ghcr.io/perrymanuk/kideo:[^ \"]*|ghcr.io/perrymanuk/kideo:${TAG}|" \
            nomad_jobs/web-apps/kideo/nomad.job
          echo "Updated kideo image tag to ${TAG}"

      - name: Commit and push
        run: |
          git config user.name "github-actions[bot]"
          git config user.email "github-actions[bot]@users.noreply.github.com"
          TAG="${{ github.event.client_payload.tag }}"
          git add nomad_jobs/web-apps/kideo/nomad.job
          git commit -m "chore: bump kideo to ${TAG}"
          git push


================================================
FILE: .github/workflows/update-minecraftmath.yaml
================================================
name: Update minecraftmath image tag

on:
  repository_dispatch:
    types: [update-minecraftmath]

jobs:
  update-and-deploy:
    runs-on: ubuntu-latest
    steps:
      - name: Checkout
        uses: actions/checkout@v6
        with:
          token: ${{ secrets.ACTIONS_PAT }}

      - name: Update image tag in Nomad job
        run: |
          TAG="${{ github.event.client_payload.tag }}"
          sed -i "s|ghcr.io/perrymanuk/minecraftmath:[^ \"]*|ghcr.io/perrymanuk/minecraftmath:${TAG}|" \
            nomad_jobs/web-apps/minecraftmath/nomad.job
          echo "Updated minecraftmath image tag to ${TAG}"

      - name: Commit and push
        run: |
          git config user.name "github-actions[bot]"
          git config user.email "github-actions[bot]@users.noreply.github.com"
          TAG="${{ github.event.client_payload.tag }}"
          git add nomad_jobs/web-apps/minecraftmath/nomad.job
          git commit -m "chore: bump minecraftmath to ${TAG}"
          git push


================================================
FILE: .github/workflows/update-radbot-dev.yaml
================================================
name: Update radbot-dev image tag

on:
  repository_dispatch:
    types: [update-radbot-dev]

jobs:
  update-and-deploy:
    runs-on: ubuntu-latest
    steps:
      - name: Checkout
        uses: actions/checkout@v6
        with:
          token: ${{ secrets.ACTIONS_PAT }}

      - name: Update image tag in dev Nomad job
        run: |
          TAG="${{ github.event.client_payload.tag }}"
          sed -i "s|ghcr.io/perrymanuk/radbot:[^ \"]*|ghcr.io/perrymanuk/radbot:${TAG}|" \
            nomad_jobs/ai-ml/radbot/nomad-dev.job
          echo "Updated radbot-dev image tag to ${TAG}"

      - name: Commit and push
        run: |
          git config user.name "github-actions[bot]"
          git config user.email "github-actions[bot]@users.noreply.github.com"
          TAG="${{ github.event.client_payload.tag }}"
          git add nomad_jobs/ai-ml/radbot/nomad-dev.job
          git commit -m "chore: deploy radbot-dev with ${TAG}"
          git push


================================================
FILE: .github/workflows/update-radbot.yaml
================================================
name: Update radbot image tag

on:
  repository_dispatch:
    types: [update-radbot]

jobs:
  update-and-deploy:
    runs-on: ubuntu-latest
    steps:
      - name: Checkout
        uses: actions/checkout@v6
        with:
          token: ${{ secrets.ACTIONS_PAT }}

      - name: Update image tag in Nomad job
        run: |
          TAG="${{ github.event.client_payload.tag }}"
          sed -i "s|ghcr.io/perrymanuk/radbot:[^ \"]*|ghcr.io/perrymanuk/radbot:${TAG}|" \
            nomad_jobs/ai-ml/radbot/nomad.job
          echo "Updated radbot image tag to ${TAG}"

      - name: Commit and push
        run: |
          git config user.name "github-actions[bot]"
          git config user.email "github-actions[bot]@users.noreply.github.com"
          TAG="${{ github.event.client_payload.tag }}"
          git add nomad_jobs/ai-ml/radbot/nomad.job
          git commit -m "chore: bump radbot to ${TAG}"
          git push


================================================
FILE: .gitignore
================================================
.envrc
.env
*-pub
.passwords
.envrc*
vault/secrets.yaml
vault/*.hcl
www/main.jpg
ssl
levant/*
!levant/defaults.yml
hosts
*.swp
.ra-aid
CLAUDE.md
scripts/*


================================================
FILE: LICENSE
================================================
                                 Apache License
                           Version 2.0, January 2004
                        http://www.apache.org/licenses/

   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION

   1. Definitions.

      "License" shall mean the terms and conditions for use, reproduction,
      and distribution as defined by Sections 1 through 9 of this document.

      "Licensor" shall mean the copyright owner or entity authorized by
      the copyright owner that is granting the License.

      "Legal Entity" shall mean the union of the acting entity and all
      other entities that control, are controlled by, or are under common
      control with that entity. For the purposes of this definition,
      "control" means (i) the power, direct or indirect, to cause the
      direction or management of such entity, whether by contract or
      otherwise, or (ii) ownership of fifty percent (50%) or more of the
      outstanding shares, or (iii) beneficial ownership of such entity.

      "You" (or "Your") shall mean an individual or Legal Entity
      exercising permissions granted by this License.

      "Source" form shall mean the preferred form for making modifications,
      including but not limited to software source code, documentation
      source, and configuration files.

      "Object" form shall mean any form resulting from mechanical
      transformation or translation of a Source form, including but
      not limited to compiled object code, generated documentation,
      and conversions to other media types.

      "Work" shall mean the work of authorship, whether in Source or
      Object form, made available under the License, as indicated by a
      copyright notice that is included in or attached to the work
      (an example is provided in the Appendix below).

      "Derivative Works" shall mean any work, whether in Source or Object
      form, that is based on (or derived from) the Work and for which the
      editorial revisions, annotations, elaborations, or other modifications
      represent, as a whole, an original work of authorship. For the purposes
      of this License, Derivative Works shall not include works that remain
      separable from, or merely link (or bind by name) to the interfaces of,
      the Work and Derivative Works thereof.

      "Contribution" shall mean any work of authorship, including
      the original version of the Work and any modifications or additions
      to that Work or Derivative Works thereof, that is intentionally
      submitted to Licensor for inclusion in the Work by the copyright owner
      or by an individual or Legal Entity authorized to submit on behalf of
      the copyright owner. For the purposes of this definition, "submitted"
      means any form of electronic, verbal, or written communication sent
      to the Licensor or its representatives, including but not limited to
      communication on electronic mailing lists, source code control systems,
      and issue tracking systems that are managed by, or on behalf of, the
      Licensor for the purpose of discussing and improving the Work, but
      excluding communication that is conspicuously marked or otherwise
      designated in writing by the copyright owner as "Not a Contribution."

      "Contributor" shall mean Licensor and any individual or Legal Entity
      on behalf of whom a Contribution has been received by Licensor and
      subsequently incorporated within the Work.

   2. Grant of Copyright License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      copyright license to reproduce, prepare Derivative Works of,
      publicly display, publicly perform, sublicense, and distribute the
      Work and such Derivative Works in Source or Object form.

   3. Grant of Patent License. Subject to the terms and conditions of
      this License, each Contributor hereby grants to You a perpetual,
      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
      (except as stated in this section) patent license to make, have made,
      use, offer to sell, sell, import, and otherwise transfer the Work,
      where such license applies only to those patent claims licensable
      by such Contributor that are necessarily infringed by their
      Contribution(s) alone or by combination of their Contribution(s)
      with the Work to which such Contribution(s) was submitted. If You
      institute patent litigation against any entity (including a
      cross-claim or counterclaim in a lawsuit) alleging that the Work
      or a Contribution incorporated within the Work constitutes direct
      or contributory patent infringement, then any patent licenses
      granted to You under this License for that Work shall terminate
      as of the date such litigation is filed.

   4. Redistribution. You may reproduce and distribute copies of the
      Work or Derivative Works thereof in any medium, with or without
      modifications, and in Source or Object form, provided that You
      meet the following conditions:

      (a) You must give any other recipients of the Work or
          Derivative Works a copy of this License; and

      (b) You must cause any modified files to carry prominent notices
          stating that You changed the files; and

      (c) You must retain, in the Source form of any Derivative Works
          that You distribute, all copyright, patent, trademark, and
          attribution notices from the Source form of the Work,
          excluding those notices that do not pertain to any part of
          the Derivative Works; and

      (d) If the Work includes a "NOTICE" text file as part of its
          distribution, then any Derivative Works that You distribute must
          include a readable copy of the attribution notices contained
          within such NOTICE file, excluding those notices that do not
          pertain to any part of the Derivative Works, in at least one
          of the following places: within a NOTICE text file distributed
          as part of the Derivative Works; within the Source form or
          documentation, if provided along with the Derivative Works; or,
          within a display generated by the Derivative Works, if and
          wherever such third-party notices normally appear. The contents
          of the NOTICE file are for informational purposes only and
          do not modify the License. You may add Your own attribution
          notices within Derivative Works that You distribute, alongside
          or as an addendum to the NOTICE text from the Work, provided
          that such additional attribution notices cannot be construed
          as modifying the License.

      You may add Your own copyright statement to Your modifications and
      may provide additional or different license terms and conditions
      for use, reproduction, or distribution of Your modifications, or
      for any such Derivative Works as a whole, provided Your use,
      reproduction, and distribution of the Work otherwise complies with
      the conditions stated in this License.

   5. Submission of Contributions. Unless You explicitly state otherwise,
      any Contribution intentionally submitted for inclusion in the Work
      by You to the Licensor shall be under the terms and conditions of
      this License, without any additional terms or conditions.
      Notwithstanding the above, nothing herein shall supersede or modify
      the terms of any separate license agreement you may have executed
      with Licensor regarding such Contributions.

   6. Trademarks. This License does not grant permission to use the trade
      names, trademarks, service marks, or product names of the Licensor,
      except as required for reasonable and customary use in describing the
      origin of the Work and reproducing the content of the NOTICE file.

   7. Disclaimer of Warranty. Unless required by applicable law or
      agreed to in writing, Licensor provides the Work (and each
      Contributor provides its Contributions) on an "AS IS" BASIS,
      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
      implied, including, without limitation, any warranties or conditions
      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
      PARTICULAR PURPOSE. You are solely responsible for determining the
      appropriateness of using or redistributing the Work and assume any
      risks associated with Your exercise of permissions under this License.

   8. Limitation of Liability. In no event and under no legal theory,
      whether in tort (including negligence), contract, or otherwise,
      unless required by applicable law (such as deliberate and grossly
      negligent acts) or agreed to in writing, shall any Contributor be
      liable to You for damages, including any direct, indirect, special,
      incidental, or consequential damages of any character arising as a
      result of this License or out of the use or inability to use the
      Work (including but not limited to damages for loss of goodwill,
      work stoppage, computer failure or malfunction, or any and all
      other commercial damages or losses), even if such Contributor
      has been advised of the possibility of such damages.

   9. Accepting Warranty or Additional Liability. While redistributing
      the Work or Derivative Works thereof, You may choose to offer,
      and charge a fee for, acceptance of support, warranty, indemnity,
      or other liability obligations and/or rights consistent with this
      License. However, in accepting such obligations, You may act only
      on Your own behalf and on Your sole responsibility, not on behalf
      of any other Contributor, and only if You agree to indemnify,
      defend, and hold each Contributor harmless for any liability
      incurred by, or claims asserted against, such Contributor by reason
      of your accepting any such warranty or additional liability.

   END OF TERMS AND CONDITIONS

   APPENDIX: How to apply the Apache License to your work.

      To apply the Apache License to your work, attach the following
      boilerplate notice, with the fields enclosed by brackets "[]"
      replaced with your own identifying information. (Don't include
      the brackets!)  The text should be enclosed in the appropriate
      comment syntax for the file format. We also recommend that a
      file or class name and description of purpose be included on the
      same "printed page" as the copyright notice for easier
      identification within third-party archives.

   Copyright [yyyy] [name of copyright owner]

   Licensed under the Apache License, Version 2.0 (the "License");
   you may not use this file except in compliance with the License.
   You may obtain a copy of the License at

       http://www.apache.org/licenses/LICENSE-2.0

   Unless required by applicable law or agreed to in writing, software
   distributed under the License is distributed on an "AS IS" BASIS,
   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   See the License for the specific language governing permissions and
   limitations under the License.


================================================
FILE: Makefile
================================================
# Load .env files
#include .envrc

include ./.bootstrap.mk

# Define base deployments using their service names
base_deployments = coredns docker-registry haproxy

#help: # Placeholder for potential future help generation

# Find the nomad job file for a given service name ($1) within nomad_jobs/ structure
# Usage: $(call find_job_file, service_name)
# Example: $(call find_job_file, coredns) -> nomad_jobs/core-infra/coredns/coredns.job (or .nomad)
find_job_file = $(shell find nomad_jobs/ -mindepth 2 -maxdepth 3 -type f \( -name '$1.job' -o -name '$1.nomad' \) -print -quit)

.PHONY: dc1-%
dc1-%: ## Deploy specific job to dc1 (searches within nomad_jobs/ structure)
	@JOB_FILE=$(call find_job_file,$*); \
	if [ -z "$$JOB_FILE" ]; then \
		echo "Error: Could not find nomad job file for '$*' in nomad_jobs/."; \
		exit 1; \
	fi; \
	echo "Found job file: $$JOB_FILE"; \
	nomad job run -var datacenters='["dc1"]' $$JOB_FILE

.PHONY: all-%
all-%: ## Deploy specific job to all DCs (searches within nomad_jobs/ structure)
	@JOB_FILE=$(call find_job_file,$*); \
	if [ -z "$$JOB_FILE" ]; then \
		echo "Error: Could not find nomad job file for '$*' in nomad_jobs/."; \
		exit 1; \
	fi; \
	echo "Found job file: $$JOB_FILE"; \
	nomad job run -var datacenters='["dc1", "hetzner"]' $$JOB_FILE

.PHONY: deploy-%
deploy-%: ## Deploy specific job (searches within nomad_jobs/ structure)
	@JOB_FILE=$(call find_job_file,$*); \
	if [ -z "$$JOB_FILE" ]; then \
		echo "Error: Could not find nomad job file for '$*' in nomad_jobs/."; \
		exit 1; \
	fi; \
	echo "Found job file: $$JOB_FILE"; \
	nomad job run $$JOB_FILE

.PHONY: deploy-base
deploy-base: ## Deploys base jobs (coredns, docker-registry, haproxy) to dc1
	@echo "Deploying base services to dc1: $(base_deployments)"
	$(foreach var,$(base_deployments), \
	    @JOB_FILE=$$(call find_job_file,$(var)); \
	    if [ -z "$$JOB_FILE" ]; then \
	        echo "Error: Could not find nomad job file for base deployment '$(var)' in nomad_jobs/."; \
	        exit 1; \
	    fi; \
	    echo "Deploying $(var) from $$JOB_FILE..."; \
	    nomad job run -var datacenters='["dc1"]' $$JOB_FILE; \
	)

.PHONY: sslkeys
sslkeys: ## Generate certs if you have SSL enabled
	consul-template -config ssl/consul-template.hcl -once -vault-renew-token=false

.PHONY: ssl-browser-cert
ssl-browser-cert: ## Generate browser cert if you have SSL enabled
	sudo openssl pkcs12 -export -out browser_cert.p12 -inkey ssl/hetzner/server-key.pem -in ssl/hetzner/server.pem -certfile ssl/hetzner/nomad-ca.pem

.PHONY: sync-github-secrets
sync-github-secrets: ## Sync NOMAD_VAR variables from .envrc to GitHub secrets using gh CLI
	@echo "Syncing NOMAD_VAR variables from .envrc to GitHub secrets..."
	@bash -c 'source .envrc && env | grep "^NOMAD_VAR_" | while read -r line; do \
		name="$${line%%=*}"; \
		value="$${line#*=}"; \
		echo "Setting $$name"; \
		printf "%s" "$$value" | gh secret set "$$name"; \
	done'
	@echo "✅ All NOMAD_VAR secrets synced to GitHub"

.PHONY: build-update-metadata
build-update-metadata: ## Build the update-metadata Docker image
	@echo "Building update-metadata Docker image..."
	# Assumes update-metadata is in docker_images/update-metadata/
	docker build --platform linux/amd64 -t update-metadata:latest docker_images/update-metadata/

.PHONY: build-gcp-dns-updater
build-gcp-dns-updater: ## Build the gcp-dns-updater Docker image
	@echo "Building gcp-dns-updater Docker image..."
	# Assumes gcp-dns-updater is in docker_images/gcp-dns-updater/
	docker build --platform linux/amd64 -t docker.$$NOMAD_VAR_tld/gcp-dns-updater:latest docker_images/gcp-dns-updater/

# Example deployment target for gcp-dns-updater (if needed, uncomment and adjust)
#.PHONY: deploy-gcp-dns-updater
#deploy-gcp-dns-updater: ## Deploy gcp-dns-updater job using generic target
#	$(MAKE) deploy-gcp-dns-updater


================================================
FILE: README.md
================================================
# Hashi-Homelab
<p align="center">
<img width="250" src="homelab.png" />
</p>

### UPDATE - September 2nd 2025

This repo has gone through some major changes since the last update. I've completely reorganized the job structure into 10 clean categories (77 services total now!), added a comprehensive AI/ML stack with Ollama and Open-WebUI, enhanced the monitoring with Loki and Vector for log aggregation, modernized the alertmanager with better persistence and pushover notifications, added weekly docker cleanup automation, redesigned CoreDNS and Traefik for proper HA deployment, and implemented comprehensive Nomad allocation monitoring. The GitHub Actions deployment has been refined with better change detection and the whole thing just runs much more smoothly now. Also added a bunch of new services like smart home integration, personal cloud apps, and storage backends including pgvector for AI workloads, plus a few other bits and bobs that make the whole setup more robust.

### Background

The hashi-homelab was born of a desire to have a simple to maintain but very flexible homelab setup. While designed to work as a cohesive whole, each individual job can be taken and deployed on any Nomad cluster with minimal adjustments - they're built to be portable and self-contained.

The main goals were to keep the resources required to run the base lab setup small and to have all of the parts be easily exchangeable.  

`make deploy-base` will deploy coredns, docker-registry and haproxy - these are needed for everything else to work but aside from these you can pick and choose what to deploy with `make deploy-SERVICE_NAME` to deploy any of the 77 services organized across 10 categories. `make deploy-prometheus` or `make deploy-ollama` for example. You can also target specific datacenters with `make dc1-traefik` or `make all-postgres`.

The whole thing is organized much better now with services grouped into logical categories like ai-ml, media-stack, smart-home, observability, etc. Makes it way easier to find what you're looking for and deploy related services together.

In the future I would like to provide a ready to boot image for a raspberry pi where you can run all of this as the resources needed are really minimal. With just the basics you can get away with one pi4 4gb model with plenty of room to spare.

### Core Components:

* **Scheduler**: Nomad *...with proper allocation monitoring now*
* **Service Catalog/Registry**: Consul  
* **Service Mesh**: Traefik *...redesigned for HA deployment, much more robust*
* **VPN**: Tailscale *...can't say enough good things about tailscale, its integral for my homelab now*
* **DNS**: CoreDNS *...now with HA setup and proper failover*
* **Keepalived**: Assign a floating IP for DNS to not lose it if a node goes down
* **Monitoring**: Prometheus, Alertmanager, Telegraf, Blackbox-exporter, and Grafana *...plus Loki and Vector for log aggregation*  
* **Container Registry**: Docker-Registry *...because sometimes you don't want to rely on Docker Hub being up*  
* **AI/ML**: Ollama for local LLM serving, Open-WebUI for chat interface, LiteLLM for API compatibility
* **Vector Database**: PostgreSQL with pgvector extension for AI/ML vector embeddings storage and similarity search
* **Storage**: NFS and iSCSI CSI plugins for persistent storage across the cluster

### Service Categories (77 total):

* **ai-ml** (8): ollama, open-webui, litellm, cognee, crawl4ai, manyfold, paperless-ai, pgvector-client
* **core-infra** (13): coredns, traefik, haproxy, keepalived, tailscale, github-runner, csi plugins, etc.
* **media-stack** (16): plex, sonarr, radarr, lidarr, sabnzbd, qbittorrent, overseerr, navidrome, etc.
* **personal-cloud** (4): nextcloud, bitwarden, paperless, radicale
* **smart-home** (5): home-assistant, deconz, zigbee2mqtt, mqtt, owntracks-recorder  
* **observability** (7): prometheus, grafana, alertmanager, loki, vector, telegraf, blackbox-exporter
* **storage-backends** (9): postgres, pgvector, redis, mariadb, neo4j, qdrant, docker-registry, etc.
* **web-apps** (5): heimdall, wordpress, firecrawl, alertmanager-dashboard, www
* **misc** (7): gitea, uploader, murmur, octoprint, adb, linuxgsm, gcp-dns-updater
* **system** (3): docker-cleanup, volumes

### Setup

You need to have Nomad and Consul already running, a simple setup with the -dev flag will suffice for testing but you'll want a proper cluster for real usage. If don't already have a Nomad and Consul cluster, there are some excellent guides here...  
https://www.nomadproject.io/guides/install/production/deployment-guide.html  
https://learn.hashicorp.com/consul/datacenter-deploy/deployment-guide  

There are also some files in the `config` folder to help you get started and also one with some services to announce so the Consul and Nomad UI are available over the service mesh.

This repo relies on a `.envrc` file and direnv installed or setting the environment variables manually.
There is an `envrc` example file located in the repo that you can fill in and move to `.envrc`


The secret values from the `.envrc` also need to be put into your github secrets if you plan on deploying via the automated workflow. You can use `make sync-github-secrets` to sync them all at once which is pretty handy.

Once this is done, you simply run a `make deploy-base` and point your DNS to resolve via one of the Nomad nodes' IP address.  

One of the more specific parts of the setup that you may need to adjust is I use several NFS mounts to provide persistent storage mounted on each client at `/home/shared` for configs and `/home/media` for images, video, audio, etc. Depending on which parts of this you are planning to deploy you will just need to adjust this persistent storage to meet the setup of your clients. The CSI plugins help make this more flexible now.

Services are exposed by their task name in the nomad job and whatever you configure your TLD to be in the `.envrc`. The whole thing works really well with the automated GitHub Actions deployment now - just push changes and they get deployed automatically to your cluster. This requires tailscale for the GitHub Actions to connect to your cluster.


================================================
FILE: ansible/configs/consul.hcl.j2
================================================
#jinja2: trim_blocks:False
server = {% if "lan-client-server" in group_names %}true{% else %}false{% endif %}
ui = {% if "lan-client-server" in group_names %}true{% else %}false{% endif %}
{% if "wan-clients" in group_names %}
{% raw %}
client_addr = "{{GetInterfaceIP \"tailscale0\"}}"
advertise_addr = "{{GetInterfaceIP \"tailscale0\"}}"
bind_addr = "{{GetInterfaceIP \"tailscale0\"}}"
{% endraw %}
{% else %}
{% raw %}
client_addr = "0.0.0.0"
advertise_addr = "{{ GetPrivateInterfaces | include \"network\" \"192.168.50.0/24\" | attr \"address\" }}"
bind_addr = "0.0.0.0"
{% endraw %}
{% endif %}
{% raw %}
advertise_addr_wan = "{{ GetPrivateInterfaces | include \"network\" \"192.168.50.0/24\" | attr \"address\" }}"
{% endraw %}
translate_wan_addrs = true
data_dir = "/var/lib/consul"
datacenter = "homelab"
enable_syslog = true
leave_on_terminate = true
log_level = "WARN"
retry_join = ["192.168.50.39", "192.168.50.113", "192.168.50.85"]
{% if "lan-client-server" in group_names %}bootstrap_expect = 3{% else %}{% endif %}
telemetry {
  prometheus_retention_time = "60s"
}


================================================
FILE: ansible/configs/consul.service
================================================
[Unit]
Description=consul agent
Requires=network-online.target tailscaled.service
After=network-online.target tailscaled.service

[Service]
ExecStartPre=/bin/sleep 30
EnvironmentFile=-/etc/default/consul
Restart=always
ExecStart=/usr/bin/consul agent -domain consul -ui -config-dir=/etc/consul.d
ExecReload=/bin/kill -HUP $MAINPID
KillSignal=SIGINT
[Install]
WantedBy=multi-user.target


================================================
FILE: ansible/configs/docker-daemon.json.j2
================================================
{
  "dns": ["192.168.50.2", "192.168.50.1", "8.8.8.8"]{% if 'cheese' in group_names %},
  "runtimes": {
    "nvidia": {
      "args": [],
      "path": "nvidia-container-runtime"
    }
  }
{% endif %}
}


================================================
FILE: ansible/configs/nomad.hcl.j2
================================================
#jinja2: trim_blocks:False
data_dir = "/var/lib/nomad/"
datacenter = {% if "cheese" in group_names %}"cheese"{% elif "minecraft" in group_names %}"minecraft"{% else %}"dc1"{% endif %}
log_level = "warn"
bind_addr = "0.0.0.0"
region = "home"

server {
  enabled          = {% if "lan-client-server" in group_names %}true{% else %}false{% endif %}
  bootstrap_expect = 3
  server_join {
    retry_join     = ["192.168.50.39", "192.168.50.113", "192.168.50.85"]
    retry_max      = 3
    retry_interval = "15s"
  }
  authoritative_region  = "home"
  heartbeat_grace = "300s"
  min_heartbeat_ttl = "20s"
}

client {
  enabled = true
{% raw %}
  network_interface = "{{ GetPrivateInterfaces | include \"network\" \"192.168.50.0/24\" | attr \"name\" }}"
{% endraw %}
  options {
    docker.auth.config = "/root/.docker/config.json"
    docker.privileged.enabled = true
    driver.raw_exec.enable = "1"
    docker.volumes.enabled = true
  }

  meta {
    shared_mount = {% if "wan-clients" in group_names %}"false"{% else %}"true"{% endif %}
    dns = {% if "wan-clients" in group_names %}"false"{% else %}"true"{% endif %}
    {%- if ansible_hostname == "klo01" %}
    keepalived_priority = "100"
    keepalived_priority_dns1 = "100"
    keepalived_priority_dns2 = "{{ 200 | random(start=101) }}"
    {%- else %}
    keepalived_priority = "{{ 200 | random(start=101) }}"
    keepalived_priority_dns1 = "{{ 200 | random(start=101) }}"
    keepalived_priority_dns2 = "{{ 200 | random(start=101) }}"
    {%- endif %}
  }

  host_network "lan" {
    cidr = "192.168.50.0/24"
    reserved_ports = "22"
  }

  host_network "tailscale" {
    cidr = "100.0.0.0/8"
    reserved_ports = "22"
  }

  {% if "wan-clients" in group_names %}
  host_network "public" {
    cidr = "78.47.90.68/32"
    reserved_ports = "22"
  }
  {%- endif %}

  {%- if ansible_hostname == "klo01" %}
  reserved {
    memory = 3072
  }
  {%- endif %}

}

telemetry {
  disable_hostname = true
  prometheus_metrics = true
  publish_allocation_metrics = true
  publish_node_metrics = true
  use_node_name = false
}
{% raw %}
advertise {
  http = "{{ GetPrivateInterfaces | include \"network\" \"192.168.50.0/24\" | attr \"address\" }}:4646"
  rpc = "{{ GetPrivateInterfaces | include \"network\" \"192.168.50.0/24\" | attr \"address\" }}:4647"
  serf = "{{ GetPrivateInterfaces | include \"network\" \"192.168.50.0/24\" | attr \"address\" }}:4648"
}
{% endraw %}
consul {
  # The address to the Consul agent.
  {%- raw %}
  address = "127.0.0.1:8500"
  {%- endraw %}
  # The service name to register the server and client with Consul.

  client_service_name = "nomad-client"

  # Enables automatically registering the services.
  auto_advertise = true

  # Enabling the server and client to bootstrap using Consul.
  server_auto_join = true
  client_auto_join = true
}

#vault {
#  enabled = true
#  address = "http://vault.service.home:8200"
#  allow_unauthenticated = true
#  create_from_role = "nomad-cluster"
#}

plugin "docker" {
  config {
    allow_caps = ["CHOWN","DAC_OVERRIDE","FSETID","FOWNER","MKNOD","NET_RAW","SETGID","SETUID","SETFCAP","SETPCAP","NET_BIND_SERVICE","SYS_CHROOT","KILL","AUDIT_WRITE","NET_ADMIN","NET_BROADCAST","SYS_NICE"]
    # extra Docker labels to be set by Nomad on each Docker container with the appropriate value
    extra_labels = ["job_name", "task_group_name", "task_name", "namespace", "node_name"]
    allow_privileged = true
    volumes {
      enabled      = true
      selinuxlabel = "z"
    }
  }
}


================================================
FILE: ansible/configs/nomad.service
================================================
[Unit]
Description=nomad.agent
Requires=network-online.target tailscaled.service
After=network-online.target tailscaled.service remote-fs.target
# Hard requirement: Nomad must not start until NFS mounts are ready
RequiresMountsFor=/home/shared /home/media/TV /home/media/Music /home/media/Movies /home/media/Books

[Service]
EnvironmentFile=-/etc/default/nomad
Restart=on-failure
RestartSec=10
ExecStart=/usr/bin/nomad agent $OPTIONS -config=/etc/nomad.d/nomad.hcl
ExecReload=/bin/kill -HUP $MAINPID
KillSignal=SIGINT
KillMode=process

[Install]
WantedBy=multi-user.target


================================================
FILE: ansible/playbook.yml
================================================
---
- name: network mounts
  hosts:
    - lan-client-server
    - lan-client
    - cheese
    - minecraft
  become: true
  remote_user: root
  tasks:
    - name: Configure static IP via netplan
      copy:
        dest: /etc/netplan/00-installer-config.yaml
        content: |
          network:
            version: 2
            ethernets:
              ens3:
                addresses:
                  - {{ inventory_hostname }}/24
                routes:
                  - to: default
                    via: 192.168.50.1
                nameservers:
                  addresses:
                    - 192.168.50.1
      notify: Apply netplan

    - name: Ensure directories exist
      file:
        path: "{{ item }}"
        state: directory
        mode: '0755'
      with_items:
        - /home/shared
        - /home/media/TV
        - /home/media/Music
        - /home/media/Movies
        - /home/media/Books

    - name: makesure multipath.conf exists
      copy:
        content: ""
        dest: /etc/multipath.conf
        force: no
        backup: yes
      ignore_errors: yes

    - name: Manage /etc/multipath.conf
      blockinfile:
        path: /etc/multipath.conf
        block: |
          defaults {
              user_friendly_names yes
              find_multipaths yes
          }

    - name: Install Apt packages
      apt:
        name:
          - nfs-common
          - avahi-daemon
          - docker.io
          - open-iscsi
          - lsscsi
          - sg3-utils
          - multipath-tools
          - scsitools

    - name: Ensure /etc/docker directory exists
      file:
        path: /etc/docker
        state: directory
        mode: '0755'

    - name: Add NVIDIA Container Toolkit GPG key
      apt_key:
        url: https://nvidia.github.io/libnvidia-container/gpgkey
        state: present
        keyring: /usr/share/keyrings/nvidia-container-toolkit-keyring.gpg
      when: "'cheese' in group_names"

    - name: Add NVIDIA Container Toolkit repository
      apt_repository:
        repo: "deb [signed-by=/usr/share/keyrings/nvidia-container-toolkit-keyring.gpg] https://nvidia.github.io/libnvidia-container/stable/deb/$(ARCH) /"
        state: present
        filename: nvidia-container-toolkit
      when: "'cheese' in group_names"

    - name: Install NVIDIA Container Toolkit
      apt:
        name: nvidia-container-toolkit
        state: present
        update_cache: yes
      when: "'cheese' in group_names"

    - name: Configure Docker daemon with fallback DNS and nvidia runtime
      template:
        src: configs/docker-daemon.json.j2
        dest: /etc/docker/daemon.json
      notify: Restart Docker

    - name: Remove old NFS fstab entries
      lineinfile:
        path: /etc/fstab
        regexp: '^192\.168\.50\.208:/mnt/.*'
        state: absent

    - name: Add NFS fstab entries with proper options
      blockinfile:
        path: /etc/fstab
        marker: "# {mark} ANSIBLE MANAGED NFS MOUNTS"
        block: |
          192.168.50.208:/mnt/pool0/share              /home/shared         nfs4    _netdev,hard,timeo=600,retrans=5,x-systemd.mount-timeout=90,x-systemd.requires=network-online.target,x-systemd.after=network-online.target  0  0
          192.168.50.208:/mnt/pool1/media/TV           /home/media/TV       nfs4    _netdev,hard,timeo=600,retrans=5,x-systemd.mount-timeout=90,x-systemd.requires=network-online.target,x-systemd.after=network-online.target  0  0
          192.168.50.208:/mnt/pool0/media/music        /home/media/Music    nfs4    _netdev,hard,timeo=600,retrans=5,x-systemd.mount-timeout=90,x-systemd.requires=network-online.target,x-systemd.after=network-online.target  0  0
          192.168.50.208:/mnt/pool1/media/Movies       /home/media/Movies   nfs4    _netdev,hard,timeo=600,retrans=5,x-systemd.mount-timeout=90,x-systemd.requires=network-online.target,x-systemd.after=network-online.target  0  0
          192.168.50.208:/mnt/pool0/media/audiobooks   /home/media/Books    nfs4    _netdev,hard,timeo=600,retrans=5,x-systemd.mount-timeout=90,x-systemd.requires=network-online.target,x-systemd.after=network-online.target  0  0
      notify:
        - Reload systemd fstab
        - Mount Filesystems

    - name: Enable services
      systemd:
        name: "{{ item }}"
        enabled: yes
        state: started
      with_items:
        - open-iscsi
        - multipath-tools

  handlers:
    - name: Apply netplan
      command: netplan apply

    - name: Reload systemd fstab
      systemd:
        daemon_reload: yes

    - name: Mount Filesystems
      command: mount -a

    - name: Restart Docker
      service:
        name: docker
        state: restarted

- name: Update configuration, execute command, and install packages
  hosts:
    - lan-client-server
    - lan-client
    - wan-clients
    - cheese
    - minecraft
  remote_user: root
  #roles:
  #  - role: artis3n.tailscale
  #    vars:
  #      # Example pulling the API key from the env vars on the host running Ansible
  #      tailscale_authkey: "{{ lookup('env', 'NOMAD_VAR_tailscale_auth') }}"
  #      tailscale_args: "{% if 'wan-clients' in group_names %}--accept-routes=true{% else %}--accept-routes=false{% endif %}"
  tasks:
    - name: Ensure directories exist
      file:
        path: "{{ item }}"
        state: directory
        mode: '0755'
      with_items:
        - /var/lib/nomad
        - /var/lib/consul
        - /etc/nomad.d
        - /etc/consul.d

    - name: Manage systemd service file nomad
      copy:
        src: configs/nomad.service
        dest: /lib/systemd/system/nomad.service
      notify: Reload systemd

    - name: Manage systemd service file consul
      copy:
        src: configs/consul.service
        dest: /lib/systemd/system/consul.service
      notify: Reload systemd

    - name: manage nomad config
      template:
        src: configs/nomad.hcl.j2
        dest: /etc/nomad.d/nomad.hcl
      notify: Restart Service

    - name: manage consul config
      template:
        src: configs/consul.hcl.j2
        dest: /etc/consul.d/server.hcl

    - name: Add HashiCorp APT repository key
      apt_key:
        url: https://apt.releases.hashicorp.com/gpg
        state: present
        validate_certs: no
        keyring: /usr/share/keyrings/hashicorp-archive-keyring.gpg

    - name: Configure HashiCorp APT repository
      apt_repository:
        repo: "deb [signed-by=/usr/share/keyrings/hashicorp-archive-keyring.gpg] https://apt.releases.hashicorp.com {{ ansible_distribution_release }} main"

    - name: Install Apt packages
      apt:
        name:
          - nomad=1.10.4-1
          - consul=1.19.1-1
        dpkg_options: 'force-confdef,force-confold'
        update_cache: true
        state: latest
        allow_downgrade: true

    - name: Modify sysctl entry for net.ipv4.ip_nonlocal_bind
      sysctl:
        name: "{{ item.name }}"
        value: "{{ item.value }}"
        state: present
      with_items:
        - { name: "net.ipv4.ip_nonlocal_bind", value: "1" }
        - { name: "net.ipv4.conf.all.forwarding", value: "1" }
      notify: Apply Sysctl Changes

    - name: Enable services
      systemd:
        name: "{{ item }}"
        enabled: yes
        state: started
      with_items:
        - nomad
        - consul
        - tailscaled

  handlers:
    - name: Restart Service
      service:
        name: nomad
        state: restarted

    - name: Reload systemd
      systemd:
        daemon_reload: yes

    - name: Mount Filesystems
      command: mount -a

    - name: Apply Sysctl Changes
      command: sysctl -p /etc/sysctl.conf

- name: Install and configure Tailscale
  hosts:
    - all
  become: yes
  remote_user: root
  gather_facts: yes
  tags: tailscale

  vars:
    # Read authkey from environment variable; default to 'MISSING' if not set
    tailscale_auth_key: "{{ lookup('env', 'NOMAD_VAR_tailscale_auth') | default('MISSING') }}"
    # Optionally customize your Tailscale hostname
    tailscale_hostname: "{{ inventory_hostname }}"
    # Tag to advertise (must match OAuth client tag)
    tailscale_tags: "tag:nomad"

  tasks:
    - name: Download Tailscale GPG key via curl
      shell: >
        curl -fsSL https://pkgs.tailscale.com/stable/ubuntu/noble.noarmor.gpg
        | tee /usr/share/keyrings/tailscale-archive-keyring.gpg
        >/dev/null
      changed_when: true

    - name: Update apt cache
      apt:
        update_cache: yes

    - name: Configure Tailscale apt repository
      copy:
        dest: /etc/apt/sources.list.d/tailscale.list
        content: |
          deb [signed-by=/usr/share/keyrings/tailscale-archive-keyring.gpg arch=amd64] https://pkgs.tailscale.com/stable/ubuntu/ noble main

    - name: Update apt cache (after adding Tailscale repo)
      apt:
        update_cache: yes

    - name: Install Tailscale
      apt:
        name: tailscale
        state: latest

    - name: Enable and start tailscaled service
      service:
        name: tailscaled
        state: started
        enabled: yes

    - name: Bring Tailscale interface up using authkey
      # "command" used because there's no official Ansible module for "tailscale up".
      # This is not strictly idempotent; see notes below for advanced usage.
      command: >
        tailscale up
        --authkey={{ tailscale_auth_key }}
        --hostname={{ tailscale_hostname }}
        --advertise-tags={{ tailscale_tags }}
        --accept-dns=false
        --reset
      register: tailscale_up
      changed_when: "'Success' in tailscale_up.stdout or 'Success' in tailscale_up.stderr or tailscale_up.rc == 0"

    - name: Show tailscale status
      command: tailscale status
      register: tailscale_status
      changed_when: false

    - debug:
        var: tailscale_status.stdout

- name: Install Zsh and Oh My Zsh with Agnoster theme
  hosts: all
  become: yes
  remote_user: root
  gather_facts: yes

  vars:
    my_zsh_user: "root"  # Change this to the desired user

  tasks:
    - name: Install zsh
      apt:
        name: zsh
        state: present
        update_cache: yes

    - name: Ensure home directory path is known
      user:
        name: "{{ my_zsh_user }}"
      register: user_info  # This captures the user details, including home directory.

    - name: Check if Oh My Zsh is already installed
      stat:
        path: "/root/.oh-my-zsh"
      register: oh_my_zsh_stat

    - name: Check if zshrc exists
      stat:
        path: "/root/.zshrc"
      register: zshrc_stat

    - name: Clone Oh My Zsh
      git:
        repo: "https://github.com/ohmyzsh/ohmyzsh.git"
        dest: "/root/.oh-my-zsh"
      become_user: "{{ my_zsh_user }}"
      when: not oh_my_zsh_stat.stat.exists

    - name: Copy the default .zshrc template if not present
      copy:
        src: "/root/.oh-my-zsh/templates/zshrc.zsh-template"
        dest: "/root/.zshrc"
        remote_src: yes
      become_user: "{{ my_zsh_user }}"
      when: not zshrc_stat.stat.exists

    - name: Set Oh My Zsh theme to agnoster
      # Uses a regex replace to ensure 'ZSH_THEME="agnoster"'
      replace:
        path: "/root/.zshrc"
        regexp: '^ZSH_THEME="[^"]+"'
        replace: 'ZSH_THEME="agnoster"'
      become_user: "{{ my_zsh_user }}"

    - name: Change default shell to zsh for the user
      user:
        name: "{{ my_zsh_user }}"
        shell: /usr/bin/zsh


================================================
FILE: ansible/zsh.yml
================================================
---
- name: Install Zsh and Oh My Zsh with Agnoster theme
  hosts: cheese
  become: yes
  remote_user: root
  gather_facts: yes

  vars:
    my_zsh_user: "root"  # Change this to the desired user

  tasks:
    - name: Install zsh
      apt:
        name: zsh
        state: present
        update_cache: yes

    - name: Ensure home directory path is known
      user:
        name: "{{ my_zsh_user }}"
      register: user_info  # This captures the user details, including home directory.

    - name: Check if Oh My Zsh is already installed
      stat:
        path: "/root/.oh-my-zsh"
      register: oh_my_zsh_stat

    - name: Check if zshrc exists
      stat:
        path: "/root/.zshrc"
      register: zshrc_stat

    - name: Clone Oh My Zsh 
      git:
        repo: "https://github.com/ohmyzsh/ohmyzsh.git"
        dest: "/root/.oh-my-zsh"
      become_user: "{{ my_zsh_user }}"
      when: not oh_my_zsh_stat.stat.exists

    - name: Copy the default .zshrc template if not present
      copy:
        src: "/root/.oh-my-zsh/templates/zshrc.zsh-template"
        dest: "/root/.zshrc"
        remote_src: yes
      become_user: "{{ my_zsh_user }}"
      when: not zshrc_stat.stat.exists

    - name: Set Oh My Zsh theme to agnoster
      # Uses a regex replace to ensure 'ZSH_THEME="agnoster"'
      replace:
        path: "/root/.zshrc"
        regexp: '^ZSH_THEME="[^"]+"'
        replace: 'ZSH_THEME="agnoster"'
      become_user: "{{ my_zsh_user }}"

    - name: Change default shell to zsh for the user
      user:
        name: "{{ my_zsh_user }}"
        shell: /usr/bin/zsh


================================================
FILE: docker_images/gcp-dns-updater/Dockerfile
================================================
FROM python:3.14-slim

# Set the working directory in the container
WORKDIR /app

# Copy the requirements file into the container at /app
COPY requirements.txt .

# Install any needed packages specified in requirements.txt
# Using --no-cache-dir to reduce image size
RUN pip install --no-cache-dir -r requirements.txt

# Copy the current directory contents into the container at /app
COPY update_dns.py .

# Define the command to run the application
CMD ["python", "update_dns.py"]


================================================
FILE: docker_images/gcp-dns-updater/README.md
================================================
# GCP Dynamic DNS Updater Service

This service periodically checks the public IPv4 address of the node it's running on and updates a specified A record in a Google Cloud DNS managed zone. It's designed to run as a Nomad job within the Hashi-Homelab environment, utilizing a **pre-built Docker image**.

## Features

*   Fetches the current public IPv4 address from `https://v4.ifconfig.co/ip`.
*   Uses the `google-cloud-dns` Python SDK to interact with Google Cloud DNS.
*   Authenticates using a GCP Service Account key provided via an environment variable.
*   Checks the specified DNS record:
    *   If it's a CNAME, it deletes the CNAME record.
    *   If it's an A record, it updates the IP address if it has changed.
    *   If it doesn't exist (or after deleting a CNAME), it creates the A record with the specified TTL.
*   Runs periodically via a Nomad job, executing the Python script within the pre-built Docker container.

## Prerequisites

1.  **Docker:** Docker must be installed locally to build the service image.
2.  **GCP Service Account:** You need a Google Cloud Platform service account with the necessary permissions to manage DNS records.
    *   Go to the GCP Console -> IAM & Admin -> Service Accounts.
    *   Create a new service account (e.g., `gcp-dns-updater-sa`).
    *   Grant this service account the `DNS Administrator` role (`roles/dns.admin`) on the project containing your managed zone.
    *   Create a JSON key file for this service account and download it securely. You will need the *contents* of this file, not the file itself.
3.  **Nomad Environment:** A running Nomad cluster where this job can be scheduled. The Nomad clients must have Docker installed and configured.

## Configuration

The service is configured via environment variables passed to the Nomad task, which are then consumed by the `update_dns.py` script running inside the Docker container:

*   `GCP_DNS_ZONE_NAME`: The name of the managed zone in GCP DNS (e.g., `demonsafe-com`). The script derives the Project ID from the credentials.
*   `GCP_DNS_RECORD_NAME`: The DNS record name to update (e.g., `*.demonsafe.com`). **Note:** The script expects the base name; the trailing dot is handled internally if needed by the SDK.
*   `RECORD_TTL`: (Optional) The Time-To-Live (in seconds) for the created/updated A record. Defaults to 300 if not set.
*   `GCP_PROJECT_ID`: The Google Cloud Project ID containing the DNS zone.
*   `GCP_SERVICE_ACCOUNT_KEY_B64`: **Required.** The base64-encoded *content* of the GCP service account JSON key file.

**Generating the Base64 Key:**

You need to encode the *content* of your downloaded JSON key file into a single-line base64 string.

On Linux/macOS, you can use:
```bash
base64 -w 0 < /path/to/your/gcp_key.json
```
*(Ensure you use `-w 0` or an equivalent flag for your `base64` command to prevent line wrapping)*

Copy the resulting string.

**Setting Environment Variables in Nomad:**

These variables are defined within the `env` block of the `nomad.job` file using Go templating to read runtime environment variables provided by the Nomad agent (which in turn are often sourced from the deployment mechanism, like GitHub Actions):

```hcl
# Example within nomad.job task config
env {
  GCP_DNS_ZONE_NAME = <<EOH
{{ env "NOMAD_VAR_tld" | replace "." "-" }}
EOH
  GCP_DNS_RECORD_NAME = <<EOH
*.{{ env "NOMAD_VAR_tld" }}
EOH
  GCP_SERVICE_ACCOUNT_KEY_B64 = <<EOH
{{ env "NOMAD_VAR_gcp_dns_admin" }}
EOH
  GCP_PROJECT_ID = <<EOH
{{ env "NOMAD_VAR_gcp_project_id" }}
EOH
  # RECORD_TTL = "300" # Optional, defaults to 300 in the script
}
```

**Important:** The actual values for `NOMAD_VAR_tld`, `NOMAD_VAR_gcp_dns_admin`, and `NOMAD_VAR_gcp_project_id` **must** be provided securely to the Nomad agent's environment during deployment (e.g., via GitHub Actions secrets mapped in the workflow, or using Vault integration), not hardcoded directly in the job file.

## Deployment

1.  **Ensure Prerequisites:** Verify the service account is created, you have the base64 encoded key, and Docker is running.
2.  **Build the Docker Image:** From the root of the `hashi-homelab` repository, run the make target:
    ```bash
    make build-gcp-dns-updater
    ```
    This builds the required Docker image tagged `gcp-dns-updater:latest` using the `gcp-dns-updater/Dockerfile`.
3.  **Deploy the Nomad Job:**
    *   Ensure the required environment variables (`NOMAD_VAR_tld`, `NOMAD_VAR_gcp_dns_admin`, `NOMAD_VAR_gcp_project_id`) are available to the Nomad agent running the job. This is typically handled by the CI/CD pipeline (like the GitHub Actions workflow in this repo) or Vault integration.
    *   Deploy using the Nomad CLI (ensure you are in the repository root or adjust paths). This job will use the `gcp-dns-updater:latest` image built in the previous step:
        ```bash
        # The job will read variables from its environment
        nomad job run gcp-dns-updater/nomad.job
        ```
    *   Alternatively, if using the project's Makefile structure:
        ```bash
        # Assumes the Makefile's deploy target doesn't need extra vars
        # and that required env vars are set in the deployment runner
        make deploy-gcp-dns-updater
        ```

## Files

*   `update_dns.py`: The core Python script for updating DNS (runs inside the container).
*   `requirements.txt`: Python dependencies (installed during Docker build).
*   `Dockerfile`: Defines how to build the service's Docker image.
*   `nomad.job`: Nomad job definition for periodic execution using the `gcp-dns-updater:latest` Docker image.
*   `README.md`: This documentation file.


================================================
FILE: docker_images/gcp-dns-updater/requirements.txt
================================================
google-cloud-dns
requests
google-auth

================================================
FILE: docker_images/gcp-dns-updater/update_dns.py
================================================

import os
import requests
import logging
import sys
import base64
import json
import time
import socket # Added import

# Import GCP specific libraries
from google.cloud import dns
from google.oauth2 import service_account
from google.api_core.exceptions import GoogleAPIError

# Setup logging
logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')

def get_env_vars():
    """Reads required environment variables and returns them."""
    project_id = os.environ.get('GCP_PROJECT_ID')
    zone_name = os.environ.get('GCP_DNS_ZONE_NAME') # This will be the TLD like "demonsafe.com"
    record_name = os.environ.get('GCP_DNS_RECORD_NAME')
    key_b64 = os.environ.get('GCP_SERVICE_ACCOUNT_KEY_B64') # Changed variable name

    if not all([project_id, zone_name, record_name, key_b64]): # Check for key_b64
        missing = [var for var, val in [
            ('GCP_PROJECT_ID', project_id),
            ('GCP_DNS_ZONE_NAME', zone_name),
            ('GCP_DNS_RECORD_NAME', record_name),
            ('GCP_SERVICE_ACCOUNT_KEY_B64', key_b64) # Updated missing check
        ] if not val]
        logging.error(f"Missing required environment variables: {', '.join(missing)}")
        sys.exit(1)

    return project_id, zone_name, record_name, key_b64 # Return key_b64

def get_public_ip():
    """Fetches the public IPv4 address."""
    try:
        response = requests.get('https://v4.ifconfig.me/ip', timeout=10)
        response.raise_for_status()  # Raise an exception for bad status codes
        ip_address = response.text.strip()
        logging.info(f"Successfully fetched public IP: {ip_address}")
        return ip_address
    except requests.exceptions.RequestException as e:
        logging.error(f"Error fetching public IP: {e}")
        sys.exit(1) # Exit if IP cannot be fetched

def get_dns_client(key_b64: str, project_id: str): # Changed key_path to key_b64 and added project_id
    """Creates and returns a DNS client authenticated with a base64 encoded service account key."""
    try:
        # Decode the base64 string
        logging.info("Decoding base64 service account key...")
        decoded_key = base64.b64decode(key_b64)
        logging.info("Base64 key decoded successfully.")

        # Parse the decoded JSON key
        logging.info("Parsing service account key JSON...")
        key_info = json.loads(decoded_key)
        logging.info("Service account key JSON parsed successfully.")

        # Create credentials from the parsed key info
        credentials = service_account.Credentials.from_service_account_info(key_info)

        # Use the provided project_id, not the one from credentials, to ensure consistency
        client = dns.Client(project=project_id, credentials=credentials)
        logging.info(f"Successfully created DNS client for project {project_id}")
        return client

    except base64.binascii.Error as e:
        logging.error(f"Failed to decode base64 service account key: {e}")
        sys.exit(1)
    except json.JSONDecodeError as e:
        logging.error(f"Failed to parse service account key JSON: {e}")
        sys.exit(1)
    except Exception as e:
        logging.error(f"Failed to create DNS client from service account info: {e}")
        sys.exit(1)

def update_dns_record(client: dns.Client, project_id: str, zone_name: str, record_name: str, ip_address: str):
    """
    Checks and updates/creates an A record for the given name in the specified zone,
    replacing a CNAME if necessary.

    Args:
        client: Authenticated DNS client.
        project_id: GCP project ID.
        zone_name: The domain TLD (e.g., "demonsafe.com"). This will be converted
                   to the GCP zone name format (e.g., "demonsafe-com").
        record_name: The specific record to update (e.g., "*.demonsafe.com").
        ip_address: The public IP address to set.
    """
    try:
        # Convert the TLD zone name (e.g., "demonsafe.com") to GCP zone name format (e.g., "demonsafe-com")
        gcp_zone_name = zone_name.replace('.', '-')
        logging.info(f"Targeting GCP DNS Zone: {gcp_zone_name}")

        zone = client.zone(gcp_zone_name, project_id)
        if not zone.exists():
            logging.error(f"DNS zone '{gcp_zone_name}' not found in project '{project_id}'.")
            return # Cannot proceed without the zone

        # Ensure record_name ends with a dot for FQDN matching
        fqdn = record_name if record_name.endswith('.') else f"{record_name}."
        logging.info(f"Checking DNS records for: {fqdn} in zone {gcp_zone_name}")

        record_sets = list(zone.list_resource_record_sets(filter_=f"name={fqdn}"))

        existing_a_record = None
        existing_cname_record = None

        for record_set in record_sets:
            if record_set.record_type == 'A' and record_set.name == fqdn:
                existing_a_record = record_set
                logging.info(f"Found existing A record: {existing_a_record.name} -> {existing_a_record.rrdatas}")
            elif record_set.record_type == 'CNAME' and record_set.name == fqdn:
                existing_cname_record = record_set
                logging.info(f"Found existing CNAME record: {existing_cname_record.name} -> {existing_cname_record.rrdatas}")

        changes = zone.changes()
        needs_update = False

        # Handle existing CNAME (delete it to replace with A)
        if existing_cname_record:
            logging.warning(f"Deleting existing CNAME record {fqdn} to replace with A record.")
            changes.delete_record_set(existing_cname_record)
            needs_update = True
            # Ensure we don't try to delete an A record if we just deleted a CNAME
            existing_a_record = None

        # Define the new A record we want
        new_a_record = zone.resource_record_set(fqdn, "A", 300, [ip_address])

        # Handle existing A record
        if existing_a_record:
            if existing_a_record.rrdatas == [ip_address]:
                logging.info(f"Existing A record {fqdn} already points to {ip_address}. No update needed.")
                return # Nothing to do
            else:
                logging.info(f"Existing A record {fqdn} points to {existing_a_record.rrdatas}. Updating to {ip_address}.")
                changes.delete_record_set(existing_a_record)
                changes.add_record_set(new_a_record)
                needs_update = True
        # Handle case where no A record (and no CNAME was found/deleted)
        elif not existing_cname_record: # Only add if we didn't already decide to replace CNAME
            logging.info(f"No existing A or CNAME record found for {fqdn}. Creating new A record pointing to {ip_address}.")
            changes.add_record_set(new_a_record)
            needs_update = True
        # Handle case where CNAME was found and deleted - we still need to add the A record
        elif existing_cname_record:
             logging.info(f"Adding A record for {fqdn} pointing to {ip_address} after CNAME deletion.")
             changes.add_record_set(new_a_record)
             # needs_update should already be True

        # Execute the changes if any were queued
        if needs_update:
            logging.info(f"Executing DNS changes for {fqdn} in zone {gcp_zone_name}...")
            changes.create()
            # Wait until the changes are finished.
            while changes.status != 'done':
                logging.info(f"Waiting for DNS changes to complete (status: {changes.status})...")
                time.sleep(5) # Wait 5 seconds before checking again
                changes.reload()
            logging.info(f"Successfully updated DNS record {fqdn} to {ip_address} in zone {gcp_zone_name}.")
        else:
            # This case should only be hit if an A record existed and was correct
            logging.info("No DNS changes were necessary.")

    except GoogleAPIError as e:
        logging.error(f"GCP API Error updating DNS record {fqdn} in zone {gcp_zone_name}: {e}")
    except Exception as e:
        logging.error(f"An unexpected error occurred during DNS update for {fqdn} in zone {gcp_zone_name}: {e}")


def update_spf_record(client: dns.Client, project_id: str, zone_name: str, record_name: str, ip_address: str):
    """Updates the SPF TXT record on the bare domain with the current public IP."""
    try:
        gcp_zone_name = zone_name.replace('.', '-')
        logging.info(f"Updating SPF record in zone: {gcp_zone_name}")

        zone = client.zone(gcp_zone_name, project_id)
        if not zone.exists():
            logging.error(f"DNS zone '{gcp_zone_name}' not found in project '{project_id}'.")
            return

        # Derive bare domain from record_name (e.g., "*.demonsafe.com" -> "demonsafe.com.")
        domain = record_name.lstrip('*.') if record_name.startswith('*.') else record_name
        fqdn = domain if domain.endswith('.') else f"{domain}."
        logging.info(f"Checking TXT records for: {fqdn}")

        spf_value = f'"v=spf1 ip4:{ip_address} ~all"'

        record_sets = list(zone.list_resource_record_sets(filter_=f"name={fqdn}"))
        existing_txt = None
        for rs in record_sets:
            if rs.record_type == 'TXT' and rs.name == fqdn:
                existing_txt = rs
                logging.info(f"Found existing TXT record: {rs.name} -> {rs.rrdatas}")
                break

        changes = zone.changes()
        needs_update = False

        if existing_txt:
            new_rrdatas = []
            spf_found = False
            for rd in existing_txt.rrdatas:
                if 'v=spf1' in rd:
                    spf_found = True
                    if ip_address in rd:
                        logging.info(f"SPF record already contains {ip_address}. No update needed.")
                        return
                    logging.info(f"Replacing SPF entry: {rd} -> {spf_value}")
                    new_rrdatas.append(spf_value)
                else:
                    new_rrdatas.append(rd)
            if not spf_found:
                logging.info(f"No existing SPF entry found. Adding: {spf_value}")
                new_rrdatas.append(spf_value)

            changes.delete_record_set(existing_txt)
            new_txt = zone.resource_record_set(fqdn, "TXT", 300, new_rrdatas)
            changes.add_record_set(new_txt)
            needs_update = True
        else:
            logging.info(f"No TXT record found for {fqdn}. Creating with SPF: {spf_value}")
            new_txt = zone.resource_record_set(fqdn, "TXT", 300, [spf_value])
            changes.add_record_set(new_txt)
            needs_update = True

        if needs_update:
            logging.info(f"Executing SPF TXT changes for {fqdn}...")
            changes.create()
            while changes.status != 'done':
                logging.info(f"Waiting for SPF changes to complete (status: {changes.status})...")
                time.sleep(5)
                changes.reload()
            logging.info(f"Successfully updated SPF record for {fqdn} with ip4:{ip_address}")

    except GoogleAPIError as e:
        logging.error(f"GCP API Error updating SPF record: {e}")
    except Exception as e:
        logging.error(f"Unexpected error updating SPF record: {e}")


if __name__ == "__main__":
    logging.info("Starting DNS update script.")
    project_id, zone_name, record_name, key_b64 = get_env_vars()
    public_ip = get_public_ip()

    # DNS Pre-check logic
    if public_ip:
        hostname_to_check = 'asdf.demonsafe.com'
        logging.info(f"Performing pre-check for hostname: {hostname_to_check}")
        try:
            resolved_ip = socket.gethostbyname(hostname_to_check)
            logging.info(f"Resolved IP for {hostname_to_check}: {resolved_ip}")
            if resolved_ip == public_ip:
                logging.info(f'DNS record for {hostname_to_check} ({resolved_ip}) already matches public IP ({public_ip}). No update needed.')
                sys.exit(0)
            else:
                logging.info(f'Resolved IP for {hostname_to_check} ({resolved_ip}) does not match public IP ({public_ip}). Proceeding with potential update.')
        except socket.gaierror as e:
            logging.warning(f'Could not resolve IP for {hostname_to_check}: {e}. Proceeding with potential update.')
        except Exception as e:
            logging.warning(f'An unexpected error occurred during DNS pre-check for {hostname_to_check}: {e}. Proceeding with potential update.')

    if public_ip:
        dns_client = get_dns_client(key_b64, project_id)
        if dns_client:
            update_dns_record(dns_client, project_id, zone_name, record_name, public_ip)
            update_spf_record(dns_client, project_id, zone_name, record_name, public_ip)
            logging.info("DNS update script finished.")
        else:
            logging.error("Exiting due to DNS client initialization failure.")
            sys.exit(1)
    else:
        logging.error("Exiting due to inability to fetch public IP.")
        sys.exit(1)


================================================
FILE: docker_images/update-metadata/Dockerfile
================================================
FROM python:3.14-slim

WORKDIR /app

COPY requirements.txt .
RUN pip install --no-cache-dir -r requirements.txt

COPY sync_secrets.py .

ENTRYPOINT ["python", "sync_secrets.py"]


================================================
FILE: docker_images/update-metadata/README.md
================================================
# GitHub Secret Synchronization Script (Containerized)

## Purpose

This script (`sync_secrets.py`), running inside a Docker container, reads environment variables defined in the project's root `.envrc` file and synchronizes them as GitHub secrets to the `perrymanuk/hashi-homelab` repository using the `PyGithub` library.

## Requirements

*   **Docker:** Docker must be installed and running to build and execute the container.
*   **`NOMAD_VAR_github_pat` Environment Variable:** A GitHub Personal Access Token (PAT) with the `repo` scope must be available as an environment variable named `NOMAD_VAR_github_pat` in the **host shell** where you run the `make` command. The Makefile target (`sync-secrets`) will handle passing this token into the container under the name `GITHUB_TOKEN` for the script to use.
*   **`.envrc` File:** An `.envrc` file must exist at the project root (`/Users/perry.manuk/git/perrymanuk/hashi-homelab/.envrc`) containing the secrets to sync.

## Usage

1.  **Ensure `NOMAD_VAR_github_pat` is set:** Export your GitHub PAT in your current host shell session:
    ```bash
    export NOMAD_VAR_github_pat="your_github_pat_here"
    ```
2.  **Navigate to the project root directory:**
    ```bash
    cd /Users/perry.manuk/git/perrymanuk/hashi-homelab
    ```
3.  **Run the Makefile target:**
    ```bash
    make sync-secrets
    ```

This command will:
    *   Build the Docker image defined in `scripts/Dockerfile`.
    *   Run a container from the image.
    *   Mount the host's `.envrc` file into the container.
    *   Pass the **host's** `NOMAD_VAR_github_pat` environment variable into the container as `GITHUB_TOKEN`.
    *   Execute the `sync_secrets.py` script within the container.

The script will output the status of each secret synchronization attempt (created, updated, or failed).

**Important:** Running the script will overwrite any existing secrets in the GitHub repository that have the same name as variables found in the `.envrc` file.

## `.envrc` Format

The script expects the `.envrc` file to follow this format:

```bash
export VARIABLE_NAME=value
export ANOTHER_VARIABLE='value with spaces'
export YET_ANOTHER="double quoted value"
# This is a comment and will be ignored

# Empty lines are also ignored
export SECRET_KEY=a_very_secret_value_here
```

*   Lines must start with `export`.
*   Variable names and values are separated by `=`.
*   Values can be unquoted, single-quoted (`'...'`), or double-quoted (`"..."`). Quotes are stripped before syncing.
*   Lines starting with `#` (comments) and empty lines are ignored.


================================================
FILE: docker_images/update-metadata/requirements.txt
================================================
PyGithub
hcl2


================================================
FILE: docker_images/update-metadata/update_job_metadata.py
================================================

import argparse
import logging
import pathlib
import re
import sys

# Configure logging
logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')


def find_job_block(content):
    """Find the start and end indices of the main 'job' block."""
    job_match = re.search(r'^job\s+"[^"]+"\s*\{', content, re.MULTILINE)
    if not job_match:
        logging.warning("Could not find job block start.")
        return None, None

    start_index = job_match.start()
    # Find the matching closing brace
    brace_level = 0
    end_index = -1
    in_string = False
    escaped = False
    for i, char in enumerate(content[start_index:]):
        if escaped:
            escaped = False
            continue
        if char == '\\':
            escaped = True
            continue
        if char == '"':
            in_string = not in_string
            continue
        if not in_string:
            if char == '{':
                brace_level += 1
            elif char == '}':
                brace_level -= 1
                if brace_level == 0:
                    end_index = start_index + i
                    break

    if end_index == -1:
        logging.warning("Could not find matching closing brace for job block.")
        return None, None

    return start_index, end_index + 1

def find_meta_block(content):
    """Find the start and end indices of the 'meta' block within the given content."""
    meta_match = re.search(r'^\s*meta\s*\{', content, re.MULTILINE)
    if not meta_match:
        return None, None

    start_index = meta_match.start()
    # Find the matching closing brace
    brace_level = 0
    end_index = -1
    in_string = False
    escaped = False
    for i, char in enumerate(content[start_index:]):
        if escaped:
            escaped = False
            continue
        if char == '\\':
            escaped = True
            continue
        if char == '"':
            in_string = not in_string
            continue
        if not in_string:
            if char == '{':
                brace_level += 1
            elif char == '}':
                brace_level -= 1
                if brace_level == 0:
                    end_index = start_index + i
                    break

    if end_index == -1:
        logging.warning("Could not find matching closing brace for meta block.")
        return None, None

    return start_index, end_index + 1

def update_job_metadata(repo_root):
    """Finds Nomad job files and updates their meta block with job_file path."""
    repo_path = pathlib.Path(repo_root).resolve()
    nomad_jobs_path = repo_path / 'nomad_jobs'

    if not nomad_jobs_path.is_dir():
        logging.error(f"'nomad_jobs' directory not found in {repo_path}")
        sys.exit(1)

    logging.info(f"Scanning for job files in {nomad_jobs_path}...")

    job_files = list(nomad_jobs_path.rglob('*.nomad')) + list(nomad_jobs_path.rglob('*.job'))

    if not job_files:
        logging.warning("No *.nomad or *.job files found.")
        return

    modified_count = 0
    for job_file in job_files:
        try:
            relative_path = job_file.relative_to(repo_path).as_posix()
            logging.debug(f"Processing file: {relative_path}")
            content = job_file.read_text()
            original_content = content # Keep a copy for comparison

            job_start, job_end = find_job_block(content)
            if job_start is None or job_end is None:
                logging.warning(f"Skipping {relative_path}: Could not find main job block.")
                continue
            job_block_content = content[job_start:job_end]
            job_opening_line_match = re.match(r'^job\s+"[^"]+"\s*\{\s*\n?', job_block_content, re.MULTILINE)
            if not job_opening_line_match:
                 logging.warning(f"Skipping {relative_path}: Could not match job opening line format.")
                 continue
            job_insert_pos = job_start + job_opening_line_match.end()

            meta_start_rel, meta_end_rel = find_meta_block(job_block_content)
            new_job_file_line = f'  job_file = "{relative_path}"'
            modified = False

            if meta_start_rel is not None and meta_end_rel is not None:
                meta_start_abs = job_start + meta_start_rel
                meta_end_abs = job_start + meta_end_rel
                meta_block_content = content[meta_start_abs:meta_end_abs]
                meta_opening_line_match = re.match(r'^\s*meta\s*\{\s*\n?', meta_block_content, re.MULTILINE)
                if not meta_opening_line_match:
                    logging.warning(f"Skipping {relative_path}: Could not match meta opening line format.")
                    continue
                meta_insert_pos = meta_start_abs + meta_opening_line_match.end()

                job_file_line_match = re.search(r'^(\s*)job_file\s*=\s*".*?"$\n?', meta_block_content, re.MULTILINE)

                if job_file_line_match:
                    existing_line = job_file_line_match.group(0)
                    indent = job_file_line_match.group(1)
                    new_line_with_indent = f'{indent}job_file = "{relative_path}"\n' # Ensure newline
                    if existing_line.strip() != new_line_with_indent.strip():
                         # Replace existing line
                        start = meta_start_abs + job_file_line_match.start()
                        end = meta_start_abs + job_file_line_match.end()
                        # Ensure we capture the trailing newline if present in match
                        content = content[:start] + new_line_with_indent + content[end:]
                        modified = True
                else:
                    # Insert new job_file line inside meta block
                    content = content[:meta_insert_pos] + new_job_file_line + '\n' + content[meta_insert_pos:]
                    modified = True
            else:
                # Insert new meta block
                new_meta_block = f'\n  meta {{\n{new_job_file_line}\n  }}\n'
                content = content[:job_insert_pos] + new_meta_block + content[job_insert_pos:]
                modified = True

            if modified and content != original_content:
                job_file.write_text(content)
                logging.info(f"Updated metadata in: {relative_path}")
                modified_count += 1
            elif not modified:
                 logging.debug(f"No changes needed for: {relative_path}")

        except Exception as e:
            logging.error(f"Failed to process {relative_path}: {e}")

    logging.info(f"Metadata update complete. {modified_count} files modified.")


if __name__ == "__main__":
    parser = argparse.ArgumentParser(description="Update Nomad job files with job_file metadata.")
    # Default to the parent directory of the script's directory (../)
    script_dir = pathlib.Path(__file__).parent.resolve()
    default_repo_root = script_dir.parent
    parser.add_argument(
        "--repo-root",
        type=str,
        default=str(default_repo_root),
        help="Path to the root of the repository."
    )
    args = parser.parse_args()

    update_job_metadata(args.repo_root)


================================================
FILE: envrc
================================================
export CONSUL_HTTP_ADDR=http://FILL_IN_IP:8500
export CONSUL_CACERT=/etc/consul.d/ssl/ca.cert
export CONSUL_CLIENT_CERT=/etc/consul.d/ssl/consul.cert
export CONSUL_CLIENT_KEY=/etc/consul.d/ssl/consul.key
export VAULT_ADDR=http://FILL_IN_IP:8200
export VAULT_TOKEN=FILL_IN_TOKEN
export NOMAD_ADDR=http://FILL_IN_IP:4646
export NOMAD_VAR_region='home'
export NOMAD_VAR_tld='home'
export NOMAD_VAR_shared_dir='/home/shared/'
export NOMAD_VAR_downloads_dir='/home/sabnzbd/downloads'
export NOMAD_VAR_music_dir='/home/media/Music'
export NOMAD_VAR_movies_dir='/home/media/Movies'
export NOMAD_VAR_tv_dir='/home/media/TV'
export NOMAD_VAR_media_dir='/home/media'


================================================
FILE: nomad_jobs/TEMPLATE-volume.hcl
================================================
// =============================================================================
// Nomad CSI Volume Template
// =============================================================================
//
// Usage:
//   1. Copy this file to nomad_jobs/<category>/<service-name>/volume.hcl
//   2. Replace __VOL_NAME__ with the volume name (usually same as service name)
//   3. Replace __SIZE__ with capacity (e.g. "5GiB", "10GiB", "50GiB")
//   4. Set access_mode based on your needs (see below)
//   5. Volume is auto-created by CI when pushed (if path is in workflow filter)
//
// Access modes:
//   single-node-writer       : one node read/write (most services)
//   single-node-reader-only  : one node read-only
//   multi-node-single-writer : multiple nodes can mount, one writes (HA failover)
//
// Size guide:
//   Config-only (app state):  1-5 GiB
//   Small databases:          5-10 GiB
//   Media metadata/indexes:   10-20 GiB
//   Time-series / logs:       50-100 GiB
//
// =============================================================================

id           = "__VOL_NAME__"
external_id  = "__VOL_NAME__"
name         = "__VOL_NAME__"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "__SIZE__"
capacity_max = "__SIZE__"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "file-system"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}


================================================
FILE: nomad_jobs/TEMPLATE.job
================================================
// =============================================================================
// Nomad Job Template
// =============================================================================
//
// Usage:
//   1. Copy this file to nomad_jobs/<category>/<service-name>/nomad.job
//   2. Find/replace the following placeholders:
//      - __JOB_NAME__        : lowercase service name (e.g. "sonarr")
//      - __GROUP_NAME__      : group name (e.g. "downloaders", "monitoring", "ai")
//      - __CATEGORY__        : directory category (e.g. "media-stack", "ai-ml")
//      - __IMAGE__           : docker image with tag (e.g. "linuxserver/sonarr:4.0.16")
//      - __PORT__            : container port number (e.g. "8989")
//      - __HEALTH_PATH__     : HTTP health check path (e.g. "/ping", "/-/healthy", "/api/health")
//      - __CPU__             : CPU MHz allocation (see guide below)
//      - __MEMORY__          : Memory MB allocation (see guide below)
//   3. Remove any optional sections you don't need (marked with OPTIONAL)
//   4. Update the variable declarations at the bottom
//   5. Add any job-specific secrets to .envrc as NOMAD_VAR_<name>
//   6. Add the job path to .github/workflows/nomad.yaml if it should auto-deploy
//
// Resource guide:
//   Light services (static sites, proxies):     cpu = 100-200,  memory = 128-256
//   Medium services (APIs, web apps):            cpu = 500-1000, memory = 512-1024
//   Heavy services (.NET apps, databases, Java): cpu = 1000+,    memory = 1024-2048
//   GPU / ML workloads:                          cpu = 200+,     memory = 4096-8192
//
// =============================================================================

job "__JOB_NAME__" {
  region      = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/__CATEGORY__/__JOB_NAME__/nomad.job"
    version  = "1"
  }

  // Ensures scheduling on nodes with NFS shared mount available.
  // Remove if the service has no need for shared storage or config dirs.
  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "__GROUP_NAME__" {
    count = 1

    network {
      port "http" {
        host_network = "lan"
        to           = "__PORT__"
      }
    }

    // --- OPTIONAL: CSI Volume ------------------------------------------------
    // Use for services that need persistent block storage (databases, stateful apps).
    // Requires a matching volume.hcl deployed first.
    // Remove this block and the prep-disk task + volume_mount if not needed.
    //
    // volume "__JOB_NAME__" {
    //   type            = "csi"
    //   read_only       = false
    //   source          = "__JOB_NAME__"
    //   access_mode     = "single-node-writer"
    //   attachment_mode = "file-system"
    // }
    // -------------------------------------------------------------------------

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel      = 1
      min_healthy_time  = "30s"
      healthy_deadline  = "5m"
      progress_deadline = "10m"
      auto_revert       = true
    }

    // --- OPTIONAL: Prep-disk task --------------------------------------------
    // Required when using CSI volumes to fix ownership before the main task runs.
    // Set UID:GID to match the user the main container runs as.
    // Common values:
    //   linuxserver images: 65534:65534 (nobody)
    //   prometheus:         1000:2000
    //   grafana:            472:472
    //   loki:               10001:10001
    //
    // task "prep-disk" {
    //   driver = "docker"
    //
    //   lifecycle {
    //     hook    = "prestart"
    //     sidecar = false
    //   }
    //
    //   volume_mount {
    //     volume      = "__JOB_NAME__"
    //     destination = "/volume/"
    //     read_only   = false
    //   }
    //
    //   config {
    //     image   = "busybox:latest"
    //     command = "sh"
    //     args    = ["-c", "chown -R UID:GID /volume/"]
    //   }
    //
    //   resources {
    //     cpu    = 200
    //     memory = 128
    //   }
    // }
    // -------------------------------------------------------------------------

    task "__JOB_NAME__" {
      driver = "docker"

      config {
        image = "__IMAGE__"
        ports = ["http"]

        // --- Bind mount pattern (shared NFS config dir) ---
        // Use for services that store config on shared NFS.
        // volumes = [
        //   "${var.shared_dir}__JOB_NAME__:/config",
        // ]

        // --- Template mount pattern (config rendered by Nomad) ---
        // Use when config is templated inline below.
        // volumes = [
        //   "local/config.yaml:/app/config.yaml",
        // ]
      }

      // --- OPTIONAL: CSI volume mount ----------------------------------------
      // volume_mount {
      //   volume      = "__JOB_NAME__"
      //   destination = "/data"
      //   read_only   = false
      // }
      // -----------------------------------------------------------------------

      env {
        TZ = "Etc/UTC"
        // PUID = "65534"    // common for linuxserver images
        // PGID = "65534"
      }

      // --- OPTIONAL: Config template -----------------------------------------
      // Use for services that need a rendered config file.
      // Reference secrets with ${var.secret_name} syntax.
      //
      // template {
      //   data        = <<EOH
      // your config here
      // EOH
      //   destination = "local/config.yaml"
      //   change_mode = "restart"
      //   // change_mode options:
      //   //   "restart" - restart the task on config change (safest default)
      //   //   "signal"  - send a signal: change_signal = "SIGHUP"
      //   //   "noop"    - do nothing (use only for static configs)
      // }
      // -----------------------------------------------------------------------

      service {
        port = "http"
        name = "__JOB_NAME__"
        tags = [
          "traefik.enable=true",
        ]
        check {
          type     = "http"
          path     = "__HEALTH_PATH__"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = __CPU__
        memory = __MEMORY__
      }
    }
  }
}

// =============================================================================
// Variables
// =============================================================================
// Common variables (always required - provided by .envrc / GitHub Actions):

variable "region" {
  type        = string
  description = "Nomad region"
}

variable "tld" {
  type        = string
  description = "Top-level domain for service discovery"
}

variable "shared_dir" {
  type        = string
  description = "Path to shared NFS config directory"
}

// --- OPTIONAL: Add job-specific variables below ------------------------------
// Follow this pattern:
//
// variable "my_secret" {
//   type        = string
//   description = "Description of what this secret is for"
// }
//
// Then add to .envrc:  export NOMAD_VAR_my_secret='value'
// And to GitHub Actions workflow env block if auto-deploying.
// -----------------------------------------------------------------------------


================================================
FILE: nomad_jobs/ai-ml/cognee/nomad.job
================================================
job "cognee" {
  region = var.region
  datacenters = ["dc1"]
  type = "service"

  meta {
    job_file = "nomad_jobs/ai-ml/cognee/nomad.job"
    version = "3"
  }

  group "cognee-ai" {
    count = 1

    network {
      port "http" { to = 8000 }
#      port "mcp" { to = 3000 }
    }


    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "cognee-service" {
      driver = "docker"

      config {
        dns_servers = ["192.168.50.2"]
        image = "cognee/cognee:0.5.8"
        ports = ["http"]
      }

      env {
        # --- LLM Configuration ---
        LLM_PROVIDER            = "openai"
        LLM_MODEL               = "vertex_ai/gemini-1.5-pro-latest"
        LLM_API_KEY             = ""
        LLM_ENDPOINT            = "https://litellm.demonsafe.com"

        # --- Embedding Configuration ---
        EMBEDDING_PROVIDER      = "openai"
        EMBEDDING_MODEL         = "text-embedding-ada-002"
        EMBEDDING_API_KEY       = ""

        # --- Relational Database (PostgreSQL) ---
        DB_PROVIDER             = "postgres"
        DB_HOST                 = "pgvector.service.consul"
        DB_PORT                 = "5432"
        DB_USERNAME             = "postgres"
        DB_PASSWORD             = "ChAnGeMe"
        DB_NAME                 = "cognee_metadata_db"

        # --- Vector Database (Qdrant) ---
        #VECTOR_DB_PROVIDER      = "qdrant"
        #VECTOR_DB_URL           = "http://qdrant.service.consul:6333"

        # --- Graph Database (Neo4j) ---
        GRAPH_DATABASE_PROVIDER = "neo4j"
        GRAPH_DATABASE_URL      = "bolt://neo4j.service.consul:7687"
        GRAPH_DATABASE_USERNAME = "neo4j"
        GRAPH_DATABASE_PASSWORD = "ChAnGeMe"

        # --- General Settings ---
        HOST                    = "0.0.0.0"
        ENVIRONMENT             = "production"
        DEBUG                   = "false"
      }

      resources {
        cpu    = 100
        memory = 2048
      }

      service {
        name     = "cognee"
        tags     = ["traefik.enable=true"]
        port     = "http"

        check {
          type     = "tcp"
          port     = "http"
          interval = "15s"
          timeout  = "3s"
        }
      }
    }
  }
}

variable "region" {
  type = string
  default = "global"
}


================================================
FILE: nomad_jobs/ai-ml/crawl4ai/nomad.job
================================================
job "crawl4ai" {
  region      = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/ai-ml/crawl4ai/nomad.job"
    version  = "4"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "app" {
    count = 1

    network {
      port "http" {
        to = 11235
      }
    }

    volume "crawl4ai" {
      type            = "csi"
      read_only       = false
      source          = "crawl4ai-data"
      access_mode     = "single-node-writer"
      attachment_mode = "file-system"
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "prep-disk" {
      driver = "docker"
      
      volume_mount {
        volume      = "crawl4ai"
        destination = "/volume/"
        read_only   = false
      }
      
      config {
        image   = "busybox:latest"
        command = "sh"
        args    = ["-c", "mkdir -p /volume/config && chmod -R 777 /volume/"]
      }
      
      resources {
        cpu    = 200
        memory = 128
      }

      lifecycle {
        hook    = "prestart"
        sidecar = false
      }
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "crawl4ai" {
      driver = "docker"

      config {
        image    = "unclecode/crawl4ai:0.6.0-r2"
        ports    = ["http"]
        shm_size = "1000000000"
        dns_servers = ["192.168.50.2"]
      }

      volume_mount {
        volume      = "crawl4ai"
        destination = "/app/data"
        read_only   = false
      }

      template {
        data = <<EOH
# Application Configuration
app:
  title: "Crawl4AI API"
  version: "0.6.0-r1"
  host: "0.0.0.0"
  port: 11235
  reload: False
  timeout_keep_alive: 300

# Default LLM Configuration
llm:
  provider: "gemini/gemini-2.5-flash-preview-04-17"
  api_key_env: "${var.litellm_crawl4ai_key}"
  api_base: "https://litellm.${var.tld}"

# Redis Configuration
redis:
  host: "redis.service.consul"
  port: 6379
  key_prefix: "crawl4ai:"

# Rate Limiting Configuration
rate_limit:
  enabled: true
  limits:
    default: "60/minute"
    html: "120/minute" 
    screenshot: "30/minute"
    pdf: "15/minute"
  storage_uri: "redis://redis.service.consul:6379/2"

# Security Configuration
security:
  enabled: false
  jwt_enabled: false
  https_redirect: false
  trusted_hosts: ["*"]
  headers:
    x_content_type_options: "nosniff"
    x_frame_options: "DENY"
    content_security_policy: "default-src 'self'"
    strict_transport_security: "max-age=63072000; includeSubDomains"

# Crawler Configuration
crawler:
  memory_threshold_percent: 95.0
  rate_limiter:
    base_delay: [1.0, 2.0]
  timeouts:
    stream_init: 30.0
    batch_process: 300.0

# Logging Configuration
logging:
  level: "INFO"
  format: "%(asctime)s - %(name)s - %(levelname)s - %(message)s"

# Observability Configuration
observability:
  prometheus:
    enabled: True
    endpoint: "/metrics"
  health_check:
    endpoint: "/health"
EOH

        destination   = "/app/data/config/config.yml"
        change_mode   = "restart"
      }

      resources {
        cpu    = 1000
        memory = 1024
      }

      env {
        PORT = "11235"
        CONFIG_PATH = "/app/data/config/config.yml"
        OPENAI_API_KEY = "${var.litellm_crawl4ai_key}"
      }

      service {
        port = "http"
        name = "crawl4ai"
        tags = [
          "traefik.enable=true",
          "metrics"
        ]

        check {
          type     = "http"
          path     = "/health"
          port     = "http"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }
    }
  }
}

variable "region" {}
variable "tld" {}
variable "shared_dir" {}
variable "litellm_crawl4ai_key" {}

================================================
FILE: nomad_jobs/ai-ml/crawl4ai/volume.hcl
================================================
id           = "crawl4ai-data"
external_id  = "crawl4ai-data"
name         = "crawl4ai-data"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "5GiB"
capacity_max = "5GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime", "nodiratime", "data=ordered"]
}

================================================
FILE: nomad_jobs/ai-ml/litellm/nomad.job
================================================
job "litellm" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/ai-ml/litellm/nomad.job"
      version = "6"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "ai" {
    count = 1 
    network {
      port "http" {
        host_network = "lan"
        to = "4000"  # LiteLLM default port is 8000
      }
    }

    volume "litellm" {
      type      = "csi"
      read_only = false
      source    = "litellm"
      access_mode = "single-node-writer"
      attachment_mode = "file-system"
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "litellm" {
      driver = "docker"
      config {
        image = "ghcr.io/berriai/litellm:main-latest"
        ports = ["http"]
        volumes = [
          "local/config.yaml:/app/config.yaml",
        ]
      }

      volume_mount {
        volume      = "litellm"
        destination = "/data"
        read_only   = false
      }

      env {
        PORT = "${NOMAD_PORT_http}"
        HOST = "0.0.0.0"
        LITELLM_CONFIG_PATH = "/app/config.yaml"
        OLLAMA_BASE_URL = "${var.ollama_base_url}"
        AWS_ACCESS_KEY_ID = "${var.aws_access_key}"
        AWS_SECRET_ACCESS_KEY = "${var.aws_secret_key}"
        AWS_REGION = "${var.bedrock_aws_region}"
        GOOGLE_API_KEY = "${var.gemini_api_key}"
        LITELLM_MASTER_KEY = "${var.litellm_master_key}"
        #LITELLM_SALT_KEY = "${var.litellm_salt_key}"  # Added salt key for credential encryption
        DATABASE_URL = "postgresql://postgres:${var.postgres_pass}@postgres.service.consul:5432/litellm"
        STORE_MODEL_IN_DB = "True"
      }

      template {
        data = <<EOH
model_list:
  # Ollama models
  - model_name: ollama/llama2
    litellm_params:
      model: ollama/llama2
      api_base: ${var.ollama_base_url}

  - model_name: gpt-3.5-turbo
    litellm_params:
      model: ollama/llama2
      api_base: ${var.ollama_base_url}
  
  # AWS Bedrock - Claude 3.7 Sonnet
  - model_name: anthropic.claude-3-7-sonnet-20250219-v1:0
    litellm_params:
      model: bedrock/eu.anthropic.claude-3-7-sonnet-20250219-v1:0
      aws_access_key_id: ${var.aws_access_key}
      aws_secret_access_key: ${var.aws_secret_key}
      bedrock_aws_region: ${var.bedrock_aws_region}
  
  # Google Gemini Pro 2.5
  - model_name: gemini
    litellm_params:
      api_key: ${var.gemini_api_key}
      vertex_project: "htg-infra"
      vertex_location: "us-central1"


litellm_settings:
  drop_params: True
  cache: True
  cache_params:
    type: redis
    host: redis.service.consul
    port: 6379
    password: ""
    namespace: litellm
  # Log and trace settings
  streaming: True
  logging: True
  # Added user management settings
  user_api_key_backend: "postgres"
  use_queue: True
  num_workers: 4

environment_variables:
  AWS_ACCESS_KEY_ID: ${var.aws_access_key}
  AWS_SECRET_ACCESS_KEY: ${var.aws_secret_key}
  AWS_REGION: ${var.bedrock_aws_region}
  GOOGLE_API_KEY: ${var.gemini_api_key}
  LITELLM_MASTER_KEY: ${var.litellm_master_key}
  LITELLM_SALT_KEY: ${var.litellm_salt_key}
  DATABASE_URL: postgresql://postgres:${var.postgres_pass}@postgres.service.consul:5432/litellm
EOH
        destination = "local/config.yaml"
        env         = false
      }

      service {
        port = "http"
        name = "litellm"
        tags = [
          "traefik.enable=true"
        ]
        check {
          type     = "tcp"
          interval = "10s"
          timeout  = "2s"
        }
      }

      resources {
        cpu    = 800
        memory = 1536
      }
    }
  }
}

variable "region" {
    type = string
}

variable "tld" {
    type = string
}

variable "shared_dir" {
    type = string
}

variable "ollama_base_url" {
    type = string
    description = "Base URL for the Ollama service"
    default = "http://ollama.service.consul:11434"
}

variable "aws_access_key" {
    type = string
    description = "AWS Access Key ID for Bedrock access"
}

variable "aws_secret_key" {
    type = string
    description = "AWS Secret Access Key for Bedrock access"
}

variable "bedrock_aws_region" {
    type = string
    description = "AWS Region for Bedrock"
    default = "eu-central-1"
}

variable "gemini_api_key" {
    type = string
    description = "Google API Key for Gemini access"
}

variable "litellm_master_key" {
    type = string
    description = "Master key for LiteLLM authentication"
}

variable "litellm_salt_key" {
    type = string
    description = "Salt key for encrypting provider credentials"
}

variable "postgres_pass" {
    type = string
    description = "Password for PostgreSQL database"
}

================================================
FILE: nomad_jobs/ai-ml/litellm/volume.hcl
================================================
id           = "litellm"
external_id  = "litellm"
name         = "litellm"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "1GiB"
capacity_max = "1GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}

================================================
FILE: nomad_jobs/ai-ml/manyfold/3dprints-volume.hcl
================================================
id           = "3dprints"
external_id  = "3dprints"
name         = "3dprints"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "40GiB"
capacity_max = "40GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}


================================================
FILE: nomad_jobs/ai-ml/manyfold/nomad.job
================================================
job "manyfold" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/ai-ml/manyfold/nomad.job"
version = "4"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "downloaders" {
    count = 1 
    network {
      port "http" {
        host_network = "lan"
        to = "3214"
      }
    }

    volume "manyfold" {
      type      = "csi"
      read_only = false
      source    = "manyfold"
      access_mode = "single-node-writer"
      attachment_mode = "file-system"
    }

    volume "3dprints" {
      type      = "csi"
      read_only = false
      source    = "3dprints"
      access_mode = "single-node-writer"
      attachment_mode = "file-system"
    }


    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "manyfold" {
      driver = "docker"
      config {
        image = "ghcr.io/manyfold3d/manyfold-solo:0.137.0"
        ports = ["http"]
      }

      volume_mount {
        volume      = "manyfold"
        destination = "/config"
        read_only   = false
      }

      volume_mount {
        volume      = "3dprints"
        destination = "/libraries"
        read_only   = false
      }

      env {
        PUID = "1000"
        PGID = "1000"
        TZ = "Etc/UTC"
	SECRET_KEY_BASE = "${var.manyfold_secret_key}"
      }

      service {
        port = "http"
	name = "manyfold"
        tags = [
          "traefik.enable=true",
          "traefik.http.middlewares.httpsRedirect.redirectscheme.scheme=https",
          "traefik.http.routers.${NOMAD_TASK_NAME}.tls.domains[0].sans=${NOMAD_TASK_NAME}.${var.tld}",
          "traefik.http.routers.${NOMAD_TASK_NAME}.middlewares=forward-auth"
        ]
        check {
          type     = "tcp"
          interval = "10s"
          timeout  = "2s"
        }
      }

      resources {
        cpu    = 100
        memory = 1024
      }
    }
  }
}

variable "region" {
    type = string
}

variable "tld" {
    type = string
}

variable "shared_dir" {
    type = string
}

variable "downloads_dir" {
    type = string
}

variable "music_dir" {
    type = string
}

variable "manyfold_secret_key" {
    type = string
}


================================================
FILE: nomad_jobs/ai-ml/manyfold/prints_volume.hcl
================================================
id           = "3dprints"
external_id  = "3dprints"
name         = "3dprints"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "40GiB"
capacity_max = "40GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}


================================================
FILE: nomad_jobs/ai-ml/manyfold/volume.hcl
================================================
id           = "manyfold"
external_id  = "manyfold"
name         = "manyfold"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "40GiB"
capacity_max = "40GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}


================================================
FILE: nomad_jobs/ai-ml/ollama/nomad.job
================================================
job "ollama" {
  region = var.region
  datacenters = ["cheese"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/ai-ml/ollama/nomad.job"
    version = "4"
  }

  group "web" {
    network {
      mode = "host"
      port "web" {
        static = "11434"
        host_network = "lan"
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "ollama" {
      driver = "docker"

      config {
        image = "ollama/ollama"
        runtime = "nvidia"
        dns_servers = [var.dns_server_ip]
        volumes = [
          "${var.ollama_data_dir}:/root/.ollama",
        ]
        ports = ["web"]
      }

      env {
        # Make the GPU visible to this container.
        NVIDIA_VISIBLE_DEVICES       = "all"
        NVIDIA_DRIVER_CAPABILITIES   = "compute,utility"
        # Pre-pull models on startup
        OLLAMA_MODELS               = "llama3.2:3b,codellama:7b"
      }

      service {
        name = "${NOMAD_JOB_NAME}"
        tags = ["traefik.enable=true"]
        port = "web"

        check {
          type     = "tcp"
          port     = "web"
          interval = "30s"
          timeout  = "2s"
        }
      }

      resources {
        cpu    = "200"
        memory = "7000"
      }
    }
  }
}

variable "region" {
    type = string
}

variable "shared_dir" {
    type = string
}

variable "ollama_data_dir" {
  type = string
}

variable "datacenter" {
  type = string
}

variable "dns_server_ip" {
  type = string
}


================================================
FILE: nomad_jobs/ai-ml/open-webui/nomad.job
================================================
job "open-webui" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/ai-ml/open-webui/nomad.job"
      version = "3"  // Right-size memory 1024MB -> 768MB
  }

  group "web" {
    network {
      mode = "host"
      port "web" {
        to = "8080"
        host_network = "lan"
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    task "open-webui" {
      driver = "docker"

      config {
        image = "ghcr.io/open-webui/open-webui:v0.8.12"
        dns_servers = [var.dns_server_ip]
        volumes = [
          "${var.shared_dir}open-webui:/app/backend/data",
        ]
        ports = ["web"]
      }

     env {
        OLLAMA_BASE_URL= var.ollama_base_url
        WEBUI_SECRET_KEY = var.webui_secret_key
     }
      service {
        name = "${NOMAD_JOB_NAME}"
        tags = ["traefik.enable=true"]
        port = "web"

        check {
          type     = "tcp"
          port     = "web"
          interval = "30s"
          timeout  = "2s"
        }
      }

      resources {
        cpu    = "200"
        memory = "768"
      }
    }
  }
}

variable "region" {
    type = string
}

variable "shared_dir" {
    type = string
}

variable "ollama_base_url" {
  type = string
}

variable "webui_secret_key" {
  type = string
}

variable "datacenter" {
  type = string
}

variable "dns_server_ip" {
  type = string
}


================================================
FILE: nomad_jobs/ai-ml/paperless-ai/nomad.job
================================================
job "paperless-ai" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/ai-ml/paperless-ai/nomad.job"
version = "2"
  }

  group "web" {
    network {
      mode = "host"
      port "web" {
        to = "3000"
        host_network = "lan"
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    task "paperless-ai" {
      driver = "docker"

      config {
        image = "clusterzx/paperless-ai"
        dns_servers = ["192.168.50.2"]
        volumes = [
          "${var.shared_dir}paperless-ai:/app/data",
        ]
        ports = ["web"]
      }

      service {
        name = "${NOMAD_JOB_NAME}"
        tags = ["traefik.enable=true"]
        port = "web"

        check {
          type     = "tcp"
          port     = "web"
          interval = "30s"
          timeout  = "2s"
        }
      }

      resources {
        cpu    = "200"
        memory = "2048"
      }
    }
  }
}

variable "region" {
    type = string
}

variable "shared_dir" {
    type = string
}


================================================
FILE: nomad_jobs/ai-ml/pgvector-client/nomad.job
================================================
job "pgvector-client-example" {
  region = var.region
  datacenters = ["dc1"]
  type        = "batch"

  meta {
    job_file = "nomad_jobs/ai-ml/pgvector-client/nomad.job"
    version = "1"  // Initial version
  }

  group "client" {

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    task "embedding-example" {
      driver = "docker"

      config {
        image = "python:3.14-slim"
        command = "python"
        args = [
          "/local/embedding-example.py"
        ]
      }

      env {
        PGVECTOR_HOST     = "pgvector.service.consul"
        PGVECTOR_PORT     = "5433"
        PGVECTOR_USER     = "postgres"
        PGVECTOR_PASSWORD = "${var.pgvector_pass}"
        PGVECTOR_DB       = "embeddings"
      }

      template {
        data = <<EOH
#!/usr/bin/env python3
import os
import time
import psycopg2
import numpy as np
from psycopg2.extras import execute_values

# PostgreSQL connection parameters
pg_host = os.environ.get('PGVECTOR_HOST', 'pgvector.service.consul')
pg_port = os.environ.get('PGVECTOR_PORT', '5433')
pg_user = os.environ.get('PGVECTOR_USER', 'postgres')
pg_password = os.environ.get('PGVECTOR_PASSWORD', '')
pg_db = os.environ.get('PGVECTOR_DB', 'embeddings')

# Function to create random embeddings for demo purposes
def create_random_embedding(dim=1536):
    """Create a random normalized embedding vector."""
    vec = np.random.randn(dim)
    # Normalize to unit vector (common practice for embeddings)
    vec = vec / np.linalg.norm(vec)
    return vec.tolist()

# Connect to PostgreSQL with pgvector
print(f"Connecting to pgvector at {pg_host}:{pg_port}")
conn = psycopg2.connect(
    host=pg_host,
    port=pg_port,
    user=pg_user,
    password=pg_password,
    dbname=pg_db
)

cursor = conn.cursor()

# Ensure pgvector extension is enabled
print("Ensuring pgvector extension is enabled...")
cursor.execute("CREATE EXTENSION IF NOT EXISTS vector")

# Create a table for storing document embeddings
print("Creating documents table...")
cursor.execute("""
    CREATE TABLE IF NOT EXISTS documents (
        id SERIAL PRIMARY KEY,
        content TEXT NOT NULL,
        embedding VECTOR(1536) NOT NULL,
        metadata JSONB,
        created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP
    )
""")

# Create an index for efficient similarity search
print("Creating vector index (this might take a while for large tables)...")
try:
    cursor.execute("""
        CREATE INDEX IF NOT EXISTS documents_embedding_idx
        ON documents
        USING ivfflat (embedding vector_cosine_ops)
        WITH (lists = 100)
    """)
except Exception as e:
    print(f"Warning: Could not create index: {e}")
    print("Continuing without index...")

# Sample documents
print("Inserting sample documents...")
documents = [
    "The quick brown fox jumps over the lazy dog",
    "Machine learning models can process vector embeddings efficiently",
    "PostgreSQL with pgvector extension provides vector similarity search",
    "Vector databases are essential for modern AI applications",
    "Semantic search uses embeddings to find relevant results"
]

# Generate random embeddings and insert documents
data = []
for doc in documents:
    embedding = create_random_embedding()
    data.append((doc, embedding, {"source": "example"}))

execute_values(
    cursor,
    """
    INSERT INTO documents (content, embedding, metadata)
    VALUES %s
    RETURNING id
    """,
    data,
    template="(%s, %s::vector, %s)"
)

print(f"Inserted {len(documents)} documents with embeddings")

# Perform a similarity search
print("\nPerforming similarity search...")
query_embedding = create_random_embedding()

cursor.execute("""
    SELECT id, content, 1 - (embedding <=> %s) AS similarity
    FROM documents
    ORDER BY embedding <=> %s
    LIMIT 3
""", (query_embedding, query_embedding))

results = cursor.fetchall()
print("\nTop 3 most similar documents:")
for id, content, similarity in results:
    print(f"ID: {id}, Similarity: {similarity:.4f}")
    print(f"Content: {content}")
    print("-" * 50)

# Commit and close
conn.commit()
cursor.close()
conn.close()
print("Example completed successfully!")
EOH
        destination = "local/embedding-example.py"
      }

      resources {
        cpu    = 500
        memory = 512
      }
    }
  }
}

variable "region" {
    type = string
}

variable "pgvector_pass" {
    type = string
    description = "Admin password for pgvector PostgreSQL server"
}


================================================
FILE: nomad_jobs/ai-ml/radbot/nomad-dev.job
================================================
job "radbot-dev" {
  region      = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/ai-ml/radbot/nomad-dev.job"
    version  = "1"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "web" {
    count = 1

    network {
      port "http" {
        host_network = "lan"
        to           = 8000
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "60s"
      healthy_deadline = "5m"
      auto_revert      = true
    }

    task "radbot-dev" {
      driver = "docker"

      config {
        image       = "ghcr.io/perrymanuk/radbot:dev"
        dns_servers = [var.dns_server_ip]
        ports       = ["http"]
        volumes     = [
          "local/config.yaml:/app/config.yaml",
        ]
      }

      env {
        RADBOT_CREDENTIAL_KEY = var.radbot_credential_key
        RADBOT_ADMIN_TOKEN    = var.radbot_admin_token
        RADBOT_CONFIG_FILE    = "/app/config.yaml"
        RADBOT_ENV            = "dev"
      }

      template {
        data = <<EOH
database:
  host: postgres.service.consul
  port: 5432
  user: postgres
  password: ${var.postgres_pass}
  db_name: radbot_dev
EOH
        destination = "local/config.yaml"
        env         = false
      }

      service {
        port = "http"
        name = "radbot-dev"
        tags = [
          "traefik.enable=true",
        ]
        check {
          type     = "http"
          path     = "/health"
          interval = "30s"
          timeout  = "5s"
          check_restart {
            limit           = 3
            grace           = "120s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 1000
        memory = 2048
      }
    }
  }
}

# ------------------------------------------------------------------
# Variables — only bootstrap secrets
# ------------------------------------------------------------------

variable "region" {
  type = string
}

variable "dns_server_ip" {
  type = string
}

variable "postgres_pass" {
  type        = string
  description = "PostgreSQL password (needed to connect to DB where all config lives)"
}

variable "radbot_credential_key" {
  type        = string
  description = "Fernet master key for encrypting credentials/config in the DB"
}

variable "radbot_admin_token" {
  type        = string
  description = "Bearer token for /admin/ — the only pre-shared secret"
}


================================================
FILE: nomad_jobs/ai-ml/radbot/nomad.job
================================================
job "radbot" {
  region      = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/ai-ml/radbot/nomad.job"
    version  = "2"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "web" {
    count = 1

    network {
      port "http" {
        host_network = "lan"
        to           = 8000
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "60s"
      healthy_deadline = "5m"
      auto_revert      = true
    }

    task "radbot" {
      driver = "docker"

      config {
        image       = "ghcr.io/perrymanuk/radbot:v0.128"
        dns_servers = [var.dns_server_ip]
        ports       = ["http"]
        volumes     = [
          "local/config.yaml:/app/config.yaml",
          "${var.shared_dir}ai-intel:/mnt/ai-intel",
        ]
      }

      # Bootstrap-only env vars:
      # - RADBOT_CREDENTIAL_KEY: decrypt credentials/config stored in the DB
      # - RADBOT_ADMIN_TOKEN:    access /admin/ to manage everything else
      # - RADBOT_MCP_TOKEN:      bootstrap bearer for MCP bridge HTTP
      #                          (credential-store `mcp_token` wins once set)
      # - RADBOT_WIKI_PATH:      wiki root inside the container (matches the
      #                          ai-intel bind mount above)
      # All other config (API keys, models, integrations, endpoints) is stored
      # encrypted in the radbot_credentials table and managed via /admin/ UI.
      env {
        RADBOT_CREDENTIAL_KEY = var.radbot_credential_key
        RADBOT_ADMIN_TOKEN    = var.radbot_admin_token
        RADBOT_MCP_TOKEN      = var.radbot_mcp_token
        RADBOT_WIKI_PATH      = "/mnt/ai-intel"
        RADBOT_CONFIG_FILE    = "/app/config.yaml"
      }

      # Minimal bootstrap config — just enough to connect to the DB.
      # Everything else is loaded from the DB credential store at startup.
      template {
        data = <<EOH
database:
  host: postgres.service.consul
  port: 5432
  user: postgres
  password: ${var.postgres_pass}
  db_name: radbot_todos
EOH
        destination = "local/config.yaml"
        env         = false
      }

      service {
        port = "http"
        name = "radbot"
        tags = [
          "traefik.enable=true",
        ]
        check {
          type     = "http"
          path     = "/health"
          interval = "30s"
          timeout  = "5s"
          check_restart {
            limit           = 3
            grace           = "120s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 1000
        memory = 2048
      }
    }
  }
}

# ------------------------------------------------------------------
# Variables — only bootstrap secrets
# ------------------------------------------------------------------

variable "region" {
  type = string
}

variable "dns_server_ip" {
  type = string
}

variable "postgres_pass" {
  type        = string
  description = "PostgreSQL password (needed to connect to DB where all config lives)"
}

variable "radbot_credential_key" {
  type        = string
  description = "Fernet master key for encrypting credentials/config in the DB"
}

variable "radbot_admin_token" {
  type        = string
  description = "Bearer token for /admin/ — the only pre-shared secret"
}

variable "radbot_mcp_token" {
  type        = string
  description = "Bootstrap bearer token for the MCP bridge HTTP transport. The credential-store entry `mcp_token` takes priority once set, so this is only used before the first rotate."
}

variable "shared_dir" {
  type        = string
  description = "Base path on shared-mount nodes; jobs append their own subdirectory (this job mounts <shared_dir>/ai-intel at /mnt/ai-intel)."
}


================================================
FILE: nomad_jobs/core-infra/coredns/README.md
================================================
### Coredns
you can place extra configuration for coredns in the consul kv store at `apps/coredns/corefile` and it will be deployed with the job


================================================
FILE: nomad_jobs/core-infra/coredns/nomad.job
================================================
job "coredns" {
  region = var.region
  datacenters = ["dc1"]
  type = "service"
  priority = 100

  meta {
      job_file = "nomad_jobs/core-infra/coredns/nomad.job"
      version = "10"  // Write keepalived.conf directly instead of env.yaml
  }

  constraint {
    attribute = "${meta.dns}"
    operator  = "="
    value     = "true"
  }

  group "dns" {
    count = 2
    
    constraint {
      operator = "distinct_hosts"
      value    = "true"
    }
    
    network {
      mode = "host"
      port "dns" {
        static = "53"
        host_network = "lan"
      }
      port "metrics" {
        static = "9153"
        host_network = "lan"
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "60s"
      auto_revert      = true
      auto_promote     = true
      canary           = 2
    }

    task "keepalived-dns" {
      driver = "docker"
      
      lifecycle {
        hook = "prestart"
        sidecar = true
      }
      
      config {
        image = "osixia/keepalived:2.3.4"
        network_mode = "host"
        force_pull = false
        volumes = [
          "local/keepalived.conf:/etc/keepalived/keepalived.conf"
        ]
        cap_add = ["NET_ADMIN", "NET_BROADCAST", "NET_RAW"]
      }

      template {
        destination = "local/keepalived.conf"
        change_mode = "restart"
        splay       = "1m"
        data        = <<EOH
vrrp_instance VI_1 {
    state BACKUP
    interface {{ sockaddr "GetPrivateInterfaces | include \"network\" \"192.168.50.0/24\" | attr \"name\"" }}
    virtual_router_id 51
    priority 100
    advert_int 1

    unicast_peer {
{{- range service "coredns" }}
        {{ .Address }}
{{- end }}
    }

    virtual_ipaddress {
        192.168.50.2/24
        192.168.50.3/24
    }
}
EOH
      }
      
      resources {
        cpu    = 100
        memory = 64
      }
    }

    task "coredns" {
      driver = "docker"
      
      config {
        image = "coredns/coredns:1.14.2"
        network_mode = "host"
        force_pull = false
        ports = ["dns", "metrics"]
        args = ["-conf", "/local/coredns/corefile"]
      }

      service {
        port = "dns"
        name = "coredns"
        tags = ["coredns"]
        check {
          type     = "tcp"
          interval = "10s"
          timeout  = "2s"
        }
      }
      
      service {
        port = "metrics"
        name = "coredns"
        tags = ["metrics", "coredns"]
      }

      template {
        data = <<EOH
. {
  bind {{ env "NOMAD_IP_dns" }} 192.168.50.2 192.168.50.3
  forward . 8.8.8.8
  log
  errors
  prometheus {{ env "NOMAD_IP_metrics" }}:9153
}
consul.:53 {
  bind {{ env "NOMAD_IP_dns" }} 192.168.50.2 192.168.50.3
  forward . {{ env "NOMAD_IP_dns" }}:8600
  log
  prometheus {{ env "NOMAD_IP_metrics" }}:9153
}
fritz.box.:53 {
  bind {{ env "NOMAD_IP_dns" }} 192.168.50.2 192.168.50.3
  forward . 192.168.50.1:53
  log
  prometheus {{ env "NOMAD_IP_metrics" }}:9153
}
${var.tld}. {
  bind {{ env "NOMAD_IP_dns" }} 192.168.50.2 192.168.50.3

  file /local/coredns/zones/db.home.lab ${var.tld}

}
k8s. {
  bind {{ env "NOMAD_IP_dns" }} 192.168.50.2 192.168.50.3

  file /local/coredns/zones/db.k8s k8s

}
EOH
        destination = "local/coredns/corefile"
        env         = false
        change_mode = "signal"
        change_signal = "SIGHUP"
        left_delimiter  = "{{"
        right_delimiter = "}}"
      }

      template {
        change_mode   = "signal"
        change_signal = "SIGUSR1"
        destination = "local/coredns/zones/db.home.lab"
        data = <<EOH
$ORIGIN ${var.tld}.
$TTL    604800
${var.tld}.         IN SOA	ns1.${var.tld}. admin.${var.tld}. (
         {{ timestamp "unix" }}        ; Serial, current unix timestamp
             604800        ; Refresh
              86400        ; Retry
            2419200        ; Expire
             604800 )      ; Negative Cache TTL

; name servers - NS records
${var.tld}.         IN NS	 ns1.${var.tld}.
${var.tld}.         IN NS	 ns2.${var.tld}.

; name servers - A records
ns1                      IN A   192.168.50.1
ns2                      IN A   192.168.50.2

{{- /*  Point domains to the floating IP from keepalived */}}
; services - A records
lab.${var.tld}.         IN A   192.168.50.20
*                       IN A   192.168.50.20
@                       IN A   192.168.50.20

EOH
      }

      template {
        change_mode   = "signal"
        change_signal = "SIGUSR1"
        destination = "local/coredns/zones/db.k8s"
        data = <<EOH
$ORIGIN ${var.tld}.
$TTL    604800
k8s.         IN SOA	ns1.k8s. admin.k8s. (
         {{ timestamp "unix" }}        ; Serial, current unix timestamp
             604800        ; Refresh
              86400        ; Retry
            2419200        ; Expire
             604800 )      ; Negative Cache TTL

; name servers - NS records
k8s.         IN NS	 ns1.k8s.
k8s.         IN NS	 ns2.k8s.

; name servers - A records
ns1                      IN A   192.168.50.1
ns2                      IN A   192.168.50.2

{{- /*  Point domains to the floating IP from keepalived */}}
; services - A records
lab.k8s.                IN A   192.168.50.93
*.k8s.                  IN A   192.168.50.93
@                       IN A   192.168.50.93

EOH
      }
      
      resources {
        cpu    = 100
        memory = 128
      }
    }
  }
}

variable "region" {}
variable "tld" {}


================================================
FILE: nomad_jobs/core-infra/github-runner/nomad.job
================================================
job "github-runner" {
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/core-infra/github-runner/nomad.job"
version = "3"
  }

  group "runners" {
    count = 3
    # Don't reschedule in case of failure or drain
    reschedule {
      attempts  = 0
      unlimited = false
    }
   
    restart {
      attempts = 3
      delay = "30s"
      interval = "3m"
      mode = "delay"
    }

    network {
      port "http" { 
        host_network = "lan"
        to = "9252" 
      }
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "runner" {
      driver = "docker"
      kill_timeout = "25s"

      template {
        env         = true
        destination = "secrets/env"
        data        = <<-EOH
        RUNNER_NAME_PREFIX = "amd64"
        RUNNER_GROUP = "Default"
        RUNNER_SCOPE = "repo"
        REPO_URL = "https://github.com/perrymanuk/hashi-homelab"
        ACCESS_TOKEN = "${var.github_pat}"
        EPHEMERAL = "0"
        DISABLE_AUTO_UPDATE = "1"
        LABELS = "${var.labels}"
        EOH
      }

      template {
        data = <<-EOH
        {
        	"auths": {
        		"https://index.docker.io/v1/": {
              "auth": ""
        		}
	        }
        }
        EOH
        destination = "secrets/config.json"
      }

      resources {
        cpu    = 100
        memory = 128
      }

      config {
        image       = "myoung34/github-runner:2.333.1"
        extra_hosts = ["nomad.service.home:192.168.50.120"]
        ports       = ["http"]
        userns_mode = "host"
        privileged  = true
        mounts = [
          {
            type     = "bind"
            source   = "/var/run/docker.sock"
            target   = "/var/run/docker.sock"
            readonly = false
            bind_options = {
              propagation = "rprivate"
            }
          },
          {
            type     = "bind"
            source   = "secrets/config.json"
            target   = "/root/.docker/config.json"
            readonly = false
            bind_options = {
              propagation = "rprivate"
            }
          }
        ]
      }
    }
  }
}


variable "labels" {
  type = string
  default = "self-hosted"
}

variable "github_pat" {}


================================================
FILE: nomad_jobs/core-infra/haproxy/nomad.job
================================================
job "haproxy" {
  region = var.region
  datacenters = ["dc1"]
  type = "system"

  meta {
      job_file = "nomad_jobs/core-infra/haproxy/nomad.job"
version = "6"
  }

  group "lbs" {
    count = 1

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }
    task "haproxy" {
      driver = "docker"
      service {
        tags = ["haproxy"]
        name = "haproxy"
        port = "http"

        check {
          type     = "tcp"
          interval = "10s"
          timeout  = "2s"
        }

      }
      service {
        tags = ["metrics", "${NOMAD_ALLOC_ID}"]
        name = "haproxy-metrics"
        port = "metrics"

        check {
          type     = "tcp"
          interval = "10s"
          timeout  = "2s"
        }
      }

      service {
        tags = ["metrics", "${NOMAD_ALLOC_ID}"]
        name = "service-mesh"
        port = "http"

        check {
          type     = "tcp"
          interval = "10s"
          timeout  = "2s"
        }
      }

      config {
        image = "haproxy:3.3.6-alpine"
        args = ["-W", "-f", "local/etc/haproxy.cfg"]
        network_mode = "host"
      }

      template {
data = <<EOH
global
  maxconn     20000
  pidfile     /run/haproxy.pid
  stats timeout 2m
  daemon

defaults
  retry-on all-retryable-errors
  option http-use-htx
  errorfile 503 local/etc/error503.http

frontend http
  bind {{ env "NOMAD_ADDR_http" }}
  # options
  http-request add-header x-forwarded-proto http
  maxconn 50000
  mode http
  timeout client 0s
  timeout server 0s
  # acls
{{ range services }}{{ if .Tags | contains "net-internal" }}
  acl {{ .Name }}_net-internal hdr_reg(Host) -i {{ .Name }}.homelab
  acl {{ .Name }}_net-internal base_dom {{ .Name }}.homelab
  use_backend {{ .Name }}_net-internal if {{ .Name }}_net-internal
{{ end }}{{ end }}


# services

{{ range services -}}{{ if .Tags | contains "net-internal" -}}
backend {{ .Name }}_net-internal
  mode http
  option redispatch
  retries 10

  timeout connect 5s
  timeout queue 30s
  timeout server 30s

  {{ range service .Name -}}
  {{ if .Tags | contains "net-internal" -}}
  server {{ .ID }} {{ .Address }}:{{ .Port }}
  {{ end -}}
  {{ end }}
{{ end -}}
{{ end -}}

listen {{ env "NOMAD_IP_http" }}
  mode http

  bind ${NOMAD_ADDR_metrics}

  timeout client 30s
  timeout connect 5s
  timeout server  30s
  timeout queue   30s

  http-request use-service prometheus-exporter if { path /metrics }

  stats enable
  stats uri /
  stats show-node
  stats refresh 30s
  stats show-legends


EOH
        destination = "local/etc/haproxy.cfg"
        env         = false
        change_mode = "signal"
        change_signal = "SIGUSR2"
      }

      template {
data = <<EOH
HTTP/1.0 503 Service Unavailable
Cache-Control: no-cache
Connection: close
Content-Type: text/plain

Error 503: The specified service was not found or has no allocations. Please check your service configuration and try again

EOH
        destination = "local/etc/error503.http"
        env         = false
        change_mode = "signal"
        change_signal = "SIGHUP"
      }

      resources {
        cpu = 100
        memory = 64
        network {
          port "http" { 
            static = "80" 
          }
          port "metrics" {}
        }
      }
    }
  }
}


================================================
FILE: nomad_jobs/core-infra/iscsi-csi-plugin/controller.job
================================================
job "democratic-csi-iscsi-controller" {
  
  meta {
  job_file = "nomad_jobs/core-infra/iscsi-csi-plugin/controller.job"
  }
datacenters = ["dc1"]

  group "controller" {

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    task "plugin" {
      driver = "docker"

      config {
        image = "docker.io/democraticcsi/democratic-csi:v1.9.5"

        args = [
          "--csi-version=1.5.0",
          # must match the csi_plugin.id attribute below
          "--csi-name=org.democratic-csi.iscsi",
          "--driver-config-file=${NOMAD_TASK_DIR}/driver-config-file.yaml",
          "--log-level=info",
          "--csi-mode=controller",
          "--server-socket=/csi/csi.sock",
        ]
      }

      template {
        destination = "${NOMAD_TASK_DIR}/driver-config-file.yaml"

        data = <<EOH
driver: freenas-iscsi
instance_id:
httpConnection:
  protocol: https
  host: 192.168.50.208
  port: 443
  # use only 1 of apiKey or username/password
  # if both are present, apiKey is preferred
  # apiKey is only available starting in TrueNAS-12
  apiKey: ${var.truenas_api_key}
  username: iscsi-no
  password: "${var.truenas_iscsi_pass}"
  allowInsecure: true
  # use apiVersion 2 for TrueNAS-12 and up (will work on 11.x in some scenarios as well)
  apiVersion: 2
sshConnection:
  host: 192.168.50.208
  port: 22
  username: root
  # use either password or key
  password: "${var.truenas_iscsi_pass}"
zfs:
  # TrueNAS SCALE 24.10+ (Electric Eel) paths differ from FreeBSD defaults
  cli:
    paths:
      zfs: /usr/sbin/zfs
      zpool: /usr/sbin/zpool
      sudo: /usr/bin/sudo
      chroot: /usr/sbin/chroot
  
  # can be used to set arbitrary values on the dataset/zvol
  # can use handlebars templates with the parameters from the storage class/CO
  # TODO: set up handlebars templates to make this far more awesome
  #datasetProperties:
  #   "org.freenas:description": "created via democratic-csi"

  datasetParentName: ssd-vms0/nomad/vols
  # do NOT make datasetParentName and detachedSnapshotsDatasetParentName overlap
  # they may be siblings, but neither should be nested in the other
  detachedSnapshotsDatasetParentName: ssd-vms0/nomad/snaps
  zvolCompression: "lz4"
  zvolDedupe: ""
  zvolEnableReservation: False
  zvolBlocksize: ""
iscsi:
  targetPortal: "192.168.50.208:3260"
  targetPortals: []
  interface:

  # MUST ensure uniqueness
  # full iqn limit is 223 bytes, plan accordingly
  # default is //template name isn't defined!
  #nameTemplate: "{ { parameters.[csi.storage.k8s.io/pvc/namespace] }}-{ { parameters.[csi.storage.k8s.io/pvc/name] }}"
  namePrefix: csi-
  nameSuffix: "-discovery"
  # add as many as needed
  targetGroups:
    # get the correct ID from the "portal" section in the UI
    - targetGroupPortalGroup: 1
      # get the correct ID from the "initiators" section in the UI
      targetGroupInitiatorGroup: 1
      # None, CHAP, or CHAP Mutual
      targetGroupAuthType: None
      # get the correct ID from the "Authorized Access" section of the UI
      # only required if using Chap
      #targetGroupAuthGroup:

  extentInsecureTpc: true
  extentXenCompat: false
  extentDisablePhysicalBlocksize: true
  # 512, 1024, 2048, or 4096,
  extentBlocksize: 512
  # "" (let FreeNAS decide, currently defaults to SSD), Unknown, SSD, 5400, 7200, 10000, 15000
  extentRpm: "SSD"
  # 0-100 (0 == ignore)
  extentAvailThreshold: 0
EOH
      }

      csi_plugin {
        # must match --csi-name arg
        id        = "org.democratic-csi.iscsi"
        type      = "controller"
        mount_dir = "/csi"
      }

      resources {
        cpu    = 500
        memory = 128
      }
    }
  }
}

variable "truenas_api_key" {}
variable "truenas_iscsi_pass" {}


================================================
FILE: nomad_jobs/core-infra/iscsi-csi-plugin/node.job
================================================
job "democratic-csi-iscsi-node" {
  
  meta {
  job_file = "nomad_jobs/core-infra/iscsi-csi-plugin/node.job"
  }
datacenters = ["dc1", "cheese"]
  priority = 100
  # you can run node plugins as service jobs as well, but this ensures
  # that all nodes in the DC have a copy
  type = "system"

  group "nodes" {

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    task "plugin" {
      driver = "docker"

      env {
        CSI_NODE_ID = "${attr.unique.hostname}"
        
        # if you run into a scenario where your iscsi volumes are zeroed each time they are mounted,
        # you can configure the fs detection system used with the following envvar:
        #FILESYSTEM_TYPE_DETECTION_STRATEGY = "blkid"
      }

      config {
        image = "docker.io/democraticcsi/democratic-csi:v1.9.5"

        args = [
          "--csi-version=1.5.0",
          # must match the csi_plugin.id attribute below
          "--csi-name=org.democratic-csi.iscsi",
          "--driver-config-file=${NOMAD_TASK_DIR}/driver-config-file.yaml",
          "--log-level=debug",
          "--csi-mode=node",
          "--server-socket=/csi/csi.sock",
        ]

        # node plugins must run as privileged jobs because they
        # mount disks to the host
        privileged = true
        ipc_mode = "host"
        network_mode = "host"

        mount {
          type = "bind"
          target = "/host"
          source = "/"
          readonly=false
        }
        
        # if you run into a scenario where your iscsi volumes are zeroed each time they are mounted,
        # you can try uncommenting the following additional mount block:
        mount {
          type     = "bind"
          target   = "/run/udev"
          source   = "/run/udev"
          readonly = true
        }
      }

      template {
        destination = "${NOMAD_TASK_DIR}/driver-config-file.yaml"

        data = <<EOH
driver: freenas-iscsi
instance_id:
httpConnection:
  protocol: https
  host: 192.168.50.208
  port: 443
  # use only 1 of apiKey or username/password
  # if both are present, apiKey is preferred
  # apiKey is only available starting in TrueNAS-12
  apiKey: ${var.truenas_api_key}
  username: iscsi-no
  password: "${var.truenas_iscsi_pass}"
  allowInsecure: true
  # use apiVersion 2 for TrueNAS-12 and up (will work on 11.x in some scenarios as well)
  # leave unset for auto-detection
  apiVersion: 2
sshConnection:
  host: 192.168.50.208
  port: 22
  username: root
  # use either password or key
  password: "${var.truenas_iscsi_pass}"
zfs:
  # can be used to override defaults if necessary
  # the example below is useful for TrueNAS 12
  #cli:
  #  sudoEnabled: true
  #
  #  leave paths unset for auto-detection
  #  paths:
  #    zfs: /usr/local/sbin/zfs
  #    zpool: /usr/local/sbin/zpool
  #    sudo: /usr/local/bin/sudo
  #    chroot: /usr/sbin/chroot
  
  # can be used to set arbitrary values on the dataset/zvol
  # can use handlebars templates with the parameters from the storage class/CO
  # TODO: set up handlebars templates to make this far more awesome
  #datasetProperties:
  #   "org.freenas:description": "created via democratic-csi"

  datasetParentName: ssd-vms0/nomad/vols
  # do NOT make datasetParentName and detachedSnapshotsDatasetParentName overlap
  # they may be siblings, but neither should be nested in the other
  detachedSnapshotsDatasetParentName: ssd-vms0/nomad/snaps
  zvolCompression: ""
  zvolDedupe: ""
  zvolEnableReservation: False
  zvolBlocksize: ""
iscsi:
  targetPortal: "192.168.50.208:3260"
  targetPortals: []
  interface:

  # MUST iensure uniqueness
  # full iqn limit is 223 bytes, plan accordingly
  # default is //template name isn't defined!
  #nameTemplate: "{ { parameters.[csi.storage.k8s.io/pvc/namespace] }}-{ { parameters.[csi.storage.k8s.io/pvc/name] }}"
  namePrefix: csi-
  nameSuffix: "-discovery"
  # add as many as needed
  targetGroups:
    # get the correct ID from the "portal" section in the UI
    - targetGroupPortalGroup: 1
      # get the correct ID from the "initiators" section in the UI
      targetGroupInitiatorGroup: 1
      # None, CHAP, or CHAP Mutual
      targetGroupAuthType: None
      # get the correct ID from the "Authorized Access" section of the UI
      # only required if using Chap
      #targetGroupAuthGroup:

  extentInsecureTpc: true
  extentXenCompat: false
  extentDisablePhysicalBlocksize: true
  # 512, 1024, 2048, or 4096,
  extentBlocksize: 512
  # "" (let FreeNAS decide, currently defaults to SSD), Unknown, SSD, 5400, 7200, 10000, 15000
  extentRpm: "SSD"
  # 0-100 (0 == ignore)
  extentAvailThreshold: 0
EOH
      }

      csi_plugin {
        # must match --csi-name arg
        id        = "org.democratic-csi.iscsi"
        type      = "node"
        mount_dir = "/csi"
      }

      resources {
        cpu    = 500
        memory = 128
      }
    }
  }
}

variable "ssh_id" {}
variable "truenas_api_key" {}
variable "truenas_iscsi_pass" {}


================================================
FILE: nomad_jobs/core-infra/keepalived/TODO.md
================================================
# Keepalived Improvements TODO

## Problem
The osixia/keepalived image uses environment variables (env.yaml) to generate keepalived.conf at startup. This doesn't support dynamic config reloads via SIGHUP because the conf isn't regenerated from env vars on signal.

Combined with Nomad templates that use `change_mode = "restart"` and dynamic Consul service lookups, this causes restart loops.

## Proposed Solution
Replace osixia/keepalived with plain keepalived using a direct config template:

```hcl
config {
  image = "osixia/keepalived:2.0.20"  # or alpine + keepalived
  volumes = [
    "local/keepalived.conf:/etc/keepalived/keepalived.conf"
  ]
}

template {
  destination = "local/keepalived.conf"
  change_mode = "signal"
  change_signal = "SIGHUP"
  data = <<EOH
vrrp_instance VI_1 {
  state BACKUP
  interface {{ sockaddr "GetPrivateInterfaces | include \"network\" \"192.168.50.0/24\" | attr \"name\"" }}
  virtual_router_id 51
  priority 100
  nopreempt
  virtual_ipaddress {
    192.168.50.50/24
  }
}
EOH
}
```

## Alternatives Considered
- **vip-manager** - lightweight, single purpose
- **kube-vip** - modern, supports ARP/BGP
- **ucarp** - simple CARP implementation

## Affected Jobs
- `nomad_jobs/core-infra/coredns/nomad.job` (keepalived-dns sidecar)
- `nomad_jobs/core-infra/traefik/nomad.job` (keepalived-traefik sidecar)


================================================
FILE: nomad_jobs/core-infra/keepalived/nomad.job
================================================
job "keepalived" {
  datacenters = ["dc1"]
  type        = "system"
  priority    = 100

  meta {
      job_file = "nomad_jobs/core-infra/keepalived/nomad.job"
version = "5"
  }

  group "keepalived" {

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "keepalived" {
      driver = "docker"
      config {
        image = "osixia/keepalived:2.3.4"
        network_mode = "host"
        volumes = [
            "local/:/container/environment/01-custom"
        ]
        cap_add = ["NET_ADMIN", "NET_BROADCAST", "NET_RAW"]
      }
      template {
        destination = "local/env.yaml"
        change_mode = "restart"
        splay       = "1m"
        data        = <<EOH
KEEPALIVED_VIRTUAL_IPS:
  - 192.168.50.2/24
  - 192.168.50.3/24
KEEPALIVED_UNICAST_PEERS:
{{- with $node := node -}}
{{ range nodes }}
{{- if ne .Address $node.Node.Address }}
  - {{ .Address }}
{{- end -}}
{{- end -}}
{{- end }}
KEEPALIVED_INTERFACE: {{ sockaddr "GetPrivateInterfaces | include \"network\" \"192.168.50.0/24\" | attr \"name\"" }}
EOH
      }
      resources {
        cpu    = 100
        memory = 32
      }
    }
  }
}


================================================
FILE: nomad_jobs/core-infra/nfs-csi-plugin/controller.job
================================================
job "plugin-nfs-controller" {
  
  meta {
  job_file = "nomad_jobs/core-infra/nfs-csi-plugin/controller.job"
  }
datacenters = ["dc1"]
  group "controller" {

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    task "plugin" {
      driver = "docker"
      config {
        image = "registry.k8s.io/sig-storage/nfsplugin:v4.13.2"
        args = [
          "--v=5",
          "--nodeid=${attr.unique.hostname}",
          "--endpoint=unix:///csi/csi.sock",
          "--drivername=nfs.csi.k8s.io"
        ]
      }
      csi_plugin {
        id        = "nfsofficial"
        type      = "controller"
        mount_dir = "/csi"
      }
      resources {
        memory = 128
        cpu    = 100
      }
    }
  }
}


================================================
FILE: nomad_jobs/core-infra/nfs-csi-plugin/nodes.job
================================================
job "plugin-nfs-nodes" {
  
  meta {
  job_file = "nomad_jobs/core-infra/nfs-csi-plugin/nodes.job"
  }
datacenters = ["dc1"]
  # you can run node plugins as service jobs as well, but this ensures
  # that all nodes in the DC have a copy.
  type = "system"
  group "nodes" {

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    task "plugin" {
      driver = "docker"
      config {
        image = "registry.k8s.io/sig-storage/nfsplugin:v4.13.2"
        args = [
          "--v=5",
          "--nodeid=${attr.unique.hostname}",
          "--endpoint=unix:///csi/csi.sock",
          "--drivername=nfs.csi.k8s.io"
        ]
        # node plugins must run as privileged jobs because they
        # mount disks to the host
        privileged = true
      }
      csi_plugin {
        id        = "nfsofficial"
        type      = "node"
        mount_dir = "/csi"
      }
      resources {
        memory = 64
        cpu = 100
      }
    }
  }
}


================================================
FILE: nomad_jobs/core-infra/pihole/nomad.job
================================================
job "pihole" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"
  priority    = 100

  meta {
      job_file = "nomad_jobs/core-infra/pihole/nomad.job"
version = "3"
  }

  constraint {
    attribute = "${meta.dns}"
    operator  = "="
    value     = "true"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "infra" {
    count = 1 

    network {
      port "dns" { 
        host_network = "lan"
        static = "8053" 
        to     = "53" 
      }
      port "web" { 
        host_network = "lan"
        to = "80" 
      }
    }

    volume "pihole" {
      type      = "csi"
      read_only = false
      source    = "pihole3"
      access_mode = "single-node-writer"
      attachment_mode = "file-system"
    }


    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "pihole" {
      driver = "docker"
      config {
        image = "pihole/pihole:2026.04.0"
        ports = ["dns", "web"]
        volumes = [
          "${var.shared_dir}pihole-dnsmasq:/etc/dnsmasq.d/",
        ]
      }

      volume_mount {
        volume      = "pihole"
        destination = "/etc/pihole"
        read_only   = false
      }

      service {
         tags = [
          "traefik.enable=true"
         ]
         name = "pihole"
	 provider = "consul"
         port = "web"
         check {
           type     = "tcp"
           interval = "10s"
           timeout  = "2s"
         }
      }

      env {
        TZ                             = "Europe/Amsterdam"
        FTLCONF_webserver_api_password = ""
        FTLCONF_dns_upstreams          = "8.8.8.8;1.1.1.1"
        FTLCONF_dns_listeningMode      = "ALL"
        FTLCONF_misc_etc_dnsmasq_d     = "true"
      }

      resources {
        cpu    = 300
        memory = 128
      }
    }
  }
}

variable "region" {}


variable "shared_dir" {}


================================================
FILE: nomad_jobs/core-infra/pihole/volume.hcl
================================================
id           = "pihole3"
external_id  = "pihole3"
name         = "pihole3"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "1GiB"
capacity_max = "1GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}


================================================
FILE: nomad_jobs/core-infra/smtp/nomad.job
================================================
job "smtp" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/core-infra/smtp/nomad.job"
version = "7"
  }

  group "mail" {
    count = 1 
    network {
      port "smtp" {
        host_network = "lan"
        static = "25"
      }
    }


    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "smtp" {
      driver = "docker"
      config {
        image = "ixdotai/smtp"
        network_mode = "host"
        ports = ["smtp"]
        force_pull = "true"
      }

      template {
data = <<EOH
MAILNAME=${var.tld}
RELAY_NETWORKS=:172.0.0.0/8:127.0.0.1/32:10.0.0.0/8:100.0.0.0/8:192.168.50.0/24
NET_DEV=enp2s0
DISABLE_IPV6=true
EOH
        destination = "local/env"
        env         = true
      }

      service {
        port = "smtp"
	name = "smtp"
        check {
          type     = "tcp"
          interval = "10s"
          timeout  = "2s"
        }
      }

      resources {
        cpu    = 100
        memory = 32
      }
    }
  }
}

variable "region" {
    type = string
}

variable "tld" {
    type = string
}

variable "shared_dir" {
    type = string
}


================================================
FILE: nomad_jobs/core-infra/tailscale/nomad.job
================================================
job "tailscale" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/core-infra/tailscale/nomad.job"
      version = "6"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "networking" {
    count = 1 

    volume "tailscale" {
      type      = "csi"
      read_only = false

      source    = "tailscale2"
      access_mode = "single-node-writer"
      attachment_mode = "file-system"
    }


    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "tailscale" {
      driver = "docker"
      config {
        image = "tailscale/tailscale:v1.96.5"
        network_mode = "host"
        force_pull = "true"
        privileged = true
        cap_add = ["NET_ADMIN", "NET_RAW"]
	volumes = [
          "/dev/net/tun:/dev/net/tun",
	]
      }

      volume_mount {
        volume      = "tailscale"
        destination = "/var/lib/tailscale"
        read_only   = false
      }

      template {
data = <<EOH
TS_HOSTNAME="home-gateway"
TS_ROUTES="192.168.50.0/24"
TS_AUTHKEY="${var.tailscale_auth}"
TS_STATE_DIR="/var/lib/tailscale/tailscaled.state"
TS_USERSPACE="true"
TS_EXTRA_ARGS="--reset --advertise-tags=tag:nomad"
EOH
      destination = "local/env"
      env         = true
      }

      resources {
        cpu    = 200
        memory = 128
      }
    }
  }
}

variable "region" {
    type = string
}

variable "tld" {
    type = string
}

variable "shared_dir" {
    type = string
}

variable "tailscale_auth" {}


================================================
FILE: nomad_jobs/core-infra/tailscale/volume.hcl
================================================
id           = "tailscale2"
external_id  = "tailscale2"
name         = "tailscale2"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "1GiB"
capacity_max = "1GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}


================================================
FILE: nomad_jobs/core-infra/tailscale-este/nomad.job
================================================
job "tailscale-este" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/core-infra/tailscale-este/nomad.job"
version = "3"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "networking" {
    count = 1 

    volume "tailscale-este" {
      type      = "csi"
      read_only = false

      source    = "tailscale-este"
      access_mode = "single-node-writer"
      attachment_mode = "file-system"
    }


    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "tailscale" {
      driver = "docker"
      config {
        image = "tailscale/tailscale:v1.96.5"
        entrypoint = ["/local/start.sh"]
        network_mode = "host"
        force_pull = "true"
        privileged = true
        cap_add = ["NET_ADMIN", "NET_RAW"]
	volumes = [
          "/dev/net/tun:/dev/net/tun",
	]
      }

      volume_mount {
        volume      = "tailscale-este"
        destination = "/var/lib/tailscale"
        read_only   = false
      }

      template {
data = <<EOH
#!/bin/sh

function up() {
    until /usr/local/bin/tailscale up --snat-subnet-routes=false --auth-key="${var.tailscale_auth_este}" --advertise-routes="192.168.50.0/24" --hostname="este-gateway"
    do
        sleep 0.1
    done

}

# send this function into the background
up &

exec tailscaled --tun=userspace-networking --statedir="/var/lib/tailscale/tailscaled.state"
EOH
        destination = "local/start.sh"
        env         = false
        perms       = 755
      }

      resources {
        cpu    = 200
        memory = 128
      }
    }
  }
}

variable "region" {
    type = string
}


variable "tld" {
    type = string
}

variable "shared_dir" {
    type = string
}

variable "tailscale_auth_este" {}


================================================
FILE: nomad_jobs/core-infra/tailscale-este/volume.hcl
================================================
id           = "tailscale-este"
external_id  = "tailscale-este"
name         = "tailscale-este"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "1GiB"
capacity_max = "1GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}


================================================
FILE: nomad_jobs/core-infra/traefik/config/consul-catalog.yml
================================================
# Enable Rancher Provider.
providers:
  consulcatalog:

    # Expose Consul Catalog services by default in Traefik.
    exposedByDefault: true

    # Defines the consul address endpoint.
    address: 127.0.0.1:8500

    # Defines the scheme used.
    scheme: "foobar"

    # Defines the DC.
    datacenter: "foobar"

    # Defines the token.
    token: "foobar"

    # Defines the expoint wait time.
    endpointWaitTime: "15s"

    # Defines Consul Catalog Provider TLS endpoint.
    endpoint:
      tls:

        # Defines Consul Catalog Provider endpoint.
        caOptional: true
        cert: "foobar"
        key: "foobar"
        insecureSkipVerify: true


================================================
FILE: nomad_jobs/core-infra/traefik/config/consul.yml
================================================
# Enable Rancher Provider.
providers:
  consulcatalog:

    # Expose Consul Catalog services by default in Traefik.
    exposedByDefault: true

    # Defines the consul address endpoint.
    address: 127.0.0.1:8500

    # Defines the scheme used.
    scheme: "foobar"

    # Defines the DC.
    datacenter: "foobar"

    # Defines the token.
    token: "foobar"

    # Defines the expoint wait time.
    endpointWaitTime: "15s"

    # Defines Consul Catalog Provider TLS endpoint.
    endpoint:
      tls:

        # Defines Consul Catalog Provider endpoint.
        caOptional: true
        cert: "foobar"
        key: "foobar"
        insecureSkipVerify: true


================================================
FILE: nomad_jobs/core-infra/traefik/config/traefik.toml
================================================
################################################################
#
# Configuration sample for Traefik v2.
#
# For Traefik v1: https://github.com/containous/traefik/blob/v1.7/traefik.sample.toml
#
################################################################

################################################################
# Global configuration
################################################################
[global]
  checkNewVersion = false
  sendAnonymousUsage = false

################################################################
# Entrypoints configuration
################################################################

# Entrypoints definition
#
# Optional
# Default:
[entryPoints]
  [entryPoints.web]
    address = "0.0.0.0:80"

  [entryPoints.traefik]
    address = "0.0.0.0:9001"

  [entryPoints.websecure]
    address = "0.0.0.0:443"

[http.middlewares]
  [http.middlewares.https-redirect.redirectscheme]
    scheme = "https"

[certificatesResolvers.sample.acme]
  email = "me@you.com"
  storage = "acme.json"
  [certificatesResolvers.sample.acme.httpChallenge]
    # used during the challenge
    entryPoint = "web"

################################################################
# ServersTransports for HTTPS backends with self-signed certs
################################################################
[serversTransports.insecure-skip-verify]
  insecureSkipVerify = true


################################################################
# Traefik logs configuration
################################################################

# Traefik logs
# Enabled by default and log to stdout
#
# Optional
#
[log]

  # Log level
  #
  # Optional
  # Default: "ERROR"
  #
  # level = "DEBUG"

  # Sets the filepath for the traefik log. If not specified, stdout will be used.
  # Intermediate directories are created if necessary.
  #
  # Optional
  # Default: os.Stdout
  #
  # filePath = "log/traefik.log"

  # Format is either "json" or "common".
  #
  # Optional
  # Default: "common"
  #
  # format = "json"

################################################################
# Access logs configuration
################################################################

# Enable access logs
# By default it will write to stdout and produce logs in the textual
# Common Log Format (CLF), extended with additional fields.
#
# Optional
#
# [accessLog]

  # Sets the file path for the access log. If not specified, stdout will be used.
  # Intermediate directories are created if necessary.
  #
  # Optional
  # Default: os.Stdout
  #
  # filePath = "/path/to/log/log.txt"

  # Format is either "json" or "common".
  #
  # Optional
  # Default: "common"
  #
  # format = "json"

################################################################
# API and dashboard configuration
################################################################

# Enable API and dashboard
[api]

  # Name of the related entry point
  #
  # Optional
  # Default: "traefik"
  #
  # entryPoint = "traefik"

  # Enabled Dashboard
  #
  # Optional
  # Default: true
  #
  dashboard = true
  insecure = true
################################################################
# Ping configuration
################################################################

# Enable ping
[ping]

  # Name of the related entry point
  #
  # Optional
  # Default: "traefik"
  #
  # entryPoint = "traefik"

################################################################
# Docker configuration backend
################################################################

# Enable Docker configuration backend
#[providers.docker]

  # Docker server endpoint. Can be a tcp or a unix socket endpoint.
  #
  # Required
  # Default: "unix:///var/run/docker.sock"
  #
  # endpoint = "tcp://10.10.10.10:2375"

  # Default host rule.
  #
  # Optional
  # Default: "Host(`{{ normalize .Name }}`)"
  #
  # defaultRule = "Host(`{{ normalize .Name }}.docker.localhost`)"

  # Expose containers by default in traefik
  #
  # Optional
  # Default: true
  #
  # exposedByDefault = false

# Enable Consul Catalog Provider.
[providers.consulcatalog]

  # Expose Consul Catalog services by default in Traefik.
  exposedByDefault = false

  # Prefix used for accessing the Consul service metadata.
  prefix = "traefik"

  # Defines the polling interval (in seconds).
  #refreshSeconds = 15

  # Defines default rule.
  defaultRule = "Host(`{{ .Name }}.stuck-in-blue.com`)"

  # Includes only containers having a label with key `a.label.name` and value `foo`
  #constraints = "Label(`a.label.name`, `foo`)"
  # Defines Consul Catalog Provider endpoint.
  [providers.consulcatalog.endpoint]

    # Defines the consul address endpoint.
    address = "127.0.0.1:8500"

    # Defines the scheme used.
    scheme = "https"

    # Defines the DC.
    datacenter = "home"

    # Defines the token.
    #token = "foobar"

    # Defines the expoint wait time.
    endpointWaitTime = "15s"

#    [providers.consulCatalog.endpoint.tls]
#      ca = "/etc/consul.d/homelab-agent-ca.pem"
#      cert = "/etc/consul.d/hetzner-server-homelab-0.pem"
#      key = "/etc/consul.d/hetzner-server-homelab-0-key.pem"

#[file]
#
## rules
#[backends]
#  [backends.sabnzbd]
#    [backends.sabnzbd.servers.server1]
#    url = "http://127.0.0.1:8080"
#    weight = 10
#    extractorfunc = "request.host"
#
#[frontends]
#  [frontends.sabnzbd]
#  backend = "sabnzbd"
#    [frontends.sabnzbd.routes.sab]
#    rule = "Host:sab.nolab.xyz"


================================================
FILE: nomad_jobs/core-infra/traefik/config/traefik.toml.new
================================================
################################################################
#
# Configuration sample for Traefik v2.
#
# For Traefik v1: https://github.com/containous/traefik/blob/v1.7/traefik.sample.toml
#
################################################################

################################################################
# Global configuration
################################################################
[global]
  checkNewVersion = false
  sendAnonymousUsage = false

################################################################
# Entrypoints configuration
################################################################

# Entrypoints definition
#
# Optional
# Default:
[entryPoints]
  [entryPoints.grpc]
    address = ":7576"

  [entryPoints.traefik]
    address = ":9009"

################################################################
# Traefik logs configuration
################################################################

# Traefik logs
# Enabled by default and log to stdout
#
# Optional
#
[log]

  # Log level
  #
  # Optional
  # Default: "ERROR"
  #
  # level = "DEBUG"

  # Sets the filepath for the traefik log. If not specified, stdout will be used.
  # Intermediate directories are created if necessary.
  #
  # Optional
  # Default: os.Stdout
  #
  # filePath = "log/traefik.log"

  # Format is either "json" or "common".
  #
  # Optional
  # Default: "common"
  #
  # format = "json"

################################################################
# Access logs configuration
################################################################

# Enable access logs
# By default it will write to stdout and produce logs in the textual
# Common Log Format (CLF), extended with additional fields.
#
# Optional
#
# [accessLog]

  # Sets the file path for the access log. If not specified, stdout will be used.
  # Intermediate directories are created if necessary.
  #
  # Optional
  # Default: os.Stdout
  #
  # filePath = "/path/to/log/log.txt"

  # Format is either "json" or "common".
  #
  # Optional
  # Default: "common"
  #
  # format = "json"

################################################################
# API and dashboard configuration
################################################################

# Enable API and dashboard
[api]

  # Name of the related entry point
  #
  # Optional
  # Default: "traefik"
  #
  # entryPoint = "traefik"

  # Enabled Dashboard
  #
  # Optional
  # Default: true
  #
  # dashboard = false
  insecure = true
################################################################
# Ping configuration
################################################################

# Enable ping
[ping]

  # Name of the related entry point
  #
  # Optional
  # Default: "traefik"
  #
  # entryPoint = "traefik"

################################################################
# Docker configuration backend
################################################################

# Enable Docker configuration backend
#[providers.docker]

  # Docker server endpoint. Can be a tcp or a unix socket endpoint.
  #
  # Required
  # Default: "unix:///var/run/docker.sock"
  #
  # endpoint = "tcp://10.10.10.10:2375"

  # Default host rule.
  #
  # Optional
  # Default: "Host(`{{ normalize .Name }}`)"
  #
  # defaultRule = "Host(`{{ normalize .Name }}.docker.localhost`)"

  # Expose containers by default in traefik
  #
  # Optional
  # Default: true
  #
  # exposedByDefault = false

# Enable Consul Catalog Provider.
[providers.consulcatalog]

  # Expose Consul Catalog services by default in Traefik.
  exposedByDefault = false

  # Prefix used for accessing the Consul service metadata.
  prefix = "traefik"

  # Defines the polling interval (in seconds).
  #refreshSeconds = 15

  # Defines default rule.
  defaultRule = "Host(`{{ .Name }}.stage.dus.tcs.trv.cloud`)"

  # Includes only containers having a label with key `a.label.name` and value `foo`
  #constraints = "Label(`a.label.name`, `foo`)"
  # Defines Consul Catalog Provider endpoint.
  [providers.consulcatalog.endpoint]

    # Defines the consul address endpoint.
    address = "127.0.0.1:8500"

    # Defines the scheme used.
    scheme = "http"

    # Defines the DC.
    datacenter = "dus"

    # Defines the token.
    #token = "foobar"

    # Defines the expoint wait time.
    endpointWaitTime = "15s"


================================================
FILE: nomad_jobs/core-infra/traefik/config/traefik.toml.test
================================================
################################################################
# Entrypoints configuration
################################################################
# Entrypoints definition
#
defaultEntryPoints = ["https"]

[entryPoints]
  [entryPoints.admin]
  address = "10.90.80.120:6062"
  [entryPoints.http]
  address = "78.94.59.116:80"
    [entryPoints.http.redirect]
    entryPoint = "https"
  [entryPoints.https]
  address = ":443"
  [entryPoints.https.tls]

[acme]
email = "perry@stuck-in-blue.com"
storage = "acme.json"
#caServer = "https://acme-staging-v02.api.letsencrypt.org/directory"
caServer = "https://acme-v02.api.letsencrypt.org/directory"
entryPoint = "https"
[acme.httpChallenge]
entryPoint = "http"
[acme.dnsChallenge]
  provider = "gcloud"
  delayBeforeCheck = 0

[[acme.domains]]
  main = "*.nolab.xyz"
  sans = ["nolab.xyz"]

################################################################
# Traefik logs configuration
################################################################
# Enable logs
# By default it will write to stdout
[traefikLog]

################################################################
# Access logs configuration
################################################################
# Enable access logs
# By default it will write to stdout and produce logs in the textual
# Common Log Format (CLF), extended with additional fields.

[accessLog]

################################################################
# Metrics configuration
################################################################
[metrics]
  [metrics.prometheus]
    entryPoint = "admin"

################################################################
# API and dashboard configuration
################################################################
# Enable API and dashboard
[api]
  entryPoint = "admin"
  [api.statistics]
    recentErrors = 100
################################################################
# Ping configuration
################################################################
# Enable ping
[ping]
  entryPoint = "admin"
################################################################
# Consul Catalog Provider
################################################################
[consulCatalog]
endpoint = "{{ env "NOMAD_IP_https" }}:8500"
stale = true
prefix = "traefik"
domain = "holab.io"
#filename = "/usr/local/etc/traefik/consul.toml"
#templateVersion = 2


================================================
FILE: nomad_jobs/core-infra/traefik/nomad.job
================================================
job "traefik" {
  region = var.region
  datacenters = ["dc1"]
  type = "service"
  meta {
      job_file = "nomad_jobs/core-infra/traefik/nomad.job"
      version = "12"  // HA: run 2 instances with keepalived failover
  }

  group "lbs" {
    count = 2

    constraint {
      operator = "distinct_hosts"
      value    = "true"
    }

    network {
      port "http" {
        host_network = "lan"
        static = "80"
      }
      port "admin" {
        host_network = "lan"
        static = "9002"
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
      auto_promote     = true
      canary           = 2
    }

    task "keepalived-traefik" {
      driver = "docker"

      lifecycle {
        hook = "prestart"
        sidecar = true
      }

      config {
        image = "osixia/keepalived:2.3.4"
        network_mode = "host"
        force_pull = false
        volumes = [
          "local/keepalived.conf:/etc/keepalived/keepalived.conf"
        ]
        cap_add = ["NET_ADMIN", "NET_BROADCAST", "NET_RAW"]
      }

      template {
        destination = "local/keepalived.conf"
        change_mode = "restart"
        splay       = "1m"
        data        = <<EOH
vrrp_instance VI_1 {
    state BACKUP
    interface {{ sockaddr "GetPrivateInterfaces | include \"network\" \"192.168.50.0/24\" | attr \"name\"" }}
    virtual_router_id 50
    priority 100
    advert_int 1

    use_vmac vrrp.50
    vmac_xmit_base

    unicast_peer {
{{- range service "traefik-web" }}
        {{ .Address }}
{{- end }}
    }

    virtual_ipaddress {
        192.168.50.20/24
    }
}
EOH
      }

      resources {
        cpu    = 100
        memory = 64
      }
    }

    task "traefik" {
      driver = "docker"
      service {
        name = "traefik-web"
        port = "http"
      }
      service {
        name = "traefik"
        port = "admin"
        tags = [
          "metrics"
        ]
        check {
          type     = "tcp"
          interval = "10s"
          timeout  = "2s"
        }
      }

      config {
        image = "traefik:v3.6"
        ports = ["http", "admin"]
        network_mode = "host"
        volumes = [
          "local/traefik.toml:/etc/traefik/traefik.toml",
          "local/dynamic-config.toml:/etc/traefik/dynamic/dynamic-config.toml",
          "local/servers-transport.toml:/etc/traefik/dynamic/servers-transport.toml",
          "${var.shared_dir}traefik-ingress/acme.json:/acme.json",
          "${var.shared_dir}traefik-ingress/dynamic-whitelist.toml:/etc/traefik/dynamic/dynamic-whitelist.toml",
        ]
      }

      template {
data = <<EOH
[global]
  checkNewVersion = false
  sendAnonymousUsage = false

[metrics]
  [metrics.prometheus]

[entryPoints]
  [entryPoints.web]
    address = ":80"
    # No entrypoint middleware - applied at router level to allow ACME challenges

  [entryPoints.websecure]
    address = ":443"
    [entryPoints.websecure.http]
        middlewares=["home-ip-whitelist@file"]
    [entryPoints.websecure.http.tls]
      certResolver = "letsencrypt"

  [entryPoints.traefik]
    address = ":9002"

[tls.options]
  [tls.options.TLSOptions]
    minVersion = "VersionTLS12"
    sniStrict = true

[accessLog]
  format = "json"

[log]

[api]
  dashboard = true
  insecure = true  # Enable direct access on :9002 (protected by local network)

[ping]

[providers.consulcatalog]
  exposedByDefault = false
  prefix = "traefik"
  defaultRule = "Host(`{{ .Name }}.${var.tld}`)"

  [providers.consulcatalog.endpoint]
    address = "{{{ env "NOMAD_IP_http" }}}:8500"
    scheme = "http"
    datacenter = "homelab"
    endpointWaitTime = "15s"

[certificatesResolvers.letsencrypt.acme]
  email = "me@you.com"
  storage = "acme.json"
  [certificatesResolvers.letsencrypt.acme.httpChallenge]
    entryPoint = "web"

[providers.file]
  directory = "/etc/traefik/dynamic"
  watch = true
EOH
        destination = "local/traefik.toml"
        env         = false
        change_mode = "noop"
        left_delimiter = "{{{"
        right_delimiter = "}}}"
      }

      template {
data = <<EOH
[http.middlewares]
  [http.middlewares.allow-local-network.ipWhiteList]
    sourceRange = ["192.168.50.0/24", "10.0.0.0/16"]  # Local network only

  [http.middlewares.basic-auth.basicAuth]
    users = [
      "admin:$apr1$Ht8D2P1z$7QOq2s8xKUomI1cM.rFJX/" # Replace with an htpasswd-generated hash
    ]
    realm = "Restricted Area"


  [http.middlewares.ip-or-auth.chain]
    middlewares = ["home-ip-whitelist@file", "allow-local-network", "basic-auth"]

  [http.middlewares.redirect-to-https.redirectScheme]
    scheme = "https"
    permanent = true

  [http.middlewares.whitelist-then-redirect.chain]
    middlewares = ["home-ip-whitelist@file", "redirect-to-https"]

[http.routers]
  # Redirect HTTP to HTTPS except for ACME challenges - apply whitelist first
  [http.routers.http-redirect]
    entryPoints = ["web"]
    rule = "PathPrefix(`/`) && !PathPrefix(`/.well-known/acme-challenge/`)"
    middlewares = ["whitelist-then-redirect"]
    service = "noop@internal"
    priority = 1000

  [http.routers.https-local]
    entryPoints = ["websecure"]
    rule = "HostRegexp(`{any:.+}`)"  # Matches any domain
    middlewares = ["home-ip-whitelist@file"]
    service = "beefcake"
    [http.routers.https-local.tls]

[http.services]
  [http.services.beefcake.loadBalancer]
    [[http.services.beefcake.loadBalancer.servers]]
      url = "http://192.168.50.208:80"
EOH
        destination = "local/dynamic-config.toml"
        env         = false
        change_mode = "noop"
      }

      template {
        data = <<EOH
# ServersTransport for HTTPS backends with self-signed certificates
[http.serversTransports]
  [http.serversTransports.insecure-skip-verify]
    insecureSkipVerify = true
EOH
        destination = "local/servers-transport.toml"
        env         = false
        change_mode = "noop"
      }

      resources {
        cpu = 100
        memory = 256
      }
    }
  }
}

variable "region" {
    type = string
}

variable "tld" {
    type = string
}

variable "shared_dir" {
    type = string
}

variable "ingress_ip" {
    type = string
}


================================================
FILE: nomad_jobs/core-infra/traefik-forward-auth/nomad.job
================================================
job "traefik-forward-auth" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/core-infra/traefik-forward-auth/nomad.job"
version = "4"
  }

  group "downloaders" {
    count = 1 
    network {
      port "http" {
        host_network = "tailscale"
        static = "4181"
      }

    }


    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "auth" {
      driver = "docker"
      config {
        image = "ghcr.io/jordemort/traefik-forward-auth:latest"
        ports = ["http"]
      }

      env {
        PROVIDERS_GOOGLE_CLIENT_ID     = "${var.oauth_client_id}"
        PROVIDERS_GOOGLE_CLIENT_SECRET = "${var.oauth_client_secret}"
        SECRET                         = "${var.oauth_secret}"
        AUTH_HOST                      = "auth.${var.tld}"
        COOKIE_DOMAIN                  = "${var.tld}"
        WHITELIST                      = "${var.oauth_emails}"
        LOG_LEVEL                      = "debug"
        URL_PATH                       = "/_oauth"
        DEFAULT_ACTION                 = "auth"
        INSECURE_COOKIE                = "false"
        CONFIG                         = "local/config"
	TRUSTED_IP_ADDRESS	       = "86.111.155.199/32,86.111.152.230/32,89.246.171.154/32,86.111.155.93/32"
      }

      service {
        port = "http"
	name = "traefik-forward-auth"
        tags = [
          "traefik.enable=true",
          "traefik.http.routers.auth.rule=Host(`auth.${var.tld}`)",
          "traefik.http.routers.auth.entrypoints=websecure",
          "traefik.http.routers.auth.tls=true",
          "traefik.http.routers.${NOMAD_TASK_NAME}_insecure.rule=Host(`auth.${var.tld}`)",
          "traefik.http.routers.auth.tls.domains[0].main=${var.tld}",
          "traefik.http.routers.auth.tls.domains[0].sans=*.${var.tld}",
          "traefik.http.routers.auth.rule=Host(`auth.${var.tld}`)",
          "traefik.http.routers.auth.rule=Path(`/_oauth`)",
          "traefik.http.middlewares.forward-auth.forwardauth.address=http://${NOMAD_IP_http}:${NOMAD_PORT_http}/",
          "traefik.http.middlewares.forward-auth.forwardauth.trustForwardHeader=true",
          "traefik.http.middlewares.forward-auth.forwardauth.authResponseHeaders=X-Forwarded-User",
          "traefik.http.routers.auth.middlewares=forward-auth"
        ]
        check {
          type     = "tcp"
          interval = "10s"
          timeout  = "2s"
        }
      }

      template {
data = <<EOH
rule.sabnzbd.action = allow
rule.sabnzbd.rule = PathPrefix(`/sabnzbd/api`)
EOH
        destination = "local/config"
        env         = false
      }

      resources {
        cpu    = 100
        memory = 256
      }
    }
  }
}

variable "region" {}
variable "tld" {}
variable "oauth_client_id" {}
variable "oauth_client_secret" {}
variable "oauth_secret" {}
variable "oauth_emails" {}


================================================
FILE: nomad_jobs/core-infra/vault/secrets_template.yaml
================================================
backends:
- type: generic
  path: secret
  description: secrets

secrets:
  - path: /secret/homelab/couchpotato
    values:
      apikey: ${COUCHPOTATO_APIKEY}
      username: ${COUCHPOTATO_USERNAME}
      password: ${COUCHPOTATO_PASS}
      host: ${COUCHPOTATO_HOST}

  - path: /secret/homelab/plex
    values:
      auth_token: ${PLEX_AUTHTOKEN}
      host: ${PLEX_HOST}

  - path: /secret/external/pushover
    values:
      api_key: ${PUSHOVER_APIKEY}
      user_key: ${PUSHOVER_USERKEY}

  - path: /secret/external/newsnab
    values:
      api: ${NEWSNAB_API}
      host: ${NEWSNAB_HOST}

  - path: /secret/homelab/mqtt-pub
    values:
      remote_username: ${MQTTPUB_REMOTE_USERNAME}
      remote_password: ${MQTTPUB_REMOTE_PASSWORD}
      address: ${MQTTPUB_ADDRESS}

  - path: /secret/homelab/sonarr
    values:
      api: ${SONAR_API}
      host: ${SONAR_HOST}

  - path: /secret/homelab/sabnzbd
    values:
      api: ${SABNZBD_API}
      host: ${SABNZBD_HOST}

  - path: /secret/homelab/asuswrt
    values:
      username: ${ASUSWRT_USER}
      password: ${ASUSWRT_PASS}
      host: ${ASUSWRT_HOST}

  - path: /secret/homelab/sabnzbd
    values:
      api: ${SABNZBD_API}
      host: ${SABNZBD_HOST}

  - path: /secret/external/github
    values:
      token: ${GITHUB_TOKEN}


================================================
FILE: nomad_jobs/gaming/minecraft-1.21/nomad.job
================================================
job "minecraft-1-21" {
  region      = var.region
  datacenters = ["minecraft"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/gaming/minecraft-1.21/nomad.job"
    version  = "2"
  }

  group "minecraft" {
    count = 1

    network {
      port "minecraft" {
        host_network = "lan"
        static       = 25568
        to           = 25565
      }
      port "query" {
        host_network = "lan"
        static       = 25569
        to           = 25565
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "minecraft-server" {
      driver = "docker"

      config {
        image        = "itzg/minecraft-server:2026.4.1"
        force_pull   = false
        network_mode = "host"

        volumes = [
          "/root/minecraft-1.21.10/data:/data",
          "/root/minecraft-1.21.10/config:/config",
        ]
      }

      env {
        EULA                          = "TRUE"
        VERSION                       = "1.21.10"
        TYPE                          = "FABRIC"
        INIT_MEMORY                   = "2G"
        MAX_MEMORY                    = "8G"
        MOTD                          = "Minecraft 1.21.10 Fabric Server"
        DIFFICULTY                    = "peaceful"
        MAX_PLAYERS                   = "20"
        VIEW_DISTANCE                 = "10"
        SIMULATION_DISTANCE           = "8"
        SPAWN_PROTECTION              = "16"
        ONLINE_MODE                   = "false"
        ENABLE_WHITELIST              = "false"
        SERVER_PORT                   = "25568"
        ENABLE_QUERY                  = "true"
        QUERY_PORT                    = "25568"
        NETWORK_COMPRESSION_THRESHOLD = "512"
        ENABLE_AUTOPAUSE              = "FALSE"
        PAUSE_WHEN_EMPTY_SECONDS      = "0"
        REMOVE_OLD_MODS               = "true"
        MODRINTH_PROJECTS             = "axiom\nfabric-api\ncloth-config\ndistanthorizons\nbalm\nferrite-core\nwaystones\ncarry-on\nbeautify-refabricated\nmacaws-furniture\nmacaws-trapdoors\nmore-decorative-blocks\nblackwolf-library"
        MODRINTH_ALLOWED_VERSION_TYPE = "beta"
        OPS                           = "perry,hannah,Perry,Steve5leon"
        JVM_OPTS                      = "-XX:+UseG1GC -XX:+ParallelRefProcEnabled -XX:MaxGCPauseMillis=100 -XX:+UnlockExperimentalVMOptions -XX:+DisableExplicitGC -XX:+AlwaysPreTouch -XX:+UseStringDeduplication -XX:G1NewSizePercent=30 -XX:G1MaxNewSizePercent=40 -XX:G1HeapRegionSize=8M -XX:G1ReservePercent=20 -XX:InitiatingHeapOccupancyPercent=20 -XX:G1MixedGCLiveThresholdPercent=90 -XX:SurvivorRatio=32 -XX:MaxTenuringThreshold=1"
      }

      service {
        name = "minecraft-1-21"
        port = "minecraft"
        tags = ["minecraft", "gaming", "1.21"]

        check {
          type     = "tcp"
          interval = "30s"
          timeout  = "5s"
        }
      }

      resources {
        cpu        = 4000
        memory     = 3072
        memory_max = 9728
      }
    }
  }
}

variable "region" {
  type = string
}


================================================
FILE: nomad_jobs/gaming/minecraft-avaritia/nomad.job
================================================
job "minecraft-avaritia" {
  region      = var.region
  datacenters = ["minecraft"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/gaming/minecraft-avaritia/nomad.job"
    version  = "1"
  }

  group "minecraft" {
    count = 1

    network {
      port "minecraft" {
        host_network = "lan"
        static       = 25571
        to           = 25565
      }
    }

    restart {
      attempts = 2
      delay    = "120s"
      interval = "30m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "minecraft-server" {
      driver = "docker"

      config {
        image        = "itzg/minecraft-server:2026.4.1"
        force_pull   = false
        network_mode = "host"

        volumes = [
          "/root/minecraft-avaritia/data:/data",
        ]
      }

      env {
        EULA                          = "TRUE"
        VERSION                       = "1.20.1"
        TYPE                          = "FORGE"
        INIT_MEMORY                   = "2G"
        MAX_MEMORY                    = "8G"
        MOTD                          = "Avaritia Modded Server (1.20.1)"
        MODE                          = "creative"
        DIFFICULTY                    = "normal"
        MAX_PLAYERS                   = "20"
        VIEW_DISTANCE                 = "10"
        SIMULATION_DISTANCE           = "8"
        SPAWN_PROTECTION              = "16"
        ONLINE_MODE                   = "false"
        ENABLE_WHITELIST              = "false"
        SERVER_PORT                   = "25571"
        ENABLE_QUERY                  = "true"
        QUERY_PORT                    = "25571"
        NETWORK_COMPRESSION_THRESHOLD = "512"
        FORCE_GAMEMODE                = "true"
        ENABLE_COMMAND_BLOCK          = "true"
        OPS                           = "perry,hannah,Perry"
        MAX_TICK_TIME                 = "-1"
        ENABLE_RCON                   = "true"
        RCON_PORT                     = "25572"
        RCON_PASSWORD                 = "minecraft"
        CREATE_CONSOLE_IN_PIPE        = "true"
        JVM_OPTS                      = "-XX:+UseG1GC -XX:+ParallelRefProcEnabled -XX:MaxGCPauseMillis=100 -XX:+UnlockExperimentalVMOptions -XX:+DisableExplicitGC -XX:+AlwaysPreTouch -XX:+UseStringDeduplication -XX:G1NewSizePercent=30 -XX:G1MaxNewSizePercent=40 -XX:G1HeapRegionSize=8M -XX:G1ReservePercent=20 -XX:InitiatingHeapOccupancyPercent=20 -XX:G1MixedGCLiveThresholdPercent=90 -XX:SurvivorRatio=32 -XX:MaxTenuringThreshold=1 -XX:G1PeriodicGCInterval=15000 -XX:G1PeriodicGCSystemLoadThreshold=0.0"
        MODRINTH_PROJECTS             = "remorphed\nwoodwalkers\ncrafted-core"
        CURSEFORGE_FILES              = "re-avaritia\nluckytnt\nlucky-tnt-lib\npehkui\nterrablender\nbiomes-o-plenty\noh-the-biomes-weve-gone\nterralith\ntectonic\nlithostitched\noh-the-trees-youll-grow\njei\njourneymap\nwaystones\nembeddium\ngeckolib\narchitectury-api\nglitchcore\ncorgilib\nbalm"
        CF_API_KEY                    = "${var.curseforge_api_key}"
      }

      service {
        name = "minecraft-avaritia"
        port = "minecraft"
        tags = ["minecraft", "gaming", "avaritia", "modded"]

        check {
          type     = "tcp"
          interval = "30s"
          timeout  = "5s"
        }
      }

      resources {
        cpu        = 4000
        memory     = 3072
        memory_max = 9728
      }
    }
  }
}

variable "region" {
  type = string
}

variable "curseforge_api_key" {
  type    = string
  default = ""
}


================================================
FILE: nomad_jobs/gaming/minecraft-axiom/nomad.job
================================================
job "minecraft-axiom" {
  region      = var.region
  datacenters = ["minecraft"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/gaming/minecraft-axiom/nomad.job"
    version  = "2"  // Added forge-config-api-port dependency
  }

  group "minecraft" {
    count = 1

    network {
      port "minecraft" {
        host_network = "lan"
        static       = 25566
        to           = 25565
      }
      port "query" {
        host_network = "lan"
        static       = 25567
        to           = 25565
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "minecraft-server" {
      driver = "docker"

      config {
        image        = "itzg/minecraft-server:2026.4.1"
        force_pull   = false
        network_mode = "host"

        volumes = [
          "/root/minecraft_new/minecraft-fabric-server/data:/data",
          "/root/minecraft_new/minecraft-fabric-server/config:/config",
          "/root/minecraft_new/minecraft-fabric-server/mods:/mods",
        ]
      }

      env {
        EULA                          = "TRUE"
        VERSION                       = "1.20.1"
        TYPE                          = "FABRIC"
        FABRIC_LOADER_VERSION         = "0.17.2"
        INIT_MEMORY                   = "2G"
        MAX_MEMORY                    = "8G"
        MOTD                          = "Axiom Building Server (1.20.1)"
        MODE                          = "creative"
        DIFFICULTY                    = "easy"
        MAX_PLAYERS                   = "20"
        VIEW_DISTANCE                 = "10"
        SIMULATION_DISTANCE           = "8"
        SPAWN_PROTECTION              = "16"
        ONLINE_MODE                   = "false"
        ENABLE_WHITELIST              = "false"
        SERVER_PORT                   = "25566"
        ENABLE_QUERY                  = "true"
        QUERY_PORT                    = "25566"
        NETWORK_COMPRESSION_THRESHOLD = "512"
        FORCE_GAMEMODE                = "true"
        ENABLE_COMMAND_BLOCK          = "true"
        OPS                           = "perry,hannah,Perry"
        JVM_OPTS                      = "-XX:+UseG1GC -XX:+ParallelRefProcEnabled -XX:MaxGCPauseMillis=100 -XX:+UnlockExperimentalVMOptions -XX:+DisableExplicitGC -XX:+AlwaysPreTouch -XX:+UseStringDeduplication -XX:G1NewSizePercent=30 -XX:G1MaxNewSizePercent=40 -XX:G1HeapRegionSize=8M -XX:G1ReservePercent=20 -XX:InitiatingHeapOccupancyPercent=20 -XX:G1MixedGCLiveThresholdPercent=90 -XX:SurvivorRatio=32 -XX:MaxTenuringThreshold=1 -Dfabric.networkMaxPacketSize=16777216 -Dnetty.maxDirectMemory=0"
        MODRINTH_PROJECTS             = "axiom\nbeautify-refabricated\nchipped\necologics\ndecorative-blocks\nresourceful-lib\nathena-ctm\nconnected-glass\ndiagonal-fences\ndiagonal-walls\ndiagonal-windows\ndouble-doors\nsupplementaries\nhandcrafted\nmacaws-fences-and-walls\nmacaws-windows\nmacaws-bridges\nmacaws-roofs\nfairy-lights-fabric\nimmediatelyfast\nmacaws-doors\nmacaws-furniture\nmacaws-paths-and-pavings\nmacaws-stairs\nmacaws-paintings\nmacaws-trapdoors\nmacaws-lights-and-lamps\nmoonlight\nstarlight\npuzzles-lib\ncollective\nregions-unexplored\ntwigs\nforge-config-api-port"
        CURSEFORGE_FILES              = "grass-overhaul\nfabric-api\nfusion-connected-textures\narchitectury-api\nsodium\nlithium\ncloth-config\nworldedit\njourneymap\nxaeros-minimap\nwaystones\nbalm-fabric\nbiomes-o-plenty\ntectonic\nterralith\nsupermartijn642s-core-lib\noh-the-biomes-weve-gone\nglitchcore\nterrablender-fabric\ncorgilib\noh-the-trees-youll-grow\ngeckolib\nrefurbished-furniture\nframework"
        CF_API_KEY                    = "${var.curseforge_api_key}"
      }

      service {
        name = "minecraft-axiom"
        port = "minecraft"
        tags = ["minecraft", "gaming", "axiom"]

        check {
          type     = "tcp"
          interval = "30s"
          timeout  = "5s"
        }
      }

      resources {
        cpu        = 4000
        memory     = 3072
        memory_max = 9728
      }
    }
  }
}

variable "region" {
  type = string
}

variable "curseforge_api_key" {
  type    = string
  default = ""
}


================================================
FILE: nomad_jobs/gaming/minecraft-fiskheroes/nomad.job
================================================
job "minecraft-fiskheroes" {
  region      = var.region
  datacenters = ["minecraft"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/gaming/minecraft-fiskheroes/nomad.job"
    version  = "1"
  }

  group "minecraft" {
    count = 1

    network {
      port "minecraft" {
        host_network = "lan"
        static       = 25570
        to           = 25565
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "minecraft-server" {
      driver = "docker"

      config {
        image        = "itzg/minecraft-server:java8"
        force_pull   = false
        network_mode = "host"

        volumes = [
          "/root/minecraft-fiskheroes/data:/data",
        ]
      }

      env {
        EULA                          = "TRUE"
        VERSION                       = "1.7.10"
        TYPE                          = "FORGE"
        FORGE_VERSION                 = "10.13.4.1614"
        MEMORY                        = "10G"
        SERVER_PORT                   = "25570"
        ENABLE_QUERY                  = "true"
        QUERY_PORT                    = "25570"
        MOTD                          = "Fisk Superheroes - New York City"
        MODE                          = "creative"
        DIFFICULTY                    = "peaceful"
        FORCE_GAMEMODE                = "true"
        MAX_PLAYERS                   = "20"
        VIEW_DISTANCE                 = "12"
        SIMULATION_DISTANCE           = "8"
        SPAWN_PROTECTION              = "0"
        ONLINE_MODE                   = "false"
        ENABLE_WHITELIST              = "false"
        ENABLE_COMMAND_BLOCK          = "true"
        OPS                           = "perry,hannah,Perry"
        JAVA_TOOL_OPTIONS             = "-Dfml.queryResult=confirm"
        JVM_OPTS                      = "-XX:+UseG1GC -XX:+ParallelRefProcEnabled -XX:MaxGCPauseMillis=100 -XX:+UnlockExperimentalVMOptions -XX:+DisableExplicitGC -XX:+AlwaysPreTouch -XX:+UseStringDeduplication -XX:G1NewSizePercent=30 -XX:G1MaxNewSizePercent=40 -XX:G1HeapRegionSize=8M -XX:G1ReservePercent=20 -XX:InitiatingHeapOccupancyPercent=20 -XX:G1MixedGCLiveThresholdPercent=90 -XX:SurvivorRatio=32 -XX:MaxTenuringThreshold=1 -XX:MetaspaceSize=256M -XX:MaxMetaspaceSize=512M -XX:ReservedCodeCacheSize=512M -XX:+UseCodeCacheFlushing"
      }

      service {
        name = "minecraft-fiskheroes"
        port = "minecraft"
        tags = ["minecraft", "gaming", "forge", "fiskheroes"]

        check {
          type     = "tcp"
          interval = "30s"
          timeout  = "5s"
        }
      }

      resources {
        cpu    = 4000
        memory = 12288
      }
    }
  }
}

variable "region" {
  type = string
}


================================================
FILE: nomad_jobs/gaming/minecraft-forge/nomad.job
================================================
job "minecraft-forge" {
  region      = var.region
  datacenters = ["minecraft"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/gaming/minecraft-forge/nomad.job"
    version  = "1"
  }

  group "minecraft" {
    count = 1

    network {
      port "minecraft" {
        host_network = "lan"
        static       = 25565
        to           = 25565
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "minecraft-server" {
      driver = "docker"

      config {
        image        = "itzg/minecraft-server:2026.4.1"
        force_pull   = false
        network_mode = "host"

        volumes = [
          "/root/minecraft/minecraft-server/data:/data",
          "/root/minecraft/minecraft-server/mods:/mods:ro",
          "/root/minecraft/minecraft-server/config:/config:ro",
        ]
      }

      env {
        EULA                          = "TRUE"
        VERSION                       = "1.20.1"
        TYPE                          = "FORGE"
        INIT_MEMORY                   = "4G"
        MAX_MEMORY                    = "12G"
        SERVER_PORT                   = "25565"
        MOTD                          = "Welcome to our modded Minecraft server!"
        MODE                          = "creative"
        DIFFICULTY                    = "easy"
        MAX_PLAYERS                   = "20"
        VIEW_DISTANCE                 = "12"
        SIMULATION_DISTANCE           = "10"
        SPAWN_PROTECTION              = "16"
        ONLINE_MODE                   = "false"
        ENABLE_WHITELIST              = "false"
        FORCE_GAMEMODE                = "true"
        ENABLE_COMMAND_BLOCK          = "true"
        ENABLE_RCON                   = "true"
        RCON_PASSWORD                 = "minecraft"
        RCON_PORT                     = "25576"
        MAX_TICK_TIME                 = "-1"
        OPS                           = "perry,hannah,Perry"
        JVM_OPTS                      = "-Dwatchdog.timeoutMillis=180000 -XX:+UseG1GC -XX:+ParallelRefProcEnabled -XX:MaxGCPauseMillis=100 -XX:+UnlockExperimentalVMOptions -XX:+DisableExplicitGC -XX:+AlwaysPreTouch -XX:+UseStringDeduplication -XX:G1NewSizePercent=30 -XX:G1MaxNewSizePercent=40 -XX:G1HeapRegionSize=8M -XX:G1ReservePercent=20 -XX:InitiatingHeapOccupancyPercent=20 -XX:G1MixedGCLiveThresholdPercent=90 -XX:SurvivorRatio=32 -XX:MaxTenuringThreshold=1 -XX:MetaspaceSize=256M -XX:MaxMetaspaceSize=512M -XX:ReservedCodeCacheSize=512M -XX:+UseCodeCacheFlushing"
      }

      service {
        name = "minecraft-forge"
        port = "minecraft"
        tags = ["minecraft", "gaming", "forge", "1.20.1"]

        check {
          type     = "tcp"
          interval = "30s"
          timeout  = "5s"
        }
      }

      resources {
        cpu        = 4000
        memory     = 13312
        memory_max = 13312
      }
    }
  }
}

variable "region" {
  type = string
}


================================================
FILE: nomad_jobs/media-stack/audioserve/nomad.job
================================================
job "audioserve" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/media-stack/audioserve/nomad.job"
version = "3"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "downloaders" {
    count = 1 
    network {
      port "http" {
        host_network = "tailscale"
        to = "3000"
      }
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "audioserve" {
      driver = "docker"
      config {
        image = "izderadicka/audioserve:v0.28.6"
        ports = ["http"]
        args = ["--tags", "/audiobooks"]
        volumes = [
          "${var.media_dir}/Books:/audiobooks",
        ]
      }

      env {
        AUDIOSERVE_SHARED_SECRET = "${var.web_pass}"
      }

      service {
        port = "http"
	name = "audioserve"
        tags = [
          "traefik.enable=true",
          "traefik.http.routers.${NOMAD_TASK_NAME}.tls.domains[0].sans=${NOMAD_TASK_NAME}.${var.tld}",
          "traefik.http.routers.${NOMAD_TASK_NAME}.middlewares=forward-auth"
        ]
        check {
          type     = "http"
          path     = "/"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 100
        memory = 256
      }
    }
  }
}

variable "region" {
    type = string
}


variable "tld" {
    type = string
}

variable "media_dir" {
    type = string
}

variable "web_pass" {}


================================================
FILE: nomad_jobs/media-stack/flaresolverr/nomad.job
================================================
job "flaresolverr" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/media-stack/flaresolverr/nomad.job"
version = "2"
  }

  group "downloaders" {
    count = 1

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    task "flaresolverr" {
      driver = "docker"
      config {
        image = "ghcr.io/flaresolverr/flaresolverr:v3.4.6"
        network_mode = "host"
        volumes = [
          "${var.shared_dir}flaresolverr/config:/config",
          "${var.shared_dir}flaresolverr/torrents:/torrents",
          "${var.downloads_dir}:/downloads",
        ]
      }

      service {
        port = "http"
	name = "flaresolverr"
      }

      resources {
        cpu    = 500
        memory = 256
        network {
          port "http" { static = "8191" }
        }
      }
    }
  }
}

variable "region" {
    type = string
}


variable "shared_dir" {
    type = string
}

variable "downloads_dir" {
    type = string
}


================================================
FILE: nomad_jobs/media-stack/jackett/nomad.job
================================================
job "jackett" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/media-stack/jackett/nomad.job"
version = "4"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "downloaders" {
    count = 1 

    network {
      port "http" {
        static = "9117"
        host_network = "tailscale"
      }
    }


    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "jackett" {
      driver = "docker"
      config {
        image = "lscr.io/linuxserver/jackett:0.24.1234"
        network_mode = "host"
        ports = ["http"]
        volumes = [
          "${var.shared_dir}jackett:/config",
          "/tmp:/downloads",
        ]
      }

      service {
        port = "http"
	name = "jackett"
        tags = [
          "traefik.enable=true",
          "traefik.http.middlewares.httpsRedirect.redirectscheme.scheme=https",


          "traefik.http.routers.${NOMAD_TASK_NAME}.tls.domains[0].sans=${NOMAD_TASK_NAME}.${var.tld}",
          "traefik.http.routers.${NOMAD_TASK_NAME}.middlewares=forward-auth"
        ]
      }

      resources {
        cpu    = 500
        memory = 256
      }
    }
  }
}

variable "region" {
    type = string
}


variable "tld" {
    type = string
}

variable "shared_dir" {
    type = string
}


================================================
FILE: nomad_jobs/media-stack/lazylibrarian/nomad.job
================================================
job "lazylibrarian" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/media-stack/lazylibrarian/nomad.job"
version = "4"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "downloaders" {
    count = 1 
    network {
      port "http" {
        static = "5299"
        host_network = "lan"
      }
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "lazylibrarian" {
      driver = "docker"
      config {
        image = "linuxserver/lazylibrarian"
        dns_servers = ["192.168.50.2"]
        ports = ["http"]
        volumes = [
          "${var.shared_dir}lazylibrarian:/config",
          "${var.books_dir}:/books",
          "${var.downloads_dir}:/downloads",
        ]
      }

      service {
        port = "http"
      	name = "lazylibrarian"
        tags = [
          "traefik.enable=true"
        ]
        check {
          type     = "http"
          path     = "/"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 100
        memory = 128
      }
    }
  }
}

variable "region" {
    type = string
}

variable "tld" {
    type = string
}

variable "shared_dir" {
    type = string
}

variable "downloads_dir" {
    type = string
}

variable "books_dir" {
    type = string
}


================================================
FILE: nomad_jobs/media-stack/lidarr/nomad.job
================================================
job "lidarr" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/media-stack/lidarr/nomad.job"
version = "10"  // Full config.xml template with API key
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "downloaders" {
    count = 1 
    network {
      port "http" {
        host_network = "lan"
        to = "8686"
      }
    }

    volume "lidarr" {
      type      = "csi"
      read_only = false
      source    = "lidarr2"
      access_mode = "single-node-writer"
      attachment_mode = "file-system"
    }


    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "lidarr" {
      driver = "docker"
      config {
        image = "linuxserver/lidarr:3.1.0"
        ports = ["http"]
        dns_servers = ["192.168.50.2"]
        volumes = [
          "${var.downloads_dir}:/downloads",
          "${var.music_dir}:/music",
          "${var.music_dir}:/media/Music",
          "local/config.xml:/config/config.xml",
        ]
      }

      volume_mount {
        volume      = "lidarr"
        destination = "/config"
        read_only   = false
      }

      env {
        PUID = "65534"
        PGID = "65534"
        TZ = "Etc/UTC"
      }

      template {
        data = <<EOH
<Config>
  <PostgresUser>postgres</PostgresUser>
  <PostgresPassword>${var.postgres_pass}</PostgresPassword>
  <PostgresPort>5432</PostgresPort>
  <PostgresHost>postgres.service.consul</PostgresHost>
  <PostgresMainDb>lidarr_main</PostgresMainDb>
  <PostgresLogDb>lidarr_logs</PostgresLogDb>
  <LogLevel>info</LogLevel>
  <UrlBase></UrlBase>
  <BindAddress>*</BindAddress>
  <Port>8686</Port>
  <SslPort>6868</SslPort>
  <EnableSsl>False</EnableSsl>
  <LaunchBrowser>False</LaunchBrowser>
  <ApiKey>${var.lidarr_api_key}</ApiKey>
  <AuthenticationMethod>External</AuthenticationMethod>
  <AuthenticationRequired>DisabledForLocalAddresses</AuthenticationRequired>
  <TrustedProxies>100.64.0.0/10,192.168.50.0/24</TrustedProxies>
  <Branch>master</Branch>
  <InstanceName>Lidarr</InstanceName>
  <UpdateMechanism>Docker</UpdateMechanism>
</Config>
EOH
        destination = "local/config.xml"
        perms = "644"
      }

      service {
        port = "http"
        name = "lidarr"
        tags = [
          "traefik.enable=true",
          "traefik.http.routers.${NOMAD_TASK_NAME}.tls.domains[0].sans=${NOMAD_TASK_NAME}.${var.tld}",
        ]
        check {
          type     = "http"
          path     = "/ping"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 100
        memory = 256
      }
    }
  }
}

variable "region" {
    type = string
}

variable "tld" {
    type = string
}

variable "shared_dir" {
    type = string
}

variable "downloads_dir" {
    type = string
}

variable "music_dir" {
    type = string
}

variable "postgres_pass" {
    type = string
    description = "Admin password for PostgreSQL"
}

variable "lidarr_api_key" {
    type = string
    description = "API key for Lidarr"
}


================================================
FILE: nomad_jobs/media-stack/lidarr/volume.hcl
================================================
id           = "lidarr2"
external_id  = "lidarr2"
name         = "lidarr2"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "10GiB"
capacity_max = "10GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}


================================================
FILE: nomad_jobs/media-stack/lidify/nomad.job
================================================
job "lidify" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/media-stack/lidify/nomad.job"
    version  = "1"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "discovery" {
    count = 1

    network {
      port "http" {
        host_network = "lan"
        to = "5000"
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "lidify" {
      driver = "docker"
      config {
        image = "thewicklowwolf/lidify:latest"
        ports = ["http"]
        dns_servers = ["192.168.50.2"]
        volumes = [
          "${var.shared_dir}lidify:/lidify/config",
        ]
      }

      env {
        lidarr_address      = "http://lidarr.service.consul:8686"
        lidarr_api_key      = var.lidarr_api_key
        lastfm_api_key      = var.lastfm_api_key
        root_folder_path    = "/music"
        quality_profile_id  = "1"
        metadata_profile_id = "1"
        sleep_interval      = "3600"
      }

      service {
        port = "http"
        name = "lidify"
        tags = [
          "traefik.enable=true",
        ]
        check {
          type     = "http"
          path     = "/"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 100
        memory = 256
      }
    }
  }
}

variable "region" {
  type = string
}

variable "tld" {
  type = string
}

variable "shared_dir" {
  type = string
}

variable "lidarr_api_key" {
  type        = string
  description = "API key for Lidarr"
}

variable "lastfm_api_key" {
  type        = string
  description = "Last.fm API key"
}


================================================
FILE: nomad_jobs/media-stack/maintainerr/nomad.job
================================================
job "maintainerr" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/media-stack/maintainerr/nomad.job"
    version = "2"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "media" {
    count = 1

    network {
      port "http" {
        host_network = "lan"
        to = 6246
      }
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "maintainerr" {
      driver = "docker"

      config {
        image = "ghcr.io/maintainerr/maintainerr:3.7.0"
        ports = ["http"]
        volumes = [
          "${var.shared_dir}maintainerr:/opt/data",
        ]
      }

      env {
        TZ = "Etc/UTC"
      }

      user = "1000:1000"

      service {
        port = "http"
        name = "maintainerr"
        tags = [
          "traefik.enable=true"
        ]
        check {
          type     = "http"
          path     = "/"
          interval = "30s"
          timeout  = "5s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 200
        memory = 512
      }
    }
  }
}

variable "region" {
  type = string
}

variable "tld" {
  type = string
}

variable "shared_dir" {
  type = string
}


================================================
FILE: nomad_jobs/media-stack/mediasage/nomad.job
================================================
job "mediasage" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/media-stack/mediasage/nomad.job"
    version  = "1"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "playlists" {
    count = 1

    network {
      port "http" {
        host_network = "lan"
        to = "5765"
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "prep-disk" {
      driver = "docker"
      lifecycle {
        hook    = "prestart"
        sidecar = false
      }
      config {
        image   = "busybox:latest"
        command = "sh"
        args    = ["-c", "mkdir -p /data && chmod 777 /data"]
        volumes = [
          "${var.shared_dir}mediasage:/data",
        ]
      }
      resources {
        cpu    = 50
        memory = 32
      }
    }

    task "mediasage" {
      driver = "docker"
      config {
        image = "ghcr.io/ecwilsonaz/mediasage:latest"
        ports = ["http"]
        dns_servers = ["192.168.50.2"]
        volumes = [
          "${var.shared_dir}mediasage:/app/data",
        ]
      }

      env {
        PLEX_URL     = "http://plex.service.consul:32400"
        PLEX_TOKEN   = var.plex_token
        AI_PROVIDER  = "ollama"
        OLLAMA_URL   = "http://ollama.service.consul:11434"
      }

      service {
        port = "http"
        name = "mediasage"
        tags = [
          "traefik.enable=true",
        ]
        check {
          type     = "http"
          path     = "/"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 200
        memory = 512
      }
    }
  }
}

variable "region" {
  type = string
}

variable "tld" {
  type = string
}

variable "shared_dir" {
  type = string
}

variable "plex_token" {
  type        = string
  description = "Plex authentication token"
}


================================================
FILE: nomad_jobs/media-stack/multi-scrobbler/nomad.job
================================================
job "multi-scrobbler" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/media-stack/multi-scrobbler/nomad.job"
    version  = "1"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "scrobbler" {
    count = 1

    network {
      port "http" {
        host_network = "lan"
        to = "9078"
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "multi-scrobbler" {
      driver = "docker"
      config {
        image = "foxxmd/multi-scrobbler:latest"
        ports = ["http"]
        dns_servers = ["192.168.50.2"]
        volumes = [
          "${var.shared_dir}multi-scrobbler:/config",
          "local/config.json:/config/config.json",
        ]
      }

      env {
        TZ = "Etc/UTC"
      }

      template {
        data = <<EOH
{
  "sources": [
    {
      "type": "plex",
      "name": "Plex",
      "data": {
        "url": "http://plex.service.consul:32400",
        "token": "${var.plex_token}"
      }
    }
  ],
  "clients": [
    {
      "type": "listenbrainz",
      "name": "ListenBrainz",
      "data": {
        "token": "${var.listenbrainz_token}",
        "url": "https://api.listenbrainz.org",
        "username": "${var.listenbrainz_username}"
      }
    },
    {
      "type": "lastfm",
      "name": "Last.fm",
      "data": {
        "apiKey": "${var.lastfm_api_key}",
        "secret": "${var.lastfm_api_secret}",
        "redirectUri": "https://multi-scrobbler.${var.tld}/lastfm/callback"
      }
    }
  ]
}
EOH
        destination = "local/config.json"
        perms       = "644"
      }

      service {
        port = "http"
        name = "multi-scrobbler"
        tags = [
          "traefik.enable=true",
        ]
        check {
          type     = "http"
          path     = "/"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 100
        memory = 256
      }
    }
  }
}

variable "region" {
  type = string
}

variable "tld" {
  type = string
}

variable "shared_dir" {
  type = string
}

variable "plex_token" {
  type        = string
  description = "Plex authentication token for scrobbling"
}

variable "listenbrainz_token" {
  type        = string
  description = "ListenBrainz user token"
}

variable "listenbrainz_username" {
  type        = string
  description = "ListenBrainz/MusicBrainz username"
}

variable "lastfm_api_key" {
  type        = string
  description = "Last.fm API key"
}

variable "lastfm_api_secret" {
  type        = string
  description = "Last.fm API secret"
}


================================================
FILE: nomad_jobs/media-stack/navidrome/nomad.job
================================================
job "navidrome" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/media-stack/navidrome/nomad.job"
version = "3"
  }

  group "downloaders" {
    count = 1 
    network {
      port "http" {
        host_network = "lan"
        to = "4533"
      }
    }

    volume "navidrome" {
      type      = "csi"
      read_only = false
      source    = "navidrome"
      access_mode = "single-node-writer"
      attachment_mode = "file-system"
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "navidrome" {
      driver = "docker"
      config {
        image = "deluan/navidrome:0.61.2"
        dns_servers = ["192.168.50.2"]
        ports = ["http"]
        volumes = [
          "${var.music_dir}:/music",
        ]
      }

      volume_mount {
        volume      = "navidrome"
        destination = "/data"
        read_only   = false
      }

      env {
        UMASK_SET = "022"
        TZ        = "UTC"
        PGUID     = "1000"
        PGID      = "1000"
      }

      service {
        port = "http"
        name = "navidrome"
        tags = [
          "traefik.enable=true"
        ]
        check {
          type     = "http"
          path     = "/"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 500
        memory = 1024
      }
    }
  }
}

variable "region" {
    type = string
}

variable "tld" {
    type = string
}

variable "music_dir" {
    type = string
}


================================================
FILE: nomad_jobs/media-stack/navidrome/volume.hcl
================================================
id           = "navidrome"
external_id  = "navidrome"
name         = "navidrome"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "10GiB"
capacity_max = "10GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}


================================================
FILE: nomad_jobs/media-stack/ombi/nomad.job
================================================
job "ombi" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/media-stack/ombi/nomad.job"
version = "4"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "downloaders" {
    count = 1 

    network {
      port "http" {
        host_network = "tailscale"
        to = "3579"
      }
    }

    volume "ombi" {
      type      = "csi"
      read_only = false
      
      source    = "ombi"
      access_mode = "single-node-writer"
      attachment_mode = "file-system"
    }


    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "ombi" {
      driver = "docker"
      config {
        image = "linuxserver/ombi:4.53.4"
        force_pull = "true"
        ports = ["http"]
      }

      volume_mount {
        volume      = "ombi"
        destination = "/config"
        read_only   = false
      }

      env {
        PUID = "65534"
        PGID = "65534"
        TZ = "Etc/UTC"
      }

      service {
        port = "http"
        name = "ombi"
        tags = [
          "traefik.enable=true",
          "traefik.http.middlewares.httpsRedirect.redirectscheme.scheme=https",
          "traefik.http.routers.${NOMAD_TASK_NAME}.tls.domains[0].sans=${NOMAD_TASK_NAME}.${var.tld}",
          "traefik.http.routers.${NOMAD_TASK_NAME}.middlewares=forward-auth"
        ]

        check {
          type     = "tcp"
          interval = "10s"
          timeout  = "2s"
        }
      }

      resources {
        cpu    = 100
        memory = 512
      }
    }
  }
}

variable "region" {}
variable "tld" {}


================================================
FILE: nomad_jobs/media-stack/ombi/volume.hcl
================================================
id           = "ombi"
external_id  = "ombi"
name         = "ombi"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "1GiB"
capacity_max = "1GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}


================================================
FILE: nomad_jobs/media-stack/overseerr/nomad.job
================================================
job "overseerr" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/media-stack/overseerr/nomad.job"
    version = "7"  // Migrate to Seerr + patch webhook bug
  }

  group "media" {
    count = 1

    network {
      port "http" {
        host_network = "lan"
        to = 5055
      }
    }

    volume "overseerr" {
      type      = "csi"
      read_only = false
      source    = "overseerr"
      access_mode = "single-node-writer"
      attachment_mode = "file-system"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "prep-disk" {
      driver = "docker"

      volume_mount {
        volume      = "overseerr"
        destination = "/volume/"
        read_only   = false
      }

      config {
        image   = "busybox:latest"
        command = "sh"
        args    = ["-c", "chown -R 1000:1000 /volume/"]
      }

      resources {
        cpu    = 200
        memory = 128
      }

      lifecycle {
        hook    = "prestart"
        sidecar = false
      }
    }

    task "overseerr" {
      driver = "docker"
      config {
        image = "seerr/seerr:v3.2.0"
        dns_servers = ["192.168.50.2"]
        init = true
        ports = ["http"]
        entrypoint = ["/bin/sh", "-c", "sed -i 's/Buffer.from(req.body.options.jsonPayload)/Buffer.from(JSON.stringify(req.body.options.jsonPayload))/g' /app/dist/routes/settings/notifications.js && exec docker-entrypoint.sh npm start"]
      }

      volume_mount {
        volume      = "overseerr"
        destination = "/app/config"
        read_only   = false
      }

      env {
        TZ = "Etc/UTC"
        LOG_LEVEL = "info"
      }

      service {
        port = "http"
        name = "overseerr"
        tags = [
          "traefik.enable=true"
        ]
        check {
          type     = "http"
          path     = "/"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 500
        memory = 384
      }
    }
  }
}

variable "region" {
    type = string
}

variable "tld" {
    type = string
}


================================================
FILE: nomad_jobs/media-stack/overseerr/volume.hcl
================================================
id           = "overseerr"
external_id  = "overseerr"
name         = "overseerr"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "2GiB"
capacity_max = "2GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}

================================================
FILE: nomad_jobs/media-stack/plex/nomad.job
================================================
job "plex" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"
  priority    = 80

  meta {
      job_file = "nomad_jobs/media-stack/plex/nomad.job"
version = "7"  // Pin to klo01 for QuickSync hardware transcoding
  }

  group "downloaders" {
    count = 1

    # Pin to klo01 for Intel QuickSync hardware transcoding
    constraint {
      attribute = "${attr.unique.hostname}"
      value     = "klo01"
    }

    network {
      port "http" {
        host_network = "lan"
        static = "32400"
      }
    }

    // Use a CSI volume specifically optimized for databases
    volume "plex-db" {
      type      = "csi"
      read_only = false
      source    = "plex-database"
      access_mode = "single-node-writer"
      attachment_mode = "file-system"
    }


    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "plex" {
      driver = "docker"
      config {
        image = "plexinc/pms-docker@sha256:4e704a2172129d8a6bc5b05ea201945b329bb6512f48a4e92ed4a4a787c35462"
        network_mode = "host"
        privileged = "true"
        force_pull = "true"
        volumes = [
          # Intel QuickSync hardware transcoding (privileged mode grants access)
          "/dev/dri:/dev/dri",
          "/tmp:/transcode",
          "${var.media_dir}:/data",
          "${var.shared_dir}plex_new:/config",
          "local/optimize-db.sh:/etc/cont-init.d/30-optimize-db",
        ]
        // No custom command - let the container start normally
      }

      volume_mount {
        volume      = "plex-db"
        destination = "/opt/plex-db"
        read_only   = false
      }

      // Setup script that runs as part of the container init system
      template {
        data = <<EOH
#!/usr/bin/with-contenv bash
set -euo pipefail

echo "Setting up Plex database optimizations..."

# Create necessary directory structure
mkdir -p /opt/plex-db
DB_DIR="/config/Library/Application Support/Plex Media Server/Plug-in Support/Databases"
mkdir -p "$DB_DIR"

# Check if we need to move existing databases
if [ -z "$(ls -A /opt/plex-db 2>/dev/null || true)" ]; then
  echo "Database volume is empty, copying existing databases if any..."
  if [ -d "$DB_DIR" ] && [ -n "$(ls -A "$DB_DIR" 2>/dev/null || true)" ]; then
    cp -a "$DB_DIR"/* /opt/plex-db/
    echo "Copied existing databases to persistent volume"
  fi
fi

# Set up link to optimized database storage (only if not already linked)
if [ ! -L "$DB_DIR" ] || [ "$(readlink "$DB_DIR")" != "/opt/plex-db" ]; then
  echo "Setting up database symlink..."
  rm -rf "$DB_DIR"
  ln -sf /opt/plex-db "$DB_DIR"
fi

# Install SQLite3 if needed
if ! command -v sqlite3 &>/dev/null; then
  echo "Installing SQLite3..."
  apt-get update && apt-get install -y sqlite3
fi

# Set environment variables for SQLite
export SQLITE_TMPDIR=/tmp/plex_sqlite
mkdir -p "$SQLITE_TMPDIR"

# Apply optimizations to all databases
echo "Applying SQLite optimizations to databases..."
find /opt/plex-db -name "*.db" -type f 2>/dev/null | while read -r db; do
  echo "Optimizing $db"
  sqlite3 "$db" <<EOF
PRAGMA journal_mode = WAL;
PRAGMA synchronous = NORMAL;
PRAGMA temp_store = MEMORY;
PRAGMA mmap_size = 268435456;
PRAGMA cache_size = -8000;
PRAGMA busy_timeout = 5000;
ANALYZE;
EOF
done

echo "Database optimizations complete"
EOH
        destination = "local/optimize-db.sh"
        perms = "755"
      }

      env {
        PLEX_CLAIM = ""  // Add your claim token if needed
        ADVERTISE_IP = "http://192.168.50.5:32400/"  // Replace with your server IP
        PLEX_UID = "1000"
        PLEX_GID = "1000"
        CHANGE_CONFIG_DIR_OWNERSHIP = "false"
        // Skip first run setup if config exists
      }

      service {
        port = "http"
        name = "plex"
        tags = [
          "traefik.enable=true"
        ]
        check {
          type     = "tcp"
          interval = "10s"
          timeout  = "2s"
        }
      }

      resources {
        cpu    = 1500  # QuickSync handles transcoding, minimal CPU needed
        memory = 4096
      }
    }
  }
}

variable "region" {}
variable "tld" {}
variable "shared_dir" {}
variable "media_dir" {}


================================================
FILE: nomad_jobs/media-stack/plex/volume.hcl
================================================
id           = "plex-database"
external_id  = "plex-database"
name         = "plex-database"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "20GiB"
capacity_max = "20GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime", "nodiratime", "discard", "data=ordered"]
}


================================================
FILE: nomad_jobs/media-stack/prowlarr/nomad.job
================================================
job "prowlarr" {
  region      = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/media-stack/prowlarr/nomad.job"
    version  = "3"  // Right-size prowlarr memory 512 -> 256
  }

  group "downloaders" {
    count = 1

    network {
      port "http" {
        host_network = "lan"
        static       = 9696
      }
      port "flaresolverr" {
        host_network = "lan"
        static       = 8191
      }
    }

    volume "prowlarr" {
      type            = "csi"
      read_only       = false
      source          = "prowlarr"
      access_mode     = "single-node-writer"
      attachment_mode = "file-system"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "prowlarr" {
      driver = "docker"

      config {
        image       = "linuxserver/prowlarr"
        dns_servers = ["192.168.50.2"]
        ports       = ["http"]
      }

      volume_mount {
        volume      = "prowlarr"
        destination = "/config"
        read_only   = false
      }

      env {
        PUID = "65534"
        PGID = "65534"
        TZ   = "Etc/UTC"
      }

      service {
        port = "http"
        name = "prowlarr"
        tags = [
          "traefik.enable=true",
        ]
        check {
          type     = "http"
          path     = "/ping"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 500
        memory = 256
      }
    }

    task "flaresolverr" {
      driver = "docker"

      config {
        image = "ghcr.io/flaresolverr/flaresolverr:v3.4.6"
        ports = ["flaresolverr"]
      }

      env {
        LOG_LEVEL = "info"
        LOG_HTML  = "false"
        TZ        = "Etc/UTC"
      }

      service {
        port = "flaresolverr"
        name = "flaresolverr"
        check {
          type     = "http"
          path     = "/"
          interval = "30s"
          timeout  = "5s"
        }
      }

      resources {
        cpu    = 500
        memory = 512
      }

      lifecycle {
        hook    = "prestart"
        sidecar = true
      }
    }
  }
}

variable "region" {}

variable "tld" {}


================================================
FILE: nomad_jobs/media-stack/prowlarr/volume.hcl
================================================
id           = "prowlarr"
external_id  = "prowlarr"
name         = "prowlarr"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "5GiB"
capacity_max = "5GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}


================================================
FILE: nomad_jobs/media-stack/qbittorrent/nomad.job
================================================
job "qbittorrent" {
  region      = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/media-stack/qbittorrent/nomad.job"
    version  = "5"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "downloaders" {
    count = 1

    network {
      port "http" {
        host_network = "lan"
        static       = 8081
      }
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "gluetun" {
      driver = "docker"

      lifecycle {
        hook    = "prestart"
        sidecar = true
      }

      config {
        image = "qmcgaw/gluetun"

        cap_add = ["NET_ADMIN"]

        ports = ["http"]

        mounts = [
          {
            type     = "tmpfs"
            target   = "/tmp/gluetun"
            readonly = false
          },
        ]
      }

      env {
        VPN_SERVICE_PROVIDER  = "mullvad"
        VPN_TYPE              = "wireguard"
        WIREGUARD_PRIVATE_KEY = var.mullvad_wireguard_key
        WIREGUARD_ADDRESSES   = var.mullvad_wireguard_addr
        SERVER_COUNTRIES      = "Netherlands"
        FIREWALL_VPN_INPUT_PORTS = "8081"
      }

      resources {
        cpu    = 500
        memory = 512
      }
    }

    task "qbittorrent" {
      driver = "docker"

      config {
        image        = "linuxserver/qbittorrent"
        network_mode = "container:gluetun-${NOMAD_ALLOC_ID}"

        mounts = [
          {
            type     = "bind"
            target   = "/config"
            source   = "${var.shared_dir}qbittorrent"
            readonly = false
            bind_options = {
              propagation = "rshared"
            }
          },
          {
            type     = "bind"
            target   = "/downloads"
            source   = "${var.downloads_dir}"
            readonly = false
            bind_options = {
              propagation = "rshared"
            }
          },
          {
            type     = "bind"
            target   = "/media"
            source   = "${var.media_dir}"
            readonly = false
            bind_options = {
              propagation = "rshared"
            }
          },
        ]
      }

      env {
        PUID            = "65534"
        PGID            = "65534"
        TZ              = "Etc/UTC"
        WEBUI_PORT      = "8081"
      }

      service {
        port = "http"
        name = "qbittorrent"
        tags = [
          "traefik.enable=true",
        ]
        check {
          type     = "tcp"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "90s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 1000
        memory = 1024
      }
    }
  }
}

variable "region" {}

variable "tld" {}

variable "shared_dir" {}

variable "downloads_dir" {}

variable "media_dir" {}

variable "mullvad_wireguard_key" {
  type        = string
  description = "Mullvad WireGuard private key"
}

variable "mullvad_wireguard_addr" {
  type        = string
  description = "Mullvad WireGuard interface address"
}


================================================
FILE: nomad_jobs/media-stack/radarr/nomad.job
================================================
job "radarr" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/media-stack/radarr/nomad.job"
version = "10"  // Full config.xml template with API key
  }

  group "downloaders" {
    count = 1 
    network {
      port "http" {
        host_network = "lan"
        to = "7878"
      }
    }

    volume "radarr" {
      type      = "csi"
      read_only = false
      source    = "radarr2"
      access_mode = "single-node-writer"
      attachment_mode = "file-system"
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "radarr" {
      driver = "docker"
      config {
        image = "linuxserver/radarr:6.1.1"
        dns_servers = ["192.168.50.2"]
        ports = ["http"]
        volumes = [
          "${var.downloads_dir}:/downloads",
          "${var.movies_dir}:/media/Movies",
          "local/config.xml:/config/config.xml",
        ]
      }

      volume_mount {
        volume      = "radarr"
        destination = "/config"
        read_only   = false
      }

      env {
        UMASK_SET = "022"
        TZ        = "UTC"
        PUID      = "65534"
        PGID      = "65534"
      }

      template {
        data = <<EOH
<Config>
  <PostgresUser>postgres</PostgresUser>
  <PostgresPassword>${var.postgres_pass}</PostgresPassword>
  <PostgresPort>5432</PostgresPort>
  <PostgresHost>postgres.service.consul</PostgresHost>
  <PostgresMainDb>radarr_main</PostgresMainDb>
  <PostgresLogDb>radarr_logs</PostgresLogDb>
  <LogLevel>info</LogLevel>
  <UrlBase></UrlBase>
  <BindAddress>*</BindAddress>
  <Port>7878</Port>
  <SslPort>9898</SslPort>
  <EnableSsl>False</EnableSsl>
  <LaunchBrowser>False</LaunchBrowser>
  <ApiKey>${var.radarr_api_key}</ApiKey>
  <AuthenticationMethod>External</AuthenticationMethod>
  <AuthenticationRequired>DisabledForLocalAddresses</AuthenticationRequired>
  <TrustedProxies>100.64.0.0/10,192.168.50.0/24</TrustedProxies>
  <Branch>master</Branch>
  <InstanceName>Radarr</InstanceName>
  <UpdateMechanism>Docker</UpdateMechanism>
</Config>
EOH
        destination = "local/config.xml"
        perms = "644"
      }
      
      service {
        port = "http"
        name = "radarr"
        tags = [
          "traefik.enable=true"
        ]
        check {
          type     = "http"
          path     = "/ping"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 1000
        memory = 512
      }
    }
  }
}

variable "region" {
    type = string
}

variable "tld" {
    type = string
}

variable "downloads_dir" {
    type = string
}

variable "tv_dir" {
    type = string
}

variable "movies_dir" {
    type = string
}

variable "postgres_pass" {
    type = string
    description = "Admin password for PostgreSQL"
}

variable "radarr_api_key" {
    type = string
    description = "API key for Radarr"
}


================================================
FILE: nomad_jobs/media-stack/radarr/volume.hcl
================================================
id           = "radarr2"
external_id  = "radarr2"
name         = "radarr2"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "10GiB"
capacity_max = "10GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}


================================================
FILE: nomad_jobs/media-stack/requestrr/nomad.job
================================================
job "requestrr" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/media-stack/requestrr/nomad.job"
    version = "1"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "media" {
    count = 1

    network {
      port "http" {
        host_network = "lan"
        to = 4545
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "requestrr" {
      driver = "docker"

      config {
        dns_servers = ["192.168.50.2"]
        image = "thomst08/requestrr:v2.1.9"
        ports = ["http"]
        volumes = [
          "${var.shared_dir}requestrr:/root/config",
        ]
      }

      env {
        TZ = "Etc/UTC"
      }

      service {
        port = "http"
        name = "requestrr"
        tags = [
          "traefik.enable=true"
        ]
        check {
          type     = "tcp"
          interval = "10s"
          timeout  = "2s"
        }
      }

      resources {
        cpu    = 200
        memory = 256
      }
    }
  }
}

variable "region" {
  type = string
}

variable "tld" {
  type = string
}

variable "shared_dir" {
  type = string
}


================================================
FILE: nomad_jobs/media-stack/sabnzbd/nomad.job
================================================
job "sabnzbd" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/media-stack/sabnzbd/nomad.job"
version = "6"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "downloaders" {
    count = 1 
    network {
      port "http" {
        host_network = "lan"
        static = "8080"
      }
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "sabnzbd" {
      driver = "docker"
      config {
        image = "linuxserver/sabnzbd"
        network_mode = "host"
        ports = ["http"]
        mounts = [
          {
            type = "bind"
            target = "/config"
            source = "${var.shared_dir}sabnzbd",
            readonly = false
            bind_options = {
              propagation = "rshared"
            }
          },
          {
            type = "bind"
            target = "/downloads"
            source = "/tmp"
            readonly = false
            bind_options = {
              propagation = "rshared"
            }
          },
          {
            type = "bind"
            target = "/media"
            source = "${var.media_dir}"
            readonly = false
            bind_options = {
              propagation = "rshared"
            }
          }
        ]
      }
  
      env {
        PUID = "65534"
        PGID = "65534"
        TZ = "Etc/UTC"
      }

      service {
        port = "http"
        name = "${NOMAD_TASK_NAME}"
        tags = [
          "traefik.enable=true"
        ]
        check {
          type     = "http"
          path     = "/api?mode=auth"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu        = 1000    # Match actual usage (952 MHz observed)
        memory     = 3072    # Accommodate 2GB cache + 1GB overhead
        memory_max = 4096    # Hard limit for burst usage
      }
    }
  }
}

variable "region" {}

variable "tld" {}

variable "shared_dir" {}

variable "media_dir" {}

variable "downloads_dir" {}


================================================
FILE: nomad_jobs/media-stack/sickchill/nomad.job
================================================
job "sickchill" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/media-stack/sickchill/nomad.job"
version = "4"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "downloaders" {
    count = 1 
    network {
      port "http" {
        host_network = "lan"
        to = "8081"
      }
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "sickchill" {
      driver = "docker"
      config {
        image = "linuxserver/sickchill:2024.3.1"
        dns_servers = ["192.168.50.2"]
        ports = ["http"]
        volumes = [
          "${var.downloads_dir}:/downloads",
          "${var.tv_dir}:/tv",
          "${var.shared_dir}sickchill:/config",
        ]
      }

      env {
        PUID = "65534"
        PGID = "65534"
        TZ = "Etc/UTC"
      }

      service {
        port = "http"
        name = "sickchill"
        tags = [
          "traefik.enable=true"
        ]
        check {
          type     = "http"
          path     = "/"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 1000
        memory = 256
      }
    }
  }
}

variable "region" {
    type = string
}

variable "tld" {
    type = string
}

variable "downloads_dir" {
    type = string
}

variable "tv_dir" {
    type = string
}

variable "shared_dir" {
    type = string
}


================================================
FILE: nomad_jobs/media-stack/sonarr/nomad.job
================================================
job "sonarr" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/media-stack/sonarr/nomad.job"
version = "11"  // Full config.xml template with API key
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "downloaders" {
    count = 1 
    network {
      port "http" {
        host_network = "lan"
        to = "8989"
      }
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "sonarr" {
      driver = "docker"
      config {
        image = "linuxserver/sonarr:4.0.17"
        dns_servers = ["192.168.50.2"]
        ports = ["http"]
        volumes = [
          "${var.shared_dir}sonarr:/config",
          "${var.downloads_dir}:/downloads",
          "${var.tv_dir}:/media/TV",
          "local/config.xml:/config/config.xml",
        ]
      }

      env {
        PUID = "65534"
        PGID = "65534"
        TZ = "Etc/UTC"
      }

      template {
        data = <<EOH
<Config>
  <PostgresUser>postgres</PostgresUser>
  <PostgresPassword>${var.postgres_pass}</PostgresPassword>
  <PostgresPort>5432</PostgresPort>
  <PostgresHost>postgres.service.consul</PostgresHost>
  <PostgresMainDb>sonarr_main</PostgresMainDb>
  <PostgresLogDb>sonarr_logs</PostgresLogDb>
  <LogLevel>info</LogLevel>
  <UrlBase></UrlBase>
  <BindAddress>*</BindAddress>
  <Port>8989</Port>
  <SslPort>9898</SslPort>
  <EnableSsl>False</EnableSsl>
  <LaunchBrowser>False</LaunchBrowser>
  <ApiKey>${var.sonarr_api_key}</ApiKey>
  <AuthenticationMethod>External</AuthenticationMethod>
  <AuthenticationRequired>DisabledForLocalAddresses</AuthenticationRequired>
  <TrustedProxies>100.64.0.0/10,192.168.50.0/24</TrustedProxies>
  <Branch>main</Branch>
  <InstanceName>Sonarr</InstanceName>
  <UpdateMechanism>Docker</UpdateMechanism>
</Config>
EOH
        destination = "local/config.xml"
        perms = "644"
      }

      service {
        port = "http"
        name = "sonarr"
        tags = [
          "traefik.enable=true",
        ]
        check {
          type     = "http"
          path     = "/ping"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 1000
        memory = 512
      }
    }
  }
}

variable "region" {
    type = string
}

variable "tld" {
    type = string
}

variable "shared_dir" {
    type = string
}

variable "downloads_dir" {
    type = string
}

variable "tv_dir" {
    type = string
}

variable "postgres_pass" {
    type = string
    description = "Admin password for PostgreSQL"
}

variable "sonarr_api_key" {
    type = string
    description = "API key for Sonarr"
}


================================================
FILE: nomad_jobs/media-stack/synclounge/nomad.job
================================================
job "synclounge" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/media-stack/synclounge/nomad.job"
version = "4"
  }

  group "synclounge" {
    count = 1 
    network {
      port "http" {
        host_network = "tailscale"
        to = "8088"
      }
      port "server" {
        host_network = "tailscale"
        to = "8089"
      }
    }


    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "plexlounge" {
      driver = "docker"
      config {
        image = "starbix/synclounge"
        network_mode = "host"
        force_pull = "true"
        ports = ["http", "server"]
      }

      env {
        DOMAIN = "${NOMAD_TASK_NAME}.${var.tld}"
      }

      service {
        port = "http"
	name = "plexlounge"
        tags = [
          "traefik.enable=true",
          "traefik.http.middlewares.httpsRedirect.redirectscheme.scheme=https",


          "traefik.http.routers.${NOMAD_TASK_NAME}.tls.domains[0].sans=${NOMAD_TASK_NAME}.${var.tld}",
          "traefik.http.routers.${NOMAD_TASK_NAME}.middlewares=forward-auth"
        ]

        check {
          type     = "tcp"
          interval = "10s"
          timeout  = "2s"
        }
      }

      service {
        port = "server"
	name = "syncserver"
        tags = [
          "traefik.enable=true",
          "traefik.http.middlewares.httpsRedirect.redirectscheme.scheme=https",


          "traefik.http.routers.syncserver.tls.domains[0].sans=syncserver.${var.tld}",
          "traefik.http.routers.syncserver.middlewares=forward-auth"
        ]

        check {
          type     = "tcp"
          interval = "10s"
          timeout  = "2s"
        }
      }

      resources {
        cpu    = 3500
        memory = 512
      }
    }
  }
}

variable "region" {
    type = string
}


variable "tld" {
    type = string
}


================================================
FILE: nomad_jobs/media-stack/tautulli/nomad.job
================================================
job "tautulli" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/media-stack/tautulli/nomad.job"
version = "3"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "metrics" {
    count = 1 
    network {
      port "http" {
        host_network = "tailscale"
        to = "8181"
      }
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "tautulli" {
      driver = "docker"
      config {
        image = "tautulli/tautulli"
        ports = ["http"]
        volumes = [
          "${var.shared_dir}tautulli:/config",
          "[[ .dirs.plexlogs ]]:/media/TV",
        ]
      }

      service {
        port = "http"
	name = "tautulli"
        tags = ["net-internal", "net-external", "tautulli", "net.frontend.entryPoints=https"]
        check {
          type     = "http"
          path     = "/"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 100
        memory = 128
      }
    }
  }
}

variable "region" {
    type = string
}


variable "tld" {
    type = string
}

variable "shared_dir" {
    type = string
}


================================================
FILE: nomad_jobs/media-stack/tdarr/nomad.job
================================================
job "tdarr" {
  region      = var.region
  datacenters = ["cheese"]
  type        = "service"
  priority    = 50

  meta {
    job_file = "nomad_jobs/media-stack/tdarr/nomad.job"
    version  = "4"  // Move to cheese01 for NVENC GPU transcoding
  }

  group "tdarr" {
    count = 1

    constraint {
      attribute = "${attr.unique.hostname}"
      value     = "cheese01"
    }

    network {
      port "http" {
        host_network = "lan"
        static       = 8265
      }
      port "server" {
        host_network = "lan"
        static       = 8266
      }
    }

    volume "tdarr" {
      type            = "csi"
      read_only       = false
      source          = "tdarr"
      access_mode     = "single-node-writer"
      attachment_mode = "file-system"
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel      = 1
      min_healthy_time  = "30s"
      healthy_deadline  = "9m"
      progress_deadline = "15m"
      auto_revert       = true
    }

    task "tdarr" {
      driver = "docker"

      config {
        image        = "ghcr.io/haveagitgat/tdarr:latest"
        network_mode = "host"
        privileged   = true
        runtime      = "nvidia"
        force_pull   = true
        ports        = ["http", "server"]
        volumes = [
          "/tmp/tdarr:/temp",
          "${var.shared_dir}tdarr/configs:/app/configs",
          "${var.shared_dir}tdarr/logs:/app/logs",
          "${var.media_dir}:/media",
        ]
      }

      volume_mount {
        volume      = "tdarr"
        destination = "/app/server"
        read_only   = false
      }

      env {
        PUID                   = "1000"
        PGID                   = "1000"
        NVIDIA_VISIBLE_DEVICES = "all"
        serverIP               = "0.0.0.0"
        serverPort             = "8266"
        webUIPort              = "8265"
        internalNode           = "true"
        nodeName               = "cheese01"
      }

      service {
        port = "http"
        name = "tdarr"
        tags = [
          "traefik.enable=true",
        ]
        check {
          type     = "tcp"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "120s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 2000
        memory = 2048
      }
    }
  }
}

variable "region" {}
variable "tld" {}
variable "shared_dir" {}
variable "media_dir" {}


================================================
FILE: nomad_jobs/media-stack/tdarr/volume.hcl
================================================
id           = "tdarr"
external_id  = "tdarr"
name         = "tdarr"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "10GiB"
capacity_max = "10GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}


================================================
FILE: nomad_jobs/misc/adb/nomad.job
================================================
job "adb" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/misc/adb/nomad.job"
version = "4"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  constraint {
    attribute = "${meta.zigbee}"
    operator  = "="
    value     = "true"
  }

  group "downloaders" {
    count = 1 

    network {
      mode = "host"
      port "tcp" {
        static = "5037"
        host_network = "lan"
      }
    }


    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "adb" {
      driver = "docker"
      config {
        image = "docker-registry.demonsafe.com/adb"
        entrypoint = ["/local/start.sh"]
        network_mode = "host"
        extra_hosts = ["hassio:127.0.0.1"]
        args = ["&", "adb", "-a", "-P", "5037", "server", "nodaemon"]
        volumes = [
          "${var.shared_dir}home-assistant/android:/root/.android",
        ]
      }

      env {
        log_level = "warning"
      }

      service {
        port = "tcp"
	name = "adb"
        tags = ["net-internal", "adb"]
        check {
          type     = "tcp"
          interval = "10s"
          timeout  = "2s"
        }
      }

      template {
data = <<EOH
#!/bin/sh
echo "Start the server in background mode..."
adb -a -P 5037 server nodaemon &
echo "Sleep 10 seconds for the adb server to start"
sleep 10
DEVICES="192.168.50.206"
echo "Connecting to devices."
for device in $DEVICES; do
echo "Connect to device: $device"
adb connect $device
done   
echo "Done."
echo "Foreground the server again..."
       
wait %1 

EOH
        destination = "local/start.sh"
        env         = false
        perms       = 755
        change_mode = "signal"
        change_signal = "SIGHUP"
        left_delimiter  = "{{"
        right_delimiter = "}}"

      }

      resources {
        cpu    = 100
        memory = 10
      }
    }
  }
}

variable "region" {
    type = string
}

variable "shared_dir" {}


================================================
FILE: nomad_jobs/misc/gcp-dns-updater/Dockerfile
================================================
# Use an official Python runtime as a parent image
FROM python:3.14-slim

# Set the working directory in the container
WORKDIR /app

# Copy the requirements file into the container at /app
COPY requirements.txt .

# Install any needed packages specified in requirements.txt
# Using --no-cache-dir to reduce image size
RUN pip install --no-cache-dir -r requirements.txt

# Copy the current directory contents into the container at /app
COPY update_dns.py .

# Define the command to run the application
CMD ["python", "update_dns.py"]


================================================
FILE: nomad_jobs/misc/gcp-dns-updater/README.md
================================================
# GCP Dynamic DNS Updater Service

This service periodically checks the public IPv4 address of the node it's running on and updates a specified A record in a Google Cloud DNS managed zone. It's designed to run as a Nomad job within the Hashi-Homelab environment, utilizing a **pre-built Docker image**.

## Features

*   Fetches the current public IPv4 address from `https://v4.ifconfig.co/ip`.
*   Uses the `google-cloud-dns` Python SDK to interact with Google Cloud DNS.
*   Authenticates using a GCP Service Account key provided via an environment variable.
*   Checks the specified DNS record:
    *   If it's a CNAME, it deletes the CNAME record.
    *   If it's an A record, it updates the IP address if it has changed.
    *   If it doesn't exist (or after deleting a CNAME), it creates the A record with the specified TTL.
*   Runs periodically via a Nomad job, executing the Python script within the pre-built Docker container.

## Prerequisites

1.  **Docker:** Docker must be installed locally to build the service image.
2.  **GCP Service Account:** You need a Google Cloud Platform service account with the necessary permissions to manage DNS records.
    *   Go to the GCP Console -> IAM & Admin -> Service Accounts.
    *   Create a new service account (e.g., `gcp-dns-updater-sa`).
    *   Grant this service account the `DNS Administrator` role (`roles/dns.admin`) on the project containing your managed zone.
    *   Create a JSON key file for this service account and download it securely. You will need the *contents* of this file, not the file itself.
3.  **Nomad Environment:** A running Nomad cluster where this job can be scheduled. The Nomad clients must have Docker installed and configured.

## Configuration

The service is configured via environment variables passed to the Nomad task, which are then consumed by the `update_dns.py` script running inside the Docker container:

*   `GCP_DNS_ZONE_NAME`: The name of the managed zone in GCP DNS (e.g., `demonsafe-com`). The script derives the Project ID from the credentials.
*   `GCP_DNS_RECORD_NAME`: The DNS record name to update (e.g., `*.demonsafe.com`). **Note:** The script expects the base name; the trailing dot is handled internally if needed by the SDK.
*   `RECORD_TTL`: (Optional) The Time-To-Live (in seconds) for the created/updated A record. Defaults to 300 if not set.
*   `GCP_PROJECT_ID`: The Google Cloud Project ID containing the DNS zone.
*   `GCP_SERVICE_ACCOUNT_KEY_B64`: **Required.** The base64-encoded *content* of the GCP service account JSON key file.

**Generating the Base64 Key:**

You need to encode the *content* of your downloaded JSON key file into a single-line base64 string.

On Linux/macOS, you can use:
```bash
base64 -w 0 < /path/to/your/gcp_key.json
```
*(Ensure you use `-w 0` or an equivalent flag for your `base64` command to prevent line wrapping)*

Copy the resulting string.

**Setting Environment Variables in Nomad:**

These variables are defined within the `env` block of the `nomad.job` file using Go templating to read runtime environment variables provided by the Nomad agent (which in turn are often sourced from the deployment mechanism, like GitHub Actions):

```hcl
# Example within nomad.job task config
env {
  GCP_DNS_ZONE_NAME = <<EOH
{{ env "NOMAD_VAR_tld" | replace "." "-" }}
EOH
  GCP_DNS_RECORD_NAME = <<EOH
*.{{ env "NOMAD_VAR_tld" }}
EOH
  GCP_SERVICE_ACCOUNT_KEY_B64 = <<EOH
{{ env "NOMAD_VAR_gcp_dns_admin" }}
EOH
  GCP_PROJECT_ID = <<EOH
{{ env "NOMAD_VAR_gcp_project_id" }}
EOH
  # RECORD_TTL = "300" # Optional, defaults to 300 in the script
}
```

**Important:** The actual values for `NOMAD_VAR_tld`, `NOMAD_VAR_gcp_dns_admin`, and `NOMAD_VAR_gcp_project_id` **must** be provided securely to the Nomad agent's environment during deployment (e.g., via GitHub Actions secrets mapped in the workflow, or using Vault integration), not hardcoded directly in the job file.

## Deployment

1.  **Ensure Prerequisites:** Verify the service account is created, you have the base64 encoded key, and Docker is running.
2.  **Build the Docker Image:** From the root of the `hashi-homelab` repository, run the make target:
    ```bash
    make build-gcp-dns-updater
    ```
    This builds the required Docker image tagged `gcp-dns-updater:latest` using the `gcp-dns-updater/Dockerfile`.
3.  **Deploy the Nomad Job:**
    *   Ensure the required environment variables (`NOMAD_VAR_tld`, `NOMAD_VAR_gcp_dns_admin`, `NOMAD_VAR_gcp_project_id`) are available to the Nomad agent running the job. This is typically handled by the CI/CD pipeline (like the GitHub Actions workflow in this repo) or Vault integration.
    *   Deploy using the Nomad CLI (ensure you are in the repository root or adjust paths). This job will use the `gcp-dns-updater:latest` image built in the previous step:
        ```bash
        # The job will read variables from its environment
        nomad job run gcp-dns-updater/nomad.job
        ```
    *   Alternatively, if using the project's Makefile structure:
        ```bash
        # Assumes the Makefile's deploy target doesn't need extra vars
        # and that required env vars are set in the deployment runner
        make deploy-gcp-dns-updater
        ```

## Files

*   `update_dns.py`: The core Python script for updating DNS (runs inside the container).
*   `requirements.txt`: Python dependencies (installed during Docker build).
*   `Dockerfile`: Defines how to build the service's Docker image.
*   `nomad.job`: Nomad job definition for periodic execution using the `gcp-dns-updater:latest` Docker image.
*   `README.md`: This documentation file.


================================================
FILE: nomad_jobs/misc/gcp-dns-updater/nomad.job
================================================
job "gcp-dns-updater" {
  
  meta {
    job_file = "nomad_jobs/misc/gcp-dns-updater/nomad.job"
    version  = "6"  // Added SPF TXT record update
  }
  type        = "batch"
  periodic {
    crons = ["*/15 * * * *"]
    prohibit_overlap = true 
  }

  group "updater" {
    count = 1
    restart {
      attempts = 2
      interval = "1m"
      delay = "15s"
      mode = "delay" 
    }


    task "update-dns" {
      driver = "docker"

      config {
        image = "python:3.14-slim"
        dns_servers = ["192.168.50.2"]
        command = "sh"
        args = ["-c", "pip install --no-cache-dir --root-user-action=ignore google-cloud-dns requests pyyaml && python /local/update_dns.py"]
        volumes = [
          "${var.shared_dir}traefik-ingress:/shared/traefik-ingress"
        ]
      }

      template {
        data = <<-EOH
GCP_DNS_ZONE_NAME = ${var.dns_zone}
GCP_DNS_RECORD_NAME = *.${var.tld}
GCP_SERVICE_ACCOUNT_KEY_B64 = ${var.gcp_dns_admin}
GCP_PROJECT_ID = ${var.gcp_project_id}
EOH
        env         = true
        destination = "secrets/file.env" 
      }

      template {
        data = <<-EOF
import os
import requests
import logging
import sys
import base64
import binascii
import json
import time

from google.cloud import dns
from google.oauth2 import service_account
from google.api_core.exceptions import GoogleAPIError

logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')

def get_env_vars():
    """Reads required environment variables and returns them."""
    project_id = os.environ.get('GCP_PROJECT_ID')
    zone_name = os.environ.get('GCP_DNS_ZONE_NAME')
    record_name = os.environ.get('GCP_DNS_RECORD_NAME')
    key_b64 = os.environ.get('GCP_SERVICE_ACCOUNT_KEY_B64')

    if not all([project_id, zone_name, record_name, key_b64]):
        missing = [var for var, val in [
            ('GCP_PROJECT_ID', project_id),
            ('GCP_DNS_ZONE_NAME', zone_name),
            ('GCP_DNS_RECORD_NAME', record_name),
            ('GCP_SERVICE_ACCOUNT_KEY_B64', key_b64)
        ] if not val]
        logging.error(f"Missing required environment variables: {', '.join(missing)}")
        sys.exit(1)

    return project_id, zone_name, record_name, key_b64

def get_public_ip():
    """Fetches the public IPv4 address."""
    try:
        response = requests.get('https://v4.ifconfig.me/ip', timeout=10)
        response.raise_for_status()
        ip_address = response.text.strip()
        logging.info(f"Successfully fetched public IP: {ip_address}")
        return ip_address
    except requests.exceptions.RequestException as e:
        logging.error(f"Error fetching public IP: {e}")
        sys.exit(1)

def get_dns_client(key_b64: str, project_id: str):
    """Creates and returns a DNS client authenticated with a base64 encoded service account key."""
    try:
        logging.info("Decoding base64 service account key...")
        logging.info(f"Original key length: {len(key_b64)}")
        logging.info(f"Key content (first 50 chars): {key_b64[:50]}{'...' if len(key_b64) > 50 else ''}")
        
        # Clean the base64 string - remove any whitespace/newlines
        key_b64 = key_b64.strip().replace('\n', '').replace('\r', '').replace(' ', '')
        logging.info(f"Cleaned key length: {len(key_b64)}")
        logging.info(f"Cleaned key content (first 50 chars): {key_b64[:50]}{'...' if len(key_b64) > 50 else ''}")
        
        # Check if this looks like a valid base64 string
        if len(key_b64) < 100:
            logging.warning(f"Service account key seems too short ({len(key_b64)} chars). Expected several thousand characters.")
            logging.warning(f"Full key content: '{key_b64}'")
            logging.error("The GCP_SERVICE_ACCOUNT_KEY_B64 environment variable appears to contain invalid or incomplete data.")
            sys.exit(1)
        
        # Fix base64 padding if needed
        missing_padding = len(key_b64) % 4
        if missing_padding:
            padding_needed = 4 - missing_padding
            key_b64 += '=' * padding_needed
            logging.info(f"Added {padding_needed} padding characters")
        
        logging.info(f"Final key length: {len(key_b64)}")
        decoded_key = base64.b64decode(key_b64, validate=True)
        logging.info("Base64 key decoded successfully.")

        logging.info("Parsing service account key JSON...")
        key_info = json.loads(decoded_key)
        logging.info("Service account key JSON parsed successfully.")

        credentials = service_account.Credentials.from_service_account_info(key_info)
        client = dns.Client(project=project_id, credentials=credentials)
        logging.info(f"Successfully created DNS client for project {project_id}")
        return client

    except binascii.Error as e:
        logging.error(f"Failed to decode base64 service account key: {e}")
        sys.exit(1)
    except json.JSONDecodeError as e:
        logging.error(f"Failed to parse service account key JSON: {e}")
        sys.exit(1)
    except Exception as e:
        logging.error(f"Failed to create DNS client from service account info: {e}")
        sys.exit(1)

def update_traefik_whitelist(ip_address: str):
    """Updates Traefik IP whitelist configuration."""
    try:
        logging.info(f"Updating Traefik whitelist with IP: {ip_address}")
        
        traefik_config = {
            "http": {
                "middlewares": {
                    "home-ip-whitelist": {
                        "ipAllowList": {
                            "sourceRange": [
                                f"{ip_address}/32",
                                "192.168.0.0/16",
                                "10.0.0.0/8",
                                "172.16.0.0/12",
                                "100.64.0.0/10"
                            ]
                        }
                    }
                }
            }
        }
        
        config_path = "/shared/traefik-ingress/dynamic-whitelist.toml"
        
        # Write as TOML format
        toml_content = f"""[http.middlewares.home-ip-whitelist.ipAllowList]
sourceRange = ["{ip_address}/32", "192.168.0.0/16", "10.0.0.0/8", "172.16.0.0/12", "100.64.0.0/10"]
"""
        
        with open(config_path, 'w') as f:
            f.write(toml_content)
        
        logging.info(f"Successfully updated Traefik whitelist configuration at {config_path}")
        
    except Exception as e:
        logging.error(f"Failed to update Traefik whitelist: {e}")

def update_dns_record(client: dns.Client, project_id: str, zone_name: str, record_name: str, ip_address: str):
    """Updates DNS record."""
    try:
        # Use zone_name directly as it should already be the correct GCP zone name
        gcp_zone_name = zone_name
        logging.info(f"Targeting GCP DNS Zone: {gcp_zone_name}")

        zone = client.zone(gcp_zone_name, project_id)
        if not zone.exists():
            logging.error(f"DNS zone '{gcp_zone_name}' not found in project '{project_id}'.")
            return

        fqdn = record_name if record_name.endswith('.') else f"{record_name}."
        logging.info(f"Checking DNS records for: {fqdn} in zone {gcp_zone_name}")

        record_sets = list(zone.list_resource_record_sets())

        existing_a_record = None
        existing_cname_record = None

        for record_set in record_sets:
            if record_set.record_type == 'A' and record_set.name == fqdn:
                existing_a_record = record_set
                logging.info(f"Found existing A record: {existing_a_record.name} -> {existing_a_record.rrdatas}")
            elif record_set.record_type == 'CNAME' and record_set.name == fqdn:
                existing_cname_record = record_set
                logging.info(f"Found existing CNAME record: {existing_cname_record.name} -> {existing_cname_record.rrdatas}")

        changes = zone.changes()
        needs_update = False

        if existing_cname_record:
            logging.warning(f"Deleting existing CNAME record {fqdn} to replace with A record.")
            changes.delete_record_set(existing_cname_record)
            needs_update = True
            existing_a_record = None

        new_a_record = zone.resource_record_set(fqdn, "A", 300, [ip_address])

        if existing_a_record:
            if existing_a_record.rrdatas == [ip_address]:
                logging.info(f"Existing A record {fqdn} already points to {ip_address}. No update needed.")
                return
            else:
                logging.info(f"Existing A record {fqdn} points to {existing_a_record.rrdatas}. Updating to {ip_address}.")
                changes.delete_record_set(existing_a_record)
                changes.add_record_set(new_a_record)
                needs_update = True
        elif not existing_cname_record:
            logging.info(f"No existing A or CNAME record found for {fqdn}. Creating new A record pointing to {ip_address}.")
            changes.add_record_set(new_a_record)
            needs_update = True
        elif existing_cname_record:
             logging.info(f"Adding A record for {fqdn} pointing to {ip_address} after CNAME deletion.")
             changes.add_record_set(new_a_record)

        if needs_update:
            logging.info(f"Executing DNS changes for {fqdn} in zone {gcp_zone_name}...")
            changes.create()
            while changes.status != 'done':
                logging.info(f"Waiting for DNS changes to complete (status: {changes.status})...")
                time.sleep(5)
                changes.reload()
            logging.info(f"Successfully updated DNS record {fqdn} to {ip_address} in zone {gcp_zone_name}.")
        else:
            logging.info("No DNS changes were necessary.")

    except GoogleAPIError as e:
        logging.error(f"GCP API Error updating DNS record {fqdn} in zone {gcp_zone_name}: {e}")
    except Exception as e:
        logging.error(f"An unexpected error occurred during DNS update for {fqdn} in zone {gcp_zone_name}: {e}")

def update_spf_record(client: dns.Client, project_id: str, zone_name: str, record_name: str, ip_address: str):
    """Updates the SPF TXT record on the bare domain with the current public IP."""
    try:
        gcp_zone_name = zone_name
        logging.info(f"Updating SPF record in zone: {gcp_zone_name}")

        zone = client.zone(gcp_zone_name, project_id)
        if not zone.exists():
            logging.error(f"DNS zone '{gcp_zone_name}' not found in project '{project_id}'.")
            return

        # Derive bare domain from record_name (e.g., "*.demonsafe.com" -> "demonsafe.com.")
        domain = record_name.lstrip('*.') if record_name.startswith('*.') else record_name
        fqdn = domain if domain.endswith('.') else f"{domain}."
        logging.info(f"Checking TXT records for: {fqdn}")

        spf_value = f'"v=spf1 ip4:{ip_address} ~all"'

        record_sets = list(zone.list_resource_record_sets())
        existing_txt = None
        for rs in record_sets:
            if rs.record_type == 'TXT' and rs.name == fqdn:
                existing_txt = rs
                logging.info(f"Found existing TXT record: {rs.name} -> {rs.rrdatas}")
                break

        changes = zone.changes()
        needs_update = False

        if existing_txt:
            new_rrdatas = []
            spf_found = False
            for rd in existing_txt.rrdatas:
                if 'v=spf1' in rd:
                    spf_found = True
                    if ip_address in rd:
                        logging.info(f"SPF record already contains {ip_address}. No update needed.")
                        return
                    logging.info(f"Replacing SPF entry: {rd} -> {spf_value}")
                    new_rrdatas.append(spf_value)
                else:
                    new_rrdatas.append(rd)
            if not spf_found:
                logging.info(f"No existing SPF entry found. Adding: {spf_value}")
                new_rrdatas.append(spf_value)

            changes.delete_record_set(existing_txt)
            new_txt = zone.resource_record_set(fqdn, "TXT", 300, new_rrdatas)
            changes.add_record_set(new_txt)
            needs_update = True
        else:
            logging.info(f"No TXT record found for {fqdn}. Creating with SPF: {spf_value}")
            new_txt = zone.resource_record_set(fqdn, "TXT", 300, [spf_value])
            changes.add_record_set(new_txt)
            needs_update = True

        if needs_update:
            logging.info(f"Executing SPF TXT changes for {fqdn}...")
            changes.create()
            while changes.status != 'done':
                logging.info(f"Waiting for SPF changes to complete (status: {changes.status})...")
                time.sleep(5)
                changes.reload()
            logging.info(f"Successfully updated SPF record for {fqdn} with ip4:{ip_address}")

    except GoogleAPIError as e:
        logging.error(f"GCP API Error updating SPF record: {e}")
    except Exception as e:
        logging.error(f"Unexpected error updating SPF record: {e}")

if __name__ == "__main__":
    logging.info("Starting DNS update script.")
    project_id, zone_name, record_name, key_b64 = get_env_vars()
    logging.info(f"Environment variables loaded - zone_name: '{zone_name}', record_name: '{record_name}'")
    public_ip = get_public_ip()

    if public_ip:
        dns_client = get_dns_client(key_b64, project_id)
        if dns_client:
            update_dns_record(dns_client, project_id, zone_name, record_name, public_ip)
            update_spf_record(dns_client, project_id, zone_name, record_name, public_ip)
            update_traefik_whitelist(public_ip)
            logging.info("DNS, SPF, and Traefik whitelist update script finished.")
        else:
            logging.error("Exiting due to DNS client initialization failure.")
            sys.exit(1)
    else:
        logging.error("Exiting due to inability to fetch public IP.")
        sys.exit(1)
    
    # Sleep to allow log viewing before container exits
    logging.info("Sleeping for 10 seconds to allow log viewing...")
    time.sleep(10)
EOF
        destination = "local/update_dns.py"
      }

      resources {
        cpu    = 100 
        memory = 128  
      }
    }
  }
}

variable "gcp_project_id" {}
variable "dns_zone" {}
variable "tld" {}
variable "gcp_dns_admin" {}
variable "shared_dir" {}


================================================
FILE: nomad_jobs/misc/gcp-dns-updater/requirements.txt
================================================
google-cloud-dns
requests
google-auth

================================================
FILE: nomad_jobs/misc/gcp-dns-updater/update_dns.py
================================================

import os
import requests
import logging
import sys
import base64
import json
import time  # Moved import to top

# Import GCP specific libraries
from google.cloud import dns
from google.oauth2 import service_account
from google.api_core.exceptions import GoogleAPIError

# Setup logging
logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')

def get_env_vars():
    """Reads required environment variables and returns them."""
    project_id = os.environ.get('GCP_PROJECT_ID')
    zone_name = os.environ.get('GCP_DNS_ZONE_NAME') # This will be the TLD like "demonsafe.com"
    record_name = os.environ.get('GCP_DNS_RECORD_NAME')
    key_b64 = os.environ.get('GCP_SERVICE_ACCOUNT_KEY_B64') # Changed variable name

    if not all([project_id, zone_name, record_name, key_b64]): # Check for key_b64
        missing = [var for var, val in [
            ('GCP_PROJECT_ID', project_id),
            ('GCP_DNS_ZONE_NAME', zone_name),
            ('GCP_DNS_RECORD_NAME', record_name),
            ('GCP_SERVICE_ACCOUNT_KEY_B64', key_b64) # Updated missing check
        ] if not val]
        logging.error(f"Missing required environment variables: {', '.join(missing)}")
        sys.exit(1)

    return project_id, zone_name, record_name, key_b64 # Return key_b64

def get_public_ip():
    """Fetches the public IPv4 address."""
    try:
        response = requests.get('https://v4.ifconfig.me/ip', timeout=10)
        response.raise_for_status()  # Raise an exception for bad status codes
        ip_address = response.text.strip()
        logging.info(f"Successfully fetched public IP: {ip_address}")
        return ip_address
    except requests.exceptions.RequestException as e:
        logging.error(f"Error fetching public IP: {e}")
        sys.exit(1) # Exit if IP cannot be fetched

def get_dns_client(key_b64: str, project_id: str): # Changed key_path to key_b64 and added project_id
    """Creates and returns a DNS client authenticated with a base64 encoded service account key."""
    try:
        # Decode the base64 string
        logging.info("Decoding base64 service account key...")
        decoded_key = base64.b64decode(key_b64)
        logging.info("Base64 key decoded successfully.")

        # Parse the decoded JSON key
        logging.info("Parsing service account key JSON...")
        key_info = json.loads(decoded_key)
        logging.info("Service account key JSON parsed successfully.")

        # Create credentials from the parsed key info
        credentials = service_account.Credentials.from_service_account_info(key_info)

        # Use the provided project_id, not the one from credentials, to ensure consistency
        client = dns.Client(project=project_id, credentials=credentials)
        logging.info(f"Successfully created DNS client for project {project_id}")
        return client

    except base64.binascii.Error as e:
        logging.error(f"Failed to decode base64 service account key: {e}")
        sys.exit(1)
    except json.JSONDecodeError as e:
        logging.error(f"Failed to parse service account key JSON: {e}")
        sys.exit(1)
    except Exception as e:
        logging.error(f"Failed to create DNS client from service account info: {e}")
        sys.exit(1)

def update_dns_record(client: dns.Client, project_id: str, zone_name: str, record_name: str, ip_address: str):
    """
    Checks and updates/creates an A record for the given name in the specified zone,
    replacing a CNAME if necessary.

    Args:
        client: Authenticated DNS client.
        project_id: GCP project ID.
        zone_name: The domain TLD (e.g., "demonsafe.com"). This will be converted
                   to the GCP zone name format (e.g., "demonsafe-com").
        record_name: The specific record to update (e.g., "*.demonsafe.com").
        ip_address: The public IP address to set.
    """
    try:
        # Convert the TLD zone name (e.g., "demonsafe.com") to GCP zone name format (e.g., "demonsafe-com")
        gcp_zone_name = zone_name.replace('.', '-')
        logging.info(f"Targeting GCP DNS Zone: {gcp_zone_name}")

        zone = client.zone(gcp_zone_name, project_id)
        if not zone.exists():
            logging.error(f"DNS zone '{gcp_zone_name}' not found in project '{project_id}'.")
            return # Cannot proceed without the zone

        # Ensure record_name ends with a dot for FQDN matching
        fqdn = record_name if record_name.endswith('.') else f"{record_name}."
        logging.info(f"Checking DNS records for: {fqdn} in zone {gcp_zone_name}")

        record_sets = list(zone.list_resource_record_sets(filter_=f"name={fqdn}"))

        existing_a_record = None
        existing_cname_record = None

        for record_set in record_sets:
            if record_set.record_type == 'A' and record_set.name == fqdn:
                existing_a_record = record_set
                logging.info(f"Found existing A record: {existing_a_record.name} -> {existing_a_record.rrdatas}")
            elif record_set.record_type == 'CNAME' and record_set.name == fqdn:
                existing_cname_record = record_set
                logging.info(f"Found existing CNAME record: {existing_cname_record.name} -> {existing_cname_record.rrdatas}")

        changes = zone.changes()
        needs_update = False

        # Handle existing CNAME (delete it to replace with A)
        if existing_cname_record:
            logging.warning(f"Deleting existing CNAME record {fqdn} to replace with A record.")
            changes.delete_record_set(existing_cname_record)
            needs_update = True
            # Ensure we don't try to delete an A record if we just deleted a CNAME
            existing_a_record = None

        # Define the new A record we want
        new_a_record = zone.resource_record_set(fqdn, "A", 300, [ip_address])

        # Handle existing A record
        if existing_a_record:
            if existing_a_record.rrdatas == [ip_address]:
                logging.info(f"Existing A record {fqdn} already points to {ip_address}. No update needed.")
                return # Nothing to do
            else:
                logging.info(f"Existing A record {fqdn} points to {existing_a_record.rrdatas}. Updating to {ip_address}.")
                changes.delete_record_set(existing_a_record)
                changes.add_record_set(new_a_record)
                needs_update = True
        # Handle case where no A record (and no CNAME was found/deleted)
        elif not existing_cname_record: # Only add if we didn't already decide to replace CNAME
            logging.info(f"No existing A or CNAME record found for {fqdn}. Creating new A record pointing to {ip_address}.")
            changes.add_record_set(new_a_record)
            needs_update = True
        # Handle case where CNAME was found and deleted - we still need to add the A record
        elif existing_cname_record:
             logging.info(f"Adding A record for {fqdn} pointing to {ip_address} after CNAME deletion.")
             changes.add_record_set(new_a_record)
             # needs_update should already be True

        # Execute the changes if any were queued
        if needs_update:
            logging.info(f"Executing DNS changes for {fqdn} in zone {gcp_zone_name}...")
            changes.create()
            # Wait until the changes are finished.
            while changes.status != 'done':
                logging.info(f"Waiting for DNS changes to complete (status: {changes.status})...")
                time.sleep(5) # Wait 5 seconds before checking again
                changes.reload()
            logging.info(f"Successfully updated DNS record {fqdn} to {ip_address} in zone {gcp_zone_name}.")
        else:
            # This case should only be hit if an A record existed and was correct
            logging.info("No DNS changes were necessary.")

    except GoogleAPIError as e:
        logging.error(f"GCP API Error updating DNS record {fqdn} in zone {gcp_zone_name}: {e}")
    except Exception as e:
        logging.error(f"An unexpected error occurred during DNS update for {fqdn} in zone {gcp_zone_name}: {e}")


def update_spf_record(client: dns.Client, project_id: str, zone_name: str, record_name: str, ip_address: str):
    """Updates the SPF TXT record on the bare domain with the current public IP."""
    try:
        gcp_zone_name = zone_name.replace('.', '-')
        logging.info(f"Updating SPF record in zone: {gcp_zone_name}")

        zone = client.zone(gcp_zone_name, project_id)
        if not zone.exists():
            logging.error(f"DNS zone '{gcp_zone_name}' not found in project '{project_id}'.")
            return

        # Derive bare domain from record_name (e.g., "*.demonsafe.com" -> "demonsafe.com.")
        domain = record_name.lstrip('*.') if record_name.startswith('*.') else record_name
        fqdn = domain if domain.endswith('.') else f"{domain}."
        logging.info(f"Checking TXT records for: {fqdn}")

        spf_value = f'"v=spf1 ip4:{ip_address} ~all"'

        record_sets = list(zone.list_resource_record_sets(filter_=f"name={fqdn}"))
        existing_txt = None
        for rs in record_sets:
            if rs.record_type == 'TXT' and rs.name == fqdn:
                existing_txt = rs
                logging.info(f"Found existing TXT record: {rs.name} -> {rs.rrdatas}")
                break

        changes = zone.changes()
        needs_update = False

        if existing_txt:
            new_rrdatas = []
            spf_found = False
            for rd in existing_txt.rrdatas:
                if 'v=spf1' in rd:
                    spf_found = True
                    if ip_address in rd:
                        logging.info(f"SPF record already contains {ip_address}. No update needed.")
                        return
                    logging.info(f"Replacing SPF entry: {rd} -> {spf_value}")
                    new_rrdatas.append(spf_value)
                else:
                    new_rrdatas.append(rd)
            if not spf_found:
                logging.info(f"No existing SPF entry found. Adding: {spf_value}")
                new_rrdatas.append(spf_value)

            changes.delete_record_set(existing_txt)
            new_txt = zone.resource_record_set(fqdn, "TXT", 300, new_rrdatas)
            changes.add_record_set(new_txt)
            needs_update = True
        else:
            logging.info(f"No TXT record found for {fqdn}. Creating with SPF: {spf_value}")
            new_txt = zone.resource_record_set(fqdn, "TXT", 300, [spf_value])
            changes.add_record_set(new_txt)
            needs_update = True

        if needs_update:
            logging.info(f"Executing SPF TXT changes for {fqdn}...")
            changes.create()
            while changes.status != 'done':
                logging.info(f"Waiting for SPF changes to complete (status: {changes.status})...")
                time.sleep(5)
                changes.reload()
            logging.info(f"Successfully updated SPF record for {fqdn} with ip4:{ip_address}")

    except GoogleAPIError as e:
        logging.error(f"GCP API Error updating SPF record: {e}")
    except Exception as e:
        logging.error(f"Unexpected error updating SPF record: {e}")


if __name__ == "__main__":
    logging.info("Starting DNS update script.")
    project_id, zone_name, record_name, key_b64 = get_env_vars()
    public_ip = get_public_ip()

    if public_ip:
        dns_client = get_dns_client(key_b64, project_id)
        if dns_client:
            update_dns_record(dns_client, project_id, zone_name, record_name, public_ip)
            update_spf_record(dns_client, project_id, zone_name, record_name, public_ip)
            logging.info("DNS update script finished.")
        else:
            # Error handled in get_dns_client, it exits
            logging.error("Exiting due to DNS client initialization failure.")
            sys.exit(1) # Explicit exit for clarity
    else:
        # Error handled in get_public_ip, it exits
        logging.error("Exiting due to inability to fetch public IP.")
        sys.exit(1) # Explicit exit for clarity


================================================
FILE: nomad_jobs/misc/gitea/nomad.job
================================================
job "gitea" {
  
  meta {
  job_file = "nomad_jobs/misc/gitea/nomad.job"
  }
region = var.region
  datacenters = ["dc1"]
  type = "service"
    group "svc" {
      count = 1
      volume "gitea-data" {
        type      = "host"
        source    = "gitea-data"
        read_only = false
      }
      volume "gitea-db" {
        type      = "host"
        source    = "gitea-db"
        read_only = false
      }
      restart {
        attempts = 5
        delay    = "30s"
      }
      task "app" {
        driver = "docker"
        volume_mount {
          volume      = "gitea-data"
          destination = "/data"
          read_only   = false
      }
        config {
          image = "gitea/gitea"
          port_map {
            http     = 3000
            ssh_pass = 22
          }
        }
        env = {
          "APP_NAME"   = "Gitea: Git with a cup of tea"
          "RUN_MODE"   = "prod"
          "SSH_DOMAIN" = "git.${var.tld}"
          "SSH_PORT"   = "22"
          "ROOT_URL"   = "http://git.${var.tld}/"
          "USER_UID"   = "1002"
          "USER_GID"   = "1002"
          "DB_TYPE"    = "postgres"
          "DB_NAME"    = "gitea"
          "DB_USER"    = "gitea"
          "DB_PASSWD"  = "gitea"
          "SHOW_REGISTRATION_BUTTON" = "false"
        }
      template {
data = <<EOH
GITEA__database__HOST="{{ env "NOMAD_ADDR_db_db" }}"
EOH
        destination = "local/env"
        env         = true
        }
        resources {
          cpu    = 200
          memory = 256
            network {
              port "http" {}
              port "ssh_pass" {
                static = "2222"
              }
            }
        }
        service {
          name = "gitea"
          port = "http"
          tags = [
            "traefik.enable=true",
            "traefik.http.middlewares.httpsRedirect.redirectscheme.scheme=https",


            "traefik.http.routers.${NOMAD_TASK_NAME}.tls.domains[0].sans=git.${var.tld}",
            "traefik.http.routers.${NOMAD_TASK_NAME}.middlewares=forward-auth"
          ]
        }
      }
      task "db" {
        driver = "docker"
          volume_mount {
            volume      = "gitea-db"
            destination = "/var/lib/postgresql/data"
            read_only   = false
          }
        config {
          image = "postgres:17-alpine"
          port_map {
            db = 5432
          }
        }
        template {
data = <<EOH
POSTGRES_USER="gitea"
POSTGRES_PASSWORD="gitea"
POSTGRES_DB="gitea"
EOH
        destination = "local/env"
        env         = true
        }
        resources {
          cpu    = 200
          memory = 128
          network {
            port "db" {}
          }
        }
      }
    }
}
variable "region" {
    type = string
}


variable "tld" {
    type = string
}


================================================
FILE: nomad_jobs/misc/linuxgsm/nomad.job
================================================
job "linuxgsm" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/misc/linuxgsm/nomad.job"
version = "2"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "gaming" {
    count = 1

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    task "linuxgsm" {
      driver = "docker"
      config {
        image = "gameservermanagers/linuxgsm-docker"
        network_mode = "host"
        command = "/home/linuxgsm/rustserver"
        args = ["start"]
        volumes = [
          "${var.shared_dir}linuxgsm:/home/linuxgsm",
        ]
      }

      service {
        port = "port0"
	name = "linuxgsm"
      }

      env {
        GAMESERVER = "rustserver"
        LGSM_GITHUBUSER = "GameServerManagers"
        LGSM_GITHUBREPO = "LinuxGSM"
        LGSM_GITHUBBRANCH = "master"
      }

      resources {
        cpu    = 100
        memory = 8000
        network {
          port "port0" { static = "27015" }
          port "port1" { static = "27020" }
          port "port2" { static = "27005" }
        }
      }
    }
  }
}

variable "region" {
    type = string
}


variable "tld" {
    type = string
}

variable "shared_dir" {
    type = string
}


================================================
FILE: nomad_jobs/misc/murmur/nomad.job
================================================
job "murmur" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/misc/murmur/nomad.job"
service_owner = "@pmanuk"
    version = "2"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "chat" {
    count = 1

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    task "mumble-server" {
      driver = "docker"
      config {
        image = "vimagick/murmur"
        force_pull = true
        network_mode = "host"
        volumes = [
          "${var.shared_dir}murmur-data:/opt/murmur/data",
          "${var.shared_dir}murmur-cert:/opt/murmur/cert",
          "local/murmur-config:/etc/murmur/murmur.ini",
        ]
      }

      service {
         tags = [
          "traefik.enable=true",
          "traefik.tcp.routers.${NOMAD_TASK_NAME}.rule=HostSNI(`mumble-server.${var.tld}`)",
          "traefik.tcp.services.${NOMAD_TASK_NAME}.loadbalancer.server.port=${NOMAD_PORT_0}",
          "traefik.tcp.routers.${NOMAD_TASK_NAME}.entrypoints=mumble",
          "traefik.tcp.routers.${NOMAD_TASK_NAME}.tls.passthrough=true",
          "traefik.udp.routers.${NOMAD_TASK_NAME}.service=mumble-server",
          "traefik.udp.services.${NOMAD_TASK_NAME}.loadbalancer.server.port=${NOMAD_PORT_0}",
          "traefik.udp.routers.${NOMAD_TASK_NAME}.entrypoints=mumble-udp",
         ]
         name = "mumble-server"
         port = "0"
      }

      env {
        TZ = "Europe/Amsterdam"
      }

      template {
data = <<EOH
; Murmur configuration file.
;
; General notes:
; * Settings in this file are default settings and many of them can be overridden
;   with virtual server specific configuration via the Ice or DBus interface.
; * Due to the way this configuration file is read some rules have to be
;   followed when specifying variable values (as in variable = value):
;     * Make sure to quote the value when using commas in strings or passwords.
;        NOT variable = super,secret BUT variable = "super,secret"
;     * Make sure to escape special characters like '\' or '"' correctly
;        NOT variable = """ BUT variable = "\""
;        NOT regex = \w* BUT regex = \\w*

; Path to database. If blank, will search for
; murmur.sqlite in default locations or create it if not found.
database=

; Murmur defaults to using SQLite with its default rollback journal.
; In some situations, using SQLite's write-ahead log (WAL) can be
; advantageous.
; If you encounter slowdowns when moving between channels and similar
; operations, enabling the SQLite write-ahead log might help.
;
; To use SQLite's write-ahead log, set sqlite_wal to one of the following
; values:
;
; 0 - Use SQLite's default rollback journal.
; 1 - Use write-ahead log with synchronous=NORMAL.
;     If Murmur crashes, the database will be in a consistent state, but
;     the most recent changes might be lost if the operating system did
;     not write them to disk yet. This option can improve Murmur's
;     interactivity on busy servers, or servers with slow storage.
; 2 - Use write-ahead log with synchronous=FULL.
;     All database writes are synchronized to disk when they are made.
;     If Murmur crashes, the database will be include all completed writes.
;sqlite_wal=0

; If you wish to use something other than SQLite, you'll need to set the name
; of the database above, and also uncomment the below.
; Sticking with SQLite is strongly recommended, as it's the most well tested
; and by far the fastest solution.
;
;dbDriver=QMYSQL
;dbUsername=
;dbPassword=
;dbHost=
;dbPort=
;dbPrefix=murmur_
;dbOpts=

; Murmur defaults to not using D-Bus. If you wish to use dbus, which is one of the
; RPC methods available in Murmur, please specify so here.
;
;dbus=session

; Alternate D-Bus service name. Only use if you are running distinct
; murmurd processes connected to the same D-Bus daemon.
;dbusservice=net.sourceforge.mumble.murmur

; If you want to use ZeroC Ice to communicate with Murmur, you need
; to specify the endpoint to use. Since there is no authentication
; with ICE, you should only use it if you trust all the users who have
; shell access to your machine.
; Please see the ICE documentation on how to specify endpoints.
ice="tcp -h 127.0.0.1 -p 6502"

; Ice primarily uses local sockets. This means anyone who has a
; user account on your machine can connect to the Ice services.
; You can set a plaintext "secret" on the Ice connection, and
; any script attempting to access must then have this secret
; (as context with name "secret").
; Access is split in read (look only) and write (modify)
; operations. Write access always includes read access,
; unless read is explicitly denied (see note below).
;
; Note that if this is uncommented and with empty content,
; access will be denied.

;icesecretread=
icesecretwrite=

; If you want to expose Murmur's experimental gRPC API, you
; need to specify an address to bind on.
; Note: not all builds of Murmur support gRPC. If gRPC is not
; available, Murmur will warn you in its log output.
;grpc="127.0.0.1:50051"
; Specifying both a certificate and key file below will cause gRPC to use
; secured, TLS connections.
; When using secured connections you need to also set the list of authorized
; clients. grpcauthorized is a space delimited list of SHA256 fingerprints
; for authorized client certificates.
; Get this from the command line:
; openssl x509 -in cert.pem -SHA256 -noout -fingerprint
;grpccert=""
;grpckey=""
;grpcauthorized=""

; Specifies the file Murmur should log to. By default, Murmur
; logs to the file 'murmur.log'. If you leave this field blank
; on Unix-like systems, Murmur will force itself into foreground
; mode which logs to the console.
;logfile=murmur.log

; If set, Murmur will write its process ID to this file
; when running in daemon mode (when the -fg flag is not
; specified on the command line). Only available on
; Unix-like systems.
;pidfile=

; The below will be used as defaults for new configured servers.
; If you're just running one server (the default), it's easier to
; configure it here than through D-Bus or Ice.
;
; Welcome message sent to clients when they connect.
; If the welcome message is set to an empty string,
; no welcome message will be sent to clients.
welcometext="<br />Welcome to this server running <b>Murmur</b>.<br />Enjoy your stay!<br />"

; The welcometext can also be read from an external file which might be useful
; if you want to specify a rather lengthy text. If a value for welcometext is
; set, the welcometextfile will not be read.
;welcometextfile=

; Port to bind TCP and UDP sockets to.
port={{ env "NOMAD_PORT_0" }}

; Specific IP or hostname to bind to.
; If this is left blank (default), Murmur will bind to all available addresses.
;host=

; Password to join server.
serverpassword=

; Maximum bandwidth (in bits per second) clients are allowed
; to send speech at.
bandwidth=558000

; Murmur and Mumble are usually pretty good about cleaning up hung clients, but
; occasionally one will get stuck on the server. The timeout setting will cause
; a periodic check of all clients who haven't communicated with the server in
; this many seconds - causing zombie clients to be disconnected.
;
; Note that this has no effect on idle clients or people who are AFK. It will
; only affect people who are already disconnected, and just haven't told the
; server.
;timeout=30

; Maximum number of concurrent clients allowed.
users=100

; Where users sets a blanket limit on the number of clients per virtual server,
; usersperchannel sets a limit on the number per channel. The default is 0, for
; no limit.
;usersperchannel=0

; Per-user rate limiting
;
; These two settings allow to configure the per-user rate limiter for some
; command messages sent from the client to the server. The messageburst setting
; specifies an amount of messages which are allowed in short bursts. The
; messagelimit setting specifies the number of messages per second allowed over
; a longer period. If a user hits the rate limit, his packages are then ignored
; for some time. Both of these settings have a minimum of 1 as setting either to
; 0 could render the server unusable.
messageburst=5
messagelimit=1

; Respond to UDP ping packets.
;
; Setting to true exposes the current user count, the maximum user count, and
; the server's maximum bandwidth per client to unauthenticated users. In the
; Mumble client, this information is shown in the Connect dialog.
allowping=true

; Amount of users with Opus support needed to force Opus usage, in percent.
; 0 = Always enable Opus, 100 = enable Opus if it's supported by all clients.
;opusthreshold=100

; Maximum depth of channel nesting. Note that some databases like MySQL using
; InnoDB will fail when operating on deeply nested channels.
;channelnestinglimit=10

; Maximum number of channels per server. 0 for unlimited. Note that an
; excessive number of channels will impact server performance
;channelcountlimit=1000

; Regular expression used to validate channel names.
; (Note that you have to escape backslashes with \ )
;channelname=[ \\-=\\w\\#\\[\\]\\{\\}\\(\\)\\@\\|]+

; Regular expression used to validate user names.
; (Note that you have to escape backslashes with \ )
;username=[-=\\w\\[\\]\\{\\}\\(\\)\\@\\|\\.]+

; If a user has no stored channel (they've never been connected to the server
; before, or rememberchannel is set to false) and the client hasn't been given
; a URL that includes a channel path, the default behavior is that they will
; end up in the root channel.
;
; You can set this setting to a channel ID, and the user will automatically be
; moved into that channel instead. Note that this is the numeric ID of the
; channel, which can be a little tricky to get (you'll either need to use an
; RPC mechanism, watch the console of a debug client, or root around through
; the Murmur Database to get it).
;
;defaultchannel=0

; When a user connects to a server they've already been on, by default the
; server will remember the last channel they were in and move them to it
; automatically. Toggling this setting to false will disable that feature.
;
;rememberchannel=true

; How many seconds should the server remember the last channel of a user.
; Set to 0 (default) to remember forever. This option has no effect if
; rememberchannel is set to false.
;rememberchannelduration=0

; Maximum length of text messages in characters. 0 for no limit.
;textmessagelength=5000

; Maximum length of text messages in characters, with image data. 0 for no limit.
;imagemessagelength=131072

; Allow clients to use HTML in messages, user comments and channel descriptions?
;allowhtml=true

; Murmur retains the per-server log entries in an internal database which
; allows it to be accessed over D-Bus/ICE.
; How many days should such entries be kept?
; Set to 0 to keep forever, or -1 to disable logging to the DB.
;logdays=31

; To enable public server registration, the serverpassword must be blank, and
; this must all be filled out.
; The password here is used to create a registry for the server name; subsequent
; updates will need the same password. Don't lose your password.
; The URL is your own website, and only set the registerHostname for static IP
; addresses.
; Location is typically the country of typical users of the server, in
; two-letter TLD style (ISO 3166-1 alpha-2 country code)
;
; If you only wish to give your "Root" channel a custom name, then only
; uncomment the 'registerName' parameter.
;
;registerName=Mumble Server
;registerPassword=secret
;registerUrl=http://www.mumble.info/
;registerHostname=
;registerLocation=

; If this option is enabled, the server will announce its presence via the
; bonjour service discovery protocol. To change the name announced by bonjour
; adjust the registerName variable.
; See http://developer.apple.com/networking/bonjour/index.html for more information
; about bonjour.
;bonjour=True

; If you have a proper SSL certificate, you can provide the filenames here.
; Otherwise, Murmur will create its own certificate automatically.
;sslCert=
;sslKey=

; If the keyfile specified above is encrypted with a passphrase, you can enter
; it in this setting. It must be plaintext, so you may wish to adjust the
; permissions on your murmur.ini file accordingly.
;sslPassPhrase=

; If your certificate is signed by an authority that uses a sub-signed or
; "intermediate" certificate, you probably need to bundle it with your
; certificate in order to get Murmur to accept it. You can either concatenate
; the two certificates into one file, or you can put it in a file by itself and
; put the path to that PEM-file in sslCA.
;sslCA=

; The sslDHParams option allows you to specify a PEM-encoded file with
; Diffie-Hellman parameters, which will be used as the default Diffie-
; Hellman parameters for all virtual servers.
;
; Instead of pointing sslDHParams to a file, you can also use the option
; to specify a named set of Diffie-Hellman parameters for Murmur to use.
; Murmur comes bundled with the Diffie-Hellman parameters from RFC 7919.
; These parameters are available by using the following names:
;
; @ffdhe2048, @ffdhe3072, @ffdhe4096, @ffdhe6144, @ffdhe8192
;
; By default, Murmur uses @ffdhe2048.
;sslDHParams=@ffdhe2048

; The sslCiphers option chooses the cipher suites to make available for use
; in SSL/TLS. This option is server-wide, and cannot be set on a
; per-virtual-server basis.
;
; This option is specified using OpenSSL cipher list notation (see
; https://www.openssl.org/docs/apps/ciphers.html#CIPHER-LIST-FORMAT).
;
; It is recommended that you try your cipher string using 'openssl ciphers <string>'
; before setting it here, to get a feel for which cipher suites you will get.
;
; After setting this option, it is recommend that you inspect your Murmur log
; to ensure that Murmur is using the cipher suites that you expected it to.
;
; Note: Changing this option may impact the backwards compatibility of your
; Murmur server, and can remove the ability for older Mumble clients to be able
; to connect to it.
;sslCiphers=EECDH+AESGCM:EDH+aRSA+AESGCM:DHE-RSA-AES256-SHA:DHE-RSA-AES128-SHA:AES256-SHA:AES128-SHA

; If Murmur is started as root, which user should it switch to?
; This option is ignored if Murmur isn't started with root privileges.
;uname=

; By default, in log files and in the user status window for privileged users,
; Mumble will show IP addresses - in some situations you may find this unwanted
; behavior. If obfuscate is set to true, Murmur will randomize the IP addresses
; of connecting users.
;
; The obfuscate function only affects the log file and DOES NOT effect the user
; information section in the client window.
;obfuscate=false

; If this options is enabled, only clients which have a certificate are allowed
; to connect.
;certrequired=False

; If enabled, clients are sent information about the servers version and operating
; system.
;sendversion=True

; You can set a recommended minimum version for your server, and clients will
; be notified in their log when they connect if their client does not meet the
; minimum requirements. suggestVersion expects the version in the format X.X.X.
;
; Note that the suggest* options appeared after 1.2.3 and will have no effect
; on client versions 1.2.3 and earlier.
;
;suggestVersion=

; Setting this to "true" will alert any user who does not have positional audio
; enabled that the server administrators recommend enabling it. Setting it to
; "false" will have the opposite effect - if you do not care whether the user
; enables positional audio or not, set it to blank. The message will appear in
; the log window upon connection, but only if the user's settings do not match
; what the server requests.
;
; Note that the suggest* options appeared after 1.2.3 and will have no effect
; on client versions 1.2.3 and earlier.
;
;suggestPositional=

; Setting this to "true" will alert any user who does not have Push-To-Talk
; enabled that the server administrators recommend enabling it. Setting it to
; "false" will have the opposite effect - if you do not care whether the user
; enables PTT or not, set it to blank. The message will appear in the log
; window upon connection, but only if the user's settings do not match what the
; server requests.
;
; Note that the suggest* options appeared after 1.2.3 and will have no effect
; on client versions 1.2.3 and earlier.
;
;suggestPushToTalk=

; This sets password hash storage to legacy mode (1.2.4 and before)
; (Note that setting this to true is insecure and should not be used unless absolutely necessary)
;legacyPasswordHash=false

; By default a strong amount of PBKDF2 iterations are chosen automatically. If >0 this setting
; overrides the automatic benchmark and forces a specific number of iterations.
; (Note that you should only change this value if you know what you are doing)
;kdfIterations=-1

; In order to prevent misconfigured, impolite or malicious clients from
; affecting the low-latency of other users, Murmur has a rudimentary global-ban
; system. It's configured using the autobanAttempts, autobanTimeframe and
; autobanTime settings.
;
; If a client attempts autobanAttempts connections in autobanTimeframe seconds,
; they will be banned for autobanTime seconds. This is a global ban, from all
; virtual servers on the Murmur process. It will not show up in any of the
; ban-lists on the server, and they can't be removed without restarting the
; Murmur process - just let them expire. A single, properly functioning client
; should not trip these bans.
;
; To disable, set autobanAttempts or autobanTimeframe to 0. Commenting these
; settings out will cause Murmur to use the defaults:
;
; To avoid autobanning successful connection attempts from the same IP address,
; set autobanSuccessfulConnections=False.
;
;autobanAttempts=10
;autobanTimeframe=120
;autobanTime=300
;autobanSuccessfulConnections=True

; Enables logging of group changes. This means that every time a group in a
; channel changes, the server will log all groups and their members from before
; the change and after the change. Deault is false. This option was introduced
; with Murmur 1.4.0.
;
;loggroupchanges=false

; Enables logging of ACL changes. This means that every time the ACL in a
; channel changes, the server will log all ACLs from before the change and
; after the change. Default is false. This option was introduced with Murmur
; 1.4.0.
;
;logaclchanges=false

; You can configure any of the configuration options for Ice here. We recommend
; leave the defaults as they are.
; Please note that this section has to be last in the configuration file.
;
[Ice]
Ice.Warn.UnknownProperties=1
Ice.MessageSizeMax=65536

EOH
        destination = "local/murmur-config"
        env         = false
      }

      resources {
        cpu    = 100
        memory = 128
        network {
          port "0" {}
        }
      }
    }
  }
}

variable "region" {
    type = string
}


variable "tld" {
    type = string
}

variable "shared_dir" {
    type = string
}

variable "auth" {
    type = string
}


================================================
FILE: nomad_jobs/misc/octoprint/nomad.job
================================================
job "octoprint" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/misc/octoprint/nomad.job"
version = "6"
  }

  constraint {
    attribute = "${meta.3d_printer}"
    operator  = "="
    value     = "true"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "3dprinter" {
    count = 1 

    network {
      port "web" {
        host_network = "tailscale"
        to = "5000"
      }
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "octoprint" {
      driver = "docker"
      config {
        image = "octoprint/octoprint"
        force_pull = true
        #network_mode = "host"
        privileged = true
        ports = ["web"]
        volumes = [
          "${var.shared_dir}octoprint:/home/octoprint/.octoprint",
          "/dev/ttyUSB0:/dev/ttyUSB0",
        ]
      }

      service {
        port = "web"
	name = "octoprint"
        tags = [
          "traefik.enable=true",
          "traefik.http.middlewares.cors.headers.accesscontrolallowmethods=GET,OPTIONS,PUT",
          "traefik.http.middlewares.cors.headers.accesscontrolalloworigin=origin-list-or-null",
          "traefik.http.middlewares.cors.headers.accesscontrolmaxage=100",
          "traefik.http.middlewares.cors.headers.addvaryheader=true",


          "traefik.http.middlewares.malpotAuth.basicauth.users=${var.auth}",
          "traefik.http.routers.${NOMAD_TASK_NAME}.middlewares=forward-auth"
        ]
        check {
          type     = "http"
          path     = "/"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      env {
        TZ = "Europe/Amsterdam"
      }

      resources {
        cpu    = 100
        memory = 1024
      }
    }
  }
}

variable "region" {
    type = string
}


variable "tld" {
    type = string
}

variable "shared_dir" {
    type = string
}


================================================
FILE: nomad_jobs/misc/uploader/nomad.job
================================================
job "uploader" {
  region = var.region
  datacenters = ["dc1"]
  type = "service"
  meta {
      job_file = "nomad_jobs/misc/uploader/nomad.job"
version = "5"
  }

  group "webserver" {
    count = 1

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }
    task "uploader" {
      driver = "docker"

      service {
        name = "uploader"
        tags = [
          "traefik.enable=true",
          "traefik.http.middlewares.httpsRedirect.redirectscheme.scheme=https",


          "traefik.http.routers.${NOMAD_TASK_NAME}.tls.domains[0].sans=${NOMAD_TASK_NAME}.${var.tld}",
          "traefik.http.routers.${NOMAD_TASK_NAME}.middlewares=forward-auth"
        ]
        port = "http"

        check {
          type     = "tcp"
          interval = "10s"
          timeout  = "2s"
        }
      }

      config {
        image = "docker-registry.${var.tld}/uploader:latest"
        network_mode = "host"
        volumes = [
          "${var.shared_dir}uploader:/data",
        ]
      }
      template {
data = <<EOH
UPLOADER_RS_FILES_DIR=/data
UPLOADER_RS_BINDING={{env "NOMAD_ADDR_http" }}
EOH
        destination = "local/env"
        env         = true
      }

      resources {
        cpu = 100
        memory = 16
        network {
          port "http" {} 
        }
      }
    }
  }
}


================================================
FILE: nomad_jobs/observability/alertmanager/nomad.job
================================================
job "alertmanager" {
  region = var.region
  datacenters = ["dc1"]
  type = "service"

  meta {
    job_file = "nomad_jobs/observability/alertmanager/nomad.job"
    version = "13"  // Switch from Pushover to ntfy
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  update {
    max_parallel     = 1
    min_healthy_time = "30s"
    healthy_deadline = "5m"
    progress_deadline = "10m"
    auto_revert      = true
  }

  group "alerting" {
    count = 1
    
    ephemeral_disk {
      sticky = true
    }

    volume "alertmanager" {
      type      = "csi"
      read_only = false
      source    = "alertmanager"
      access_mode = "multi-node-single-writer"
      attachment_mode = "file-system"
    }
    network {
      port "http" {
        static = "9093"
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    task "prep-disk" {
      driver = "docker"
      volume_mount {
        volume      = "alertmanager"
        destination = "/volume/"
        read_only   = false
      }
      config {
        image        = "busybox:latest"
        command      = "sh"
        args         = ["-c", "chown -R 1000:2000 /volume/ && chmod -R 755 /volume/"]
      }
      resources {
        cpu    = 200
        memory = 128
      }

      lifecycle {
        hook    = "prestart"
        sidecar = false
      }
    }

    task "alertmanager" {
      driver = "docker"
      user = "1000:2000"

      volume_mount {
        volume      = "alertmanager"
        destination = "/alertmanager"
        read_only   = false
      }
      
      service {
        name = "alertmanager"
        port = "http"
        tags = [
          "traefik.enable=true"
        ]

        check {
          type     = "tcp"
          port     = "http"
          interval = "10s"
          timeout  = "2s"
        }
      }

      config {
        image = "prom/alertmanager:v0.32.0"
        network_mode = "host"
        ports = ["http"]
        force_pull = true
        args = ["--web.external-url", "https://alertmanager.${var.tld}", "--config.file", "/local/config.yml", "--storage.path", "/alertmanager", "--web.listen-address", "0.0.0.0:9093"]
      }

      template {
        left_delimiter = "{{{"
        right_delimiter = "}}}"
        data = <<EOH
global:
  smtp_smarthost: 'smtp.service.home:25'
  smtp_from: 'alertmanager@example.org'

route:
  group_by: ['alertname', 'cluster', 'service', 'service_name', 'service_id']
  group_wait: 10s
  group_interval: 10s
  repeat_interval: 12h
  receiver: 'ntfy'

  routes:
  - match:
      severity: critical
    receiver: 'ntfy'
    group_wait: 5s
    group_interval: 5s
    repeat_interval: 15m
  - match:
      severity: warning
    receiver: 'ntfy'
    group_wait: 30s
    group_interval: 30s
    repeat_interval: 1h
  - match:
      severity: page
    receiver: 'ntfy'
    group_wait: 5s
    group_interval: 5s
    repeat_interval: 30m
  - match_re:
      alertname: ".*Down.*"
    receiver: 'ntfy'
    group_wait: 5s
    group_interval: 5s
    repeat_interval: 15m

receivers:
- name: 'email'
  email_configs:
  - to: 'pmanuk@perrymanuk.com'

- name: 'ntfy'
  webhook_configs:
  - url: 'http://{{{ range service "ntfy" }}}{{{ .Address }}}:{{{ .Port }}}{{{ end }}}/homelab-alerts?template=alerts'
    send_resolved: true

EOH

        destination = "local/config.yml"
        env         = false
      }

      resources {
        cpu    = 100
        memory = 64
      }
    }
  }
}

variable "region" {
  type = string
}

variable "tld" {
  type = string
}


================================================
FILE: nomad_jobs/observability/alertmanager/volume.hcl
================================================
id        = "alertmanager"
name      = "alertmanager"
type      = "csi"
plugin_id = "org.democratic-csi.iscsi"

capacity_max = "1GB"
capacity_min = "100MB"

capability {
  access_mode     = "multi-node-single-writer"
  attachment_mode = "file-system"
}

mount_options {
  fs_type = "ext4"
}

parameters {
  fsType = "ext4"
}

================================================
FILE: nomad_jobs/observability/blackbox-exporter/nomad.job
================================================
job "blackbox-exporter" {
  
  meta {
  job_file = "nomad_jobs/observability/blackbox-exporter/nomad.job"
  }
region      = var.region
  datacenters = ["dc1"]
  type = "system"

  group "blackbox-exporter" {

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      canary           = 1
      min_healthy_time = "30s"
      healthy_deadline = "8m"
      auto_revert      = true
    }

    task "blackbox_exporter" {
      driver = "docker"
      service {
        tags = ["net-internal", "blackbox-exporter", "metrics"]
        name = "blackbox-exporter"
        port = "http"

        check {
          type     = "tcp"
          interval = "5s"
          timeout  = "2s"
        }
      }

      config {
        image = "prom/blackbox-exporter:v0.28.0"
        network_mode = "host"
        args = [
          "--config.file=/local/config.yaml",
          "--web.listen-address=${NOMAD_ADDR_http}",
        ]

      }
      template {
data = <<EOH
modules:
  http_2xx:
    prober: http
    timeout: 10s
    http:
      valid_http_versions: ["HTTP/1.1", "HTTP/2"]
      valid_status_codes: []  # Defaults to 2xx
      method: GET
      no_follow_redirects: false
      fail_if_ssl: false
      fail_if_not_ssl: false
      tls_config:
        insecure_skip_verify: false
      preferred_ip_protocol: "ip4" # defaults to "ip6"
  tls_tcp:
    prober: tcp
    timeout: 10s
    tcp:
      tls: false
      preferred_ip_protocol: ip4
  dns_consul:
    prober: dns
    dns:
      preferred_ip_protocol: "ip4"
      query_name: "consul.service.consul"
      query_type: "MX"
  dns_google_com:
    prober: dns
    dns:
      preferred_ip_protocol: "ip4"
      query_name: "www.google.com"
      query_type: "MX"
  dns_vault:
    prober: dns
    dns:
      preferred_ip_protocol: "ip4"
      query_name: "vault.service.consul"
      query_type: "MX"

EOH
        destination = "local/config.yaml"
         env         = false
      }
      resources {
        cpu    = 100
        memory = 64

        network {
          port "http" { static = 9115 }
        }
      }
    }
  }
}

variable "region" {
    type = string
}


================================================
FILE: nomad_jobs/observability/grafana/nomad.job
================================================
job "grafana" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/observability/grafana/nomad.job"
version = "4"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "monitoring" {
    count = 1 

    network {
      port "http" {
        static = "3000"
        host_network = "tailscale"
      }
    }

    volume "grafana" {
      type      = "csi"
      read_only = false
      source    = "grafana"
      access_mode = "single-node-writer"
      attachment_mode = "file-system"
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "prep-disk" {
      driver = "docker"
      volume_mount {
        volume      = "grafana"
        destination = "/volume/"
        read_only   = false
      }
      config {
        image        = "busybox:latest"
        command      = "sh"
        args         = ["-c", "chown -R 1000:1000 /volume/"]
      }
      resources {
        cpu    = 200
        memory = 128
      }

      lifecycle {
        hook    = "prestart"
        sidecar = false
      }
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "grafana" {
      driver = "docker"
      user = "1000:1000"
      config {
        image = "grafana/grafana:12.4.3"
        userns_mode = "host"
        volumes = [
          "${var.shared_dir}grafana/config:/etc/grafana/",
        ]

        network_mode = "host"
      }
      volume_mount {
        volume      = "grafana"
        destination = "/var/lib/grafana"
        read_only   = false
      }
      env {
        GF_PATHS_DATA = "/var/lib/grafana"
        GF_AUTH_BASIC_ENABLED = "false"
        GF_INSTALL_PLUGINS = "grafana-piechart-panel"
      }
      service {
        port = "http"
	name = "grafana"
        tags = [
          "traefik.enable=true",
          "traefik.http.routers.${NOMAD_TASK_NAME}.tls.domains[0].sans=${NOMAD_TASK_NAME}.${var.tld}",
          "traefik.http.routers.${NOMAD_TASK_NAME}.middlewares=forward-auth"
        ] 
        check {
          type     = "http"
          path     = "/"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 100
        memory = 128
      }
    }
  }
}

variable "region" {
    type = string
}


variable "tld" {
    type = string
}

variable "shared_dir" {
    type = string
}


================================================
FILE: nomad_jobs/observability/grafana/volume.hcl
================================================
id           = "grafana"
external_id  = "grafana"
name         = "grafana"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "1GiB"
capacity_max = "1GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}


================================================
FILE: nomad_jobs/observability/loki/nomad.job
================================================
job "loki" {
  
  meta {
  job_file = "nomad_jobs/observability/loki/nomad.job"
  }
region      = var.region
  datacenters = ["dc1"]
  type        = "service"

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "loki" {
    network {
      port "loki" {
        host_network = "tailscale"
        static = 3100
      }
    }

    volume "loki" {
      type      = "csi"
      read_only = false
      source    = "loki"
      access_mode = "single-node-writer"
      attachment_mode = "file-system"
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "prep-disk" {
      driver = "docker"
      volume_mount {
        volume      = "loki"
        destination = "/volume/"
        read_only   = false
      }
      config {
        image        = "busybox:latest"
        command      = "sh"
        args         = ["-c", "chown -R 10001:10001 /volume/"]
      }
      resources {
        cpu    = 200
        memory = 128
      }

      lifecycle {
        hook    = "prestart"
        sidecar = false
      }
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "loki" {
      user = "10001:10001"
      driver = "docker"
      config {
        image = "grafana/loki:3.7.1"
        args = [
          "-config.file",
          "local/loki/local-config.yaml",
        ]
        ports = ["loki"]
      }
      volume_mount {
        volume      = "loki"
        destination = "/loki"
        read_only   = false
      }
      service {
        name = "loki"
        port = "loki"
        check {
          name     = "Loki healthcheck"
          port     = "loki"
          type     = "http"
          path     = "/ready"
          interval = "20s"
          timeout  = "5s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
        tags = []
      }
      template {
        data = <<EOH
auth_enabled: false
server:
  http_listen_port: 3100
ingester:
  lifecycler:
    address: 127.0.0.1
    ring:
      kvstore:
        store: inmemory
      replication_factor: 1
    final_sleep: 0s
  # Any chunk not receiving new logs in this time will be flushed
  chunk_idle_period: 1h
  # All chunks will be flushed when they hit this age, default is 1h
  max_chunk_age: 1h
  # Loki will attempt to build chunks up to 1.5MB, flushing if chunk_idle_period or max_chunk_age is reached first
  chunk_target_size: 1048576
  # Must be greater than index read cache TTL if using an index cache (Default index read cache TTL is 5m)
  chunk_retain_period: 30s
  max_transfer_retries: 0     # Chunk transfers disabled
  wal:
    dir: "/tmp/wal"
schema_config:
  configs:
    - from: 2020-10-24
      store: boltdb-shipper
      object_store: filesystem
      schema: v11
      index:
        prefix: index_
        period: 24h
storage_config:
  boltdb_shipper:
    active_index_directory: /loki/boltdb-shipper-active
    cache_location: /loki/boltdb-shipper-cache
    cache_ttl: 24h         # Can be increased for faster performance over longer query periods, uses more disk space
    shared_store: filesystem
  filesystem:
    directory: /loki/chunks
compactor:
  working_directory: /tmp/loki/boltdb-shipper-compactor
  shared_store: filesystem
limits_config:
  reject_old_samples: true
  reject_old_samples_max_age: 168h
chunk_store_config:
  max_look_back_period: 0s
table_manager:
  retention_deletes_enabled: false
  retention_period: 0s
EOH
        destination = "local/loki/local-config.yaml"
      }
      resources {
        cpu    = 500
        memory = 256
      }
    }
  }
}

variable "datacenters_dc1" {
  type = list(string)
}
variable "region" {}
variable "shared_dir" {}


================================================
FILE: nomad_jobs/observability/loki/volume.hcl
================================================
id           = "loki"
external_id  = "loki"
name         = "loki"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "1GiB"
capacity_max = "1GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}


================================================
FILE: nomad_jobs/observability/oom-test/nomad.job
================================================
job "oom-test" {
  region      = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/observability/oom-test/nomad.job"
    version  = "3"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "oom-test" {
    count = 1

    network {
      port "http" {
        host_network = "lan"
        to           = "8080"
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel      = 1
      min_healthy_time  = "30s"
      healthy_deadline  = "5m"
      progress_deadline = "10m"
      auto_revert       = true
    }

    task "oom-test" {
      driver = "docker"

      config {
        image   = "python:3.14-slim"
        ports   = ["http"]
        command = "python3"
        args    = ["-c", <<EOH
import http.server
import threading
import time

memory_hog = []

def consume_memory():
    """Gradually consume memory until OOM."""
    time.sleep(30)  # Give the task time to become healthy
    while True:
        # Allocate ~1MB per iteration
        memory_hog.append(b'x' * 1024 * 1024)
        time.sleep(1)

# Start memory consumer in background
threading.Thread(target=consume_memory, daemon=True).start()

# Run a simple HTTP server for health checks
server = http.server.HTTPServer(('0.0.0.0', 8080), http.server.SimpleHTTPRequestHandler)
server.serve_forever()
EOH
        ]
      }

      service {
        port = "http"
        name = "oom-test"
        tags = [
          "traefik.enable=true",
        ]
        check {
          type     = "http"
          path     = "/"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 100
        memory = 64
      }
    }
  }
}

variable "region" {
  type        = string
  description = "Nomad region"
}

variable "tld" {
  type        = string
  description = "Top-level domain for service discovery"
}

variable "shared_dir" {
  type        = string
  description = "Path to shared NFS config directory"
}


================================================
FILE: nomad_jobs/observability/prometheus/README.md
================================================
### Prometheus
This prometheus is configured to scrape any service launched with the service tag `metrics` in addition to scraping all consul/nomad agents and itself.


================================================
FILE: nomad_jobs/observability/prometheus/nomad.job
================================================
job "prometheus" {
  region      = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/observability/prometheus/nomad.job"
    version = "10"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "monitoring" {
    count = 1

    network {
      port "http" {
        static = "9090"
      }
    }

    volume "prometheus" {
      type      = "csi"
      read_only = false
      source    = "prometheus"
      access_mode = "multi-node-single-writer"
      attachment_mode = "file-system"
    }


    task "prep-disk" {
      driver = "docker"
      volume_mount {
        volume      = "prometheus"
        destination = "/volume/"
        read_only   = false
      }
      config {
        image        = "busybox:latest"
        command      = "sh"
        args         = ["-c", "chown -R 1000:2000 /volume/"]
      }
      resources {
        cpu    = 200
        memory = 128
      }

      lifecycle {
        hook    = "prestart"
        sidecar = false
      }
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      healthy_deadline = "5m"
      progress_deadline = "10m"
      auto_revert      = true
    }

    task "prometheus" {
      driver = "docker"
      user = "1000:2000"

      volume_mount {
        volume      = "prometheus"
        destination = "/opt/prometheus"
        read_only   = false
      }

      service {
        name = "prometheus"
        port = "http"
        tags = [
          "traefik.enable=true"
        ]

        check {
          type     = "http"
          path     = "/-/healthy"
          name     = "http"
          interval = "5s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      # main configuration file
      template {
        left_delimiter = "[["
        right_delimiter = "]]"
        data = <<EOH
global:
  scrape_interval:     60s # Set the scrape interval to every 15 seconds. Default is every 1 minute.
  evaluation_interval: 60s # Evaluate rules every 15 seconds. The default is every 1 minute.
  # scrape_timeout is set to the global default (10s).

# Alertmanager configuration
alerting:
  alertmanagers:
  - static_configs:
    - targets:
       - alertmanager.service.consul:9093

# Load rules once and periodically evaluate them according to the global 'evaluation_interval'.
rule_files:
  - "alerts.yml"
  # - "second_rules.yml"

scrape_configs:
  - job_name: 'prometheus'
    static_configs:
      - targets: ['localhost:9090']

  - job_name: 'metrics'
    scrape_interval: 5s
    metrics_path: /metrics
    consul_sd_configs:
      - server: '[[ env "NOMAD_IP_http" ]]:8500'
        tags: ['metrics']
        scheme: http
    relabel_configs:
      - source_labels: ['__meta_consul_dc']
        target_label:  'dc'
      - source_labels: [__meta_consul_service]
        target_label:  'job'
      - source_labels: ['__meta_consul_node']
        target_label:  'host'
      - source_labels: ['__meta_consul_tags']
        target_label: 'tags'
      - source_labels: ['__meta_consul_tags']
        regex: '.*job-(.*?)(,.*)'
        replacement: '${1}'
        target_label: 'job_name'

  - job_name: 'consul-server'
    scrape_interval: 10s
    metrics_path: /v1/agent/metrics
    honor_labels: true
    params:
      format: ['prometheus']
    consul_sd_configs:
      - server: '[[ env "NOMAD_IP_http" ]]:8500'
        services: ['nomad-client']
        scheme: http
    relabel_configs:
      - source_labels: ['__meta_consul_dc']
        target_label:  'dc'
      - source_labels: ['__meta_consul_node']
        target_label:  'host'
      - source_labels: ['__meta_consul_tags']
        target_label: 'tags'
      - source_labels: [__address__]
        action: replace
        regex: ([^:]+):.*
        replacement: $1:8500
        target_label: __address__

  - job_name: 'hass'
    scrape_interval: 60s
    metrics_path: /api/prometheus

    # Long-Lived Access Token
    authorization:
      credentials: ${var.hass_key}

    scheme: http
    static_configs:
      - targets: ['${var.hass_ip}:8123']

  - job_name: 'nomad'
    consul_sd_configs:
    - server: '[[ env "NOMAD_IP_http" ]]:8500'
      services: ['nomad-client']
      tags: ['http']
      scheme: http
    scrape_interval: 10s
    metrics_path: /v1/metrics
    params:
      format: ['prometheus']
    relabel_configs:
      - source_labels: ['__meta_consul_dc']
        target_label:  'dc'
      - source_labels: [__meta_consul_service]
        target_label:  'job'
      - source_labels: ['__meta_consul_node']
        target_label:  'host'

#  - job_name: 'blackbox_http_2xx'
#    metrics_path: /probe
#    scheme: http
#    scrape_interval: 30s
#    scrape_timeout: 10s
#    params:
#      module: [ http_2xx ]
#    static_configs:
#      - targets:
#        - https://www.google.com/
#        - http://prometheus.homelab/
#    relabel_configs:
#      - source_labels: ['__address__']
#        regex: 'https?://(.+?)(/.*)'
#        replacement: '${1}'
#        target_label: 'url'
#      - source_labels: ['__param_target']
#        target_label: 'instance'
#      - source_labels: [__address__]
#        target_label: __param_target
#      - target_label: __address__
#        replacement: blackbox-exporter.service.[[ .region ]]:9115
#      - source_labels: ['__param_target']
#        target_label: 'endpoint'
#
#  - job_name: 'dns_google_com' 
#    metrics_path: /probe   
#    params:                
#      module: [dns_google_com]                                                                 
#    static_configs:        
#      - targets:           
#        - 8.8.8.8
#        - 1.1.1.1
#        labels:                            
#          dc: '[[ .datacenter ]]'        
#          region: '[[ .region ]]'        
#    relabel_configs:       
#      - source_labels: [__address__] 
#        target_label: __param_target 
#      - source_labels: [__param_target] 
#        target_label: instance 
#      - target_label: __address__ 
#        replacement: blackbox-exporter.service.[[ .region ]]:9115

EOH

        destination   = "local/prometheus.yml"
        change_mode   = "signal"
        change_signal = "SIGHUP"
        env           = false
      }

      template {
        change_mode = "noop"
        destination = "local/alerts.yml"
        left_delimiter = "[["
        right_delimiter = "]]"
        data = <<EOH
---
groups:
- name: basic_alerts
  rules:
  - alert: PrometheusDown
    expr: absent(up{job="prometheus"})
    for: 2m
    labels:
      severity: page
      alertname: "PrometheusDown"
    annotations:
      summary: "Prometheus is down"
      description: "Prometheus has been down for more than 2 minutes"
      service: "prometheus"
      
  - alert: NomadClusterDown
    expr: absent(up{job="nomad-client"})
    for: 2m
    labels:
      severity: page
      alertname: "NomadClusterDown"
    annotations:
      summary: "Nomad cluster is unreachable"
      description: "No Nomad metrics available - cluster may be down"
      service: "nomad"
  # Alert for any instance that is unreachable for >5 minutes.
  - alert: InstanceDown
    expr: up{job!="hass"} == 0
    for: 5m
    labels:
      severity: page
    annotations:
      summary: "Instance {{ $labels.instance }} down"
      description: "{{ $labels.instance }} of job {{ $labels.job }} has been down for more than 5 minutes."
  
  - alert: HomeAssistantDown
    expr: up{job="hass"} == 0
    for: 10m
    labels:
      severity: warning
    annotations:
      summary: "Home Assistant is down"  
      description: "Home Assistant at {{ $labels.instance }} has been down for more than 10 minutes."
  # Alert for any device that is over 80% capacity  
  - alert: DiskUsage
    expr: avg(nomad_client_host_disk_used_percent) by (host, device) > 80
    for: 5m
    labels:
      severity: page
    annotations:
      summary: "Host {{ $labels.host }} disk {{ $labels.device }} usage alert"
      description: "{{ $labels.host }} is using over 80% of its device: {{ $labels.device }}"

- name: nomad_allocation_alerts
  rules:
  - alert: NomadJobFailureRate
    expr: rate(nomad_nomad_job_summary_failed[5m]) > 0
    for: 2m
    labels:
      severity: critical
      alertname: "NomadJobFailureRate"
    annotations:
      summary: "Nomad job {{ $labels.exported_job }} is experiencing failures"
      description: "Job {{ $labels.exported_job }} is failing allocations at a rate of {{ $value | printf \"%.2f\" }} per second"
      service: "nomad"
      
  - alert: NomadJobLostRate
    expr: rate(nomad_nomad_job_summary_lost[5m]) > 0
    for: 2m
    labels:
      severity: warning
      alertname: "NomadJobLostRate"
    annotations:
      summary: "Nomad job {{ $labels.exported_job }} is losing allocations"
      description: "Job {{ $labels.exported_job }} is losing allocations at a rate of {{ $value | printf \"%.2f\" }} per second"
      service: "nomad"
      
  - alert: NomadJobQueued
    expr: nomad_nomad_job_summary_queued > 0
    for: 5m
    labels:
      severity: warning
      alertname: "NomadJobQueued"
    annotations:
      summary: "Nomad job {{ $labels.exported_job }} has queued allocations"
      description: "Job {{ $labels.exported_job }} has {{ $value }} allocations queued for over 5 minutes"
      service: "nomad"
      
  - alert: NomadAllocationsRestarting
    expr: rate(nomad_client_allocs_restart[5m]) > 0.1
    for: 2m
    labels:
      severity: warning
      alertname: "NomadAllocationsRestarting"
    annotations:
      summary: "High allocation restart rate on {{ $labels.host }}"
      description: "Allocation restart rate is {{ $value }} per second on {{ $labels.host }}"
      service: "nomad"
      
  - alert: NomadAllocationsOOMKilled
    expr: nomad_client_allocs_oom_killed > 0
    for: 0s
    labels:
      severity: critical
      alertname: "NomadAllocationsOOMKilled"
    annotations:
      summary: "Allocation killed due to OOM on {{ $labels.host }}"
      description: "{{ $value }} allocations were killed due to out-of-memory on {{ $labels.host }}"
      service: "nomad"
      
EOH
      }


      config {
        image = "prom/prometheus:v3.11.2"
        network_mode = "host"
        args = ["--storage.tsdb.path", "/opt/prometheus", "--web.listen-address", "0.0.0.0:9090", "--storage.tsdb.retention.time", "90d"]
        force_pull = true
        ports = ["http"]
        dns_servers = ["192.168.50.2"]
        volumes = [
          "local/alerts.yml:/prometheus/alerts.yml",
          "local/prometheus.yml:/prometheus/prometheus.yml",
        ]
      }

      resources {
        cpu    = 1000
        memory = 512
      }
    }
  }
}


variable "region" {}
variable "tld" {}
variable "shared_dir" {}
variable "hass_key" {}
variable "hass_ip" {}


================================================
FILE: nomad_jobs/observability/prometheus/volume.hcl
================================================
id           = "prometheus"
external_id  = "prometheus"
name         = "prometheus"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "50GiB"
capacity_max = "50GiB"

capability {
  access_mode     = "multi-node-single-writer"
  attachment_mode = "file-system"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}


================================================
FILE: nomad_jobs/observability/telegraf/nomad.job
================================================
job "telegraf" {
  region = var.region
  datacenters = ["dc1", "public", "system"]
  type = "system"
  priority = 100
  meta {
      job_file = "nomad_jobs/observability/telegraf/nomad.job"
version = "4"
  }
  group "telegraf-exporter" {

    network {
      port "http" {
        host_network = "tailscale"
        to = "9273"
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "telegraf" {
      driver = "docker"
      service {
        name = "telegraf"
        port = "http"
        tags = ["metrics"]
        check {
          type     = "tcp"
          interval = "5s"
          timeout  = "2s"
        }
      }

      config {
        image = "telegraf:1.38.2"
        privileged = "true"
        ports = ["http"]
        args = [
          "--config=/local/config.yaml",
        ]
      }
      template {
      data = <<EOH
[global_tags]
  realm = '${var.region}'
  role = 'nomad'
[agent]
[[outputs.prometheus_client]]
  listen = ':9273'
[[inputs.cpu]]
  percpu = true
  totalcpu = true
[[inputs.disk]]
  ignore_fs = ['tmpfs', 'devtmpfs']
[[inputs.diskio]]
[[inputs.kernel]]
[[inputs.mem]]
[[inputs.net]]
[[inputs.ntpq]]
[[inputs.processes]]
[[inputs.swap]]
[[inputs.system]]

EOH
        destination = "local/config.yaml"
        env         = false
      }
      resources {
        cpu    = 100
        memory = 128
      }
    }
  }
}

variable "region" {
    type = string
}


================================================
FILE: nomad_jobs/observability/truenas-graphite-exporter/nomad.job
================================================
job "truenas-graphite-exporter" {
  region      = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/observability/truenas-graphite-exporter/nomad.job"
    version  = "1"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "graphite-exporter" {
    count = 1

    network {
      port "graphite" {
        static = 9109
      }
      port "metrics" {
        static = 9108
      }
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      healthy_deadline = "5m"
      progress_deadline = "10m"
      auto_revert      = true
    }

    task "graphite-exporter" {
      driver = "docker"

      config {
        image      = "ghcr.io/supporterino/truenas-graphite-to-prometheus:v2.2.1"
        force_pull = true
        ports      = ["graphite", "metrics"]
      }

      service {
        name = "truenas-graphite-exporter"
        port = "metrics"
        tags = [
          "metrics",
        ]

        check {
          type     = "http"
          path     = "/metrics"
          name     = "http"
          interval = "15s"
          timeout  = "5s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 200
        memory = 128
      }
    }
  }
}

variable "region" {}
variable "shared_dir" {}


================================================
FILE: nomad_jobs/observability/vector/nomad.job
================================================
job "vector" {
  
  meta {
  job_file = "nomad_jobs/observability/vector/nomad.job"
  }
datacenters = ["dc1"]
  region = var.region
  type = "system"
  group "vector" {
    network {
      port "api" {
        host_network = "tailscale"
        to = 8686
      }
    }
    ephemeral_disk {
      size    = 500
      sticky  = true
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "vector" {
      driver = "docker"
      config {
        image = "timberio/vector:0.28.X-alpine"
        ports = ["api"]
        volumes = ["/var/run/docker.sock:/var/run/docker.sock"]
      }

      env {
        VECTOR_CONFIG = "local/vector.toml"
        VECTOR_REQUIRE_HEALTHY = "true"
      }

      service {
        check {
          port     = "api"
          type     = "http"
          path     = "/health"
          interval = "30s"
          timeout  = "5s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 500 # 500 MHz
        memory = 256 # 256MB
      }

      template {
        destination = "local/vector.toml"
        change_mode   = "signal"
        change_signal = "SIGHUP"
        # overriding the delimiters to [[ ]] to avoid conflicts with Vector's native templating, which also uses {{ }}
        left_delimiter = "[["
        right_delimiter = "]]"
        data=<<EOH
          data_dir = "alloc/data/vector/"
          [api]
            enabled = true
            address = "0.0.0.0:8686"
            playground = false
          [sources.logs]
            type = "docker_logs"
          [transforms.transformed]
            type = "remap"
            inputs = [ "logs" ]
            source = '''
                   .debug = parse_key_value!(.message)
                   .job_name = split(get!(value: .label, path: ["com.hashicorp.nomad.job_name"]), "/")[0] ?? get!(value: .label, path: ["com.hashicorp.nomad.job_name"])
            '''
          [sinks.loki]
            type = "loki"
            inputs = ["transformed"]
            endpoint = "http://[[ range service "loki" ]][[ .Address ]]:[[ .Port ]][[ end ]]"
            encoding.codec = "json"
            buffer.type = "memory"
            out_of_order_action = "accept"
            request.concurrency = "adaptive"
            remove_label_fields = true
            healthcheck.enabled = true
              [sinks.loki.labels]
              job = "{{label.\"com.hashicorp.nomad.job_name\" }}"
              task = "{{label.\"com.hashicorp.nomad.task_name\" }}"
              group = "{{label.\"com.hashicorp.nomad.task_group_name\" }}"
              namespace = "{{label.\"com.hashicorp.nomad.namespace\" }}"
              node = "{{label.\"com.hashicorp.nomad.node_name\" }}"
              correlation_id = "{{ message.requestId }}"
              stream = "{{ stream }}"
        EOH
      }
      kill_timeout = "30s"
    }
  }
}

variable "datacenters_all" {
  type = list(string)
}
variable "region" {}


================================================
FILE: nomad_jobs/personal-cloud/actualbudget/nomad.job
================================================
job "actualbudget" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/personal-cloud/actualbudget/nomad.job"
      version = "1"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "actualbudget" {
    count = 1

    network {
      mode = "host"
      port "http" {
        static = "5006"
        host_network = "lan"
      }
    }

    volume "actualbudget" {
      type            = "csi"
      read_only       = false
      source          = "actualbudget-data"
      access_mode     = "single-node-writer"
      attachment_mode = "file-system"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "prep-disk" {
      driver = "docker"
      volume_mount {
        volume      = "actualbudget"
        destination = "/volume/"
        read_only   = false
      }
      config {
        image   = "busybox:latest"
        command = "sh"
        args    = ["-c", "chmod 777 /volume/"]
      }
      resources {
        cpu    = 200
        memory = 128
      }

      lifecycle {
        hook    = "prestart"
        sidecar = false
      }
    }

    task "actualbudget" {
      driver = "docker"
      config {
        image = "actualbudget/actual-server:26.4.0"
        ports = ["http"]
      }

      volume_mount {
        volume      = "actualbudget"
        destination = "/data"
        read_only   = false
      }

      env {
        TZ = "Etc/UTC"
      }

      service {
        port = "http"
        name = "actualbudget"
        tags = [
          "traefik.enable=true"
        ]
        check {
          type     = "http"
          path     = "/"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 200
        memory = 512
      }
    }
  }
}

variable "region" {
    type = string
}

variable "shared_dir" {
    type = string
}

================================================
FILE: nomad_jobs/personal-cloud/actualbudget/volume.hcl
================================================
id           = "actualbudget-data"
external_id  = "actualbudget-data"
name         = "actualbudget-data"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "5GiB"
capacity_max = "5GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime", "nodiratime", "data=ordered"]
}

================================================
FILE: nomad_jobs/personal-cloud/bitwarden/nomad.job
================================================
job "bitwarden" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/personal-cloud/bitwarden/nomad.job"
version = "3"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "password" {
    count = 1

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    task "bitwarden" {
      driver = "docker"
      config {
        image = "vaultwarden/server:1.35.7"
        force_pull = "true"
        port_map = {
          http = 80 
        }
        volumes = [
          "${var.shared_dir}bitwarden:/data",
        ]
      }

      service {
        port = "http"
	name = "bitwarden"
        tags = [
          "traefik.enable=true",
        ]

        check {
          type     = "tcp"
          interval = "10s"
          timeout  = "2s"
        }
      }

      template {
data = <<EOH
ADMIN_TOKEN="u3L9xN7vB2mK5zP8wA4qR1tY6cX0jH2nG7dS9fL4kM1vP3qW"
SMTP_HOST="192.168.50.120"
SMTP_PORT="25"
SMTP_SECURITY="off"
SMTP_FROM="vault@demonsafe.com"
EOH
        destination = "local/env"
        env         = true
      }

      resources {
        cpu    = 1000
        memory = 2048
        network {
          port "http" {}
        }
      }
    }
  }
}

variable "region" {
    type = string
}


variable "tld" {
    type = string
}

variable "shared_dir" {
    type = string
}


================================================
FILE: nomad_jobs/personal-cloud/nextcloud/nomad.job
================================================
job "nextcloud" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/personal-cloud/nextcloud/nomad.job"
version = "4"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  vault {
    policies      = ["admin"]
    change_mode   = "signal"
    change_signal = "SIGUSR1"
  }

  group "nextcloud" {

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    task "web" {
      driver = "docker"

      config {
        image = "nextcloud"
        volumes = [
          "${var.shared_dir}nextcloud:/var/www/html",
          "${var.shared_dir}nextcloud_data:/data",
          "local/default:/config/nginx/site-confs/default"
        ]
        port_map {
          http = 80
        }
      }

      service {
        name = "${NOMAD_JOB_NAME}"
        port = "http"
        tags = [
          "traefik.enable=true",
          "traefik.http.middlewares.httpsRedirect.redirectscheme.scheme=https",


          "traefik.http.routers.${NOMAD_JOB_NAME}.tls.domains[0].sans=${NOMAD_JOB_NAME}.${var.tld}",
          "traefik.http.routers.${NOMAD_JOB_NAME}.middlewares=forward-auth"
        ]

        check {
          type     = "tcp"
          port     = "http"
          interval = "30s"
          timeout  = "2s"
        }
      }

      template {
data = <<EOH
POSTGRES_DB="nextcloud"
POSTGRES_USER=""
POSTGRES_PASSWORD=""
NEXTCLOUD_ADMIN_USER=""
NEXTCLOUD_ADMIN_PASSWORD=""
NEXTCLOUD_TRUSTED_DOMAINS=""
POSTGRES_HOST="{{ env "NOMAD_ADDR_postgres_db" }}"
EOH
        destination = "local/env"
        env         = true
      }

      template {
data = <<EOH
upstream php-handler {
    server 127.0.0.1:9000;
}
#server {
#    listen 80;
#    listen [::]:80;
#    server_name _;
#    return 301 https://$host$request_uri;
#}
server {
    listen 80;
    listen [::]:80;
    server_name _;
    ssl_certificate /config/keys/cert.crt;
    ssl_certificate_key /config/keys/cert.key;
    add_header X-Content-Type-Options nosniff;
    add_header X-XSS-Protection "1; mode=block";
    add_header X-Robots-Tag none;
    add_header X-Download-Options noopen;
    add_header X-Permitted-Cross-Domain-Policies none;
    add_header Referrer-Policy no-referrer;
    fastcgi_hide_header X-Powered-By;
    root /config/www/nextcloud/;
    location = /robots.txt {
        allow all;
        log_not_found off;
        access_log off;
    }
    location = /.well-known/carddav {
      return 301 $scheme://$host/remote.php/dav;
    }
    location = /.well-known/caldav {
      return 301 $scheme://$host/remote.php/dav;
    }
    client_max_body_size 10G;
    fastcgi_buffers 64 4K;
    gzip on;
    gzip_vary on;
    gzip_comp_level 4;
    gzip_min_length 256;
    gzip_proxied expired no-cache no-store private no_last_modified no_etag auth;
    gzip_types application/atom+xml application/javascript application/json application/ld+json application/manifest+json application/rss+xml application/vnd.geo+json application/vnd.ms-fontobject application/x-font-ttf application/x-web-app-manifest+json application/xhtml+xml application/xml font/opentype image/bmp image/svg+xml image/x-icon text/cache-manifest text/css text/plain text/vcard text/vnd.rim.location.xloc text/vtt text/x-component text/x-cross-domain-policy;
    location / {
        rewrite ^ /index.php;
    }
    location ~ ^\/(?:build|tests|config|lib|3rdparty|templates|data)\/ {
        deny all;
    }
    location ~ ^\/(?:\.|autotest|occ|issue|indie|db_|console) {
        deny all;
    }
    location ~ ^\/(?:index|remote|public|cron|core\/ajax\/update|status|ocs\/v[12]|updater\/.+|ocs-provider\/.+|ocm-provider\/.+)\.php(?:$|\/) {
        fastcgi_split_path_info ^(.+?\.php)(\/.*|)$;
        try_files $fastcgi_script_name =404;
        include /etc/nginx/fastcgi_params;
        fastcgi_param SCRIPT_FILENAME $document_root$fastcgi_script_name;
        fastcgi_param PATH_INFO $fastcgi_path_info;
        fastcgi_param HTTPS on;
        fastcgi_param modHeadersAvailable true;
        fastcgi_param front_controller_active true;
        fastcgi_pass php-handler;
        fastcgi_intercept_errors on;
        fastcgi_request_buffering off;
    }

    location ~ ^\/(?:updater|ocs-provider|ocm-provider)(?:$|\/) {
        try_files $uri/ =404;
        index index.php;
    }
    location ~ \.(?:css|js|woff2?|svg|gif)$ {
        try_files $uri /index.php$request_uri;
        add_header Cache-Control "public, max-age=15778463";
        add_header X-Content-Type-Options nosniff;
        add_header X-XSS-Protection "1; mode=block";
        add_header X-Robots-Tag none;
        add_header X-Download-Options noopen;
        add_header X-Permitted-Cross-Domain-Policies none;
        add_header Referrer-Policy no-referrer;
        access_log off;
    }
    location ~ \.(?:png|html|ttf|ico|jpg|jpeg)$ {
        try_files $uri /index.php$request_uri;
        access_log off;
    }
}
EOH
        destination = "local/default"
        env         = false
      }

      resources {
        cpu = 500
        memory = 2048
        network {
          port "http" {}
        }
      }
    }
    task "postgres" {
      driver = "docker"

      config {
        image = "postgres:9.6.24"
        volumes = [
          "${var.shared_dir}nextcloud-postgres:/appdata/postgres",
        ]
        port_map {
          db = 5432
        }
      }
      template {
data = <<EOH
POSTGRES_DB=nextcloud
POSTGRES_USER=""
POSTGRES_PASSWORD=""
PGDATA="/appdata/postgres"
EOH
        destination = "local/env"
        env         = true
      }

      service {
        name = "${NOMAD_JOB_NAME}-postgres"
        tags = ["postgres"]

        port = "db"

        check {
          type     = "tcp"
          port     = "db"
          interval = "30s"
          timeout  = "2s"
        }
      }

      resources {
        cpu = 100
        memory = 512
        network {
          port  "db"  {
            static = "25432"
          }
        }
      }
    }
  }
}

variable "region" {
    type = string
}


variable "tld" {
    type = string
}

variable "shared_dir" {
    type = string
}


================================================
FILE: nomad_jobs/personal-cloud/ntfy/nomad.job
================================================
job "ntfy" {
  region      = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/personal-cloud/ntfy/nomad.job"
    version  = "4"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "ntfy" {
    count = 1

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    volume "ntfy" {
      type            = "csi"
      read_only       = false
      source          = "ntfy-data"
      access_mode     = "single-node-writer"
      attachment_mode = "file-system"
    }

    network {
      port "http" {
        static       = 8180
        host_network = "lan"
      }
    }

    task "prep-disk" {
      driver = "docker"

      volume_mount {
        volume      = "ntfy"
        destination = "/volume/"
        read_only   = false
      }

      config {
        image   = "busybox:latest"
        command = "sh"
        args    = ["-c", "chmod 777 /volume/"]
      }

      resources {
        cpu    = 200
        memory = 128
      }

      lifecycle {
        hook    = "prestart"
        sidecar = false
      }
    }

    task "ntfy" {
      driver = "docker"

      config {
        image      = "binwiederhier/ntfy:v2.21.0"
        force_pull = true
        ports      = ["http"]
        args       = ["serve"]
        volumes = [
          "local/server.yml:/etc/ntfy/server.yml:ro",
          "local/templates/:/etc/ntfy/templates/:ro",
        ]
      }

      volume_mount {
        volume      = "ntfy"
        destination = "/var/cache/ntfy"
        read_only   = false
      }

      env {
        TZ = "Europe/Berlin"
      }

      template {
        data = <<EOH
base-url: "https://ntfy.${var.tld}"
listen-http: ":{{ env "NOMAD_PORT_http" }}"
cache-file: "/var/cache/ntfy/cache.db"
cache-duration: "12h"
attachment-cache-dir: "/var/cache/ntfy/attachments"
attachment-total-size-limit: "1G"
attachment-file-size-limit: "15M"
template-dir: "/etc/ntfy/templates"
EOH
        destination = "local/server.yml"
        change_mode = "restart"
      }

      template {
        left_delimiter = "((("
        right_delimiter = ")))"
        data = <<EOH
title: |-
  {{- $status := .status -}}
  {{- $first := index .alerts 0 -}}
  {{- if eq $status "firing" -}}
  🚨 FIRING: {{ $first.labels.alertname }}
  {{- else if eq $status "resolved" -}}
  ✅ RESOLVED: {{ $first.labels.alertname }}
  {{- else -}}
  {{ $status | title }}: {{ $first.labels.alertname }}
  {{- end }}
message: |-
  {{- range .alerts }}
  Status: {{ .status | title }}
  {{- if .annotations.summary }}
  Summary: {{ .annotations.summary }}
  {{- end }}
  {{- if .annotations.description }}
  Description: {{ .annotations.description }}
  {{- end }}
  {{- if .labels.exported_job }}
  Job: {{ .labels.exported_job }}
  {{- end }}
  {{- if .labels.task_group }}
  Task Group: {{ .labels.task_group }}
  {{- end }}
  {{- if .labels.instance }}
  Instance: {{ .labels.instance }}
  {{- end }}
  {{- if .labels.host }}
  Host: {{ .labels.host }}
  {{- end }}
  {{- if .labels.severity }}
  Severity: {{ .labels.severity }}
  {{- end }}
  {{ end }}
priority: |-
  {{- $first := index .alerts 0 -}}
  {{- if eq .status "resolved" -}}
  default
  {{- else if eq $first.labels.severity "critical" -}}
  urgent
  {{- else if eq $first.labels.severity "page" -}}
  high
  {{- else if eq $first.labels.severity "warning" -}}
  default
  {{- else -}}
  default
  {{- end }}
EOH
        destination = "local/templates/alerts.yml"
        change_mode = "restart"
      }

      template {
        left_delimiter = "((("
        right_delimiter = ")))"
        data = <<EOH
title: |-
  {{- if eq .notification_type "MEDIA_PENDING" -}}
  📥 Request Pending: {{ .subject }}
  {{- else if eq .notification_type "MEDIA_APPROVED" -}}
  ✅ Approved: {{ .subject }}
  {{- else if eq .notification_type "MEDIA_AUTO_APPROVED" -}}
  ✅ Auto-Approved: {{ .subject }}
  {{- else if eq .notification_type "MEDIA_AVAILABLE" -}}
  🎬 Now Available: {{ .subject }}
  {{- else if eq .notification_type "MEDIA_DECLINED" -}}
  ❌ Declined: {{ .subject }}
  {{- else if eq .notification_type "MEDIA_FAILED" -}}
  ⚠️ Failed: {{ .subject }}
  {{- else if eq .notification_type "MEDIA_AUTO_REQUESTED" -}}
  🤖 Auto-Requested: {{ .subject }}
  {{- else if eq .notification_type "ISSUE_CREATED" -}}
  🐛 Issue: {{ .subject }}
  {{- else if eq .notification_type "ISSUE_RESOLVED" -}}
  ✅ Issue Resolved: {{ .subject }}
  {{- else if eq .notification_type "ISSUE_COMMENT" -}}
  💬 Issue Comment: {{ .subject }}
  {{- else if eq .notification_type "TEST_NOTIFICATION" -}}
  🔔 Test: {{ .subject }}
  {{- else -}}
  {{ .subject }}
  {{- end }}
message: |-
  {{- if .message }}
  {{ .message }}
  {{ end }}
  {{- if .media_type }}
  Type: {{ .media_type | title }}
  {{- end }}
  {{- if .media_status }}
  Status: {{ .media_status }}
  {{- end }}
  {{- if .requestedBy_username }}
  Requested by: {{ .requestedBy_username }}
  {{- end }}
  {{- if .event }}
  Event: {{ .event }}
  {{- end }}
priority: |-
  {{- if or (eq .notification_type "MEDIA_FAILED") (eq .notification_type "ISSUE_CREATED") -}}
  high
  {{- else if or (eq .notification_type "MEDIA_AVAILABLE") (eq .notification_type "MEDIA_APPROVED") -}}
  default
  {{- else if eq .notification_type "MEDIA_PENDING" -}}
  default
  {{- else -}}
  low
  {{- end }}
EOH
        destination = "local/templates/overseerr.yml"
        change_mode = "restart"
      }

      service {
        name = "ntfy"
        port = "http"
        tags = [
          "traefik.enable=true",
        ]

        check {
          type     = "http"
          path     = "/v1/health"
          interval = "10s"
          timeout  = "2s"

          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 200
        memory = 256
      }
    }
  }
}

variable "region" {
  type = string
}

variable "tld" {
  type = string
}

variable "shared_dir" {
  type = string
}


================================================
FILE: nomad_jobs/personal-cloud/ntfy/volume.hcl
================================================
id           = "ntfy-data"
external_id  = "ntfy-data"
name         = "ntfy-data"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "1GiB"
capacity_max = "1GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}


================================================
FILE: nomad_jobs/personal-cloud/paperless/nomad.job
================================================
job "paperless" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/personal-cloud/paperless/nomad.job"
    version = "6"  // Incremented version number
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "paperless" {

    network {
      mode = "host"
      port "tika" {
        static = "9998"
        host_network = "lan"
      }
      port "gotenberg" {
        static = "3000"
        host_network = "lan"
      }
      port "paperless" {
        static = "8000"
        host_network = "lan"
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "paperless" {
      driver = "docker"
      config {
        image = "ghcr.io/paperless-ngx/paperless-ngx:2.20.14"
        dns_servers = ["192.168.50.2"]
        network_mode = "host"
        ports = ["paperless"]
        volumes = [
          "${var.shared_dir}paperless/data:/usr/src/paperless/data",
          "${var.shared_dir}paperless/consume:/usr/src/paperless/consume",
          "${var.shared_dir}paperless/export:/usr/src/paperless/export",
          "${var.shared_dir}paperless/media:/usr/src/paperless/media",
        ]
      }

      resources {
        cpu    = 500
        memory = 2048
      }

      service {
        port = "paperless"
        name = "paperless"
        tags = ["traefik.enable=true"]
      }

      template {
        data = <<EOH
PAPERLESS_DBHOST="postgres.service.consul"
PAPERLESS_DBPASS="${var.postgres_admin_password}"
PAPERLESS_DBUSER="postgres"
PAPERLESS_DBENGINE="postgres"
PAPERLESS_REDIS="redis://redis.service.consul:6379/1"
PAPERLESS_REDIS_PREFIX="paperless"
PAPERLESS_TIKA_ENABLED="true"
PAPERLESS_TIKA_ENDPOINT="http://paperless-tika.service.consul:9998"
PAPERLESS_TIKA_GOTENBERG_ENDPOINT="http://paperless-gotenberg.service.consul:3000"
PAPERLESS_ADMIN_USER="admin"
PAPERLESS_ADMIN_PASSWORD="${var.paperless_admin_password}"
PAPERLESS_OCR_LANGUAGE="deu+eng"
EOH
        destination = "local/env"
        env         = true
      }
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "tika" {
      driver = "docker"

      config {
        image = "apache/tika"
        ports = ["tika"]
      }

      service {
        name = "${NOMAD_JOB_NAME}-${NOMAD_TASK_NAME}"
        tags = ["${NOMAD_TASK_NAME}"]
        port = "tika"

        check {
          type     = "tcp"
          port     = "tika"
          interval = "30s"
          timeout  = "2s"
        }
      }

      resources {
        cpu    = 500
        memory = 512
      }
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "gotenberg" {
      driver = "docker"

      config {
        image = "gotenberg/gotenberg:8"
        ports = ["gotenberg"]
        command = "gotenberg"
        args = ["--chromium-disable-javascript=true", "--chromium-allow-list=file:///tmp/.*"]
      }

      service {
        name = "${NOMAD_JOB_NAME}-${NOMAD_TASK_NAME}"
        tags = ["${NOMAD_TASK_NAME}"]
        port = "gotenberg"

        check {
          type     = "tcp"
          port     = "gotenberg"
          interval = "30s"
          timeout  = "2s"
        }
      }

      resources {
        cpu    = 500
        memory = 512
      }
    }
  }
}

variable "region" {
    type = string
}

variable "shared_dir" {
    type = string
}

variable "postgres_admin_password" {
    type = string
    description = "Admin password for PostgreSQL"
}

variable "paperless_admin_password" {
    type = string
    description = "Admin password for Paperless web interface"
    default = "admin"  // You might want to override this with a more secure password
}

================================================
FILE: nomad_jobs/personal-cloud/radicale/nomad.job
================================================
job "radicale" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/personal-cloud/radicale/nomad.job"
version = "3"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "downloaders" {
    count = 1 
    network {
      port "http" {
        host_network = "lan"
        static = "5232"
      }
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "radicale" {
      driver = "docker"
      config {
        image = "tomsquest/docker-radicale"
        ports = ["http"]
        mounts = [
          {
            type = "bind"
            target = "/data"
            source = "${var.shared_dir}radicale",
            readonly = false
            bind_options = {
              propagation = "rshared"
            }
          }
        ]
      }
  
      env {
        PUID = "65534"
        PGID = "65534"
        TZ = "Etc/UTC"
      }

      service {
        port = "http"
        name = "${NOMAD_TASK_NAME}"
        tags = [
          "traefik.enable=true",
          "traefik.http.middlewares.httpsRedirect.redirectscheme.scheme=https",
          "traefik.http.routers.${NOMAD_TASK_NAME}.tls.domains[0].sans=${NOMAD_TASK_NAME}.${var.tld}",
        ]
        check {
          type     = "http"
          path     = "/"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 100
        memory = 512
      }
    }
  }
}

variable "region" {}

variable "tld" {}

variable "shared_dir" {}


================================================
FILE: nomad_jobs/security/suricata/nomad.job
================================================
job "suricata" {
  region      = var.region
  datacenters = ["dc1"]
  type        = "system"
  priority    = 100

  meta {
    job_file = "nomad_jobs/security/suricata/nomad.job"
    version  = "8"  // Add hourly log rotation
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "ids" {
    network {
      mode = "host"
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "suricata" {
      driver = "docker"

      config {
        image        = "jasonish/suricata:8.0"
        network_mode = "host"
        force_pull   = true
        privileged   = true
        cap_add      = ["NET_ADMIN", "NET_RAW", "SYS_NICE"]

        # Run Suricata in af-packet mode using config file
        args = ["-c", "/etc/suricata/suricata.yaml", "--af-packet"]

        # Host mounts for logs (Wazuh reads these) and rules (shared NFS)
        volumes = [
          "local/suricata.yaml:/etc/suricata/suricata.yaml:ro",
          "/var/log/suricata:/var/log/suricata",
          "${var.shared_dir}suricata/rules:/var/lib/suricata:ro",
        ]
      }

      # Suricata configuration
      template {
        data = <<EOH
%YAML 1.1
---
vars:
  address-groups:
    HOME_NET: "[192.168.50.0/24,10.0.0.0/8]"
    EXTERNAL_NET: "!$HOME_NET"
    HTTP_SERVERS: "$HOME_NET"
    SMTP_SERVERS: "$HOME_NET"
    SQL_SERVERS: "$HOME_NET"
    DNS_SERVERS: "$HOME_NET"
    TELNET_SERVERS: "$HOME_NET"
    AIM_SERVERS: "$EXTERNAL_NET"
    DC_SERVERS: "$HOME_NET"
    DNP3_SERVER: "$HOME_NET"
    DNP3_CLIENT: "$HOME_NET"
    MODBUS_CLIENT: "$HOME_NET"
    MODBUS_SERVER: "$HOME_NET"
    ENIP_CLIENT: "$HOME_NET"
    ENIP_SERVER: "$HOME_NET"

  port-groups:
    HTTP_PORTS: "80"
    SHELLCODE_PORTS: "!80"
    ORACLE_PORTS: 1521
    SSH_PORTS: 22
    DNP3_PORTS: 20000
    MODBUS_PORTS: 502
    FILE_DATA_PORTS: "[$HTTP_PORTS,110,143]"
    FTP_PORTS: 21
    GENEVE_PORTS: 6081
    VXLAN_PORTS: 4789
    TEREDO_PORTS: 3544

# Output configuration for JSON logs (Wazuh integration)
outputs:
  - eve-log:
      enabled: yes
      filetype: regular
      filename: /var/log/suricata/eve.json
      rotate: yes
      rotate-interval: hour
      rotate-count: 2
      pcap-file: false
      community-id: true
      community-id-seed: 0
      xff:
        enabled: no
        mode: extra-data
        deployment: reverse
        header: X-Forwarded-For

      types:
        - alert:
            tagged-packets: yes
            xff:
              enabled: no
              mode: extra-data
              deployment: reverse
              header: X-Forwarded-For
        - anomaly:
            enabled: yes
            types:
        - http:
            extended: yes
        - dns:
            version: 2
        - tls:
            extended: yes
        - files:
            force-magic: no
        - smtp:
        - ssh
        - stats:
            totals: yes
            threads: no
            deltas: no
        - flow
        - netflow

  # Stats output
  - stats:
      enabled: yes
      filename: /var/log/suricata/stats.log
      append: yes
      totals: yes
      threads: no

# Logging configuration
logging:
  default-log-level: notice
  outputs:
    - console:
        enabled: yes
    - file:
        enabled: yes
        level: info
        filename: /var/log/suricata/suricata.log

# Network interface configuration
af-packet:
  - interface: {{ sockaddr "GetPrivateInterfaces | include \"network\" \"192.168.50.0/24\" | attr \"name\"" }}
    threads: auto
    cluster-id: 99
    cluster-type: cluster_flow
    defrag: yes
    use-mmap: yes
    tpacket-v3: yes
    ring-size: 2048
    block-size: 32768

# Detect engine settings
detect-engine:
  - profile: medium
  - custom-values:
      toclient-groups: 3
      toserver-groups: 25
  - sgh-mpm-context: auto
  - inspection-recursion-limit: 3000

# Threading
threading:
  set-cpu-affinity: no
  detect-thread-ratio: 1.0

# Rules configuration
default-rule-path: /var/lib/suricata/rules
rule-files:
  - suricata.rules

# Live rule reload
rule-reload: true

# Application layer protocols
app-layer:
  protocols:
    rfb:
      enabled: yes
    mqtt:
      enabled: yes
    krb5:
      enabled: yes
    snmp:
      enabled: yes
    ikev2:
      enabled: yes
    tls:
      enabled: yes
      detection-ports:
        dp: 443
    dcerpc:
      enabled: yes
    ftp:
      enabled: yes
    ssh:
      enabled: yes
    smtp:
      enabled: yes
    http:
      enabled: yes
    dns:
      tcp:
        enabled: yes
      udp:
        enabled: yes

# Performance tuning
stream:
  memcap: 64mb
  checksum-validation: yes
  inline: auto
  reassembly:
    memcap: 256mb
    depth: 1mb
    toserver-chunk-size: 2560
    toclient-chunk-size: 2560
    randomize-chunk-size: yes

host:
  hash-size: 4096
  prealloc: 1000
  memcap: 32mb

flow:
  memcap: 128mb
  hash-size: 65536
  prealloc: 10000
  emergency-recovery: 30

# Defragmentation settings
defrag:
  memcap: 32mb
  hash-size: 65536
  trackers: 65535
  max-frags: 65535
  prealloc: yes
  timeout: 60
EOH
        destination = "local/suricata.yaml"
        change_mode = "restart"
      }

      resources {
        cpu    = 500
        memory = 768
      }

      service {
        name = "suricata"
        tags = ["security", "ids"]

        check {
          type     = "script"
          name     = "suricata-running"
          command  = "/bin/sh"
          args     = ["-c", "pgrep -x Suricata-Main > /dev/null || pgrep -x suricata > /dev/null"]
          interval = "30s"
          timeout  = "5s"
        }
      }
    }
  }
}

variable "region" {
  type = string
}

variable "shared_dir" {
  type = string
}


================================================
FILE: nomad_jobs/security/suricata-update/nomad.job
================================================
job "suricata-update" {
  region      = var.region
  datacenters = ["dc1"]
  type        = "batch"
  priority    = 80

  meta {
    job_file = "nomad_jobs/security/suricata-update/nomad.job"
    version  = "3"  // Single instance with shared NFS storage
  }

  # Run daily at 4am
  periodic {
    crons            = ["0 4 * * *"]
    prohibit_overlap = true
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "update" {
    count = 1

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    task "suricata-update" {
      driver = "docker"

      config {
        image   = "jasonish/suricata:8.0"
        command = "suricata-update"
        volumes = [
          "${var.shared_dir}suricata/rules:/var/lib/suricata",
        ]
      }

      resources {
        cpu    = 500
        memory = 1024
      }
    }
  }
}

variable "region" {
  type = string
}

variable "shared_dir" {
  type = string
}


================================================
FILE: nomad_jobs/security/wazuh-agent/nomad.job
================================================
job "wazuh-agent" {
  region      = var.region
  datacenters = ["dc1"]
  type        = "system"
  priority    = 100

  meta {
    job_file = "nomad_jobs/security/wazuh-agent/nomad.job"
    version  = "6"  // Fix client.keys file permissions for persistence
  }

  group "agent" {
    network {
      mode = "host"
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      min_healthy_time = "30s"
      auto_revert      = true
    }

    # Ensure agent data directory exists on host
    task "prep-agent-dir" {
      driver = "docker"

      config {
        image   = "busybox:latest"
        command = "sh"
        args    = ["-c", "mkdir -p /host/var/lib/wazuh-agent; test -f /host/var/lib/wazuh-agent/client.keys || touch /host/var/lib/wazuh-agent/client.keys; chmod 666 /host/var/lib/wazuh-agent/client.keys"]
        volumes = [
          "/var/lib:/host/var/lib",
        ]
      }

      resources {
        cpu    = 100
        memory = 32
      }

      lifecycle {
        hook    = "prestart"
        sidecar = false
      }
    }

    task "wazuh-agent" {
      driver = "docker"

      config {
        image        = "wazuh/wazuh-agent:4.14.4"
        network_mode = "host"
        force_pull   = true
        privileged   = true

        # Mount host directories for monitoring and config
        volumes = [
          "/var/log:/host/var/log:ro",
          "/var/run/docker.sock:/var/run/docker.sock:ro",
          "/:/host:ro",
          "/var/lib/wazuh-agent/client.keys:/var/ossec/etc/client.keys",
          "local/ossec.conf:/var/ossec/etc/ossec.conf",
        ]
      }

      # Configuration template for the agent
      # Uses Consul service discovery to automatically find Wazuh manager
      template {
        data = <<EOH
{{- if service "wazuh-agent-comm" -}}
{{- with index (service "wazuh-agent-comm") 0 -}}
WAZUH_MANAGER={{ .Address }}
WAZUH_MANAGER_PORT={{ .Port }}
WAZUH_PROTOCOL=tcp
WAZUH_REGISTRATION_SERVER={{ .Address }}
WAZUH_REGISTRATION_PORT=1515
WAZUH_AGENT_NAME={{ env "node.unique.name" }}
WAZUH_AGENT_GROUP=nomad-cluster
{{- end -}}
{{- else }}
# Waiting for wazuh-agent-comm service to be available in Consul
WAZUH_MANAGER=127.0.0.1
WAZUH_MANAGER_PORT=1514
WAZUH_PROTOCOL=tcp
WAZUH_REGISTRATION_SERVER=127.0.0.1
WAZUH_REGISTRATION_PORT=1515
WAZUH_AGENT_NAME={{ env "node.unique.name" }}
WAZUH_AGENT_GROUP=nomad-cluster
{{- end }}
EOH
        destination = "local/agent.env"
        env         = true
        change_mode = "restart"
      }

      # Custom ossec.conf for monitoring specific logs
      # Uses Consul service discovery to automatically find Wazuh manager
      # Uses SIGHUP for hot reload (requires Wazuh 4.14.0+)
      template {
        data = <<EOH
<ossec_config>
  <client>
    <server>
{{- if service "wazuh-agent-comm" -}}
{{- with index (service "wazuh-agent-comm") 0 }}
      <address>{{ .Address }}</address>
      <port>{{ .Port }}</port>
{{- end -}}
{{- else }}
      <address>127.0.0.1</address>
      <port>1514</port>
{{- end }}
      <protocol>tcp</protocol>
    </server>
    <config-profile>ubuntu, ubuntu20, ubuntu20.04</config-profile>
    <notify_time>10</notify_time>
    <time-reconnect>60</time-reconnect>
    <auto_restart>yes</auto_restart>
  </client>

  <client_buffer>
    <disabled>no</disabled>
    <queue_size>5000</queue_size>
    <events_per_second>500</events_per_second>
  </client_buffer>

  <!-- ==================== LOG COLLECTION ==================== -->

  <!-- System logs -->
  <localfile>
    <log_format>syslog</log_format>
    <location>/host/var/log/syslog</location>
  </localfile>

  <localfile>
    <log_format>syslog</log_format>
    <location>/host/var/log/auth.log</location>
  </localfile>

  <localfile>
    <log_format>syslog</log_format>
    <location>/host/var/log/kern.log</location>
  </localfile>

  <localfile>
    <log_format>syslog</log_format>
    <location>/host/var/log/dpkg.log</location>
  </localfile>

  <!-- HashiCorp stack logs -->
  <localfile>
    <log_format>json</log_format>
    <location>/host/var/log/nomad/*.log</location>
  </localfile>

  <localfile>
    <log_format>json</log_format>
    <location>/host/var/log/consul/*.log</location>
  </localfile>

  <!-- Docker daemon logs -->
  <localfile>
    <log_format>syslog</log_format>
    <location>/host/var/log/docker.log</location>
  </localfile>

  <!-- Audit logs if auditd is installed -->
  <localfile>
    <log_format>audit</log_format>
    <location>/host/var/log/audit/audit.log</location>
  </localfile>

  <!-- SSH logs -->
  <localfile>
    <log_format>syslog</log_format>
    <location>/host/var/log/secure</location>
  </localfile>

  <!-- Journal logs for systemd -->
  <localfile>
    <log_format>journald</log_format>
    <location>journald</location>
  </localfile>

  <!-- ==================== SURICATA IDS INTEGRATION ==================== -->
  <!-- Suricata eve.json - Wazuh has native decoder for this format -->
  <localfile>
    <log_format>json</log_format>
    <location>/host/var/log/suricata/eve.json</location>
  </localfile>

  <!-- Suricata service log -->
  <localfile>
    <log_format>syslog</log_format>
    <location>/host/var/log/suricata/suricata.log</location>
  </localfile>

  <!-- ==================== FILE INTEGRITY MONITORING ==================== -->
  <syscheck>
    <disabled>no</disabled>
    <frequency>21600</frequency>
    <scan_on_start>yes</scan_on_start>
    <alert_new_files>yes</alert_new_files>

    <!-- Critical system directories -->
    <directories check_all="yes" realtime="yes">/host/etc</directories>
    <directories check_all="yes" realtime="yes">/host/usr/bin</directories>
    <directories check_all="yes" realtime="yes">/host/usr/sbin</directories>
    <directories check_all="yes" realtime="yes">/host/bin</directories>
    <directories check_all="yes" realtime="yes">/host/sbin</directories>

    <!-- HashiCorp config directories -->
    <directories check_all="yes">/host/etc/nomad.d</directories>
    <directories check_all="yes">/host/etc/consul.d</directories>

    <!-- SSH keys and config -->
    <directories check_all="yes" realtime="yes">/host/root/.ssh</directories>
    <directories check_all="yes">/host/home/*/.ssh</directories>

    <!-- Ignore frequently changing files -->
    <ignore>/host/etc/mtab</ignore>
    <ignore>/host/etc/hosts.deny</ignore>
    <ignore>/host/etc/mail/statistics</ignore>
    <ignore>/host/etc/random-seed</ignore>
    <ignore>/host/etc/adjtime</ignore>
    <ignore>/host/etc/httpd/logs</ignore>
    <ignore>/host/etc/resolv.conf</ignore>
    <ignore type="sregex">.log$|.tmp$|.swp$</ignore>
  </syscheck>

  <!-- ==================== ROOTCHECK ==================== -->
  <rootcheck>
    <disabled>no</disabled>
    <check_files>yes</check_files>
    <check_trojans>yes</check_trojans>
    <check_dev>yes</check_dev>
    <check_sys>yes</check_sys>
    <check_pids>yes</check_pids>
    <check_ports>yes</check_ports>
    <check_if>yes</check_if>
    <frequency>43200</frequency>
    <rootkit_files>/var/ossec/etc/shared/rootkit_files.txt</rootkit_files>
    <rootkit_trojans>/var/ossec/etc/shared/rootkit_trojans.txt</rootkit_trojans>
  </rootcheck>

  <!-- ==================== VULNERABILITY DETECTION ==================== -->
  <wodle name="syscollector">
    <disabled>no</disabled>
    <interval>1h</interval>
    <scan_on_start>yes</scan_on_start>
    <hardware>yes</hardware>
    <os>yes</os>
    <network>yes</network>
    <packages>yes</packages>
    <ports all="no">yes</ports>
    <processes>yes</processes>
  </wodle>

  <!-- ==================== SECURITY CONFIGURATION ASSESSMENT ==================== -->
  <wodle name="sca">
    <enabled>yes</enabled>
    <scan_on_start>yes</scan_on_start>
    <interval>12h</interval>
    <skip_nfs>yes</skip_nfs>
  </wodle>

  <!-- ==================== DOCKER MONITORING ==================== -->
  <wodle name="docker-listener">
    <disabled>no</disabled>
    <interval>10m</interval>
    <attempts>5</attempts>
    <run_on_start>yes</run_on_start>
  </wodle>

  <!-- ==================== ACTIVE RESPONSE ==================== -->
  <!-- Disabled by default - enable with caution in production -->
  <active-response>
    <disabled>yes</disabled>
  </active-response>

</ossec_config>
EOH
        destination = "local/ossec.conf"
        change_mode = "restart"
      }

      resources {
        cpu    = 300
        memory = 512
      }

      service {
        name = "wazuh-agent"
        tags = ["security", "monitoring"]

        # Use a simple script check that runs inside the container
        check {
          type     = "script"
          name     = "agent-status"
          command  = "/var/ossec/bin/wazuh-control"
          args     = ["status"]
          interval = "30s"
          timeout  = "10s"
        }
      }
    }
  }
}

variable "region" {
  type = string
}


================================================
FILE: nomad_jobs/security/wazuh-server/nomad.job
================================================
job "wazuh-server" {
  region      = var.region
  datacenters = ["dc1"]
  type        = "service"

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "wazuh-stack" {
    count = 1

    network {
      port "indexer" {
        host_network = "lan"
        to = 9200
      }
      port "manager" {
        static       = 1514
        host_network = "lan"
        to = 1514
      }
      port "manager_reg" {
        static       = 1515
        host_network = "lan"
        to = 1515
      }
      port "manager_api" {
        host_network = "lan"
        to = 55000
      }
      port "dashboard" {
        host_network = "lan"
        to = 443
      }
    }

    # Persistent volumes for Wazuh components
    volume "wazuh-indexer" {
      type            = "csi"
      read_only       = false
      source          = "wazuh-indexer"
      access_mode     = "single-node-writer"
      attachment_mode = "file-system"
    }

    volume "wazuh-manager" {
      type            = "csi"
      read_only       = false
      source          = "wazuh-manager"
      access_mode     = "single-node-writer"
      attachment_mode = "file-system"
    }

    volume "wazuh-dashboard" {
      type            = "csi"
      read_only       = false
      source          = "wazuh-dashboard"
      access_mode     = "single-node-writer"
      attachment_mode = "file-system"
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    # Prep disk task for indexer volume permissions
    task "prep-indexer-disk" {
      driver = "docker"

      volume_mount {
        volume      = "wazuh-indexer"
        destination = "/volume/"
        read_only   = false
      }

      config {
        image   = "busybox:latest"
        command = "sh"
        args    = ["-c", "chown -R 1000:1000 /volume/"]
      }

      resources {
        cpu    = 200
        memory = 128
      }

      lifecycle {
        hook    = "prestart"
        sidecar = false
      }
    }

    # Prep disk task for manager volume permissions
    task "prep-manager-disk" {
      driver = "docker"

      volume_mount {
        volume      = "wazuh-manager"
        destination = "/volume/"
        read_only   = false
      }

      config {
        image   = "busybox:latest"
        command = "sh"
        args    = ["-c", "chown -R 999:999 /volume/"]
      }

      resources {
        cpu    = 200
        memory = 128
      }

      lifecycle {
        hook    = "prestart"
        sidecar = false
      }
    }


    # Prep disk task for dashboard volume permissions
    task "prep-dashboard-disk" {
      driver = "docker"

      volume_mount {
        volume      = "wazuh-dashboard"
        destination = "/volume/"
        read_only   = false
      }

      config {
        image   = "busybox:latest"
        command = "sh"
        args    = ["-c", "rm -rf /volume/wazuh && mkdir -p /volume/wazuh/config && chown -R 1000:1000 /volume/"]
      }

      resources {
        cpu    = 200
        memory = 128
      }

      lifecycle {
        hook    = "prestart"
        sidecar = false
      }
    }

    # Wazuh Indexer (OpenSearch-based)
    task "wazuh-indexer" {
      driver = "docker"

      volume_mount {
        volume      = "wazuh-indexer"
        destination = "/var/lib/wazuh-indexer"
        read_only   = false
      }

      config {
        image      = "wazuh/wazuh-indexer:4.14.4"
        force_pull = true
        ports      = ["indexer"]
        volumes = [
          "local/opensearch.yml:/usr/share/wazuh-indexer/config/opensearch.yml",
        ]
        ulimit {
          nofile = "65536:65536"
          memlock = "-1:-1"
        }
      }

      env {
        OPENSEARCH_JAVA_OPTS = "-Xms1g -Xmx1g"
      }

      template {
        data = <<EOH
network.host: "0.0.0.0"
node.name: "wazuh-indexer"
cluster.name: "wazuh-cluster"
path.data: /var/lib/wazuh-indexer
path.logs: /var/log/wazuh-indexer
discovery.type: single-node
compatibility.override_main_response_version: true

# Enable SSL with demo certificates
plugins.security.ssl.http.enabled: true
plugins.security.ssl.http.pemcert_filepath: certs/indexer.pem
plugins.security.ssl.http.pemkey_filepath: certs/indexer-key.pem
plugins.security.ssl.http.pemtrustedcas_filepath: certs/root-ca.pem
plugins.security.ssl.transport.enabled: true
plugins.security.ssl.transport.pemcert_filepath: certs/indexer.pem
plugins.security.ssl.transport.pemkey_filepath: certs/indexer-key.pem
plugins.security.ssl.transport.pemtrustedcas_filepath: certs/root-ca.pem
plugins.security.ssl.transport.enforce_hostname_verification: false
plugins.security.ssl.transport.resolve_hostname: false
plugins.security.allow_unsafe_democertificates: true
plugins.security.allow_default_init_securityindex: true
plugins.security.authcz.admin_dn:
  - "CN=admin,OU=Wazuh,O=Wazuh,L=California,C=US"
plugins.security.nodes_dn:
  - "CN=wazuh-indexer,OU=Wazuh,O=Wazuh,L=California,C=US"
plugins.security.audit.type: internal_opensearch
plugins.security.enable_snapshot_restore_privilege: true
plugins.security.check_snapshot_restore_write_privileges: true
plugins.security.restapi.roles_enabled: ["all_access", "security_rest_api_access"]
EOH
        destination = "local/opensearch.yml"
        perms       = "0644"
      }

      resources {
        cpu    = 1000
        memory = 2048
      }

      service {
        name = "wazuh-indexer"
        port = "indexer"

        check {
          type     = "tcp"
          port     = "indexer"
          interval = "10s"
          timeout  = "2s"
        }
      }
    }

    # Wazuh Manager (Analysis Engine)
    task "wazuh-manager" {
      driver = "docker"

      volume_mount {
        volume      = "wazuh-manager"
        destination = "/var/ossec/data"
        read_only   = false
      }

      config {
        image      = "wazuh/wazuh-manager:4.14.4"
        force_pull = true
        hostname   = "wazuh-manager"
        ports      = ["manager", "manager_reg", "manager_api"]
        volumes = [
          "local/local_rules.xml:/var/ossec/etc/rules/local_rules.xml:ro",
          "local/ossec.conf:/var/ossec/etc/ossec.conf:ro",
        ]
      }

      template {
        data = <<EOH
INDEXER_URL=https://{{ env "NOMAD_IP_indexer" }}:{{ env "NOMAD_HOST_PORT_indexer" }}
INDEXER_USERNAME=admin
INDEXER_PASSWORD=admin
FILEBEAT_SSL_VERIFICATION_MODE=none
SSL_CERTIFICATE_AUTHORITIES=""
API_USERNAME=wazuh-wui
API_PASSWORD=${var.wazuh_api_password}
EOH
        destination = "secrets/manager.env"
        env         = true
      }

      # Custom rules to suppress noisy alerts
      template {
        data = <<EOH
<!-- Local rules for Wazuh Manager -->
<group name="local,syslog,suricata,">

  <!-- Suppress noisy Suricata STREAM alerts (rule 86601) -->
  <!-- These "invalid ack" alerts are low-value network noise -->
  <rule id="100001" level="0">
    <if_sid>86601</if_sid>
    <description>Suppressed: Suricata STREAM ESTABLISHED invalid ack</description>
  </rule>

</group>
EOH
        destination = "local/local_rules.xml"
        perms       = "0644"
      }

      # Wazuh ossec.conf with log_alert_level=8 (only high/critical alerts)
      # Wazuh levels: 0=ignored, 1-4=low, 5-7=medium, 8-10=high, 11-15=critical
      template {
        data = <<EOH
<!--
  Wazuh - Manager - Default configuration for amzn 2023
  More info at: https://documentation.wazuh.com
  Mailing list: https://groups.google.com/forum/#!forum/wazuh

  CUSTOMIZED: log_alert_level set to 8 (high/critical alerts only)
-->

<ossec_config>
  <global>
    <jsonout_output>yes</jsonout_output>
    <alerts_log>yes</alerts_log>
    <logall>no</logall>
    <logall_json>no</logall_json>
    <email_notification>no</email_notification>
    <smtp_server>smtp.example.wazuh.com</smtp_server>
    <email_from>wazuh@example.wazuh.com</email_from>
    <email_to>recipient@example.wazuh.com</email_to>
    <email_maxperhour>12</email_maxperhour>
    <email_log_source>alerts.log</email_log_source>
    <agents_disconnection_time>15m</agents_disconnection_time>
    <agents_disconnection_alert_time>0</agents_disconnection_alert_time>
    <update_check>yes</update_check>
  </global>

  <alerts>
    <!-- CUSTOMIZED: Changed from 3 to 8 to only log high/critical alerts -->
    <log_alert_level>8</log_alert_level>
    <email_alert_level>12</email_alert_level>
  </alerts>

  <!-- Choose between "plain", "json", or "plain,json" for the format of internal logs -->
  <logging>
    <log_format>plain</log_format>
  </logging>

  <remote>
    <connection>secure</connection>
    <port>1514</port>
    <protocol>tcp</protocol>
    <queue_size>131072</queue_size>
  </remote>

  <!-- Policy monitoring -->
  <rootcheck>
    <disabled>no</disabled>
    <check_files>yes</check_files>
    <check_trojans>yes</check_trojans>
    <check_dev>yes</check_dev>
    <check_sys>yes</check_sys>
    <check_pids>yes</check_pids>
    <check_ports>yes</check_ports>
    <check_if>yes</check_if>

    <!-- Frequency that rootcheck is executed - every 12 hours -->
    <frequency>43200</frequency>

    <rootkit_files>etc/rootcheck/rootkit_files.txt</rootkit_files>
    <rootkit_trojans>etc/rootcheck/rootkit_trojans.txt</rootkit_trojans>

    <skip_nfs>yes</skip_nfs>

    <ignore>/var/lib/containerd</ignore>
    <ignore>/var/lib/docker/overlay2</ignore>
  </rootcheck>

  <wodle name="cis-cat">
    <disabled>yes</disabled>
    <timeout>1800</timeout>
    <interval>1d</interval>
    <scan-on-start>yes</scan-on-start>

    <java_path>wodles/java</java_path>
    <ciscat_path>wodles/ciscat</ciscat_path>
  </wodle>

  <!-- Osquery integration -->
  <wodle name="osquery">
    <disabled>yes</disabled>
    <run_daemon>yes</run_daemon>
    <log_path>/var/log/osquery/osqueryd.results.log</log_path>
    <config_path>/etc/osquery/osquery.conf</config_path>
    <add_labels>yes</add_labels>
  </wodle>

  <!-- System inventory -->
  <wodle name="syscollector">
    <disabled>no</disabled>
    <interval>1h</interval>
    <scan_on_start>yes</scan_on_start>
    <hardware>yes</hardware>
    <os>yes</os>
    <network>yes</network>
    <packages>yes</packages>
    <ports all="yes">yes</ports>
    <processes>yes</processes>
    <users>yes</users>
    <groups>yes</groups>
    <services>yes</services>
    <browser_extensions>yes</browser_extensions>

    <!-- Database synchronization settings -->
    <synchronization>
      <max_eps>10</max_eps>
    </synchronization>
  </wodle>

  <sca>
    <enabled>yes</enabled>
    <scan_on_start>yes</scan_on_start>
    <interval>12h</interval>
    <skip_nfs>yes</skip_nfs>
  </sca>

  <vulnerability-detection>
    <enabled>yes</enabled>
    <index-status>yes</index-status>
    <feed-update-interval>60m</feed-update-interval>
  </vulnerability-detection>

  <indexer>
    <enabled>yes</enabled>
    <hosts>
      <host>https://{{ env "NOMAD_IP_indexer" }}:{{ env "NOMAD_HOST_PORT_indexer" }}</host>
    </hosts>
    <ssl>
      <certificate_authorities>
        <ca>/etc/filebeat/certs/root-ca.pem</ca>
      </certificate_authorities>
      <certificate>/etc/filebeat/certs/filebeat.pem</certificate>
      <key>/etc/filebeat/certs/filebeat-key.pem</key>
    </ssl>
  </indexer>

  <!-- File integrity monitoring -->
  <syscheck>
    <disabled>no</disabled>

    <!-- Frequency that syscheck is executed default every 12 hours -->
    <frequency>43200</frequency>

    <scan_on_start>yes</scan_on_start>

    <!-- Generate alert when new file detected -->
    <alert_new_files>yes</alert_new_files>

    <!-- Don't ignore files that change more than 'frequency' times -->
    <auto_ignore frequency="10" timeframe="3600">no</auto_ignore>

    <!-- Directories to check  (perform all possible verifications) -->
    <directories>/etc,/usr/bin,/usr/sbin</directories>
    <directories>/bin,/sbin,/boot</directories>

    <!-- Files/directories to ignore -->
    <ignore>/etc/mtab</ignore>
    <ignore>/etc/hosts.deny</ignore>
    <ignore>/etc/mail/statistics</ignore>
    <ignore>/etc/random-seed</ignore>
    <ignore>/etc/random.seed</ignore>
    <ignore>/etc/adjtime</ignore>
    <ignore>/etc/httpd/logs</ignore>
    <ignore>/etc/utmpx</ignore>
    <ignore>/etc/wtmpx</ignore>
    <ignore>/etc/cups/certs</ignore>
    <ignore>/etc/dumpdates</ignore>
    <ignore>/etc/svc/volatile</ignore>

    <!-- File types to ignore -->
    <ignore type="sregex">.log$|.swp$</ignore>

    <!-- Check the file, but never compute the diff -->
    <nodiff>/etc/ssl/private.key</nodiff>

    <skip_nfs>yes</skip_nfs>
    <skip_dev>yes</skip_dev>
    <skip_proc>yes</skip_proc>
    <skip_sys>yes</skip_sys>

    <!-- Nice value for Syscheck process -->
    <process_priority>10</process_priority>

    <!-- Maximum output throughput -->
    <max_eps>50</max_eps>

    <!-- Database synchronization settings -->
    <synchronization>
      <enabled>yes</enabled>
      <interval>5m</interval>
      <max_eps>10</max_eps>
    </synchronization>
  </syscheck>

  <!-- Active response -->
  <global>
    <white_list>127.0.0.1</white_list>
    <white_list>^localhost.localdomain$</white_list>
    <white_list>168.63.129.16</white_list>
  </global>

  <command>
    <name>disable-account</name>
    <executable>disable-account</executable>
    <timeout_allowed>yes</timeout_allowed>
  </command>

  <command>
    <name>restart-wazuh</name>
    <executable>restart-wazuh</executable>
  </command>

  <command>
    <name>firewall-drop</name>
    <executable>firewall-drop</executable>
    <timeout_allowed>yes</timeout_allowed>
  </command>

  <command>
    <name>host-deny</name>
    <executable>host-deny</executable>
    <timeout_allowed>yes</timeout_allowed>
  </command>

  <command>
    <name>route-null</name>
    <executable>route-null</executable>
    <timeout_allowed>yes</timeout_allowed>
  </command>

  <command>
    <name>win_route-null</name>
    <executable>route-null.exe</executable>
    <timeout_allowed>yes</timeout_allowed>
  </command>

  <command>
    <name>netsh</name>
    <executable>netsh.exe</executable>
    <timeout_allowed>yes</timeout_allowed>
  </command>

  <!--
  <active-response>
    active-response options here
  </active-response>
  -->

  <!-- Log analysis -->
  <localfile>
    <log_format>command</log_format>
    <command>df -P</command>
    <frequency>360</frequency>
  </localfile>

  <localfile>
    <log_format>full_command</log_format>
    <command>netstat -tulpn | sed 's/\([[:alnum:]]\+\)\ \+[[:digit:]]\+\ \+[[:digit:]]\+\ \+\(.*\):\([[:digit:]]*\)\ \+\([0-9\.\:\*]\+\).\+\ \([[:digit:]]*\/[[:alnum:]\-]*\).*/\1 \2 == \3 == \4 \5/' | sort -k 4 -g | sed 's/ == \(.*\) ==/:\1/' | sed 1,2d</command>
    <alias>netstat listening ports</alias>
    <frequency>360</frequency>
  </localfile>

  <localfile>
    <log_format>full_command</log_format>
    <command>last -n 20</command>
    <frequency>360</frequency>
  </localfile>

  <ruleset>
    <!-- Default ruleset -->
    <decoder_dir>ruleset/decoders</decoder_dir>
    <rule_dir>ruleset/rules</rule_dir>
    <rule_exclude>0215-policy_rules.xml</rule_exclude>
    <list>etc/lists/audit-keys</list>
    <list>etc/lists/amazon/aws-eventnames</list>
    <list>etc/lists/security-eventchannel</list>
    <list>etc/lists/malicious-ioc/malware-hashes</list>
    <list>etc/lists/malicious-ioc/malicious-ip</list>
    <list>etc/lists/malicious-ioc/malicious-domains</list>

    <!-- User-defined ruleset -->
    <decoder_dir>etc/decoders</decoder_dir>
    <rule_dir>etc/rules</rule_dir>
  </ruleset>

  <rule_test>
    <enabled>yes</enabled>
    <threads>1</threads>
    <max_sessions>64</max_sessions>
    <session_timeout>15m</session_timeout>
  </rule_test>

  <!-- Configuration for wazuh-authd -->
  <auth>
    <disabled>no</disabled>
    <port>1515</port>
    <use_source_ip>no</use_source_ip>
    <purge>yes</purge>
    <use_password>no</use_password>
    <ciphers>HIGH:!ADH:!EXP:!MD5:!RC4:!3DES:!CAMELLIA:@STRENGTH</ciphers>
    <!-- <ssl_agent_ca></ssl_agent_ca> -->
    <ssl_verify_host>no</ssl_verify_host>
    <ssl_manager_cert>etc/sslmanager.cert</ssl_manager_cert>
    <ssl_manager_key>etc/sslmanager.key</ssl_manager_key>
    <ssl_auto_negotiate>no</ssl_auto_negotiate>
  </auth>

  <cluster>
    <name>wazuh</name>
    <node_name>node01</node_name>
    <node_type>master</node_type>
    <key></key>
    <port>1516</port>
    <bind_addr>0.0.0.0</bind_addr>
    <nodes>
        <node>NODE_IP</node>
    </nodes>
    <hidden>no</hidden>
    <disabled>yes</disabled>
  </cluster>

</ossec_config>

<ossec_config>
  <localfile>
    <log_format>syslog</log_format>
    <location>/var/ossec/logs/active-responses.log</location>
  </localfile>

</ossec_config>
EOH
        destination = "local/ossec.conf"
        perms       = "0644"
      }

      resources {
        cpu    = 1000
        memory = 1024
      }

      service {
        name = "wazuh-manager"
        port = "manager_api"
        tags = ["metrics"]

        meta {
          api_port = "${NOMAD_HOST_PORT_manager_api}"
        }

        check {
          type     = "tcp"
          port     = "manager_api"
          interval = "10s"
          timeout  = "2s"
        }
      }

      service {
        name = "wazuh-agent-comm"
        port = "manager"
        tags = ["agent-communication"]

        check {
          type     = "tcp"
          port     = "manager"
          interval = "10s"
          timeout  = "2s"
        }
      }

      service {
        name = "wazuh-agent-reg"
        port = "manager_reg"
        tags = ["agent-registration"]

        check {
          type     = "tcp"
          port     = "manager_reg"
          interval = "10s"
          timeout  = "2s"
        }
      }
    }

    # Wazuh Dashboard (Web UI)
    task "wazuh-dashboard" {
      driver = "docker"

      volume_mount {
        volume      = "wazuh-dashboard"
        destination = "/usr/share/wazuh-dashboard/data"
        read_only   = false
      }

      config {
        image      = "wazuh/wazuh-dashboard:4.14.4"
        force_pull = true
        ports      = ["dashboard"]
        volumes = [
          "local/opensearch_dashboards.yml:/usr/share/wazuh-dashboard/config/opensearch_dashboards.yml",
          "local/wazuh.yml:/usr/share/wazuh-dashboard/data/wazuh/config/wazuh.yml:ro",
        ]
      }

      template {
        data = <<EOH
OPENSEARCH_HOSTS=https://{{ env "NOMAD_IP_indexer" }}:{{ env "NOMAD_HOST_PORT_indexer" }}
OPENSEARCH_USERNAME=admin
OPENSEARCH_PASSWORD=admin
OPENSEARCH_SSL_VERIFICATIONMODE=none
SERVER_HOST=0.0.0.0
SERVER_PORT=443
SERVER_SSL_ENABLED=true
SERVER_SSL_CERTIFICATE=/usr/share/wazuh-dashboard/config/certs/dashboard.pem
SERVER_SSL_KEY=/usr/share/wazuh-dashboard/config/certs/dashboard-key.pem
WAZUH_API_URL=https://{{ env "NOMAD_IP_manager_api" }}:{{ env "NOMAD_HOST_PORT_manager_api" }}
API_USERNAME=wazuh-wui
API_PASSWORD=${var.wazuh_api_password}
EOH
        destination = "secrets/dashboard.env"
        env         = true
        change_mode = "noop"
      }

      template {
        data = <<EOH
server.host: "0.0.0.0"
server.port: 443
opensearch.hosts: ["https://{{ env "NOMAD_IP_indexer" }}:{{ env "NOMAD_HOST_PORT_indexer" }}"]
opensearch.ssl.verificationMode: none
opensearch.username: "admin"
opensearch.password: "admin"
opensearch.requestHeadersWhitelist: ["securitytenant","Authorization"]
opensearch_security.multitenancy.enabled: false
opensearch_security.readonly_mode.roles: ["kibana_read_only"]
server.ssl.enabled: true
server.ssl.certificate: /usr/share/wazuh-dashboard/config/certs/dashboard.pem
server.ssl.key: /usr/share/wazuh-dashboard/config/certs/dashboard-key.pem
uiSettings.overrides.defaultRoute: "/app/wz-home"
csp.warnLegacyBrowsers: false
EOH
        destination = "local/opensearch_dashboards.yml"
        perms       = "0644"
        change_mode = "noop"
      }

      template {
        data = <<EOH
hosts:
  - default:
      url: https://{{ env "NOMAD_IP_manager_api" }}
      port: {{ env "NOMAD_HOST_PORT_manager_api" }}
      username: wazuh-wui
      password: ${var.wazuh_api_password}
      run_as: false
EOH
        destination = "local/wazuh.yml"
        perms       = "0644"
        change_mode = "noop"
      }

      resources {
        cpu    = 500
        memory = 1024
      }

      service {
        name = "wazuh-dashboard"
        port = "dashboard"
        tags = [
          "traefik.enable=true",
          "traefik.http.routers.wazuh.rule=Host(`wazuh.${var.tld}`)",
          "traefik.http.routers.wazuh.entrypoints=websecure",
          "traefik.http.routers.wazuh.tls=true",
          "traefik.http.routers.wazuh.tls.certresolver=letsencrypt",
          "traefik.http.services.wazuh.loadbalancer.server.scheme=https",
          "traefik.http.services.wazuh.loadbalancer.serversTransport=insecure-skip-verify@file",
        ]

        check {
          type     = "tcp"
          port     = "dashboard"
          interval = "10s"
          timeout  = "2s"
        }
      }
    }

  }
}

variable "region" {
  type = string
}

variable "tld" {
  type = string
}

variable "shared_dir" {
  type = string
}

variable "wazuh_indexer_password" {
  type = string
  description = "Password for Wazuh indexer admin user"
}

variable "wazuh_api_password" {
  type = string
  description = "Password for Wazuh API user"
}

variable "wazuh_dashboard_password" {
  type = string
  description = "Password for Wazuh dashboard kibanaserver user"
}


================================================
FILE: nomad_jobs/security/wazuh-server/volume-dashboard.hcl
================================================
type = "csi"
id = "wazuh-dashboard"
name = "wazuh-dashboard"
plugin_id = "org.democratic-csi.iscsi"

capability {
  access_mode = "single-node-writer"
  attachment_mode = "file-system"
}

# iSCSI volume will be created via democratic-csi
# No additional context needed - managed by TrueNAS/democratic-csi


================================================
FILE: nomad_jobs/security/wazuh-server/volume-indexer.hcl
================================================
type = "csi"
id = "wazuh-indexer"
name = "wazuh-indexer"
plugin_id = "org.democratic-csi.iscsi"

capability {
  access_mode = "single-node-writer"
  attachment_mode = "file-system"
}

# iSCSI volume will be created via democratic-csi
# No additional context needed - managed by TrueNAS/democratic-csi


================================================
FILE: nomad_jobs/security/wazuh-server/volume-manager.hcl
================================================
type = "csi"
id = "wazuh-manager"
name = "wazuh-manager"
plugin_id = "org.democratic-csi.iscsi"

capability {
  access_mode = "single-node-writer"
  attachment_mode = "file-system"
}

# iSCSI volume will be created via democratic-csi
# No additional context needed - managed by TrueNAS/democratic-csi


================================================
FILE: nomad_jobs/smart-home/deconz/nomad.job
================================================
job "deconz" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/smart-home/deconz/nomad.job"
service_owner = "@pmanuk"
    version = "3"
  }

  constraint {
    attribute = "${meta.zigbee}"
    operator  = "="
    value     = "true"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "homeautomation" {
    count = 1 

    network {
      port "web" {
        static = "8182"
        host_network = "lan"
      }
      port "ws" {
        host_network = "lan"
      }
    }

    volume "deconz" {
      type      = "csi"
      read_only = false

      source    = "deconz"
      access_mode = "single-node-writer"
      attachment_mode = "file-system"
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "deconz" {
      driver = "docker"
      config {
        image = "deconzcommunity/deconz:2.33.0"
        force_pull = true
        ports = ["web", "ws"]
        privileged = true
        volumes = [
          "/dev/ttyACM0:/dev/ttyACM0",
        ]
      }

      volume_mount {
        volume      = "deconz"
        destination = "/opt/deCONZ"
        read_only   = false
      }

      service {
        port = "web"
	name = "deconz"
        tags = [
          "traefik.enable=true",
          "traefik.http.middlewares.httpsRedirect.redirectscheme.scheme=https",
          "traefik.http.middlewares.cors.headers.accesscontrolallowmethods=GET,OPTIONS,PUT",
          "traefik.http.middlewares.cors.headers.accesscontrolmaxage=100",
          "traefik.http.middlewares.cors.headers.addvaryheader=true",


          "traefik.http.routers.${NOMAD_TASK_NAME}.tls.domains[0].sans=${NOMAD_TASK_NAME}.${var.tld}",
          "traefik.http.middlewares.malpotAuth.basicauth.users=${var.auth}",
          "traefik.http.routers.${NOMAD_TASK_NAME}.middlewares=forward-auth, malpotAuth"
        ]
        check {
          type     = "http"
          path     = "/"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      env {
        TZ = "Europe/Amsterdam"
        DECONZ_WEB_PORT = "${NOMAD_PORT_web}"
        DECONZ_WS_PORT = "${NOMAD_PORT_ws}"
        DECONZ_DEVICE = "/dev/ttyACM0"
        DECONZ_VNC_MODE = "0"
        DECONZ_VNC_PASSWORD = "changeme"
        DECONZ_VNC_PORT = "5901"
      }

      resources {
        cpu    = 100
        memory = 256
      }
    }
  }
}

variable "region" {
    type = string
}


variable "tld" {
    type = string
}

variable "shared_dir" {
    type = string
}

variable "auth" {
   type = string
}


================================================
FILE: nomad_jobs/smart-home/deconz/volume.hcl
================================================
id           = "deconz"
external_id  = "deconz"
name         = "deconz"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "1GiB"
capacity_max = "1GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}


================================================
FILE: nomad_jobs/smart-home/home-assistant/nomad.job
================================================
job "home-assistant" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/smart-home/home-assistant/nomad.job"
service_owner = "@pmanuk"
    version = "4"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  constraint {
    attribute = "${meta.zigbee}"
    operator  = "="
    value     = "true"
  }

  group "home-automation" {
    count = 1 

    network {
      port "http" {
        static = "8123"
        host_network = "lan"
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "hass" {
      driver = "docker"
      config {
        image = "homeassistant/home-assistant:2026.4.3"
        network_mode = "host"
        privileged = "true"
        volumes = [
          "/run/dbus:/run/dbus",
          "${var.shared_dir}home-assistant:/config",
        ]
      }

      service {
        port = "http"
        name = "hass"
        tags = [
          "traefik.enable=true",
          "traefik.http.middlewares.httpsRedirect.redirectscheme.scheme=https",
          "traefik.http.routers.${NOMAD_TASK_NAME}.tls.domains[0].sans=${NOMAD_TASK_NAME}.${var.tld}",
          "traefik.http.routers.${NOMAD_TASK_NAME}.middlewares=forward-auth"
        ]
        check {
          type     = "tcp"
          interval = "10s"
          timeout  = "2s"
        }
      }

      resources {
        cpu    = 100
        memory = 512
      }
    }
  }
}

variable "region" {
    type = string
}


variable "tld" {
    type = string
}

variable "shared_dir" {
    type = string
}


================================================
FILE: nomad_jobs/smart-home/home-assistant/volume.hcl
================================================
id           = "home-assistant"
external_id  = "home-assistant"
name         = "home-assistant"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "1GiB"
capacity_max = "1GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}


================================================
FILE: nomad_jobs/smart-home/mqtt/nomad.job
================================================
job "mosquitto" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/smart-home/mqtt/nomad.job"
version = "4"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "homeautomation" {
    count = 1 

    network {
      port "0" {
        host_network = "tailscale"
        to = "9001"
      }
      port "1" {
        host_network = "tailscale"
        to = "1883"
      }
    }


    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "mosquitto" {
      driver = "docker"
      config {
        image = "docker-registry.${var.tld}/mosquitto:2"
        force_pull = true
        network_mode = "host"
        ports = ["0", "1"]
        volumes = [
          "${var.shared_dir}mosquitto:/mosquitto/",
        ]
      }

      service {
         tags = ["mqtt", "net-internal"]
         name = "mqtt"
         port = "1"
      }

      env {
        TZ = "Europe/Amsterdam"
      }

      resources {
        cpu    = 100
        memory = 64
      }
    }
  }
}

variable "region" {
    type = string
}

variable "tld" {}

variable "shared_dir" {
    type = string
}


================================================
FILE: nomad_jobs/smart-home/owntracks-recorder/nomad.job
================================================
job "owntracks-recorder" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/smart-home/owntracks-recorder/nomad.job"
version = "4"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "tracking" {
    count = 1 

    network {
      port "http" {
        host_network = "tailscale"
        to = "8083"
      }
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "owntracks" {
      driver = "docker"
      config {
        image = "owntracks/recorder:1.0.1"
        args = [
          "--http-host", "${NOMAD_IP_http}"
        ]
        force_pull = true
        #network_mode = "host"
        ports = ["http"]
        volumes = [
          "${var.shared_dir}owntracks-recorder:/store/",
          "${var.shared_dir}owntracks-recorder/views:/htdocs/views/",
        ]
      }

      service {
        port = "http"
        name = "owntracks"
        tags = [
          "traefik.enable=true",
          "traefik.http.middlewares.httpsRedirect.redirectscheme.scheme=https",


          "traefik.http.routers.${NOMAD_TASK_NAME}.tls.domains[0].sans=${NOMAD_TASK_NAME}.${var.tld}",
          "traefik.http.middlewares.malpotAuthNew.basicauth.users=${var.auth}",
          "traefik.http.routers.${NOMAD_TASK_NAME}.middlewares=forward-auth, forward-auth"
        ]
        check {
          type     = "http"
          path     = "/"
          interval = "10s"
          timeout  = "10s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      env {
        TZ = "Europe/Amsterdam"
        OTR_HOST = "mqtt-pub.${var.tld}"
        OTR_PORT = "8883"
        OTR_USER = "mqtt"
        OTR_PASS = var.otr_pass
        OTR_STORAGEDIR = "/store"
        OTR_VIEWSDIR = "/store/views"
        #OTR_CAPATH = "/etc/ssl/certs"
      }

      resources {
        cpu    = 100
        memory = 256
      }
    }
  }
}

variable "region" {}

variable "tld" {}

variable "shared_dir" {}

variable "auth" {}

variable "otr_pass" {}


================================================
FILE: nomad_jobs/smart-home/zigbee2mqtt/nomad.job
================================================
job "zigbee2mqtt" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  meta {
      job_file = "nomad_jobs/smart-home/zigbee2mqtt/nomad.job"
service_owner = "@pmanuk"
    version = "15"
  }

  group "homeautomation" {
    count = 1 
    network {
      port "tcp" {
        host_network = "lan"
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    task "zigbee2mqtt" {
      driver = "docker"
      config {
        image = "koenkk/zigbee2mqtt"
        force_pull = true
        network_mode = "host"
        ports = ["tcp"]
        privileged = true
        volumes = [
          "${var.shared_dir}zigbee2mqtt:/app/data",
          "${var.shared_dir}zigbee2mqtt/zigbee-shepherd-converters:/app/node_modules/zigbee-shepherd-converters",
          "/dev/ttyACM0:/dev/ttyACM0",
        ]
      }

      env {
        TZ = "Europe/Amsterdam"
      }

      resources {
        cpu    = 100
        memory = 256
      }
    }
  }
}

variable "region" {
    type = string
}


variable "shared_dir" {
    type = string
}


================================================
FILE: nomad_jobs/storage-backends/docker-registry/nomad.job
================================================
job "docker-registry" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/storage-backends/docker-registry/nomad.job"
version = "4"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "infrastructure" {
    count = 1 

    network {
      port "http" {
        static = "5000"
        host_network = "lan"
      }
    }

    volume "docker-registry" {
      type      = "csi"
      read_only = false
      source    = "docker-registry-data"
      access_mode = "single-node-writer"
      attachment_mode = "file-system"
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "docker-registry" {
      driver = "docker"
      config {
        image = "registry:3.1.0"
        ports = ["http"]
        network_mode = "host"
      }

      volume_mount {
        volume      = "docker-registry"
        destination = "/data"
        read_only   = false
      }

      env {
        REGISTRY_STORAGE_FILESYSTEM_ROOTDIRECTORY = "/data"
        REGISTRY_HTTP_ADDR = "${NOMAD_ADDR_http}"
      }
      service {
        port = "http"
	      name = "docker-registry"
        tags = [
          "traefik.enable=true"
        ]
        check {
          type     = "http"
          path     = "/"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 20
        memory = 64
      }
    }
  }
}

variable "region" {
    type = string
}

variable "tld" {
    type = string
}

variable "shared_dir" {
    type = string
}


================================================
FILE: nomad_jobs/storage-backends/docker-registry/volume.hcl
================================================
id           = "docker-registry-data"
external_id  = "docker-registry-data"
name         = "docker-registry-data"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "10GiB"
capacity_max = "10GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime", "nodiratime", "data=ordered"]
}


================================================
FILE: nomad_jobs/storage-backends/mariadb/nomad.job
================================================
job "mariadb" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/storage-backends/mariadb/nomad.job"
version = "2"  // Incremented version number
  }

  group "db" {
    network {
      mode = "host"
      port "mariadb" {
        static = "3306"
        host_network = "lan"
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    task "mariadb" {
      driver = "docker"

      config {
        image = "mariadb:11"
        volumes = [
          "${var.shared_dir}shared-mariadb:/var/lib/mysql",
        ]
        ports = ["mariadb"]
      }

      env {
        MARIADB_ROOT_PASSWORD = "${var.db_password}"
      }

      service {
        name = "${NOMAD_JOB_NAME}"
        tags = ["mariadb"]
        port = "mariadb"

        check {
          type     = "tcp"
          port     = "mariadb"
          interval = "30s"
          timeout  = "2s"
        }
      }

      resources {
        cpu    = "200"
        memory = "512"
      }
    }
  }
}

variable "region" {
    type = string
}

variable "shared_dir" {
    type = string
}

variable "db_password" {
    type = string
    description = "Password for MariaDB root user"
}


================================================
FILE: nomad_jobs/storage-backends/neo4j/nomad.job
================================================
job "neo4j" {
  region = var.region
  datacenters = ["dc1"]
  type = "service"

  meta {
    job_file = "nomad_jobs/storage-backends/neo4j/nomad.job"
    version = "3"
  }

  group "neo4j" {
    count = 1

    network {
      mode = "host"
      port "http" {
        static = 7474
        host_network = "lan"
      }
      port "https" {
        static = 7473
        host_network = "lan"
      }
      port "bolt" {
        static = 7687
        host_network = "lan"
      }
    }

    volume "neo4j-data" {
      type            = "csi"
      read_only       = false
      source          = "neo4j-data"
      access_mode     = "single-node-writer"
      attachment_mode = "file-system"
    }


    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "neo4j" {
      driver = "docker"

      config {
        image = "neo4j:5.26"
        ports = ["http", "https", "bolt"]
      }

      volume_mount {
        volume      = "neo4j-data"
        destination = "/data"
        read_only   = false
      }

      env {
        NEO4J_AUTH = "neo4j/ChAnGeMe"
        NEO4J_PLUGINS = "[\"apoc\"]"
        NEO4J_apoc_export_file_enabled = "true"
        NEO4J_apoc_import_file_enabled = "true"
        NEO4J_apoc_import_file_use__neo4j__config = "true"
      }

      resources {
        cpu    = 100
        memory = 1600
      }

      service {
        name = "neo4j"
        tags = ["graph-db", "ai"]
        port = "bolt"

        check {
          type     = "tcp"
          port     = "bolt"
          interval = "30s"
          timeout  = "2s"
        }
      }
    }
  }

}
variable "region" {
  type = string
  default = "global"
}


================================================
FILE: nomad_jobs/storage-backends/neo4j/setup.job
================================================
job "neo4j-setup" {
  region = var.region
  datacenters = ["dc1"]
  type = "batch"

  meta {
    job_file = "nomad_jobs/storage-backends/neo4j/setup.job"
    version = "2"
  }

  group "setup" {

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    task "neo4j-init" {
      driver = "docker"

      config {
        image = "neo4j:5.26"
        command = "cypher-shell"
        args = [
          "-a", "neo4j.service.consul:7687",
          "-u", "neo4j", 
          "-p", "ChAnGeMe",
          "CREATE CONSTRAINT cognee_node_id IF NOT EXISTS FOR (n:CogneeNode) REQUIRE n.id IS UNIQUE;"
        ]
      }

      template {
        data = <<EOH
NEO4J_PASSWORD="changeme"
EOH
        destination = "secrets/neo4j-config.env"
        env = true
      }

      resources {
        cpu    = 200
        memory = 256
      }
    }
  }

}
variable "region" {
  type = string
  default = "global"
}


================================================
FILE: nomad_jobs/storage-backends/neo4j/volume.hcl
================================================
# Neo4j graph database storage volume
id           = "neo4j-data"
name         = "neo4j-data"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "8GiB"
capacity_max = "8GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}


================================================
FILE: nomad_jobs/storage-backends/pgvector/nomad.job
================================================
job "pgvector" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/storage-backends/pgvector/nomad.job"
    version = "5"  // Reduced memory 256MB -> 128MB
  }

  group "db" {
    network {
      mode = "host"
      port "pgvector" {
        static = "5432"  
        host_network = "lan"
      }
    }
    

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "pgvector" {
      driver = "docker"
      config {
        image = "pgvector/pgvector:pg16"
        volumes = [
          "${var.shared_dir}pgvector-data:/var/lib/postgresql/data",
        ]
        ports = ["pgvector"]
      }

      env {
        POSTGRES_DB       = "vectordb"
        POSTGRES_USER     = "postgres"
        POSTGRES_PASSWORD = "${var.postgres_pass}"
        PGDATA            = "/var/lib/postgresql/data"
      }

      service {
        name = "${NOMAD_JOB_NAME}"
        tags = ["pgvector", "database", "vector-database"]
        port = "pgvector"

        check {
          type     = "tcp"
          port     = "pgvector"
          interval = "30s"
          timeout  = "2s"
        }
      }

      resources {
        cpu    = "100"
        memory = "128"
      }
    }
  }
}

variable "region" {}
variable "shared_dir" {}
variable "pgvector_admin_password" {}


================================================
FILE: nomad_jobs/storage-backends/pgvector/pgvector-setup.job
================================================
job "pgvector-setup" {
  type = "batch"
  datacenters = ["dc1"]
  
  meta {
    job_file = "nomad_jobs/storage-backends/pgvector/pgvector-setup.job"
    version = "1"
  }
  
  group "setup" {

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    task "initialize-pgvector" {
      driver = "docker"
      
      config {
        image = "pgvector/pgvector:pg16"
        command = "sh"
        args = [
          "-c",
          "PGPASSWORD=$PGVECTOR_PASSWORD psql -h 192.168.50.120 -p 5432 -U postgres -d cognee_db -c \"CREATE EXTENSION IF NOT EXISTS vector;\" && PGPASSWORD=$PGVECTOR_PASSWORD psql -h 192.168.50.120 -p 5432 -U postgres -c \"DO \\$\\$ BEGIN CREATE DATABASE embeddings; EXCEPTION WHEN duplicate_database THEN RAISE NOTICE 'embeddings database exists'; END \\$\\$;\" && PGPASSWORD=$PGVECTOR_PASSWORD psql -h 192.168.50.120 -p 5432 -U postgres -d embeddings -c \"CREATE EXTENSION IF NOT EXISTS vector;\""
        ]
      }
      
      env {
        PGVECTOR_PASSWORD = "${var.pgvector_pass}"
      }
      
      resources {
        cpu    = 200
        memory = 256
      }
    }
  }
}

variable "pgvector_pass" {
  type = string
  description = "Admin password for the pgvector PostgreSQL server"
}


================================================
FILE: nomad_jobs/storage-backends/postgres/nomad.job
================================================
job "postgres" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/storage-backends/postgres/nomad.job"
version = "5"  // Fixed postgres password variable
  }

  group "db" {
    network {
      mode = "host"
      port "postgres" {
        static = "5432"
        host_network = "lan"
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "postgres" {
      driver = "docker"

      config {
        image = "postgres:15.17"
        volumes = [
          "${var.shared_dir}paperless-postgres:/appdata/postgres",
        ]
        ports = ["postgres"]
      }

      env {
        POSTGRES_DB       = "paperless"
        POSTGRES_USER     = "postgres"
        POSTGRES_PASSWORD = "${var.postgres_pass}"
        PGDATA            = "/appdata/postgres"
      }

      service {
        name = "${NOMAD_JOB_NAME}"
        tags = ["postgres"]
        port = "postgres"

        check {
          type     = "tcp"
          port     = "postgres"
          interval = "30s"
          timeout  = "2s"
        }
      }

      resources {
        cpu    = "200"
        memory = "512"
      }
    }
  }
}

variable "region" {
    type = string
}

variable "shared_dir" {
    type = string
}

variable "postgres_pass" {
    type = string
    description = "Admin password for PostgreSQL"
}


================================================
FILE: nomad_jobs/storage-backends/postgres/postgres-setup.job
================================================
job "postgres-setup" {
  type = "batch"
  datacenters = ["dc1"]
  
  meta {
      job_file = "nomad_jobs/storage-backends/postgres/postgres-setup.job"
version = "2"
  }
  
  group "setup" {

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    task "create-dbs" {
      driver = "docker"
      
      config {
        image = "postgres:15"
        command = "sh"
        args = [
          "-c",
          "PGPASSWORD=$POSTGRES_PASSWORD psql -h postgres.service.consul -U postgres -c \"DO \\$\\$ BEGIN CREATE DATABASE sonarr_main; EXCEPTION WHEN duplicate_database THEN RAISE NOTICE 'sonarr_main exists'; END \\$\\$;\" -c \"DO \\$\\$ BEGIN CREATE DATABASE sonarr_logs; EXCEPTION WHEN duplicate_database THEN RAISE NOTICE 'sonarr_logs exists'; END \\$\\$;\" -c \"DO \\$\\$ BEGIN CREATE DATABASE radarr_main; EXCEPTION WHEN duplicate_database THEN RAISE NOTICE 'radarr_main exists'; END \\$\\$;\" -c \"DO \\$\\$ BEGIN CREATE DATABASE radarr_logs; EXCEPTION WHEN duplicate_database THEN RAISE NOTICE 'radarr_logs exists'; END \\$\\$;\" -c \"DO \\$\\$ BEGIN CREATE DATABASE lidarr_main; EXCEPTION WHEN duplicate_database THEN RAISE NOTICE 'lidarr_main exists'; END \\$\\$;\" -c \"DO \\$\\$ BEGIN CREATE DATABASE lidarr_logs; EXCEPTION WHEN duplicate_database THEN RAISE NOTICE 'lidarr_logs exists'; END \\$\\$;\" -c \"DO \\$\\$ BEGIN CREATE DATABASE litellm; EXCEPTION WHEN duplicate_database THEN RAISE NOTICE 'litellm exists'; END \\$\\$;\" -c \"DO \\$\\$ BEGIN CREATE DATABASE nextcloud; EXCEPTION WHEN duplicate_database THEN RAISE NOTICE 'nextcloud exists'; END \\$\\$;\" -c \"DO \\$\\$ BEGIN CREATE DATABASE paperless; EXCEPTION WHEN duplicate_database THEN RAISE NOTICE 'paperless exists'; END \\$\\$;\" "
        ]
      }
      
      env {
        POSTGRES_PASSWORD = "${var.postgres_pass}"
      }
      
      resources {
        cpu    = 200
        memory = 256
      }
    }
  }
}

variable "postgres_pass" {
  type = string
  description = "Admin password for the PostgreSQL server"
}


================================================
FILE: nomad_jobs/storage-backends/qdrant/nomad.job
================================================
job "qdrant" {
  region = var.region
  datacenters = ["dc1"]
  type = "service"

  meta {
    job_file = "nomad_jobs/storage-backends/qdrant/nomad.job"
    version = "3"
  }

  group "qdrant" {
    count = 1

    network {
      mode = "host"
      port "http" {
        static = 6333
        to = 6333
        host_network = "lan"
      }
      port "grpc" {
        static = 6334
        to = 6334
        host_network = "lan"
      }
    }

    volume "qdrant-data" {
      type = "csi"
      read_only = false
      source = "qdrant-data"
      access_mode = "single-node-writer"
      attachment_mode = "file-system"
    }


    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "qdrant" {
      driver = "docker"

      config {
        image = "qdrant/qdrant:v1.17"
        ports = ["http", "grpc"]
      }

      volume_mount {
        volume      = "qdrant-data"
        destination = "/qdrant/storage"
        read_only   = false
      }

      resources {
        cpu    = 500
        memory = 128
      }

      service {
        name = "qdrant"
        tags = ["vector-db", "ai", "http"]
        port = "http"

        check {
          type     = "tcp"
          port     = "http"
          interval = "30s"
          timeout  = "2s"
        }
      }
    }
  }

}
variable "region" {
  type = string
  default = "global"
}


================================================
FILE: nomad_jobs/storage-backends/qdrant/volume.hcl
================================================
# Qdrant vector database storage volume
id           = "qdrant-data"
name         = "qdrant-data"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "10GiB"
capacity_max = "10GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime"]
}


================================================
FILE: nomad_jobs/storage-backends/redis/nomad.job
================================================
job "redis" {
  region      = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/storage-backends/redis/nomad.job"
    version  = "4"  // Reduced memory 512MB -> 128MB
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "db" {
    count = 1

    network {
      mode = "host"
      port "redis" {
        static       = 6379
        host_network = "lan"
      }
    }

    volume "redis" {
      type            = "csi"
      read_only       = false
      source          = "redis-data"
      access_mode     = "single-node-writer"
      attachment_mode = "file-system"
    }


    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "prep-disk" {
      driver = "docker"
      volume_mount {
        volume      = "redis"
        destination = "/volume/"
        read_only   = false
      }
      config {
        image   = "busybox:latest"
        command = "sh"
        args    = ["-c", "chmod 777 /volume/"]
      }
      resources {
        cpu    = 200
        memory = 128
      }

      lifecycle {
        hook    = "prestart"
        sidecar = false
      }
    }

    task "redis" {
      driver = "docker"

      config {
        image = "redis:8.6.2-alpine"
        ports = ["redis"]
      }

      volume_mount {
        volume      = "redis"
        destination = "/data"
        read_only   = false
      }

      env {
        # Save settings - save to disk every 60 seconds if at least 1 change
        REDIS_SAVE_TO_DISK = "60 1"
        # Set appendonly for durability
        REDIS_APPENDONLY = "yes"
      }

      service {
        name = "redis"
        port = "redis"

        check {
          type     = "tcp"
          port     = "redis"
          interval = "10s"
          timeout  = "2s"
        }
      }

      resources {
        cpu    = 300
        memory = 128
      }
    }
  }
}

variable "region" {
  type = string
}

variable "shared_dir" {
  type = string
}

================================================
FILE: nomad_jobs/storage-backends/redis/volume.hcl
================================================
id           = "redis-data"
external_id  = "redis-data"
name         = "redis-data"
type         = "csi"
plugin_id    = "org.democratic-csi.iscsi"
capacity_min = "5GiB"
capacity_max = "5GiB"

capability {
  access_mode     = "single-node-writer"
  attachment_mode = "block-device"
}

mount_options {
  fs_type     = "ext4"
  mount_flags = ["noatime", "nodiratime", "data=ordered"]
}

================================================
FILE: nomad_jobs/storage-backends/volumes/nfs-example.hcl
================================================
type = "csi"
id = "example"
name = "example"
plugin_id = "nfsofficial"
external_id = "example"
capability {
  access_mode = "multi-node-multi-writer"
  attachment_mode = "file-system"
}
context {
  server = "192.168.50.208"
  share = "/mnt/pool0/share/example"
  mountPermissions = "0"  
}
mount_options {
  fs_type = "nfs"
  mount_flags = [ "timeo=30", "intr", "vers=3", "_netdev" , "nolock" ]
}


================================================
FILE: nomad_jobs/system/docker-cleanup/nomad.job
================================================
job "docker-cleanup" {
  region = var.region
  datacenters = ["dc1"]
  type = "sysbatch"

  meta {
    job_file = "nomad_jobs/system/docker-cleanup/nomad.job"
    version = "1"
  }

  # Run weekly on Sundays at 2 AM
  periodic {
    crons            = ["0 2 * * 0"]
    prohibit_overlap = true
    time_zone        = "UTC"
  }

  group "cleanup" {
    # sysbatch will automatically run on all eligible nodes

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    task "docker-prune" {
      driver = "raw_exec"
      
      config {
        command = "/bin/bash"
        args    = ["-c", <<EOF
          echo "Starting Docker cleanup on node: ${node.unique.name}"
          echo "Current disk usage:"
          df -h /
          
          echo "Docker system info before cleanup:"
          docker system df
          
          echo "Running docker system prune..."
          # Prune unused containers, networks, images (dangling), and build cache
          docker system prune -f
          
          # Prune unused images (including non-dangling)
          docker image prune -a -f --filter "until=168h"  # Remove images older than 1 week
          
          echo "Docker system info after cleanup:"
          docker system df
          
          echo "Final disk usage:"
          df -h /
          
          echo "Docker cleanup completed on node: ${node.unique.name}"
        EOF
        ]
      }

      resources {
        cpu    = 100
        memory = 128
      }

      # Only run on nodes that have docker command available
      constraint {
        attribute = "${attr.kernel.name}"
        value     = "linux"
      }
    }
  }
}

variable "region" {
  type = string
}

================================================
FILE: nomad_jobs/web-apps/alertmanager-dashboard/nomad.job
================================================
job "alertmanager-dashboard" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/web-apps/alertmanager-dashboard/nomad.job"
version = "1"
  }

  group "ui" {
    count = 1 
    task "alertmanager-dashboard" {
      driver = "docker"
      config {
        image = "lmierzwa/karma:v0.129"
        network_mode = "host"
      }
      env {
        ALERTMANAGER_URI = "http://alertmanager.service.consul:9093"
        HOST = "${NOMAD_IP_http}"
        PORT = "${NOMAD_PORT_http}"
        ALERTMANAGER_PROXY = "true"
      }
      service {
        port = "http"
	      name = "alerts"
        tags = ["net-internal"]
        check {
          type     = "http"
          path     = "/"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 20
        memory = 24
        network {
          port "http" {}
        }
      }
    }
  }
}

variable "region" {
    type = string
}


================================================
FILE: nomad_jobs/web-apps/firecrawl/nomad.job
================================================
job "firecrawl" {
  region      = "global"
  datacenters = ["dc1"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/web-apps/firecrawl/nomad.job" 
    version  = "0.1.2" 
  }

  group "firecrawl" {
    count = 1

    network {
      mode = "host"
      port "http" {
        to     = 3002
      }
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "firecrawl" {
      driver = "docker"

      config {
        image = "mendable/firecrawl:0.1.23" 
        ports = ["http"]
      }

      resources {
        cpu    = 500 # MHz
        memory = 512 # MiB
      }

      env {
        PORT = "3002"
      }

      service {
        name = "firecrawl"
        port = "http"
        tags = ["traefik.enable=true"]

        check {
          type     = "http" # Changed from tcp
          path     = "/"    # Added health check path
          port     = "http"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }
    }
  }
}


================================================
FILE: nomad_jobs/web-apps/heimdall/nomad.job
================================================
job "heimdall" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/web-apps/heimdall/nomad.job"
version = "4"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "downloaders" {
    count = 1 
    network {
      port "http" {
        host_network = "tailscale"
        to = "80"
      }
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "heimdall" {
      driver = "docker"
      config {
        image = "linuxserver/heimdall:2021.11.28"
        ports = ["http"]
        volumes = [
          "${var.shared_dir}heimdall:/config",
        ]
      }

      env {
        TZ = "Etc/UTC"
        PUID = "1000"
        PGID = "1000"
      }

      service {
        port = "http"
	name = "heimdall"
        tags = [
          "traefik.enable=true",
          "traefik.http.middlewares.httpsRedirect.redirectscheme.scheme=https",


          "traefik.http.routers.${NOMAD_TASK_NAME}.tls.domains[0].sans=${NOMAD_TASK_NAME}.${var.tld}",
          "traefik.http.routers.${NOMAD_TASK_NAME}.middlewares=forward-auth",
          "traefik.http.routers.${NOMAD_TASK_NAME}.middlewares=forward-auth"
        ]
        check {
          type     = "http"
          path     = "/"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 100
        memory = 512
      }
    }
  }
}

variable "region" {
    type = string
}


variable "tld" {
    type = string
}

variable "shared_dir" {
    type = string
}


================================================
FILE: nomad_jobs/web-apps/homepage/nomad.job
================================================
job "homepage" {
  region      = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/web-apps/homepage/nomad.job"
    version  = "1"
  }

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "homepage" {
    count = 1

    network {
      port "http" {
        host_network = "tailscale"
        to           = 3000
      }
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "homepage" {
      driver = "docker"
      config {
        image = "ghcr.io/gethomepage/homepage:v1.12.3"
        ports = ["http"]
        volumes = [
          "local/config:/app/config",
        ]
      }

      env {
        TZ                     = "Etc/UTC"
        HOMEPAGE_ALLOWED_HOSTS = "homepage.${var.tld}"
      }

      template {
        data        = <<EOH
---
EOH
        destination = "local/config/settings.yaml"
      }

      template {
        data        = <<EOH
---
- Media:
    - Plex:
        icon: plex.svg
        href: "https://plex.${var.tld}"
        description: Media Server
    - Sonarr:
        icon: sonarr.svg
        href: "https://sonarr.${var.tld}"
        description: TV Shows
    - Radarr:
        icon: radarr.svg
        href: "https://radarr.${var.tld}"
        description: Movies
    - Lidarr:
        icon: lidarr.svg
        href: "https://lidarr.${var.tld}"
        description: Music
    - Overseerr:
        icon: overseerr.svg
        href: "https://overseerr.${var.tld}"
        description: Media Requests
    - Tautulli:
        icon: tautulli.svg
        href: "https://tautulli.${var.tld}"
        description: Plex Statistics

- Downloads:
    - SABnzbd:
        icon: sabnzbd.svg
        href: "https://sabnzbd.${var.tld}"
        description: Usenet
    - qBittorrent:
        icon: qbittorrent.svg
        href: "https://qbittorrent.${var.tld}"
        description: Torrents
    - Prowlarr:
        icon: prowlarr.svg
        href: "https://prowlarr.${var.tld}"
        description: Indexer Manager
    - Jackett:
        icon: jackett.svg
        href: "https://jackett.${var.tld}"
        description: Indexer Proxy
    - Tdarr:
        icon: tdarr.svg
        href: "https://tdarr.${var.tld}"
        description: Media Transcoding
    - Maintainerr:
        icon: maintainerr.svg
        href: "https://maintainerr.${var.tld}"
        description: Media Maintenance

- Personal Cloud:
    - Nextcloud:
        icon: nextcloud.svg
        href: "https://nextcloud.${var.tld}"
        description: Cloud Storage
    - Bitwarden:
        icon: bitwarden.svg
        href: "https://bitwarden.${var.tld}"
        description: Password Manager
    - Actual Budget:
        icon: actual-budget.svg
        href: "https://actualbudget.${var.tld}"
        description: Budget Manager
    - Paperless:
        icon: paperless-ngx.svg
        href: "https://paperless.${var.tld}"
        description: Document Management
    - Ntfy:
        icon: ntfy.svg
        href: "https://ntfy.${var.tld}"
        description: Push Notifications
    - Navidrome:
        icon: navidrome.svg
        href: "https://navidrome.${var.tld}"
        description: Music Streaming

- Music Discovery:
    - Multi-Scrobbler:
        icon: si-lastdotfm
        href: "https://multi-scrobbler.${var.tld}"
        description: Scrobbling Hub
    - Lidify:
        icon: lidarr.svg
        href: "https://lidify.${var.tld}"
        description: Artist Discovery
    - MediaSage:
        icon: si-openai
        href: "https://mediasage.${var.tld}"
        description: AI Playlist Generator

- AI & ML:
    - Open WebUI:
        icon: open-webui.svg
        href: "https://open-webui.${var.tld}"
        description: Chat Interface
    - LiteLLM:
        icon: si-openai
        href: "https://litellm.${var.tld}"
        description: LLM Proxy
    - Manyfold:
        icon: si-threedotjs
        href: "https://manyfold.${var.tld}"
        description: 3D Model Library

- Observability:
    - Grafana:
        icon: grafana.svg
        href: "https://grafana.${var.tld}"
        description: Dashboards
    - Prometheus:
        icon: prometheus.svg
        href: "https://prometheus.${var.tld}"
        description: Metrics
    - Alertmanager:
        icon: alertmanager.svg
        href: "https://alertmanager.${var.tld}"
        description: Alert Routing

- Infrastructure:
    - Traefik:
        icon: traefik.svg
        href: "https://traefik.${var.tld}"
        description: Reverse Proxy
    - Nomad:
        icon: nomad.svg
        href: "http://192.168.50.113:4646"
        description: Workload Orchestrator
    - Consul:
        icon: consul.svg
        href: "http://192.168.50.113:8500"
        description: Service Discovery
    - TrueNAS:
        icon: truenas.svg
        href: "https://192.168.50.208"
        description: Storage

- Smart Home:
    - Home Assistant:
        icon: home-assistant.svg
        href: "https://home-assistant.${var.tld}"
        description: Home Automation
    - Zigbee2MQTT:
        icon: zigbee2mqtt.svg
        href: "https://zigbee2mqtt.${var.tld}"
        description: Zigbee Bridge
EOH
        destination = "local/config/services.yaml"
      }

      template {
        data        = <<EOH
---
- Developer:
    - GitHub:
        icon: github.svg
        href: "https://github.com"
    - ChatGPT:
        icon: openai.svg
        href: "https://chat.openai.com"
    - Claude:
        icon: si-anthropic
        href: "https://claude.ai"
EOH
        destination = "local/config/bookmarks.yaml"
      }

      template {
        data        = <<EOH
---
EOH
        destination = "local/config/widgets.yaml"
      }

      template {
        data        = <<EOH
---
EOH
        destination = "local/config/docker.yaml"
      }

      template {
        data        = <<EOH
---
EOH
        destination = "local/config/kubernetes.yaml"
      }

      service {
        port = "http"
        name = "homepage"
        tags = [
          "traefik.enable=true",
        ]
        check {
          type     = "http"
          path     = "/"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 200
        memory = 256
      }
    }
  }
}

variable "region" {
  type = string
}

variable "shared_dir" {
  type = string
}

variable "tld" {
  type = string
}


================================================
FILE: nomad_jobs/web-apps/kideo/nomad.job
================================================
job "kideo" {
  region      = var.region
  datacenters = ["cheese"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/web-apps/kideo/nomad.job"
    version  = "1"
  }

  group "kideo" {
    count = 1

    constraint {
      attribute = "${attr.unique.hostname}"
      value     = "cheese01"
    }

    network {
      port "http" {
        host_network = "lan"
        to           = "8000"
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel      = 1
      min_healthy_time  = "30s"
      healthy_deadline  = "5m"
      progress_deadline = "10m"
      auto_revert       = true
    }

    task "kideo" {
      driver = "docker"

      config {
        image      = "ghcr.io/perrymanuk/kideo:v0.37"
        ports      = ["http"]
        runtime    = "nvidia"
        privileged = true

        volumes = [
          "${var.shared_dir}kideo:/data",
        ]
      }

      env {
        TZ                      = "Etc/UTC"
        NVIDIA_VISIBLE_DEVICES  = "all"
        KIDEO_POSTGRES_HOST     = "postgres.service.consul"
        KIDEO_POSTGRES_PORT     = "5432"
        KIDEO_POSTGRES_USER     = "postgres"
        KIDEO_POSTGRES_PASSWORD = var.postgres_pass
        KIDEO_POSTGRES_DB       = "kideo"
        KIDEO_JWT_SECRET        = var.kideo_jwt_secret
        KIDEO_VIDEO_DIR         = "/data/videos"
        KIDEO_THUMBNAIL_DIR     = "/data/thumbnails"
        KIDEO_DEFAULT_QUALITY   = "720"
        KIDEO_COOKIES_FILE            = "/data/cookies.txt"
        KIDEO_CURIOSITYSTREAM_USER    = var.kideo_curiositystream_user
        KIDEO_CURIOSITYSTREAM_PASS    = var.kideo_curiositystream_pass
      }

      service {
        port = "http"
        name = "kideo"
        tags = [
          "traefik.enable=true",
        ]
        check {
          type     = "http"
          path     = "/api/health"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 500
        memory = 1024
      }
    }
  }
}

variable "region" {
  type = string
}

variable "shared_dir" {
  type = string
}

variable "postgres_pass" {
  type        = string
  description = "Shared PostgreSQL password"
}

variable "kideo_jwt_secret" {
  type        = string
  description = "JWT signing secret for admin auth"
}

variable "kideo_curiositystream_user" {
  type        = string
  description = "CuriosityStream email"
  default     = ""
}

variable "kideo_curiositystream_pass" {
  type        = string
  description = "CuriosityStream password"
  default     = ""
}


================================================
FILE: nomad_jobs/web-apps/minecraftmath/nomad.job
================================================
job "minecraftmath" {
  region      = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
    job_file = "nomad_jobs/web-apps/minecraftmath/nomad.job"
    version  = "1"
  }

  group "minecraftmath" {
    count = 1

    network {
      port "http" {
        host_network = "lan"
        to           = "8000"
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel      = 1
      min_healthy_time  = "30s"
      healthy_deadline  = "5m"
      progress_deadline = "10m"
      auto_revert       = true
    }

    task "minecraftmath" {
      driver = "docker"

      config {
        image = "ghcr.io/perrymanuk/minecraftmath:v0.7"
        ports = ["http"]
      }

      env {
        TZ                       = "Etc/UTC"
        MCMATH_POSTGRES_HOST     = "postgres.service.consul"
        MCMATH_POSTGRES_PORT     = "5432"
        MCMATH_POSTGRES_USER     = "postgres"
        MCMATH_POSTGRES_PASSWORD = var.postgres_pass
        MCMATH_POSTGRES_DB       = "minecraftmath"
        MCMATH_JWT_SECRET        = var.minecraftmath_jwt_secret
      }

      service {
        port = "http"
        name = "minecraftmath"
        tags = [
          "traefik.enable=true",
        ]
        check {
          type     = "http"
          path     = "/api/health"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }

      resources {
        cpu    = 300
        memory = 256
      }
    }
  }
}

variable "region" {
  type = string
}

variable "postgres_pass" {
  type        = string
  description = "Shared PostgreSQL password"
}

variable "minecraftmath_jwt_secret" {
  type        = string
  description = "JWT signing secret for parent auth"
}


================================================
FILE: nomad_jobs/web-apps/wordpress/nomad.job
================================================
job "wordpress" {
  
  meta {
  job_file = "nomad_jobs/web-apps/wordpress/nomad.job"
  }
region = var.region
  datacenters = ["dc1"]

  constraint {
    attribute = "${meta.shared_mount}"
    operator  = "="
    value     = "true"
  }

  group "database" {
    network {
      port "db" {
        to = 3306
      }
    }

    service {
      name = "wordpress-db"
      port = "db"

      check {
        type     = "tcp"
        port     = "db"
        interval = "10s"
        timeout  = "2s"
      }
    }


    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "mysql" {
      driver = "docker"

      env {
        MYSQL_ROOT_PASSWORD="somewordpress"
        MYSQL_DATABASE="wordpress"
        MYSQL_USER="wordpress"
        MYSQL_PASSWORD="wordpress"
      }

      volume_mount {
        volume      = "wordpress-db"
        destination = "/var/lib/mysql"
      }

      config {
        image = "mysql:9.6"
        volumes = [
          "${var.shared_dir}wordpress-db:/var/lib/mysql",
        ]
      }

      resources {
        cpu    = 500
        memory = 256
      }
    }
  }

  group "wordpress" {
    network {
      port "http" {
        to = 80
      }
    }

    restart {
      attempts = 3
      delay    = "15s"
      interval = "10m"
      mode     = "delay"
    }

    service {
      name = "wordpress"
      tags = ["www"]
      port = "http"

      check {
        type     = "tcp"
        port     = "http"
        interval = "10s"
        timeout  = "2s"
      }
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "await-wordpress" {
      driver = "docker"

      config {
        image        = "alpine:3.23.4"
        command      = "sh"
        args         = ["-c", "echo -n 'Waiting for service'; until nslookup -port=8600 wordpress-db.service.consul ${NOMAD_IP_http} 2>&1 >/dev/null; do echo '.'; sleep 2; done"]
        network_mode = "host"
      }

      resources {
        cpu    = 200
        memory = 128
      }

      lifecycle {
        hook    = "prestart"
        sidecar = false
      }
    }


    update {
      max_parallel     = 1
      min_healthy_time = "30s"
      auto_revert      = true
    }

    task "wordpress" {
      driver = "docker"

      template {
        data = <<EOH
{{- if service "wordpress-db" -}}
{{- with index (service "wordpress-db") 0 -}}
WORDPRESS_DB_HOST={{ .Address }}:{{ .Port }}
{{- end -}}
{{- end }}
WORDPRESS_DB_USER=wordpress
WORDPRESS_DB_PASSWORD=wordpress
WORDPRESS_DB_NAME=wordpress
  EOH

        destination = "local/envvars.txt"
        env = true
      }

      config {
        image = "wordpress:6.9.4"
        ports = ["http"]
      }

      resources {
        cpu    = 500
        memory = 256
      }
    }
  }
}


================================================
FILE: nomad_jobs/web-apps/www/Dockerfile
================================================
FROM nginx
ADD main.jpg /usr/local/www/nginx/images/main.jpg
CMD ["nginx", "-g", "daemon off;"]


================================================
FILE: nomad_jobs/web-apps/www/nomad.job
================================================
job "www" {
  region = var.region
  datacenters = ["dc1"]
  type        = "service"

  meta {
      job_file = "nomad_jobs/web-apps/www/nomad.job"
version = "2"
  }

  group "nginx" {
    count = 1 
    network {
      port "http" {
        host_network = "tailscale"
      }
    }
    task "www" {
      driver = "docker"
      config {
        image = "docker-registry.${var.tld}/www:2"
        network_mode = "host"
        ports = ["http"]
        command = "nginx"
        args = ["-c", "/usr/local/etc/nginx/nginx.conf", "-g", "daemon off;"]
        volumes = [
          "local/index.html:/usr/local/www/nginx/index.html",
          "local/nginx.conf:/usr/local/etc/nginx/nginx.conf",
        ]
      }

      service {
        port = "http"
	name = "www"
        tags = [
          "traefik.enable=true",
          "traefik.http.middlewares.httpsRedirect.redirectscheme.scheme=https",
          "traefik.http.routers.${NOMAD_TASK_NAME}.tls.domains[0].sans=${NOMAD_TASK_NAME}.${var.tld}",
          "traefik.http.routers.${NOMAD_TASK_NAME}.middlewares=forward-auth"
        ]
        check {
          type     = "http"
          path     = "/"
          interval = "10s"
          timeout  = "2s"
          check_restart {
            limit           = 3
            grace           = "60s"
            ignore_warnings = false
          }
        }
      }
      template {
data = <<EOH
worker_processes  1;

#error_log  /var/log/nginx/error.log;

events {
    worker_connections  1024;
}


http {
    access_log /dev/stdout;
    error_log /dev/stderr;
    #include       mime.types;
    default_type  application/octet-stream;

    sendfile        on;
    keepalive_timeout  65;

    server {
        listen       {{ env "NOMAD_PORT_http" }};
        server_name  localhost;

        location / {
            root   /usr/local/www/nginx;
            index  index.html index.htm;
        }

        error_page   500 502 503 504  /50x.html;
        location = /50x.html {
            root   /usr/local/www/nginx-dist;
        }
    }
}
EOH
        destination = "local/nginx.conf"
        env         = false
        perms       = 755
        change_mode = "signal"
        change_signal = "SIGHUP"
        left_delimiter  = "{{"
        right_delimiter = "}}"

      }
      template {
data = <<EOH
<html>
<body bgcolor="#303030">
    <p align=center><img width="50%" src=images/main.jpg></p>
</body>
</html>
EOH
        destination = "local/index.html"
        env         = false
        perms       = 755
        change_mode = "signal"
        change_signal = "SIGHUP"
        left_delimiter  = "{{"
        right_delimiter = "}}"

      }


      resources {
        cpu    = 100
        memory = 128
      }
    }
  }
}

variable "region" {
    type = string
}


variable "tld" {
    type = string
}

variable "shared_dir" {
    type = string
}


================================================
FILE: renovate.json
================================================
{
  "$schema": "https://docs.renovatebot.com/renovate-schema.json",
  "extends": [
    "config:recommended"
  ],
  "dependencyDashboard": true,
  "dependencyDashboardTitle": "🔄 Dependency Dashboard - Homelab Updates",
  "assignees": [
    "perrymanuk"
  ],
  "reviewers": [
    "perrymanuk"
  ],
  "packageRules": [
    {
      "matchPackageNames": [
        "prom/prometheus"
      ],
      "allowedVersions": "/^v[0-9]+\\.[0-9]+\\.[2-9]+$/",
      "automerge": true,
      "ignoreTests": true
    },
    {
      "matchUpdateTypes": [
        "minor",
        "patch",
        "pin",
        "digest"
      ],
      "automerge": true,
      "ignoreTests": true
    },
    {
      "matchPackageNames": [
        "postgres",
        "mariadb",
        "mysql"
      ],
      "matchUpdateTypes": [
        "major"
      ],
      "enabled": false,
      "description": "Block major database version updates - require manual approval",
      "dependencyDashboardApproval": true,
      "prCreation": "approval"
    },
    {
      "versioning": "regex:^(?<compatibility>.*?)-(?<major>\\d+)\\.(?<minor>\\d+)\\.(?<patch>\\d+)$",
      "matchPackageNames": [
        "/^lscr.io\\/linuxserver\\//"
      ]
    },
    {
      "matchPackageNames": [
        "ghcr.io/perrymanuk/radbot"
      ],
      "enabled": false,
      "description": "Managed by radbot CI dispatch workflow"
    }
  ],
  "customManagers": [
    {
      "customType": "regex",
      "managerFilePatterns": [
        "/(^|/)*\\.job$/"
      ],
      "matchStrings": [
        "\\s*image\\s*=\\s*\"(?<depName>.*?)[@:](?<currentValue>.*?)\"\\n"
      ],
      "datasourceTemplate": "docker"
    }
  ]
}


================================================
FILE: services/beefcake.json
================================================
{
  "Service": {
    "Name": "beefcake",
    "ID": "beefcake-instance-1",
    "Address": "192.168.50.208",
    "Port": 80,
    "Check": {
      "HTTP": "http://192.168.50.208:80",
      "Interval": "10s",
      "Timeout": "5s"
    },
    "Tags": ["traefik.enable=true"]
  }
}