homelab-nomad/ansible_playbooks/setup-cluster.yml

365 lines
9.4 KiB
YAML
Raw Permalink Normal View History

2022-02-16 17:56:18 +00:00
---
# Adds a nameserver entry for a DNS host that is not part of the Nomad
# cluster to /etc/resolv.conf on every host in nomad_instances.
- name: Update DNS for bootstrapping with non-Nomad host
  hosts: nomad_instances
  gather_facts: false
  become: true

  vars:
    # Address written into the "nameserver" line below.
    non_nomad_dns: "192.168.2.170"

  tasks:
    - name: Add non-nomad bootstrap DNS
      ansible.builtin.lineinfile:
        path: /etc/resolv.conf
        line: "nameserver {{ non_nomad_dns }}"
        # Create the file when it does not exist yet.
        create: true
# Installs Docker on the Nomad client hosts through the geerlingguy.docker
# role, then removes the snapd package.
- name: Install Docker
  hosts: nomad_clients
  become: true

  vars:
    # Lookup table from the ansible_architecture fact to the architecture
    # name handed to the role as docker_apt_arch.
    docker_architecture_map:
      x86_64: amd64
      armv7l: armhf
      aarch64: arm64
    docker_apt_arch: "{{ docker_architecture_map[ansible_architecture] }}"
    # armv7l is renamed to armv7; every other architecture is passed through.
    docker_compose_arch: "{{ (ansible_architecture == 'armv7l') | ternary('armv7', ansible_architecture) }}"

  # Roles are applied before the tasks section of the play.
  roles:
    - role: geerlingguy.docker

  tasks:
    - name: Remove snapd
      ansible.builtin.package:
        name: snapd
        state: absent
# Not on Ubuntu 20.04
# - name: Install Podman
#   hosts: nomad_instances
#   become: true
#
#   tasks:
#     - name: Install Podman
#       package:
#         name: podman
#         state: present
# Installs the NFS client package on the Nomad client hosts and mounts the
# shared NFS exports, plus any additional mounts a host defines in nfs_mounts.
- name: Create NFS mounts
  hosts: nomad_clients
  become: true

  vars:
    # Mounts applied to every client. Each entry carries the export (src),
    # the local mount point (path) and the mount options (opts).
    shared_nfs_mounts:
      - path: /srv/volumes/media-read
        src: "192.168.2.10:/Media"
        opts: "proto=tcp,port=2049,ro"
      - path: /srv/volumes/media-write
        src: "192.168.2.10:/Media"
        opts: "proto=tcp,port=2049,rw"
      - path: /srv/volumes/photos
        src: "192.168.2.10:/Photos"
        opts: "proto=tcp,port=2049,rw"
      - path: /srv/volumes/nas-container
        src: "192.168.2.10:/Container"
        opts: "proto=tcp,port=2049,rw"

  tasks:
    - name: Install nfs
      ansible.builtin.package:
        name: nfs-common
        state: present

    - name: Mount NFS volumes
      ansible.posix.mount:
        path: "{{ item.path }}"
        src: "{{ item.src }}"
        fstype: nfs4
        opts: "{{ item.opts }}"
        state: mounted
      # nfs_mounts is optional; hosts that do not define it only get the
      # shared mounts.
      loop: "{{ shared_nfs_mounts + (nfs_mounts | default([])) }}"
2022-08-30 22:14:55 +00:00
2023-03-24 05:08:20 +00:00
# Pull in the plays from wesher.yml at this point of the playbook.
- ansible.builtin.import_playbook: wesher.yml
2022-02-17 22:03:42 +00:00
# Applies the ansible-nomad role to every host in nomad_instances. Any
# failure on one host aborts the play for all hosts (any_errors_fatal).
- name: Build Nomad cluster
  hosts: nomad_instances
  become: true
  any_errors_fatal: true

  vars:
    # Host volumes declared on every node; merged with the per-node
    # nomad_unique_host_volumes list in the role vars below.
    shared_host_volumes:
      # NOTE(review): this volume uses the media-write path and relies on
      # read_only: true for protection - confirm that this is intentional.
      - name: media-read
        path: /srv/volumes/media-write
        read_only: true
      - name: media-write
        path: /srv/volumes/media-write
        owner: "root"
        group: "root"
        mode: "0755"
        read_only: false
      - name: media-downloads
        path: /srv/volumes/media-write/Downloads
        read_only: false
      - name: sabnzbd-config
        path: /srv/volumes/media-write/Downloads/sabnzbd
        read_only: false
      - name: photoprism-media
        path: /srv/volumes/photos/Photoprism
        read_only: false
      - name: photoprism-storage
        path: /srv/volumes/nas-container/photoprism
        read_only: false
      - name: nzbget-config
        path: /srv/volumes/nas-container/nzbget
        read_only: false
      - name: sonarr-config
        path: /srv/volumes/nas-container/sonarr
        read_only: false
      - name: lidarr-config
        path: /srv/volumes/nas-container/lidarr
        read_only: false
      - name: radarr-config
        path: /srv/volumes/nas-container/radarr
        read_only: false
      - name: bazarr-config
        path: /srv/volumes/nas-container/bazarr
        read_only: false
      - name: gitea-data
        path: /srv/volumes/nas-container/gitea
        read_only: false
      - name: all-volumes
        path: /srv/volumes
        owner: "root"
        group: "root"
        mode: "0755"
        read_only: false

  roles:
    - role: ansible-nomad
      vars:
        nomad_version: "1.7.6-1"
        nomad_install_upgrade: true
        nomad_allow_purge_config: true
        # "both" for hosts in nomad_clients and nomad_servers, "client" for
        # hosts only in nomad_clients, "server" for everything else.
        nomad_node_role: "{% if 'nomad_clients' in group_names %}{% if 'nomad_servers' in group_names %}both{% else %}client{% endif %}{% else %}server{% endif %}"

        # Where nomad gets installed to
        nomad_bin_dir: /usr/bin
        nomad_install_from_repo: true

        # Number of hosts in this play, capped at 3.
        # NOTE(review): the play targets nomad_instances, so this counts
        # every host in the play, not only servers - confirm.
        nomad_bootstrap_expect: "{{ [(play_hosts | length), 3] | min }}"
        nomad_raft_protocol: 3

        nomad_autopilot: true
        nomad_encrypt_enable: true
        # nomad_use_consul: true

        # Metrics
        nomad_telemetry: true
        nomad_telemetry_prometheus_metrics: true
        nomad_telemetry_publish_allocation_metrics: true
        nomad_telemetry_publish_node_metrics: true

        # Enable container plugins
        nomad_cni_enable: true
        nomad_cni_version: "1.0.1"
        nomad_docker_enable: true
        nomad_docker_dmsetup: false
        # nomad_podman_enable: true

        # Merge shared host volumes with node volumes
        nomad_host_volumes: "{{ shared_host_volumes + (nomad_unique_host_volumes | default([])) }}"

        # Customize docker plugin
        nomad_plugins:
          docker:
            config:
              allow_privileged: true
              gc:
                image_delay: "24h"
              volumes:
                enabled: true
                selinuxlabel: "z"
              # Send logs to journald so we can scrape them for Loki
              # logging:
              #   type: journald
              extra_labels:
                - "job_name"
                - "job_id"
                - "task_group_name"
                - "task_name"
                - "namespace"
                - "node_name"
                - "node_id"

        # Bind nomad
        nomad_bind_address: "0.0.0.0"

        # Default interface for binding tasks
        # This is now set at the inventory level
        # nomad_network_interface: eth0

        # Create networks for binding task ports
        nomad_host_networks:
          - name: loopback
            interface: lo
            reserved_ports: "22"
          - name: wesher
            interface: wgoverlay
            reserved_ports: "22"

        # Enable ACLs
        nomad_acl_enabled: true

        nomad_config_custom:
          ui:
            enabled: true
2022-09-28 04:28:02 +00:00
# Bootstraps the Nomad ACL system on the server hosts, stores the resulting
# bootstrap token on the control machine, applies the anonymous policy and
# turns on service/system scheduler preemption when it is not yet enabled.
- name: Bootstrap Nomad ACLs and scheduler
  hosts: nomad_servers

  tasks:
    - name: Start Nomad
      ansible.builtin.systemd:
        name: nomad
        state: started

    # Poll the local HTTP API until it answers 200, up to 8 attempts that are
    # 15 seconds apart.
    - name: Nomad API reachable?
      ansible.builtin.uri:
        url: "http://127.0.0.1:4646/v1/status/leader"
        method: GET
        status_code: 200
      register: nomad_check_result
      retries: 8
      until: nomad_check_result is succeeded
      delay: 15
      changed_when: false
      run_once: true

    # A failure is tolerated here (ignore_errors) so that the play continues
    # and reads the token from the previously saved file instead.
    - name: Bootstrap ACLs
      ansible.builtin.command:
        argv:
          - "nomad"
          - "acl"
          - "bootstrap"
          - "-json"
      run_once: true
      ignore_errors: true
      register: bootstrap_result
      changed_when: bootstrap_result is succeeded

    - name: Save bootstrap result
      ansible.builtin.copy:
        content: "{{ bootstrap_result.stdout }}"
        dest: "../nomad_bootstrap.json"
        # The file contains the bootstrap token's SecretID; keep it private
        # to the user running the playbook.
        mode: "0600"
      when: bootstrap_result is succeeded
      delegate_to: localhost
      run_once: true

    # Extract the SecretID from the saved bootstrap output on the control
    # machine. no_log keeps the token out of the task output.
    - name: Read secret
      ansible.builtin.command:
        argv:
          - jq
          - -r
          - .SecretID
          - ../nomad_bootstrap.json
      delegate_to: localhost
      run_once: true
      no_log: true
      changed_when: false
      register: read_secretid

    - name: Look for policy
      ansible.builtin.command:
        argv:
          - nomad
          - acl
          - policy
          - list
      environment:
        NOMAD_TOKEN: "{{ read_secretid.stdout }}"
      register: policies
      run_once: true
      changed_when: false

    - name: Copy policy
      ansible.builtin.copy:
        src: ../acls/nomad-anon-policy.hcl
        dest: /tmp/anonymous.policy.hcl
      delegate_to: "{{ play_hosts[0] }}"
      run_once: true
      register: anon_policy

    # Applied when no policy exists yet or when the policy file changed.
    - name: Create anon-policy
      ansible.builtin.command:
        argv:
          - nomad
          - acl
          - policy
          - apply
          # argv entries are passed to the program verbatim, without a shell,
          # so the value must not be wrapped in extra quote characters.
          - "-description=Anon read only"
          - anonymous
          - /tmp/anonymous.policy.hcl
      environment:
        NOMAD_TOKEN: "{{ read_secretid.stdout }}"
      when: policies.stdout == "No policies found" or anon_policy.changed
      delegate_to: "{{ play_hosts[0] }}"
      run_once: true

    - name: Read scheduler config
      ansible.builtin.command:
        argv:
          - nomad
          - operator
          - scheduler
          - get-config
          - -json
      # Authenticate like the other nomad CLI calls in this play, so the read
      # does not depend on what the anonymous policy happens to allow.
      environment:
        NOMAD_TOKEN: "{{ read_secretid.stdout }}"
      run_once: true
      register: scheduler_config
      changed_when: false

    - name: Enable service scheduler preemption
      ansible.builtin.command:
        argv:
          - nomad
          - operator
          - scheduler
          - set-config
          - -preempt-service-scheduler=true
      environment:
        NOMAD_TOKEN: "{{ read_secretid.stdout }}"
      run_once: true
      when: (scheduler_config.stdout | from_json)["SchedulerConfig"]["PreemptionConfig"]["ServiceSchedulerEnabled"] is false

    - name: Enable system scheduler preemption
      ansible.builtin.command:
        argv:
          - nomad
          - operator
          - scheduler
          - set-config
          - -preempt-system-scheduler=true
      environment:
        NOMAD_TOKEN: "{{ read_secretid.stdout }}"
      run_once: true
      when: (scheduler_config.stdout | from_json)["SchedulerConfig"]["PreemptionConfig"]["SystemSchedulerEnabled"] is false

    # - name: Set up Nomad backend and roles in Vault
    #   community.general.terraform:
    #     project_path: ../acls
    #     force_init: true
    #     variables:
    #       consul_address: "{{ play_hosts[0] }}:8500"
    #       vault_token: "{{ root_token }}"
    #       nomad_secret_id: "{{ read_secretid.stdout }}"
    #   delegate_to: localhost
    #   run_once: true
    #   notify:
    #     - Restart Nomad

  handlers:
    # Only referenced by the commented-out Vault task above.
    - name: Restart Nomad
      ansible.builtin.systemd:
        name: nomad
        state: restarted
      retries: 6
      delay: 5