File tree Expand file tree Collapse file tree 15 files changed +3
-362
lines changed
environments/common/inventory Expand file tree Collapse file tree 15 files changed +3
-362
lines changed Original file line number Diff line number Diff line change @@ -32,11 +32,11 @@ jobs:
3232 - image_name : openhpc-extra-RL8
3333 source_image_name_key : RL8 # key into environments/.stackhpc/tofu/cluster_image.auto.tfvars.json
3434 inventory_groups : doca,cuda,lustre
35- volume_size : 35 # needed for cuda
35+ volume_size : 30 # needed for cuda
3636 - image_name : openhpc-extra-RL9
3737 source_image_name_key : RL9
3838 inventory_groups : doca,cuda,lustre
39- volume_size : 35 # needed for cuda
39+ volume_size : 30 # needed for cuda
4040 env :
4141 ANSIBLE_FORCE_COLOR : True
4242 OS_CLOUD : openstack
Original file line number Diff line number Diff line change @@ -90,7 +90,5 @@ roles/*
9090! roles /gateway /**
9191! roles /alertmanager /
9292! roles /alertmanager /**
93- ! roles /slurm_recompile /**
94- ! roles /slurm_recompile /**
9593! roles /nhc /
9694! roles /nhc /**
Original file line number Diff line number Diff line change 4848 name : cuda
4949 tasks_from : " {{ 'runtime.yml' if appliances_mode == 'configure' else 'install.yml' }}"
5050
51- - name : Setup vGPU
52- hosts : vgpu
53- become : yes
54- gather_facts : yes
55- tags : vgpu
56- tasks :
57- - include_role :
58- name : stackhpc.linux.vgpu
59- tasks_from : " {{ 'configure.yml' if appliances_mode == 'configure' else 'install.yml' }}"
60- handlers :
61- - name : reboot
62- fail :
63- msg : Reboot handler for stackhpc.linux.vgpu role fired unexpectedly. This was supposed to be unreachable.
64-
6551- name : Persist hostkeys across rebuilds
6652 # Must be after filesystems.yml (for storage)
6753 # and before portal.yml (where OOD login node hostkeys are scanned)
Original file line number Diff line number Diff line change 250250 name : cloudalchemy.grafana
251251 tasks_from : install.yml
252252
253- - name : Add support for NVIDIA GPU auto detection to Slurm
254- hosts : cuda
255- become : yes
256- tasks :
257- - name : Recompile slurm
258- import_role :
259- name : slurm_recompile
260- vars :
261- slurm_recompile_with_nvml : " {{ groups.cuda | length > 0 }}"
262-
263253- name : Run post.yml hook
264254 vars :
265255 appliances_environment_root : " {{ lookup('env', 'APPLIANCES_ENVIRONMENT_ROOT') }}"
Original file line number Diff line number Diff line change @@ -75,7 +75,6 @@ it also requires an image build with the role name added to the
7575| extras.yml | basic_users | All functionality [ 6] | No |
7676| extras.yml | eessi | All functionality [ 7] | No |
7777| extras.yml | cuda | None required - use image build | Yes [ 8] |
78- | extras.yml | vgpu | All functionality | Yes |
7978| extras.yml | persist_hostkeys | Not relevant for compute nodes | n/a |
8079| extras.yml | compute_init (export) | Not relevant for compute nodes | n/a |
8180| extras.yml | k9s (install) | Not relevant during boot | n/a |
Original file line number Diff line number Diff line change 1919 enable_basic_users : " {{ os_metadata.meta.basic_users | default(false) | bool }}"
2020 enable_eessi : " {{ os_metadata.meta.eessi | default(false) | bool }}"
2121 enable_chrony : " {{ os_metadata.meta.chrony | default(false) | bool }}"
22- enable_vgpu : " {{ os_metadata.meta.vpgu | default(false) | bool }}"
2322 enable_nhc : " {{ os_metadata.meta.nhc | default(false) | bool }}"
2423
2524 # TODO: "= role defaults" - could be moved to a vars_file: on play with similar precedence effects
297296 cmd : " cvmfs_config setup"
298297 when : enable_eessi
299298
300- - name : Configure VGPUs
301- include_role :
302- name : stackhpc.linux.vgpu
303- tasks_from : ' configure.yml'
304- when : enable_vgpu
305-
306299 # NB: don't need conditional block on enable_compute as have already exited
307300 # if not the case
308301 - name : Write Munge key
Load Diff This file was deleted.
Load Diff This file was deleted.
Load Diff This file was deleted.
Load Diff This file was deleted.
You can’t perform that action at this time.
0 commit comments