File tree Expand file tree Collapse file tree 13 files changed +37
-25
lines changed
inventory/group_vars/selinux
common/inventory/group_vars/all
skeleton/{{cookiecutter.environment}}/terraform Expand file tree Collapse file tree 13 files changed +37
-25
lines changed Original file line number Diff line number Diff line change 44
44
become : true
45
45
- name : Reset ssh connection to allow user changes to affect ansible_user
46
46
meta : reset_connection
47
+ - name : Set dnf releasever
48
+ ansible.builtin.copy :
49
+ dest : /etc/yum/vars/releasever
50
+ content : " {{ releasever }}"
51
+ become : true
47
52
48
53
- hosts : systemd
49
54
become : yes
154
159
sleep : 15
155
160
- name : update facts
156
161
setup :
157
- when : (sestatus.changed | default(false)) or (sestatus.reboot_required | default(false))
162
+ when : (sestatus.changed | default(false)) or (sestatus.reboot_required | default(false))
Original file line number Diff line number Diff line change 4
4
vars :
5
5
sacct_stdout_expected : |- # based on CI running hpctests as the first job - NB note no trailing newline
6
6
JobID,JobName,State
7
- 2 ,pingpong.sh,COMPLETED
8
- 3 ,pingmatrix.sh,COMPLETED
9
- 4 ,hpl-build-linux64.sh,COMPLETED
10
- 5_0 ,hpl-solo.sh,COMPLETED
11
- 5_1 ,hpl-solo.sh,COMPLETED
7
+ 1 ,pingpong.sh,COMPLETED
8
+ 2 ,pingmatrix.sh,COMPLETED
9
+ 3 ,hpl-build-linux64.sh,COMPLETED
10
+ 4_0 ,hpl-solo.sh,COMPLETED
11
+ 4_1 ,hpl-solo.sh,COMPLETED
12
12
tasks :
13
13
- name : Get info for ended jobs
14
14
shell :
Original file line number Diff line number Diff line change 1
1
---
2
2
hpctests_rootdir :
3
- hpctests_pingmatrix_modules : [gnu9 openmpi4]
4
- hpctests_pingpong_modules : [gnu9 openmpi4 imb]
3
+ hpctests_pingmatrix_modules : [gnu12 openmpi4]
4
+ hpctests_pingpong_modules : [gnu12 openmpi4 imb]
5
5
hpctests_pingpong_plot : yes
6
- hpctests_hpl_modules : [gnu9 openmpi4 openblas]
6
+ hpctests_hpl_modules : [gnu12 openmpi4 openblas]
7
7
hpctests_outdir : " {{ lookup('env', 'APPLIANCES_ENVIRONMENT_ROOT') }}/hpctests"
8
8
hpctests_ucx_net_devices : all
9
9
hpctests_hpl_version : " 2.3"
Original file line number Diff line number Diff line change 9
9
# if using PAM auth we need apache installed but NOT started so split the osc.ood role up:
10
10
- include_role :
11
11
name : osc.ood
12
- tasks_from : install-rpm .yml
12
+ tasks_from : install-package .yml
13
13
vars_from : Rocky.yml
14
14
public : yes # Expose the vars from this role to the rest of the play
15
15
# can't set vars: from a dict hence the workaround above
Original file line number Diff line number Diff line change 14
14
tags : install
15
15
yum :
16
16
name :
17
- - turbovnc-2.2.7 # see https://discourse.osc.edu/t/turbovnc-seems-to-no-longer-have-the-nohttpd-option/1856/6 and https://github.com/OSC/ood_core/issues/737
17
+ - turbovnc-3.0.1
18
18
- nmap-ncat
19
19
- python3
20
20
Original file line number Diff line number Diff line change 1
1
flavor = " vm.alaska.cpu.general.small"
2
2
networks = [" a262aabd-e6bf-4440-a155-13dbc1b5db0e" ] # WCDC-iLab-60
3
- source_image_name = " openhpc-221027-1557 .qcow2"
3
+ source_image_name = " openhpc-221118-1422 .qcow2"
4
4
ssh_keypair_name = " slurm-app-ci"
5
5
security_groups = [" default" , " SSH" ]
6
6
ssh_bastion_host = " 128.232.222.183"
Original file line number Diff line number Diff line change
1
+ selinux_state : disabled
Original file line number Diff line number Diff line change @@ -14,6 +14,12 @@ variable "create_nodes" {
14
14
default = true
15
15
}
16
16
17
+ variable "cluster_image" {
18
+ description = " single image for all cluster nodes - a convenience for CI"
19
+ type = string
20
+ default = " openhpc-221118-1422.qcow2" # https://github.com/stackhpc/slurm_image_builder/pull/12
21
+ }
22
+
17
23
module "cluster" {
18
24
source = " ../../skeleton/{{cookiecutter.environment}}/terraform/"
19
25
@@ -24,22 +30,22 @@ module "cluster" {
24
30
key_pair = " slurm-app-ci"
25
31
control_node = {
26
32
flavor: " vm.alaska.cpu.general.small"
27
- image: " openhpc-221027-1557.qcow2 "
33
+ image: var.cluster_image
28
34
}
29
35
login_nodes = {
30
36
login- 0 : {
31
37
flavor: " vm.alaska.cpu.general.small"
32
- image: " openhpc-221027-1557.qcow2 "
38
+ image: var.cluster_image
33
39
}
34
40
}
35
41
compute_types = {
36
42
small: {
37
43
flavor: " vm.alaska.cpu.general.small"
38
- image: " openhpc-221027-1557.qcow2 "
44
+ image: var.cluster_image
39
45
}
40
46
extra: {
41
47
flavor: " vm.alaska.cpu.general.small"
42
- image: " openhpc-221027-1557.qcow2 "
48
+ image: var.cluster_image
43
49
}
44
50
}
45
51
compute_nodes = {
Original file line number Diff line number Diff line change @@ -4,6 +4,7 @@ ansible_user: rocky
4
4
appliances_repository_root : " {{ lookup('env', 'APPLIANCES_REPO_ROOT') }}"
5
5
appliances_environment_root : " {{ lookup('env', 'APPLIANCES_ENVIRONMENT_ROOT') }}"
6
6
# appliances_state_dir: # define an absolute path here to use for persistent state
7
+ releasever : ' 8.6'
7
8
8
9
# Address(ip/dns) for internal communication between services. This is
9
10
# normally traffic you do not want to expose to users.
Original file line number Diff line number Diff line change @@ -19,8 +19,8 @@ openhpc_slurm_partitions:
19
19
- name : " compute"
20
20
openhpc_packages_default :
21
21
- slurm-libpmi-ohpc # to allow intel mpi to work properly
22
- - ohpc-gnu9 -openmpi4-perf-tools # for hpctests
23
- - openblas-gnu9 -ohpc # for hpctests (HPL)
22
+ - ohpc-gnu12 -openmpi4-perf-tools # for hpctests
23
+ - openblas-gnu12 -ohpc # for hpctests (HPL)
24
24
openhpc_packages_extra : []
25
25
openhpc_packages : " {{ openhpc_packages_default + openhpc_packages_extra }}"
26
26
openhpc_munge_key : " {{ vault_openhpc_mungekey | b64decode }}"
Original file line number Diff line number Diff line change 7
7
8
8
# openondemand_servername: '' # Must be defined when using openondemand
9
9
10
+ ondemand_package : ondemand-2.0.29
11
+
10
12
openondemand_dashboard_links : # TODO: should really only be deployed if grafana is deployed and proxying configured
11
13
- name : Grafana
12
14
app_name : grafana
Original file line number Diff line number Diff line change @@ -52,7 +52,7 @@ variable "environment_root" {
52
52
variable "block_device_prefix" {
53
53
type = string
54
54
description = " Prefix for block device names"
55
- default = " vd "
55
+ default = " sd "
56
56
}
57
57
58
58
variable "state_dir" {
Original file line number Diff line number Diff line change 1
1
---
2
2
roles :
3
3
- src : stackhpc.nfs
4
- version : v21.2 .1
4
+ version : v22.9 .1
5
5
- src : https://github.com/stackhpc/ansible-role-openhpc.git
6
6
version : v0.16.0
7
7
name : stackhpc.openhpc
8
8
- src : https://github.com/stackhpc/ansible-node-exporter.git
9
9
version : feature/no-install
10
10
name : cloudalchemy.node_exporter
11
- - src : cloudalchemy.blackbox-exporter
12
- version : 1.0.0
13
11
- src : https://github.com/cloudalchemy/ansible-prometheus.git
14
12
version : 4d2c8d742de39e50387e0aa6d5510b21c7451343 # need fix in preceding commit for rocky
15
13
name : cloudalchemy.prometheus
@@ -18,11 +16,10 @@ roles:
18
16
- src : https://github.com/stackhpc/ansible-grafana.git
19
17
name : cloudalchemy.grafana
20
18
version : service-state
21
- - src : jriguera.configdrive
22
19
# No versions available
23
- - src : https://github.com/OSC /ood-ansible.git
20
+ - src : https://github.com/stackhpc /ood-ansible.git
24
21
name : osc.ood
25
- version : v2.0.5
22
+ version : shpc/releasever # based on v2.0.8
26
23
27
24
collections :
28
25
- name : containers.podman
You can’t perform that action at this time.
0 commit comments