Skip to content

Commit c6596fe

Browse files
committed
Merge branch 'main' into feat/remove-cloud-init
2 parents 895c82a + f47c982 commit c6596fe

File tree

13 files changed

+37
-25
lines changed

13 files changed

+37
-25
lines changed

ansible/bootstrap.yml

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -44,6 +44,11 @@
4444
become: true
4545
- name: Reset ssh connection to allow user changes to affect ansible_user
4646
meta: reset_connection
47+
- name: Set dnf releasever
48+
ansible.builtin.copy:
49+
dest: /etc/yum/vars/releasever
50+
content: "{{ releasever }}"
51+
become: true
4752

4853
- hosts: systemd
4954
become: yes
@@ -154,4 +159,4 @@
154159
sleep: 15
155160
- name: update facts
156161
setup:
157-
when: (sestatus.changed | default(false)) or (sestatus.reboot_required | default(false))
162+
when: (sestatus.changed | default(false)) or (sestatus.reboot_required | default(false))

ansible/ci/check_sacct_hpctests.yml

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -4,11 +4,11 @@
44
vars:
55
sacct_stdout_expected: |- # based on CI running hpctests as the first job - NB note no trailing newline
66
JobID,JobName,State
7-
2,pingpong.sh,COMPLETED
8-
3,pingmatrix.sh,COMPLETED
9-
4,hpl-build-linux64.sh,COMPLETED
10-
5_0,hpl-solo.sh,COMPLETED
11-
5_1,hpl-solo.sh,COMPLETED
7+
1,pingpong.sh,COMPLETED
8+
2,pingmatrix.sh,COMPLETED
9+
3,hpl-build-linux64.sh,COMPLETED
10+
4_0,hpl-solo.sh,COMPLETED
11+
4_1,hpl-solo.sh,COMPLETED
1212
tasks:
1313
- name: Get info for ended jobs
1414
shell:

ansible/roles/hpctests/defaults/main.yml

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,9 +1,9 @@
11
---
22
hpctests_rootdir:
3-
hpctests_pingmatrix_modules: [gnu9 openmpi4]
4-
hpctests_pingpong_modules: [gnu9 openmpi4 imb]
3+
hpctests_pingmatrix_modules: [gnu12 openmpi4]
4+
hpctests_pingpong_modules: [gnu12 openmpi4 imb]
55
hpctests_pingpong_plot: yes
6-
hpctests_hpl_modules: [gnu9 openmpi4 openblas]
6+
hpctests_hpl_modules: [gnu12 openmpi4 openblas]
77
hpctests_outdir: "{{ lookup('env', 'APPLIANCES_ENVIRONMENT_ROOT') }}/hpctests"
88
hpctests_ucx_net_devices: all
99
hpctests_hpl_version: "2.3"

ansible/roles/openondemand/tasks/main.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -9,7 +9,7 @@
99
# if using PAM auth we need apache installed but NOT started so split the osc.ood role up:
1010
- include_role:
1111
name: osc.ood
12-
tasks_from: install-rpm.yml
12+
tasks_from: install-package.yml
1313
vars_from: Rocky.yml
1414
public: yes # Expose the vars from this role to the rest of the play
1515
# can't set vars: from a dict hence the workaround above

ansible/roles/openondemand/tasks/vnc_compute.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@
1414
tags: install
1515
yum:
1616
name:
17-
- turbovnc-2.2.7 # see https://discourse.osc.edu/t/turbovnc-seems-to-no-longer-have-the-nohttpd-option/1856/6 and https://github.com/OSC/ood_core/issues/737
17+
- turbovnc-3.0.1
1818
- nmap-ncat
1919
- python3
2020

environments/arcus/builder.pkrvars.hcl

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
flavor = "vm.alaska.cpu.general.small"
22
networks = ["a262aabd-e6bf-4440-a155-13dbc1b5db0e"] # WCDC-iLab-60
3-
source_image_name = "openhpc-221027-1557.qcow2"
3+
source_image_name = "openhpc-221118-1422.qcow2"
44
ssh_keypair_name = "slurm-app-ci"
55
security_groups = ["default", "SSH"]
66
ssh_bastion_host = "128.232.222.183"
Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1 @@
1+
selinux_state: disabled

environments/arcus/terraform/main.tf

Lines changed: 10 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -14,6 +14,12 @@ variable "create_nodes" {
1414
default = true
1515
}
1616

17+
variable "cluster_image" {
18+
description = "single image for all cluster nodes - a convenience for CI"
19+
type = string
20+
default = "openhpc-221118-1422.qcow2" # https://github.com/stackhpc/slurm_image_builder/pull/12
21+
}
22+
1723
module "cluster" {
1824
source = "../../skeleton/{{cookiecutter.environment}}/terraform/"
1925

@@ -24,22 +30,22 @@ module "cluster" {
2430
key_pair = "slurm-app-ci"
2531
control_node = {
2632
flavor: "vm.alaska.cpu.general.small"
27-
image: "openhpc-221027-1557.qcow2"
33+
image: var.cluster_image
2834
}
2935
login_nodes = {
3036
login-0: {
3137
flavor: "vm.alaska.cpu.general.small"
32-
image: "openhpc-221027-1557.qcow2"
38+
image: var.cluster_image
3339
}
3440
}
3541
compute_types = {
3642
small: {
3743
flavor: "vm.alaska.cpu.general.small"
38-
image: "openhpc-221027-1557.qcow2"
44+
image: var.cluster_image
3945
}
4046
extra: {
4147
flavor: "vm.alaska.cpu.general.small"
42-
image: "openhpc-221027-1557.qcow2"
48+
image: var.cluster_image
4349
}
4450
}
4551
compute_nodes = {

environments/common/inventory/group_vars/all/defaults.yml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -4,6 +4,7 @@ ansible_user: rocky
44
appliances_repository_root: "{{ lookup('env', 'APPLIANCES_REPO_ROOT') }}"
55
appliances_environment_root: "{{ lookup('env', 'APPLIANCES_ENVIRONMENT_ROOT') }}"
66
#appliances_state_dir: # define an absolute path here to use for persistent state
7+
releasever: '8.6'
78

89
# Address(ip/dns) for internal communication between services. This is
910
# normally traffic you do not want to expose to users.

environments/common/inventory/group_vars/all/openhpc.yml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -19,8 +19,8 @@ openhpc_slurm_partitions:
1919
- name: "compute"
2020
openhpc_packages_default:
2121
- slurm-libpmi-ohpc # to allow intel mpi to work properly
22-
- ohpc-gnu9-openmpi4-perf-tools # for hpctests
23-
- openblas-gnu9-ohpc # for hpctests (HPL)
22+
- ohpc-gnu12-openmpi4-perf-tools # for hpctests
23+
- openblas-gnu12-ohpc # for hpctests (HPL)
2424
openhpc_packages_extra: []
2525
openhpc_packages: "{{ openhpc_packages_default + openhpc_packages_extra }}"
2626
openhpc_munge_key: "{{ vault_openhpc_mungekey | b64decode }}"

environments/common/inventory/group_vars/all/openondemand.yml

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -7,6 +7,8 @@
77

88
# openondemand_servername: '' # Must be defined when using openondemand
99

10+
ondemand_package: ondemand-2.0.29
11+
1012
openondemand_dashboard_links: # TODO: should really only be deployed if grafana is deployed and proxying configured
1113
- name: Grafana
1214
app_name: grafana

environments/skeleton/{{cookiecutter.environment}}/terraform/variables.tf

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -52,7 +52,7 @@ variable "environment_root" {
5252
variable "block_device_prefix" {
5353
type = string
5454
description = "Prefix for block device names"
55-
default = "vd"
55+
default = "sd"
5656
}
5757

5858
variable "state_dir" {

requirements.yml

Lines changed: 3 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -1,15 +1,13 @@
11
---
22
roles:
33
- src: stackhpc.nfs
4-
version: v21.2.1
4+
version: v22.9.1
55
- src: https://github.com/stackhpc/ansible-role-openhpc.git
66
version: v0.16.0
77
name: stackhpc.openhpc
88
- src: https://github.com/stackhpc/ansible-node-exporter.git
99
version: feature/no-install
1010
name: cloudalchemy.node_exporter
11-
- src: cloudalchemy.blackbox-exporter
12-
version: 1.0.0
1311
- src: https://github.com/cloudalchemy/ansible-prometheus.git
1412
version: 4d2c8d742de39e50387e0aa6d5510b21c7451343 # need fix in preceding commit for rocky
1513
name: cloudalchemy.prometheus
@@ -18,11 +16,10 @@ roles:
1816
- src: https://github.com/stackhpc/ansible-grafana.git
1917
name: cloudalchemy.grafana
2018
version: service-state
21-
- src: jriguera.configdrive
2219
# No versions available
23-
- src: https://github.com/OSC/ood-ansible.git
20+
- src: https://github.com/stackhpc/ood-ansible.git
2421
name: osc.ood
25-
version: v2.0.5
22+
version: shpc/releasever # based on v2.0.8
2623

2724
collections:
2825
- name: containers.podman

0 commit comments

Comments
 (0)