Skip to content

Commit 2eae901

Browse files
authored
Merge pull request #161 from stackhpc/feat/update-slurmconf
Non-functional changes to slurm.conf
2 parents f7e8d1a + b1632fa commit 2eae901

File tree

9 files changed

+267
-93
lines changed

9 files changed

+267
-93
lines changed

.github/workflows/ci.yml

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -25,8 +25,7 @@ jobs:
2525
matrix:
2626
image:
2727
- 'centos:7'
28-
- 'rockylinux:8.6'
29-
- 'rockylinux:8.7'
28+
- 'rockylinux:8.8'
3029
scenario:
3130
- test1
3231
- test1b

files/slurm.conf.ohpc

Lines changed: 160 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,160 @@
1+
#
2+
# Example slurm.conf file. Please run configurator.html
3+
# (in doc/html) to build a configuration file customized
4+
# for your environment.
5+
#
6+
#
7+
# slurm.conf file generated by configurator.html.
8+
# Put this file on all nodes of your cluster.
9+
# See the slurm.conf man page for more information.
10+
#
11+
ClusterName=cluster
12+
SlurmctldHost=linux0
13+
#SlurmctldHost=
14+
#
15+
#DisableRootJobs=NO
16+
#EnforcePartLimits=NO
17+
#Epilog=
18+
#EpilogSlurmctld=
19+
#FirstJobId=1
20+
#MaxJobId=67043328
21+
#GresTypes=
22+
#GroupUpdateForce=0
23+
#GroupUpdateTime=600
24+
#JobFileAppend=0
25+
#JobRequeue=1
26+
#JobSubmitPlugins=lua
27+
#KillOnBadExit=0
28+
#LaunchType=launch/slurm
29+
#Licenses=foo*4,bar
30+
#MailProg=/bin/mail
31+
#MaxJobCount=10000
32+
#MaxStepCount=40000
33+
#MaxTasksPerNode=512
34+
MpiDefault=none
35+
#MpiParams=ports=#-#
36+
#PluginDir=
37+
#PlugStackConfig=
38+
#PrivateData=jobs
39+
ProctrackType=proctrack/cgroup
40+
#Prolog=
41+
#PrologFlags=
42+
#PrologSlurmctld=
43+
#PropagatePrioProcess=0
44+
#PropagateResourceLimits=
45+
#PropagateResourceLimitsExcept=
46+
#RebootProgram=
47+
SlurmctldPidFile=/var/run/slurmctld.pid
48+
SlurmctldPort=6817
49+
SlurmdPidFile=/var/run/slurmd.pid
50+
SlurmdPort=6818
51+
SlurmdSpoolDir=/var/spool/slurmd
52+
SlurmUser=slurm
53+
#SlurmdUser=root
54+
#SrunEpilog=
55+
#SrunProlog=
56+
StateSaveLocation=/var/spool/slurmctld
57+
SwitchType=switch/none
58+
#TaskEpilog=
59+
TaskPlugin=task/affinity
60+
#TaskProlog=
61+
#TopologyPlugin=topology/tree
62+
#TmpFS=/tmp
63+
#TrackWCKey=no
64+
#TreeWidth=
65+
#UnkillableStepProgram=
66+
#UsePAM=0
67+
#
68+
#
69+
# TIMERS
70+
#BatchStartTimeout=10
71+
#CompleteWait=0
72+
#EpilogMsgTime=2000
73+
#GetEnvTimeout=2
74+
#HealthCheckInterval=0
75+
#HealthCheckProgram=
76+
InactiveLimit=0
77+
KillWait=30
78+
#MessageTimeout=10
79+
#ResvOverRun=0
80+
MinJobAge=300
81+
#OverTimeLimit=0
82+
SlurmctldTimeout=120
83+
SlurmdTimeout=300
84+
#UnkillableStepTimeout=60
85+
#VSizeFactor=0
86+
Waittime=0
87+
#
88+
#
89+
# SCHEDULING
90+
#DefMemPerCPU=0
91+
#MaxMemPerCPU=0
92+
#SchedulerTimeSlice=30
93+
SchedulerType=sched/backfill
94+
SelectType=select/cons_tres
95+
SelectTypeParameters=CR_Core
96+
#
97+
#
98+
# JOB PRIORITY
99+
#PriorityFlags=
100+
#PriorityType=priority/basic
101+
#PriorityDecayHalfLife=
102+
#PriorityCalcPeriod=
103+
#PriorityFavorSmall=
104+
#PriorityMaxAge=
105+
#PriorityUsageResetPeriod=
106+
#PriorityWeightAge=
107+
#PriorityWeightFairshare=
108+
#PriorityWeightJobSize=
109+
#PriorityWeightPartition=
110+
#PriorityWeightQOS=
111+
#
112+
#
113+
# LOGGING AND ACCOUNTING
114+
#AccountingStorageEnforce=0
115+
#AccountingStorageHost=
116+
#AccountingStoragePass=
117+
#AccountingStoragePort=
118+
AccountingStorageType=accounting_storage/none
119+
#AccountingStorageUser=
120+
#AccountingStoreFlags=
121+
#JobCompHost=
122+
#JobCompLoc=
123+
#JobCompPass=
124+
#JobCompPort=
125+
JobCompType=jobcomp/none
126+
#JobCompUser=
127+
#JobContainerType=job_container/none
128+
JobAcctGatherFrequency=30
129+
JobAcctGatherType=jobacct_gather/none
130+
SlurmctldDebug=info
131+
SlurmctldLogFile=/var/log/slurmctld.log
132+
SlurmdDebug=info
133+
SlurmdLogFile=/var/log/slurmd.log
134+
#SlurmSchedLogFile=
135+
#SlurmSchedLogLevel=
136+
#DebugFlags=
137+
#
138+
#
139+
# POWER SAVE SUPPORT FOR IDLE NODES (optional)
140+
#SuspendProgram=
141+
#ResumeProgram=
142+
#SuspendTimeout=
143+
#ResumeTimeout=
144+
#ResumeRate=
145+
#SuspendExcNodes=
146+
#SuspendExcParts=
147+
#SuspendRate=
148+
#SuspendTime=
149+
#
150+
#
151+
# COMPUTE NODES
152+
# OpenHPC default configuration
153+
TaskPlugin=task/affinity
154+
PropagateResourceLimitsExcept=MEMLOCK
155+
JobCompType=jobcomp/filetxt
156+
Epilog=/etc/slurm/slurm.epilog.clean
157+
NodeName=c[1-4] Sockets=2 CoresPerSocket=8 ThreadsPerCore=2 State=UNKNOWN
158+
PartitionName=normal Nodes=c[1-4] Default=YES MaxTime=24:00:00 State=UP Oversubscribe=EXCLUSIVE
159+
SlurmctldParameters=enable_configless
160+
ReturnToService=1

molecule/README.md

Lines changed: 2 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -29,10 +29,11 @@ test14 | 1 | N | As for #5 but also tests `extr
2929
Local installation on a RockyLinux 8.x machine looks like:
3030

3131
sudo dnf install -y podman
32+
sudo dnf install -y podman-plugins # required for DNS
3233
sudo yum install -y git
3334
git clone git@github.com:stackhpc/ansible-role-openhpc.git
3435
cd ansible-role-openhpc/
35-
python3.8 -m venv venv
36+
python3.9 -m venv venv
3637
. venv/bin/activate
3738
pip install -U pip
3839
pip install -r molecule/requirements.txt
@@ -44,8 +45,6 @@ Then to run tests, e.g.::
4445
MOLECULE_IMAGE=centos:7 molecule test --all # NB some won't work as require OpenHPC v2.x (-> CentOS 8.x) features - see `.github/workflows/ci.yml`
4546
MOLECULE_IMAGE=rockylinux:8.6 molecule test --all
4647

47-
**NB:** If the host network has an MTU smaller than 1500 (the docker default), check `molecule.yml` for the relevant test contains `DOCKER_MTU`, then prepend `DOCKER_MTU=<mtu>` to your command. If you have already run molecule you will need to destroy the instances and run `docker network prune` before retrying.
48-
4948
During development you may want to:
5049

5150
- See some debugging information by prepending:

molecule/requirements.txt

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,5 @@
11
pip
22
setuptools
3-
molecule[podman,lint,ansible]
3+
molecule[lint,ansible]
4+
molecule-plugins[podman]
45
ansible>=2.9.0

molecule/test12/molecule.yml

Lines changed: 0 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -14,10 +14,6 @@ platforms:
1414
volumes:
1515
- /sys/fs/cgroup:/sys/fs/cgroup:ro
1616
network: net1
17-
docker_networks:
18-
- name: net1
19-
driver_options:
20-
com.docker.network.driver.mtu: ${DOCKER_MTU:-1500} # 1500 is docker default
2117
- name: testohpc-compute-0
2218
image: ${MOLECULE_IMAGE}
2319
pre_build_image: true

molecule/test14/molecule.yml

Lines changed: 0 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -14,10 +14,6 @@ platforms:
1414
volumes:
1515
- /sys/fs/cgroup:/sys/fs/cgroup:ro
1616
network: net1
17-
docker_networks:
18-
- name: net1
19-
driver_options:
20-
com.docker.network.driver.mtu: ${DOCKER_MTU:-1500} # 1500 is docker default
2117
- name: testohpc-compute-0
2218
image: ${MOLECULE_IMAGE}
2319
pre_build_image: true
@@ -30,10 +26,6 @@ platforms:
3026
volumes:
3127
- /sys/fs/cgroup:/sys/fs/cgroup:ro
3228
network: net1
33-
docker_networks:
34-
- name: net1
35-
driver_options:
36-
com.docker.network.driver.mtu: ${DOCKER_MTU:-1500} # 1500 is docker default
3729
- name: testohpc-compute-1
3830
image: ${MOLECULE_IMAGE}
3931
pre_build_image: true
@@ -46,10 +38,6 @@ platforms:
4638
volumes:
4739
- /sys/fs/cgroup:/sys/fs/cgroup:ro
4840
network: net1
49-
docker_networks:
50-
- name: net1
51-
driver_options:
52-
com.docker.network.driver.mtu: ${DOCKER_MTU:-1500} # 1500 is docker default
5341
provisioner:
5442
name: ansible
5543
verifier:

molecule/test5/molecule.yml

Lines changed: 0 additions & 12 deletions
Original file line numberDiff line numberDiff line change
@@ -14,10 +14,6 @@ platforms:
1414
volumes:
1515
- /sys/fs/cgroup:/sys/fs/cgroup:ro
1616
network: net1
17-
docker_networks:
18-
- name: net1
19-
driver_options:
20-
com.docker.network.driver.mtu: ${DOCKER_MTU:-1500} # 1500 is docker default
2117
- name: testohpc-compute-0
2218
image: ${MOLECULE_IMAGE}
2319
pre_build_image: true
@@ -30,10 +26,6 @@ platforms:
3026
volumes:
3127
- /sys/fs/cgroup:/sys/fs/cgroup:ro
3228
network: net1
33-
docker_networks:
34-
- name: net1
35-
driver_options:
36-
com.docker.network.driver.mtu: ${DOCKER_MTU:-1500} # 1500 is docker default
3729
- name: testohpc-compute-1
3830
image: ${MOLECULE_IMAGE}
3931
pre_build_image: true
@@ -46,10 +38,6 @@ platforms:
4638
volumes:
4739
- /sys/fs/cgroup:/sys/fs/cgroup:ro
4840
network: net1
49-
docker_networks:
50-
- name: net1
51-
driver_options:
52-
com.docker.network.driver.mtu: ${DOCKER_MTU:-1500} # 1500 is docker default
5341
provisioner:
5442
name: ansible
5543
verifier:

molecule/test6/molecule.yml

Lines changed: 0 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -14,10 +14,6 @@ platforms:
1414
volumes:
1515
- /sys/fs/cgroup:/sys/fs/cgroup:ro
1616
network: net1
17-
docker_networks:
18-
- name: net1
19-
driver_options:
20-
com.docker.network.driver.mtu: ${DOCKER_MTU:-1500} # 1500 is docker default
2117
provisioner:
2218
name: ansible
2319
inventory:

0 commit comments

Comments
 (0)