From 4c4c4da79d516046f2733e0ca9af2f59d0089da9 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Thorsten=20M=C3=BCller?=
Date: Tue, 29 Jun 2021 22:25:09 +0200
Subject: [PATCH] parametric additional partition

---
Reviewer notes (this area is ignored by `git am`):

* What the diff below does: passes a `partitions` list (one entry, `cobald`)
  to the slurm.conf template; the template emits one NodeName line and one
  PartitionName line per entry, with `Port=` only when `port` is set and
  `State=` falling back to UNKNOWN when `initstate` is unset. It also adds
  `CommunicationParameters=NoAddrCache`, drops the stale `# RealMemory=5964`
  comment, and renames the default partition from `debug` to `container`.
* This copy was recovered from a version whose line breaks had been collapsed.
  Line boundaries were re-derived from the hunk headers and the diffstat and
  match them. Leading indentation of context and added lines is a best guess:
  TODO confirm against the target files before applying.

 roles/slurm/tasks/main.yml          |  8 ++++++++
 roles/slurm/templates/slurm.conf.j2 | 16 ++++++++++++++--
 2 files changed, 22 insertions(+), 2 deletions(-)

diff --git a/roles/slurm/tasks/main.yml b/roles/slurm/tasks/main.yml
index d4f1a9d..abbbde5 100644
--- a/roles/slurm/tasks/main.yml
+++ b/roles/slurm/tasks/main.yml
@@ -81,6 +81,14 @@
       - name: "{{ inventory_hostname }}"
         addr: "{{ slurm_network_data.network.IPAM.Config[0].Gateway }}"
     alloc_nodes: "{{ slurm_alloc_nodes_default + extra_nodes | default([])}}"
+    partitions:
+      - name: cobald
+        nodeprefix: drone
+        num_nodes: 10
+        node_cores: 3
+        node_mem: 4900
+        port: 16818
+        initstate: FUTURE
   notify: reconfigure slurm
   tags: slurm-config
 
diff --git a/roles/slurm/templates/slurm.conf.j2 b/roles/slurm/templates/slurm.conf.j2
index 990f0fe..b1feff4 100644
--- a/roles/slurm/templates/slurm.conf.j2
+++ b/roles/slurm/templates/slurm.conf.j2
@@ -9,6 +9,7 @@ ControlMachine=slurm-ctl
 AuthType=auth/munge
 #CheckpointType=checkpoint/none
 CryptoType=crypto/munge
+CommunicationParameters=NoAddrCache
 #DisableRootJobs=NO
 #EnforcePartLimits=NO
 #Epilog=
@@ -166,13 +167,24 @@ SlurmSchedLogFile={{slurm_log_path_sched}}
 NodeName=slurm-exec[1-{{ num_nodes }}] CPUs={{ slurm_exec_node_cores }} {{''
     }} RealMemory={{ slurm_exec_node_mem }} {{''
     }} CoresPerSocket={{ slurm_exec_node_cores }} State=UNKNOWN
-# RealMemory=5964
+{% for p in partitions | default([]) %}
+NodeName={{ p.nodeprefix }}[1-{{ p.num_nodes }}] CPUs={{ p.node_cores }} {{''
+    }} RealMemory={{ p.node_mem }} {{''
+    }} CoresPerSocket={{ p.node_cores }} {{''
+    }} {%- if p.port is defined %} Port={{ p.port}} {% endif %}{{''
+    }} State={{ p.initstate | default('UNKNOWN') }}
+{% endfor %}
 {% for i in alloc_nodes -%}
 NodeName={{i.name}}
   {%- if i.hostname is defined %} NodeHostname={{i.hostname}} {% endif %}
   {%- if i.addr is defined %} NodeAddr={{i.addr}} {% endif %}
   State=UNKNOWN
 {% endfor %}
-PartitionName=debug Nodes=slurm-exec[1-{{num_nodes}}] {{ ''
+PartitionName=container Nodes=slurm-exec[1-{{num_nodes}}] {{ ''
   }} AllocNodes={{alloc_nodes |map(attribute='name') | join(',')}} {{ ''
   }} Default=YES MaxTime=INFINITE State=UP
+{% for p in partitions | default([]) %}
+PartitionName={{ p.name }} Nodes={{ p.nodeprefix }}[1-{{ p.num_nodes }}] {{ ''
+    }} AllocNodes={{alloc_nodes |map(attribute='name') | join(',')}} {{ ''
+    }} MaxTime=INFINITE State=UP
+{% endfor %}