diff --git a/playbooks/slurm-cluster/templates/slurm.conf b/playbooks/slurm-cluster/templates/slurm.conf index 6136fc16..e280ce48 100644 --- a/playbooks/slurm-cluster/templates/slurm.conf +++ b/playbooks/slurm-cluster/templates/slurm.conf @@ -110,28 +110,27 @@ AccountingStorageEnforce=associations,limits,qos AccountingStorageUser=slurm AccountingStoragePass=/var/run/munge/munge.socket.2 - # COMPUTE NODES GresTypes=gpu -NodeName=dlc-articuno Gres=gpu:nvidia_geforce_rtx_2080_ti:8 CPUs=88 Sockets=2 CoresPerSocket=22 ThreadsPerCore=2 Procs=44 RealMemory=366292 State=UNKNOWN -#NodeName=dlc-jynx Gres=gpu:nvidia_geforce_gtx_titan_x:4 CPUs=12 Sockets=1 CoresPerSocket=6 ThreadsPerCore=2 Procs=6 RealMemory=60990 State=UNKNOWN +NodeName=dlc-articuno Gres=gpu:8 CPUs=88 Sockets=2 CoresPerSocket=22 ThreadsPerCore=2 Procs=44 RealMemory=366292 State=UNKNOWN +#NodeName=dlc-jynx Gres=gpu:4 CPUs=12 Sockets=1 CoresPerSocket=6 ThreadsPerCore=2 Procs=6 RealMemory=60990 State=UNKNOWN #NodeName=dlc-magmar Gres=gpu:4 CPUs=12 Sockets=1 CoresPerSocket=6 ThreadsPerCore=2 Procs=6 RealMemory=244759 State=UNKNOWN -NodeName=dlc-drowzee Gres=gpu:nvidia_geforce_gtx_1080:2 CPUs=12 Sockets=1 CoresPerSocket=6 ThreadsPerCore=2 Procs=6 RealMemory=244768 State=UNKNOWN -NodeName=dlc-groudon Gres=gpu:nvidia_a100-pcie-40gb:2 CPUs=112 Sockets=2 CoresPerSocket=28 ThreadsPerCore=2 Procs=56 RealMemory=367254 State=UNKNOWN +NodeName=dlc-drowzee Gres=gpu:2 CPUs=12 Sockets=1 CoresPerSocket=6 ThreadsPerCore=2 Procs=6 RealMemory=244768 State=UNKNOWN +NodeName=dlc-groudon Gres=gpu:2 CPUs=112 Sockets=2 CoresPerSocket=28 ThreadsPerCore=2 Procs=56 RealMemory=367254 State=UNKNOWN #NodeName=dlc-togepi Gres=gpu:4 CPUs=40 Sockets=2 CoresPerSocket=10 ThreadsPerCore=2 Procs=20 RealMemory=244919 State=UNKNOWN -NodeName=dlc-tyranitar Gres=gpu:nvidia_geforce_rtx_2080_ti:1 CPUs=16 Sockets=1 CoresPerSocket=8 ThreadsPerCore=2 Procs=8 RealMemory=61030 State=UNKNOWN -NodeName=dlc-tornadus Gres=gpu:nvidia_geforce_rtx_3080_ti:8 CPUs=96 Sockets=2 CoresPerSocket=24 ThreadsPerCore=2 Procs=48 RealMemory=489825 State=UNKNOWN -NodeName=dlc-electabuzz Gres=gpu:nvidia_geforce_gtx_titan_x:1 CPUs=20 Sockets=1 CoresPerSocket=10 ThreadsPerCore=2 Procs=10 RealMemory=122284 State=UNKNOWN -NodeName=dlc-scyther Gres=gpu:nvidia_geforce_gtx_titan_x:1 CPUs=12 Sockets=1 CoresPerSocket=6 ThreadsPerCore=2 Procs=6 RealMemory=30430 State=UNKNOWN -NodeName=dlc-venusaur Gres=gpu:nvidia_geforce_gtx_1080_ti:3 CPUs=40 Sockets=2 CoresPerSocket=10 ThreadsPerCore=2 Procs=20 RealMemory=248000 State=UNKNOWN +NodeName=dlc-tyranitar Gres=gpu:1 CPUs=16 Sockets=1 CoresPerSocket=8 ThreadsPerCore=2 Procs=8 RealMemory=61030 State=UNKNOWN +NodeName=dlc-tornadus Gres=gpu:8 CPUs=96 Sockets=2 CoresPerSocket=24 ThreadsPerCore=2 Procs=48 RealMemory=489825 State=UNKNOWN +NodeName=dlc-electabuzz Gres=gpu:1 CPUs=20 Sockets=1 CoresPerSocket=10 ThreadsPerCore=2 Procs=10 RealMemory=122284 State=UNKNOWN +NodeName=dlc-scyther Gres=gpu:1 CPUs=12 Sockets=1 CoresPerSocket=6 ThreadsPerCore=2 Procs=6 RealMemory=30430 State=UNKNOWN +NodeName=dlc-venusaur Gres=gpu:3 CPUs=40 Sockets=2 CoresPerSocket=10 ThreadsPerCore=2 Procs=20 RealMemory=248000 State=UNKNOWN #NodeName=dlc-magneton Gres=gpu:4 CPUs=12 Sockets=1 CoresPerSocket=6 ThreadsPerCore=2 Procs=6 RealMemory=244759 State=UNKNOWN -NodeName=dlc-nidoking Gres=gpu:nvidia_geforce_rtx_2080_ti:8 CPUs=80 Sockets=2 CoresPerSocket=20 ThreadsPerCore=2 Procs=40 RealMemory=244684 State=UNKNOWN +NodeName=dlc-nidoking Gres=gpu:8 CPUs=80 Sockets=2 CoresPerSocket=20 ThreadsPerCore=2 Procs=40 RealMemory=244684 State=UNKNOWN #NodeName=dlc-starmie Gres=gpu:2 CPUs=32 Sockets=1 CoresPerSocket=16 ThreadsPerCore=2 Procs=16 RealMemory=60954 State=UNKNOWN #NodeName=dlc-charizard Gres=gpu:4 CPUs=40 Sockets=2 CoresPerSocket=10 ThreadsPerCore=2 Procs=20 RealMemory=244919 State=UNKNOWN -NodeName=dlc-lugia Gres=gpu:nvidia_geforce_rtx_2080_ti:8 CPUs=88 Sockets=2 CoresPerSocket=22 ThreadsPerCore=2 Procs=44 RealMemory=385572 State=UNKNOWN -NodeName=dlc-moltres Gres=gpu:nvidia_geforce_rtx_2080_ti:8 CPUs=88 Sockets=2 CoresPerSocket=22 ThreadsPerCore=2 Procs=44 RealMemory=256836 State=UNKNOWN -NodeName=dlc-zapdos Gres=gpu:nvidia_geforce_rtx_2080_ti:8 CPUs=88 Sockets=2 CoresPerSocket=22 ThreadsPerCore=2 Procs=44 RealMemory=248000 State=UNKNOWN -NodeName=dlc-meowth Gres=gpu:nvidia_l40s:4 CPUs=96 Sockets=2 CoresPerSocket=24 ThreadsPerCore=2 Procs=48 RealMemory=248000 State=UNKNOWN +NodeName=dlc-lugia Gres=gpu:8 CPUs=88 Sockets=2 CoresPerSocket=22 ThreadsPerCore=2 Procs=44 RealMemory=385572 State=UNKNOWN +NodeName=dlc-moltres Gres=gpu:8 CPUs=88 Sockets=2 CoresPerSocket=22 ThreadsPerCore=2 Procs=44 RealMemory=256836 State=UNKNOWN +NodeName=dlc-zapdos Gres=gpu:8 CPUs=88 Sockets=2 CoresPerSocket=22 ThreadsPerCore=2 Procs=44 RealMemory=248000 State=UNKNOWN +NodeName=dlc-meowth Gres=gpu:4 CPUs=96 Sockets=2 CoresPerSocket=24 ThreadsPerCore=2 Procs=48 RealMemory=248000 State=UNKNOWN # hardcoding the partitions and default memory per node # TODO: automatically define the partitions by resource