# Put this file on all nodes of your cluster.
# See the slurm.conf man page for more information.
#SlurmctldPort=6817
#SlurmdPort=6818
# TIMERS
#KillWait=30
#MinJobAge=300
#SlurmctldTimeout=120
#SlurmdTimeout=300
#SchedulerPort=7321
# Seconds the scheduler holds off starting additional jobs while any job is
# still in the COMPLETING state. This is not how long a finished job remains
# visible in the queue; that is controlled by MinJobAge.
CompleteWait=60
# User the slurmd (compute node) daemon runs as; root is the default.
# NOTE(review): the earlier comment here described the controller's user,
# which is the separate SlurmUser option and is not set in the visible part
# of this file - confirm which of the two was intended.
SlurmdUser=root
# Host name of the machine running the primary controller (slurmctld).
ControlMachine=cot1
# Host that takes over the controller role if the primary controller fails.
# This is a failover for slurmctld, not an additional place to run jobs.
BackupController=cot2
# No default MPI plugin; a job that needs one selects it itself
# (for example with srun --mpi=...).
MpiDefault=none
# Track the processes of a job by process group ID.
# NOTE(review): processes that change their process group are presumably
# no longer tracked by this plugin - confirm this is acceptable here.
ProctrackType=proctrack/pgid
# A DOWN node returns to service automatically when it registers with a
# valid configuration, but only if it was set DOWN for being non-responsive.
# Nodes set DOWN for any other reason (a failure, low memory, unexpected
# reboot) stay DOWN until an administrator resumes them.
ReturnToService=1
# Authenticate communication between Slurm components with MUNGE.
AuthType=auth/munge
#### SLURM FILE LOCATIONS ####
# PID file of the controller daemon (slurmctld).
# NOTE(review): the file is named "slurmctl.pid", not "slurmctld.pid" -
# confirm that init scripts and monitoring expect this spelling.
SlurmctldPidFile=/var/run/slurmctl.pid
# PID file of the slurmd daemon on each compute node.
SlurmdPidFile=/var/run/slurmd.pid
# Directory where slurmd keeps its state on each compute node.
SlurmdSpoolDir=/var/spool/slurmd
# Directory where the controller saves its state.
# NOTE(review): because a BackupController is configured, this directory
# must be readable and writable by both controller hosts (i.e. on shared
# storage) for failover to recover job state - confirm /var/spool/slurm is
# shared between cot1 and cot2.
StateSaveLocation=/var/spool/slurm
# Log file of the controller daemon.
SlurmctldLogFile=/var/log/slurmctl/controller.log
# Interconnect plugin. No special switch support (e.g. Elan) is needed
# because the cluster uses Ethernet.
SwitchType=switch/none
# Task plugin: none, so there is no special handling of cpu_bind or
# mem_bind requests.
TaskPlugin=task/none
# Schedule using the node definitions in this file. A node that registers
# with fewer resources than configured here is set DOWN.
FastSchedule=1
# Backfill scheduling: augments FIFO (first in, first out) by starting
# lower-priority jobs early when they do not delay higher-priority jobs.
SchedulerType=sched/backfill
# Name of this cluster.
ClusterName=TSRI
# select/linear allocates whole nodes to jobs.
# NOTE(review): the earlier comment here said "each cpu is considered a
# resource", which describes select/cons_res rather than select/linear -
# confirm which behavior is intended.
SelectType=select/linear
### LOGGING AND ACCOUNTING ###
# Write job accounting records to a plain text file.
AccountingStorageType=accounting_storage/filetxt
# File that receives the accounting records. This must be a fully qualified
# path: the previous value (mypath/logging/account_text.txt) was a relative
# placeholder and would resolve against whatever directory the daemon
# happens to run in.
# NOTE(review): adjust to the site's preferred location; the file must be
# writable by the user the controller runs as.
AccountingStorageLoc=/var/log/slurm_jobacct.log
# Per-job usage gathering through the Linux process table. Left disabled;
# the original note says it does not do anything yet.
#JobAcctGatherType=jobacct_gather/linux
#### COMPUTE NODES ####
# On every line CPUs = Sockets * CoresPerSocket * ThreadsPerCore.
#
# RealMemory is expressed in megabytes. The previous values (64, 128, 256)
# declared nodes with only 64-256 MB, so any job asking for a realistic
# amount of memory could not be satisfied. The values below assume the nodes
# have 64 / 128 / 256 GB installed and are set slightly under that size,
# because with FastSchedule=1 a node that registers with less memory than
# configured is set DOWN.
# NOTE(review): confirm the real figures by running "slurmd -C" on one node
# of each type and lower these values if a node reports less.
NodeName=imperial-node[01-10] CPUs=24 RealMemory=64000 Sockets=2 CoresPerSocket=12 ThreadsPerCore=1
NodeName=silver-node[01-28] CPUs=32 RealMemory=128000 Sockets=2 CoresPerSocket=8 ThreadsPerCore=2
# ocean-node01 differs from the other ocean nodes: one thread per core, so
# 16 CPUs instead of 32. The redundant Procs=16 (legacy alias of CPUs) has
# been dropped.
NodeName=ocean-node01 CPUs=16 RealMemory=256000 Sockets=2 CoresPerSocket=8 ThreadsPerCore=1
NodeName=ocean-node[02-05] CPUs=32 RealMemory=256000 Sockets=2 CoresPerSocket=8 ThreadsPerCore=2
NodeName=loma-node[01-10] CPUs=24 RealMemory=64000 Sockets=2 CoresPerSocket=6 ThreadsPerCore=2
#### PARTITIONS ####
# Default partition spanning every compute node. MaxTime is not set on this
# line, so it keeps the Slurm default.
PartitionName=all Nodes=imperial-node[01-10],silver-node[01-28],ocean-node[01-05],loma-node[01-10] Default=YES State=UP
# One non-default partition per node family, each with no time limit.
PartitionName=imperial Nodes=imperial-node[01-10] Default=NO MaxTime=INFINITE State=UP
PartitionName=silver Nodes=silver-node[01-28] Default=NO MaxTime=INFINITE State=UP
PartitionName=ocean Nodes=ocean-node[01-05] Default=NO MaxTime=INFINITE State=UP
PartitionName=loma Nodes=loma-node[01-10] Default=NO MaxTime=INFINITE State=UP