#
# /uufs/kingspeak.peaks/sys/var/slurm/slurm.conf for kprm.wasatch.peaks
#
# slurm.conf file generated by configurator.html.
# See the slurm.conf man page for more information.
#
# Layout of this file:
#   1. Controller, authentication, prolog/epilog and daemon paths
#   2. Timers
#   3. Scheduling, preemption and job priority
#   4. Logging and accounting
#   5. Power-save settings (all commented out)
#   6. Compute node definitions, grouped by owner
#   7. Partition definitions, one per owner group plus general/guest
#
# Format: one directive per line. A line starting with '#' is a comment;
# commented-out directives are kept for reference and are not active.
#
ControlMachine=kprm
ControlAddr=kprm
#BackupController=
#BackupAddr=
#
AuthType=auth/munge
CryptoType=crypto/munge
EnforcePartLimits=YES
Epilog=/uufs/kingspeak.peaks/sys/var/slurm/etc/epilog
EpilogSlurmctld=/uufs/kingspeak.peaks/sys/var/slurm/etc/epilog-slurmctld
#FirstJobId=1
#MaxJobId=999999
LaunchType=launch/slurm
MpiDefault=none
PrivateData=cloud
ProctrackType=proctrack/pgid
Prolog=/uufs/kingspeak.peaks/sys/var/slurm/etc/prolog
PrologFlags=Alloc
PrologSlurmctld=/uufs/kingspeak.peaks/sys/var/slurm/etc/prolog-slurmctld
#RebootProgram=
ReturnToService=2
SlurmctldPidFile=/var/run/slurmctld.pid
SlurmctldPort=6817
SlurmdPidFile=/var/run/slurmd.pid
SlurmdPort=6818
SlurmdSpoolDir=/uufs/kingspeak.peaks/sys/var/slurm/slurmd.spool
SlurmUser=slurm
StateSaveLocation=/uufs/kingspeak.peaks/sys/var/slurm/slurm.state
SwitchType=switch/none
TaskPlugin=task/none
# 4-28-15: PLAN TO CHANGE TO AFFINITY WITH PARAM SCHED AFTER FURTHER TESTING FROM MARTIN ON SCRUBPEAK -bdh
#TaskPlugin=task/affinity
#TaskPluginParam=Sched
TreeWidth=64
#
#
# TIMERS
BatchStartTimeout=180
#CompleteWait=0
#EpilogMsgTime=2000
#GetEnvTimeout=2
#HealthCheckInterval=0
#HealthCheckProgram=
InactiveLimit=0
KillWait=60
MessageTimeout=100
#ResvOverRun=0
MinJobAge=300
#OverTimeLimit=0
SlurmctldTimeout=600
SlurmdTimeout=600
#UnkillableStepTimeout=60
#VSizeFactor=0
Waittime=0
#
#
# SCHEDULING
#DefMemPerCPU=0
FastSchedule=1
#MaxMemPerCPU=0
SchedulerType=sched/backfill
SchedulerPort=7321
SelectType=select/linear
SelectTypeParameters=CR_ONE_TASK_PER_CORE
# 4-28-15: PLAN TO CHANGE TO CONS_RES AFTER FURTHER TESTING ON SCRUBPEAK. -bdh
#SelectType=select/cons_res
#SelectTypeParameters=CR_Core,CR_ONE_TASK_PER_CORE
JobRequeue=0
#
#
# PREEMPTION
PreemptMode=CANCEL
PreemptType=preempt/qos
#
#
# JOB PRIORITY
# Time values such as 14-0 use the days-hours form (14 days, 0 hours),
# per the slurm.conf man page.
PriorityFlags=SMALL_RELATIVE_TO_TIME
PriorityType=priority/multifactor
PriorityDecayHalfLife=14-0
PriorityCalcPeriod=5
PriorityFavorSmall=NO
PriorityMaxAge=14-0
PriorityUsageResetPeriod=NONE
PriorityWeightAge=10000
PriorityWeightFairshare=10000
PriorityWeightJobSize=100000
PriorityWeightPartition=0
PriorityWeightQOS=1000000
#
#
# LOGGING AND ACCOUNTING
AccountingStorageEnforce=associations,limits,qos
AccountingStorageHost=slurmdbd.wasatch.peaks
AccountingStoragePort=6819
AccountingStorageType=accounting_storage/slurmdbd
AccountingStoreJobComment=YES
ClusterName=kingspeak
DebugFlags=NO_CONF_HASH
JobCompLoc=/uufs/kingspeak.peaks/sys/var/slurm/log/slurm.job.log
JobCompType=jobcomp/filetxt
JobAcctGatherFrequency=30
JobAcctGatherType=jobacct_gather/none
SlurmctldDebug=5
SlurmdDebug=5
#
#
# "Cloud" ELASTIC & POWER SAVE SUPPORT FOR IDLE NODES (optional)
#SuspendProgram=/uufs/kingspeak.peaks/sys/var/slurm/etc/PowerSaveDown.sh
#ResumeProgram=/uufs/kingspeak.peaks/sys/var/slurm/etc/PowerSaveUp.sh
#SuspendTimeout=120
#ResumeTimeout=600
#ResumeRate=15
#SuspendExcNodes=
#SuspendExcParts=
#SuspendRate=15
#SuspendTime=3600
#
#
# COMPUTE NODES
# Every node below is dual-socket with ThreadsPerCore=1, so
# CPUs = Sockets * CoresPerSocket; the cNN feature tag repeats that core count.
# RealMemory and TmpDisk are in megabytes (per the slurm.conf man page).
TmpFS=/scratch/local
#NodeName=DEFAULT State=CLOUD
NodeName=DEFAULT State=UNKNOWN
#
# CHPC General Nodes
NodeName=kp[001-032] Feature=chpc,c16 Weight=1 NodeAddr=10.242.65.[1-32] Sockets=2 CPUs=16 CoresPerSocket=8 ThreadsPerCore=1 RealMemory=64000 TmpDisk=340000
#
NodeName=kp[110-111,158-167] Feature=chpc,c20 Weight=1 NodeAddr=10.242.65.[110-111,158-167] Sockets=2 CPUs=20 CoresPerSocket=10 ThreadsPerCore=1 RealMemory=64000 TmpDisk=820000
#
NodeName=kp[196-199] Feature=chpc,hadoop,c20 Weight=1 NodeAddr=10.242.65.[196-199] Sockets=2 CPUs=20 CoresPerSocket=10 ThreadsPerCore=1 RealMemory=384000 TmpDisk=19070000
#
# Lin Owner Nodes
NodeName=kp[033-047] Feature=lin,c16 Weight=1 NodeAddr=10.242.65.[33-47] Sockets=2 CPUs=16 CoresPerSocket=8 ThreadsPerCore=1 RealMemory=64000 TmpDisk=340000
#
# ZPu Owner Nodes
NodeName=kp[048-054] Feature=zpu,c16 Weight=1 NodeAddr=10.242.65.[48-54] Sockets=2 CPUs=16 CoresPerSocket=8 ThreadsPerCore=1 RealMemory=64000 TmpDisk=340000
#
# Facelli Owner Nodes
NodeName=kp[055-060] Feature=facelli,c16 Weight=1 NodeAddr=10.242.65.[55-60] Sockets=2 CPUs=16 CoresPerSocket=8 ThreadsPerCore=1 RealMemory=64000 TmpDisk=340000
#
# Frost Owner Nodes
NodeName=kp[061-063] Feature=frost,c16 Weight=1 NodeAddr=10.242.65.[61-63] Sockets=2 CPUs=16 CoresPerSocket=8 ThreadsPerCore=1 RealMemory=64000 TmpDisk=340000
#
# Steele Owner Nodes
NodeName=kp[064-083] Feature=steele,c16 Weight=1 NodeAddr=10.242.65.[64-83] Sockets=2 CPUs=16 CoresPerSocket=8 ThreadsPerCore=1 RealMemory=32000 TmpDisk=1840000
#
# HCI Owner Nodes
NodeName=kp[084-087] Feature=hci,c16 Weight=1 NodeAddr=10.242.65.[84-87] Sockets=2 CPUs=16 CoresPerSocket=8 ThreadsPerCore=1 RealMemory=64000 TmpDisk=340000
#
NodeName=kp[148-151] Feature=hci,c20 Weight=1 NodeAddr=10.242.65.[148-151] Sockets=2 CPUs=20 CoresPerSocket=10 ThreadsPerCore=1 RealMemory=64000 TmpDisk=820000
#
# Molinero Owner Nodes
NodeName=kp[088-091] Feature=molinero,c16 Weight=1 NodeAddr=10.242.65.[88-91] Sockets=2 CPUs=16 CoresPerSocket=8 ThreadsPerCore=1 RealMemory=64000 TmpDisk=340000
#
NodeName=kp[140-147] Feature=molinero,c20 Weight=1 NodeAddr=10.242.65.[140-147] Sockets=2 CPUs=20 CoresPerSocket=10 ThreadsPerCore=1 RealMemory=64000 TmpDisk=820000
#
# Bedrov Owner Nodes
NodeName=kp[092-095] Feature=bedrov,c16 Weight=1 NodeAddr=10.242.65.[92-95] Sockets=2 CPUs=16 CoresPerSocket=8 ThreadsPerCore=1 RealMemory=64000 TmpDisk=340000
#
# Calaf Owner Nodes
NodeName=kp[096-099] Feature=calaf,c20 Weight=1 NodeAddr=10.242.65.[96-99] Sockets=2 CPUs=20 CoresPerSocket=10 ThreadsPerCore=1 RealMemory=128000 TmpDisk=690000
#
# Strong Owner Nodes
NodeName=kp[101-104] Feature=strong,c20 Weight=1 NodeAddr=10.242.65.[101-104] Sockets=2 CPUs=20 CoresPerSocket=10 ThreadsPerCore=1 RealMemory=64000 TmpDisk=820000
#
# Avey Owner Nodes
NodeName=kp105 Feature=avey,c20 Weight=1 NodeAddr=10.242.65.105 Sockets=2 CPUs=20 CoresPerSocket=10 ThreadsPerCore=1 RealMemory=64000 TmpDisk=820000
#
# WJohnson Owner Nodes
NodeName=kp[106-108] Feature=wjohnson,c20 Weight=1 NodeAddr=10.242.65.[106-108] Sockets=2 CPUs=20 CoresPerSocket=10 ThreadsPerCore=1 RealMemory=64000 TmpDisk=820000
#
# SDSS Owner Nodes
NodeName=kp[112-139] Feature=sdss,c16 Weight=1 NodeAddr=10.242.65.[112-139] Sockets=2 CPUs=16 CoresPerSocket=8 ThreadsPerCore=1 RealMemory=64000 TmpDisk=820000
#
# Varley Owner Nodes
NodeName=kp[152-153] Feature=varley,c20 Weight=1 NodeAddr=10.242.65.[152-153] Sockets=2 CPUs=20 CoresPerSocket=10 ThreadsPerCore=1 RealMemory=128000 TmpDisk=690000
#
# Gertz Owner Nodes
NodeName=kp[154-155] Feature=gertz,c20 Weight=1 NodeAddr=10.242.65.[154-155] Sockets=2 CPUs=20 CoresPerSocket=10 ThreadsPerCore=1 RealMemory=128000 TmpDisk=690000
#
# Sigman Owner Nodes
NodeName=kp156 Feature=sigman,c20 Weight=1 NodeAddr=10.242.65.156 Sockets=2 CPUs=20 CoresPerSocket=10 ThreadsPerCore=1 RealMemory=64000 TmpDisk=820000
#
# Lebohec Owner Nodes
NodeName=kp157 Feature=lebohec,c20 Weight=1 NodeAddr=10.242.65.157 Sockets=2 CPUs=20 CoresPerSocket=10 ThreadsPerCore=1 RealMemory=64000 TmpDisk=820000
#
# UCGD Owner Nodes
NodeName=kp[168-195] Feature=ucgd,c20 Weight=1 NodeAddr=10.242.65.[168-195] Sockets=2 CPUs=20 CoresPerSocket=10 ThreadsPerCore=1 RealMemory=128000 TmpDisk=690000
#
NodeName=kp[200-227] Feature=ucgd,c24 Weight=1 NodeAddr=10.242.65.[200-227] Sockets=2 CPUs=24 CoresPerSocket=12 ThreadsPerCore=1 RealMemory=128000 TmpDisk=690000
#
# Tavtigian Owner Nodes
NodeName=kp228 Feature=tavtigian,c24 Weight=1 NodeAddr=10.242.65.228 Sockets=2 CPUs=24 CoresPerSocket=12 ThreadsPerCore=1 RealMemory=128000 TmpDisk=690000
#
# Mason Owner Nodes
NodeName=kp[229-233] Feature=mason,c24 Weight=1 NodeAddr=10.242.65.[229-233] Sockets=2 CPUs=24 CoresPerSocket=12 ThreadsPerCore=1 RealMemory=128000 TmpDisk=3500000
#
#
#
# Partitions
# MaxTime is in minutes (4320 = 3 days, 20160 = 14 days), per the slurm.conf
# man page. MaxNodes on each partition equals the number of nodes it lists.
PartitionName=DEFAULT State=UP
#4-28-15: PLAN TO CHANGE TO 'Shared=exclusive' AFTER FURTHER TESTING OF CONS_RES ON SCRUBPEAK. -bdh
#PartitionName=DEFAULT State=UP Shared=exclusive
#
# KingsPeak General Partition
PartitionName=kingspeak Nodes=kp[001-032,110-111,158-167,196-199] MaxTime=4320 MaxNodes=48 State=UP AllowQos=kingspeak,kingspeak-long Default=YES
#
# KingsPeak Freecycle Partition
PartitionName=kingspeak-freecycle Nodes=kp[001-032,110-111,158-167,196-199] MaxTime=4320 MaxNodes=48 State=UP AllowQos=kingspeak-freecycle
#
# KingsPeak Owner Guest Partition
PartitionName=kingspeak-guest Nodes=kp[033-099,101-108,112-157,168-195,200-233] MaxTime=4320 MaxNodes=183 State=UP AllowAccounts=owner-guest
#
# KingsPeak Lin Owner Partition
PartitionName=lin-kp Nodes=kp[033-047] MaxTime=20160 MaxNodes=15 State=UP AllowAccounts=lin-kp
#
# KingsPeak ZPu Owner Partition
PartitionName=zpu-kp Nodes=kp[048-054] MaxTime=20160 MaxNodes=7 State=UP AllowAccounts=zpu-kp
#
# KingsPeak Facelli Owner Partition
PartitionName=facelli-kp Nodes=kp[055-060] MaxTime=20160 MaxNodes=6 State=UP AllowAccounts=facelli-kp
#
# KingsPeak Frost Owner Partition
PartitionName=frost-kp Nodes=kp[061-063] MaxTime=20160 MaxNodes=3 State=UP AllowAccounts=frost-kp
#
# KingsPeak Steele Owner Partition
PartitionName=steele-kp Nodes=kp[064-083] MaxTime=20160 MaxNodes=20 State=UP AllowAccounts=steele-kp
#
# KingsPeak HCI Owner Partition
PartitionName=hci-kp Nodes=kp[084-087,148-151] MaxTime=20160 MaxNodes=8 State=UP AllowAccounts=hci-kp
#
# KingsPeak Molinero Owner Partition
PartitionName=molinero-kp Nodes=kp[088-091,140-147] MaxTime=20160 MaxNodes=12 State=UP AllowAccounts=molinero-kp
#
# KingsPeak Bedrov Owner Partition
PartitionName=bedrov-kp Nodes=kp[092-095] MaxTime=20160 MaxNodes=4 State=UP AllowAccounts=bedrov-kp
#
# KingsPeak Calaf Owner Partition
PartitionName=calaf-kp Nodes=kp[096-099] MaxTime=20160 MaxNodes=4 State=UP AllowAccounts=calaf-kp
#
# KingsPeak Strong Owner Partition
PartitionName=strong-kp Nodes=kp[101-104] MaxTime=20160 MaxNodes=4 State=UP AllowAccounts=strong-kp
#
# KingsPeak Avey Owner Partition
PartitionName=avey-kp Nodes=kp105 MaxTime=20160 MaxNodes=1 State=UP AllowAccounts=avey-kp
#
# KingsPeak WJohnson Owner Partition
PartitionName=wjohnson-kp Nodes=kp[106-108] MaxTime=20160 MaxNodes=3 State=UP AllowAccounts=wjohnson-kp
#
# KingsPeak SDSS Owner Partition
PartitionName=sdss-kp Nodes=kp[112-139] MaxTime=20160 MaxNodes=28 State=UP AllowAccounts=sdss-kp,sdss-kp-fast
#
# KingsPeak Varley Owner Partition
PartitionName=varley-kp Nodes=kp[152-153] MaxTime=20160 MaxNodes=2 State=UP AllowAccounts=varley-kp,gertz-kp
#
# KingsPeak Gertz Owner Partition
PartitionName=gertz-kp Nodes=kp[154-155] MaxTime=20160 MaxNodes=2 State=UP AllowAccounts=gertz-kp,varley-kp
#
# KingsPeak Sigman Owner Partition
PartitionName=sigman-kp Nodes=kp156 MaxTime=20160 MaxNodes=1 State=UP AllowAccounts=sigman-kp
#
# KingsPeak Lebohec Owner Partition
PartitionName=lebohec-kp Nodes=kp157 MaxTime=20160 MaxNodes=1 State=UP AllowAccounts=lebohec-kp
#
# KingsPeak UCGD Owner Partition
PartitionName=ucgd-kp Nodes=kp[168-195,200-227] MaxTime=20160 MaxNodes=56 State=UP AllowAccounts=ucgd-kp
#
# KingsPeak Tavtigian Owner Partition
PartitionName=tavtigian-kp Nodes=kp228 MaxTime=20160 MaxNodes=1 State=UP AllowAccounts=tavtigian-kp
#
# KingsPeak Mason Owner Partition
PartitionName=mason-kp Nodes=kp[229-233] MaxTime=20160 MaxNodes=5 State=UP AllowAccounts=mason-kp
#
# KingsPeak HCI Owner guest Partition
# NOTE(review): kp228 is also the only node of tavtigian-kp above; presumably
# the overlap is intentional -- confirm.
PartitionName=hci-owner-guest Nodes=kp228 MaxTime=20160 MaxNodes=1 State=UP AllowAccounts=hci-owner-guest
#
#