|
老师您好,我尝试了这四种设置,结果是能提交任务但是都不能排队,您知道是什么原因吗?附件是我slurm.conf文件,麻烦您看一下。
#slurm.conf file generated by configurator easy.html.
# Put this file on all nodes of your cluster.
# See the slurm.conf man page for more information.
#
#ControlAddr=
SlurmctldHost=node0
#DebugFlags=NO_CONF_HASH
#
#MailProg=/bin/mail
MpiDefault=none
#MpiParams=ports=#-#
ProctrackType=proctrack/cgroup
ReturnToService=2
SlurmctldPidFile=/var/run/slurmctld.pid
SlurmctldPort=6817
SlurmdPidFile=/var/run/slurmd.pid
SlurmdPort=6818
SlurmdSpoolDir=/var/spool/slurm/slurmd
SlurmUser=slurm
#SlurmdUser=root
#SlurmdUser=
StateSaveLocation=/var/spool/slurm/
SwitchType=switch/none
TaskPlugin=task/cgroup
#TaskPlugin=task/affinity
#
#
# TIMERS
KillWait=30
MinJobAge=300
SlurmctldTimeout=120
SlurmdTimeout=300
InactiveLimit=0
WaitTime=0
#
#
# SCHEDULING
SchedulerType=sched/backfill
#SelectType=select/cons_res
SelectType=select/cons_tres
#SelectTypeParameters=CR_CPU_memory
#SelectTypeParameters=CR_CPU
SelectTypeParameters=CR_Core_memory
DefMemPerCPU=6000
#SelectTypeParameters=CR_Core
#
#
# LOGGING AND ACCOUNTING
#AccountingStorageType=accounting_storage/slurmdbd
#AccountingStoreFlags=JobComment
#AccountingStorageEnforce=associations,limits,qos
#AccountingStoragePass=/var/run/munge/munge.socket.2
#AccountingStorageHost=node0
AccountingStoragePort=6819
ClusterName=cluster
#JobAcctGatherFrequency=30
JobAcctGatherType=jobacct_gather/none
SlurmctldDebug=info
SlurmctldLogFile=/var/log/slurmctld.log
SlurmdDebug=info
SlurmdLogFile=/var/log/slurmd.log
AllowSpecResourcesUsage=YES
#
#
# COMPUTE NODES
# NodeName=clustermaster CPUs=144 Boards=1 SocketsPerBoard=2 CoresPerSocket=36 ThreadsPerCore=2 RealMemory=515457
NodeName=node0 CPUs=144 Boards=1 SocketsPerBoard=2 CoresPerSocket=36 ThreadsPerCore=2 RealMemory=488448 Procs=2 State=IDLE
NodeName=node1 CPUs=144 Boards=1 SocketsPerBoard=2 CoresPerSocket=36 ThreadsPerCore=2 RealMemory=253952 Procs=2 State=IDLE
NodeName=node2 CPUs=144 Boards=1 SocketsPerBoard=2 CoresPerSocket=36 ThreadsPerCore=2 RealMemory=252928 procs=2 State=IDLE
NodeName=node3 CPUs=144 Boards=1 SocketsPerBoard=2 CoresPerSocket=36 ThreadsPerCore=2 RealMemory=252928 Procs=2 State=IDLE
NodeName=node4 CPUs=128 Boards=1 SocketsPerBoard=2 CoresPerSocket=32 ThreadsPerCore=2 RealMemory=498688 Procs=2 State=IDLE
PartitionName=test Nodes=node[0-4] Default=YES MaxTime=INFINITE State=UP OverSubscribe=NO
# PartitionName=test Nodes=192.168.1.243,linux[1-32] Default=YES MaxTime=INFINITE State=UP
# DefMemPerNode=1000
# MaxMemPerNode=1000
# DefMemPerCPU=4000
# MaxMemPerCPU=4096
|
|