[slurm-users] systemctl enable slurmd.service Failed to execute operation: No such file or directory

Ole Holm Nielsen Ole.H.Nielsen at fysik.dtu.dk
Thu Jan 27 10:05:06 UTC 2022


Maybe my Slurm Wiki pages will help you get started:
https://wiki.fysik.dtu.dk/niflheim/SLURM

Best regards,
Ole

On 1/27/22 10:53, Nousheen wrote:
> I am installing Slurm on CentOS 7 following this tutorial: 
> https://www.slothparadise.com/how-to-install-slurm-on-centos-7-cluster/ 
> <https://www.slothparadise.com/how-to-install-slurm-on-centos-7-cluster/>
> 
> I am at the step where we start slurm but it gives me the following error:
> 
> [root@exxact slurm-21.08.5]# systemctl enable slurmd.service
> Failed to execute operation: No such file or directory
> 
> I have run the command to check if slurm is configured properly
> 
> [root@exxact slurm-21.08.5]# slurmd -C
> NodeName=exxact CPUs=12 Boards=1 SocketsPerBoard=1 CoresPerSocket=6 
> ThreadsPerCore=2 RealMemory=31889
> UpTime=19-16:06:00
> 
> I am new to this and unable to understand the problem. Kindly help me 
> resolve this.
> 
> My slurm.conf file is as follows:
> 
> # slurm.conf file generated by configurator.html.
> # Put this file on all nodes of your cluster.
> # See the slurm.conf man page for more information.
> #
> ClusterName=cluster194
> SlurmctldHost=192.168.60.194
> #SlurmctldHost=
> #
> #DisableRootJobs=NO
> #EnforcePartLimits=NO
> #Epilog=
> #EpilogSlurmctld=
> #FirstJobId=1
> #MaxJobId=67043328
> #GresTypes=
> #GroupUpdateForce=0
> #GroupUpdateTime=600
> #JobFileAppend=0
> #JobRequeue=1
> #JobSubmitPlugins=lua
> #KillOnBadExit=0
> #LaunchType=launch/slurm
> #Licenses=foo*4,bar
> #MailProg=/bin/mail
> #MaxJobCount=10000
> #MaxStepCount=40000
> #MaxTasksPerNode=512
> MpiDefault=none
> #MpiParams=ports=#-#
> #PluginDir=
> #PlugStackConfig=
> #PrivateData=jobs
> ProctrackType=proctrack/cgroup
> #Prolog=
> #PrologFlags=
> #PrologSlurmctld=
> #PropagatePrioProcess=0
> #PropagateResourceLimits=
> #PropagateResourceLimitsExcept=
> #RebootProgram=
> ReturnToService=1
> SlurmctldPidFile=/var/run/slurmctld.pid
> SlurmctldPort=6817
> SlurmdPidFile=/var/run/slurmd.pid
> SlurmdPort=6818
> SlurmdSpoolDir=/var/spool/slurmd
> SlurmUser=nousheen
> #SlurmdUser=root
> #SrunEpilog=
> #SrunProlog=
> StateSaveLocation=/home/nousheen/Documents/SILICS/slurm-21.08.5/slurmctld
> SwitchType=switch/none
> #TaskEpilog=
> TaskPlugin=task/affinity
> #TaskProlog=
> #TopologyPlugin=topology/tree
> #TmpFS=/tmp
> #TrackWCKey=no
> #TreeWidth=
> #UnkillableStepProgram=
> #UsePAM=0
> #
> #
> # TIMERS
> #BatchStartTimeout=10
> #CompleteWait=0
> #EpilogMsgTime=2000
> #GetEnvTimeout=2
> #HealthCheckInterval=0
> #HealthCheckProgram=
> InactiveLimit=0
> KillWait=30
> #MessageTimeout=10
> #ResvOverRun=0
> MinJobAge=300
> #OverTimeLimit=0
> SlurmctldTimeout=120
> SlurmdTimeout=300
> #UnkillableStepTimeout=60
> #VSizeFactor=0
> Waittime=0
> #
> #
> # SCHEDULING
> #DefMemPerCPU=0
> #MaxMemPerCPU=0
> #SchedulerTimeSlice=30
> SchedulerType=sched/backfill
> SelectType=select/cons_tres
> SelectTypeParameters=CR_Core
> #
> #
> # JOB PRIORITY
> #PriorityFlags=
> #PriorityType=priority/basic
> #PriorityDecayHalfLife=
> #PriorityCalcPeriod=
> #PriorityFavorSmall=
> #PriorityMaxAge=
> #PriorityUsageResetPeriod=
> #PriorityWeightAge=
> #PriorityWeightFairshare=
> #PriorityWeightJobSize=
> #PriorityWeightPartition=
> #PriorityWeightQOS=
> #
> #
> # LOGGING AND ACCOUNTING
> #AccountingStorageEnforce=0
> #AccountingStorageHost=
> #AccountingStoragePass=
> #AccountingStoragePort=
> AccountingStorageType=accounting_storage/none
> #AccountingStorageUser=
> #AccountingStoreFlags=
> #JobCompHost=
> #JobCompLoc=
> #JobCompPass=
> #JobCompPort=
> JobCompType=jobcomp/none
> #JobCompUser=
> #JobContainerType=job_container/none
> JobAcctGatherFrequency=30
> JobAcctGatherType=jobacct_gather/none
> SlurmctldDebug=info
> SlurmctldLogFile=/var/log/slurmctld.log
> SlurmdDebug=info
> SlurmdLogFile=/var/log/slurmd.log
> #SlurmSchedLogFile=
> #SlurmSchedLogLevel=
> #DebugFlags=
> #
> #
> # POWER SAVE SUPPORT FOR IDLE NODES (optional)
> #SuspendProgram=
> #ResumeProgram=
> #SuspendTimeout=
> #ResumeTimeout=
> #ResumeRate=
> #SuspendExcNodes=
> #SuspendExcParts=
> #SuspendRate=
> #SuspendTime=
> #
> #
> # COMPUTE NODES
> NodeName=linux[1-32] CPUs=11 State=UNKNOWN
> PartitionName=debug Nodes=ALL Default=YES MaxTime=INFINITE State=UP



More information about the slurm-users mailing list