[slurm-users] JobState=FAILED Reason=NonZeroExitCode Dependency=(null) ExitCode=1:0

Robert Kudyba rkudyba at fordham.edu
Tue Jul 9 14:30:56 UTC 2019


Following this tutorial:
https://www.brightcomputing.com/blog/bid/174099/slurm-101-basic-slurm-usage-for-linux-clusters
I am trying to run the script below, and it always fails. I've made sure to run
'module load slurm'. What could be wrong? The slurmctld logs look OK:
[2019-07-09T10:19:44.183] prolog_running_decr: Configuration for JobID=402 is complete
[2019-07-09T10:19:44.266] _job_complete: JobID=402 State=0x1 NodeCnt=1 WEXITSTATUS 1
[2019-07-09T10:19:44.266] _job_complete: JobID=402 State=0x8005 NodeCnt=1 done
[2019-07-09T10:21:31.934] _slurm_rpc_submit_batch_job: JobId=403 InitPrio=4294901690 usec=321

cat slurm-job.sh
#!/usr/bin/bash
# Minimal Slurm batch script: prints the working directory and the current
# user, writes one line to a file, then sleeps for a minute.

# Send the job's output to slurm.sh.out (a relative path).
#SBATCH -o slurm.sh.out
# Submit the job to the "defq" partition.
#SBATCH -p defq

# Report the directory the script is executing in and the user it runs as.
echo "In the directory: `pwd`"
echo "As the user: `whoami`"
# Create (or overwrite) analysis.output in the current directory.
echo "write this is a file" > analysis.output
# Pause for 60 seconds before the script ends.
sleep 60

scontrol show job 402
JobId=402 JobName=slurm-job.sh
   UserId=root(0) GroupId=root(0) MCS_label=N/A
   Priority=4294901691 Nice=0 Account=root QOS=normal
   JobState=FAILED Reason=NonZeroExitCode Dependency=(null)
   Requeue=1 Restarts=0 BatchFlag=1 Reboot=0 ExitCode=1:0
   RunTime=00:00:01 TimeLimit=365-00:00:00 TimeMin=N/A
   SubmitTime=2019-07-09T10:19:43 EligibleTime=2019-07-09T10:19:43
   StartTime=2019-07-09T10:19:43 EndTime=2019-07-09T10:19:44 Deadline=N/A
   PreemptTime=None SuspendTime=None SecsPreSuspend=0
   LastSchedEval=2019-07-09T10:19:43
   Partition=defq AllocNode:Sid=ciscluster:349904
   ReqNodeList=(null) ExcNodeList=(null)
   NodeList=node001
   BatchHost=node001
   NumNodes=1 NumCPUs=1 NumTasks=0 CPUs/Task=1 ReqB:S:C:T=0:0:*:*
   TRES=cpu=1,node=1,billing=1
   Socks/Node=* NtasksPerN:B:S:C=0:0:*:* CoreSpec=*
   MinCPUsNode=1 MinMemoryNode=0 MinTmpDiskNode=0
   Features=(null) DelayBoot=00:00:00
   Gres=(null) Reservation=(null)
   OverSubscribe=YES Contiguous=0 Licenses=(null) Network=(null)
   Command=/root/testing/slurm-job.sh
   WorkDir=/root/testing
   StdErr=/root/testing/slurm.sh.out
   StdIn=/dev/null
   StdOut=/root/testing/slurm.sh.out
   Power=
-------------- next part --------------
An HTML attachment was scrubbed...
URL: <http://lists.schedmd.com/pipermail/slurm-users/attachments/20190709/6a89d264/attachment.htm>


More information about the slurm-users mailing list