[slurm-users] JobState=FAILED Reason=NonZeroExitCode Dependency=(null) ExitCode=1:0
Robert Kudyba
rkudyba at fordham.edu
Tue Jul 9 14:30:56 UTC 2019
From this tutorial
https://www.brightcomputing.com/blog/bid/174099/slurm-101-basic-slurm-usage-for-linux-clusters
I am trying to run the script below, and it always fails. I've made sure to run
'module load slurm'. What could be wrong? Logs from slurmctld show ok:
[2019-07-09T10:19:44.183] prolog_running_decr: Configuration for JobID=402 is complete
[2019-07-09T10:19:44.266] _job_complete: JobID=402 State=0x1 NodeCnt=1 WEXITSTATUS 1
[2019-07-09T10:19:44.266] _job_complete: JobID=402 State=0x8005 NodeCnt=1 done
[2019-07-09T10:21:31.934] _slurm_rpc_submit_batch_job: JobId=403 InitPrio=4294901690 usec=321
cat slurm-job.sh
#!/usr/bin/env bash
#SBATCH -o slurm.sh.out
#SBATCH -p defq
#
# Minimal Slurm batch job used to smoke-test job submission.
#   -o slurm.sh.out : file that receives the job's output
#   -p defq         : partition the job is submitted to
# The #SBATCH directives stay directly under the shebang, ahead of the first
# executable command, so that sbatch picks them up.
# bash is resolved through env rather than a fixed /usr/bin/bash path, which
# is not present on every host.

# Report where the job is running and under which account.
echo "In the directory: $(pwd)"
echo "As the user: $(whoami)"

# Write a marker file, relative to the current working directory.
echo "write this is a file" > analysis.output

# Keep the job alive for 60 seconds (presumably so it can be observed in the
# queue while it runs).
sleep 60
scontrol show job 402
JobId=402 JobName=slurm-job.sh
UserId=root(0) GroupId=root(0) MCS_label=N/A
Priority=4294901691 Nice=0 Account=root QOS=normal
JobState=FAILED Reason=NonZeroExitCode Dependency=(null)
Requeue=1 Restarts=0 BatchFlag=1 Reboot=0 ExitCode=1:0
RunTime=00:00:01 TimeLimit=365-00:00:00 TimeMin=N/A
SubmitTime=2019-07-09T10:19:43 EligibleTime=2019-07-09T10:19:43
StartTime=2019-07-09T10:19:43 EndTime=2019-07-09T10:19:44 Deadline=N/A
PreemptTime=None SuspendTime=None SecsPreSuspend=0
LastSchedEval=2019-07-09T10:19:43
Partition=defq AllocNode:Sid=ciscluster:349904
ReqNodeList=(null) ExcNodeList=(null)
NodeList=node001
BatchHost=node001
NumNodes=1 NumCPUs=1 NumTasks=0 CPUs/Task=1 ReqB:S:C:T=0:0:*:*
TRES=cpu=1,node=1,billing=1
Socks/Node=* NtasksPerN:B:S:C=0:0:*:* CoreSpec=*
MinCPUsNode=1 MinMemoryNode=0 MinTmpDiskNode=0
Features=(null) DelayBoot=00:00:00
Gres=(null) Reservation=(null)
OverSubscribe=YES Contiguous=0 Licenses=(null) Network=(null)
Command=/root/testing/slurm-job.sh
WorkDir=/root/testing
StdErr=/root/testing/slurm.sh.out
StdIn=/dev/null
StdOut=/root/testing/slurm.sh.out
Power=
-------------- next part --------------
An HTML attachment was scrubbed...
URL: <http://lists.schedmd.com/pipermail/slurm-users/attachments/20190709/6a89d264/attachment.htm>
More information about the slurm-users
mailing list