MaxRAM=35.8G |
01476962(465151495 Francois Meyer) GroupId=eresearch_hpc_users(1221947160) MCS_label=N/A
Priority=7546 Nice=0 Account=nlpgroup80 QOS=nlpgroup80
JobState=RUNNING Reason=None Dependency=(null)
Requeue=0 Restarts=0 BatchFlag=1 Reboot=0 ExitCode=0:0
DerivedExitCode=0:0
RunTime=01:28:59 TimeLimit=3-00:00:00 TimeMin=N/A
SubmitTime=2026-03-31T08:53:01 EligibleTime=2026-03-31T08:53:01
AccrueTime=2026-03-31T08:53:02
StartTime=2026-03-31T08:53:02 EndTime=2026-04-03T08:53:02 Deadline=N/A
SuspendTime=None SecsPreSuspend=0 LastSchedEval=2026-03-31T08:53:02 Scheduler=Main
Partition=a100 AllocNode:Sid=srvrochpc001:1117295
ReqNodeList=(null) ExcNodeList=(null)
NodeList=srvrocgpu011
BatchHost=srvrocgpu011
NumNodes=1 NumCPUs=4 NumTasks=4 CPUs/Task=1 ReqB:S:C:T=0:0:*:*
ReqTRES=cpu=4,mem=36568M,node=1,billing=8,gres/gpu=1,gres/gpu:ampere80=1
AllocTRES=cpu=4,mem=36568M,node=1,billing=8,gres/gpu=1,gres/gpu:ampere80=1
Socks/Node=* NtasksPerN:B:S:C=0:0:*:* CoreSpec=*
JOB_GRES=gpu:ampere80:1
Nodes=srvrocgpu011 CPU_IDs=3-4,31-32 Mem=36568 GRES=gpu:ampere80:1(IDX:1)
MinCPUsNode=1 MinMemoryCPU=9142M MinTmpDiskNode=0
Features=(null) DelayBoot=00:00:00
OverSubscribe=OK Contiguous=0 Licenses=(null) Network=(null)
Command=/home/01476962/lowgeo/all_ckpt.sh
WorkDir=/home/01476962/lowgeo
StdErr=/home/01476962/lowgeo/debug_ckpt.log
StdIn=/dev/null
StdOut=/home/01476962/lowgeo/debug_ckpt.log
Power=
TresPerNode=gres/gpu:ampere80:1
|
01476962(465151495 Francois Meyer) GroupId=eresearch_hpc_users(1221947160) MCS_label=N/A
Priority=7546 Nice=0 Account=nlpgroup80 QOS=nlpgroup80
JobState=OUT_OF_MEMORY Reason=OutOfMemory Dependency=(null)
Requeue=0 Restarts=0 BatchFlag=1 Reboot=0 ExitCode=0:125
DerivedExitCode=0:0
RunTime=01:29:36 TimeLimit=3-00:00:00 TimeMin=N/A
SubmitTime=2026-03-31T08:53:01 EligibleTime=2026-03-31T08:53:01
AccrueTime=2026-03-31T08:53:02
StartTime=2026-03-31T08:53:02 EndTime=2026-03-31T10:22:38 Deadline=N/A
SuspendTime=None SecsPreSuspend=0 LastSchedEval=2026-03-31T08:53:02 Scheduler=Main
Partition=a100 AllocNode:Sid=srvrochpc001:1117295
ReqNodeList=(null) ExcNodeList=(null)
NodeList=srvrocgpu011
BatchHost=srvrocgpu011
NumNodes=1 NumCPUs=4 NumTasks=4 CPUs/Task=1 ReqB:S:C:T=0:0:*:*
ReqTRES=cpu=4,mem=36568M,node=1,billing=8,gres/gpu=1,gres/gpu:ampere80=1
AllocTRES=cpu=4,mem=36568M,node=1,billing=8,gres/gpu=1,gres/gpu:ampere80=1
Socks/Node=* NtasksPerN:B:S:C=0:0:*:* CoreSpec=*
JOB_GRES=gpu:ampere80:1
Nodes=srvrocgpu011 CPU_IDs=3-4,31-32 Mem=36568 GRES=
MinCPUsNode=1 MinMemoryCPU=9142M MinTmpDiskNode=0
Features=(null) DelayBoot=00:00:00
OverSubscribe=OK Contiguous=0 Licenses=(null) Network=(null)
Command=/home/01476962/lowgeo/all_ckpt.sh
WorkDir=/home/01476962/lowgeo
StdErr=/home/01476962/lowgeo/debug_ckpt.log
StdIn=/dev/null
StdOut=/home/01476962/lowgeo/debug_ckpt.log
Power=
TresPerNode=gres/gpu:ampere80:1
|
01476962(465151495 Francois Meyer) GroupId=eresearch_hpc_users(1221947160) MCS_label=N/A
Priority=7546 Nice=0 Account=nlpgroup80 QOS=nlpgroup80
JobState=OUT_OF_MEMORY Reason=OutOfMemory Dependency=(null)
Requeue=0 Restarts=0 BatchFlag=1 Reboot=0 ExitCode=0:125
DerivedExitCode=0:0
RunTime=01:29:36 TimeLimit=3-00:00:00 TimeMin=N/A
SubmitTime=2026-03-31T08:53:01 EligibleTime=2026-03-31T08:53:01
AccrueTime=2026-03-31T08:53:02
StartTime=2026-03-31T08:53:02 EndTime=2026-03-31T10:22:38 Deadline=N/A
SuspendTime=None SecsPreSuspend=0 LastSchedEval=2026-03-31T08:53:02 Scheduler=Main
Partition=a100 AllocNode:Sid=srvrochpc001:1117295
ReqNodeList=(null) ExcNodeList=(null)
NodeList=srvrocgpu011
BatchHost=srvrocgpu011
NumNodes=1 NumCPUs=4 NumTasks=4 CPUs/Task=1 ReqB:S:C:T=0:0:*:*
ReqTRES=cpu=4,mem=36568M,node=1,billing=8,gres/gpu=1,gres/gpu:ampere80=1
AllocTRES=cpu=4,mem=36568M,node=1,billing=8,gres/gpu=1,gres/gpu:ampere80=1
Socks/Node=* NtasksPerN:B:S:C=0:0:*:* CoreSpec=*
JOB_GRES=gpu:ampere80:1
Nodes=srvrocgpu011 CPU_IDs=3-4,31-32 Mem=36568 GRES=
MinCPUsNode=1 MinMemoryCPU=9142M MinTmpDiskNode=0
Features=(null) DelayBoot=00:00:00
OverSubscribe=OK Contiguous=0 Licenses=(null) Network=(null)
Command=/home/01476962/lowgeo/all_ckpt.sh
WorkDir=/home/01476962/lowgeo
StdErr=/home/01476962/lowgeo/debug_ckpt.log
StdIn=/dev/null
StdOut=/home/01476962/lowgeo/debug_ckpt.log
Power=
TresPerNode=gres/gpu:ampere80:1
|
01476962(465151495 Francois Meyer) GroupId=eresearch_hpc_users(1221947160) MCS_label=N/A
Priority=7546 Nice=0 Account=nlpgroup80 QOS=nlpgroup80
JobState=OUT_OF_MEMORY Reason=OutOfMemory Dependency=(null)
Requeue=0 Restarts=0 BatchFlag=1 Reboot=0 ExitCode=0:125
DerivedExitCode=0:0
RunTime=01:29:36 TimeLimit=3-00:00:00 TimeMin=N/A
SubmitTime=2026-03-31T08:53:01 EligibleTime=2026-03-31T08:53:01
AccrueTime=2026-03-31T08:53:02
StartTime=2026-03-31T08:53:02 EndTime=2026-03-31T10:22:38 Deadline=N/A
SuspendTime=None SecsPreSuspend=0 LastSchedEval=2026-03-31T08:53:02 Scheduler=Main
Partition=a100 AllocNode:Sid=srvrochpc001:1117295
ReqNodeList=(null) ExcNodeList=(null)
NodeList=srvrocgpu011
BatchHost=srvrocgpu011
NumNodes=1 NumCPUs=4 NumTasks=4 CPUs/Task=1 ReqB:S:C:T=0:0:*:*
ReqTRES=cpu=4,mem=36568M,node=1,billing=8,gres/gpu=1,gres/gpu:ampere80=1
AllocTRES=cpu=4,mem=36568M,node=1,billing=8,gres/gpu=1,gres/gpu:ampere80=1
Socks/Node=* NtasksPerN:B:S:C=0:0:*:* CoreSpec=*
JOB_GRES=gpu:ampere80:1
Nodes=srvrocgpu011 CPU_IDs=3-4,31-32 Mem=36568 GRES=
MinCPUsNode=1 MinMemoryCPU=9142M MinTmpDiskNode=0
Features=(null) DelayBoot=00:00:00
OverSubscribe=OK Contiguous=0 Licenses=(null) Network=(null)
Command=/home/01476962/lowgeo/all_ckpt.sh
WorkDir=/home/01476962/lowgeo
StdErr=/home/01476962/lowgeo/debug_ckpt.log
StdIn=/dev/null
StdOut=/home/01476962/lowgeo/debug_ckpt.log
Power=
TresPerNode=gres/gpu:ampere80:1
|
01476962(465151495 Francois Meyer) GroupId=eresearch_hpc_users(1221947160) MCS_label=N/A
Priority=7546 Nice=0 Account=nlpgroup80 QOS=nlpgroup80
JobState=OUT_OF_MEMORY Reason=OutOfMemory Dependency=(null)
Requeue=0 Restarts=0 BatchFlag=1 Reboot=0 ExitCode=0:125
DerivedExitCode=0:0
RunTime=01:29:36 TimeLimit=3-00:00:00 TimeMin=N/A
SubmitTime=2026-03-31T08:53:01 EligibleTime=2026-03-31T08:53:01
AccrueTime=2026-03-31T08:53:02
StartTime=2026-03-31T08:53:02 EndTime=2026-03-31T10:22:38 Deadline=N/A
SuspendTime=None SecsPreSuspend=0 LastSchedEval=2026-03-31T08:53:02 Scheduler=Main
Partition=a100 AllocNode:Sid=srvrochpc001:1117295
ReqNodeList=(null) ExcNodeList=(null)
NodeList=srvrocgpu011
BatchHost=srvrocgpu011
NumNodes=1 NumCPUs=4 NumTasks=4 CPUs/Task=1 ReqB:S:C:T=0:0:*:*
ReqTRES=cpu=4,mem=36568M,node=1,billing=8,gres/gpu=1,gres/gpu:ampere80=1
AllocTRES=cpu=4,mem=36568M,node=1,billing=8,gres/gpu=1,gres/gpu:ampere80=1
Socks/Node=* NtasksPerN:B:S:C=0:0:*:* CoreSpec=*
JOB_GRES=gpu:ampere80:1
Nodes=srvrocgpu011 CPU_IDs=3-4,31-32 Mem=36568 GRES=
MinCPUsNode=1 MinMemoryCPU=9142M MinTmpDiskNode=0
Features=(null) DelayBoot=00:00:00
OverSubscribe=OK Contiguous=0 Licenses=(null) Network=(null)
Command=/home/01476962/lowgeo/all_ckpt.sh
WorkDir=/home/01476962/lowgeo
StdErr=/home/01476962/lowgeo/debug_ckpt.log
StdIn=/dev/null
StdOut=/home/01476962/lowgeo/debug_ckpt.log
Power=
TresPerNode=gres/gpu:ampere80:1
|
01476962(465151495 Francois Meyer) GroupId=eresearch_hpc_users(1221947160) MCS_label=N/A
Priority=7546 Nice=0 Account=nlpgroup80 QOS=nlpgroup80
JobState=OUT_OF_MEMORY Reason=OutOfMemory Dependency=(null)
Requeue=0 Restarts=0 BatchFlag=1 Reboot=0 ExitCode=0:125
DerivedExitCode=0:0
RunTime=01:29:36 TimeLimit=3-00:00:00 TimeMin=N/A
SubmitTime=2026-03-31T08:53:01 EligibleTime=2026-03-31T08:53:01
AccrueTime=2026-03-31T08:53:02
StartTime=2026-03-31T08:53:02 EndTime=2026-03-31T10:22:38 Deadline=N/A
SuspendTime=None SecsPreSuspend=0 LastSchedEval=2026-03-31T08:53:02 Scheduler=Main
Partition=a100 AllocNode:Sid=srvrochpc001:1117295
ReqNodeList=(null) ExcNodeList=(null)
NodeList=srvrocgpu011
BatchHost=srvrocgpu011
NumNodes=1 NumCPUs=4 NumTasks=4 CPUs/Task=1 ReqB:S:C:T=0:0:*:*
ReqTRES=cpu=4,mem=36568M,node=1,billing=8,gres/gpu=1,gres/gpu:ampere80=1
AllocTRES=cpu=4,mem=36568M,node=1,billing=8,gres/gpu=1,gres/gpu:ampere80=1
Socks/Node=* NtasksPerN:B:S:C=0:0:*:* CoreSpec=*
JOB_GRES=gpu:ampere80:1
Nodes=srvrocgpu011 CPU_IDs=3-4,31-32 Mem=36568 GRES=
MinCPUsNode=1 MinMemoryCPU=9142M MinTmpDiskNode=0
Features=(null) DelayBoot=00:00:00
OverSubscribe=OK Contiguous=0 Licenses=(null) Network=(null)
Command=/home/01476962/lowgeo/all_ckpt.sh
WorkDir=/home/01476962/lowgeo
StdErr=/home/01476962/lowgeo/debug_ckpt.log
StdIn=/dev/null
StdOut=/home/01476962/lowgeo/debug_ckpt.log
Power=
TresPerNode=gres/gpu:ampere80:1
|