University of Cape Town
UCT High Performance Computing SLURM Cluster

Blog       UCT-HPC       Citations       Contact us       Help
Wed Jun 28 22:40:01 SAST 2017

CLUSTER LOAD Hold mouse over bars and indicators for more info. Lamp status
Partitions   
ucthi   uctlo
ucthimem
uctlomem

400

12

401

0

402

0

406

0

407

6

408

3

409

0

410

0

411

0

412

0

413

0

414

0

415

0

416

0

417

0

418

0
Disk space:
 / = 10% of 96G
/home = 79% of 504G
/scratch = 76% of 24T
Users logged in: rndroj001

Head Node load: 0.03     Head Node RAM free: 98%
Currently computing: 80 hours     Jobs running: 4     Jobs queued: 0
Efficiency: 56%    System overview    Queue accounting    Graphs

JOBS RUNNING
#  JOBID PARTITION              NAME     USER  ACCOUNT      STATE       TIME  CPUS  NODES     NODELIST(REASON)      QOS PRIORITY     CPU TIME
-----------------------------------------------------------------------------------------------------------------------------------------------
1   2108  ucthimem             48p008 arossgil    maths    RUNNING    6:27:37     3      1         srvcnthpc407   normal    10041     19:22:54
2   2109  ucthimem             48p006 arossgil    maths    RUNNING    6:26:26     3      1         srvcnthpc407   normal    10041     19:19:21
3   2110  ucthimem             48p004 arossgil    maths    RUNNING    6:25:43     3      1         srvcnthpc408   normal    10041     19:17:12
4   2111     ucthi            robm0p4 rndroj00 astronom    RUNNING    1:49:46    12      1         srvcnthpc400   normal    10154     21:57:24

CLUSTER STATUS
PARTITION AVAIL  TIMELIMIT  NODES  STATE NODELIST
 ucthi        up 208-08:00:      1  alloc srvcnthpc400
 ucthi        up 208-08:00:      2   idle srvcnthpc[401-402]
 uctlo        up 208-08:00:      1  alloc srvcnthpc400
 uctlo        up 208-08:00:      2   idle srvcnthpc[401-402]
 ucthimem*    up 208-08:00:      2    mix srvcnthpc[407-408]
 ucthimem*    up 208-08:00:     11   idle srvcnthpc[406,409-418]
 uctlomem     up 208-08:00:      2    mix srvcnthpc[407-408]
 uctlomem     up 208-08:00:     11   idle srvcnthpc[406,409-418]

PartitionName=ucthi
    AllowGroups=ALL AllowAccounts=ALL AllowQos=ALL
    AllocNodes=ALL Default=NO QoS=N/A
    DefaultTime=NONE DisableRootJobs=NO ExclusiveUser=NO GraceTime=0 Hidden=NO
    MaxNodes=UNLIMITED MaxTime=208-08:00:00 MinNodes=1 LLN=NO MaxCPUsPerNode=UNLIMITED
    Nodes=srvcnthpc[400-402]
    PriorityJobFactor=20 PriorityTier=20 RootOnly=NO ReqResv=NO OverSubscribe=FORCE:1
    OverTimeLimit=NONE PreemptMode=REQUEUE
    State=UP TotalCPUs=36 TotalNodes=3 SelectTypeParameters=NONE
    DefMemPerCPU=1000 MaxMemPerCPU=2000
 
 PartitionName=uctlo
    AllowGroups=ALL AllowAccounts=ALL AllowQos=ALL
    AllocNodes=ALL Default=NO QoS=N/A
    DefaultTime=NONE DisableRootJobs=NO ExclusiveUser=NO GraceTime=0 Hidden=NO
    MaxNodes=UNLIMITED MaxTime=208-08:00:00 MinNodes=1 LLN=NO MaxCPUsPerNode=UNLIMITED
    Nodes=srvcnthpc[400-402]
    PriorityJobFactor=20 PriorityTier=20 RootOnly=NO ReqResv=NO OverSubscribe=FORCE:1
    OverTimeLimit=NONE PreemptMode=REQUEUE
    State=UP TotalCPUs=36 TotalNodes=3 SelectTypeParameters=NONE
    DefMemPerCPU=1000 MaxMemPerCPU=2000
 
 PartitionName=ucthimem
    AllowGroups=ALL AllowAccounts=ALL AllowQos=ALL
    AllocNodes=ALL Default=YES QoS=N/A
    DefaultTime=NONE DisableRootJobs=NO ExclusiveUser=NO GraceTime=0 Hidden=NO
    MaxNodes=UNLIMITED MaxTime=208-08:00:00 MinNodes=1 LLN=NO MaxCPUsPerNode=UNLIMITED
    Nodes=srvcnthpc[406-418]
    PriorityJobFactor=20 PriorityTier=20 RootOnly=NO ReqResv=NO OverSubscribe=FORCE:4
    OverTimeLimit=NONE PreemptMode=REQUEUE
    State=UP TotalCPUs=104 TotalNodes=13 SelectTypeParameters=NONE
    DefMemPerCPU=2000 MaxMemPerCPU=4000
 
 PartitionName=uctlomem
    AllowGroups=ALL AllowAccounts=ALL AllowQos=ALL
    AllocNodes=ALL Default=NO QoS=N/A
    DefaultTime=NONE DisableRootJobs=NO ExclusiveUser=NO GraceTime=0 Hidden=NO
    MaxNodes=UNLIMITED MaxTime=208-08:00:00 MinNodes=1 LLN=NO MaxCPUsPerNode=UNLIMITED
    Nodes=srvcnthpc[406-418]
    PriorityJobFactor=10 PriorityTier=10 RootOnly=NO ReqResv=NO OverSubscribe=FORCE:4
    OverTimeLimit=NONE PreemptMode=REQUEUE
    State=UP TotalCPUs=104 TotalNodes=13 SelectTypeParameters=NONE
    DefMemPerCPU=2000 MaxMemPerCPU=4000
 

WORKER NODE STATUS
NodeName=srvcnthpc400 Arch=x86_64 CoresPerSocket=6
   CPUAlloc=12 CPUErr=0 CPUTot=12 CPULoad=21.69
   AvailableFeatures=(null)
   ActiveFeatures=(null)
   Gres=chip:G7:12
   NodeAddr=srvcnthpc400 NodeHostName=srvcnthpc400 Version=17.02
   OS=Linux RealMemory=64000 AllocMem=60000 FreeMem=46454 Sockets=2 Boards=1
   State=ALLOCATED ThreadsPerCore=1 TmpDisk=0 Weight=1 Owner=N/A MCS_label=N/A
   Partitions=ucthi,uctlo 
   BootTime=2017-06-01T15:09:49 SlurmdStartTime=2017-06-01T15:10:10
   CfgTRES=cpu=12,mem=62.50G
   AllocTRES=cpu=12,mem=60000M
   CapWatts=n/a
   CurrentWatts=0 LowestJoules=0 ConsumedJoules=0
   ExtSensorsJoules=n/s ExtSensorsWatts=0 ExtSensorsTemp=n/s
      2111 ucthi robm0p4 rndroj00 R 1:49:47 srvcnthpc400

NodeName=srvcnthpc401 Arch=x86_64 CoresPerSocket=6
   CPUAlloc=0 CPUErr=0 CPUTot=12 CPULoad=12.18
   AvailableFeatures=(null)
   ActiveFeatures=(null)
   Gres=chip:G7:12
   NodeAddr=srvcnthpc401 NodeHostName=srvcnthpc401 Version=17.02
   OS=Linux RealMemory=22700 AllocMem=0 FreeMem=20571 Sockets=2 Boards=1
   State=IDLE ThreadsPerCore=1 TmpDisk=0 Weight=1 Owner=N/A MCS_label=N/A
   Partitions=ucthi,uctlo 
   BootTime=2017-06-01T15:09:31 SlurmdStartTime=2017-06-01T15:09:58
   CfgTRES=cpu=12,mem=22700M
   AllocTRES=
   CapWatts=n/a
   CurrentWatts=0 LowestJoules=0 ConsumedJoules=0
   ExtSensorsJoules=n/s ExtSensorsWatts=0 ExtSensorsTemp=n/s

NodeName=srvcnthpc402 Arch=x86_64 CoresPerSocket=6
   CPUAlloc=0 CPUErr=0 CPUTot=12 CPULoad=12.13
   AvailableFeatures=(null)
   ActiveFeatures=(null)
   Gres=chip:G7:12
   NodeAddr=srvcnthpc402 NodeHostName=srvcnthpc402 Version=17.02
   OS=Linux RealMemory=22700 AllocMem=0 FreeMem=20913 Sockets=2 Boards=1
   State=IDLE ThreadsPerCore=1 TmpDisk=0 Weight=1 Owner=N/A MCS_label=N/A
   Partitions=ucthi,uctlo 
   BootTime=2017-06-01T15:09:29 SlurmdStartTime=2017-06-01T15:09:45
   CfgTRES=cpu=12,mem=22700M
   AllocTRES=
   CapWatts=n/a
   CurrentWatts=0 LowestJoules=0 ConsumedJoules=0
   ExtSensorsJoules=n/s ExtSensorsWatts=0 ExtSensorsTemp=n/s

NodeName=srvcnthpc406 Arch=x86_64 CoresPerSocket=4
   CPUAlloc=0 CPUErr=0 CPUTot=8 CPULoad=0.01
   AvailableFeatures=(null)
   ActiveFeatures=(null)
   Gres=chip:G6:8
   NodeAddr=srvcnthpc406 NodeHostName=srvcnthpc406 Version=17.02
   OS=Linux RealMemory=32000 AllocMem=0 FreeMem=45302 Sockets=2 Boards=1
   State=IDLE ThreadsPerCore=1 TmpDisk=0 Weight=1 Owner=N/A MCS_label=N/A
   Partitions=ucthimem,uctlomem 
   BootTime=2017-06-01T15:06:34 SlurmdStartTime=2017-06-01T15:07:05
   CfgTRES=cpu=8,mem=32000M
   AllocTRES=
   CapWatts=n/a
   CurrentWatts=0 LowestJoules=0 ConsumedJoules=0
   ExtSensorsJoules=n/s ExtSensorsWatts=0 ExtSensorsTemp=n/s

NodeName=srvcnthpc407 Arch=x86_64 CoresPerSocket=4
   CPUAlloc=6 CPUErr=0 CPUTot=8 CPULoad=2.01
   AvailableFeatures=(null)
   ActiveFeatures=(null)
   Gres=chip:G6:8
   NodeAddr=srvcnthpc407 NodeHostName=srvcnthpc407 Version=17.02
   OS=Linux RealMemory=48000 AllocMem=24000 FreeMem=38746 Sockets=2 Boards=1
   State=MIXED ThreadsPerCore=1 TmpDisk=0 Weight=1 Owner=N/A MCS_label=N/A
   Partitions=ucthimem,uctlomem 
   BootTime=2017-06-01T15:06:46 SlurmdStartTime=2017-06-01T15:07:11
   CfgTRES=cpu=8,mem=48000M
   AllocTRES=cpu=6,mem=24000M
   CapWatts=n/a
   CurrentWatts=0 LowestJoules=0 ConsumedJoules=0
   ExtSensorsJoules=n/s ExtSensorsWatts=0 ExtSensorsTemp=n/s
      2109 ucthimem 48p006 arossgil R 6:26:27 srvcnthpc407
      2108 ucthimem 48p008 arossgil R 6:27:38 srvcnthpc407

NodeName=srvcnthpc408 Arch=x86_64 CoresPerSocket=4
   CPUAlloc=3 CPUErr=0 CPUTot=8 CPULoad=1.00
   AvailableFeatures=(null)
   ActiveFeatures=(null)
   Gres=chip:G6:8
   NodeAddr=srvcnthpc408 NodeHostName=srvcnthpc408 Version=17.02
   OS=Linux RealMemory=32000 AllocMem=12000 FreeMem=25990 Sockets=2 Boards=1
   State=MIXED ThreadsPerCore=1 TmpDisk=0 Weight=1 Owner=N/A MCS_label=N/A
   Partitions=ucthimem,uctlomem 
   BootTime=2017-06-01T15:06:26 SlurmdStartTime=2017-06-01T15:06:50
   CfgTRES=cpu=8,mem=32000M
   AllocTRES=cpu=3,mem=12000M
   CapWatts=n/a
   CurrentWatts=0 LowestJoules=0 ConsumedJoules=0
   ExtSensorsJoules=n/s ExtSensorsWatts=0 ExtSensorsTemp=n/s
      2110 ucthimem 48p004 arossgil R 6:25:44 srvcnthpc408

NodeName=srvcnthpc409 Arch=x86_64 CoresPerSocket=4
   CPUAlloc=0 CPUErr=0 CPUTot=8 CPULoad=0.01
   AvailableFeatures=(null)
   ActiveFeatures=(null)
   Gres=chip:G1:8
   NodeAddr=srvcnthpc409 NodeHostName=srvcnthpc409 Version=17.02
   OS=Linux RealMemory=32000 AllocMem=0 FreeMem=29299 Sockets=2 Boards=1
   State=IDLE ThreadsPerCore=1 TmpDisk=0 Weight=1 Owner=N/A MCS_label=N/A
   Partitions=ucthimem,uctlomem 
   BootTime=2017-06-01T15:05:23 SlurmdStartTime=2017-06-01T15:06:13
   CfgTRES=cpu=8,mem=32000M
   AllocTRES=
   CapWatts=n/a
   CurrentWatts=0 LowestJoules=0 ConsumedJoules=0
   ExtSensorsJoules=n/s ExtSensorsWatts=0 ExtSensorsTemp=n/s

NodeName=srvcnthpc410 Arch=x86_64 CoresPerSocket=4
   CPUAlloc=0 CPUErr=0 CPUTot=8 CPULoad=0.01
   AvailableFeatures=(null)
   ActiveFeatures=(null)
   Gres=chip:G1:8
   NodeAddr=srvcnthpc410 NodeHostName=srvcnthpc410 Version=17.02
   OS=Linux RealMemory=32000 AllocMem=0 FreeMem=29381 Sockets=2 Boards=1
   State=IDLE ThreadsPerCore=1 TmpDisk=0 Weight=1 Owner=N/A MCS_label=N/A
   Partitions=ucthimem,uctlomem 
   BootTime=2017-06-01T15:05:23 SlurmdStartTime=2017-06-01T15:06:13
   CfgTRES=cpu=8,mem=32000M
   AllocTRES=
   CapWatts=n/a
   CurrentWatts=0 LowestJoules=0 ConsumedJoules=0
   ExtSensorsJoules=n/s ExtSensorsWatts=0 ExtSensorsTemp=n/s

NodeName=srvcnthpc411 Arch=x86_64 CoresPerSocket=4
   CPUAlloc=0 CPUErr=0 CPUTot=8 CPULoad=0.01
   AvailableFeatures=(null)
   ActiveFeatures=(null)
   Gres=chip:G1:8
   NodeAddr=srvcnthpc411 NodeHostName=srvcnthpc411 Version=17.02
   OS=Linux RealMemory=32000 AllocMem=0 FreeMem=29403 Sockets=2 Boards=1
   State=IDLE ThreadsPerCore=1 TmpDisk=0 Weight=1 Owner=N/A MCS_label=N/A
   Partitions=ucthimem,uctlomem 
   BootTime=2017-06-01T15:05:23 SlurmdStartTime=2017-06-01T15:06:08
   CfgTRES=cpu=8,mem=32000M
   AllocTRES=
   CapWatts=n/a
   CurrentWatts=0 LowestJoules=0 ConsumedJoules=0
   ExtSensorsJoules=n/s ExtSensorsWatts=0 ExtSensorsTemp=n/s

NodeName=srvcnthpc412 Arch=x86_64 CoresPerSocket=4
   CPUAlloc=0 CPUErr=0 CPUTot=8 CPULoad=0.01
   AvailableFeatures=(null)
   ActiveFeatures=(null)
   Gres=chip:G1:8
   NodeAddr=srvcnthpc412 NodeHostName=srvcnthpc412 Version=17.02
   OS=Linux RealMemory=32000 AllocMem=0 FreeMem=29415 Sockets=2 Boards=1
   State=IDLE ThreadsPerCore=1 TmpDisk=0 Weight=1 Owner=N/A MCS_label=N/A
   Partitions=ucthimem,uctlomem 
   BootTime=2017-06-01T15:05:23 SlurmdStartTime=2017-06-01T15:05:54
   CfgTRES=cpu=8,mem=32000M
   AllocTRES=
   CapWatts=n/a
   CurrentWatts=0 LowestJoules=0 ConsumedJoules=0
   ExtSensorsJoules=n/s ExtSensorsWatts=0 ExtSensorsTemp=n/s

NodeName=srvcnthpc413 Arch=x86_64 CoresPerSocket=4
   CPUAlloc=0 CPUErr=0 CPUTot=8 CPULoad=0.01
   AvailableFeatures=(null)
   ActiveFeatures=(null)
   Gres=chip:G1:8
   NodeAddr=srvcnthpc413 NodeHostName=srvcnthpc413 Version=17.02
   OS=Linux RealMemory=32000 AllocMem=0 FreeMem=29647 Sockets=2 Boards=1
   State=IDLE ThreadsPerCore=1 TmpDisk=0 Weight=1 Owner=N/A MCS_label=N/A
   Partitions=ucthimem,uctlomem 
   BootTime=2017-06-01T15:05:23 SlurmdStartTime=2017-06-01T15:17:16
   CfgTRES=cpu=8,mem=32000M
   AllocTRES=
   CapWatts=n/a
   CurrentWatts=0 LowestJoules=0 ConsumedJoules=0
   ExtSensorsJoules=n/s ExtSensorsWatts=0 ExtSensorsTemp=n/s

NodeName=srvcnthpc414 Arch=x86_64 CoresPerSocket=4
   CPUAlloc=0 CPUErr=0 CPUTot=8 CPULoad=0.01
   AvailableFeatures=(null)
   ActiveFeatures=(null)
   Gres=chip:G1:8
   NodeAddr=srvcnthpc414 NodeHostName=srvcnthpc414 Version=17.02
   OS=Linux RealMemory=32000 AllocMem=0 FreeMem=29426 Sockets=2 Boards=1
   State=IDLE ThreadsPerCore=1 TmpDisk=0 Weight=1 Owner=N/A MCS_label=N/A
   Partitions=ucthimem,uctlomem 
   BootTime=2017-06-01T15:05:23 SlurmdStartTime=2017-06-01T15:06:08
   CfgTRES=cpu=8,mem=32000M
   AllocTRES=
   CapWatts=n/a
   CurrentWatts=0 LowestJoules=0 ConsumedJoules=0
   ExtSensorsJoules=n/s ExtSensorsWatts=0 ExtSensorsTemp=n/s

NodeName=srvcnthpc415 Arch=x86_64 CoresPerSocket=4
   CPUAlloc=0 CPUErr=0 CPUTot=8 CPULoad=0.01
   AvailableFeatures=(null)
   ActiveFeatures=(null)
   Gres=chip:G6:8
   NodeAddr=srvcnthpc415 NodeHostName=srvcnthpc415 Version=17.02
   OS=Linux RealMemory=32000 AllocMem=0 FreeMem=29426 Sockets=2 Boards=1
   State=IDLE ThreadsPerCore=1 TmpDisk=0 Weight=1 Owner=N/A MCS_label=N/A
   Partitions=ucthimem,uctlomem 
   BootTime=2017-06-01T15:06:19 SlurmdStartTime=2017-06-01T15:06:44
   CfgTRES=cpu=8,mem=32000M
   AllocTRES=
   CapWatts=n/a
   CurrentWatts=0 LowestJoules=0 ConsumedJoules=0
   ExtSensorsJoules=n/s ExtSensorsWatts=0 ExtSensorsTemp=n/s

NodeName=srvcnthpc416 Arch=x86_64 CoresPerSocket=4
   CPUAlloc=0 CPUErr=0 CPUTot=8 CPULoad=0.01
   AvailableFeatures=(null)
   ActiveFeatures=(null)
   Gres=chip:G1:8
   NodeAddr=srvcnthpc416 NodeHostName=srvcnthpc416 Version=17.02
   OS=Linux RealMemory=32000 AllocMem=0 FreeMem=29424 Sockets=2 Boards=1
   State=IDLE ThreadsPerCore=1 TmpDisk=0 Weight=1 Owner=N/A MCS_label=N/A
   Partitions=ucthimem,uctlomem 
   BootTime=2017-06-01T15:05:23 SlurmdStartTime=2017-06-01T15:06:07
   CfgTRES=cpu=8,mem=32000M
   AllocTRES=
   CapWatts=n/a
   CurrentWatts=0 LowestJoules=0 ConsumedJoules=0
   ExtSensorsJoules=n/s ExtSensorsWatts=0 ExtSensorsTemp=n/s

NodeName=srvcnthpc417 Arch=x86_64 CoresPerSocket=4
   CPUAlloc=0 CPUErr=0 CPUTot=8 CPULoad=0.01
   AvailableFeatures=(null)
   ActiveFeatures=(null)
   Gres=chip:G6:8
   NodeAddr=srvcnthpc417 NodeHostName=srvcnthpc417 Version=17.02
   OS=Linux RealMemory=48000 AllocMem=0 FreeMem=44624 Sockets=2 Boards=1
   State=IDLE ThreadsPerCore=1 TmpDisk=0 Weight=1 Owner=N/A MCS_label=N/A
   Partitions=ucthimem,uctlomem 
   BootTime=2017-06-01T14:47:53 SlurmdStartTime=2017-06-01T14:48:18
   CfgTRES=cpu=8,mem=48000M
   AllocTRES=
   CapWatts=n/a
   CurrentWatts=0 LowestJoules=0 ConsumedJoules=0
   ExtSensorsJoules=n/s ExtSensorsWatts=0 ExtSensorsTemp=n/s

NodeName=srvcnthpc418 Arch=x86_64 CoresPerSocket=4
   CPUAlloc=0 CPUErr=0 CPUTot=8 CPULoad=0.01
   AvailableFeatures=(null)
   ActiveFeatures=(null)
   Gres=chip:G6:8
   NodeAddr=srvcnthpc418 NodeHostName=srvcnthpc418 Version=17.02
   OS=Linux RealMemory=32000 AllocMem=0 FreeMem=29607 Sockets=2 Boards=1
   State=IDLE ThreadsPerCore=1 TmpDisk=0 Weight=1 Owner=N/A MCS_label=N/A
   Partitions=ucthimem,uctlomem 
   BootTime=2017-06-06T09:56:57 SlurmdStartTime=2017-06-06T09:57:21
   CfgTRES=cpu=8,mem=32000M
   AllocTRES=
   CapWatts=n/a
   CurrentWatts=0 LowestJoules=0 ConsumedJoules=0
   ExtSensorsJoules=n/s ExtSensorsWatts=0 ExtSensorsTemp=n/s