Torque & Maui Important Commands

root@n1:~# checknode n1

checking node n1

State:      Idle  (in current state for 00:06:12)
Configured Resources: PROCS: 4  MEM: 995M  SWAP: 2017M  DISK: 1M
Utilized   Resources: SWAP: 223M
Dedicated  Resources: [NONE]
Opsys:         linux  Arch:      [NONE]
Speed:      1.00  Load:       0.000
Network:    [DEFAULT]
Features:   [NONE]
Attributes: [Batch]
Classes:    [batch 4:4]

Total Time: 1:47:36  Up: 1:47:36 (100.00%)  Active: 00:07:51 (7.30%)

Reservations:
NOTE:  no reservations on node 

root@n1:~# diagnose -n

diagnosing node table (5120 slots)
Name                    State  Procs     Memory         Disk          Swap      Speed  Opsys   Arch Par   Load Res Classes                        Network                        Features

n1                       Idle   4:4      995:995         1:1        1794:2017    1.00  linux [NONE] DEF   0.00 000 [batch_4:4]                    [DEFAULT]                      [NONE]
-----                     ---   4:4      995:995         1:1        1794:2017

Total Nodes: 1  (Active: 0  Idle: 1  Down: 0)

root@n1:~# diagnose -c

Class/Queue Status

Name           Priority Flags        QDef              QOSList* PartitionList        Target Limits

batch                 0 [NONE]       [NONE]             [NONE]  [NONE]                0.00  MAXJOB=0:4
  MAXPROCPERJOB=4
root@n1:~# diagnose -j
Name                  State Par Proc QOS     WCLimit R  Min     User    Group  Account  QueuedTime  Network  Opsys   Arch    Mem   Disk  Procs       Class Features

12                  Running DEF    4 DEF     1:00:00 1    4    rravi    rravi        -    00:00:02   [NONE] [NONE] [NONE]    >=0    >=0    NC0   [batch:1] [NONE]


Total Jobs: 1  Active Jobs: 1

root@n1:~# tracejob -q 13

Job: 13.n1.test.com

08/01/2013 09:54:16  S    enqueuing into batch, state 1 hop 1
08/01/2013 09:54:16  A    queue=batch
08/01/2013 09:54:17  S    Job Run at request of root@n1.test.com
08/01/2013 09:54:17  S    Not sending email: User does not want mail of this type.
08/01/2013 09:54:17  A    user=rravi group=rravi jobname=host queue=batch ctime=1375331056 qtime=1375331056 etime=1375331056 start=1375331057 owner=rravi@n1.test.com exec_host=n1/3+n1/2+n1/1+n1/0 Resource_List.ncpus=1
                          Resource_List.neednodes=1:ppn=4 Resource_List.nodect=1 Resource_List.nodes=1:ppn=4 Resource_List.walltime=01:00:00

root@n1:~# checkjob 13

checking job 13

State: Running
Creds:  user:rravi  group:rravi  class:batch  qos:DEFAULT
WallTime: 00:00:31 of 1:00:00
SubmitTime: Thu Aug  1 09:54:16
  (Time Queued  Total: 00:00:01  Eligible: 00:00:01)

StartTime: Thu Aug  1 09:54:17
Total Tasks: 4

Req[0]  TaskCount: 4  Partition: DEFAULT
Network: [NONE]  Memory >= 0  Disk >= 0  Swap >= 0
Opsys: [NONE]  Arch: [NONE]  Features: [NONE]
Allocated Nodes:
[n1:4]


IWD: [NONE]  Executable:  [NONE]
Bypass: 0  StartCount: 1
PartitionMask: [ALL]
Flags:       RESTARTABLE

Reservation '13' (-00:00:31 -> 00:59:29  Duration: 1:00:00)
PE:  4.00  StartPriority:  1

root@n1:~# qstat

Job ID                    Name             User            Time Use S Queue
------------------------- ---------------- --------------- -------- - -----
13.n1                      host             rravi           00:00:00 R batch

root@n1:~# showq

ACTIVE JOBS--------------------
JOBNAME            USERNAME      STATE  PROC   REMAINING            STARTTIME

13                    rravi    Running     4    00:58:58  Thu Aug  1 09:54:17

     1 Active Job        4 of    4 Processors Active (100.00%)
                         1 of    1 Nodes Active      (100.00%)

IDLE JOBS----------------------
JOBNAME            USERNAME      STATE  PROC     WCLIMIT            QUEUETIME


0 Idle Jobs

BLOCKED JOBS----------------
JOBNAME            USERNAME      STATE  PROC     WCLIMIT            QUEUETIME


Total Jobs: 1   Active Jobs: 1   Idle Jobs: 0   Blocked Jobs: 0

root@n1:~# showbf

backfill window (user: 'root' group: 'root' partition: ALL) Thu Aug  1 09:55:50

no procs available

root@n1:~# canceljob 13

job '13' cancelled

root@n1:~# qmgr -c 'print server'    # abbreviated form: qmgr -c 'p s'

#
# Create queues and set their attributes.
#
#
# Create and define queue batch
#
create queue batch
set queue batch queue_type = Execution
set queue batch max_running = 4
set queue batch resources_max.ncpus = 4
set queue batch resources_max.nodes = 2
set queue batch resources_min.ncpus = 1
set queue batch resources_default.ncpus = 1
set queue batch resources_default.nodect = 1
set queue batch resources_default.nodes = 1
set queue batch resources_default.walltime = 01:00:00
set queue batch enabled = True
set queue batch started = True
#
# Set server attributes.
#
set server scheduling = True
set server acl_hosts = n1
set server default_queue = batch
set server log_events = 511
set server mail_from = adm
set server scheduler_iteration = 600
set server node_check_rate = 150
set server tcp_timeout = 300
set server job_stat_rate = 45
set server poll_jobs = True
set server mom_job_sync = True
set server keep_completed = 0
set server next_job_number = 14
set server moab_array_compatible = True
Advertisements

Leave a Reply

Fill in your details below or click an icon to log in:

WordPress.com Logo

You are commenting using your WordPress.com account. ( Log Out / Change )

Twitter picture

You are commenting using your Twitter account. ( Log Out / Change )

Facebook photo

You are commenting using your Facebook account. ( Log Out / Change )

Google+ photo

You are commenting using your Google+ account. ( Log Out / Change )

Connecting to %s