User Tools

Site Tools


administration:torque-maui-config

Differences

This shows you the differences between two versions of the page.

Link to this comparison view

Both sides previous revisionPrevious revision
Next revision
Previous revision
administration:torque-maui-config [2008/08/07 10:51] cangianiadministration:torque-maui-config [2009/05/06 16:57] (current) damir
Line 1: Line 1:
 ==== Torque ==== ==== Torque ====
-The magic command for torque configuration is ''qmgr''Used either as interpreter (interactive and/or stdin redirect) or for running one directive at a time (''qmgr -c "directive"''). Directives are of the form ''command server|queue|node [names] [attr OP value[,attr OP value,...]]'', where ''command'' is one of {''set'', ''unset'', ''print'', ''create'', ''delete'', ''list''}; ''names'' is for example the name of the queue, and the attributes are described in the following links for [[http://www.clusterresources.com/torquedocs21/a.bserverparameters.shtml#open|server]] and [[http://www.clusterresources.com/torquedocs21/4.1queueconfig.shtml|queue]] parameters.+The gateway to Torque configuration is the command ''qmgr''It reads configuration directives from ''stdin'' or from command-line argument (''qmgr -c "directive"'').  
 +Configuration directives are of the form  
 +<code> 
 +command server|queue|node [names] [attr OP value[,attr OP value,...]] 
 +</code> 
 +where ''command'' is ''set unset print create delete | list'', ''names'' is a list of object names such as a queue name, and attributes are various object properties. Refer to the following links for detailed information on [[http://www.clusterresources.com/torquedocs21/a.bserverparameters.shtml#open|server]] and [[http://www.clusterresources.com/torquedocs21/4.1queueconfig.shtml|queue]] parameters
 + 
 +The directive ''print server'' (''qmgr -c "print server"'' or ''qmgr -c "p s"'') prints all the server configuration in a format that is just the list of commands that needs to be given to qmgr to reconfigure the server exactly as it is. Example:\\ 
 +configuration at 6 of May 2009.
  
-The directive ''print server'' (''qmgr -c "print server"'' or ''qmgr -c "p s"'') prints all the server configuration in a format that is just the list of commands that needs to be given to qmgr to reconfigure the server exactly as it is. Example: 
 <code> <code>
 [root@licossrv4 maui]# qmgr -c 'p s' [root@licossrv4 maui]# qmgr -c 'p s'
Line 14: Line 21:
 set queue long queue_type = Execution set queue long queue_type = Execution
 set queue long Priority = 60 set queue long Priority = 60
-set queue long max_running = 150+set queue long max_running = 130
 set queue long resources_default.nice = 5 set queue long resources_default.nice = 5
 set queue long acl_group_enable = True set queue long acl_group_enable = True
Line 25: Line 32:
 set queue long acl_groups += student set queue long acl_groups += student
 set queue long max_user_run = 150 set queue long max_user_run = 150
-set queue long enabled = True+set queue long enabled = False
 set queue long started = True set queue long started = True
 # #
Line 32: Line 39:
 create queue default create queue default
 set queue default queue_type = Route set queue default queue_type = Route
 +set queue default resources_default.neednodes = general
 set queue default route_destinations = short set queue default route_destinations = short
 set queue default route_destinations += long set queue default route_destinations += long
 +set queue default route_destinations += smallmem
 +set queue default route_destinations += night
 +set queue default route_destinations += bertrand
 +set queue default route_destinations += nolimit
 set queue default route_destinations += algo set queue default route_destinations += algo
 set queue default enabled = True set queue default enabled = True
 set queue default started = True set queue default started = True
-...+
 +# Create and define queue nolimit 
 +
 +create queue nolimit 
 +set queue nolimit queue_type = Execution 
 +set queue nolimit Priority = 60 
 +set queue nolimit max_running = 130 
 +set queue nolimit resources_default.neednodes = nows 
 +set queue nolimit resources_default.nice = 5 
 +set queue nolimit acl_group_enable = True 
 +set queue nolimit acl_groups = algo 
 +set queue nolimit acl_groups += licos 
 +set queue nolimit acl_groups += arni 
 +set queue nolimit acl_groups += lthc 
 +set queue nolimit acl_groups += lthi 
 +set queue nolimit acl_groups += lcm 
 +set queue nolimit acl_groups += student 
 +set queue nolimit max_user_run = 150 
 +set queue nolimit enabled = True 
 +set queue nolimit started = True 
 +
 +# Create and define queue smallmem 
 +
 +create queue smallmem 
 +set queue smallmem queue_type = Execution 
 +set queue smallmem Priority = 80 
 +set queue smallmem max_running = 130 
 +set queue smallmem resources_max.mem = 512mb 
 +set queue smallmem resources_default.nice = 5 
 +set queue smallmem acl_group_enable = True 
 +set queue smallmem acl_groups = algo 
 +set queue smallmem acl_groups += licos 
 +set queue smallmem acl_groups += arni 
 +set queue smallmem acl_groups += lthc 
 +set queue smallmem acl_groups += lthi 
 +set queue smallmem acl_groups += lcm 
 +set queue smallmem acl_groups += student 
 +set queue smallmem acl_groups += 11240 
 +set queue smallmem max_user_run = 150 
 +set queue smallmem enabled = True 
 +set queue smallmem started = True 
 +
 +# Create and define queue night 
 +
 +create queue night 
 +set queue night queue_type = Execution 
 +set queue night Priority = 60 
 +set queue night max_running = 130 
 +set queue night resources_max.cput = 08:00:00 
 +set queue night resources_default.nice = 5 
 +set queue night acl_group_enable = True 
 +set queue night acl_groups = algo 
 +set queue night acl_groups += licos 
 +set queue night acl_groups += arni 
 +set queue night acl_groups += lthc 
 +set queue night acl_groups += lthi 
 +set queue night acl_groups += lcm 
 +set queue night acl_groups += student 
 +set queue night max_user_run = 150 
 +set queue night enabled = False 
 +set queue night started = False 
 +
 +# Create and define queue short 
 +
 +create queue short 
 +set queue short queue_type = Execution 
 +set queue short Priority = 100 
 +set queue short resources_max.cput = 01:00:00 
 +set queue short resources_default.cput = 01:00:00 
 +set queue short resources_default.nice = 5 
 +set queue short acl_group_enable = True 
 +set queue short acl_groups = algo 
 +set queue short acl_groups += licos 
 +set queue short acl_groups += arni 
 +set queue short acl_groups += lthc 
 +set queue short acl_groups += lthi 
 +set queue short acl_groups += lcm 
 +set queue short acl_groups += student 
 +set queue short max_user_run = 100 
 +set queue short enabled = True 
 +set queue short started = True 
 +
 +# Create and define queue algo 
 +
 +create queue algo 
 +set queue algo queue_type = Execution 
 +set queue algo Priority = 60 
 +set queue algo resources_max.cput = 24:00:00 
 +set queue algo resources_default.neednodes = algo 
 +set queue algo resources_default.nice = 5 
 +set queue algo resources_default.walltime = 01:00:00 
 +set queue algo acl_group_enable = False 
 +set queue algo acl_groups = algo 
 +set queue algo enabled = True 
 +set queue algo started = True 
 +
 +# Create and define queue bertrand 
 +
 +create queue bertrand 
 +set queue bertrand queue_type = Execution 
 +set queue bertrand acl_user_enable = True 
 +set queue bertrand acl_users = bertrand 
 +set queue bertrand acl_users += cangiani 
 +set queue bertrand acl_users += damir 
 +set queue bertrand resources_default.neednodes = bertrand 
 +set queue bertrand enabled = True 
 +set queue bertrand started = True
 # #
 # Set server attributes. # Set server attributes.
Line 44: Line 162:
 set server managers = cangiani@*.epfl.ch set server managers = cangiani@*.epfl.ch
 set server managers += damir@*.epfl.ch set server managers += damir@*.epfl.ch
-set server managers += root@licossrv4.epfl.ch+set server managers += laurenzi@*.epfl.ch 
 +set server managers += root@iscsrv27.epfl.ch
 set server operators = cangiani@*.epfl.ch set server operators = cangiani@*.epfl.ch
 set server operators += damir@*.epfl.ch set server operators += damir@*.epfl.ch
 +set server operators += laurenzi@*.epfl.ch
 set server default_queue = default set server default_queue = default
 set server log_events = 511 set server log_events = 511
 set server mail_from = adm set server mail_from = adm
 set server query_other_jobs = True set server query_other_jobs = True
 +set server resources_default.cput = 01:00:00
 +set server resources_default.mem = 512mb
 set server resources_default.nodect = 1 set server resources_default.nodect = 1
 set server resources_default.nodes = 1 set server resources_default.nodes = 1
Line 59: Line 181:
 set server pbs_version = 2.1.10 set server pbs_version = 2.1.10
 set server allow_node_submit = True set server allow_node_submit = True
 +
 +
 +</code>
 +
 +
 +==== Maui ====
 +Maui reads its configuration from a simple text file: ''/usr/local/maui/maui.cfg''. Here is a [[http://www.clusterresources.com/products/maui/docs/a.fparameters.shtml|full list of parameters]], and here the [[http://www.clusterresources.com/products/maui/docs/mauiadmin.pdf|the maui administration guide in pdf]].
 +
 +current configuration 6 of may 2009
 +<code>
 +# maui.cfg 3.2.6p19
 +
 +SERVERHOST            iscsrv27.epfl.ch
 +# primary admin must be first in list
 +ADMIN1                root damir cangiani
 +ADMIN2                damir cangiani
 +ADMINHOST             localhost iscsrv27 iscsrv27.epfl.ch lthipc1.epfl.ch lthipc1
 +
 +# Resource Manager Definition
 +RMTYPE[0] PBS
 +RMHOST[0] iscsrv27.epfl.ch
 +RMPOST[0] 15001
 +
 +#RMCFG[LICOSSRV4.EPFL.CH] TYPE=PBS@RMNMHOST@
 +
 +# Allocation Manager Definition
 +
 +AMCFG[bank]  TYPE=NONE
 +
 +# full parameter docs at http://supercluster.org/mauidocs/a.fparameters.html
 +# use the 'schedctl -l' command to display current configuration
 +
 +RMPOLLINTERVAL        00:01:00
 +
 +SERVERPORT            42559
 +#SERVERPORT            15004
 +SERVERMODE            NORMAL
 +#SERVERMODE            TEST
 +
 +# Admin: http://supercluster.org/mauidocs/a.esecurity.html
 +
 +
 +LOGFILE               maui.log
 +LOGFILEMAXSIZE        100000000
 +LOGLEVEL              3
 +
 +# Job Priority: http://supercluster.org/mauidocs/5.1jobprioritization.html
 +
 +QUEUETIMEWEIGHT       
 +JOBPRIOACCRUALPOLICY  FULLPOLICY
 +MAXJOBQUEUEDPERUSER   32
 +# MAXPROCPERUSER        0
 +XFWEIGHT              200
 +
 +# FairShare: http://supercluster.org/mauidocs/6.3fairshare.html
 +
 +FSPOLICY              DEDICATEDPES
 +FSDEPTH               7
 +FSINTERVAL            86400
 +FSDECAY               0.80
 +
 +FSWEIGHT              20
 +FSUSERWEIGHT          1
 +FSGROUPWEIGHT         0
 +USERCFG[DEFAULT]      FSTARGET=100
 +
 +# Throttling Policies: http://supercluster.org/mauidocs/6.2throttlingpolicies.html
 +
 +# NONE SPECIFIED
 +
 +# Backfill: http://supercluster.org/mauidocs/8.2backfill.html
 +
 +BACKFILLPOLICY        FIRSTFIT
 +RESERVATIONPOLICY     CURRENTHIGHEST
 +
 +# Node Allocation: http://supercluster.org/mauidocs/5.2nodeallocation.html
 +
 +# NODEALLOCATIONPOLICY  MINRESOURCE
 +# get always the fastest node instead
 +NODEALLOCATIONPOLICY  FASTEST
 +
 +# QOS: http://supercluster.org/mauidocs/7.3qos.html
 +
 +# QOSCFG[hi]  PRIORITY=100 XFTARGET=100 FLAGS=PREEMPTOR:IGNMAXJOB
 +# QOSCFG[low] PRIORITY=-1000 FLAGS=PREEMPTEE
 +
 +# Standing Reservations: http://supercluster.org/mauidocs/7.1.3standingreservations.html
 +
 +# SRSTARTTIME[test] 8:00:00
 +# SRENDTIME[test]   17:00:00
 +# SRDAYS[test]      MON TUE WED THU FRI
 +# SRTASKCOUNT[test] 20
 +# SRMAXTIME[test]   0:30:00
 +
 +# Creds: http://supercluster.org/mauidocs/6.1fairnessoverview.html
 +
 +# USERCFG[DEFAULT]      FSTARGET=100
 +# GROUPCFG[DEFAULT]     FSTARGET=100
 +# USERCFG[john]         PRIORITY=100  FSTARGET=10.0-
 +# GROUPCFG[staff]       PRIORITY=1000 QLIST=hi:low QDEF=hi
 +# CLASSCFG[batch]       FLAGS=PREEMPTEE
 +# CLASSCFG[interactive] FLAGS=PREEMPTOR
 +
 +# node configurations
 +# NODECFG[nodename] properties list
 +# where nodename can also be 'DEFAULT', and (some of the) properties are
 +# PARTITION=string a way to group machines. Multi CPU jobs are always
 +# runned within the same partition.
 +#                       (e.g. PARTITION=algo_cluster) It can also be used to
 +# give exclusive use of certain machines to a given group
 +# GROUPCFG[algo] PLIST=algo_cluster
 +# PROCSPEED=integer the processor clock in MHz
 +# SPEED=float the overall speed of the machine with respect to a
 +# standard reference. 0.0 < float <= 100.0
 +# FEATURES=stringlist a set of "opaque" feature of the node (e.g. 
 +# FEATURES=Opteron:myrinet:fpga:matlab
 +# MAXJOB=integer maximum number of job that can run simultaneusly
 +#
 +#NODECFG[DEFAULT] MAXLOAD=2.5
 +#NODECFG[DEFAULT] MAXJOB=2
 +
 +DEFERTIME 0
  
 </code> </code>
  
administration/torque-maui-config.1218106299.txt.gz · Last modified: 2008/08/07 10:51 by cangiani