[Mauiusers] Couldn't submit any job: Cannot set hostlist
renyanliang
yanliangren_2002 at yahoo.com.cn
Wed Apr 12 20:48:41 MDT 2006
Dear everybody:
Glad to meet you. I am using OpenPBS v2.3.16 and Maui 3.2.6p14. However, every job that anybody submits fails to run and is always deferred by Maui. The reason shown is:
===========================
checking job 5111
State: Idle EState: Deferred
Creds: user:ren group:[DEFAULT] class:rcmm1 qos:DEFAULT
WallTime: 00:00:00 of 99:23:59:59
SubmitTime: Thu Apr 13 10:26:04
(Time Queued Total: 00:32:05 Eligible: 00:00:01)
StartDate: -00:32:03 Thu Apr 13 10:26:06
Total Tasks: 2
Req[0] TaskCount: 2 Partition: ALL
Network: [NONE] Memory >= 0 Disk >= 0 Swap >= 0
Opsys: [NONE] Arch: [NONE] Features: [NONE]
IWD: [NONE] Executable: [NONE]
Bypass: 0 StartCount: 1
PartitionMask: [ALL]
job is deferred. Reason: RMFailure (job cannot be started - cannot set hostlist)
Holds: Defer (hold reason: RMFailure)
PE: 2.00 StartPriority: 1
cannot select job 5111 for partition DEFAULT (job hold active)
===============================
I hope somebody can give me some advice. Thanks in advance!
Best regards!
The OpenPBS configuration is as follows:
#
# Create queues and set their attributes.
#
#
# Create and define queue rcmm1
#
create queue rcmm1
set queue rcmm1 queue_type = Execution
set queue rcmm1 acl_host_enable = False
set queue rcmm1 acl_hosts = +rcmm5+rcmm6+rcmm7+rcmm8+rcmm9+rcmm10+rcmm11+rcmm12+rcmm13
set queue rcmm1 max_user_proc = 4
set queue rcmm1 enabled = True
set queue rcmm1 started = True
#
# Create and define queue rcmm2
#
create queue rcmm2
set queue rcmm2 queue_type = Execution
set queue rcmm2 max_user_proc = 4
set queue rcmm2 enabled = True
set queue rcmm2 started = True
#
# Set server attributes.
#
set server scheduling = True
set server managers = liu@*
set server default_queue = rcmm1
set server log_events = 511
set server mail_from = Rcmm1
set server query_other_jobs = True
set server scheduler_iteration = 600
set server default_node = rcmm5
set server node_pack = True
--------------------------------------------------------------------------
The showconfig result is:
# Maui version (PID: 32661)
# global policies
REJECTNEGPRIOJOBS[0] FALSE
ENABLENEGJOBPRIORITY[0] FALSE
ENABLEMULTINODEJOBS[0] TRUE
ENABLEMULTIREQJOBS[0] FALSE
BFPRIORITYPOLICY[0] [NONE]
JOBPRIOACCRUALPOLICY QUEUEPOLICY
NODELOADPOLICY ADJUSTSTATE
USEMACHINESPEED FALSE
USESYSTEMQUEUETIME TRUE
USELOCALMACHINEPRIORITY FALSE
NODEUNTRACKEDLOADFACTOR 1.2
JOBNODEMATCHPOLICY[0]
JOBMAXSTARTTIME[0] INFINITY
METAMAXTASKS[0] 0
NODESETPOLICY[0] [NONE]
NODESETATTRIBUTE[0] [NONE]
NODESETLIST[0]
NODESETDELAY[0] 00:00:00
NODESETPRIORITYTYPE[0] MINLOSS
NODESETTOLERANCE[0] 0.00
BACKFILLPOLICY[0] FIRSTFIT
BACKFILLDEPTH[0] 0
BACKFILLPROCFACTOR[0] 0
BACKFILLMAXSCHEDULES[0] 10000
BACKFILLMETRIC[0] PROCS
BFCHUNKDURATION[0] 00:00:00
BFCHUNKSIZE[0] 0
PREEMPTPOLICY[0] REQUEUE
MINADMINSTIME[0] 00:00:00
RESOURCELIMITPOLICY[0]
NODEAVAILABILITYPOLICY[0] COMBINED:[DEFAULT]
NODEALLOCATIONPOLICY[0] MINRESOURCE
TASKDISTRIBUTIONPOLICY[0] DEFAULT
RESERVATIONPOLICY[0] CURRENTHIGHEST
RESERVATIONRETRYTIME[0] 00:00:00
RESERVATIONTHRESHOLDTYPE[0] NONE
RESERVATIONTHRESHOLDVALUE[0] 0
FSPOLICY [NONE]
FSINTERVAL 12:00:00
FSDEPTH 8
FSDECAY 1.00
# Priority Weights
SERVICEWEIGHT[0] 1
TARGETWEIGHT[0] 1
CREDWEIGHT[0] 1
ATTRWEIGHT[0] 1
FSWEIGHT[0] 1
RESWEIGHT[0] 1
USAGEWEIGHT[0] 1
QUEUETIMEWEIGHT[0] 1
XFACTORWEIGHT[0] 0
SPVIOLATIONWEIGHT[0] 0
BYPASSWEIGHT[0] 0
TARGETQUEUETIMEWEIGHT[0] 0
TARGETXFACTORWEIGHT[0] 0
USERWEIGHT[0] 0
GROUPWEIGHT[0] 0
ACCOUNTWEIGHT[0] 0
QOSWEIGHT[0] 0
CLASSWEIGHT[0] 0
FSUSERWEIGHT[0] 0
FSGROUPWEIGHT[0] 0
FSACCOUNTWEIGHT[0] 0
FSQOSWEIGHT[0] 0
FSCLASSWEIGHT[0] 0
ATTRATTRWEIGHT[0] 0
ATTRSTATEWEIGHT[0] 0
NODEWEIGHT[0] 0
PROCWEIGHT[0] 0
MEMWEIGHT[0] 0
SWAPWEIGHT[0] 0
DISKWEIGHT[0] 0
PSWEIGHT[0] 0
PEWEIGHT[0] 0
WALLTIMEWEIGHT[0] 0
UPROCWEIGHT[0] 0
UJOBWEIGHT[0] 0
CONSUMEDWEIGHT[0] 0
REMAININGWEIGHT[0] 0
PERCENTWEIGHT[0] 0
XFMINWCLIMIT[0] 00:02:00
# partition DEFAULT policies
REJECTNEGPRIOJOBS[1] FALSE
ENABLENEGJOBPRIORITY[1] FALSE
ENABLEMULTINODEJOBS[1] TRUE
ENABLEMULTIREQJOBS[1] FALSE
BFPRIORITYPOLICY[1] [NONE]
JOBPRIOACCRUALPOLICY QUEUEPOLICY
NODELOADPOLICY ADJUSTSTATE
JOBNODEMATCHPOLICY[1]
JOBMAXSTARTTIME[1] INFINITY
METAMAXTASKS[1] 0
NODESETPOLICY[1] [NONE]
NODESETATTRIBUTE[1] [NONE]
NODESETLIST[1]
NODESETDELAY[1] 00:00:00
NODESETPRIORITYTYPE[1] MINLOSS
NODESETTOLERANCE[1] 0.00
# Priority Weights
XFMINWCLIMIT[1] 00:00:00
RMAUTHTYPE[0] CHECKSUM
CLASSCFG[[NONE]] DEFAULT.FEATURES=[NONE]
CLASSCFG[[ALL]] DEFAULT.FEATURES=[NONE]
CLASSCFG[rcmm1] DEFAULT.FEATURES=[NONE]
CLASSCFG[rcmm2] DEFAULT.FEATURES=[NONE]
QOSPRIORITY[0] 0
QOSQTWEIGHT[0] 0
QOSXFWEIGHT[0] 0
QOSTARGETXF[0] 0.00
QOSTARGETQT[0] 00:00:00
QOSFLAGS[0]
QOSPRIORITY[1] 0
QOSQTWEIGHT[1] 0
QOSXFWEIGHT[1] 0
QOSTARGETXF[1] 0.00
QOSTARGETQT[1] 00:00:00
QOSFLAGS[1]
# SERVER MODULES: MX
SERVERMODE NORMAL
SERVERNAME
SERVERHOST rcmm1
SERVERPORT 42559
LOGFILE maui.log
LOGFILEMAXSIZE 10000000
LOGFILEROLLDEPTH 1
LOGLEVEL 8
LOGFACILITY fALL
SERVERHOMEDIR /usr/local/maui/
TOOLSDIR /usr/local/maui/tools/
LOGDIR /usr/local/maui/log/
STATDIR /usr/local/maui/stats/
LOCKFILE /usr/local/maui/maui.pid
SERVERCONFIGFILE /usr/local/maui/maui.cfg
CHECKPOINTFILE /usr/local/maui/maui.ck
CHECKPOINTINTERVAL 00:05:00
CHECKPOINTEXPIRATIONTIME 3:11:20:00
TRAPJOB
TRAPNODE
TRAPFUNCTION
RESDEPTH 24
RMPOLLINTERVAL 00:00:30
NODEACCESSPOLICY SHARED
ALLOCLOCALITYPOLICY [NONE]
SIMTIMEPOLICY [NONE]
ADMIN1 ren
ADMINHOSTS ALL
NODEPOLLFREQUENCY 0
DISPLAYFLAGS
DEFAULTDOMAIN
DEFAULTCLASSLIST [DEFAULT:1]
FEATURENODETYPEHEADER
FEATUREPROCSPEEDHEADER
FEATUREPARTITIONHEADER
DEFERTIME 1:00:00
DEFERCOUNT 24
DEFERSTARTCOUNT 1
JOBPURGETIME 0
NODEPURGETIME 2140000000
APIFAILURETHRESHHOLD 6
NODESYNCTIME 600
JOBSYNCTIME 600
JOBMAXOVERRUN 00:10:00
NODEMAXLOAD 0.0
PLOTMINTIME 120
PLOTMAXTIME 245760
PLOTTIMESCALE 11
PLOTMINPROC 1
PLOTMAXPROC 512
PLOTPROCSCALE 9
SCHEDCFG[] MODE=NORMAL SERVER=rcmm1:42559
# RM MODULES: PBS SSS WIKI NATIVE
RMCFG[rcmm1] AUTHTYPE=CHECKSUM EPORT=15004 TIMEOUT=00:00:09 TYPE=PBS
SIMWORKLOADTRACEFILE workload
SIMRESOURCETRACEFILE resource
SIMAUTOSHUTDOWN OFF
SIMSTARTTIME 0
SIMSCALEJOBRUNTIME FALSE
SIMFLAGS
SIMJOBSUBMISSIONPOLICY CONSTANTJOBDEPTH
SIMINITIALQUEUEDEPTH 16
SIMWCACCURACY 0.00
SIMWCACCURACYCHANGE 0.00
SIMNODECOUNT 0
SIMNODECONFIGURATION NORMAL
SIMWCSCALINGPERCENT 100
SIMCOMRATE 0.10
SIMCOMTYPE ROUNDROBIN
COMINTRAFRAMECOST 0.30
COMINTERFRAMECOST 0.30
SIMSTOPITERATION -1
SIMEXITITERATION -1
-----------------------------------------------------------------------------
Part of the log file:
04/13 11:02:17 MQueueSelectJobs(SrcQ,DstQ,HARD,5120,4096,2140000000,EVERY,FReason,FALSE)
04/13 11:02:17 INFO: idle job queue is empty on iteration 79
04/13 11:02:17 MQueueSelectJobs(SrcQ,DstQ,SOFT,5120,4096,2140000000,EVERY,FReason,TRUE)
04/13 11:02:17 INFO: idle job queue is empty on iteration 79
04/13 11:02:17 MQueueSelectJobs(SrcQ,DstQ,HARD,5120,4096,2140000000,EVERY,FReason,TRUE)
04/13 11:02:17 INFO: idle job queue is empty on iteration 79
04/13 11:02:17 INFO: cannot finalize RM cycle (RM 'rcmm1' does not support function 'cyclefinalize')
04/13 11:02:17 MQueueSelectJobs(SrcQ,DstQ,SOFT,5120,4096,2140000000,EVERY,FReason,TRUE)
04/13 11:02:17 INFO: idle job queue is empty on iteration 79
04/13 11:02:17 MSchedUpdateStats()
04/13 11:02:17 INFO: iteration: 79 scheduling time: 0.134 seconds
04/13 11:02:17 MResUpdateStats()
04/13 11:02:17 INFO: current util[79]: 4/6 (66.67%) PH: 0.35% active jobs: 1 of 1 (completed: 0)
04/13 11:02:17 MQueueCheckStatus()
04/13 11:02:17 INFO: checking purge criteria for job '5104'
04/13 11:02:17 INFO: checking purge criteria for job '5108'
04/13 11:02:17 INFO: checking purge criteria for job '5111'
04/13 11:02:17 MNodeCheckStatus()
04/13 11:02:17 INFO: checking node 'rcmm5'
04/13 11:02:17 INFO: checking node 'rcmm6'
04/13 11:02:17 INFO: checking node 'rcmm7'
04/13 11:02:17 INFO: checking node 'rcmm8'
04/13 11:02:17 INFO: checking node 'rcmm9'
04/13 11:02:17 INFO: checking node 'rcmm10'
04/13 11:02:17 INFO: checking node 'rcmm11'
04/13 11:02:17 INFO: checking node 'rcmm12'
04/13 11:02:17 INFO: checking node 'rcmm13'
04/13 11:02:17 INFO: checking node 'rcmm14'
04/13 11:02:17 INFO: checking node 'rcmm15'
04/13 11:02:17 INFO: checking node 'rcmm16'
04/13 11:02:17 INFO: checking node 'rcmm52'
04/13 11:02:17 INFO: checking node 'rcmm53'
04/13 11:02:17 INFO: checking node 'rcmm55'
04/13 11:02:17 INFO: checking node 'rcmm54'
04/13 11:02:17 INFO: checking node 'rcmm56'
04/13 11:02:17 INFO: checking node 'rcmm57'
04/13 11:02:17 MSysCheck()
04/13 11:02:17 MLimitEnforceAll(ALL)
04/13 11:02:17 MUClearChild(PID)
04/13 11:02:17 MParUpdate(ALL)
04/13 11:02:17 INFO: P[ALL]: Total 18:36 Up 6:12 Idle 2:12 Active 4:4
04/13 11:02:17 INFO: MNode[rcmm5] added to MPar[DEFAULT] (0:2)
04/13 11:02:17 INFO: MNode[rcmm6] added to MPar[DEFAULT] (2:2)
04/13 11:02:17 INFO: MNode[rcmm7] added to MPar[DEFAULT] (0:2)
04/13 11:02:17 INFO: MNode[rcmm8] added to MPar[DEFAULT] (2:2)
04/13 11:02:17 INFO: MNode[rcmm9] added to MPar[DEFAULT] (2:2)
04/13 11:02:17 INFO: MNode[rcmm10] added to MPar[DEFAULT] (2:2)
04/13 11:02:17 INFO: MNode[rcmm11] added to MPar[DEFAULT] (2:2)
04/13 11:02:17 INFO: MNode[rcmm12] added to MPar[DEFAULT] (2:2)
04/13 11:02:17 INFO: MNode[rcmm13] added to MPar[DEFAULT] (0:2)
04/13 11:02:17 INFO: MNode[rcmm14] added to MPar[DEFAULT] (0:2)
04/13 11:02:17 INFO: MNode[rcmm15] added to MPar[DEFAULT] (0:2)
04/13 11:02:17 INFO: MNode[rcmm16] added to MPar[DEFAULT] (0:2)
04/13 11:02:17 INFO: MNode[rcmm52] added to MPar[DEFAULT] (0:2)
04/13 11:02:17 INFO: MNode[rcmm53] added to MPar[DEFAULT] (0:2)
04/13 11:02:17 INFO: MNode[rcmm55] added to MPar[DEFAULT] (0:2)
04/13 11:02:17 INFO: MNode[rcmm54] added to MPar[DEFAULT] (0:2)
04/13 11:02:17 INFO: MNode[rcmm56] added to MPar[DEFAULT] (0:2)
04/13 11:02:17 INFO: MNode[rcmm57] added to MPar[DEFAULT] (0:2)
04/13 11:02:17 INFO: P[ALL]: Total 18:36 Up 6:12 Idle 2:12 Active 4:4
04/13 11:02:17 MResCheckStatus(NULL)
04/13 11:02:17 INFO: checking R[000]: '5104' end: 99:11:47:26
04/13 11:02:17 INFO: scheduling complete. sleeping 30 seconds
04/13 11:02:17 UIProcessClients(6,30)
04/13 11:02:47 UIProcessClients(7,1)
04/13 11:02:48 ServerProcessRequests()
04/13 11:02:48 MLogRoll(NULL,0,1)
04/13 11:02:48 INFO: not rolling logs (1991856 < 10000000)
04/13 11:02:48 MResAdjust(NULL,0,0)
04/13 11:02:48 MJobSetAttr(,PAL,Value,1,2)
04/13 11:02:48 INFO: job flags for job : 0, req napolicy=SHARED
04/13 11:02:48 MJobSetAttr(,GAttr,Value,1,5)
04/13 11:02:48 INFO: attribute 'PREEMPTEE' cleared for job
04/13 11:02:48 MStatInitializeActiveSysUsage()
04/13 11:02:48 MStatClearUsage([NONE],Active)
04/13 11:02:48 INFO: clearing usage stats for user zhangli
04/13 11:02:48 INFO: clearing usage stats for user ys
04/13 11:02:48 INFO: clearing usage stats for user zqy
04/13 11:02:48 INFO: clearing usage stats for user DEFAULT
04/13 11:02:48 INFO: clearing usage stats for user ren
04/13 11:02:48 INFO: clearing usage stats for group [DEFAULT]
04/13 11:02:48 INFO: clearing usage stats for group NOGROUP
04/13 11:02:48 INFO: clearing usage stats for group DEFAULT
04/13 11:02:48 INFO: clearing usage stats for acct DEFAULT
04/13 11:02:48 INFO: clearing usage stats for qos DEFAULT
04/13 11:02:48 INFO: clearing usage stats for qos [ALL]
04/13 11:02:48 INFO: clearing usage stats for class [NONE]
04/13 11:02:48 INFO: clearing usage stats for class [ALL]
04/13 11:02:48 INFO: clearing usage stats for class rcmm1
04/13 11:02:48 INFO: clearing usage stats for class rcmm2
04/13 11:02:48 INFO: clearing usage stats for par ALL
04/13 11:02:48 INFO: clearing usage stats for par DEFAULT
04/13 11:02:48 ServerUpdate()
04/13 11:02:48 MSysUpdateTime()
04/13 11:02:48 INFO: starting iteration 80
04/13 11:02:48 MSchedProcessJobs()
04/13 11:02:48 MRMGetInfo()
04/13 11:02:48 MClusterClearUsage()
04/13 11:02:48 MRMClusterQuery()
04/13 11:02:48 MPBSClusterQuery(rcmm1,RCount,SC)
04/13 11:02:48 __MPBSGetNodeState(Name,State,PNode)
04/13 11:02:48 INFO: PBS node rcmm5 set to state Down (state-unknown,down)
04/13 11:02:48 MNodeFind(rcmm5,N)
04/13 11:02:48 MRMNodePreUpdate(rcmm5,Down,rcmm1)
04/13 11:02:48 MPBSNodeUpdate(rcmm5,rcmm5,Down,rcmm1)
04/13 11:02:48 MPBSLoadQueueInfo(rcmm1,rcmm5,SC)
04/13 11:02:48 INFO: queue 'rcmm1' started state set to True
04/13 11:02:48 INFO: class to node mapping enabled for queue 'rcmm1'
04/13 11:02:48 INFO: queue 'rcmm2' started state set to True
04/13 11:02:48 INFO: class to node not mapping enabled for queue 'rcmm2' adding class to all nodes
04/13 11:02:48 INFO: MNode[000] ' rcmm5' Down VM: 10 Mem: 1 Dk: 1 Cl: [rcmm1 0:2][rcmm2 0:2] [rcmm1]
04/13 11:02:48 INFO: MNode[000] ' rcmm5' C/A/D procs: 2/0/0
04/13 11:02:48 MRMNodePostUpdate(rcmm5,Down)
04/13 11:02:48 __MPBSGetNodeState(Name,State,PNode)
04/13 11:02:48 INFO: PBS node rcmm6 set to state Idle (free)
04/13 11:02:48 MNodeFind(rcmm6,N)
04/13 11:02:48 MRMNodePreUpdate(rcmm6,Idle,rcmm1)
04/13 11:02:48 INFO: node 'rcmm6' changed states from Running to Idle
04/13 11:02:48 MPBSNodeUpdate(rcmm6,rcmm6,Idle,rcmm1)
04/13 11:02:48 MPBSQueryMOM(rcmm6,rcmm1,Msg,SC)
04/13 11:02:48 ALERT: cannot get req from MOM on node 'rcmm6' (errno: 0:5)
04/13 11:02:48 INFO: MOM info for host 'rcmm6' successfully updated (Thu Apr 13 11:02:48
)
04/13 11:02:48 INFO: node rcmm6 has joblist '0/5104.rcmm1'
04/13 11:02:48 MJobFind('5104.rcmm1',J,0)
04/13 11:02:48 MUGetHash(5104)
04/13 11:02:48 INFO: hash '5104' --> 5223525
04/13 11:02:48 INFO: job '5104' hash 1125
04/13 11:02:48 INFO: job '5104' found at hash[1125] 1 '5104' (J->Name: 5104)
04/13 11:02:48 INFO: job 5104 adds 1 processors per task to node rcmm6 (1)
04/13 11:02:48 MPBSLoadQueueInfo(rcmm1,rcmm6,SC)
04/13 11:02:48 INFO: queue 'rcmm1' started state set to True
04/13 11:02:48 INFO: class to node mapping enabled for queue 'rcmm1'
04/13 11:02:48 INFO: queue 'rcmm2' started state set to True
04/13 11:02:48 INFO: class to node not mapping enabled for queue 'rcmm2' adding class to all nodes
04/13 11:02:48 INFO: MNode[001] ' rcmm6' Idle VM: 10 Mem: 1 Dk: 1 Cl: [rcmm1 2:2][rcmm2 2:2] [rcmm1]
04/13 11:02:48 INFO: MNode[001] ' rcmm6' C/A/D procs: 2/2/1
04/13 11:02:48 MRMNodePostUpdate(rcmm6,Running)
04/13 11:02:48 __MPBSGetNodeState(Name,State,PNode)
04/13 11:02:48 INFO: PBS node rcmm7 set to state Down (state-unknown,down)
04/13 11:02:48 MNodeFind(rcmm7,N)
04/13 11:02:48 MRMNodePreUpdate(rcmm7,Down,rcmm1)
04/13 11:02:48 MPBSNodeUpdate(rcmm7,rcmm7,Down,rcmm1)
04/13 11:02:48 MPBSLoadQueueInfo(rcmm1,rcmm7,SC)
04/13 11:02:48 INFO: queue 'rcmm1' started state set to True
04/13 11:02:48 INFO: class to node mapping enabled for queue 'rcmm1'
04/13 11:02:48 INFO: queue 'rcmm2' started state set to True
04/13 11:02:48 INFO: class to node not mapping enabled for queue 'rcmm2' adding class to all nodes
04/13 11:02:48 INFO: MNode[002] ' rcmm7' Down VM: 10 Mem: 1 Dk: 1 Cl: [rcmm1 0:2][rcmm2 0:2] [rcmm1]
04/13 11:02:48 INFO: MNode[002] ' rcmm7' C/A/D procs: 2/0/0
04/13 11:02:48 MRMNodePostUpdate(rcmm7,Down)
04/13 11:02:48 __MPBSGetNodeState(Name,State,PNode)
04/13 11:02:48 INFO: PBS node rcmm8 set to state Idle (free)
04/13 11:02:48 MNodeFind(rcmm8,N)
04/13 11:02:48 MRMNodePreUpdate(rcmm8,Idle,rcmm1)
04/13 11:02:48 INFO: node 'rcmm8' changed states from Running to Idle
04/13 11:02:48 MPBSNodeUpdate(rcmm8,rcmm8,Idle,rcmm1)
04/13 11:02:48 MPBSQueryMOM(rcmm8,rcmm1,Msg,SC)
04/13 11:02:48 ALERT: cannot get req from MOM on node 'rcmm8' (errno: 0:5)
04/13 11:02:48 INFO: MOM info for host 'rcmm8' successfully updated (Thu Apr 13 11:02:48
)
04/13 11:02:48 INFO: node rcmm8 has joblist '0/5104.rcmm1'
04/13 11:02:48 MJobFind('5104.rcmm1',J,0)
04/13 11:02:48 MUGetHash(5104)
04/13 11:02:48 INFO: hash '5104' --> 5223525
04/13 11:02:48 INFO: job '5104' hash 1125
04/13 11:02:48 INFO: job '5104' found at hash[1125] 1 '5104' (J->Name: 5104)
04/13 11:02:48 INFO: job 5104 adds 1 processors per task to node rcmm8 (1)
04/13 11:02:48 MPBSLoadQueueInfo(rcmm1,rcmm8,SC)
04/13 11:02:48 INFO: queue 'rcmm1' started state set to True
04/13 11:02:48 INFO: class to node mapping enabled for queue 'rcmm1'
04/13 11:02:48 INFO: queue 'rcmm2' started state set to True
04/13 11:02:48 INFO: class to node not mapping enabled for queue 'rcmm2' adding class to all nodes
04/13 11:02:48 INFO: MNode[003] ' rcmm8' Idle VM: 10 Mem: 1 Dk: 1 Cl: [rcmm1 2:2][rcmm2 2:2] [rcmm1]
04/13 11:02:48 INFO: MNode[003] ' rcmm8' C/A/D procs: 2/2/1
04/13 11:02:48 MRMNodePostUpdate(rcmm8,Running)
04/13 11:02:48 __MPBSGetNodeState(Name,State,PNode)
04/13 11:02:48 INFO: PBS node rcmm9 set to state Idle (free)
04/13 11:02:48 MNodeFind(rcmm9,N)
04/13 11:02:48 MRMNodePreUpdate(rcmm9,Idle,rcmm1)
04/13 11:02:48 INFO: node 'rcmm9' changed states from Running to Idle
04/13 11:02:48 MPBSNodeUpdate(rcmm9,rcmm9,Idle,rcmm1)
04/13 11:02:48 MPBSQueryMOM(rcmm9,rcmm1,Msg,SC)
04/13 11:02:48 ALERT: cannot get req from MOM on node 'rcmm9' (errno: 0:5)
04/13 11:02:48 INFO: MOM info for host 'rcmm9' successfully updated (Thu Apr 13 11:02:48
)
04/13 11:02:48 INFO: node rcmm9 has joblist '0/5104.rcmm1'
04/13 11:02:48 MJobFind('5104.rcmm1',J,0)
04/13 11:02:48 MUGetHash(5104)
04/13 11:02:48 INFO: hash '5104' --> 5223525
04/13 11:02:48 INFO: job '5104' hash 1125
04/13 11:02:48 INFO: job '5104' found at hash[1125] 1 '5104' (J->Name: 5104)
04/13 11:02:48 INFO: job 5104 adds 1 processors per task to node rcmm9 (1)
04/13 11:02:48 MPBSLoadQueueInfo(rcmm1,rcmm9,SC)
04/13 11:02:48 INFO: queue 'rcmm1' started state set to True
04/13 11:02:48 INFO: class to node mapping enabled for queue 'rcmm1'
04/13 11:02:48 INFO: queue 'rcmm2' started state set to True
04/13 11:02:48 INFO: class to node not mapping enabled for queue 'rcmm2' adding class to all nodes
04/13 11:02:48 INFO: MNode[004] ' rcmm9' Idle VM: 10 Mem: 1 Dk: 1 Cl: [rcmm1 2:2][rcmm2 2:2] [rcmm1]
04/13 11:02:48 INFO: MNode[004] ' rcmm9' C/A/D procs: 2/2/1
04/13 11:02:48 MRMNodePostUpdate(rcmm9,Running)
04/13 11:02:48 __MPBSGetNodeState(Name,State,PNode)
04/13 11:02:48 INFO: PBS node rcmm10 set to state Idle (free)
04/13 11:02:48 MNodeFind(rcmm10,N)
04/13 11:02:48 MRMNodePreUpdate(rcmm10,Idle,rcmm1)
04/13 11:02:48 INFO: node 'rcmm10' changed states from Running to Idle
04/13 11:02:48 MPBSNodeUpdate(rcmm10,rcmm10,Idle,rcmm1)
04/13 11:02:48 MPBSQueryMOM(rcmm10,rcmm1,Msg,SC)
04/13 11:02:48 ALERT: cannot get req from MOM on node 'rcmm10' (errno: 0:5)
04/13 11:02:48 INFO: MOM info for host 'rcmm10' successfully updated (Thu Apr 13 11:02:48
)
04/13 11:02:48 INFO: node rcmm10 has joblist '0/5104.rcmm1'
04/13 11:02:48 MJobFind('5104.rcmm1',J,0)
04/13 11:02:48 MUGetHash(5104)
04/13 11:02:48 INFO: hash '5104' --> 5223525
04/13 11:02:48 INFO: job '5104' hash 1125
04/13 11:02:48 INFO: job '5104' found at hash[1125] 1 '5104' (J->Name: 5104)
04/13 11:02:48 INFO: job 5104 adds 1 processors per task to node rcmm10 (1)
04/13 11:02:48 MPBSLoadQueueInfo(rcmm1,rcmm10,SC)
04/13 11:02:48 INFO: queue 'rcmm1' started state set to True
04/13 11:02:48 INFO: class to node mapping enabled for queue 'rcmm1'
04/13 11:02:48 INFO: queue 'rcmm2' started state set to True
04/13 11:02:48 INFO: class to node not mapping enabled for queue 'rcmm2' adding class to all nodes
04/13 11:02:48 INFO: MNode[005] ' rcmm10' Idle VM: 10 Mem: 1 Dk: 1 Cl: [rcmm1 2:2][rcmm2 2:2] [rcmm1]
04/13 11:02:48 INFO: MNode[005] ' rcmm10' C/A/D procs: 2/2/1
04/13 11:02:48 MRMNodePostUpdate(rcmm10,Running)
04/13 11:02:48 __MPBSGetNodeState(Name,State,PNode)
04/13 11:02:48 INFO: PBS node rcmm11 set to state Idle (free)
04/13 11:02:48 MNodeFind(rcmm11,N)
04/13 11:02:48 MRMNodePreUpdate(rcmm11,Idle,rcmm1)
04/13 11:02:48 MPBSNodeUpdate(rcmm11,rcmm11,Idle,rcmm1)
04/13 11:02:48 MPBSQueryMOM(rcmm11,rcmm1,Msg,SC)
---------------------------------
雅虎1G免费邮箱百分百防垃圾信
雅虎助手-搜索、杀毒、防骚扰
-------------- next part --------------
An HTML attachment was scrubbed...
URL: http://www.supercluster.org/pipermail/mauiusers/attachments/20060413/f9475597/attachment-0001.html
More information about the mauiusers
mailing list