@@ -1058,7 +1058,6 @@ func (qjm *XController) ScheduleNext(qj *arbv1.AppWrapper) {
10581058 klog .V (3 ).Infof ("[ScheduleNext] Cannot pop QueueJob from qjqueue! err=%#v" , retryErr )
10591059 return err
10601060 }
1061- klog .V (3 ).Infof ("[ScheduleNext] activeQ.Pop_afterPriorityUpdate %s/%s *Delay=%.6f seconds RemainingLength=%d" , qj .Namespace , qj .Name , time .Now ().Sub (qj .Status .ControllerFirstTimestamp .Time ).Seconds (), qjm .qjqueue .Length ())
10621061 klog .V (4 ).Infof ("[ScheduleNext] activeQ.Pop_afterPriorityUpdate %s/%s *Delay=%.6f seconds RemainingLength=%d Version=%s Status=%+v" , qj .Namespace , qj .Name , time .Now ().Sub (qj .Status .ControllerFirstTimestamp .Time ).Seconds (), qjm .qjqueue .Length (), qj .ResourceVersion , qj .Status )
10631062 apiCacheAWJob , retryErr := qjm .getAppWrapper (qj .Namespace , qj .Name , "[ScheduleNext] -- after dynamic priority pop" )
10641063 if retryErr != nil {
@@ -1069,7 +1068,6 @@ func (qjm *XController) ScheduleNext(qj *arbv1.AppWrapper) {
10691068 return err
10701069 }
10711070 if apiCacheAWJob .Status .CanRun {
1072- klog .V (3 ).Infof ("[ScheduleNext] AppWrapper job: %s/%s from API is already scheduled. Ignoring request" , qj .Namespace , qj .Name )
10731071 klog .V (4 ).Infof ("[ScheduleNext] AppWrapper job: %s/%s from API is already scheduled. Ignoring request: Status=%+v" , qj .Namespace , qj .Name , qj .Status )
10741072 return nil
10751073 }
@@ -1095,10 +1093,8 @@ func (qjm *XController) ScheduleNext(qj *arbv1.AppWrapper) {
10951093
10961094 klog .V (4 ).Infof ("[ScheduleNext] after Pop qjqLength=%d qj %s/%s Version=%s activeQ=%t Unsched=%t Status=%v" , qjm .qjqueue .Length (), qj .Namespace , qj .Name , qj .ResourceVersion , qjm .qjqueue .IfExistActiveQ (qj ), qjm .qjqueue .IfExistUnschedulableQ (qj ), qj .Status )
10971095 if qjm .isDispatcher {
1098- klog .V (3 ).Infof ("[ScheduleNext] [Dispatcher Mode] Attempting to dispatch next appwrapper: '%s/%s" , qj .Namespace , qj .Name )
10991096 klog .V (4 ).Infof ("[ScheduleNext] [Dispatcher Mode] Attempting to dispatch next appwrapper: '%s/%s Status=%v" , qj .Namespace , qj .Name , qj .Status )
11001097 } else {
1101- klog .V (3 ).Infof ("[ScheduleNext] [Agent Mode] Attempting to dispatch next appwrapper: '%s/%s'" , qj .Namespace , qj .Name )
11021098 klog .V (4 ).Infof ("[ScheduleNext] [Agent Mode] Attempting to dispatch next appwrapper: '%s/%s' Status=%v" , qj .Namespace , qj .Name , qj .Status )
11031099 }
11041100
@@ -1236,16 +1232,14 @@ func (qjm *XController) ScheduleNext(qj *arbv1.AppWrapper) {
12361232 klog .Info ("%s %s %s" , quotaFits , preemptAWs , msg )
12371233
12381234 if quotaFits {
1239- klog .V (3 ).Infof ("[ScheduleNext] [Agent mode] quota evaluation successful for app wrapper '%s/%s'" , qj .Namespace , qj .Name )
12401235 klog .V (4 ).Infof ("[ScheduleNext] [Agent mode] quota evaluation successful for app wrapper '%s/%s' activeQ=%t Unsched=%t Version=%s Status=%+v" ,
12411236 qj .Namespace , qj .Name , time .Now ().Sub (HOLStartTime ), qjm .qjqueue .IfExistActiveQ (qj ), qjm .qjqueue .IfExistUnschedulableQ (qj ), qj .ResourceVersion , qj .Status )
12421237 // Set any jobs that are marked for preemption
12431238 qjm .preemptAWJobs (ctx , preemptAWs )
12441239 } else { // Not enough free quota to dispatch appwrapper
12451240 dispatchFailedMessage = "Insufficient quota and/or resources to dispatch AppWrapper."
12461241 dispatchFailedReason = "quota limit exceeded"
1247- klog .V (3 ).Infof ("[ScheduleNext] [Agent Mode] Blocking dispatch for app wrapper '%s/%s' due to quota limits, msg=%s" , qj .Namespace , qj .Name , msg )
1248- klog .V (4 ).Infof ("[ScheduleNext] [Agent Mode] Blocking dispatch for app wrapper '%s/%s' due to quota limits, activeQ=%t Unsched=%t Version=%s Status=%+v msg=%s" ,
1242+ klog .Infof ("[ScheduleNext] [Agent Mode] Blocking dispatch for app wrapper '%s/%s' due to quota limits, activeQ=%t Unsched=%t Version=%s Status=%+v msg=%s" ,
12491243 qj .Namespace , qj .Name , time .Now ().Sub (HOLStartTime ), qjm .qjqueue .IfExistActiveQ (qj ), qjm .qjqueue .IfExistUnschedulableQ (qj ), qj .ResourceVersion , qj .Status , msg )
12501244 // Call update etcd here to retrigger AW execution for failed quota
12511245 // TODO: quota management tests fail if this is converted into go-routine, need to inspect why?
@@ -1264,15 +1258,12 @@ func (qjm *XController) ScheduleNext(qj *arbv1.AppWrapper) {
12641258
12651259 if aggqj .LessEqual (resources ) { // Check if enough resources to dispatch
12661260 fits = true
1267- klog .V (3 ).Infof ("[ScheduleNext] [Agent Mode] available resource successful check for '%s/%s'" , qj .Namespace , qj .Name )
12681261 klog .V (4 ).Infof ("[ScheduleNext] [Agent Mode] available resource successful check for '%s/%s' at %s activeQ=%t Unsched=%t Version=%s Status=%+v." ,
12691262 qj .Namespace , qj .Name , time .Now ().Sub (HOLStartTime ), qjm .qjqueue .IfExistActiveQ (qj ), qjm .qjqueue .IfExistUnschedulableQ (qj ), qj .ResourceVersion , qj .Status )
12701263 } else { // Not enough free resources to dispatch HOL
12711264 fits = false
12721265 dispatchFailedMessage = "Insufficient resources to dispatch AppWrapper."
1273- klog .V (3 ).Infof ("[ScheduleNext] [Agent Mode] Failed to dispatch app wrapper '%s/%s' due to insufficient resources" ,
1274- qj .Namespace , qj .Name )
1275- klog .V (4 ).Infof ("[ScheduleNext] [Agent Mode] Failed to dispatch app wrapper '%s/%s' due to insufficient resources, activeQ=%t Unsched=%t Version=%s Status=%+v" ,
1266+ klog .Infof ("[ScheduleNext] [Agent Mode] Failed to dispatch app wrapper '%s/%s' due to insufficient resources, activeQ=%t Unsched=%t Version=%s Status=%+v" ,
12761267 qj .Namespace , qj .Name , qjm .qjqueue .IfExistActiveQ (qj ),
12771268 qjm .qjqueue .IfExistUnschedulableQ (qj ), qj .ResourceVersion , qj .Status )
12781269 // TODO: Remove forwarded logic as a big AW will never be forwarded
@@ -1336,9 +1327,7 @@ func (qjm *XController) ScheduleNext(qj *arbv1.AppWrapper) {
13361327 fowardingLoopCount += 1
13371328 }
13381329 if ! forwarded { // start thread to backoff
1339- klog .V (3 ).Infof ("[ScheduleNext] [Agent Mode] backing off app wrapper '%s/%s' after waiting for %s" ,
1340- qj .Namespace , qj .Name , time .Now ().Sub (HOLStartTime ))
1341- klog .V (4 ).Infof ("[ScheduleNext] [Agent Mode] backing off app wrapper '%s/%s' after waiting for %s activeQ=%t Unsched=%t Version=%s Status=%+v" ,
1330+ klog .Infof ("[ScheduleNext] [Agent Mode] backing off app wrapper '%s/%s' after waiting for %s activeQ=%t Unsched=%t Version=%s Status=%+v" ,
13421331 qj .Namespace , qj .Name , time .Now ().Sub (HOLStartTime ), qjm .qjqueue .IfExistActiveQ (qj ), qjm .qjqueue .IfExistUnschedulableQ (qj ), qj .ResourceVersion , qj .Status )
13431332 if qjm .quotaManager != nil && quotaFits {
13441333 qjm .quotaManager .Release (qj )
@@ -1477,8 +1466,6 @@ func (qjm *XController) backoff(ctx context.Context, q *arbv1.AppWrapper, reason
14771466 klog .Errorf ("[backoff] Failed to update status for %s/%s. Continuing with possible stale object without updating conditions. err=%s" , q .Namespace , q .Name , err )
14781467 }
14791468 qjm .qjqueue .AddUnschedulableIfNotPresent (q )
1480- klog .V (3 ).Infof ("[backoff] %s/%s move to unschedulableQ before sleep for %d seconds. Unsched=%t" , q .Namespace , q .Name ,
1481- qjm .config .BackoffTimeOrDefault (defaultBackoffTime ), qjm .qjqueue .IfExistUnschedulableQ (q ))
14821469 klog .V (4 ).Infof ("[backoff] %s/%s move to unschedulableQ before sleep for %d seconds. activeQ=%t Unsched=%t Version=%s Status=%+v" , q .Namespace , q .Name ,
14831470 qjm .config .BackoffTimeOrDefault (defaultBackoffTime ), qjm .qjqueue .IfExistActiveQ (q ), qjm .qjqueue .IfExistUnschedulableQ (q ), q .ResourceVersion , q .Status )
14841471 time .Sleep (time .Duration (qjm .config .BackoffTimeOrDefault (defaultBackoffTime )) * time .Second )
@@ -1587,8 +1574,6 @@ func (qjm *XController) UpdateQueueJobs(newjob *arbv1.AppWrapper) {
15871574 qjm .eventQueue .Delete (updateQj )
15881575 qjm .qjqueue .Delete (updateQj )
15891576 }
1590- klog .V (3 ).Infof ("[UpdateQueueJobs] Done getting completion status for app wrapper '%s/%s' Status.CanRun=%t Status.State=%s" , newjob .Namespace , newjob .Name ,
1591- newjob .Status .CanRun , newjob .Status .State )
15921577 klog .V (4 ).Infof ("[UpdateQueueJobs] Done getting completion status for app wrapper '%s/%s' Version=%s Status.CanRun=%t Status.State=%s, pod counts [Pending: %d, Running: %d, Succeded: %d, Failed %d]" , newjob .Namespace , newjob .Name , newjob .ResourceVersion ,
15931578 newjob .Status .CanRun , newjob .Status .State , newjob .Status .Pending , newjob .Status .Running , newjob .Status .Succeeded , newjob .Status .Failed )
15941579 }
@@ -1839,7 +1824,7 @@ func (cc *XController) agentEventQueueWorker() {
18391824
18401825 return nil
18411826 }
1842- klog .V (3 ).Infof ("[Controller: Dispatcher Mode] XQJ Status Update from AGENT: Name:%s, Namespace:%s, Status: %+v\n " , queuejob .Name , queuejob .Namespace , queuejob .Status )
1827+ klog .V (4 ).Infof ("[Controller: Dispatcher Mode] XQJ Status Update from AGENT: Name:%s, Namespace:%s, Status: %+v\n " , queuejob .Name , queuejob .Namespace , queuejob .Status )
18431828
18441829 // sync AppWrapper
18451830 if err := cc .updateQueueJobStatus (ctx , queuejob ); err != nil {
@@ -2160,7 +2145,6 @@ func (cc *XController) manageQueueJob(ctx context.Context, qj *arbv1.AppWrapper,
21602145 }
21612146 return nil
21622147 } else if qj .Status .CanRun && qj .Status .State == arbv1 .AppWrapperStateActive {
2163- klog .V (3 ).Infof ("[manageQueueJob] Getting completion status for app wrapper '%s/%s' Status.CanRun=%t Status.State=%s" , qj .Namespace , qj .Name , qj .Status .CanRun , qj .Status .State )
21642148 klog .V (4 ).Infof ("[manageQueueJob] Getting completion status for app wrapper '%s/%s' Version=%s Status.CanRun=%t Status.State=%s, pod counts [Pending: %d, Running: %d, Succeded: %d, Failed %d]" , qj .Namespace , qj .Name , qj .ResourceVersion ,
21652149 qj .Status .CanRun , qj .Status .State , qj .Status .Pending , qj .Status .Running , qj .Status .Succeeded , qj .Status .Failed )
21662150
0 commit comments