diff --git a/src/job_manager.go b/src/job_manager.go index 029abaf..f2de46c 100644 --- a/src/job_manager.go +++ b/src/job_manager.go @@ -94,7 +94,17 @@ func (jm *JobManager) start() { GPUs = append(GPUs, GPU.UUID) } - for attemp := 0; attemp < 3; attemp++ { + for attempt := 0; attemp < 3; attemp++ { + if attempt == 2 { //failed more than once + //for { + // resource := jm.scheduler.AcquireResource(jm.job, jm.job.Tasks[i], jm.resources) + // if len(resource.Status) > 0 { + // break + // } + time.Sleep(time.Second * 1) + //} + } + v := url.Values{} v.Set("image", jm.job.Tasks[i].Image) v.Set("cmd", jm.job.Tasks[i].Cmd)