Mirror of https://github.com/newnius/YAO-scheduler.git (synced 2025-12-15 08:16:43 +00:00)
update
This commit is contained in:
@@ -98,6 +98,7 @@ func (jm *JobManager) start() {
|
|||||||
for {
|
for {
|
||||||
res := jm.status()
|
res := jm.status()
|
||||||
flag := false
|
flag := false
|
||||||
|
onlyPS := true
|
||||||
for i := range res.Status {
|
for i := range res.Status {
|
||||||
if res.Status[i].Status == "ready" {
|
if res.Status[i].Status == "ready" {
|
||||||
log.Debug(jm.job.Name, "-", i, " is ready to run")
|
log.Debug(jm.job.Name, "-", i, " is ready to run")
|
||||||
@@ -105,10 +106,12 @@ func (jm *JobManager) start() {
|
|||||||
} else if res.Status[i].Status == "running" {
|
} else if res.Status[i].Status == "running" {
|
||||||
log.Debug(jm.job.Name, "-", i, " is running")
|
log.Debug(jm.job.Name, "-", i, " is running")
|
||||||
flag = true
|
flag = true
|
||||||
|
if !jm.job.Tasks[i].IsPS {
|
||||||
|
onlyPS = false
|
||||||
|
}
|
||||||
InstanceJobHistoryLogger().submitTaskStatus(jm.job.Name, res.Status[i])
|
InstanceJobHistoryLogger().submitTaskStatus(jm.job.Name, res.Status[i])
|
||||||
} else {
|
} else {
|
||||||
log.Info(jm.job.Name, "-", i, " ", res.Status[i].Status)
|
log.Info(jm.job.Name, "-", i, " ", res.Status[i].Status)
|
||||||
|
|
||||||
/* save logs etc. */
|
/* save logs etc. */
|
||||||
|
|
||||||
/* remove exited containers */
|
/* remove exited containers */
|
||||||
@@ -132,6 +135,10 @@ func (jm *JobManager) start() {
|
|||||||
InstanceJobHistoryLogger().submitTaskStatus(jm.job.Name, res.Status[i])
|
InstanceJobHistoryLogger().submitTaskStatus(jm.job.Name, res.Status[i])
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
if onlyPS {
|
||||||
|
jm.stop()
|
||||||
|
break
|
||||||
|
}
|
||||||
if !flag {
|
if !flag {
|
||||||
break
|
break
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -141,6 +141,8 @@ type Task struct {
|
|||||||
Memory int `json:"memory"`
|
Memory int `json:"memory"`
|
||||||
NumberGPU int `json:"gpu_number"`
|
NumberGPU int `json:"gpu_number"`
|
||||||
MemoryGPU int `json:"gpu_memory"`
|
MemoryGPU int `json:"gpu_memory"`
|
||||||
|
IsPS bool `json:"is_ps"`
|
||||||
|
ModelGPU bool `json:"gpu_model"`
|
||||||
}
|
}
|
||||||
|
|
||||||
type Group struct {
|
type Group struct {
|
||||||
|
|||||||
Reference in New Issue
Block a user