2019-03-04 09:19:55 +00:00
|
|
|
package main
|
|
|
|
|
|
|
|
import (
|
|
|
|
"sync"
|
2019-04-29 09:05:15 +00:00
|
|
|
"time"
|
|
|
|
"strconv"
|
|
|
|
"fmt"
|
|
|
|
)
|
2019-03-04 09:19:55 +00:00
|
|
|
|
|
|
|
type ResourcePool struct {
|
2019-04-29 09:05:15 +00:00
|
|
|
mu sync.Mutex
|
2019-04-18 09:25:37 +00:00
|
|
|
nodes map[string]NodeStatus
|
2019-04-29 09:05:15 +00:00
|
|
|
|
|
|
|
history []map[string]string
|
|
|
|
}
|
|
|
|
|
|
|
|
func (pool *ResourcePool) start() {
|
|
|
|
go func() {
|
|
|
|
for {
|
|
|
|
summary := map[string]string{}
|
|
|
|
|
|
|
|
UtilCPU := 0.0
|
|
|
|
TotalCPU := 0
|
|
|
|
TotalMem := 0
|
|
|
|
AvailableMem := 0
|
|
|
|
|
|
|
|
TotalGPU := 0
|
|
|
|
UtilGPU := 0
|
|
|
|
TotalMemGPU := 0
|
|
|
|
AvailableMemGPU := 0
|
|
|
|
for _, node := range pool.nodes {
|
|
|
|
if i, err := strconv.ParseFloat(node.UtilCPU, 64); err != nil {
|
|
|
|
UtilCPU += i
|
|
|
|
}
|
|
|
|
TotalCPU += node.NumCPU
|
|
|
|
TotalMem += str2int(node.MemTotal, 0)
|
|
|
|
AvailableMem += str2int(node.MemAvailable, 0)
|
|
|
|
|
|
|
|
for _, GPU := range node.Status {
|
|
|
|
UtilGPU += GPU.UtilizationGPU
|
|
|
|
TotalGPU ++
|
|
|
|
TotalMemGPU += GPU.MemoryTotal
|
|
|
|
AvailableMemGPU += GPU.MemoryFree
|
|
|
|
}
|
|
|
|
}
|
|
|
|
summary["ts"] = time.Now().Format("2006-01-02 15:04:05")
|
|
|
|
summary["cpu_util"] = fmt.Sprintf("%.2f", UtilCPU/(float64(len(pool.nodes))+0.001))
|
|
|
|
summary["cpu_total"] = strconv.Itoa(TotalCPU)
|
|
|
|
summary["mem_total"] = strconv.Itoa(TotalMem)
|
|
|
|
summary["mem_available"] = strconv.Itoa(AvailableMem)
|
|
|
|
summary["gpu_total"] = strconv.Itoa(TotalGPU)
|
|
|
|
if TotalGPU == 0 {
|
|
|
|
summary["gpu_util"] = "0"
|
|
|
|
} else {
|
|
|
|
summary["gpu_util"] = fmt.Sprintf("%2d", UtilGPU/TotalGPU)
|
|
|
|
}
|
|
|
|
summary["gpu_mem_total"] = strconv.Itoa(TotalMemGPU)
|
|
|
|
summary["gpu_mem_available"] = strconv.Itoa(AvailableMemGPU)
|
|
|
|
|
|
|
|
pool.history = append(pool.history, summary)
|
|
|
|
|
|
|
|
if len(pool.history) > 60 {
|
|
|
|
pool.history = pool.history[0:60]
|
|
|
|
}
|
|
|
|
time.Sleep(time.Second * 60)
|
|
|
|
}
|
|
|
|
}()
|
2019-03-04 09:19:55 +00:00
|
|
|
}
|
|
|
|
|
2019-04-16 08:59:19 +00:00
|
|
|
func (pool *ResourcePool) update(node NodeStatus) {
|
2019-03-04 09:19:55 +00:00
|
|
|
pool.mu.Lock()
|
|
|
|
defer pool.mu.Unlock()
|
|
|
|
|
2019-03-20 03:14:07 +00:00
|
|
|
status, ok := pool.nodes[node.ClientID]
|
|
|
|
if ok {
|
2019-04-16 08:59:19 +00:00
|
|
|
for i, GPU := range status.Status {
|
|
|
|
if GPU.UUID == node.Status[i].UUID {
|
|
|
|
node.Status[i].MemoryAllocated = GPU.MemoryAllocated
|
2019-03-20 03:14:07 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2019-04-16 08:59:19 +00:00
|
|
|
pool.nodes[node.ClientID] = node
|
2019-03-20 03:14:07 +00:00
|
|
|
|
|
|
|
//log.Println(pool.nodes)
|
2019-03-04 09:19:55 +00:00
|
|
|
}
|
|
|
|
|
2019-04-18 09:25:37 +00:00
|
|
|
func (pool *ResourcePool) getByID(id string) NodeStatus {
|
2019-03-04 09:19:55 +00:00
|
|
|
pool.mu.Lock()
|
|
|
|
defer pool.mu.Unlock()
|
|
|
|
|
|
|
|
status, ok := pool.nodes[id]
|
|
|
|
if ok {
|
|
|
|
return status
|
|
|
|
}
|
2019-04-16 08:59:19 +00:00
|
|
|
return NodeStatus{}
|
2019-03-04 09:19:55 +00:00
|
|
|
}
|
2019-04-29 09:05:15 +00:00
|
|
|
|
|
|
|
func (pool *ResourcePool) list() MsgResource {
|
|
|
|
return MsgResource{Code: 0, Resource: pool.nodes}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (pool *ResourcePool) statusHistory() MsgPoolStatusHistory {
|
|
|
|
return MsgPoolStatusHistory{Code: 0, Data: pool.history}
|
|
|
|
}
|