package status import ( "gitlink.org.cn/JointCloud/pcm-coordinator/internal/scheduler/service/inference" "gitlink.org.cn/JointCloud/pcm-coordinator/internal/storeLink" "gitlink.org.cn/JointCloud/pcm-coordinator/internal/svc" "gitlink.org.cn/JointCloud/pcm-coordinator/pkg/constants" "gitlink.org.cn/JointCloud/pcm-coordinator/pkg/models" "net/http" "strconv" "time" ) func UpdateDeployInstanceStatusBatch(svc *svc.ServiceContext, insList []*models.AiInferDeployInstance, needfilter bool) { list := make([]*models.AiInferDeployInstance, len(insList)) copy(list, insList) if needfilter { for i := len(list) - 1; i >= 0; i-- { if list[i].Status == constants.Running || list[i].Status == constants.Stopped || list[i].Status == constants.Failed { list = append(list[:i], list[i+1:]...) } } } if len(list) == 0 { return } buffer := make(chan bool, 3) for _, instance := range list { buffer <- true go UpdateDeployInstanceStatus(svc, instance, false, buffer) } } func UpdateDeployTaskStatus(svc *svc.ServiceContext) { list, err := svc.Scheduler.AiStorages.GetAllDeployTasks() if err != nil { return } ins := list[0] for i := range list { uTime, _ := time.Parse(time.RFC3339, ins.UpdateTime) latest, _ := time.Parse(time.RFC3339, list[i].UpdateTime) if latest.After(uTime) { ins = list[i] } } inslist, err := svc.Scheduler.AiStorages.GetInstanceListByDeployTaskId(ins.Id) if err != nil { return } buffer := make(chan bool, 2) for _, instance := range inslist { buffer <- true go UpdateDeployInstanceStatus(svc, instance, false, buffer) } } func UpdateDeployInstanceStatus(svc *svc.ServiceContext, instance *models.AiInferDeployInstance, updatetime bool, ch chan bool) { amap, found := svc.Scheduler.AiService.InferenceAdapterMap[strconv.FormatInt(instance.AdapterId, 10)] if !found { if ch != nil { <-ch return } return } cmap, found := amap[strconv.FormatInt(instance.ClusterId, 10)] if !found { if ch != nil { <-ch return } return } h := http.Request{} ins, err := cmap.GetInferDeployInstance(h.Context(), instance.InstanceId) if err != nil { if ch != nil { <-ch return } return } switch instance.ClusterType { case storeLink.TYPE_OCTOPUS: switch ins.Status { case "running": if instance.Status == constants.Running { if ch != nil { <-ch return } return } instance.Status = constants.Running case "stopped": if instance.Status == constants.Stopped { if ch != nil { <-ch return } return } instance.Status = constants.Stopped default: instance.Status = ins.Status } case storeLink.TYPE_MODELARTS: switch ins.Status { case "running": if instance.Status == constants.Running { if ch != nil { <-ch return } return } instance.Status = constants.Running case "stopped": if instance.Status == constants.Stopped { if ch != nil { <-ch return } return } instance.Status = constants.Stopped default: instance.Status = ins.Status } case storeLink.TYPE_SHUGUANGAI: switch ins.Status { case "Running": if instance.Status == constants.Running { if ch != nil { <-ch return } return } instance.Status = constants.Running case "Terminated": if instance.Status == constants.Stopped { if ch != nil { <-ch return } return } instance.Status = constants.Stopped default: instance.Status = ins.Status } case storeLink.TYPE_OPENI: switch ins.Status { case "RUNNING": if instance.Status == constants.Running { if ch != nil { <-ch return } return } instance.Status = constants.Running case "STOPPED": if instance.Status == constants.Stopped { if ch != nil { <-ch return } return } instance.Status = constants.Stopped case "CREATED_FAILED": if instance.Status == constants.Failed { if ch != nil { <-ch return } return } instance.Status = constants.Failed default: instance.Status = ins.Status } } err = svc.Scheduler.AiStorages.UpdateInferDeployInstance(instance, updatetime) if err != nil { if ch != nil { <-ch return } return } if ch != nil { <-ch return } } func UpdateAutoStoppedInstance(svc *svc.ServiceContext) { list, err := svc.Scheduler.AiStorages.GetInferDeployInstanceList() if err != nil { return } if len(list) == 0 { return } UpdateDeployInstanceStatusBatch(svc, list, false) } func CheckStopStatus(in *inference.DeployInstance) bool { switch in.ClusterType { case storeLink.TYPE_OCTOPUS: switch in.Status { case "stopped": return true default: return false } case storeLink.TYPE_MODELARTS: switch in.Status { case "stopped": return true default: return false } case storeLink.TYPE_SHUGUANGAI: switch in.Status { case "Terminated": return true default: return false } default: return false } } func CheckRunningStatus(in *inference.DeployInstance) bool { switch in.ClusterType { case storeLink.TYPE_OCTOPUS: switch in.Status { case "running": return true default: return false } case storeLink.TYPE_MODELARTS: switch in.Status { case "running": return true default: return false } case storeLink.TYPE_SHUGUANGAI: switch in.Status { case "Running": return true default: return false } default: return false } }