You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

aiService.go 5.3 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131
  1. package service
  2. import (
  3. "github.com/zeromicro/go-zero/zrpc"
  4. hpcacclient "gitlink.org.cn/JointCloud/pcm-ac/hpcacclient"
  5. "gitlink.org.cn/JointCloud/pcm-coordinator/internal/config"
  6. "gitlink.org.cn/JointCloud/pcm-coordinator/internal/scheduler/database"
  7. "gitlink.org.cn/JointCloud/pcm-coordinator/internal/scheduler/service/collector"
  8. "gitlink.org.cn/JointCloud/pcm-coordinator/internal/scheduler/service/executor"
  9. "gitlink.org.cn/JointCloud/pcm-coordinator/internal/scheduler/service/inference"
  10. "gitlink.org.cn/JointCloud/pcm-coordinator/internal/storeLink"
  11. "gitlink.org.cn/JointCloud/pcm-coordinator/internal/types"
  12. "gitlink.org.cn/JointCloud/pcm-modelarts/client/imagesservice"
  13. "gitlink.org.cn/JointCloud/pcm-modelarts/client/modelartsservice"
  14. "gitlink.org.cn/JointCloud/pcm-octopus/octopusclient"
  15. "strconv"
  16. "sync"
  17. )
  // Cluster names recognised by InitAiClusterMap and UpdateClusterMaps. Both
  // functions switch on the cluster's Name field; a cluster whose Name equals
  // none of these values gets no executor, collector or inference entry.
  const (
  	// MODELARTS selects the link built by storeLink.NewModelArtsLink.
  	MODELARTS = "modelarts"
  	// OCTOPUS selects the link built by storeLink.NewOctopusLink.
  	OCTOPUS = "octopus"
  	// SHUGUANGAI selects the link built by storeLink.NewShuguangAi.
  	SHUGUANGAI = "shuguangAi"
  )
  23. type AiService struct {
  24. AiExecutorAdapterMap map[string]map[string]executor.AiExecutor
  25. AiCollectorAdapterMap map[string]map[string]collector.AiCollector
  26. InferenceAdapterMap map[string]map[string]inference.ICluster
  27. Storage *database.AiStorage
  28. mu sync.Mutex
  29. }
  30. func NewAiService(conf *config.Config, storages *database.AiStorage) (*AiService, error) {
  31. var aiType = "1"
  32. adapterIds, err := storages.GetAdapterIdsByType(aiType)
  33. if err != nil {
  34. return nil, err
  35. }
  36. aiService := &AiService{
  37. AiExecutorAdapterMap: make(map[string]map[string]executor.AiExecutor),
  38. AiCollectorAdapterMap: make(map[string]map[string]collector.AiCollector),
  39. InferenceAdapterMap: make(map[string]map[string]inference.ICluster),
  40. Storage: storages,
  41. }
  42. for _, id := range adapterIds {
  43. clusters, err := storages.GetClustersByAdapterId(id)
  44. if err != nil {
  45. return nil, err
  46. }
  47. if len(clusters.List) == 0 {
  48. continue
  49. }
  50. exeClusterMap, colClusterMap, inferMap := InitAiClusterMap(conf, clusters.List)
  51. aiService.AiExecutorAdapterMap[id] = exeClusterMap
  52. aiService.AiCollectorAdapterMap[id] = colClusterMap
  53. aiService.InferenceAdapterMap[id] = inferMap
  54. }
  55. return aiService, nil
  56. }
  57. func InitAiClusterMap(conf *config.Config, clusters []types.ClusterInfo) (map[string]executor.AiExecutor, map[string]collector.AiCollector, map[string]inference.ICluster) {
  58. executorMap := make(map[string]executor.AiExecutor)
  59. collectorMap := make(map[string]collector.AiCollector)
  60. inferenceMap := make(map[string]inference.ICluster)
  61. for _, c := range clusters {
  62. switch c.Name {
  63. case OCTOPUS:
  64. id, _ := strconv.ParseInt(c.Id, 10, 64)
  65. octopusRpc := octopusclient.NewOctopus(zrpc.MustNewClient(conf.OctopusRpcConf))
  66. octopus := storeLink.NewOctopusLink(octopusRpc, c.Nickname, id)
  67. collectorMap[c.Id] = octopus
  68. executorMap[c.Id] = octopus
  69. inferenceMap[c.Id] = octopus
  70. case MODELARTS:
  71. id, _ := strconv.ParseInt(c.Id, 10, 64)
  72. modelArtsRpc := modelartsservice.NewModelArtsService(zrpc.MustNewClient(conf.ModelArtsRpcConf))
  73. modelArtsImgRpc := imagesservice.NewImagesService(zrpc.MustNewClient(conf.ModelArtsImgRpcConf))
  74. modelarts := storeLink.NewModelArtsLink(modelArtsRpc, modelArtsImgRpc, c.Name, id, c.Nickname)
  75. collectorMap[c.Id] = modelarts
  76. executorMap[c.Id] = modelarts
  77. inferenceMap[c.Id] = modelarts
  78. case SHUGUANGAI:
  79. id, _ := strconv.ParseInt(c.Id, 10, 64)
  80. aCRpc := hpcacclient.NewHpcAC(zrpc.MustNewClient(conf.ACRpcConf))
  81. sgai := storeLink.NewShuguangAi(aCRpc, c.Nickname, id)
  82. collectorMap[c.Id] = sgai
  83. executorMap[c.Id] = sgai
  84. inferenceMap[c.Id] = sgai
  85. }
  86. }
  87. return executorMap, collectorMap, inferenceMap
  88. }
  89. func (as *AiService) UpdateClusterMaps(conf *config.Config, adapterId string, clusters []types.ClusterInfo) {
  90. for _, c := range clusters {
  91. _, ok := as.AiExecutorAdapterMap[adapterId][c.Id]
  92. _, ok2 := as.AiCollectorAdapterMap[adapterId][c.Id]
  93. _, ok3 := as.InferenceAdapterMap[adapterId][c.Id]
  94. if !ok && !ok2 && !ok3 {
  95. switch c.Name {
  96. case OCTOPUS:
  97. id, _ := strconv.ParseInt(c.Id, 10, 64)
  98. octopusRpc := octopusclient.NewOctopus(zrpc.MustNewClient(conf.OctopusRpcConf))
  99. octopus := storeLink.NewOctopusLink(octopusRpc, c.Nickname, id)
  100. as.AiExecutorAdapterMap[adapterId][c.Id] = octopus
  101. as.AiCollectorAdapterMap[adapterId][c.Id] = octopus
  102. as.InferenceAdapterMap[adapterId][c.Id] = octopus
  103. case MODELARTS:
  104. id, _ := strconv.ParseInt(c.Id, 10, 64)
  105. modelArtsRpc := modelartsservice.NewModelArtsService(zrpc.MustNewClient(conf.ModelArtsRpcConf))
  106. modelArtsImgRpc := imagesservice.NewImagesService(zrpc.MustNewClient(conf.ModelArtsImgRpcConf))
  107. modelarts := storeLink.NewModelArtsLink(modelArtsRpc, modelArtsImgRpc, c.Name, id, c.Nickname)
  108. as.AiExecutorAdapterMap[adapterId][c.Id] = modelarts
  109. as.AiCollectorAdapterMap[adapterId][c.Id] = modelarts
  110. as.InferenceAdapterMap[adapterId][c.Id] = modelarts
  111. case SHUGUANGAI:
  112. id, _ := strconv.ParseInt(c.Id, 10, 64)
  113. aCRpc := hpcacclient.NewHpcAC(zrpc.MustNewClient(conf.ACRpcConf))
  114. sgai := storeLink.NewShuguangAi(aCRpc, c.Nickname, id)
  115. as.AiExecutorAdapterMap[adapterId][c.Id] = sgai
  116. as.AiCollectorAdapterMap[adapterId][c.Id] = sgai
  117. as.InferenceAdapterMap[adapterId][c.Id] = sgai
  118. }
  119. } else {
  120. continue
  121. }
  122. }
  123. }

PCM is positioned as a software stack over the cloud, aiming to build the standards and ecosystem of heterogeneous cloud collaboration for JCC in a non-intrusive and autonomous peer-to-peer manner.