You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

serve.go 10 kB

10 months ago
10 months ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371
  1. package cmd
  2. import (
  3. "context"
  4. "fmt"
  5. "net"
  6. "os"
  7. "time"
  8. "github.com/go-co-op/gocron/v2"
  9. "gitlink.org.cn/cloudream/storage/agent/internal/http"
  10. "gitlink.org.cn/cloudream/storage/agent/internal/tickevent"
  11. "gitlink.org.cn/cloudream/common/pkgs/ioswitch/exec"
  12. "gitlink.org.cn/cloudream/common/pkgs/logger"
  13. "gitlink.org.cn/cloudream/common/pkgs/mq"
  14. cdssdk "gitlink.org.cn/cloudream/common/sdks/storage"
  15. "gitlink.org.cn/cloudream/storage/agent/internal/config"
  16. "gitlink.org.cn/cloudream/storage/agent/internal/task"
  17. stgglb "gitlink.org.cn/cloudream/storage/common/globals"
  18. stgmod "gitlink.org.cn/cloudream/storage/common/models"
  19. "gitlink.org.cn/cloudream/storage/common/pkgs/accessstat"
  20. "gitlink.org.cn/cloudream/storage/common/pkgs/connectivity"
  21. "gitlink.org.cn/cloudream/storage/common/pkgs/distlock"
  22. "gitlink.org.cn/cloudream/storage/common/pkgs/downloader"
  23. "gitlink.org.cn/cloudream/storage/common/pkgs/downloader/strategy"
  24. agtrpc "gitlink.org.cn/cloudream/storage/common/pkgs/grpc/agent"
  25. "gitlink.org.cn/cloudream/storage/common/pkgs/metacache"
  26. "gitlink.org.cn/cloudream/storage/common/pkgs/storage/agtpool"
  27. "gitlink.org.cn/cloudream/storage/common/pkgs/sysevent"
  28. "gitlink.org.cn/cloudream/storage/common/pkgs/uploader"
  29. "google.golang.org/grpc"
  30. agtmq "gitlink.org.cn/cloudream/storage/common/pkgs/mq/agent"
  31. coormq "gitlink.org.cn/cloudream/storage/common/pkgs/mq/coordinator"
  32. grpcsvc "gitlink.org.cn/cloudream/storage/agent/internal/grpc"
  33. cmdsvc "gitlink.org.cn/cloudream/storage/agent/internal/mq"
  34. )
  35. func serve(configPath string) {
  36. err := config.Init(configPath)
  37. if err != nil {
  38. fmt.Printf("init config failed, err: %s", err.Error())
  39. os.Exit(1)
  40. }
  41. err = logger.Init(&config.Cfg().Logger)
  42. if err != nil {
  43. fmt.Printf("init logger failed, err: %s", err.Error())
  44. os.Exit(1)
  45. }
  46. stgglb.InitLocal(&config.Cfg().Local)
  47. stgglb.InitMQPool(config.Cfg().RabbitMQ)
  48. stgglb.InitAgentRPCPool(&agtrpc.PoolConfig{})
  49. stgglb.Stats.SetupHubStorageTransfer(*config.Cfg().Local.HubID)
  50. stgglb.Stats.SetupHubTransfer(*config.Cfg().Local.HubID)
  51. // 获取Hub配置
  52. hubCfg := downloadHubConfig()
  53. // 初始化存储服务管理器
  54. stgAgts := agtpool.NewPool()
  55. for _, stg := range hubCfg.Storages {
  56. err := stgAgts.SetupAgent(stg)
  57. if err != nil {
  58. fmt.Printf("init storage %v: %v", stg.Storage.String(), err)
  59. os.Exit(1)
  60. }
  61. }
  62. // 初始化执行器
  63. worker := exec.NewWorker()
  64. // 初始化HTTP服务
  65. httpSvr, err := http.NewServer(config.Cfg().ListenAddr, http.NewService(&worker, stgAgts))
  66. if err != nil {
  67. logger.Fatalf("new http server failed, err: %s", err.Error())
  68. }
  69. go serveHTTP(httpSvr)
  70. // 启动网络连通性检测,并就地检测一次
  71. conCol := connectivity.NewCollector(&config.Cfg().Connectivity, func(collector *connectivity.Collector) {
  72. log := logger.WithField("Connectivity", "")
  73. coorCli, err := stgglb.CoordinatorMQPool.Acquire()
  74. if err != nil {
  75. log.Warnf("acquire coordinator mq failed, err: %s", err.Error())
  76. return
  77. }
  78. defer stgglb.CoordinatorMQPool.Release(coorCli)
  79. cons := collector.GetAll()
  80. hubCons := make([]cdssdk.HubConnectivity, 0, len(cons))
  81. for _, con := range cons {
  82. var delay *float32
  83. if con.Latency != nil {
  84. v := float32(con.Latency.Microseconds()) / 1000
  85. delay = &v
  86. }
  87. hubCons = append(hubCons, cdssdk.HubConnectivity{
  88. FromHubID: *stgglb.Local.HubID,
  89. ToHubID: con.ToHubID,
  90. Latency: delay,
  91. TestTime: con.TestTime,
  92. })
  93. }
  94. _, err = coorCli.UpdateHubConnectivities(coormq.ReqUpdateHubConnectivities(hubCons))
  95. if err != nil {
  96. log.Warnf("update hub connectivities: %v", err)
  97. }
  98. })
  99. conCol.CollectInPlace()
  100. // 初始化元数据缓存服务
  101. metacacheHost := metacache.NewHost()
  102. go metacacheHost.Serve()
  103. stgMeta := metacacheHost.AddStorageMeta()
  104. hubMeta := metacacheHost.AddHubMeta()
  105. conMeta := metacacheHost.AddConnectivity()
  106. // 启动访问统计服务
  107. acStat := accessstat.NewAccessStat(accessstat.Config{
  108. // TODO 考虑放到配置里
  109. ReportInterval: time.Second * 10,
  110. })
  111. go serveAccessStat(acStat)
  112. // 初始化分布式锁服务
  113. distlock, err := distlock.NewService(&config.Cfg().DistLock)
  114. if err != nil {
  115. logger.Fatalf("new ipfs failed, err: %s", err.Error())
  116. }
  117. // 初始化下载策略选择器
  118. strgSel := strategy.NewSelector(config.Cfg().DownloadStrategy, stgMeta, hubMeta, conMeta)
  119. // 初始化下载器
  120. dlder := downloader.NewDownloader(config.Cfg().Downloader, &conCol, stgAgts, strgSel)
  121. // 初始化上传器
  122. uploader := uploader.NewUploader(distlock, &conCol, stgAgts, stgMeta)
  123. // 初始化任务管理器
  124. taskMgr := task.NewManager(distlock, &conCol, &dlder, acStat, stgAgts, uploader)
  125. // 初始化系统事件发布器
  126. evtPub, err := sysevent.NewPublisher(sysevent.ConfigFromMQConfig(config.Cfg().RabbitMQ), &stgmod.SourceHub{
  127. HubID: hubCfg.Hub.HubID,
  128. HubName: hubCfg.Hub.Name,
  129. })
  130. if err != nil {
  131. logger.Errorf("new sysevent publisher: %v", err)
  132. os.Exit(1)
  133. }
  134. go servePublisher(evtPub)
  135. // 初始化定时任务执行器
  136. sch := setupTickTask(stgAgts, evtPub)
  137. sch.Start()
  138. defer sch.Shutdown()
  139. // 启动命令服务器
  140. // TODO 需要设计AgentID持久化机制
  141. agtSvr, err := agtmq.NewServer(cmdsvc.NewService(&taskMgr, stgAgts), config.Cfg().ID, config.Cfg().RabbitMQ)
  142. if err != nil {
  143. logger.Fatalf("new agent server failed, err: %s", err.Error())
  144. }
  145. agtSvr.OnError(func(err error) {
  146. logger.Warnf("agent server err: %s", err.Error())
  147. })
  148. go serveAgentServer(agtSvr)
  149. // 启动GRPC服务
  150. listenAddr := config.Cfg().GRPC.MakeListenAddress()
  151. lis, err := net.Listen("tcp", listenAddr)
  152. if err != nil {
  153. logger.Fatalf("listen on %s failed, err: %s", listenAddr, err.Error())
  154. }
  155. s := grpc.NewServer()
  156. agtrpc.RegisterAgentServer(s, grpcsvc.NewService(&worker, stgAgts))
  157. go serveGRPC(s, lis)
  158. go serveDistLock(distlock)
  159. foever := make(chan struct{})
  160. <-foever
  161. }
  162. func downloadHubConfig() coormq.GetHubConfigResp {
  163. coorCli, err := stgglb.CoordinatorMQPool.Acquire()
  164. if err != nil {
  165. logger.Errorf("new coordinator client: %v", err)
  166. os.Exit(1)
  167. }
  168. defer stgglb.CoordinatorMQPool.Release(coorCli)
  169. cfgResp, err := coorCli.GetHubConfig(coormq.ReqGetHubConfig(cdssdk.HubID(config.Cfg().ID)))
  170. if err != nil {
  171. logger.Errorf("getting hub config: %v", err)
  172. os.Exit(1)
  173. }
  174. return *cfgResp
  175. }
  176. func servePublisher(evtPub *sysevent.Publisher) {
  177. logger.Info("start serving sysevent publisher")
  178. ch := evtPub.Start()
  179. loop:
  180. for {
  181. val, err := ch.Receive().Wait(context.Background())
  182. if err != nil {
  183. logger.Errorf("sysevent publisher stopped with error: %s", err.Error())
  184. break
  185. }
  186. switch val := val.(type) {
  187. case sysevent.PublishError:
  188. logger.Errorf("publishing event: %v", val)
  189. case sysevent.PublisherExited:
  190. if val.Err != nil {
  191. logger.Errorf("publisher exited with error: %v", val.Err)
  192. } else {
  193. logger.Info("publisher exited")
  194. }
  195. break loop
  196. case sysevent.OtherError:
  197. logger.Errorf("sysevent: %v", val)
  198. }
  199. }
  200. logger.Info("sysevent publisher stopped")
  201. // TODO 仅简单结束了程序
  202. os.Exit(1)
  203. }
  204. func setupTickTask(agtPool *agtpool.AgentPool, evtPub *sysevent.Publisher) gocron.Scheduler {
  205. sch, err := gocron.NewScheduler()
  206. if err != nil {
  207. logger.Errorf("new cron scheduler: %s", err.Error())
  208. os.Exit(1)
  209. }
  210. sch.NewJob(gocron.DailyJob(1, gocron.NewAtTimes(
  211. gocron.NewAtTime(0, 0, 0),
  212. )), gocron.NewTask(tickevent.ReportStorageStats, agtPool, evtPub))
  213. sch.NewJob(gocron.DailyJob(1, gocron.NewAtTimes(
  214. gocron.NewAtTime(0, 0, 1),
  215. )), gocron.NewTask(tickevent.ReportHubTransferStats, evtPub))
  216. sch.NewJob(gocron.DailyJob(1, gocron.NewAtTimes(
  217. gocron.NewAtTime(0, 0, 2),
  218. )), gocron.NewTask(tickevent.ReportHubStorageTransferStats, evtPub))
  219. // sch.NewJob(gocron.DurationJob(time.Minute), gocron.NewTask(tickevent.ReportStorageStats, agtPool, evtPub))
  220. // sch.NewJob(gocron.DurationJob(time.Minute), gocron.NewTask(tickevent.ReportHubTransferStats, evtPub))
  221. // sch.NewJob(gocron.DurationJob(time.Minute), gocron.NewTask(tickevent.ReportHubStorageTransferStats, agtPool, evtPub))
  222. return sch
  223. }
  224. func serveAgentServer(server *agtmq.Server) {
  225. logger.Info("start serving command server")
  226. ch := server.Start()
  227. loop:
  228. for {
  229. val, err := ch.Receive()
  230. if err != nil {
  231. logger.Errorf("command server stopped with error: %s", err.Error())
  232. break
  233. }
  234. switch val := val.(type) {
  235. case error:
  236. logger.Errorf("rabbitmq connect with error: %v", val)
  237. case mq.ServerExit:
  238. if val.Error != nil {
  239. logger.Errorf("rabbitmq server exit with error: %v", val.Error)
  240. } else {
  241. logger.Info("rabbitmq server exit")
  242. }
  243. break loop
  244. }
  245. }
  246. logger.Info("command server stopped")
  247. // TODO 仅简单结束了程序
  248. os.Exit(1)
  249. }
  250. func serveGRPC(s *grpc.Server, lis net.Listener) {
  251. logger.Info("start serving grpc")
  252. err := s.Serve(lis)
  253. if err != nil {
  254. logger.Errorf("grpc stopped with error: %s", err.Error())
  255. }
  256. logger.Info("grpc stopped")
  257. // TODO 仅简单结束了程序
  258. os.Exit(1)
  259. }
  260. func serveHTTP(server *http.Server) {
  261. logger.Info("start serving http")
  262. err := server.Serve()
  263. if err != nil {
  264. logger.Errorf("http stopped with error: %s", err.Error())
  265. }
  266. logger.Info("http stopped")
  267. // TODO 仅简单结束了程序
  268. os.Exit(1)
  269. }
  270. func serveDistLock(svc *distlock.Service) {
  271. logger.Info("start serving distlock")
  272. err := svc.Serve()
  273. if err != nil {
  274. logger.Errorf("distlock stopped with error: %s", err.Error())
  275. }
  276. logger.Info("distlock stopped")
  277. // TODO 仅简单结束了程序
  278. os.Exit(1)
  279. }
  280. func serveAccessStat(svc *accessstat.AccessStat) {
  281. logger.Info("start serving access stat")
  282. ch := svc.Start()
  283. loop:
  284. for {
  285. val, err := ch.Receive()
  286. if err != nil {
  287. logger.Errorf("access stat stopped with error: %v", err)
  288. break
  289. }
  290. switch val := val.(type) {
  291. case error:
  292. logger.Errorf("access stat stopped with error: %v", val)
  293. break loop
  294. }
  295. }
  296. logger.Info("access stat stopped")
  297. // TODO 仅简单结束了程序
  298. os.Exit(1)
  299. }

本项目旨在将云际存储公共基础设施化,使个人及企业可低门槛使用高效的云际存储服务(安装开箱即用云际存储客户端即可,无需关注其他组件的部署),同时支持用户灵活便捷定制云际存储的功能细节。