You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

agent_check_state.go 3.8 kB

2 years ago
2 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117
  1. package event
  2. import (
  3. "database/sql"
  4. "time"
  5. "github.com/samber/lo"
  6. "gitlink.org.cn/cloudream/common/pkgs/logger"
  7. "gitlink.org.cn/cloudream/common/pkgs/mq"
  8. "gitlink.org.cn/cloudream/storage-common/consts"
  9. "gitlink.org.cn/cloudream/storage-common/globals"
  10. "gitlink.org.cn/cloudream/storage-common/pkgs/db/model"
  11. "gitlink.org.cn/cloudream/storage-common/pkgs/distlock/reqbuilder"
  12. agtmq "gitlink.org.cn/cloudream/storage-common/pkgs/mq/agent"
  13. scevt "gitlink.org.cn/cloudream/storage-common/pkgs/mq/scanner/event"
  14. "gitlink.org.cn/cloudream/storage-scanner/internal/config"
  15. )
  16. type AgentCheckState struct {
  17. scevt.AgentCheckState
  18. }
  19. func NewAgentCheckState(nodeID int64) *AgentCheckState {
  20. return &AgentCheckState{
  21. AgentCheckState: scevt.NewAgentCheckState(nodeID),
  22. }
  23. }
  24. func (t *AgentCheckState) TryMerge(other Event) bool {
  25. event, ok := other.(*AgentCheckState)
  26. if !ok {
  27. return false
  28. }
  29. return t.NodeID == event.NodeID
  30. }
  31. func (t *AgentCheckState) Execute(execCtx ExecuteContext) {
  32. log := logger.WithType[AgentCheckState]("Event")
  33. log.Debugf("begin with %v", logger.FormatStruct(t))
  34. defer log.Debugf("end")
  35. mutex, err := reqbuilder.NewBuilder().
  36. Metadata().
  37. // 查询、修改节点状态
  38. Node().WriteOne(t.NodeID).
  39. MutexLock(execCtx.Args.DistLock)
  40. if err != nil {
  41. log.Warnf("acquire locks failed, err: %s", err.Error())
  42. return
  43. }
  44. defer mutex.Unlock()
  45. node, err := execCtx.Args.DB.Node().GetByID(execCtx.Args.DB.SQLCtx(), t.NodeID)
  46. if err == sql.ErrNoRows {
  47. return
  48. }
  49. if err != nil {
  50. log.WithField("NodeID", t.NodeID).Warnf("get node by id failed, err: %s", err.Error())
  51. return
  52. }
  53. agentClient, err := globals.AgentMQPool.Acquire(t.NodeID)
  54. if err != nil {
  55. log.WithField("NodeID", t.NodeID).Warnf("create agent client failed, err: %s", err.Error())
  56. return
  57. }
  58. defer agentClient.Close()
  59. getResp, err := agentClient.GetState(agtmq.NewGetState(), mq.RequestOption{Timeout: time.Second * 30})
  60. if err != nil {
  61. log.WithField("NodeID", t.NodeID).Warnf("getting state: %s", err.Error())
  62. // 检查上次上报时间,超时的设置为不可用
  63. // TODO 没有上报过是否要特殊处理?
  64. if node.LastReportTime != nil && time.Since(*node.LastReportTime) > time.Duration(config.Cfg().NodeUnavailableSeconds)*time.Second {
  65. err := execCtx.Args.DB.Node().UpdateState(execCtx.Args.DB.SQLCtx(), t.NodeID, consts.NodeStateUnavailable)
  66. if err != nil {
  67. log.WithField("NodeID", t.NodeID).Warnf("set node state failed, err: %s", err.Error())
  68. return
  69. }
  70. caches, err := execCtx.Args.DB.Cache().GetNodeCaches(execCtx.Args.DB.SQLCtx(), t.NodeID)
  71. if err != nil {
  72. log.WithField("NodeID", t.NodeID).Warnf("get node caches failed, err: %s", err.Error())
  73. return
  74. }
  75. // 补充备份数
  76. execCtx.Executor.Post(NewCheckRepCount(lo.Map(caches, func(ch model.Cache, index int) string { return ch.FileHash })))
  77. return
  78. }
  79. return
  80. }
  81. // 根据返回结果修改节点状态
  82. if getResp.IPFSState != consts.IPFSStateOK {
  83. log.WithField("NodeID", t.NodeID).Warnf("IPFS status is %s, set node state unavailable", getResp.IPFSState)
  84. err := execCtx.Args.DB.Node().UpdateState(execCtx.Args.DB.SQLCtx(), t.NodeID, consts.NodeStateUnavailable)
  85. if err != nil {
  86. log.WithField("NodeID", t.NodeID).Warnf("change node state failed, err: %s", err.Error())
  87. }
  88. return
  89. }
  90. // TODO 如果以后还有其他的状态,要判断哪些状态下能设置Normal
  91. err = execCtx.Args.DB.Node().UpdateState(execCtx.Args.DB.SQLCtx(), t.NodeID, consts.NodeStateNormal)
  92. if err != nil {
  93. log.WithField("NodeID", t.NodeID).Warnf("change node state failed, err: %s", err.Error())
  94. }
  95. }
  96. func init() {
  97. RegisterMessageConvertor(func(msg scevt.AgentCheckState) Event { return NewAgentCheckState(msg.NodeID) })
  98. }

本项目旨在将云际存储公共基础设施化,使个人及企业可低门槛使用高效的云际存储服务(安装开箱即用云际存储客户端即可,无需关注其他组件的部署),同时支持用户灵活便捷定制云际存储的功能细节。