You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

agent_check_state.go 3.8 kB

2 years ago
2 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117
  1. package event
  2. import (
  3. "database/sql"
  4. "time"
  5. "gitlink.org.cn/cloudream/common/pkgs/logger"
  6. "gitlink.org.cn/cloudream/common/pkgs/mq"
  7. cdssdk "gitlink.org.cn/cloudream/common/sdks/storage"
  8. "gitlink.org.cn/cloudream/storage/common/consts"
  9. stgglb "gitlink.org.cn/cloudream/storage/common/globals"
  10. "gitlink.org.cn/cloudream/storage/common/pkgs/distlock/reqbuilder"
  11. agtmq "gitlink.org.cn/cloudream/storage/common/pkgs/mq/agent"
  12. scevt "gitlink.org.cn/cloudream/storage/common/pkgs/mq/scanner/event"
  13. "gitlink.org.cn/cloudream/storage/scanner/internal/config"
  14. )
  15. type AgentCheckState struct {
  16. *scevt.AgentCheckState
  17. }
  18. func NewAgentCheckState(nodeID cdssdk.NodeID) *AgentCheckState {
  19. return &AgentCheckState{
  20. AgentCheckState: scevt.NewAgentCheckState(nodeID),
  21. }
  22. }
  23. func (t *AgentCheckState) TryMerge(other Event) bool {
  24. event, ok := other.(*AgentCheckState)
  25. if !ok {
  26. return false
  27. }
  28. return t.NodeID == event.NodeID
  29. }
  30. func (t *AgentCheckState) Execute(execCtx ExecuteContext) {
  31. log := logger.WithType[AgentCheckState]("Event")
  32. log.Debugf("begin with %v", logger.FormatStruct(t.AgentCheckState))
  33. defer log.Debugf("end")
  34. mutex, err := reqbuilder.NewBuilder().
  35. Metadata().
  36. // 查询、修改节点状态
  37. Node().WriteOne(t.NodeID).
  38. MutexLock(execCtx.Args.DistLock)
  39. if err != nil {
  40. log.Warnf("acquire locks failed, err: %s", err.Error())
  41. return
  42. }
  43. defer mutex.Unlock()
  44. node, err := execCtx.Args.DB.Node().GetByID(execCtx.Args.DB.SQLCtx(), t.NodeID)
  45. if err == sql.ErrNoRows {
  46. return
  47. }
  48. if err != nil {
  49. log.WithField("NodeID", t.NodeID).Warnf("get node by id failed, err: %s", err.Error())
  50. return
  51. }
  52. agtCli, err := stgglb.AgentMQPool.Acquire(t.NodeID)
  53. if err != nil {
  54. log.WithField("NodeID", t.NodeID).Warnf("create agent client failed, err: %s", err.Error())
  55. return
  56. }
  57. defer stgglb.AgentMQPool.Release(agtCli)
  58. getResp, err := agtCli.GetState(agtmq.NewGetState(), mq.RequestOption{Timeout: time.Second * 30})
  59. if err != nil {
  60. log.WithField("NodeID", t.NodeID).Warnf("getting state: %s", err.Error())
  61. // 检查上次上报时间,超时的设置为不可用
  62. // TODO 没有上报过是否要特殊处理?
  63. if node.LastReportTime != nil && time.Since(*node.LastReportTime) > time.Duration(config.Cfg().NodeUnavailableSeconds)*time.Second {
  64. err := execCtx.Args.DB.Node().UpdateState(execCtx.Args.DB.SQLCtx(), t.NodeID, consts.NodeStateUnavailable)
  65. if err != nil {
  66. log.WithField("NodeID", t.NodeID).Warnf("set node state failed, err: %s", err.Error())
  67. return
  68. }
  69. /*
  70. caches, err := execCtx.Args.DB.Cache().GetNodeCaches(execCtx.Args.DB.SQLCtx(), t.NodeID)
  71. if err != nil {
  72. log.WithField("NodeID", t.NodeID).Warnf("get node caches failed, err: %s", err.Error())
  73. return
  74. }
  75. // 补充备份数
  76. execCtx.Executor.Post(NewCheckRepCount(lo.Map(caches, func(ch model.Cache, index int) string { return ch.FileHash })))
  77. */
  78. return
  79. }
  80. return
  81. }
  82. // 根据返回结果修改节点状态
  83. if getResp.IPFSState != consts.IPFSStateOK {
  84. log.WithField("NodeID", t.NodeID).Warnf("IPFS status is %s, set node state unavailable", getResp.IPFSState)
  85. err := execCtx.Args.DB.Node().UpdateState(execCtx.Args.DB.SQLCtx(), t.NodeID, consts.NodeStateUnavailable)
  86. if err != nil {
  87. log.WithField("NodeID", t.NodeID).Warnf("change node state failed, err: %s", err.Error())
  88. }
  89. return
  90. }
  91. // TODO 如果以后还有其他的状态,要判断哪些状态下能设置Normal
  92. err = execCtx.Args.DB.Node().UpdateState(execCtx.Args.DB.SQLCtx(), t.NodeID, consts.NodeStateNormal)
  93. if err != nil {
  94. log.WithField("NodeID", t.NodeID).Warnf("change node state failed, err: %s", err.Error())
  95. }
  96. }
  97. func init() {
  98. RegisterMessageConvertor(func(msg *scevt.AgentCheckState) Event { return NewAgentCheckState(msg.NodeID) })
  99. }

本项目旨在将云际存储公共基础设施化,使个人及企业可低门槛使用高效的云际存储服务(安装开箱即用云际存储客户端即可,无需关注其他组件的部署),同时支持用户灵活便捷定制云际存储的功能细节。