package tasks import ( "github.com/TeaOSLab/EdgeAPI/internal/db/models" "github.com/TeaOSLab/EdgeAPI/internal/utils/numberutils" "github.com/iwind/TeaGo/dbs" "github.com/iwind/TeaGo/logs" "time" ) func init() { dbs.OnReady(func() { task := NewNodeMonitorTask(60) ticker := time.NewTicker(60 * time.Second) go func() { for range ticker.C { err := task.loop() if err != nil { logs.Println("[TASK][NODE_MONITOR]" + err.Error()) } } }() }) } // 健康节点任务 type NodeMonitorTask struct { intervalSeconds int } func NewNodeMonitorTask(intervalSeconds int) *NodeMonitorTask { return &NodeMonitorTask{ intervalSeconds: intervalSeconds, } } func (this *NodeMonitorTask) Run() { } func (this *NodeMonitorTask) loop() error { // 检查上次运行时间,防止重复运行 settingKey := models.SettingCodeNodeMonitor + "Loop" timestamp := time.Now().Unix() c, err := models.SharedSysSettingDAO.CompareInt64Setting(settingKey, timestamp-int64(this.intervalSeconds)) if err != nil { return err } if c > 0 { return nil } // 记录时间 err = models.SharedSysSettingDAO.UpdateSetting(settingKey, []byte(numberutils.FormatInt64(timestamp))) if err != nil { return err } clusters, err := models.SharedNodeClusterDAO.FindAllEnableClusters() if err != nil { return err } for _, cluster := range clusters { err := this.monitorCluster(cluster) if err != nil { return err } } return nil } func (this *NodeMonitorTask) monitorCluster(cluster *models.NodeCluster) error { clusterId := int64(cluster.Id) // 检查离线节点 inactiveNodes, err := models.SharedNodeDAO.FindAllInactiveNodesWithClusterId(clusterId) if err != nil { return err } for _, node := range inactiveNodes { err = models.SharedMessageDAO.CreateNodeMessage(clusterId, int64(node.Id), models.MessageTypeNodeInactive, models.LevelError, "节点已处于离线状态", nil) if err != nil { return err } // 修改在线状态 err = models.SharedNodeDAO.UpdateNodeActive(int64(node.Id), false) if err != nil { return err } } // TODO 检查恢复连接 // 检查CPU、内存、磁盘不足节点,而且离线的节点不再重复提示 // TODO 需要实现 return nil }