2020-10-25 18:26:46 +08:00
|
|
|
|
package tasks
|
|
|
|
|
|
|
|
|
|
|
|
import (
|
|
|
|
|
|
"github.com/TeaOSLab/EdgeAPI/internal/db/models"
|
|
|
|
|
|
"github.com/TeaOSLab/EdgeAPI/internal/utils/numberutils"
|
|
|
|
|
|
"github.com/iwind/TeaGo/dbs"
|
|
|
|
|
|
"github.com/iwind/TeaGo/logs"
|
|
|
|
|
|
"time"
|
|
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
|
func init() {
|
|
|
|
|
|
dbs.OnReady(func() {
|
|
|
|
|
|
task := NewNodeMonitorTask(60)
|
|
|
|
|
|
ticker := time.NewTicker(60 * time.Second)
|
|
|
|
|
|
go func() {
|
|
|
|
|
|
for range ticker.C {
|
|
|
|
|
|
err := task.loop()
|
|
|
|
|
|
if err != nil {
|
|
|
|
|
|
logs.Println("[TASK][NODE_MONITOR]" + err.Error())
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
|
|
|
|
|
}()
|
|
|
|
|
|
})
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
// NodeMonitorTask is the node health monitoring task.
type NodeMonitorTask struct {
	// intervalSeconds is the interval, in seconds, that loop subtracts from
	// the current Unix time when checking the last recorded run.
	intervalSeconds int
}
|
|
|
|
|
|
|
|
|
|
|
|
func NewNodeMonitorTask(intervalSeconds int) *NodeMonitorTask {
|
|
|
|
|
|
return &NodeMonitorTask{
|
|
|
|
|
|
intervalSeconds: intervalSeconds,
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
func (this *NodeMonitorTask) Run() {
|
|
|
|
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
func (this *NodeMonitorTask) loop() error {
|
|
|
|
|
|
// 检查上次运行时间,防止重复运行
|
2020-12-02 20:31:29 +08:00
|
|
|
|
settingKey := models.SettingCodeNodeMonitor + "Loop"
|
2020-10-25 18:26:46 +08:00
|
|
|
|
timestamp := time.Now().Unix()
|
|
|
|
|
|
c, err := models.SharedSysSettingDAO.CompareInt64Setting(settingKey, timestamp-int64(this.intervalSeconds))
|
|
|
|
|
|
if err != nil {
|
|
|
|
|
|
return err
|
|
|
|
|
|
}
|
|
|
|
|
|
if c > 0 {
|
|
|
|
|
|
return nil
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
// 记录时间
|
|
|
|
|
|
err = models.SharedSysSettingDAO.UpdateSetting(settingKey, []byte(numberutils.FormatInt64(timestamp)))
|
|
|
|
|
|
if err != nil {
|
|
|
|
|
|
return err
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
clusters, err := models.SharedNodeClusterDAO.FindAllEnableClusters()
|
|
|
|
|
|
if err != nil {
|
|
|
|
|
|
return err
|
|
|
|
|
|
}
|
|
|
|
|
|
for _, cluster := range clusters {
|
|
|
|
|
|
err := this.monitorCluster(cluster)
|
|
|
|
|
|
if err != nil {
|
|
|
|
|
|
return err
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
return nil
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
func (this *NodeMonitorTask) monitorCluster(cluster *models.NodeCluster) error {
|
|
|
|
|
|
clusterId := int64(cluster.Id)
|
|
|
|
|
|
|
|
|
|
|
|
// 检查离线节点
|
|
|
|
|
|
inactiveNodes, err := models.SharedNodeDAO.FindAllInactiveNodesWithClusterId(clusterId)
|
|
|
|
|
|
if err != nil {
|
|
|
|
|
|
return err
|
|
|
|
|
|
}
|
|
|
|
|
|
for _, node := range inactiveNodes {
|
|
|
|
|
|
err = models.SharedMessageDAO.CreateNodeMessage(clusterId, int64(node.Id), models.MessageTypeNodeInactive, models.LevelError, "节点已处于离线状态", nil)
|
|
|
|
|
|
if err != nil {
|
|
|
|
|
|
return err
|
|
|
|
|
|
}
|
2020-11-16 09:20:24 +08:00
|
|
|
|
|
|
|
|
|
|
// 修改在线状态
|
|
|
|
|
|
err = models.SharedNodeDAO.UpdateNodeActive(int64(node.Id), false)
|
|
|
|
|
|
if err != nil {
|
|
|
|
|
|
return err
|
|
|
|
|
|
}
|
2020-10-25 18:26:46 +08:00
|
|
|
|
}
|
|
|
|
|
|
|
2020-10-25 21:27:46 +08:00
|
|
|
|
// TODO 检查恢复连接
|
|
|
|
|
|
|
2020-10-25 18:26:46 +08:00
|
|
|
|
// 检查CPU、内存、磁盘不足节点,而且离线的节点不再重复提示
|
|
|
|
|
|
// TODO 需要实现
|
|
|
|
|
|
|
|
|
|
|
|
return nil
|
|
|
|
|
|
}
|