mirror of
https://gitee.com/dromara/mayfly-go
synced 2025-11-01 23:10:26 +08:00
430 lines
13 KiB
Go
430 lines
13 KiB
Go
package application
|
||
|
||
import (
|
||
"cmp"
|
||
"context"
|
||
"encoding/json"
|
||
"fmt"
|
||
"mayfly-go/internal/db/dbm/dbi"
|
||
"mayfly-go/internal/db/domain/entity"
|
||
"mayfly-go/internal/db/domain/repository"
|
||
"mayfly-go/internal/db/imsg"
|
||
"mayfly-go/pkg/base"
|
||
"mayfly-go/pkg/cache"
|
||
"mayfly-go/pkg/contextx"
|
||
"mayfly-go/pkg/errorx"
|
||
"mayfly-go/pkg/i18n"
|
||
"mayfly-go/pkg/logx"
|
||
"mayfly-go/pkg/model"
|
||
"mayfly-go/pkg/scheduler"
|
||
"mayfly-go/pkg/utils/collx"
|
||
"regexp"
|
||
"strings"
|
||
"time"
|
||
|
||
"github.com/google/uuid"
|
||
"github.com/spf13/cast"
|
||
)
|
||
|
||
type DataSyncTask interface {
|
||
base.App[*entity.DataSyncTask]
|
||
|
||
// GetPageList 分页获取数据库实例
|
||
GetPageList(condition *entity.DataSyncTaskQuery, orderBy ...string) (*model.PageResult[*entity.DataSyncTask], error)
|
||
|
||
Save(ctx context.Context, instanceEntity *entity.DataSyncTask) error
|
||
|
||
Delete(ctx context.Context, id uint64) error
|
||
|
||
InitCronJob()
|
||
|
||
Run(ctx context.Context, id uint64) error
|
||
|
||
StopTask(ctx context.Context, id uint64) error
|
||
|
||
GetTaskLogList(condition *entity.DataSyncLogQuery, orderBy ...string) (*model.PageResult[*entity.DataSyncLog], error)
|
||
}
|
||
|
||
// Compile-time check that *dataSyncAppImpl implements DataSyncTask.
var _ DataSyncTask = (*dataSyncAppImpl)(nil)
|
||
|
||
type dataSyncAppImpl struct {
|
||
base.AppImpl[*entity.DataSyncTask, repository.DataSyncTask]
|
||
|
||
dbDataSyncLogRepo repository.DataSyncLog `inject:"T"`
|
||
|
||
dbApp Db `inject:"T"`
|
||
}
|
||
|
||
// whereReg reports whether a SQL string contains the text "where" in any
// letter case. It matches anywhere in the string (including inside longer
// words or sub-queries), not only a trailing WHERE clause.
var whereReg = regexp.MustCompile(`(?i)where`)
|
||
|
||
func (app *dataSyncAppImpl) GetPageList(condition *entity.DataSyncTaskQuery, orderBy ...string) (*model.PageResult[*entity.DataSyncTask], error) {
|
||
return app.GetRepo().GetTaskList(condition, orderBy...)
|
||
}
|
||
|
||
func (app *dataSyncAppImpl) Save(ctx context.Context, taskEntity *entity.DataSyncTask) error {
|
||
var err error
|
||
if taskEntity.Id == 0 {
|
||
// 新建时生成key
|
||
taskEntity.TaskKey = uuid.New().String()
|
||
err = app.Insert(ctx, taskEntity)
|
||
} else {
|
||
taskEntity.TaskKey = ""
|
||
err = app.UpdateById(ctx, taskEntity)
|
||
}
|
||
if err != nil {
|
||
return err
|
||
}
|
||
|
||
app.addCronJob(ctx, taskEntity)
|
||
return nil
|
||
}
|
||
|
||
func (app *dataSyncAppImpl) Delete(ctx context.Context, id uint64) error {
|
||
task, err := app.GetById(id)
|
||
if err == nil {
|
||
return errorx.NewBiz("sync task not found")
|
||
}
|
||
scheduler.RemoveByKey(task.TaskKey)
|
||
app.MarkStop(id)
|
||
|
||
return app.DeleteById(ctx, id)
|
||
}
|
||
|
||
func (app *dataSyncAppImpl) Run(ctx context.Context, id uint64) error {
|
||
if app.IsRunning(id) {
|
||
logx.Warnf("[%d] the db sync task is running...", id)
|
||
return nil
|
||
}
|
||
|
||
task, err := app.GetById(id)
|
||
if err != nil {
|
||
return errorx.NewBiz("task not found")
|
||
}
|
||
|
||
logx.InfofContext(ctx, "start the data sync task: %s => %s", task.TaskName, task.TaskKey)
|
||
|
||
if task.RunningState == entity.DataSyncTaskRunStateRunning {
|
||
return errorx.NewBiz("the task is in progress")
|
||
}
|
||
|
||
updateStateTask := &entity.DataSyncTask{
|
||
RunningState: entity.DataSyncTaskRunStateRunning,
|
||
}
|
||
updateStateTask.Id = id
|
||
if err := app.UpdateById(ctx, updateStateTask); err != nil {
|
||
return errorx.NewBizf("failed to update task running state: %s", err.Error())
|
||
}
|
||
|
||
// 标记该任务运行中
|
||
app.MarkRunning(id)
|
||
go func() {
|
||
now := time.Now()
|
||
syncLog := &entity.DataSyncLog{
|
||
TaskId: task.Id,
|
||
CreateTime: &now,
|
||
Status: entity.DataSyncTaskStateFail, // 默认失败
|
||
}
|
||
defer app.endRunning(task, syncLog)
|
||
|
||
// 通过占位符格式化sql
|
||
updSql := ""
|
||
orderSql := ""
|
||
if task.UpdFieldVal != "0" && task.UpdFieldVal != "" && task.UpdField != "" {
|
||
if err != nil {
|
||
logx.ErrorfContext(ctx, "data source connection unavailable: %s", err.Error())
|
||
return
|
||
}
|
||
srcConn, err := app.dbApp.GetDbConn(context.Background(), uint64(task.SrcDbId), task.SrcDbName)
|
||
if err != nil {
|
||
logx.ErrorfContext(ctx, "failed to connect to the source database: %s", err.Error())
|
||
return
|
||
}
|
||
|
||
updFieldDataType := dbi.DefaultDbDataType
|
||
srcConn.WalkQueryRows(context.Background(), task.DataSql, func(row map[string]any, columns []*dbi.QueryColumn) error {
|
||
for _, column := range columns {
|
||
if strings.EqualFold(column.Name, cmp.Or(task.UpdFieldSrc, task.UpdField)) {
|
||
updFieldDataType = column.DbDataType
|
||
break
|
||
}
|
||
}
|
||
return dbi.NewStopWalkQueryError("get column data type... ignore~")
|
||
})
|
||
|
||
updSql = fmt.Sprintf("and %s > %s", task.UpdField, updFieldDataType.DataType.SQLValue(task.UpdFieldVal))
|
||
orderSql = "order by " + task.UpdField + " asc "
|
||
}
|
||
// 正则判断DataSql是否以where .*结尾,如果是则不添加where 1 = 1
|
||
var where = "where 1=1"
|
||
if whereReg.MatchString(task.DataSql) {
|
||
where = ""
|
||
}
|
||
|
||
// 组装查询sql
|
||
sqlStr := fmt.Sprintf("%s %s %s %s", task.DataSql, where, updSql, orderSql)
|
||
syncLog.DataSqlFull = sqlStr
|
||
|
||
err := app.doDataSync(ctx, sqlStr, task, syncLog)
|
||
if err != nil {
|
||
syncLog.ErrText = i18n.T(imsg.DataSyncFailMsg, "msg", err.Error())
|
||
logx.ErrorContext(ctx, syncLog.ErrText)
|
||
syncLog.Status = entity.DataSyncTaskStateFail
|
||
} else {
|
||
syncLog.Status = entity.DataSyncTaskStateSuccess
|
||
}
|
||
}()
|
||
|
||
return nil
|
||
}
|
||
|
||
func (app *dataSyncAppImpl) doDataSync(ctx context.Context, sql string, task *entity.DataSyncTask, syncLog *entity.DataSyncLog) error {
|
||
// 获取源数据库连接
|
||
srcConn, err := app.dbApp.GetDbConn(ctx, uint64(task.SrcDbId), task.SrcDbName)
|
||
|
||
if err != nil {
|
||
return errorx.NewBizf("failed to connect to the source database: %s", err.Error())
|
||
}
|
||
|
||
// 获取目标数据库连接
|
||
targetConn, err := app.dbApp.GetDbConn(ctx, uint64(task.TargetDbId), task.TargetDbName)
|
||
if err != nil {
|
||
return errorx.NewBizf("failed to connect to the target database: %s", err.Error())
|
||
}
|
||
|
||
// task.FieldMap为json数组字符串 [{"src":"id","target":"id"}],转为map
|
||
var fieldMap []map[string]string
|
||
err = json.Unmarshal([]byte(task.FieldMap), &fieldMap)
|
||
if err != nil {
|
||
return errorx.NewBizf("there was an error parsing the field map json: %s", err.Error())
|
||
}
|
||
|
||
// 记录本次同步数据总数
|
||
total := 0
|
||
batchSize := task.PageSize
|
||
result := make([]map[string]any, 0)
|
||
|
||
// 如果有数据库别名,则从UpdField中去掉数据库别名, 如:a.id => id,用于获取字段具体名称
|
||
updFieldName := task.UpdField
|
||
if task.UpdField != "" && strings.Contains(task.UpdField, ".") {
|
||
updFieldName = strings.Split(task.UpdField, ".")[1]
|
||
}
|
||
|
||
targetTableColumns, err := targetConn.GetMetadata().GetColumns(task.TargetTableName)
|
||
if err != nil {
|
||
return errorx.NewBizf("failed to get target table columns: %s", err.Error())
|
||
}
|
||
targetColumnName2Column := collx.ArrayToMap(targetTableColumns, func(column dbi.Column) string {
|
||
return column.ColumnName
|
||
})
|
||
|
||
// 目标库对应的insert columns
|
||
targetInsertColumns := collx.ArrayMap[map[string]string, dbi.Column](fieldMap, func(val map[string]string) dbi.Column {
|
||
return targetColumnName2Column[val["target"]]
|
||
})
|
||
|
||
_, err = srcConn.WalkQueryRows(context.Background(), sql, func(row map[string]any, columns []*dbi.QueryColumn) error {
|
||
total++
|
||
result = append(result, row)
|
||
if total%batchSize == 0 {
|
||
if err := app.srcData2TargetDb(result, fieldMap, updFieldName, task, targetConn, targetInsertColumns); err != nil {
|
||
return err
|
||
}
|
||
|
||
// 记录当前已同步的数据量
|
||
syncLog.ErrText = i18n.T(imsg.DataSyncingMsg, "count", total)
|
||
logx.InfoContext(ctx, syncLog.ErrText)
|
||
syncLog.ResNum = total
|
||
app.saveLog(syncLog)
|
||
|
||
result = result[:0]
|
||
|
||
// 运行过程中,判断状态是否为已关闭,是则结束运行,否则继续运行
|
||
if !app.IsRunning(task.Id) {
|
||
return errorx.NewBiz("the task has been terminated manually")
|
||
}
|
||
}
|
||
|
||
return nil
|
||
})
|
||
|
||
if err != nil {
|
||
return err
|
||
}
|
||
|
||
// 处理剩余的数据
|
||
if len(result) > 0 {
|
||
if err := app.srcData2TargetDb(result, fieldMap, updFieldName, task, targetConn, targetInsertColumns); err != nil {
|
||
return err
|
||
}
|
||
}
|
||
|
||
logx.InfofContext(ctx, "synchronous task: [%s], finished execution, save records successfully: [%d]", task.TaskName, total)
|
||
|
||
// 执行成功日志
|
||
syncLog.ErrText = i18n.T(imsg.DataSyncSuccessMsg, "count", total)
|
||
syncLog.ResNum = total
|
||
|
||
return nil
|
||
}
|
||
|
||
func (app *dataSyncAppImpl) srcData2TargetDb(srcRes []map[string]any, fieldMap []map[string]string, updFieldName string, task *entity.DataSyncTask, targetDbConn *dbi.DbConn, targetInsertColumns []dbi.Column) (err error) {
|
||
// 遍历res,组装数据
|
||
var targetData = make([]map[string]any, 0)
|
||
for _, srcData := range srcRes {
|
||
var data = make(map[string]any)
|
||
// 遍历字段映射, target字段的值为src字段取值
|
||
for _, item := range fieldMap {
|
||
// target字段的值为src字段取值
|
||
data[item["target"]] = srcData[item["src"]]
|
||
}
|
||
targetData = append(targetData, data)
|
||
}
|
||
|
||
targetValues := make([][]any, 0)
|
||
for _, item := range targetData {
|
||
var values = make([]any, 0)
|
||
for _, column := range targetInsertColumns {
|
||
values = append(values, item[column.ColumnName])
|
||
}
|
||
targetValues = append(targetValues, values)
|
||
}
|
||
|
||
// 执行插入
|
||
targetDialect := targetDbConn.GetDialect()
|
||
|
||
// 生成目标数据库批量插入sql,并执行
|
||
sqls := targetDialect.GetSQLGenerator().GenInsert(task.TargetTableName, targetInsertColumns, targetValues, cmp.Or(task.DuplicateStrategy, dbi.DuplicateStrategyNone))
|
||
|
||
// 开启本批次执行事务
|
||
targetDbTx, err := targetDbConn.Begin()
|
||
if err != nil {
|
||
return errorx.NewBizf("failed to start the target database transaction: %s", err.Error())
|
||
}
|
||
defer func() {
|
||
if r := recover(); r != nil {
|
||
targetDbTx.Rollback()
|
||
err = fmt.Errorf("%v", r)
|
||
}
|
||
}()
|
||
|
||
for _, sql := range sqls {
|
||
_, err := targetDbTx.Exec(sql)
|
||
if err != nil {
|
||
targetDbTx.Rollback()
|
||
return err
|
||
}
|
||
}
|
||
|
||
// 如果是mssql,暂不手动提交事务,否则报错 mssql: The COMMIT TRANSACTION request has no corresponding BEGIN TRANSACTION.
|
||
if err := targetDbTx.Commit(); err != nil {
|
||
if targetDbConn.Info.Type != dbi.ToDbType("mssql") {
|
||
return errorx.NewBizf("data synchronization - The target database transaction failed to commit: %s", err.Error())
|
||
}
|
||
}
|
||
|
||
setUpdateFieldVal := func(field string) {
|
||
// 解决字段大小写问题
|
||
updFieldVal := srcRes[len(srcRes)-1][strings.ToUpper(field)]
|
||
if updFieldVal == "" || updFieldVal == nil {
|
||
updFieldVal = srcRes[len(srcRes)-1][strings.ToLower(field)]
|
||
}
|
||
|
||
task.UpdFieldVal = cast.ToString(updFieldVal)
|
||
}
|
||
// 如果指定了更新字段,则以更新字段取值
|
||
setUpdateFieldVal(cmp.Or(task.UpdFieldSrc, updFieldName))
|
||
|
||
return nil
|
||
}
|
||
|
||
func (app *dataSyncAppImpl) StopTask(ctx context.Context, taskId uint64) error {
|
||
task := new(entity.DataSyncTask)
|
||
task.Id = taskId
|
||
task.RunningState = entity.DataSyncTaskRunStateStop
|
||
if err := app.UpdateById(ctx, task); err != nil {
|
||
return err
|
||
}
|
||
app.MarkStop(taskId)
|
||
return nil
|
||
}
|
||
|
||
func (app *dataSyncAppImpl) endRunning(taskEntity *entity.DataSyncTask, log *entity.DataSyncLog) {
|
||
logx.Info(log.ErrText)
|
||
|
||
state := log.Status
|
||
task := new(entity.DataSyncTask)
|
||
task.Id = taskEntity.Id
|
||
task.RecentState = state
|
||
task.UpdFieldVal = taskEntity.UpdFieldVal
|
||
task.RunningState = entity.DataSyncTaskRunStateReady
|
||
_ = app.UpdateById(context.Background(), task)
|
||
// 保存执行日志
|
||
app.saveLog(log)
|
||
app.MarkStop(task.Id)
|
||
}
|
||
|
||
func (app *dataSyncAppImpl) saveLog(log *entity.DataSyncLog) {
|
||
app.dbDataSyncLogRepo.Save(context.Background(), log)
|
||
}
|
||
|
||
func (app *dataSyncAppImpl) InitCronJob() {
|
||
ctx := contextx.NewTraceId()
|
||
|
||
defer func() {
|
||
if err := recover(); err != nil {
|
||
logx.ErrorTraceContext(ctx, "the data synchronization task failed to initialize", err)
|
||
}
|
||
}()
|
||
|
||
// 修改执行中状态为待执行
|
||
_ = app.UpdateByCond(context.TODO(), &entity.DataSyncTask{RunningState: entity.DataSyncTaskRunStateReady}, &entity.DataSyncTask{RunningState: entity.DataSyncTaskRunStateRunning})
|
||
|
||
if err := app.CursorByCond(&entity.DataSyncTaskQuery{Status: entity.DataSyncTaskStatusEnable}, func(dst *entity.DataSyncTask) error {
|
||
app.MarkStop(dst.Id)
|
||
app.addCronJob(ctx, dst)
|
||
return nil
|
||
}); err != nil {
|
||
logx.ErrorTraceContext(ctx, "the db data sync task failed to initialize: %v", err)
|
||
}
|
||
}
|
||
|
||
func (app *dataSyncAppImpl) GetTaskLogList(condition *entity.DataSyncLogQuery, orderBy ...string) (*model.PageResult[*entity.DataSyncLog], error) {
|
||
return app.dbDataSyncLogRepo.GetTaskLogList(condition, orderBy...)
|
||
}
|
||
|
||
// MarkRunning 标记任务执行中
|
||
func (app *dataSyncAppImpl) MarkRunning(taskId uint64) {
|
||
cache.Set(fmt.Sprintf("mayfly:db:syncdata:%d", taskId), 1, -1)
|
||
}
|
||
|
||
// MarkStop 标记任务结束
|
||
func (app *dataSyncAppImpl) MarkStop(taskId uint64) {
|
||
cache.Del(fmt.Sprintf("mayfly:db:syncdata:%d", taskId))
|
||
}
|
||
|
||
// IsRunning 判断任务是否执行中
|
||
func (app *dataSyncAppImpl) IsRunning(taskId uint64) bool {
|
||
return cache.GetStr(fmt.Sprintf("mayfly:db:syncdata:%d", taskId)) != ""
|
||
}
|
||
|
||
func (app *dataSyncAppImpl) addCronJob(ctx context.Context, taskEntity *entity.DataSyncTask) {
|
||
key := taskEntity.TaskKey
|
||
// 先移除旧的任务
|
||
scheduler.RemoveByKey(key)
|
||
|
||
// 根据状态添加新的任务
|
||
if taskEntity.Status == entity.DataSyncTaskStatusEnable {
|
||
taskId := taskEntity.Id
|
||
logx.InfofContext(ctx, "start add the data sync task job: %s, cron[%s]", taskEntity.TaskName, taskEntity.TaskCron)
|
||
if err := scheduler.AddFunByKey(key, taskEntity.TaskCron, func() {
|
||
if err := app.Run(context.Background(), taskId); err != nil {
|
||
logx.ErrorfContext(ctx, "the data sync task failed to execute at a scheduled time: %s", err.Error())
|
||
}
|
||
}); err != nil {
|
||
logx.ErrorTraceContext(ctx, "add db data sync job failed", err)
|
||
}
|
||
}
|
||
}
|