2024-01-12 13:15:30 +08:00
package postgres
2022-10-15 17:38:34 +08:00
import (
2022-12-22 18:41:34 +08:00
"database/sql"
2022-10-15 17:38:34 +08:00
"fmt"
2024-01-12 13:15:30 +08:00
"mayfly-go/internal/db/dbm/dbi"
2023-07-21 17:07:04 +08:00
"mayfly-go/pkg/utils/anyx"
2024-01-18 17:18:17 +08:00
"mayfly-go/pkg/utils/collx"
2022-12-22 18:41:34 +08:00
"strings"
"time"
2024-03-21 17:15:52 +08:00
"github.com/may-fly/cast"
2022-10-15 17:38:34 +08:00
)
2023-11-26 21:21:35 +08:00
type PgsqlDialect struct {
2024-03-18 12:25:40 +08:00
dbi . DefaultDialect
2022-10-15 17:38:34 +08:00
2024-03-18 12:25:40 +08:00
dc * dbi . DbConn
2024-01-05 08:55:34 +08:00
}
2024-01-05 05:31:32 +00:00
2024-03-01 04:03:03 +00:00
func ( pd * PgsqlDialect ) BatchInsert ( tx * sql . Tx , tableName string , columns [ ] string , values [ ] [ ] any , duplicateStrategy int ) ( int64 , error ) {
2024-01-05 05:31:32 +00:00
// 执行批量insert sql, 跟mysql一样 pg或高斯支持批量insert语法
// insert into table_name (column1, column2, ...) values (value1, value2, ...), (value1, value2, ...), ...
// 把二维数组转为一维数组
var args [ ] any
for _ , v := range values {
args = append ( args , v ... )
}
2024-01-06 22:36:50 +08:00
2024-01-08 11:24:37 +08:00
// 构建占位符字符串 "($1, $2, $3), ($4, $5, $6), ..." 用于指定参数
var placeholders [ ] string
for i := 0 ; i < len ( args ) ; i += len ( columns ) {
var placeholder [ ] string
for j := 0 ; j < len ( columns ) ; j ++ {
placeholder = append ( placeholder , fmt . Sprintf ( "$%d" , i + j + 1 ) )
}
placeholders = append ( placeholders , "(" + strings . Join ( placeholder , ", " ) + ")" )
}
2024-03-01 04:03:03 +00:00
// 根据冲突策略生成后缀
suffix := ""
if pd . dc . Info . Type == dbi . DbTypeGauss {
// 高斯db使用ON DUPLICATE KEY UPDATE 语法参考 https://support.huaweicloud.com/distributed-devg-v3-gaussdb/gaussdb-12-0607.html#ZH-CN_TOPIC_0000001633948138
suffix = pd . gaussOnDuplicateStrategySql ( duplicateStrategy , tableName , columns )
} else {
// pgsql 默认使用 on conflict 语法参考 http://www.postgres.cn/docs/12/sql-insert.html
// vastbase语法参考 https://docs.vastdata.com.cn/zh/docs/VastbaseE100Ver3.0.0/doc/SQL%E8%AF%AD%E6%B3%95/INSERT.html
// kingbase语法参考 https://help.kingbase.com.cn/v8/development/sql-plsql/sql/SQL_Statements_9.html#insert
suffix = pd . pgsqlOnDuplicateStrategySql ( duplicateStrategy , tableName , columns )
}
2024-11-01 17:27:22 +08:00
sqlStr := fmt . Sprintf ( "insert into %s (%s) values %s %s" , pd . QuoteIdentifier ( tableName ) , strings . Join ( columns , "," ) , strings . Join ( placeholders , ", " ) , suffix )
2024-01-08 11:24:37 +08:00
// 执行批量insert sql
2024-03-01 04:03:03 +00:00
return pd . dc . TxExec ( tx , sqlStr , args ... )
}
// pgsql默认唯一键冲突策略
2024-03-15 09:01:51 +00:00
func ( pd * PgsqlDialect ) pgsqlOnDuplicateStrategySql ( duplicateStrategy int , tableName string , columns [ ] string ) string {
2024-03-01 04:03:03 +00:00
suffix := ""
if duplicateStrategy == dbi . DuplicateStrategyIgnore {
suffix = " \n on conflict do nothing"
} else if duplicateStrategy == dbi . DuplicateStrategyUpdate {
// 生成 on conflict () do update set column1 = excluded.column1, column2 = excluded.column2, ...
var updateColumns [ ] string
for _ , col := range columns {
updateColumns = append ( updateColumns , fmt . Sprintf ( "%s = excluded.%s" , col , col ) )
}
// 查询唯一键名,拼接冲突sql
2024-03-21 03:35:18 +00:00
_ , keyRes , _ := pd . dc . Query ( "SELECT constraint_name FROM information_schema.table_constraints WHERE constraint_schema = $1 AND table_name = $2 AND constraint_type in ('PRIMARY KEY', 'UNIQUE') " , pd . dc . Info . CurrentSchema ( ) , tableName )
2024-03-01 04:03:03 +00:00
if len ( keyRes ) > 0 {
for _ , re := range keyRes {
key := anyx . ToString ( re [ "constraint_name" ] )
if key != "" {
suffix += fmt . Sprintf ( " \n on conflict on constraint %s do update set %s \n" , key , strings . Join ( updateColumns , ", " ) )
}
}
}
}
return suffix
}
// 高斯db唯一键冲突策略,使用ON DUPLICATE KEY UPDATE 参考: https://support.huaweicloud.com/distributed-devg-v3-gaussdb/gaussdb-12-0607.html#ZH-CN_TOPIC_0000001633948138
2024-03-15 09:01:51 +00:00
func ( pd * PgsqlDialect ) gaussOnDuplicateStrategySql ( duplicateStrategy int , tableName string , columns [ ] string ) string {
2024-03-01 04:03:03 +00:00
suffix := ""
2024-11-01 17:27:22 +08:00
metadata := pd . dc . GetMetadata ( )
2024-03-01 04:03:03 +00:00
if duplicateStrategy == dbi . DuplicateStrategyIgnore {
suffix = " \n ON DUPLICATE KEY UPDATE NOTHING"
} else if duplicateStrategy == dbi . DuplicateStrategyUpdate {
// 查出表里的唯一键涉及的字段
var uniqueColumns [ ] string
2024-03-15 13:31:53 +08:00
indexs , err := metadata . GetTableIndex ( tableName )
2024-03-01 04:03:03 +00:00
if err == nil {
for _ , index := range indexs {
if index . IsUnique {
cols := strings . Split ( index . ColumnName , "," )
for _ , col := range cols {
if ! collx . ArrayContains ( uniqueColumns , strings . ToLower ( col ) ) {
uniqueColumns = append ( uniqueColumns , strings . ToLower ( col ) )
}
}
}
}
}
suffix = " \n ON DUPLICATE KEY UPDATE "
for i , col := range columns {
// ON DUPLICATE KEY UPDATE语句不支持更新唯一键字段, 所以得去掉
2024-11-01 17:27:22 +08:00
if ! collx . ArrayContains ( uniqueColumns , pd . RemoveQuote ( strings . ToLower ( col ) ) ) {
2024-03-01 04:03:03 +00:00
suffix += fmt . Sprintf ( "%s = excluded.%s" , col , col )
if i < len ( columns ) - 1 {
suffix += ", "
}
}
}
}
return suffix
}
func ( pd * PgsqlDialect ) CopyTable ( copy * dbi . DbCopyTable ) error {
2024-01-23 04:08:02 +00:00
tableName := copy . TableName
// 生成新表名,为老表明+_copy_时间戳
newTableName := tableName + "_copy_" + time . Now ( ) . Format ( "20060102150405" )
// 执行根据旧表创建新表
2024-03-01 04:03:03 +00:00
_ , err := pd . dc . Exec ( fmt . Sprintf ( "create table %s (like %s)" , newTableName , tableName ) )
2024-01-23 04:08:02 +00:00
if err != nil {
return err
}
// 复制数据
if copy . CopyData {
go func ( ) {
2024-03-01 04:03:03 +00:00
_ , _ = pd . dc . Exec ( fmt . Sprintf ( "insert into %s select * from %s" , newTableName , tableName ) )
2024-01-23 04:08:02 +00:00
} ( )
}
// 查询旧表的自增字段名 重新设置新表的序列序列器
2024-03-01 04:03:03 +00:00
_ , res , err := pd . dc . Query ( fmt . Sprintf ( "select column_name from information_schema.columns where table_name = '%s' and column_default like 'nextval%%'" , tableName ) )
2024-01-23 04:08:02 +00:00
if err != nil {
return err
}
for _ , re := range res {
2024-03-21 17:15:52 +08:00
colName := cast . ToString ( re [ "column_name" ] )
2024-01-23 04:08:02 +00:00
if colName != "" {
// 查询自增列当前最大值
2024-03-01 04:03:03 +00:00
_ , maxRes , err := pd . dc . Query ( fmt . Sprintf ( "select max(%s) max_val from %s" , colName , tableName ) )
2024-01-23 04:08:02 +00:00
if err != nil {
return err
}
2024-03-21 17:15:52 +08:00
maxVal := cast . ToInt ( maxRes [ 0 ] [ "max_val" ] )
2024-01-23 04:08:02 +00:00
// 序列起始值为1或当前最大值+1
if maxVal <= 0 {
maxVal = 1
} else {
maxVal += 1
}
// 之所以不用tableName_colName_seq是因为gauss会自动创建同名的序列, 且无法修改序列起始值, 所以直接使用新序列值
newSeqName := fmt . Sprintf ( "%s_%s_copy_seq" , newTableName , colName )
// 创建自增序列,当前最大值为旧表最大值
2024-03-01 04:03:03 +00:00
_ , err = pd . dc . Exec ( fmt . Sprintf ( "CREATE SEQUENCE %s START %d INCREMENT 1" , newSeqName , maxVal ) )
2024-01-23 04:08:02 +00:00
if err != nil {
return err
}
// 将新表的自增主键序列与主键列相关联
2024-03-01 04:03:03 +00:00
_ , err = pd . dc . Exec ( fmt . Sprintf ( "alter table %s alter column %s set default nextval('%s')" , newTableName , colName , newSeqName ) )
2024-01-23 04:08:02 +00:00
if err != nil {
return err
}
}
}
return err
}
2024-03-15 09:01:51 +00:00
2024-11-01 17:27:22 +08:00
func ( pd * PgsqlDialect ) GenerateTableDDL ( columns [ ] dbi . Column , tableInfo dbi . Table , dropBeforeCreate bool ) [ ] string {
quoteTableName := pd . QuoteIdentifier ( tableInfo . TableName )
sqlArr := make ( [ ] string , 0 )
if dropBeforeCreate {
sqlArr = append ( sqlArr , fmt . Sprintf ( "DROP TABLE IF EXISTS %s" , quoteTableName ) )
}
// 组装建表语句
createSql := fmt . Sprintf ( "CREATE TABLE %s (\n" , quoteTableName )
fields := make ( [ ] string , 0 )
pks := make ( [ ] string , 0 )
columnComments := make ( [ ] string , 0 )
commentTmp := "comment on column %s.%s is '%s'"
for _ , column := range columns {
if column . IsPrimaryKey {
pks = append ( pks , pd . QuoteIdentifier ( column . ColumnName ) )
}
fields = append ( fields , pd . genColumnBasicSql ( column ) )
// 防止注释内含有特殊字符串导致sql出错
if column . ColumnComment != "" {
comment := pd . QuoteEscape ( column . ColumnComment )
columnComments = append ( columnComments , fmt . Sprintf ( commentTmp , quoteTableName , pd . QuoteIdentifier ( column . ColumnName ) , comment ) )
}
}
createSql += strings . Join ( fields , ",\n" )
if len ( pks ) > 0 {
createSql += fmt . Sprintf ( ", \nPRIMARY KEY (%s)" , strings . Join ( pks , "," ) )
}
createSql += "\n)"
tableCommentSql := ""
if tableInfo . TableComment != "" {
commentTmp := "comment on table %s is '%s'"
tableCommentSql = fmt . Sprintf ( commentTmp , quoteTableName , pd . QuoteEscape ( tableInfo . TableComment ) )
}
// create
sqlArr = append ( sqlArr , createSql )
// table comment
if tableCommentSql != "" {
sqlArr = append ( sqlArr , tableCommentSql )
}
// column comment
if len ( columnComments ) > 0 {
sqlArr = append ( sqlArr , columnComments ... )
}
return sqlArr
2024-03-15 09:01:51 +00:00
}
2024-11-01 17:27:22 +08:00
func ( pd * PgsqlDialect ) GenerateIndexDDL ( indexs [ ] dbi . Index , tableInfo dbi . Table ) [ ] string {
creates := make ( [ ] string , 0 )
drops := make ( [ ] string , 0 )
comments := make ( [ ] string , 0 )
for _ , index := range indexs {
unique := ""
if index . IsUnique {
unique = "unique"
}
// 如果索引名存在,先删除索引
drops = append ( drops , fmt . Sprintf ( "drop index if exists %s.%s" , pd . dc . Info . CurrentSchema ( ) , index . IndexName ) )
// 取出列名,添加引号
cols := strings . Split ( index . ColumnName , "," )
colNames := make ( [ ] string , len ( cols ) )
for i , name := range cols {
colNames [ i ] = pd . QuoteIdentifier ( name )
}
// 创建索引
creates = append ( creates , fmt . Sprintf ( "CREATE %s INDEX %s on %s.%s(%s)" , unique , pd . QuoteIdentifier ( index . IndexName ) , pd . QuoteIdentifier ( pd . dc . Info . CurrentSchema ( ) ) , pd . QuoteIdentifier ( tableInfo . TableName ) , strings . Join ( colNames , "," ) ) )
if index . IndexComment != "" {
comment := pd . QuoteEscape ( index . IndexComment )
comments = append ( comments , fmt . Sprintf ( "COMMENT ON INDEX %s.%s IS '%s'" , pd . dc . Info . CurrentSchema ( ) , index . IndexName , comment ) )
}
}
sqlArr := make ( [ ] string , 0 )
if len ( drops ) > 0 {
sqlArr = append ( sqlArr , drops ... )
}
if len ( creates ) > 0 {
sqlArr = append ( sqlArr , creates ... )
}
if len ( comments ) > 0 {
sqlArr = append ( sqlArr , comments ... )
}
return sqlArr
2024-03-15 09:01:51 +00:00
}
// UpdateSequence runs, for every identity column in columns, a setval call
// that sets the sequence named "<tableName>_<column>_seq" to the column's
// current maximum value in tableName.
//
// The call is best-effort: the method has no return value, and both the
// result and the error of each statement are discarded.
func (pd *PgsqlDialect) UpdateSequence(tableName string, columns []dbi.Column) {
	for _, col := range columns {
		if !col.IsIdentity {
			continue
		}
		stmt := fmt.Sprintf("select setval('%s_%s_seq', (SELECT max(%s) from %s))", tableName, col.ColumnName, col.ColumnName, tableName)
		_, _ = pd.dc.Exec(stmt)
	}
}
2024-10-16 17:24:50 +08:00
2024-11-01 17:27:22 +08:00
func ( pd * PgsqlDialect ) GetDataHelper ( ) dbi . DataHelper {
2024-11-26 04:04:09 +00:00
return dataHelper
2024-11-01 17:27:22 +08:00
}
func ( pd * PgsqlDialect ) GetColumnHelper ( ) dbi . ColumnHelper {
2024-11-26 04:04:09 +00:00
return columnHelper
2024-11-01 17:27:22 +08:00
}
// GetDumpHelper returns a newly allocated DumpHelper as the dialect's
// dbi.DumpHelper; every call yields a fresh value.
func (pd *PgsqlDialect) GetDumpHelper() dbi.DumpHelper {
	return new(DumpHelper)
}
func ( pd * PgsqlDialect ) genColumnBasicSql ( column dbi . Column ) string {
colName := pd . QuoteIdentifier ( column . ColumnName )
dataType := string ( column . DataType )
// 如果数据类型是数字,则去掉长度
if collx . ArrayAnyMatches ( [ ] string { "int" } , strings . ToLower ( dataType ) ) {
column . NumPrecision = 0
column . CharMaxLength = 0
}
// 如果是自增类型, 需要转换为serial
if column . IsIdentity {
if dataType == "int4" {
column . DataType = "serial"
} else if dataType == "int2" {
column . DataType = "smallserial"
} else if dataType == "int8" {
column . DataType = "bigserial"
} else {
column . DataType = "bigserial"
}
return fmt . Sprintf ( " %s %s NOT NULL" , colName , column . GetColumnType ( ) )
}
nullAble := ""
if ! column . Nullable {
nullAble = " NOT NULL"
}
defVal := "" // 默认值需要判断引号,如函数是不需要引号的 // 为了防止跨源函数不支持 当默认值是函数时,不需要设置默认值
if column . ColumnDefault != "" && ! strings . Contains ( column . ColumnDefault , "(" ) {
mark := false
// 哪些字段类型默认值需要加引号
if collx . ArrayAnyMatches ( [ ] string { "char" , "text" , "date" , "time" , "lob" } , dataType ) {
// 当数据类型是日期时间,默认值是日期时间函数时,默认值不需要引号
if collx . ArrayAnyMatches ( [ ] string { "date" , "time" } , strings . ToLower ( dataType ) ) &&
collx . ArrayAnyMatches ( [ ] string { "date" , "time" } , strings . ToLower ( column . ColumnDefault ) ) {
mark = false
} else {
mark = true
}
}
// 如果数据类型是日期时间,则写死默认值函数
if collx . ArrayAnyMatches ( [ ] string { "date" , "time" } , strings . ToLower ( dataType ) ) {
column . ColumnDefault = "CURRENT_TIMESTAMP"
}
if mark {
defVal = fmt . Sprintf ( " DEFAULT '%s'" , column . ColumnDefault )
} else {
defVal = fmt . Sprintf ( " DEFAULT %s" , column . ColumnDefault )
}
}
// 如果是varchar, 长度翻倍, 防止报错
if collx . ArrayAnyMatches ( [ ] string { "char" } , strings . ToLower ( dataType ) ) {
column . CharMaxLength = column . CharMaxLength * 2
}
columnSql := fmt . Sprintf ( " %s %s%s%s" , colName , column . GetColumnType ( ) , nullAble , defVal )
return columnSql
2024-10-16 17:24:50 +08:00
}