2022-11-06 09:21:32 +00:00
|
|
|
package populatedb
|
|
|
|
|
|
|
|
import (
|
2022-11-06 10:56:31 +00:00
|
|
|
"context"
|
2022-11-06 09:21:32 +00:00
|
|
|
"database/sql"
|
|
|
|
"errors"
|
|
|
|
"fmt"
|
|
|
|
"net/url"
|
2022-11-06 10:56:31 +00:00
|
|
|
"strings"
|
2022-11-06 09:21:32 +00:00
|
|
|
"time"
|
|
|
|
|
|
|
|
"github.com/go-sql-driver/mysql"
|
|
|
|
tblsconfig "github.com/k1LoW/tbls/config"
|
|
|
|
tblsdatasource "github.com/k1LoW/tbls/datasource"
|
|
|
|
tblsschema "github.com/k1LoW/tbls/schema"
|
|
|
|
)
|
|
|
|
|
|
|
|
const (
	// dialectMySQL is the only database dialect NewPopulator accepts; it is
	// also passed to sql.Open as the driver name.
	dialectMySQL = "mysql"

	// maxQuestionMarks is the largest number of "?" placeholders allowed in a
	// single statement: 2^16 - 1.
	//
	// MySQL transmits the parameter count of a prepared statement in a 2-byte
	// field, so 65536 placeholders are rejected by the server with
	// "Prepared statement contains too many placeholders". Using 2^16 here
	// broke full batches for every table whose column count divides 65536.
	maxQuestionMarks = 65535

	// stmtInsert is the fmt template of an INSERT statement. Its verbs are, in
	// order: table name, comma separated column names, and one or more
	// parenthesised placeholder groups.
	stmtInsert = "INSERT INTO %s (%s) VALUES %s;"
)
|
|
|
|
|
2022-11-06 10:56:31 +00:00
|
|
|
// Sentinel errors returned (wrapped) by this package; match them with
// errors.Is.
var (
	// ErrNotSupportDialect reports a database dialect other than MySQL.
	ErrNotSupportDialect = errors.New("not support dialect")

	// ErrTableNotExist reports a table name missing from the analyzed schema.
	ErrTableNotExist = errors.New("table not exist")

	// ErrMaximumQuestionMarks reports a table with so many columns that even
	// one row exceeds the placeholder limit of a single statement.
	ErrMaximumQuestionMarks = errors.New("maximum question marks")
)
|
2022-11-06 09:21:32 +00:00
|
|
|
|
2022-11-06 10:56:31 +00:00
|
|
|
// Populator fills a database table with generated records.
type Populator interface {
	// Insert writes numberRecord generated rows into tableName, executing one
	// single-row INSERT statement per record.
	Insert(ctx context.Context, tableName string, numberRecord int) error

	// InsertBatch writes numberRecord generated rows into tableName using
	// multi-row INSERT statements, splitting the work into several statements
	// when the placeholder limit would otherwise be exceeded.
	InsertBatch(ctx context.Context, tableName string, numberRecord int) error
}
|
2022-11-06 09:21:32 +00:00
|
|
|
|
|
|
|
type populator struct {
|
|
|
|
db *sql.DB
|
|
|
|
tblsSchema *tblsschema.Schema
|
2022-11-06 10:56:31 +00:00
|
|
|
tables map[string]*tblsschema.Table
|
|
|
|
verbose bool
|
|
|
|
dryRun bool
|
2022-11-06 09:21:32 +00:00
|
|
|
}
|
|
|
|
|
2022-11-06 10:56:31 +00:00
|
|
|
func NewPopulator(
|
|
|
|
dbDialect string,
|
|
|
|
dbURL string,
|
|
|
|
verbose bool,
|
|
|
|
dryRun bool,
|
|
|
|
) (Populator, error) {
|
2022-11-06 09:21:32 +00:00
|
|
|
if dbDialect != dialectMySQL {
|
2022-11-06 11:02:49 +00:00
|
|
|
return nil, fmt.Errorf("not support dialect [%s]: %w", dbDialect, ErrNotSupportDialect)
|
2022-11-06 09:21:32 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// https://go.dev/doc/tutorial/database-access
|
|
|
|
mysqlCfg, err := mysql.ParseDSN(dbURL)
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("mysql: failed to parse dsn [%s]: %w", dbURL, err)
|
|
|
|
}
|
|
|
|
|
|
|
|
// https://github.com/go-sql-driver/mysql#timetime-support
|
|
|
|
mysqlCfg.ParseTime = true
|
|
|
|
mysqlCfg.AllowNativePasswords = true
|
|
|
|
mysqlCfg.Loc = time.UTC
|
|
|
|
|
|
|
|
mysqlURL := mysqlCfg.FormatDSN()
|
|
|
|
db, err := sql.Open(dbDialect, mysqlURL)
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("sql: failed to open [%s]: %w", mysqlURL, err)
|
|
|
|
}
|
|
|
|
|
|
|
|
if err := db.Ping(); err != nil {
|
|
|
|
return nil, fmt.Errorf("database: failed to ping [%s] : %w", mysqlURL, err)
|
|
|
|
}
|
|
|
|
|
|
|
|
// https://github.com/k1LoW/tbls
|
|
|
|
// https://stackoverflow.com/q/48671938
|
|
|
|
tblsURL := "mysql://" + mysqlCfg.User + ":" + url.QueryEscape(mysqlCfg.Passwd) + "@" + mysqlCfg.Addr + "/" + mysqlCfg.DBName
|
|
|
|
tblsSchema, err := tblsdatasource.Analyze(tblsconfig.DSN{
|
|
|
|
URL: tblsURL,
|
|
|
|
})
|
|
|
|
if err != nil {
|
|
|
|
return nil, fmt.Errorf("tbls: faield to analyze [%s]: %w", tblsURL, err)
|
|
|
|
}
|
|
|
|
|
2022-11-06 10:56:31 +00:00
|
|
|
tables := make(map[string]*tblsschema.Table, len(tblsSchema.Tables))
|
|
|
|
for _, table := range tblsSchema.Tables {
|
|
|
|
tables[table.Name] = table
|
|
|
|
}
|
|
|
|
|
2022-11-06 09:21:32 +00:00
|
|
|
return &populator{
|
|
|
|
db: db,
|
|
|
|
tblsSchema: tblsSchema,
|
2022-11-06 10:56:31 +00:00
|
|
|
tables: tables,
|
|
|
|
verbose: verbose,
|
|
|
|
dryRun: dryRun,
|
2022-11-06 09:21:32 +00:00
|
|
|
}, nil
|
|
|
|
}
|
2022-11-06 10:56:31 +00:00
|
|
|
|
|
|
|
func (p *populator) Insert(ctx context.Context, tableName string, numberRecord int) error {
|
2022-11-06 16:56:16 +00:00
|
|
|
columnNames, questionMarks, argFns, err := p.prepareInsert(tableName)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
2022-11-06 10:56:31 +00:00
|
|
|
}
|
|
|
|
|
2022-11-06 17:13:18 +00:00
|
|
|
// INSERT INTO table_name (column1, column2, column3) VALUES (?, ?, ?);
|
2022-11-06 10:56:31 +00:00
|
|
|
queryInsert := fmt.Sprintf(stmtInsert,
|
|
|
|
tableName,
|
|
|
|
strings.Join(columnNames, ", "),
|
2022-11-06 16:56:16 +00:00
|
|
|
fmt.Sprintf("(%s)", strings.Join(questionMarks, ", ")),
|
2022-11-06 10:56:31 +00:00
|
|
|
)
|
|
|
|
|
|
|
|
for i := 0; i < numberRecord; i++ {
|
2022-11-06 16:56:16 +00:00
|
|
|
// Generate each time insert for different value
|
2022-11-06 10:56:31 +00:00
|
|
|
args := make([]any, 0, len(argFns))
|
|
|
|
for _, argFn := range argFns {
|
|
|
|
args = append(args, argFn())
|
|
|
|
}
|
|
|
|
|
|
|
|
if p.verbose {
|
2022-11-06 17:31:03 +00:00
|
|
|
fmt.Printf("Index: [%d]\n", i)
|
2022-11-06 10:56:31 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
if !p.dryRun {
|
|
|
|
if _, err := p.db.ExecContext(ctx, queryInsert, args...); err != nil {
|
|
|
|
return fmt.Errorf("database: failed to exec [%s]: %w", queryInsert, err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
2022-11-06 16:56:16 +00:00
|
|
|
|
2022-11-06 17:13:18 +00:00
|
|
|
func (p *populator) InsertBatch(ctx context.Context, tableName string, numberRecord int) error {
|
2022-11-06 16:56:16 +00:00
|
|
|
columnNames, questionMarks, argFns, err := p.prepareInsert(tableName)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
if len(columnNames) == 0 {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
numberRecordEachBatch := maxQuestionMarks / len(questionMarks)
|
|
|
|
if numberRecordEachBatch == 0 {
|
2022-11-06 17:13:18 +00:00
|
|
|
return fmt.Errorf("maximum question marks [%d]: %w", len(questionMarks), ErrMaximumQuestionMarks)
|
2022-11-06 16:56:16 +00:00
|
|
|
}
|
|
|
|
|
2022-11-06 17:16:36 +00:00
|
|
|
// Because the numberRecordLastBatch may less than numberRecordEachBatch
|
|
|
|
// For example
|
|
|
|
// numberRecord := 120
|
|
|
|
// numberRecordEachBatch := 50
|
|
|
|
// numberBatch := 120/50 + 1 = 3
|
|
|
|
// First 2 batches => 50 * 2 = 100
|
|
|
|
// Last batch => 120 - 100 = 20
|
2022-11-06 16:56:16 +00:00
|
|
|
numberBatch := numberRecord/numberRecordEachBatch + 1
|
|
|
|
numberRecordLastBatch := numberRecord - (numberBatch-1)*numberRecordEachBatch
|
|
|
|
|
|
|
|
generateQueryArgsInsertFn := func(tempNumberRecord int) (string, []any) {
|
|
|
|
valuesQuestionMarks := make([]string, 0, tempNumberRecord)
|
|
|
|
argsInsert := make([]any, 0, tempNumberRecord*len(argFns))
|
|
|
|
for i := 0; i < tempNumberRecord; i++ {
|
2022-11-06 17:16:36 +00:00
|
|
|
// (?, ?, ?)
|
2022-11-06 16:56:16 +00:00
|
|
|
valuesQuestionMarks = append(valuesQuestionMarks, fmt.Sprintf("(%s)", strings.Join(questionMarks, ", ")))
|
|
|
|
|
|
|
|
// Generate each time insert for different value
|
|
|
|
args := make([]any, 0, len(argFns))
|
|
|
|
for _, argFn := range argFns {
|
|
|
|
args = append(args, argFn())
|
|
|
|
}
|
|
|
|
argsInsert = append(argsInsert, args...)
|
|
|
|
}
|
|
|
|
|
2022-11-06 17:13:18 +00:00
|
|
|
// INSERT INTO table_name (column1, column2, column3) VALUES (?, ?, ?), (?, ?, ?), (?, ?, ?);
|
2022-11-06 16:56:16 +00:00
|
|
|
queryInsert := fmt.Sprintf(stmtInsert,
|
|
|
|
tableName,
|
|
|
|
strings.Join(columnNames, ", "),
|
|
|
|
strings.Join(valuesQuestionMarks, ", "),
|
|
|
|
)
|
|
|
|
|
|
|
|
return queryInsert, argsInsert
|
|
|
|
}
|
|
|
|
|
|
|
|
for i := 0; i < numberBatch-1; i++ {
|
|
|
|
queryInsert, argsInsert := generateQueryArgsInsertFn(numberRecordEachBatch)
|
|
|
|
|
|
|
|
if p.verbose {
|
2022-11-06 17:31:03 +00:00
|
|
|
fmt.Printf("Index: [%d]\n", i)
|
2022-11-06 16:56:16 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
if !p.dryRun {
|
|
|
|
if _, err := p.db.ExecContext(ctx, queryInsert, argsInsert...); err != nil {
|
|
|
|
return fmt.Errorf("database: failed to exec [%s]: %w", queryInsert, err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
{
|
|
|
|
// Last batch
|
|
|
|
queryInsert, argsInsert := generateQueryArgsInsertFn(numberRecordLastBatch)
|
|
|
|
|
|
|
|
if p.verbose {
|
2022-11-06 17:31:03 +00:00
|
|
|
fmt.Printf("Index: [%d]\n", numberBatch-1)
|
2022-11-06 16:56:16 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
if !p.dryRun {
|
|
|
|
if _, err := p.db.ExecContext(ctx, queryInsert, argsInsert...); err != nil {
|
|
|
|
return fmt.Errorf("database: failed to exec [%s]: %w", queryInsert, err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// Return columnNames, questionMarks, argFns
|
2022-12-05 08:44:16 +00:00
|
|
|
func (p *populator) prepareInsert(tableName string) (columnNames, questionMarks []string, argFns []func() any, err error) {
|
2022-11-06 16:56:16 +00:00
|
|
|
table, ok := p.tables[tableName]
|
|
|
|
if !ok {
|
|
|
|
return nil, nil, nil, fmt.Errorf("table [%s] not exist: %w", tableName, ErrTableNotExist)
|
|
|
|
}
|
|
|
|
|
2022-12-05 08:44:16 +00:00
|
|
|
columnNames = make([]string, 0, len(table.Columns))
|
|
|
|
questionMarks = make([]string, 0, len(table.Columns))
|
|
|
|
argFns = make([]func() any, 0, len(table.Columns))
|
2022-11-06 16:56:16 +00:00
|
|
|
for _, column := range table.Columns {
|
2022-11-06 17:35:44 +00:00
|
|
|
dt, err := ParseDatabaseType(column)
|
2022-11-06 16:56:16 +00:00
|
|
|
if err != nil {
|
|
|
|
return nil, nil, nil, fmt.Errorf("failed to parse database type [%s]: %w", column.Type, err)
|
|
|
|
}
|
|
|
|
|
|
|
|
columnNames = append(columnNames, column.Name)
|
|
|
|
questionMarks = append(questionMarks, "?")
|
|
|
|
argFns = append(argFns, dt.Generate)
|
|
|
|
}
|
|
|
|
|
|
|
|
return columnNames, questionMarks, argFns, nil
|
|
|
|
}
|