telegraf/plugins/outputs/sql/sql.go

298 lines
7.6 KiB
Go
Raw Normal View History

//go:generate ../../../tools/readme_config_includer/generator
2021-06-04 12:49:55 +08:00
package sql
import (
gosql "database/sql"
_ "embed"
2021-06-04 12:49:55 +08:00
"fmt"
"strings"
"time"
2021-06-04 12:49:55 +08:00
// Register SQL drivers
_ "github.com/ClickHouse/clickhouse-go" // clickhouse
_ "github.com/denisenkom/go-mssqldb" // mssql (sql server)
_ "github.com/go-sql-driver/mysql" // mysql
_ "github.com/jackc/pgx/v4/stdlib" // pgx (postgres)
_ "github.com/snowflakedb/gosnowflake" // snowflake
2021-06-04 12:49:55 +08:00
"github.com/influxdata/telegraf"
"github.com/influxdata/telegraf/plugins/outputs"
)
// sampleConfig holds the contents of sample.conf, embedded at build time via
// the go:embed directive below.
//
//go:embed sample.conf
var sampleConfig string
2021-06-04 12:49:55 +08:00
// ConvertStruct holds the SQL type names that are written verbatim into the
// column definitions of a generated CREATE TABLE statement.
type ConvertStruct struct {
	// Integer is the column type used for int64 field values.
	Integer string
	// Real is the column type used for float64 field values.
	Real string
	// Text is the column type used for string field values and for tag columns.
	Text string
	// Timestamp is the column type used for the timestamp column.
	Timestamp string
	// Defaultvalue is the column type used for field values of any other Go type.
	Defaultvalue string
	// Unsigned is used for uint64 field values; see ConversionStyle.
	Unsigned string
	// Bool is the column type used for bool field values.
	Bool string
	// ConversionStyle selects how the uint64 column type is built:
	// "unsigned_suffix" yields "<Integer> <Unsigned>", "literal" yields
	// Unsigned on its own.
	ConversionStyle string
}
type SQL struct {
Driver string
DataSourceName string
TimestampColumn string
TableTemplate string
TableExistsTemplate string
InitSQL string `toml:"init_sql"`
Convert ConvertStruct
ConnectionMaxIdleTime time.Duration
ConnectionMaxLifetime time.Duration
ConnectionMaxIdle int
ConnectionMaxOpen int
2021-06-04 12:49:55 +08:00
db *gosql.DB
Log telegraf.Logger `toml:"-"`
tables map[string]bool
}
// SampleConfig returns the embedded sample configuration of the plugin.
func (*SQL) SampleConfig() string {
	return sampleConfig
}
2021-06-04 12:49:55 +08:00
func (p *SQL) Connect() error {
db, err := gosql.Open(p.Driver, p.DataSourceName)
if err != nil {
return err
}
err = db.Ping()
if err != nil {
return err
}
db.SetConnMaxIdleTime(p.ConnectionMaxIdleTime)
db.SetConnMaxLifetime(p.ConnectionMaxLifetime)
db.SetMaxIdleConns(p.ConnectionMaxIdle)
db.SetMaxOpenConns(p.ConnectionMaxOpen)
2021-06-04 12:49:55 +08:00
if p.InitSQL != "" {
_, err = db.Exec(p.InitSQL)
if err != nil {
return err
}
}
p.db = db
p.tables = make(map[string]bool)
return nil
}
// Close closes the database handle opened by Connect. It is a no-op when no
// handle is present, e.g. because Connect was never called or failed.
func (p *SQL) Close() error {
	if p.db == nil {
		return nil
	}
	return p.db.Close()
}
// Quote an identifier (table or column name)
func quoteIdent(name string) string {
return `"` + strings.ReplaceAll(sanitizeQuoted(name), `"`, `""`) + `"`
2021-06-04 12:49:55 +08:00
}
// quoteStr quotes a string literal: embedded single quotes are doubled and
// the result is wrapped in single quotes.
func quoteStr(name string) string {
	return "'" + strings.ReplaceAll(name, "'", "''") + "'"
}
// sanitizeQuoted returns in with every rune outside the range U+0001..U+FFFF
// replaced by an underscore; all other runes are kept unchanged.
//
// The permitted range follows the identifier rules documented at
// https://dev.mysql.com/doc/refman/8.0/en/identifiers.html and
// https://www.postgresql.org/docs/13/sql-syntax-lexical.html#SQL-SYNTAX-IDENTIFIERS
func sanitizeQuoted(in string) string {
	// Allow-list: anything not explicitly permitted becomes '_'.
	keepOrUnderscore := func(r rune) rune {
		if r < '\u0001' || r > '\uFFFF' {
			return '_'
		}
		return r
	}
	return strings.Map(keepOrUnderscore, in)
}
func (p *SQL) deriveDatatype(value interface{}) string {
var datatype string
switch value.(type) {
case int64:
datatype = p.Convert.Integer
case uint64:
2022-03-03 23:21:39 +08:00
if p.Convert.ConversionStyle == "unsigned_suffix" {
datatype = fmt.Sprintf("%s %s", p.Convert.Integer, p.Convert.Unsigned)
} else if p.Convert.ConversionStyle == "literal" {
datatype = p.Convert.Unsigned
} else {
p.Log.Errorf("unknown converstaion style: %s", p.Convert.ConversionStyle)
}
2021-06-04 12:49:55 +08:00
case float64:
datatype = p.Convert.Real
case string:
datatype = p.Convert.Text
case bool:
datatype = p.Convert.Bool
2021-06-04 12:49:55 +08:00
default:
datatype = p.Convert.Defaultvalue
p.Log.Errorf("Unknown datatype: '%T' %v", value, value)
}
return datatype
}
func (p *SQL) generateCreateTable(metric telegraf.Metric) string {
columns := make([]string, 0, len(metric.TagList())+len(metric.FieldList())+1)
2021-06-04 12:49:55 +08:00
// ## {KEY_COLUMNS} is a comma-separated list of key columns (timestamp and tags)
//var pk []string
if p.TimestampColumn != "" {
//pk = append(pk, quoteIdent(p.TimestampColumn))
columns = append(columns, fmt.Sprintf("%s %s", quoteIdent(p.TimestampColumn), p.Convert.Timestamp))
}
for _, tag := range metric.TagList() {
//pk = append(pk, quoteIdent(tag.Key))
columns = append(columns, fmt.Sprintf("%s %s", quoteIdent(tag.Key), p.Convert.Text))
}
var datatype string
for _, field := range metric.FieldList() {
datatype = p.deriveDatatype(field.Value)
columns = append(columns, fmt.Sprintf("%s %s", quoteIdent(field.Key), datatype))
}
query := p.TableTemplate
query = strings.ReplaceAll(query, "{TABLE}", quoteIdent(metric.Name()))
query = strings.ReplaceAll(query, "{TABLELITERAL}", quoteStr(metric.Name()))
query = strings.ReplaceAll(query, "{COLUMNS}", strings.Join(columns, ","))
//query = strings.ReplaceAll(query, "{KEY_COLUMNS}", strings.Join(pk, ","))
2021-06-04 12:49:55 +08:00
return query
}
func (p *SQL) generateInsert(tablename string, columns []string) string {
placeholders := make([]string, 0, len(columns))
quotedColumns := make([]string, 0, len(columns))
2021-06-04 12:49:55 +08:00
for _, column := range columns {
quotedColumns = append(quotedColumns, quoteIdent(column))
}
if p.Driver == "pgx" {
// Postgres uses $1 $2 $3 as placeholders
for i := 0; i < len(columns); i++ {
placeholders = append(placeholders, fmt.Sprintf("$%d", i+1))
}
} else {
// Everything else uses ? ? ? as placeholders
for i := 0; i < len(columns); i++ {
placeholders = append(placeholders, "?")
}
}
return fmt.Sprintf("INSERT INTO %s(%s) VALUES(%s)",
quoteIdent(tablename),
strings.Join(quotedColumns, ","),
strings.Join(placeholders, ","))
}
func (p *SQL) tableExists(tableName string) bool {
stmt := strings.ReplaceAll(p.TableExistsTemplate, "{TABLE}", quoteIdent(tableName))
2021-06-04 12:49:55 +08:00
_, err := p.db.Exec(stmt)
return err == nil
}
func (p *SQL) Write(metrics []telegraf.Metric) error {
var err error
2021-06-04 12:49:55 +08:00
for _, metric := range metrics {
tablename := metric.Name()
// create table if needed
if !p.tables[tablename] && !p.tableExists(tablename) {
createStmt := p.generateCreateTable(metric)
_, err := p.db.Exec(createStmt)
if err != nil {
return err
}
}
p.tables[tablename] = true
2021-06-04 12:49:55 +08:00
var columns []string
var values []interface{}
if p.TimestampColumn != "" {
columns = append(columns, p.TimestampColumn)
values = append(values, metric.Time())
}
for column, value := range metric.Tags() {
columns = append(columns, column)
values = append(values, value)
}
for column, value := range metric.Fields() {
columns = append(columns, column)
values = append(values, value)
}
sql := p.generateInsert(tablename, columns)
switch p.Driver {
case "clickhouse":
// ClickHouse needs to batch inserts with prepared statements
tx, err := p.db.Begin()
if err != nil {
return fmt.Errorf("begin failed: %v", err)
}
stmt, err := tx.Prepare(sql)
if err != nil {
return fmt.Errorf("prepare failed: %v", err)
}
defer stmt.Close() //nolint:revive // We cannot do anything about a failing close.
_, err = stmt.Exec(values...)
if err != nil {
return fmt.Errorf("execution failed: %v", err)
}
err = tx.Commit()
if err != nil {
return fmt.Errorf("commit failed: %v", err)
}
default:
_, err = p.db.Exec(sql, values...)
if err != nil {
return fmt.Errorf("execution failed: %v", err)
}
2021-06-04 12:49:55 +08:00
}
}
return nil
}
func init() {
outputs.Add("sql", func() telegraf.Output { return newSQL() })
}
func newSQL() *SQL {
return &SQL{
TableTemplate: "CREATE TABLE {TABLE}({COLUMNS})",
TableExistsTemplate: "SELECT 1 FROM {TABLE} LIMIT 1",
TimestampColumn: "timestamp",
Convert: ConvertStruct{
2022-03-03 23:21:39 +08:00
Integer: "INT",
Real: "DOUBLE",
Text: "TEXT",
Timestamp: "TIMESTAMP",
Defaultvalue: "TEXT",
Unsigned: "UNSIGNED",
Bool: "BOOL",
ConversionStyle: "unsigned_suffix",
2021-06-04 12:49:55 +08:00
},
// Defaults for the connection settings (ConnectionMaxIdleTime,
// ConnectionMaxLifetime, ConnectionMaxIdle, and ConnectionMaxOpen)
// mirror the golang defaults. As of go 1.18 all of them default to 0
// except max idle connections which is 2. See
// https://pkg.go.dev/database/sql#DB.SetMaxIdleConns
ConnectionMaxIdle: 2,
2021-06-04 12:49:55 +08:00
}
}