// components-contrib/state/postgresql/postgresdbaccess.go
//
// 665 lines
// 15 KiB
// Go

/*
Copyright 2021 The Dapr Authors
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
package postgresql
import (
"context"
"database/sql"
"encoding/base64"
"encoding/json"
"errors"
"fmt"
"strconv"
"strings"
"time"
"github.com/dapr/components-contrib/metadata"
"github.com/dapr/components-contrib/state"
"github.com/dapr/components-contrib/state/query"
stateutils "github.com/dapr/components-contrib/state/utils"
"github.com/dapr/kit/logger"
"github.com/dapr/kit/ptr"
// Blank import for the underlying Postgres driver.
_ "github.com/jackc/pgx/v5/stdlib"
)
const (
// defaultTableName is the table name used when the component metadata does not set TableName.
defaultTableName = "state"
// cleanupIntervalKey is the metadata property read by parseMetadata to configure
// how often expired rows are removed. A non-positive value disables the cleanup.
cleanupIntervalKey = "cleanupIntervalInSeconds"
// defaultCleanupInternal is the cleanup interval applied when cleanupIntervalKey is missing or empty.
defaultCleanupInternal = 3600 // In seconds = 1 hour
)
// errMissingConnectionString is returned by parseMetadata when the decoded metadata has an empty ConnectionString.
var errMissingConnectionString = errors.New("missing connection string")
// postgresDBAccess implements dbaccess.
// It holds the database handle and the configuration parsed by Init, plus the
// state needed to run and stop the background cleanup of expired rows.
type postgresDBAccess struct {
// logger receives the diagnostic output of every operation.
logger logger.Logger
// metadata is the component configuration decoded by parseMetadata.
metadata postgresMetadataStruct
// cleanupInterval is the period between cleanups of expired rows; nil disables the cleanup.
cleanupInterval *time.Duration
// db is the connection pool opened by Init and closed by Close.
db *sql.DB
// ctx is created by Init; the cleanup goroutine exits when it is done.
ctx context.Context
// cancel cancels ctx; Close calls it and then resets it to nil.
cancel context.CancelFunc
}
// newPostgresDBAccess returns a postgresDBAccess that only has its logger set.
// The database connection and the remaining fields are populated by Init.
func newPostgresDBAccess(logger logger.Logger) *postgresDBAccess {
	logger.Debug("Instantiating new Postgres state store")

	access := new(postgresDBAccess)
	access.logger = logger
	return access
}
// postgresMetadataStruct is the component configuration decoded from the
// metadata properties by parseMetadata.
type postgresMetadataStruct struct {
// ConnectionString is handed to sql.Open by Init; parseMetadata rejects an empty value.
ConnectionString string
// ConnectionMaxIdleTime is applied to the pool through SetConnMaxIdleTime.
ConnectionMaxIdleTime time.Duration
TableName string // Could be in the format "schema.table" or just "table"
}
// Init sets up Postgres connection and ensures that the state table exists.
//
// It parses the component metadata, opens the connection pool, verifies
// connectivity with a ping, creates or upgrades the state table and finally
// schedules the background cleanup of expired rows.
//
// If any step fails, the context created here is cancelled and the pool (if
// one was opened) is closed before the error is returned, so a failed Init
// does not leave connections behind. p.db keeps pointing at the closed pool,
// which makes a later Close a harmless no-op.
func (p *postgresDBAccess) Init(meta state.Metadata) error {
	p.logger.Debug("Initializing Postgres state store")
	p.ctx, p.cancel = context.WithCancel(context.Background())

	var (
		db  *sql.DB
		err error
	)
	// abort releases everything acquired so far and passes the cause through.
	abort := func(cause error) error {
		p.cancel()
		if db != nil {
			// The original failure is more useful to the caller than a close error.
			_ = db.Close()
		}
		return cause
	}

	if err = p.parseMetadata(meta); err != nil {
		p.logger.Errorf("Failed to parse metadata: %v", err)
		return abort(err)
	}

	if db, err = sql.Open("pgx", p.metadata.ConnectionString); err != nil {
		p.logger.Error(err)
		return abort(err)
	}
	p.db = db

	// sql.Open does not necessarily connect; Ping surfaces connection problems now.
	if err = db.Ping(); err != nil {
		return abort(err)
	}

	db.SetConnMaxIdleTime(p.metadata.ConnectionMaxIdleTime)

	if err = p.ensureStateTable(p.metadata.TableName); err != nil {
		return abort(err)
	}

	p.scheduleCleanupExpiredData()
	return nil
}
// parseMetadata decodes the component metadata into p.metadata and derives
// the cleanup interval.
//
// The table name defaults to defaultTableName. An empty connection string
// yields errMissingConnectionString. When cleanupIntervalKey is absent or
// empty the default interval is used; a value that is not an integer is an
// error; a non-positive value leaves p.cleanupInterval untouched, which
// disables the automatic cleanup when it has not been set before.
func (p *postgresDBAccess) parseMetadata(meta state.Metadata) error {
	parsed := postgresMetadataStruct{TableName: defaultTableName}
	if decodeErr := metadata.DecodeMetadata(meta.Properties, &parsed); decodeErr != nil {
		return decodeErr
	}
	p.metadata = parsed

	if parsed.ConnectionString == "" {
		return errMissingConnectionString
	}

	raw, found := meta.Properties[cleanupIntervalKey]
	if !found || raw == "" {
		p.cleanupInterval = ptr.Of(defaultCleanupInternal * time.Second)
		return nil
	}

	seconds, parseErr := strconv.ParseInt(raw, 10, 0)
	if parseErr != nil {
		return fmt.Errorf("invalid value for '%s': %s", cleanupIntervalKey, raw)
	}

	// Non-positive value from meta means disable auto cleanup.
	if seconds > 0 {
		p.cleanupInterval = ptr.Of(time.Duration(seconds) * time.Second)
	}
	return nil
}
// dbExecer is the statement-execution method shared by *sql.DB and *sql.Tx.
// The write helpers accept it so the same code can run either directly on the
// connection pool or inside a transaction owned by the caller.
type dbExecer interface {
	Exec(stmt string, args ...any) (sql.Result, error)
}

// Set makes an insert or update to the database.
// It runs as a single statement directly on the connection pool; see doSet
// for the details of the operation.
func (p *postgresDBAccess) Set(req *state.SetRequest) error {
	return p.doSet(p.db, req)
}

// doSet performs the upsert described by req using db, which is either the
// connection pool or an open transaction.
//
// Byte-slice values are base64-encoded and stored with isbinary = true; every
// value is serialized to JSON. A TTL found in the request metadata becomes
// the row's expiredate, otherwise expiredate is NULL.
//
// Without an ETag the row is inserted, and on a key conflict it is overwritten
// unless the request asks for first-write concurrency, in which case the
// conflict is returned as an error. With an ETag only a row whose xmin equals
// the ETag is updated; a malformed ETag yields an ETagInvalid error and an
// update that touches no row yields an ETagMismatch error.
func (p *postgresDBAccess) doSet(db dbExecer, req *state.SetRequest) error {
	err := state.CheckRequestOptions(req.Options)
	if err != nil {
		return err
	}

	if req.Key == "" {
		return errors.New("missing key in set operation")
	}

	if v, ok := req.Value.(string); ok && v == "" {
		return errors.New("empty string is not allowed in set operation")
	}

	v := req.Value
	byteArray, isBinary := req.Value.([]uint8)
	if isBinary {
		v = base64.StdEncoding.EncodeToString(byteArray)
	}

	// Convert to json string
	bt, err := stateutils.Marshal(v, json.Marshal)
	if err != nil {
		return fmt.Errorf("error serializing value: %w", err)
	}
	value := string(bt)

	// TTL
	var ttlSeconds int
	ttl, ttlerr := stateutils.ParseTTL(req.Metadata)
	if ttlerr != nil {
		return fmt.Errorf("error parsing TTL: %w", ttlerr)
	}
	if ttl != nil {
		ttlSeconds = *ttl
	}

	hasETag := req.ETag != nil && *req.ETag != ""

	// Sprintf is required for table name because sql.DB does not substitute parameters for table names.
	// Other parameters use sql.DB parameter substitution.
	var (
		stmt   string
		params []any
	)
	if !hasETag {
		if req.Options.Concurrency == state.FirstWrite {
			stmt = `INSERT INTO %[1]s
(key, value, isbinary, expiredate)
VALUES
($1, $2, $3, %[2]s)`
		} else {
			stmt = `INSERT INTO %[1]s
(key, value, isbinary, expiredate)
VALUES
($1, $2, $3, %[2]s)
ON CONFLICT (key)
DO UPDATE SET
value = $2,
isbinary = $3,
updatedate = CURRENT_TIMESTAMP,
expiredate = %[2]s`
		}
		params = []any{req.Key, value, isBinary}
	} else {
		// Convert req.ETag to uint32 for postgres XID compatibility
		var etag64 uint64
		etag64, err = strconv.ParseUint(*req.ETag, 10, 32)
		if err != nil {
			return state.NewETagError(state.ETagInvalid, err)
		}
		stmt = `UPDATE %[1]s
SET
value = $1,
isbinary = $2,
updatedate = CURRENT_TIMESTAMP,
expiredate = %[2]s
WHERE
key = $3
AND xmin = $4`
		params = []any{value, isBinary, req.Key, uint32(etag64)}
	}

	// ttlSeconds is an integer parsed above, so formatting it into the statement is safe.
	expireExpr := "NULL"
	if ttlSeconds > 0 {
		expireExpr = "CURRENT_TIMESTAMP + interval '" + strconv.Itoa(ttlSeconds) + " seconds'"
	}

	result, err := db.Exec(fmt.Sprintf(stmt, p.metadata.TableName, expireExpr), params...)
	if err != nil {
		if hasETag {
			return state.NewETagError(state.ETagMismatch, err)
		}
		return err
	}

	rows, err := result.RowsAffected()
	if err != nil {
		return err
	}
	if rows != 1 {
		// With an ETag, zero affected rows means no row matched key and xmin.
		if hasETag {
			return state.NewETagError(state.ETagMismatch, nil)
		}
		return errors.New("no item was updated")
	}

	return nil
}

// BulkSet applies every set request inside one transaction: either all of
// them are stored or, when any request fails, none of them is.
func (p *postgresDBAccess) BulkSet(req []state.SetRequest) error {
	tx, err := p.db.Begin()
	if err != nil {
		return err
	}
	// After a successful Commit this Rollback only returns sql.ErrTxDone.
	defer tx.Rollback()

	for i := range req {
		if err = p.doSet(tx, &req[i]); err != nil {
			return err
		}
	}

	return tx.Commit()
}

// Get returns data from the database. If data does not exist for the key an empty state.GetResponse will be returned.
// A row whose expiredate lies in the past is treated as not existing. Values
// stored as binary are base64-decoded before being returned. The row's xmin
// is returned as the ETag.
func (p *postgresDBAccess) Get(req *state.GetRequest) (*state.GetResponse, error) {
	if req.Key == "" {
		return nil, errors.New("missing key in get operation")
	}

	var (
		value    []byte
		isBinary bool
		etag     uint64 // Postgres uses uint32, but FormatUint requires uint64, so using uint64 directly to avoid re-allocations
	)
	// The parentheses are required: AND binds tighter than OR, so without them
	// the expiry condition alone could match rows that belong to other keys.
	stmt := `SELECT
value, isbinary, xmin AS etag
FROM %s
WHERE
key = $1
AND (expiredate IS NULL OR expiredate >= CURRENT_TIMESTAMP)`
	err := p.db.
		QueryRow(fmt.Sprintf(stmt, p.metadata.TableName), req.Key).
		Scan(&value, &isBinary, &etag)
	if err != nil {
		// If no rows exist, return an empty response, otherwise return the error.
		if errors.Is(err, sql.ErrNoRows) {
			return &state.GetResponse{}, nil
		}
		return nil, err
	}

	data := value
	if isBinary {
		// Binary values are stored as a JSON string holding base64 text.
		var s string
		if err = json.Unmarshal(value, &s); err != nil {
			return nil, err
		}
		if data, err = base64.StdEncoding.DecodeString(s); err != nil {
			return nil, err
		}
	}

	return &state.GetResponse{
		Data:     data,
		ETag:     ptr.Of(strconv.FormatUint(etag, 10)),
		Metadata: req.Metadata,
	}, nil
}

// Delete removes an item from the state store.
// It runs as a single statement directly on the connection pool; see
// doDelete for the details of the operation.
func (p *postgresDBAccess) Delete(req *state.DeleteRequest) error {
	return p.doDelete(p.db, req)
}

// doDelete removes the row for req.Key from the configured state table using
// db, which is either the connection pool or an open transaction.
//
// Without an ETag, deleting a key that does not exist is not an error. With
// an ETag the row is removed only when its xmin equals the ETag: a malformed
// ETag yields an ETagInvalid error and a delete that does not remove exactly
// one row yields an ETagMismatch error.
func (p *postgresDBAccess) doDelete(db dbExecer, req *state.DeleteRequest) error {
	if req.Key == "" {
		return errors.New("missing key in delete operation")
	}

	hasETag := req.ETag != nil && *req.ETag != ""

	var (
		result sql.Result
		err    error
	)
	// Sprintf is required for the table name because it cannot be a statement parameter.
	if !hasETag {
		result, err = db.Exec(
			fmt.Sprintf("DELETE FROM %s WHERE key = $1", p.metadata.TableName),
			req.Key,
		)
	} else {
		// Convert req.ETag to uint32 for postgres XID compatibility
		var etag64 uint64
		etag64, err = strconv.ParseUint(*req.ETag, 10, 32)
		if err != nil {
			return state.NewETagError(state.ETagInvalid, err)
		}
		result, err = db.Exec(
			fmt.Sprintf("DELETE FROM %s WHERE key = $1 AND xmin = $2", p.metadata.TableName),
			req.Key, uint32(etag64),
		)
	}
	if err != nil {
		return err
	}

	rows, err := result.RowsAffected()
	if err != nil {
		return err
	}
	if rows != 1 && hasETag {
		return state.NewETagError(state.ETagMismatch, nil)
	}

	return nil
}

// BulkDelete applies every delete request inside one transaction: either all
// of them take effect or, when any request fails, none of them does.
func (p *postgresDBAccess) BulkDelete(req []state.DeleteRequest) error {
	tx, err := p.db.Begin()
	if err != nil {
		return err
	}
	// After a successful Commit this Rollback only returns sql.ErrTxDone.
	defer tx.Rollback()

	for i := range req {
		if err = p.doDelete(tx, &req[i]); err != nil {
			return err
		}
	}

	return tx.Commit()
}

// ExecuteMulti runs the upsert and delete operations of request, in order,
// inside one transaction. The transaction is rolled back when an operation
// fails, carries a request of the wrong type, or has an unsupported kind.
func (p *postgresDBAccess) ExecuteMulti(request *state.TransactionalStateRequest) error {
	tx, err := p.db.Begin()
	if err != nil {
		return err
	}
	// After a successful Commit this Rollback only returns sql.ErrTxDone.
	defer tx.Rollback()

	for _, o := range request.Operations {
		switch o.Operation {
		case state.Upsert:
			var setReq state.SetRequest
			setReq, err = getSet(o)
			if err != nil {
				return err
			}
			if err = p.doSet(tx, &setReq); err != nil {
				return err
			}

		case state.Delete:
			var delReq state.DeleteRequest
			delReq, err = getDelete(o)
			if err != nil {
				return err
			}
			if err = p.doDelete(tx, &delReq); err != nil {
				return err
			}

		default:
			return fmt.Errorf("unsupported operation: %s", o.Operation)
		}
	}

	return tx.Commit()
}
// Query executes a query against store.
// The request is translated by the query builder into a statement for the
// configured table and then executed. On failure an empty response is
// returned together with the error.
func (p *postgresDBAccess) Query(req *state.QueryRequest) (*state.QueryResponse, error) {
	pgQuery := &Query{
		params:    []any{},
		tableName: p.metadata.TableName,
	}

	builder := query.NewQueryBuilder(pgQuery)
	if buildErr := builder.BuildQuery(&req.Query); buildErr != nil {
		return &state.QueryResponse{}, buildErr
	}

	results, token, execErr := pgQuery.execute(p.logger, p.db)
	if execErr != nil {
		return &state.QueryResponse{}, execErr
	}

	resp := &state.QueryResponse{
		Results: results,
		Token:   token,
	}
	return resp, nil
}
// scheduleCleanupExpiredData starts a goroutine that calls cleanupTimeout
// every p.cleanupInterval. It does nothing when the interval is nil. The
// goroutine stops, and releases its ticker, once p.ctx is done.
func (p *postgresDBAccess) scheduleCleanupExpiredData() {
	if p.cleanupInterval == nil {
		return
	}

	p.logger.Infof("Schedule expired data clean up every %d seconds", int(p.cleanupInterval.Seconds()))

	ticker := time.NewTicker(*p.cleanupInterval)
	go func() {
		// Stop the ticker on exit so its resources are released.
		defer ticker.Stop()
		for {
			select {
			case <-ticker.C:
				p.cleanupTimeout()
			case <-p.ctx.Done():
				p.logger.Debug("Stopped background cleanup of expired data")
				return
			}
		}
	}()
}
// cleanupTimeout deletes, inside a transaction, every row of the state table
// whose expiredate is set and lies in the past. Failures are logged and not
// returned; on success the number of removed rows is logged at debug level.
func (p *postgresDBAccess) cleanupTimeout() {
	ctx, cancel := context.WithCancel(context.Background())
	defer cancel()

	tx, beginErr := p.db.BeginTx(ctx, nil)
	if beginErr != nil {
		p.logger.Errorf("Error removing expired data: failed to begin transaction: %v", beginErr)
		return
	}
	// Rolls back on every early return; has no effect after a successful commit.
	defer tx.Rollback()

	deleteExpired := fmt.Sprintf(`DELETE FROM %s WHERE expiredate IS NOT NULL AND expiredate < CURRENT_TIMESTAMP`, p.metadata.TableName)
	outcome, execErr := tx.Exec(deleteExpired)
	if execErr != nil {
		p.logger.Errorf("Error removing expired data: failed to execute query: %v", execErr)
		return
	}

	removed, countErr := outcome.RowsAffected()
	if countErr != nil {
		p.logger.Errorf("Error removing expired data: failed to count affected rows: %v", countErr)
		return
	}

	if commitErr := tx.Commit(); commitErr != nil {
		p.logger.Errorf("Error removing expired data: failed to commit transaction: %v", commitErr)
		return
	}

	p.logger.Debugf("Removed %d expired rows", removed)
}
// Close implements io.Close.
// It cancels the context watched by the background cleanup and closes the
// connection pool when one was opened, returning the pool's close error.
func (p *postgresDBAccess) Close() error {
	if stop := p.cancel; stop != nil {
		stop()
		p.cancel = nil
	}

	if p.db == nil {
		return nil
	}
	return p.db.Close()
}
// ensureStateTable makes sure the state table is usable: it creates the table
// when it does not exist, and otherwise adds the "expiredate" column when the
// existing table lacks it.
func (p *postgresDBAccess) ensureStateTable(stateTableName string) error {
	found, schema, table, err := tableExists(p.db, stateTableName)
	if err != nil {
		return err
	}

	// Missing table: create it with the full set of columns and stop.
	if !found {
		p.logger.Infof("Creating Postgres state table '%s'", stateTableName)
		createStmt := fmt.Sprintf(
			`CREATE TABLE %s (
key text NOT NULL PRIMARY KEY,
value jsonb NOT NULL,
isbinary boolean NOT NULL,
insertdate TIMESTAMP WITH TIME ZONE NOT NULL DEFAULT NOW(),
updatedate TIMESTAMP WITH TIME ZONE NULL,
expiredate TIMESTAMP WITH TIME ZONE
)`,
			stateTableName,
		)
		if _, err = p.db.Exec(createStmt); err != nil {
			return fmt.Errorf("failed to create state table: %w", err)
		}
		return nil
	}

	// Existing table: it must have the "expiredate" column.
	hasColumn, err := tableHasExpiredateCol(p.db, schema, table)
	if err != nil {
		return err
	}
	if hasColumn {
		return nil
	}

	p.logger.Infof("Adding column 'expiredate' to Postgres state table '%s'", stateTableName)
	alterStmt := fmt.Sprintf(`ALTER TABLE %s ADD expiredate TIMESTAMP WITH TIME ZONE`, stateTableName)
	if _, err = p.db.Exec(alterStmt); err != nil {
		return fmt.Errorf("failed to add expiredate column to state table: %w", err)
	}
	return nil
}
// tableExists looks the table up in information_schema.tables. When it is
// found, the result is true together with the schema and table names as
// reported by the database; when it is not found, the result is false with
// empty names and no error. Without a schema in tableName the lookup matches
// on the table name alone.
func tableExists(db *sql.DB, tableName string) (exists bool, schema string, table string, err error) {
	table, schema, err = tableSchemaName(tableName)
	if err != nil {
		return false, "", "", err
	}

	var row *sql.Row
	if schema == "" {
		row = db.QueryRow(`
SELECT
table_name, table_schema
FROM
information_schema.tables
WHERE
table_name = $1`, table)
	} else {
		row = db.QueryRow(
			`SELECT
table_name, table_schema
FROM
information_schema.tables
WHERE
table_schema = $1
AND table_name = $2`, schema, table)
	}

	err = row.Scan(&table, &schema)
	switch {
	case err == nil:
		return true, schema, table, nil
	case errors.Is(err, sql.ErrNoRows):
		return false, "", "", nil
	default:
		return false, "", "", fmt.Errorf("failed to check if table %s exists: %w", tableName, err)
	}
}
// tableHasExpiredateCol reports whether information_schema.columns lists an
// "expiredate" column for the given schema and table.
func tableHasExpiredateCol(db *sql.DB, schema string, table string) (colExists bool, err error) {
	const probe = `SELECT EXISTS (
SELECT 1
FROM
information_schema.columns
WHERE
table_schema = $1
AND table_name = $2
AND column_name='expiredate'
)`

	if scanErr := db.QueryRow(probe, schema, table).Scan(&colExists); scanErr != nil {
		return false, fmt.Errorf("failed to check if table %s.%s has 'expiredate' column: %w", schema, table, scanErr)
	}
	return colExists, nil
}
// tableSchemaName splits a table name on ".". A name without a dot is
// returned as the table with an empty schema; a name with exactly one dot
// (e.g. `schema.table`) is returned as its two parts; a name with more than
// one dot is an error.
func tableSchemaName(tableName string) (table string, schema string, err error) {
	switch strings.Count(tableName, ".") {
	case 0:
		return tableName, "", nil
	case 1:
		before, after, _ := strings.Cut(tableName, ".")
		return after, before, nil
	default:
		return "", "", errors.New("invalid table name: must be in the format 'table' or 'schema.table'")
	}
}
// getSet extracts the state.SetRequest carried by a transactional operation.
// It fails when the operation holds a different request type or when the
// request has an empty key.
func getSet(req state.TransactionalStateOperation) (state.SetRequest, error) {
	setReq, isSet := req.Request.(state.SetRequest)
	switch {
	case !isSet:
		return setReq, errors.New("expecting set request")
	case setReq.Key == "":
		return setReq, errors.New("missing key in upsert operation")
	}
	return setReq, nil
}
// getDelete extracts the state.DeleteRequest carried by a transactional
// operation. It fails when the operation holds a different request type or
// when the request has an empty key.
func getDelete(req state.TransactionalStateOperation) (state.DeleteRequest, error) {
	delReq, ok := req.Request.(state.DeleteRequest)
	if !ok {
		return delReq, errors.New("expecting delete request")
	}

	if delReq.Key == "" {
		// The message names the delete operation; it previously said "upsert".
		return delReq, errors.New("missing key in delete operation")
	}

	return delReq, nil
}