components-contrib/state/sqlite/sqlite_dbaccess.go

570 lines
16 KiB
Go

/*
Copyright 2023 The Dapr Authors
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
package sqlite
import (
"context"
"database/sql"
"encoding/base64"
"encoding/json"
"errors"
"fmt"
"net/url"
"strconv"
"strings"
"time"
"github.com/google/uuid"
// Blank import for the underlying SQLite Driver.
_ "modernc.org/sqlite"
internalsql "github.com/dapr/components-contrib/internal/component/sql"
"github.com/dapr/components-contrib/state"
stateutils "github.com/dapr/components-contrib/state/utils"
"github.com/dapr/kit/logger"
)
// DBAccess is a private interface which enables unit testing of SQLite.
type DBAccess interface {
Init(ctx context.Context, metadata state.Metadata) error
Ping(ctx context.Context) error
Set(ctx context.Context, req *state.SetRequest) error
Get(ctx context.Context, req *state.GetRequest) (*state.GetResponse, error)
Delete(ctx context.Context, req *state.DeleteRequest) error
BulkGet(ctx context.Context, req []state.GetRequest) ([]state.BulkGetResponse, error)
ExecuteMulti(ctx context.Context, reqs []state.TransactionalStateOperation) error
Close() error
}
// Interface for both sql.DB and sql.Tx
type querier interface {
ExecContext(ctx context.Context, query string, args ...any) (sql.Result, error)
QueryContext(ctx context.Context, query string, args ...any) (*sql.Rows, error)
QueryRowContext(ctx context.Context, query string, args ...any) *sql.Row
}
// sqliteDBAccess implements DBAccess.
type sqliteDBAccess struct {
logger logger.Logger
metadata sqliteMetadataStruct
db *sql.DB
gc internalsql.GarbageCollector
}
// newSqliteDBAccess creates a new instance of sqliteDbAccess.
func newSqliteDBAccess(logger logger.Logger) *sqliteDBAccess {
return &sqliteDBAccess{
logger: logger,
}
}
// Init sets up SQLite Database connection and ensures that the state table
// exists.
func (a *sqliteDBAccess) Init(ctx context.Context, md state.Metadata) error {
err := a.metadata.InitWithMetadata(md)
if err != nil {
return err
}
connString, err := a.getConnectionString()
if err != nil {
// Already logged
return err
}
db, err := sql.Open("sqlite", connString)
if err != nil {
return fmt.Errorf("failed to create connection: %w", err)
}
a.db = db
err = a.Ping(ctx)
if err != nil {
return fmt.Errorf("failed to ping: %w", err)
}
// Performs migrations
migrate := &migrations{
Logger: a.logger,
Conn: a.db,
MetadataTableName: a.metadata.MetadataTableName,
StateTableName: a.metadata.TableName,
}
err = migrate.Perform(ctx)
if err != nil {
return fmt.Errorf("failed to perform migrations: %w", err)
}
gc, err := internalsql.ScheduleGarbageCollector(internalsql.GCOptions{
Logger: a.logger,
UpdateLastCleanupQuery: fmt.Sprintf(`INSERT INTO %s (key, value)
VALUES ('last-cleanup', CURRENT_TIMESTAMP)
ON CONFLICT (key)
DO UPDATE SET value = CURRENT_TIMESTAMP
WHERE (unixepoch(CURRENT_TIMESTAMP) - unixepoch(value)) * 1000 > ?;`,
a.metadata.MetadataTableName,
),
DeleteExpiredValuesQuery: fmt.Sprintf(`DELETE FROM %s
WHERE
expiration_time IS NOT NULL
AND expiration_time < CURRENT_TIMESTAMP`,
a.metadata.TableName,
),
CleanupInterval: a.metadata.CleanupInterval,
DBSql: a.db,
})
if err != nil {
return err
}
a.gc = gc
return nil
}
func (a *sqliteDBAccess) CleanupExpired() error {
return a.gc.CleanupExpired()
}
func (a *sqliteDBAccess) getConnectionString() (string, error) {
// Check if we're using the in-memory database
lc := strings.ToLower(a.metadata.ConnectionString)
isMemoryDB := strings.HasPrefix(lc, ":memory:") || strings.HasPrefix(lc, "file::memory:")
// Get the "query string" from the connection string if present
idx := strings.IndexRune(a.metadata.ConnectionString, '?')
var qs url.Values
if idx > 0 {
qs, _ = url.ParseQuery(a.metadata.ConnectionString[(idx + 1):])
}
if len(qs) == 0 {
qs = make(url.Values, 2)
}
// If the database is in-memory, we must ensure that cache=shared is set
if isMemoryDB {
qs["cache"] = []string{"shared"}
}
// Check if the database is read-only or immutable
isReadOnly := false
if len(qs["mode"]) > 0 {
// Keep the first value only
qs["mode"] = []string{
qs["mode"][0],
}
if qs["mode"][0] == "ro" {
isReadOnly = true
}
}
if len(qs["immutable"]) > 0 {
// Keep the first value only
qs["immutable"] = []string{
qs["immutable"][0],
}
if qs["immutable"][0] == "1" {
isReadOnly = true
}
}
// We do not want to override a _txlock if set, but we'll show a warning if it's not "immediate"
if len(qs["_txlock"]) > 0 {
// Keep the first value only
qs["_txlock"] = []string{
strings.ToLower(qs["_txlock"][0]),
}
if qs["_txlock"][0] != "immediate" {
a.logger.Warn("Database connection is being created with a _txlock different from the recommended value 'immediate'")
}
} else {
qs["_txlock"] = []string{"immediate"}
}
// Add pragma values
if len(qs["_pragma"]) == 0 {
qs["_pragma"] = make([]string, 0, 2)
} else {
for _, p := range qs["_pragma"] {
p = strings.ToLower(p)
if strings.HasPrefix(p, "busy_timeout") {
a.logger.Error("Cannot set `_pragma=busy_timeout` option in the connection string; please use the `busyTimeout` metadata property instead")
return "", errors.New("found forbidden option '_pragma=busy_timeout' in the connection string")
} else if strings.HasPrefix(p, "journal_mode") {
a.logger.Error("Cannot set `_pragma=journal_mode` option in the connection string; please use the `disableWAL` metadata property instead")
return "", errors.New("found forbidden option '_pragma=journal_mode' in the connection string")
}
}
}
if a.metadata.BusyTimeout > 0 {
qs["_pragma"] = append(qs["_pragma"], fmt.Sprintf("busy_timeout(%d)", a.metadata.BusyTimeout.Milliseconds()))
}
if isMemoryDB {
// For in-memory databases, set the journal to MEMORY, the only allowed option besides OFF (which would make transactions ineffective)
qs["_pragma"] = append(qs["_pragma"], "journal_mode(MEMORY)")
} else if a.metadata.DisableWAL || isReadOnly {
// Set the journaling mode to "DELETE" (the default) if WAL is disabled or if the database is read-only
qs["_pragma"] = append(qs["_pragma"], "journal_mode(DELETE)")
} else {
// Enable WAL
qs["_pragma"] = append(qs["_pragma"], "journal_mode(WAL)")
}
// Build the final connection string
connString := a.metadata.ConnectionString
if idx > 0 {
connString = connString[:idx]
}
connString += "?" + qs.Encode()
// If the connection string doesn't begin with "file:", add the prefix
if !strings.HasPrefix(lc, "file:") {
a.logger.Debug("prefix 'file:' added to the connection string")
connString = "file:" + connString
}
return connString, nil
}
func (a *sqliteDBAccess) Ping(parentCtx context.Context) error {
ctx, cancel := context.WithTimeout(parentCtx, a.metadata.timeout)
err := a.db.PingContext(ctx)
cancel()
return err
}
func (a *sqliteDBAccess) Get(parentCtx context.Context, req *state.GetRequest) (*state.GetResponse, error) {
if req.Key == "" {
return nil, errors.New("missing key in get operation")
}
// Concatenation is required for table name because sql.DB does not substitute parameters for table names
stmt := `SELECT key, value, is_binary, etag FROM ` + a.metadata.TableName + `
WHERE
key = ?
AND (expiration_time IS NULL OR expiration_time > CURRENT_TIMESTAMP)`
ctx, cancel := context.WithTimeout(parentCtx, a.metadata.timeout)
defer cancel()
row := a.db.QueryRowContext(ctx, stmt, req.Key)
_, value, etag, err := readRow(row)
if err != nil {
if errors.Is(err, sql.ErrNoRows) {
return &state.GetResponse{}, nil
}
return nil, err
}
return &state.GetResponse{
Data: value,
ETag: etag,
Metadata: req.Metadata,
}, nil
}
func (a *sqliteDBAccess) BulkGet(parentCtx context.Context, req []state.GetRequest) ([]state.BulkGetResponse, error) {
if len(req) == 0 {
return []state.BulkGetResponse{}, nil
}
// SQLite doesn't support passing an array for an IN clause, so we need to build a custom query
inClause := strings.Repeat("?,", len(req))
inClause = inClause[:(len(inClause) - 1)]
params := make([]any, len(req))
for i, r := range req {
params[i] = r.Key
}
// Concatenation is required for table name because sql.DB does not substitute parameters for table names
stmt := `SELECT key, value, is_binary, etag FROM ` + a.metadata.TableName + `
WHERE
key IN (` + inClause + `)
AND (expiration_time IS NULL OR expiration_time > CURRENT_TIMESTAMP)`
ctx, cancel := context.WithTimeout(parentCtx, a.metadata.timeout)
defer cancel()
rows, err := a.db.QueryContext(ctx, stmt, params...)
if err != nil {
return nil, err
}
var n int
res := make([]state.BulkGetResponse, len(req))
for ; rows.Next(); n++ {
r := state.BulkGetResponse{}
r.Key, r.Data, r.ETag, err = readRow(rows)
if err != nil {
r.Error = err.Error()
}
res[n] = r
}
return res[:n], nil
}
func readRow(row interface{ Scan(dest ...any) error }) (key string, value []byte, etagP *string, err error) {
var (
isBinary bool
etag string
)
err = row.Scan(&key, &value, &isBinary, &etag)
if err != nil {
return key, nil, nil, err
}
if isBinary {
var n int
data := make([]byte, len(value))
n, err = base64.StdEncoding.Decode(data, value)
if err != nil {
return key, nil, nil, fmt.Errorf("failed to decode binary data: %w", err)
}
return key, data[:n], &etag, nil
}
return key, value, &etag, nil
}
func (a *sqliteDBAccess) Set(ctx context.Context, req *state.SetRequest) error {
return a.doSet(ctx, a.db, req)
}
func (a *sqliteDBAccess) doSet(parentCtx context.Context, db querier, req *state.SetRequest) error {
err := state.CheckRequestOptions(req.Options)
if err != nil {
return err
}
if req.Key == "" {
return errors.New("missing key in set option")
}
// TTL
var ttlSeconds int
ttl, ttlerr := stateutils.ParseTTL(req.Metadata)
if ttlerr != nil {
return fmt.Errorf("error parsing TTL: %w", ttlerr)
}
if ttl != nil {
ttlSeconds = *ttl
}
// Encode the value
var requestValue string
byteArray, isBinary := req.Value.([]uint8)
if isBinary {
requestValue = base64.StdEncoding.EncodeToString(byteArray)
} else {
var bt []byte
bt, err = json.Marshal(req.Value)
if err != nil {
return err
}
requestValue = string(bt)
}
// New ETag
etagObj, err := uuid.NewRandom()
if err != nil {
return err
}
newEtag := etagObj.String()
// Also resets expiration time in case of an update
expiration := "NULL"
if ttlSeconds > 0 {
expiration = "DATETIME(CURRENT_TIMESTAMP, '+" + strconv.Itoa(ttlSeconds) + " seconds')"
}
// Only check for etag if FirstWrite specified (ref oracledatabaseaccess)
var (
res sql.Result
mustCommit bool
stmt string
)
// Sprintf is required for table name because sql.DB does not substitute parameters for table names.
// And the same is for DATETIME function's seconds parameter (which is from an integer anyways).
if req.ETag == nil || *req.ETag == "" {
// If the operation uses first-write concurrency, we need to handle the special case of a row that has expired but hasn't been garbage collected yet
// In this case, the row should be considered as if it were deleted
// With SQLite, the only way we can handle that is by performing a SELECT query first
if req.Options.Concurrency == state.FirstWrite {
// If we're not in a transaction already, start one as we need to ensure consistency
if db == a.db {
db, err = a.db.BeginTx(parentCtx, nil)
if err != nil {
return fmt.Errorf("failed to begin transaction: %w", err)
}
defer db.(*sql.Tx).Rollback()
mustCommit = true
}
// Check if there's already a row with the given key that has not expired yet
var count int
stmt = `SELECT COUNT(key)
FROM ` + a.metadata.TableName + `
WHERE key = ?
AND (expiration_time IS NULL OR expiration_time > CURRENT_TIMESTAMP)`
err = db.QueryRowContext(parentCtx, stmt, req.Key).Scan(&count)
if err != nil {
return fmt.Errorf("failed to check for existing row with first-write concurrency: %w", err)
}
// If the row exists, then we just return an etag error
// Otherwise, we can fall through and continue with an INSERT OR REPLACE statement
if count > 0 {
return state.NewETagError(state.ETagMismatch, nil)
}
}
stmt = "INSERT OR REPLACE INTO " + a.metadata.TableName + `
(key, value, is_binary, etag, update_time, expiration_time)
VALUES(?, ?, ?, ?, CURRENT_TIMESTAMP, ` + expiration + `)`
ctx, cancel := context.WithTimeout(context.Background(), a.metadata.timeout)
defer cancel()
res, err = db.ExecContext(ctx, stmt, req.Key, requestValue, isBinary, newEtag, req.Key)
} else {
stmt = `UPDATE ` + a.metadata.TableName + ` SET
value = ?,
etag = ?,
is_binary = ?,
update_time = CURRENT_TIMESTAMP,
expiration_time = ` + expiration + `
WHERE
key = ?
AND etag = ?
AND (expiration_time IS NULL OR expiration_time > CURRENT_TIMESTAMP)`
ctx, cancel := context.WithTimeout(context.Background(), a.metadata.timeout)
defer cancel()
res, err = db.ExecContext(ctx, stmt, requestValue, newEtag, isBinary, req.Key, *req.ETag)
}
if err != nil {
return err
}
// Count the number of affected rows
rows, err := res.RowsAffected()
if err != nil {
return err
}
if rows == 0 {
if req.ETag != nil && *req.ETag != "" {
return state.NewETagError(state.ETagMismatch, nil)
}
return errors.New("no item was updated")
}
// Commit the transaction if needed
if mustCommit {
err = db.(*sql.Tx).Commit()
if err != nil {
return fmt.Errorf("failed to commit transaction: %w", err)
}
}
return nil
}
func (a *sqliteDBAccess) Delete(ctx context.Context, req *state.DeleteRequest) error {
return a.doDelete(ctx, a.db, req)
}
func (a *sqliteDBAccess) ExecuteMulti(parentCtx context.Context, reqs []state.TransactionalStateOperation) error {
tx, err := a.db.BeginTx(parentCtx, nil)
if err != nil {
return err
}
defer tx.Rollback()
for _, o := range reqs {
switch req := o.(type) {
case state.SetRequest:
err = a.doSet(parentCtx, tx, &req)
if err != nil {
return err
}
case state.DeleteRequest:
err = a.doDelete(parentCtx, tx, &req)
if err != nil {
return err
}
default:
// Do nothing
}
}
return tx.Commit()
}
// Close implements io.Close.
func (a *sqliteDBAccess) Close() error {
if a.db != nil {
_ = a.db.Close()
}
if a.gc != nil {
return a.gc.Close()
}
return nil
}
func (a *sqliteDBAccess) doDelete(parentCtx context.Context, db querier, req *state.DeleteRequest) error {
err := state.CheckRequestOptions(req.Options)
if err != nil {
return err
}
if req.Key == "" {
return fmt.Errorf("missing key in delete operation")
}
ctx, cancel := context.WithTimeout(parentCtx, a.metadata.timeout)
defer cancel()
var result sql.Result
if req.ETag == nil || *req.ETag == "" {
// Concatenation is required for table name because sql.DB does not substitute parameters for table names.
result, err = db.ExecContext(ctx, "DELETE FROM "+a.metadata.TableName+" WHERE key = ?",
req.Key)
} else {
// Concatenation is required for table name because sql.DB does not substitute parameters for table names.
result, err = db.ExecContext(ctx, "DELETE FROM "+a.metadata.TableName+" WHERE key = ? AND etag = ?",
req.Key, *req.ETag)
}
if err != nil {
return err
}
rows, err := result.RowsAffected()
if err != nil {
return err
}
if rows == 0 && req.ETag != nil && *req.ETag != "" {
return state.NewETagError(state.ETagMismatch, nil)
}
return nil
}
// GetConnection returns the database connection object.
// This is primarily used for tests.
func (a *sqliteDBAccess) GetConnection() *sql.DB {
return a.db
}
// GetCleanupInterval returns the cleanupInterval property.
// This is primarily used for tests.
func (a *sqliteDBAccess) GetCleanupInterval() time.Duration {
return a.metadata.CleanupInterval
}