// client-go/integration_tests/lock_test.go
// Copyright 2021 TiKV Authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// NOTE: The code in this file is based on code from the
// TiDB project, licensed under the Apache License v2.0
//
// https://github.com/pingcap/tidb/tree/cc5e161ac06827589c4966674597c137cc9e809c/store/tikv/tests/lock_test.go
//
// Copyright 2016 PingCAP, Inc.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
package tikv_test

import (
	"bytes"
	"context"
	"encoding/json"
	stderrs "errors"
	"fmt"
	"io"
	"math"
	"net/http"
	"sync"
	"sync/atomic"
	"testing"
	"time"

	"github.com/pingcap/failpoint"
	deadlockpb "github.com/pingcap/kvproto/pkg/deadlock"
	"github.com/pingcap/kvproto/pkg/kvrpcpb"
	"github.com/pingcap/kvproto/pkg/metapb"
	"github.com/pkg/errors"
	"github.com/stretchr/testify/assert"
	"github.com/stretchr/testify/suite"
	"github.com/tikv/client-go/v2/config"
	"github.com/tikv/client-go/v2/config/retry"
	tikverr "github.com/tikv/client-go/v2/error"
	"github.com/tikv/client-go/v2/kv"
	"github.com/tikv/client-go/v2/oracle"
	"github.com/tikv/client-go/v2/tikv"
	"github.com/tikv/client-go/v2/tikvrpc"
	"github.com/tikv/client-go/v2/txnkv"
	"github.com/tikv/client-go/v2/txnkv/transaction"
	"github.com/tikv/client-go/v2/txnkv/txnlock"
	"github.com/tikv/client-go/v2/util"
)
var getMaxBackoff = tikv.ConfigProbe{}.GetGetMaxBackoff()
func TestLock(t *testing.T) {
suite.Run(t, new(testLockSuite))
}
func TestLockWithTiKV(t *testing.T) {
suite.Run(t, new(testLockWithTiKVSuite))
}
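// testLockSuite runs the lock-resolving tests against an in-memory unistore.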
type testLockSuite struct {
suite.Suite
store tikv.StoreProbe
}
func (s *testLockSuite) SetupTest() {
s.store = tikv.StoreProbe{KVStore: NewTestUniStore(s.T())}
}
func (s *testLockSuite) TearDownTest() {
s.store.Close()
}
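// lockKey writes key and primaryKey (or deletes them when the corresponding
// value is empty) in one transaction and prewrites both mutations with
// primaryKey as the primary and the given TTL. When commitPrimary is set, only
// the primary key is committed, leaving the secondary lock behind. It returns
// the transaction's startTS and commitTS.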
func (s *testLockSuite) lockKey(key, value, primaryKey, primaryValue []byte, ttl uint64, commitPrimary bool, asyncCommit bool) (uint64, uint64) {
txn, err := s.store.Begin()
s.Nil(err)
if len(value) > 0 {
err = txn.Set(key, value)
} else {
err = txn.Delete(key)
}
s.Nil(err)
if len(primaryValue) > 0 {
err = txn.Set(primaryKey, primaryValue)
} else {
err = txn.Delete(primaryKey)
}
s.Nil(err)
tpc, err := txn.NewCommitter(0)
s.Nil(err)
tpc.SetPrimaryKey(primaryKey)
tpc.SetLockTTL(ttl)
if asyncCommit {
tpc.SetUseAsyncCommit()
}
ctx := context.Background()
err = tpc.PrewriteAllMutations(ctx)
s.Nil(err)
if commitPrimary {
commitTS, err := s.store.GetOracle().GetTimestamp(ctx, &oracle.Option{TxnScope: oracle.GlobalTxnScope})
s.Nil(err)
tpc.SetCommitTS(commitTS)
err = tpc.CommitMutations(ctx)
s.Nil(err)
}
return txn.StartTS(), tpc.GetCommitTS()
}
func (s *testLockSuite) putAlphabets() {
for ch := byte('a'); ch <= byte('z'); ch++ {
s.putKV([]byte{ch}, []byte{ch})
}
}
func (s *testLockSuite) putKV(key, value []byte) (uint64, uint64) {
txn, err := s.store.Begin()
s.Nil(err)
err = txn.Set(key, value)
s.Nil(err)
err = txn.Commit(context.Background())
s.Nil(err)
return txn.StartTS(), txn.GetCommitTS()
}
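// prepareAlphabetLocks leaves a mix of resolvable locks behind: locks whose
// primary is already committed, locks whose primary is still pending, and a
// lock covering a deletion.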
func (s *testLockSuite) prepareAlphabetLocks() {
s.putKV([]byte("c"), []byte("cc"))
s.lockKey([]byte("c"), []byte("c"), []byte("z1"), []byte("z1"), 3000, true, false)
s.lockKey([]byte("d"), []byte("dd"), []byte("z2"), []byte("z2"), 3000, false, false)
s.lockKey([]byte("foo"), []byte("foo"), []byte("z3"), []byte("z3"), 3000, false, false)
s.putKV([]byte("bar"), []byte("bar"))
s.lockKey([]byte("bar"), nil, []byte("z4"), []byte("z4"), 3000, true, false)
}
func (s *testLockSuite) TestScanLockResolveWithGet() {
s.putAlphabets()
s.prepareAlphabetLocks()
txn, err := s.store.Begin()
s.Nil(err)
for ch := byte('a'); ch <= byte('z'); ch++ {
v, err := txn.Get(context.TODO(), []byte{ch})
s.Nil(err)
s.Equal(v, []byte{ch})
}
}
func (s *testLockSuite) TestScanLockResolveWithSeek() {
s.putAlphabets()
s.prepareAlphabetLocks()
txn, err := s.store.Begin()
s.Nil(err)
iter, err := txn.Iter([]byte("a"), nil)
s.Nil(err)
for ch := byte('a'); ch <= byte('z'); ch++ {
s.True(iter.Valid())
s.Equal(iter.Key(), []byte{ch})
s.Equal(iter.Value(), []byte{ch})
s.Nil(iter.Next())
}
}
func (s *testLockSuite) TestScanLockResolveWithSeekKeyOnly() {
s.putAlphabets()
s.prepareAlphabetLocks()
txn, err := s.store.Begin()
s.Nil(err)
txn.GetSnapshot().SetKeyOnly(true)
iter, err := txn.Iter([]byte("a"), nil)
s.Nil(err)
for ch := byte('a'); ch <= byte('z'); ch++ {
s.True(iter.Valid())
s.Equal(iter.Key(), []byte{ch})
s.Nil(iter.Next())
}
}
func (s *testLockSuite) TestScanLockResolveWithBatchGet() {
s.putAlphabets()
s.prepareAlphabetLocks()
var keys [][]byte
for ch := byte('a'); ch <= byte('z'); ch++ {
keys = append(keys, []byte{ch})
}
txn, err := s.store.Begin()
s.Nil(err)
m, err := toTiDBTxn(&txn).BatchGet(context.Background(), toTiDBKeys(keys))
s.Nil(err)
s.Equal(len(m), int('z'-'a'+1))
for ch := byte('a'); ch <= byte('z'); ch++ {
k := []byte{ch}
s.Equal(m[string(k)], k)
}
}
func (s *testLockSuite) TestCleanLock() {
for ch := byte('a'); ch <= byte('z'); ch++ {
k := []byte{ch}
s.lockKey(k, k, k, k, 3000, false, false)
}
txn, err := s.store.Begin()
s.Nil(err)
for ch := byte('a'); ch <= byte('z'); ch++ {
err = txn.Set([]byte{ch}, []byte{ch + 1})
s.Nil(err)
}
err = txn.Commit(context.Background())
s.Nil(err)
}
func (s *testLockSuite) TestGetTxnStatus() {
startTS, commitTS := s.putKV([]byte("a"), []byte("a"))
status, err := s.store.GetLockResolver().GetTxnStatus(startTS, startTS, []byte("a"))
s.Nil(err)
s.True(status.IsCommitted())
s.Equal(status.CommitTS(), commitTS)
startTS, commitTS = s.lockKey([]byte("a"), []byte("a"), []byte("a"), []byte("a"), 3000, true, false)
status, err = s.store.GetLockResolver().GetTxnStatus(startTS, startTS, []byte("a"))
s.Nil(err)
s.True(status.IsCommitted())
s.Equal(status.CommitTS(), commitTS)
startTS, _ = s.lockKey([]byte("a"), []byte("a"), []byte("a"), []byte("a"), 3000, false, false)
status, err = s.store.GetLockResolver().GetTxnStatus(startTS, startTS, []byte("a"))
s.Nil(err)
s.False(status.IsCommitted())
s.Greater(status.TTL(), uint64(0), fmt.Sprintf("action:%s", status.Action()))
}
func (s *testLockSuite) TestCheckTxnStatusTTL() {
txn, err := s.store.Begin()
s.Nil(err)
txn.Set([]byte("key"), []byte("value"))
s.prewriteTxnWithTTL(txn, 1000)
bo := tikv.NewBackofferWithVars(context.Background(), int(transaction.PrewriteMaxBackoff.Load()), nil)
lr := s.store.NewLockResolver()
callerStartTS, err := s.store.GetOracle().GetTimestamp(bo.GetCtx(), &oracle.Option{TxnScope: oracle.GlobalTxnScope})
s.Nil(err)
// Check the lock TTL of a transaction.
status, err := lr.LockResolver.GetTxnStatus(txn.StartTS(), callerStartTS, []byte("key"))
s.Nil(err)
s.False(status.IsCommitted())
s.Greater(status.TTL(), uint64(0))
s.Equal(status.CommitTS(), uint64(0))
// Rollback the txn.
lock := s.mustGetLock([]byte("key"))
err = s.store.NewLockResolver().ForceResolveLock(context.Background(), lock)
s.Nil(err)
	// Check that its status is rolled back.
status, err = lr.LockResolver.GetTxnStatus(txn.StartTS(), callerStartTS, []byte("key"))
s.Nil(err)
s.Equal(status.TTL(), uint64(0))
s.Equal(status.CommitTS(), uint64(0))
s.Equal(status.Action(), kvrpcpb.Action_NoAction)
// Check a committed txn.
startTS, commitTS := s.putKV([]byte("a"), []byte("a"))
status, err = lr.LockResolver.GetTxnStatus(startTS, callerStartTS, []byte("a"))
s.Nil(err)
s.Equal(status.TTL(), uint64(0))
s.Equal(status.CommitTS(), commitTS)
}
func (s *testLockSuite) TestTxnHeartBeat() {
txn, err := s.store.Begin()
s.Nil(err)
txn.Set([]byte("key"), []byte("value"))
s.prewriteTxn(txn)
newTTL, err := s.store.SendTxnHeartbeat(context.Background(), []byte("key"), txn.StartTS(), 6666)
s.Nil(err)
s.Equal(newTTL, uint64(6666))
newTTL, err = s.store.SendTxnHeartbeat(context.Background(), []byte("key"), txn.StartTS(), 5555)
s.Nil(err)
s.Equal(newTTL, uint64(6666))
lock := s.mustGetLock([]byte("key"))
err = s.store.NewLockResolver().ForceResolveLock(context.Background(), lock)
s.Nil(err)
newTTL, err = s.store.SendTxnHeartbeat(context.Background(), []byte("key"), txn.StartTS(), 6666)
s.NotNil(err)
s.Equal(newTTL, uint64(0))
}
func (s *testLockSuite) TestCheckTxnStatus() {
txn, err := s.store.Begin()
s.Nil(err)
txn.Set([]byte("key"), []byte("value"))
txn.Set([]byte("second"), []byte("xxx"))
s.prewriteTxnWithTTL(txn, 1000)
o := s.store.GetOracle()
currentTS, err := o.GetTimestamp(context.Background(), &oracle.Option{TxnScope: oracle.GlobalTxnScope})
s.Nil(err)
s.Greater(currentTS, txn.StartTS())
bo := tikv.NewBackofferWithVars(context.Background(), int(transaction.PrewriteMaxBackoff.Load()), nil)
resolver := s.store.NewLockResolver()
// Call getTxnStatus to check the lock status.
status, err := resolver.GetTxnStatus(bo, txn.StartTS(), []byte("key"), currentTS, currentTS, true, false, nil)
s.Nil(err)
s.False(status.IsCommitted())
s.Greater(status.TTL(), uint64(0))
s.Equal(status.CommitTS(), uint64(0))
s.Equal(status.Action(), kvrpcpb.Action_MinCommitTSPushed)
// Test the ResolveLocks API
lock := s.mustGetLock([]byte("second"))
timeBeforeExpire, err := resolver.ResolveLocks(bo, currentTS, []*txnkv.Lock{lock})
s.Nil(err)
s.True(timeBeforeExpire > int64(0))
// Force rollback the lock using lock.TTL = 0.
lock.TTL = uint64(0)
timeBeforeExpire, err = resolver.ResolveLocks(bo, currentTS, []*txnkv.Lock{lock})
s.Nil(err)
s.Equal(timeBeforeExpire, int64(0))
// Then call getTxnStatus again and check the lock status.
currentTS, err = o.GetTimestamp(context.Background(), &oracle.Option{TxnScope: oracle.GlobalTxnScope})
s.Nil(err)
status, err = s.store.NewLockResolver().GetTxnStatus(bo, txn.StartTS(), []byte("key"), currentTS, 0, true, false, nil)
s.Nil(err)
s.Equal(status.TTL(), uint64(0))
s.Equal(status.CommitTS(), uint64(0))
s.Equal(status.Action(), kvrpcpb.Action_NoAction)
// Call getTxnStatus on a committed transaction.
startTS, commitTS := s.putKV([]byte("a"), []byte("a"))
status, err = s.store.NewLockResolver().GetTxnStatus(bo, startTS, []byte("a"), currentTS, currentTS, true, false, nil)
s.Nil(err)
s.Equal(status.TTL(), uint64(0))
s.Equal(status.CommitTS(), commitTS)
}
func (s *testLockSuite) TestCheckTxnStatusNoWait() {
txn, err := s.store.Begin()
s.Nil(err)
txn.Set([]byte("key"), []byte("value"))
txn.Set([]byte("second"), []byte("xxx"))
committer, err := txn.NewCommitter(0)
s.Nil(err)
// Increase lock TTL to make CI more stable.
committer.SetLockTTLByTimeAndSize(txn.GetStartTime(), 200*1024*1024)
	// Only prewrite the secondary key to simulate a concurrent prewrite case:
	// prewriting the secondary keys has succeeded while the prewrite of the primary key is still pending.
err = committer.PrewriteMutations(context.Background(), committer.MutationsOfKeys([][]byte{[]byte("second")}))
s.Nil(err)
o := s.store.GetOracle()
currentTS, err := o.GetTimestamp(context.Background(), &oracle.Option{TxnScope: oracle.GlobalTxnScope})
s.Nil(err)
bo := tikv.NewBackofferWithVars(context.Background(), int(transaction.PrewriteMaxBackoff.Load()), nil)
resolver := s.store.NewLockResolver()
// Call getTxnStatus for the TxnNotFound case.
_, err = resolver.GetTxnStatus(bo, txn.StartTS(), []byte("key"), currentTS, currentTS, false, false, nil)
s.NotNil(err)
s.True(resolver.IsErrorNotFound(err))
errCh := make(chan error)
go func() {
errCh <- committer.PrewriteMutations(context.Background(), committer.MutationsOfKeys([][]byte{[]byte("key")}))
}()
lock := &txnkv.Lock{
Key: []byte("second"),
Primary: []byte("key"),
TxnID: txn.StartTS(),
TTL: 100000,
}
// Call getTxnStatusFromLock to cover the retry logic.
status, err := resolver.GetTxnStatusFromLock(bo, lock, currentTS, false)
s.Nil(err)
s.Greater(status.TTL(), uint64(0))
s.Nil(<-errCh)
s.Nil(committer.CleanupMutations(context.Background()))
// Call getTxnStatusFromLock to cover TxnNotFound and retry timeout.
startTS, err := o.GetTimestamp(context.Background(), &oracle.Option{TxnScope: oracle.GlobalTxnScope})
s.Nil(err)
lock = &txnkv.Lock{
Key: []byte("second"),
Primary: []byte("key_not_exist"),
TxnID: startTS,
TTL: 1000,
}
status, err = resolver.GetTxnStatusFromLock(bo, lock, currentTS, false)
s.Nil(err)
s.Equal(status.TTL(), uint64(0))
s.Equal(status.CommitTS(), uint64(0))
s.Equal(status.Action(), kvrpcpb.Action_LockNotExistRollback)
}
func (s *testLockSuite) prewriteTxn(txn transaction.TxnProbe) {
s.prewriteTxnWithTTL(txn, 0)
}
func (s *testLockSuite) prewriteTxnWithTTL(txn transaction.TxnProbe, ttl uint64) {
committer, err := txn.NewCommitter(0)
s.Nil(err)
if ttl > 0 {
elapsed := time.Since(txn.GetStartTime()) / time.Millisecond
committer.SetLockTTL(uint64(elapsed) + ttl)
}
err = committer.PrewriteAllMutations(context.Background())
s.Nil(err)
}
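// mustGetLock issues a raw kvrpcpb.GetRequest for the key and extracts the
// lock from the returned key error, failing the test if the key is not locked.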
func (s *testLockSuite) mustGetLock(key []byte) *txnkv.Lock {
ver, err := s.store.CurrentTimestamp(oracle.GlobalTxnScope)
s.Nil(err)
bo := tikv.NewBackofferWithVars(context.Background(), getMaxBackoff, nil)
req := tikvrpc.NewRequest(tikvrpc.CmdGet, &kvrpcpb.GetRequest{
Key: key,
Version: ver,
})
loc, err := s.store.GetRegionCache().LocateKey(bo, key)
s.Nil(err)
resp, err := s.store.SendReq(bo, req, loc.Region, tikv.ReadTimeoutShort)
s.Nil(err)
s.NotNil(resp.Resp)
keyErr := resp.Resp.(*kvrpcpb.GetResponse).GetError()
s.NotNil(keyErr)
lock, err := txnlock.ExtractLockFromKeyErr(keyErr)
s.Nil(err)
return lock
}
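// ttlEquals asserts that two TTL values differ by no more than 50ms, leaving
// some slack for scheduling delays between measuring elapsed time and prewriting.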
func (s *testLockSuite) ttlEquals(x, y uint64) {
if x < y {
x, y = y, x
}
s.LessOrEqual(x-y, uint64(50))
}
func (s *testLockSuite) TestLockTTL() {
managedLockTTL := atomic.LoadUint64(&transaction.ManagedLockTTL)
atomic.StoreUint64(&transaction.ManagedLockTTL, 20000) // set to 20s
defer atomic.StoreUint64(&transaction.ManagedLockTTL, managedLockTTL) // restore value
defaultLockTTL := tikv.ConfigProbe{}.GetDefaultLockTTL()
ttlFactor := tikv.ConfigProbe{}.GetTTLFactor()
txn, err := s.store.Begin()
s.Nil(err)
txn.Set([]byte("key"), []byte("value"))
time.Sleep(time.Millisecond)
s.prewriteTxnWithTTL(txn, 3100)
l := s.mustGetLock([]byte("key"))
s.True(l.TTL >= defaultLockTTL)
// Huge txn has a greater TTL.
txn, err = s.store.Begin()
start := time.Now()
s.Nil(err)
txn.Set([]byte("key"), []byte("value"))
for i := 0; i < 2048; i++ {
k, v := randKV(1024, 1024)
txn.Set([]byte(k), []byte(v))
}
elapsed := time.Since(start) / time.Millisecond
s.prewriteTxn(txn)
l = s.mustGetLock([]byte("key"))
s.ttlEquals(l.TTL, uint64(ttlFactor*2)+uint64(elapsed))
// Txn with long read time.
start = time.Now()
txn, err = s.store.Begin()
s.Nil(err)
time.Sleep(time.Millisecond * 50)
txn.Set([]byte("key"), []byte("value"))
elapsed = time.Since(start) / time.Millisecond
s.prewriteTxn(txn)
l = s.mustGetLock([]byte("key"))
s.ttlEquals(l.TTL, defaultLockTTL+uint64(elapsed))
}
func (s *testLockSuite) TestBatchResolveLocks() {
// The first transaction is a normal transaction with a long TTL
txn, err := s.store.Begin()
s.Nil(err)
txn.Set([]byte("k1"), []byte("v1"))
txn.Set([]byte("k2"), []byte("v2"))
s.prewriteTxnWithTTL(txn, 20000)
// The second transaction is an async commit transaction
txn, err = s.store.Begin()
s.Nil(err)
txn.Set([]byte("k3"), []byte("v3"))
txn.Set([]byte("k4"), []byte("v4"))
committer, err := txn.NewCommitter(0)
s.Nil(err)
committer.SetUseAsyncCommit()
committer.SetLockTTL(20000)
err = committer.PrewriteAllMutations(context.Background())
s.Nil(err)
var locks []*txnkv.Lock
for _, key := range []string{"k1", "k2", "k3", "k4"} {
l := s.mustGetLock([]byte(key))
locks = append(locks, l)
}
	// The locks may not have expired yet.
	msBeforeLockExpired := s.store.GetOracle().UntilExpired(locks[0].TxnID, locks[0].TTL, &oracle.Option{TxnScope: oracle.GlobalTxnScope})
s.Greater(msBeforeLockExpired, int64(0))
msBeforeLockExpired = s.store.GetOracle().UntilExpired(locks[3].TxnID, locks[3].TTL, &oracle.Option{TxnScope: oracle.GlobalTxnScope})
s.Greater(msBeforeLockExpired, int64(0))
lr := s.store.NewLockResolver()
bo := tikv.NewGcResolveLockMaxBackoffer(context.Background())
loc, err := s.store.GetRegionCache().LocateKey(bo, locks[0].Primary)
s.Nil(err)
	// Check that BatchResolveLocks resolves the locks even if their TTLs have not expired.
success, err := lr.BatchResolveLocks(bo, locks, loc.Region)
s.True(success)
s.Nil(err)
txn, err = s.store.Begin()
s.Nil(err)
// transaction 1 is rolled back
_, err = txn.Get(context.Background(), []byte("k1"))
s.Equal(err, tikverr.ErrNotExist)
_, err = txn.Get(context.Background(), []byte("k2"))
s.Equal(err, tikverr.ErrNotExist)
// transaction 2 is committed
v, err := txn.Get(context.Background(), []byte("k3"))
s.Nil(err)
s.True(bytes.Equal(v, []byte("v3")))
v, err = txn.Get(context.Background(), []byte("k4"))
s.Nil(err)
s.True(bytes.Equal(v, []byte("v4")))
}
func (s *testLockSuite) TestNewLockZeroTTL() {
l := txnlock.NewLock(&kvrpcpb.LockInfo{})
s.Equal(l.TTL, uint64(0))
}
func init() {
// Speed up tests.
tikv.ConfigProbe{}.SetOracleUpdateInterval(2)
}
func (s *testLockSuite) TestZeroMinCommitTS() {
txn, err := s.store.Begin()
s.Nil(err)
txn.Set([]byte("key"), []byte("value"))
bo := tikv.NewBackofferWithVars(context.Background(), int(transaction.PrewriteMaxBackoff.Load()), nil)
mockValue := fmt.Sprintf(`return(%d)`, txn.StartTS())
s.Nil(failpoint.Enable("tikvclient/mockZeroCommitTS", mockValue))
s.prewriteTxnWithTTL(txn, 1000)
s.Nil(failpoint.Disable("tikvclient/mockZeroCommitTS"))
lock := s.mustGetLock([]byte("key"))
expire, pushed, _, err := s.store.NewLockResolver().ResolveLocksForRead(bo, 0, []*txnkv.Lock{lock}, true)
s.Nil(err)
s.Len(pushed, 0)
s.Greater(expire, int64(0))
expire, pushed, _, err = s.store.NewLockResolver().ResolveLocksForRead(bo, math.MaxUint64, []*txnkv.Lock{lock}, true)
s.Nil(err)
s.Len(pushed, 1)
s.Equal(expire, int64(0))
// Clean up this test.
lock.TTL = uint64(0)
expire, err = s.store.NewLockResolver().ResolveLocks(bo, 0, []*txnkv.Lock{lock})
s.Nil(err)
s.Equal(expire, int64(0))
}
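// prepareTxnFallenBackFromAsyncCommit prewrites the first key of a two-key
// transaction in async-commit mode, then sets an invalid maxCommitTS so that
// prewriting the second key hits MaxCommitTsTooLarge and the transaction falls
// back to normal 2PC, leaving the two prewritten locks in different modes.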
func (s *testLockSuite) prepareTxnFallenBackFromAsyncCommit() {
txn, err := s.store.Begin()
s.Nil(err)
err = txn.Set([]byte("fb1"), []byte("1"))
s.Nil(err)
err = txn.Set([]byte("fb2"), []byte("2"))
s.Nil(err)
committer, err := txn.NewCommitter(1)
s.Nil(err)
s.Equal(committer.GetMutations().Len(), 2)
committer.SetLockTTL(0)
committer.SetUseAsyncCommit()
committer.SetCommitTS(committer.GetStartTS() + (100 << 18)) // 100ms
err = committer.PrewriteMutations(context.Background(), committer.GetMutations().Slice(0, 1))
s.Nil(err)
s.True(committer.IsAsyncCommit())
// Set an invalid maxCommitTS to produce MaxCommitTsTooLarge
committer.SetMaxCommitTS(committer.GetStartTS() - 1)
err = committer.PrewriteMutations(context.Background(), committer.GetMutations().Slice(1, 2))
s.Nil(err)
s.False(committer.IsAsyncCommit()) // Fallback due to MaxCommitTsTooLarge
}
func (s *testLockSuite) TestCheckLocksFallenBackFromAsyncCommit() {
s.prepareTxnFallenBackFromAsyncCommit()
lock := s.mustGetLock([]byte("fb1"))
s.True(lock.UseAsyncCommit)
bo := tikv.NewBackoffer(context.Background(), getMaxBackoff)
lr := s.store.NewLockResolver()
status, err := lr.GetTxnStatusFromLock(bo, lock, 0, false)
s.Nil(err)
s.Equal(txnlock.LockProbe{}.GetPrimaryKeyFromTxnStatus(status), []byte("fb1"))
err = lr.CheckAllSecondaries(bo, lock, &status)
s.True(lr.IsNonAsyncCommitLock(err))
status, err = lr.GetTxnStatusFromLock(bo, lock, 0, true)
s.Nil(err)
s.Equal(status.Action(), kvrpcpb.Action_TTLExpireRollback)
s.Equal(status.TTL(), uint64(0))
}
func (s *testLockSuite) TestResolveTxnFallenBackFromAsyncCommit() {
s.prepareTxnFallenBackFromAsyncCommit()
lock := s.mustGetLock([]byte("fb1"))
s.True(lock.UseAsyncCommit)
bo := tikv.NewBackoffer(context.Background(), getMaxBackoff)
expire, err := s.store.NewLockResolver().ResolveLocks(bo, 0, []*txnkv.Lock{lock})
s.Nil(err)
s.Equal(expire, int64(0))
t3, err := s.store.Begin()
s.Nil(err)
_, err = t3.Get(context.Background(), []byte("fb1"))
s.True(tikverr.IsErrNotFound(err))
_, err = t3.Get(context.Background(), []byte("fb2"))
s.True(tikverr.IsErrNotFound(err))
}
func (s *testLockSuite) TestBatchResolveTxnFallenBackFromAsyncCommit() {
s.prepareTxnFallenBackFromAsyncCommit()
lock := s.mustGetLock([]byte("fb1"))
s.True(lock.UseAsyncCommit)
bo := tikv.NewBackoffer(context.Background(), getMaxBackoff)
loc, err := s.store.GetRegionCache().LocateKey(bo, []byte("fb1"))
s.Nil(err)
ok, err := s.store.NewLockResolver().BatchResolveLocks(bo, []*txnkv.Lock{lock}, loc.Region)
s.Nil(err)
s.True(ok)
t3, err := s.store.Begin()
s.Nil(err)
_, err = t3.Get(context.Background(), []byte("fb1"))
s.True(tikverr.IsErrNotFound(err))
_, err = t3.Get(context.Background(), []byte("fb2"))
s.True(tikverr.IsErrNotFound(err))
}
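// TestDeadlockReportWaitChain constructs deadlock cycles between pessimistic
// transactions and verifies the wait chain carried by the ErrDeadlock error,
// entry by entry.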
func (s *testLockSuite) TestDeadlockReportWaitChain() {
// Utilities to make the test logic clear and simple.
type txnWrapper struct {
transaction.TxnProbe
wg sync.WaitGroup
}
makeLockCtx := func(txn *txnWrapper, resourceGroupTag string) *kv.LockCtx {
lockctx := kv.NewLockCtx(txn.StartTS(), 1000, time.Now())
lockctx.ResourceGroupTag = []byte(resourceGroupTag)
return lockctx
}
	// Prepares several transactions, each of which locks one key.
prepareTxns := func(num int) []*txnWrapper {
res := make([]*txnWrapper, 0, num)
for i := 0; i < num; i++ {
txnProbe, err := s.store.Begin()
s.Nil(err)
txn := &txnWrapper{TxnProbe: txnProbe}
txn.SetPessimistic(true)
tag := fmt.Sprintf("tag-init%v", i)
key := []byte{'k', byte(i)}
err = txn.LockKeys(context.Background(), makeLockCtx(txn, tag), key)
s.Nil(err)
res = append(res, txn)
}
return res
}
	// Lets the i-th transaction lock the key that has been locked by the j-th transaction.
tryLock := func(txns []*txnWrapper, i int, j int) error {
s.T().Logf("txn %v try locking %v", i, j)
txn := txns[i]
tag := fmt.Sprintf("tag-%v-%v", i, j)
key := []byte{'k', byte(j)}
return txn.LockKeys(context.Background(), makeLockCtx(txn, tag), key)
}
	// Makes the i-th transaction wait for the j-th transaction in a background
	// goroutine, asserting that it eventually fails with WriteConflict.
makeWaitFor := func(txns []*txnWrapper, i int, j int) {
txns[i].wg.Add(1)
go func() {
defer txns[i].wg.Done()
err := tryLock(txns, i, j)
// After the lock being waited for is released, the transaction returns a WriteConflict error
// unconditionally, which is by design.
s.NotNil(err)
s.T().Logf("txn %v wait for %v finished, err: %s", i, j, err.Error())
_, ok := errors.Cause(err).(*tikverr.ErrWriteConflict)
s.True(ok)
}()
}
waitAndRollback := func(txns []*txnWrapper, i int) {
// It's expected that each transaction should be rolled back after its blocker, so that `Rollback` will not
// run when there's concurrent `LockKeys` running.
// If it's blocked on the `Wait` forever, it means the transaction's blocker is not rolled back.
s.T().Logf("rollback txn %v", i)
txns[i].wg.Wait()
err := txns[i].Rollback()
s.Nil(err)
}
// Check the given WaitForEntry is caused by txn[i] waiting for txn[j].
checkWaitChainEntry := func(txns []*txnWrapper, entry *deadlockpb.WaitForEntry, i, j int) {
s.Equal(entry.Txn, txns[i].StartTS())
s.Equal(entry.WaitForTxn, txns[j].StartTS())
s.Equal(entry.Key, []byte{'k', byte(j)})
s.Equal(string(entry.ResourceGroupTag), fmt.Sprintf("tag-%v-%v", i, j))
}
s.T().Log("test case 1: 1->0->1")
txns := prepareTxns(2)
makeWaitFor(txns, 0, 1)
// Sleep for a while to make sure it has been blocked.
time.Sleep(time.Millisecond * 100)
	// txns[1] tries locking txns[0]'s key and encounters a deadlock error.
err := tryLock(txns, 1, 0)
s.NotNil(err)
dl, ok := errors.Cause(err).(*tikverr.ErrDeadlock)
s.True(ok)
waitChain := dl.GetWaitChain()
s.Equal(len(waitChain), 2)
checkWaitChainEntry(txns, waitChain[0], 0, 1)
checkWaitChainEntry(txns, waitChain[1], 1, 0)
	// Each transaction should be rolled back after its blocker has been rolled back.
waitAndRollback(txns, 1)
waitAndRollback(txns, 0)
s.T().Log("test case 2: 3->2->0->1->3")
txns = prepareTxns(4)
makeWaitFor(txns, 0, 1)
makeWaitFor(txns, 2, 0)
makeWaitFor(txns, 1, 3)
// Sleep for a while to make sure it has been blocked.
time.Sleep(time.Millisecond * 100)
err = tryLock(txns, 3, 2)
s.NotNil(err)
dl, ok = errors.Cause(err).(*tikverr.ErrDeadlock)
s.True(ok)
waitChain = dl.GetWaitChain()
s.Equal(len(waitChain), 4)
s.T().Logf("wait chain: \n** %v\n**%v\n**%v\n**%v\n", waitChain[0], waitChain[1], waitChain[2], waitChain[3])
checkWaitChainEntry(txns, waitChain[0], 2, 0)
checkWaitChainEntry(txns, waitChain[1], 0, 1)
checkWaitChainEntry(txns, waitChain[2], 1, 3)
checkWaitChainEntry(txns, waitChain[3], 3, 2)
	// Each transaction should be rolled back after its blocker has been rolled back.
waitAndRollback(txns, 3)
waitAndRollback(txns, 1)
waitAndRollback(txns, 0)
waitAndRollback(txns, 2)
}
func (s *testLockSuite) TestStartHeartBeatAfterLockingPrimary() {
atomic.StoreUint64(&transaction.ManagedLockTTL, 500)
s.Nil(failpoint.Enable("tikvclient/twoPCRequestBatchSizeLimit", `return`))
s.Nil(failpoint.Enable("tikvclient/afterPrimaryBatch", `pause`))
defer func() {
atomic.StoreUint64(&transaction.ManagedLockTTL, 20000)
s.Nil(failpoint.Disable("tikvclient/twoPCRequestBatchSizeLimit"))
}()
txn, err := s.store.Begin()
s.Nil(err)
txn.SetPessimistic(true)
lockCtx := &kv.LockCtx{ForUpdateTS: txn.StartTS(), WaitStartTime: time.Now()}
lockResCh := make(chan error)
	go func() {
		// Send the result directly instead of assigning to the captured err,
		// which would race with the main goroutine's use of err.
		lockResCh <- txn.LockKeys(context.Background(), lockCtx, []byte("a"), []byte("b"))
	}()
time.Sleep(500 * time.Millisecond)
	// Check that the heartbeat has updated the TTL.
lr := s.store.NewLockResolver()
status, err := lr.LockResolver.GetTxnStatus(txn.StartTS(), 0, []byte("a"))
s.Nil(err)
s.False(status.IsCommitted())
s.Greater(status.TTL(), uint64(600))
s.Equal(status.CommitTS(), uint64(0))
// Let locking the secondary key fail
s.Nil(failpoint.Enable("tikvclient/PessimisticLockErrWriteConflict", "return"))
s.Nil(failpoint.Disable("tikvclient/afterPrimaryBatch"))
s.Error(<-lockResCh)
s.Nil(failpoint.Disable("tikvclient/PessimisticLockErrWriteConflict"))
err = txn.LockKeys(context.Background(), lockCtx, []byte("c"), []byte("d"))
s.Nil(err)
time.Sleep(500 * time.Millisecond)
	// The original primary key "a" should be rolled back because its TTL is no longer being updated.
lr = s.store.NewLockResolver()
status, err = lr.LockResolver.GetTxnStatus(txn.StartTS(), 0, []byte("a"))
s.Nil(err)
s.False(status.IsCommitted())
s.Equal(status.TTL(), uint64(0))
// The TTL of the new primary lock should be updated.
lr = s.store.NewLockResolver()
status, err = lr.LockResolver.GetTxnStatus(txn.StartTS(), 0, []byte("c"))
s.Nil(err)
s.False(status.IsCommitted())
s.Greater(status.TTL(), uint64(1200))
s.Equal(status.CommitTS(), uint64(0))
s.Nil(txn.Rollback())
}
func (s *testLockSuite) TestPrewriteEncountersLargerTsLock() {
t1, err := s.store.Begin()
s.Nil(err)
s.Nil(t1.Set([]byte("k1"), []byte("v1")))
s.Nil(t1.Set([]byte("k2"), []byte("v2")))
// t2 has larger TS. Let t2 prewrite only the secondary lock.
t2, err := s.store.Begin()
s.Nil(err)
s.Nil(t2.Set([]byte("k1"), []byte("v1")))
s.Nil(t2.Set([]byte("k2"), []byte("v2")))
committer, err := t2.NewCommitter(1)
s.Nil(err)
committer.SetLockTTL(20000) // set TTL to 20s
s.Nil(failpoint.Enable("tikvclient/twoPCRequestBatchSizeLimit", "return"))
defer failpoint.Disable("tikvclient/twoPCRequestBatchSizeLimit")
s.Nil(failpoint.Enable("tikvclient/prewritePrimary", "pause"))
ch := make(chan struct{})
go func() {
err = committer.PrewriteAllMutations(context.Background())
s.Nil(err)
ch <- struct{}{}
}()
time.Sleep(200 * time.Millisecond) // make prewrite earlier than t1 commits
// Set 1 second timeout. If we still need to wait until t2 expires, we will get a timeout error
// instead of write conflict.
ctx, cancel := context.WithTimeout(context.Background(), time.Second)
defer cancel()
err = t1.Commit(ctx)
s.True(tikverr.IsErrWriteConflict(err))
s.Nil(failpoint.Disable("tikvclient/prewritePrimary"))
<-ch
}
func (s *testLockSuite) TestResolveLocksForRead() {
ctx := context.Background()
var resolvedLocks, committedLocks []uint64
var locks []*txnlock.Lock
// commitTS < readStartTS
startTS, _ := s.lockKey([]byte("k1"), []byte("v1"), []byte("k11"), []byte("v11"), 3000, true, false)
committedLocks = append(committedLocks, startTS)
lock := s.mustGetLock([]byte("k1"))
locks = append(locks, lock)
// rolled back
startTS, _ = s.lockKey([]byte("k2"), []byte("v2"), []byte("k22"), []byte("v22"), 3000, false, false)
lock = s.mustGetLock([]byte("k22"))
err := s.store.NewLockResolver().ForceResolveLock(ctx, lock)
s.Nil(err)
resolvedLocks = append(resolvedLocks, startTS)
lock = s.mustGetLock([]byte("k2"))
locks = append(locks, lock)
// pushed
startTS, _ = s.lockKey([]byte("k3"), []byte("v3"), []byte("k33"), []byte("v33"), 3000, false, false)
resolvedLocks = append(resolvedLocks, startTS)
lock = s.mustGetLock([]byte("k3"))
locks = append(locks, lock)
// can't be pushed and isn't expired
_, _ = s.lockKey([]byte("k4"), []byte("v4"), []byte("k44"), []byte("v44"), 3000, false, true)
lock = s.mustGetLock([]byte("k4"))
locks = append(locks, lock)
// can't be pushed but is expired
startTS, _ = s.lockKey([]byte("k5"), []byte("v5"), []byte("k55"), []byte("v55"), 0, false, true)
committedLocks = append(committedLocks, startTS)
lock = s.mustGetLock([]byte("k5"))
locks = append(locks, lock)
// commitTS > readStartTS
var readStartTS uint64
{
t, err := s.store.Begin()
s.Nil(err)
resolvedLocks = append(resolvedLocks, t.StartTS())
s.Nil(t.Set([]byte("k6"), []byte("v6")))
s.Nil(t.Set([]byte("k66"), []byte("v66")))
committer, err := t.NewCommitter(1)
s.Nil(err)
s.Nil(committer.PrewriteAllMutations(ctx))
committer.SetPrimaryKey([]byte("k66"))
readStartTS, err = s.store.GetOracle().GetTimestamp(ctx, &oracle.Option{TxnScope: oracle.GlobalTxnScope})
s.Nil(err)
commitTS, err := s.store.GetOracle().GetTimestamp(ctx, &oracle.Option{TxnScope: oracle.GlobalTxnScope})
s.Nil(err)
s.Greater(commitTS, readStartTS)
committer.SetCommitTS(commitTS)
err = committer.CommitMutations(ctx)
s.Nil(err)
lock = s.mustGetLock([]byte("k6"))
locks = append(locks, lock)
}
bo := tikv.NewBackoffer(context.Background(), getMaxBackoff)
lr := s.store.NewLockResolver()
defer lr.Close()
msBeforeExpired, resolved, committed, err := lr.ResolveLocksForRead(bo, readStartTS, locks, false)
s.Nil(err)
s.Greater(msBeforeExpired, int64(0))
s.Equal(resolvedLocks, resolved)
s.Equal(committedLocks, committed)
}
func (s *testLockSuite) TestLockWaitTimeLimit() {
k1 := []byte("k1")
k2 := []byte("k2")
txn1, err := s.store.Begin()
s.Nil(err)
txn1.SetPessimistic(true)
// lock the primary key
lockCtx := &kv.LockCtx{ForUpdateTS: txn1.StartTS(), WaitStartTime: time.Now()}
err = txn1.LockKeys(context.Background(), lockCtx, k1, k2)
s.Nil(err)
txn2, err := s.store.Begin()
s.Nil(err)
txn2.SetPessimistic(true)
// test no wait
lockCtx = kv.NewLockCtx(txn2.StartTS(), kv.LockNoWait, time.Now())
err = txn2.LockKeys(context.Background(), lockCtx, k1)
// cannot acquire lock immediately thus error
s.Equal(tikverr.ErrLockAcquireFailAndNoWaitSet.Error(), err.Error())
	// The default wait time is 1s; we use 500ms as an upper bound.
s.Less(time.Since(lockCtx.WaitStartTime), 500*time.Millisecond)
// test for wait limited time (200ms)
lockCtx = kv.NewLockCtx(txn2.StartTS(), 200, time.Now())
err = txn2.LockKeys(context.Background(), lockCtx, k2)
// cannot acquire lock in time thus error
s.Equal(tikverr.ErrLockWaitTimeout.Error(), err.Error())
s.GreaterOrEqual(time.Since(lockCtx.WaitStartTime), 200*time.Millisecond)
s.Less(time.Since(lockCtx.WaitStartTime), 800*time.Millisecond)
s.Nil(txn1.Rollback())
s.Nil(txn2.Rollback())
}
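// testLockWithTiKVSuite runs against a real TiKV cluster when the withTiKV
// flag is set, and falls back to the in-memory unistore otherwise.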
type testLockWithTiKVSuite struct {
suite.Suite
store tikv.StoreProbe
}
func (s *testLockWithTiKVSuite) SetupTest() {
if *withTiKV {
s.store = tikv.StoreProbe{KVStore: NewTestStore(s.T())}
s.cleanupLocks()
} else {
s.store = tikv.StoreProbe{KVStore: NewTestUniStore(s.T())}
s.cleanupLocks()
}
}
func (s *testLockWithTiKVSuite) TearDownTest() {
s.store.Close()
}
func (s *testLockWithTiKVSuite) cleanupLocks() {
	// Clean up possible leftover locks.
bo := tikv.NewBackofferWithVars(context.Background(), int(transaction.PrewriteMaxBackoff.Load()), nil)
ctx := context.WithValue(context.Background(), util.SessionID, uint64(1))
currentTS, err := s.store.CurrentTimestamp(oracle.GlobalTxnScope)
s.NoError(err)
remainingLocks, err := s.store.ScanLocks(ctx, []byte("k"), []byte("l"), currentTS)
s.NoError(err)
if len(remainingLocks) > 0 {
s.mustResolve(ctx, bo, remainingLocks, currentTS, []byte("k"), []byte("l"))
}
}
// TODO: Migrate FairLocking related tests here.
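// withRetry calls f until it succeeds or limit attempts have been made,
// sleeping delay between consecutive attempts, and returns the last result and error.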
func withRetry[T any](f func() (T, error), limit int, delay time.Duration) (T, error) {
for {
res, err := f()
if err == nil {
return res, nil
}
limit--
if limit <= 0 {
return res, err
}
if delay != 0 {
time.Sleep(delay)
}
}
}
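// checkIsKeyLocked probes whether key is currently locked by attempting a
// no-wait pessimistic lock on it, and always rolls the probing transaction back.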
func (s *testLockWithTiKVSuite) checkIsKeyLocked(key []byte, expectedLocked bool) {
// To be aware of the result of async operations (e.g. async pessimistic rollback), retry if the check fails.
_, err := withRetry(func() (interface{}, error) {
txn, err := s.store.Begin()
s.NoError(err)
txn.SetPessimistic(true)
lockCtx := kv.NewLockCtx(txn.StartTS(), kv.LockNoWait, time.Now())
err = txn.LockKeys(context.Background(), lockCtx, key)
var isCheckSuccess bool
if err != nil && stderrs.Is(err, tikverr.ErrLockAcquireFailAndNoWaitSet) {
isCheckSuccess = expectedLocked
} else {
s.Nil(err)
isCheckSuccess = !expectedLocked
}
if isCheckSuccess {
s.Nil(txn.Rollback())
return nil, nil
}
s.Nil(txn.Rollback())
		return nil, errors.Errorf("expected key %q locked = %v, but the actual result does not match", string(key), expectedLocked)
}, 5, time.Millisecond*50)
s.NoError(err)
}
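// trySetTiKVConfig updates a config item on every live TiKV store through the
// status-address HTTP API on a best-effort basis (failures are only logged)
// and returns a function that restores the original values.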
func (s *testLockWithTiKVSuite) trySetTiKVConfig(name string, value interface{}) func() {
stores, err := s.store.GetPDClient().GetAllStores(context.Background())
s.NoError(err)
type configItem struct {
url string
name string
value interface{}
}
var recoverConfigs []configItem
httpScheme := "http"
if c, err := config.GetGlobalConfig().Security.ToTLSConfig(); err == nil && c != nil {
httpScheme = "https"
}
t := s.Suite.T()
setCfg := func(url, name string, value interface{}) error {
postBody, err := json.Marshal(map[string]interface{}{name: value})
if err != nil {
return err
}
resp, err := http.Post(url, "text/json", bytes.NewReader(postBody))
if err != nil {
return err
}
s.NoError(resp.Body.Close())
if resp.StatusCode != 200 {
return errors.Errorf("post config got unexpected status code: %v, request body: %s", resp.StatusCode, postBody)
}
t.Logf("set config for tikv at %s finished: %s", url, string(postBody))
return nil
}
storeIter:
for _, store := range stores {
if store.State != metapb.StoreState_Up {
continue
}
for _, label := range store.Labels {
if label.Key == "engine" && label.Value != "tikv" {
continue storeIter
}
}
err := func() (err error) {
defer func() {
if r := recover(); r != nil {
err = errors.Errorf("set config for store at %v panicked: %v", store.StatusAddress, r)
}
}()
url := fmt.Sprintf("%s://%s/config", httpScheme, store.StatusAddress)
resp, err := http.Get(url)
if err != nil {
return err
}
defer resp.Body.Close()
if resp.StatusCode != 200 {
return errors.Errorf("unexpected response status: %v", resp.Status)
}
oldCfgRaw, err := io.ReadAll(resp.Body)
if err != nil {
return err
}
oldCfg := make(map[string]interface{})
err = json.Unmarshal(oldCfgRaw, &oldCfg)
if err != nil {
return err
}
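			// NOTE: reading back the old value is hardcoded to the
			// pessimistic-txn.in-memory entry, so this helper currently assumes
			// name == "pessimistic-txn.in-memory".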
oldValue := oldCfg["pessimistic-txn"].(map[string]interface{})["in-memory"]
if assert.ObjectsAreEqual(oldValue, value) {
return nil
}
err = setCfg(url, name, value)
if err != nil {
return err
}
recoverConfigs = append(recoverConfigs, configItem{
url: url,
name: name,
value: oldValue,
})
return nil
}()
if err != nil {
t.Logf("failed to set config for store at %s: %v", store.StatusAddress, err)
}
}
// Prevent goleak from complaining about its internal connections.
http.DefaultClient.CloseIdleConnections()
if len(recoverConfigs) > 0 {
// Sleep for a while to ensure the new configs are applied.
time.Sleep(time.Second)
}
return func() {
for _, item := range recoverConfigs {
err = setCfg(item.url, item.name, item.value)
if err != nil {
t.Logf("failed to recover config for store at %s: %v", item.url, err)
}
}
// Prevent goleak from complaining about its internal connections.
http.DefaultClient.CloseIdleConnections()
}
}
func (s *testLockWithTiKVSuite) TestPrewriteCheckForUpdateTS() {
test := func(asyncCommit bool, onePC bool, causalConsistency bool) {
k1 := []byte("k1")
k2 := []byte("k2")
k3 := []byte("k3")
k4 := []byte("k4")
v1 := []byte("v1")
v2 := []byte("v2")
// Clear previous value
{
txn, err := s.store.Begin()
s.NoError(err)
for _, k := range [][]byte{k1, k2, k3, k4} {
s.NoError(txn.Delete(k))
}
s.NoError(txn.Commit(context.Background()))
}
ctx := context.WithValue(context.Background(), util.SessionID, uint64(1))
// Test failing case
txn, err := s.store.Begin()
s.NoError(err)
txn.SetPessimistic(true)
txn.SetEnableAsyncCommit(asyncCommit)
txn.SetEnable1PC(onePC)
txn.SetCausalConsistency(causalConsistency)
txn.StartAggressiveLocking()
lockTime := time.Now()
lockCtx := kv.NewLockCtx(txn.StartTS(), 200, lockTime)
s.NoError(txn.LockKeys(ctx, lockCtx, k1))
s.NoError(txn.LockKeys(ctx, lockCtx, k2))
s.NoError(txn.LockKeys(ctx, lockCtx, k3))
txn.DoneAggressiveLocking(ctx)
s.NoError(txn.Set(k1, v1))
txn.GetCommitter().CloseTTLManager()
simulatedCommitter, err := txn.NewCommitter(1)
s.NoError(err)
s.NoError(failpoint.Enable("tikvclient/beforePrewrite", "pause"))
commitFinishCh := make(chan error)
go func() {
commitFinishCh <- txn.Commit(ctx)
}()
select {
case <-commitFinishCh:
s.Fail("txn commit not blocked")
case <-time.After(time.Millisecond * 100):
}
// Simulate pessimistic lock lost. Retry on region error to make it stable when running with TiKV.
{
mutations := transaction.NewPlainMutations(1)
mutations.Push(kvrpcpb.Op_PessimisticLock, k1, nil, true, false, false, false)
simulatedCommitter.SetForUpdateTS(simulatedCommitter.GetStartTS())
err := simulatedCommitter.PessimisticRollbackMutations(context.Background(), &mutations)
s.NoError(err)
s.checkIsKeyLocked(k1, false)
}
// Simulate the key being written by another transaction
txn2, err := s.store.Begin()
s.NoError(err)
s.NoError(txn2.Set(k1, v2))
s.NoError(txn2.Commit(context.Background()))
// Simulate stale pessimistic lock request being replayed on TiKV
{
simulatedTxn, err := s.store.Begin()
s.NoError(err)
simulatedTxn.SetStartTS(txn.StartTS())
simulatedTxn.SetPessimistic(true)
simulatedTxn.StartAggressiveLocking()
lockCtx := kv.NewLockCtx(txn.StartTS(), 200, lockTime)
s.NoError(simulatedTxn.LockKeys(context.Background(), lockCtx, k1))
info := simulatedTxn.GetAggressiveLockingKeysInfo()
s.Equal(1, len(info))
s.Equal(k1, info[0].Key())
s.Equal(txn2.GetCommitTS(), info[0].ActualLockForUpdateTS())
simulatedTxn.DoneAggressiveLocking(context.Background())
defer func() {
s.NoError(simulatedTxn.Rollback())
}()
}
s.NoError(failpoint.Disable("tikvclient/beforePrewrite"))
err = <-commitFinishCh
s.Error(err)
s.Regexp("[pP]essimistic ?[lL]ock ?[nN]ot ?[fF]ound", err.Error())
snapshot := s.store.GetSnapshot(txn2.GetCommitTS())
v, err := snapshot.Get(context.Background(), k1)
s.NoError(err)
s.Equal(v2, v)
snapshot = s.store.GetSnapshot(txn2.GetCommitTS() - 1)
_, err = snapshot.Get(context.Background(), k1)
s.Equal(tikverr.ErrNotExist, err)
// Test passing case
txn, err = s.store.Begin()
s.NoError(err)
txn.SetPessimistic(true)
txn.SetEnableAsyncCommit(asyncCommit)
txn.SetEnable1PC(onePC)
txn.SetCausalConsistency(causalConsistency)
// Prepare a conflicting version to key k2
{
txn1, err := s.store.Begin()
s.NoError(err)
s.NoError(txn1.Set(k2, v2))
s.NoError(txn1.Commit(context.Background()))
}
txn.StartAggressiveLocking()
lockCtx = kv.NewLockCtx(txn.StartTS(), 200, lockTime)
// k2: conflicting key
s.NoError(txn.LockKeys(ctx, lockCtx, k2))
// k3: non-conflicting key
s.NoError(txn.LockKeys(ctx, lockCtx, k3))
		// There must be a new TSO allocation before committing if any key is locked with conflict; otherwise
		// async commit would become unsafe.
		// In TiDB, there is always a TSO allocation for updating forUpdateTS in this case.
currentTS, err := s.store.CurrentTimestamp(oracle.GlobalTxnScope)
s.NoError(err)
lockCtx = kv.NewLockCtx(currentTS, 200, lockTime)
// k4: non-conflicting key but forUpdateTS updated
s.NoError(txn.LockKeys(ctx, lockCtx, k4))
s.NoError(txn.Set(k2, v1))
s.NoError(txn.Set(k3, v1))
txn.DoneAggressiveLocking(ctx)
s.NoError(txn.Commit(ctx))
snapshot = s.store.GetSnapshot(txn.GetCommitTS())
v, err = snapshot.Get(context.Background(), k2)
s.NoError(err)
s.Equal(v1, v)
v, err = snapshot.Get(context.Background(), k3)
s.NoError(err)
s.Equal(v1, v)
snapshot = s.store.GetSnapshot(txn.GetCommitTS() - 1)
v, err = snapshot.Get(context.Background(), k2)
s.NoError(err)
s.Equal(v2, v)
_, err = snapshot.Get(context.Background(), k3)
s.Equal(tikverr.ErrNotExist, err)
}
test(false, false, false)
test(true, false, false)
test(true, true, false)
test(true, false, true)
}
func (s *testLockWithTiKVSuite) TestCheckTxnStatusSentToSecondary() {
s.NoError(failpoint.Enable("tikvclient/beforeAsyncPessimisticRollback", `return("skip")`))
s.NoError(failpoint.Enable("tikvclient/twoPCRequestBatchSizeLimit", "return"))
s.NoError(failpoint.Enable("tikvclient/shortPessimisticLockTTL", "return"))
s.NoError(failpoint.Enable("tikvclient/twoPCShortLockTTL", "return"))
defer func() {
s.NoError(failpoint.Disable("tikvclient/beforeAsyncPessimisticRollback"))
s.NoError(failpoint.Disable("tikvclient/twoPCRequestBatchSizeLimit"))
s.NoError(failpoint.Disable("tikvclient/shortPessimisticLockTTL"))
s.NoError(failpoint.Disable("tikvclient/twoPCShortLockTTL"))
}()
k1 := []byte("k1")
k2 := []byte("k2")
k3 := []byte("k3")
ctx := context.WithValue(context.Background(), util.SessionID, uint64(1))
txn, err := s.store.Begin()
s.NoError(err)
txn.SetPessimistic(true)
// Construct write conflict to make the LockKeys operation fail.
{
txn2, err := s.store.Begin()
s.NoError(err)
s.NoError(txn2.Set(k3, []byte("v3")))
s.NoError(txn2.Commit(ctx))
}
lockCtx := kv.NewLockCtx(txn.StartTS(), 200, time.Now())
err = txn.LockKeys(ctx, lockCtx, k1, k2, k3)
s.IsType(&tikverr.ErrWriteConflict{}, errors.Cause(err))
	// At this time, txn's primary is still unset, and the keys are:
// * k1: stale pessimistic lock, primary
// * k2: stale pessimistic lock, primary -> k1
forUpdateTS, err := s.store.CurrentTimestamp(oracle.GlobalTxnScope)
s.NoError(err)
lockCtx = kv.NewLockCtx(forUpdateTS, 200, time.Now())
	err = txn.LockKeys(ctx, lockCtx, k3) // k3 becomes primary
	s.NoError(err)
	err = txn.LockKeys(ctx, lockCtx, k1)
	s.NoError(err)
s.Equal(k3, txn.GetCommitter().GetPrimaryKey())
// At this time:
// * k1: pessimistic lock, primary -> k3
// * k2: stale pessimistic lock, primary -> k1
// * k3: pessimistic lock, primary
s.NoError(txn.Set(k1, []byte("v1-1")))
s.NoError(txn.Set(k3, []byte("v3-1")))
s.NoError(failpoint.Enable("tikvclient/beforeCommitSecondaries", `return("skip")`))
defer func() {
s.NoError(failpoint.Disable("tikvclient/beforeCommitSecondaries"))
}()
s.NoError(txn.Commit(ctx))
// At this time:
// * k1: prewritten, primary -> k3
// * k2: stale pessimistic lock, primary -> k1
// * k3: committed
// Trigger resolving lock on k2
{
txn2, err := s.store.Begin()
s.NoError(err)
txn2.SetPessimistic(true)
lockCtx = kv.NewLockCtx(txn2.StartTS(), 200, time.Now())
s.NoError(txn2.LockKeys(ctx, lockCtx, k2))
s.NoError(txn2.Rollback())
}
// Check data consistency
readTS, err := s.store.CurrentTimestamp(oracle.GlobalTxnScope)
s.NoError(err)
snapshot := s.store.GetSnapshot(readTS)
v, err := snapshot.Get(ctx, k3)
s.NoError(err)
s.Equal([]byte("v3-1"), v)
_, err = snapshot.Get(ctx, k2)
s.Equal(tikverr.ErrNotExist, err)
v, err = snapshot.Get(ctx, k1)
s.NoError(err)
s.Equal([]byte("v1-1"), v)
}
func (s *testLockWithTiKVSuite) TestBatchResolveLocks() {
if *withTiKV {
recoverFunc := s.trySetTiKVConfig("pessimistic-txn.in-memory", false)
defer recoverFunc()
}
s.NoError(failpoint.Enable("tikvclient/beforeAsyncPessimisticRollback", `return("skip")`))
s.NoError(failpoint.Enable("tikvclient/beforeCommitSecondaries", `return("skip")`))
s.NoError(failpoint.Enable("tikvclient/twoPCRequestBatchSizeLimit", `return`))
s.NoError(failpoint.Enable("tikvclient/onRollback", `return("skipRollbackPessimisticLock")`))
defer func() {
s.NoError(failpoint.Disable("tikvclient/beforeAsyncPessimisticRollback"))
s.NoError(failpoint.Disable("tikvclient/beforeCommitSecondaries"))
s.NoError(failpoint.Disable("tikvclient/twoPCRequestBatchSizeLimit"))
s.NoError(failpoint.Disable("tikvclient/onRollback"))
}()
k1, k2, k3, k4 := []byte("k1"), []byte("k2"), []byte("k3"), []byte("k4")
v2, v3 := []byte("v2"), []byte("v3")
ctx := context.WithValue(context.Background(), util.SessionID, uint64(1))
txn1, err := s.store.Begin()
s.NoError(err)
txn1.SetPessimistic(true)
{
// Produce write conflict on key k2
helperTxn, err := s.store.Begin()
s.NoError(err)
s.NoError(helperTxn.Set(k2, []byte("v0")))
s.NoError(helperTxn.Commit(ctx))
}
lockCtx := kv.NewLockCtx(txn1.StartTS(), 200, time.Now())
err = txn1.LockKeys(ctx, lockCtx, k1, k2)
s.IsType(&tikverr.ErrWriteConflict{}, errors.Cause(err))
// k1 has txn1's stale pessimistic lock now.
forUpdateTS, err := s.store.CurrentTimestamp(oracle.GlobalTxnScope)
s.NoError(err)
lockCtx = kv.NewLockCtx(forUpdateTS, 200, time.Now())
s.NoError(txn1.LockKeys(ctx, lockCtx, k2, k3))
s.NoError(txn1.Set(k2, v2))
s.NoError(txn1.Set(k3, v3))
s.NoError(txn1.Commit(ctx))
// k3 has txn1's stale prewrite lock now.
	txn2, err := s.store.Begin()
	s.NoError(err)
	txn2.SetPessimistic(true)
	lockCtx = kv.NewLockCtx(txn2.StartTS(), 200, time.Now())
err = txn2.LockKeys(ctx, lockCtx, k4)
s.NoError(err)
s.NoError(txn2.Rollback())
// k4 has txn2's stale primary pessimistic lock now.
	currentTS, err := s.store.CurrentTimestamp(oracle.GlobalTxnScope)
	s.NoError(err)
	remainingLocks, err := s.store.ScanLocks(ctx, []byte("k"), []byte("l"), currentTS)
	s.NoError(err)
s.Len(remainingLocks, 3)
s.Equal(remainingLocks[0].Key, k1)
s.Equal(remainingLocks[0].LockType, kvrpcpb.Op_PessimisticLock)
s.Equal(remainingLocks[1].Key, k3)
s.Equal(remainingLocks[1].LockType, kvrpcpb.Op_Put)
s.Equal(remainingLocks[2].Key, k4)
s.Equal(remainingLocks[2].LockType, kvrpcpb.Op_PessimisticLock)
s.Equal(remainingLocks[2].Primary, k4)
	// Perform the ScanLock + BatchResolveLock pass.
s.NoError(s.store.GCResolveLockPhase(ctx, currentTS, 1))
// Do ScanLock again to make sure no locks are left.
remainingLocks, err = s.store.ScanLocks(ctx, []byte("k"), []byte("l"), currentTS)
s.NoError(err)
s.Empty(remainingLocks)
// Check data consistency
	readTS, err := s.store.CurrentTimestamp(oracle.GlobalTxnScope)
	s.NoError(err)
	snapshot := s.store.GetSnapshot(readTS)
_, err = snapshot.Get(ctx, k1)
s.Equal(tikverr.ErrNotExist, err)
v, err := snapshot.Get(ctx, k2)
s.NoError(err)
s.Equal(v2, v)
v, err = snapshot.Get(ctx, k3)
s.NoError(err)
s.Equal(v3, v)
}
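// makeLock constructs a synthetic pessimistic lock, shaped like what a
// resolver would observe, to drive ResolveLocksWithOpts in the tests below.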
func (s *testLockWithTiKVSuite) makeLock(startTS uint64, forUpdateTS uint64, key []byte, primary []byte) *txnlock.Lock {
return &txnlock.Lock{
Key: key,
Primary: primary,
TxnID: startTS,
TTL: 10,
TxnSize: 1024,
LockType: kvrpcpb.Op_PessimisticLock,
UseAsyncCommit: false,
LockForUpdateTS: forUpdateTS,
MinCommitTS: forUpdateTS,
}
}
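// mustLockNum asserts that scanning [startKey, endKey) at scanTS finds exactly
// expectedNum locks.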
func (s *testLockWithTiKVSuite) mustLockNum(ctx context.Context, expectedNum int, scanTS uint64, startKey []byte, endKey []byte) {
remainingLocks, err := s.store.ScanLocks(ctx, startKey, endKey, scanTS)
s.NoError(err)
s.Len(remainingLocks, expectedNum)
}
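// mustResolve resolves the given locks with PessimisticRegionResolve enabled
// and then rescans [startKey, endKey) to assert that no locks remain.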
func (s *testLockWithTiKVSuite) mustResolve(ctx context.Context, bo *retry.Backoffer, remainingLocks []*txnlock.Lock, callerTS uint64, startKey []byte, endKey []byte) {
if len(remainingLocks) > 0 {
_, err := s.store.GetLockResolver().ResolveLocksWithOpts(bo, txnlock.ResolveLocksOptions{
CallerStartTS: callerTS,
Locks: remainingLocks,
Lite: false,
ForRead: false,
Detail: nil,
PessimisticRegionResolve: true,
})
s.NoError(err)
lockAfterResolve, err := s.store.ScanLocks(ctx, startKey, endKey, callerTS)
s.NoError(err)
s.Len(lockAfterResolve, 0, "expected=%v actual=%v", 0, len(lockAfterResolve))
}
}
func (s *testLockWithTiKVSuite) TestPessimisticRollbackWithRead() {
s.NoError(failpoint.Enable("tikvclient/shortPessimisticLockTTL", "return"))
s.NoError(failpoint.Enable("tikvclient/twoPCShortLockTTL", "return"))
defer func() {
s.NoError(failpoint.Disable("tikvclient/shortPessimisticLockTTL"))
s.NoError(failpoint.Disable("tikvclient/twoPCShortLockTTL"))
}()
test := func(inMemoryLock bool) {
if *withTiKV {
recoverFunc := s.trySetTiKVConfig("pessimistic-txn.in-memory", inMemoryLock)
defer recoverFunc()
}
		// Init: clean up possible leftover locks.
bo := tikv.NewBackofferWithVars(context.Background(), int(transaction.PrewriteMaxBackoff.Load()), nil)
ctx := context.WithValue(context.Background(), util.SessionID, uint64(1))
s.cleanupLocks()
// Basic case, three keys could be rolled back within one pessimistic rollback request.
k1, k2, k3 := []byte("k1"), []byte("k2"), []byte("k3")
txn1, err := s.store.Begin()
s.NoError(err)
startTS := txn1.StartTS()
txn1.SetPessimistic(true)
lockCtx := kv.NewLockCtx(startTS, 200, time.Now())
err = txn1.LockKeys(ctx, lockCtx, k1, k2, k3)
s.NoError(err)
txn1.GetCommitter().CloseTTLManager()
time.Sleep(time.Millisecond * 100)
s.mustLockNum(ctx, 3, startTS+1, []byte("k"), []byte("l"))
locks := []*txnlock.Lock{
s.makeLock(startTS, startTS, k3, k1),
}
s.mustResolve(ctx, bo, locks, startTS+1, []byte("k"), []byte("l"))
time.Sleep(time.Millisecond * 100)
s.mustLockNum(ctx, 0, startTS+1, []byte("k"), []byte("l"))
		// Acquire pessimistic locks on more than 256 (RESOLVE_LOCK_BATCH_SIZE) keys.
formatKey := func(prefix rune, i int) []byte {
return []byte(fmt.Sprintf("%c%04d", prefix, i))
}
numKeys := 1000
prewriteKeys := make([][]byte, 0, numKeys/2)
pessimisticLockKeys := make([][]byte, 0, numKeys/2)
for i := 0; i < numKeys; i++ {
key := formatKey('k', i)
if i%2 == 0 {
err = txn1.LockKeys(ctx, lockCtx, key)
pessimisticLockKeys = append(pessimisticLockKeys, key)
} else {
err = txn1.Set(key, []byte("val"))
s.NoError(err)
prewriteKeys = append(prewriteKeys, key)
}
s.NoError(err)
}
committer, err := txn1.NewCommitter(1)
s.NoError(err)
mutations := committer.MutationsOfKeys(prewriteKeys)
err = committer.PrewriteMutations(ctx, mutations)
s.NoError(err)
		// All the pessimistic locks belonging to the same transaction are
		// pessimistically rolled back within one request.
time.Sleep(time.Millisecond * 100)
pessimisticLock := s.makeLock(startTS, startTS, pessimisticLockKeys[1], pessimisticLockKeys[0])
_, err = s.store.GetLockResolver().ResolveLocksWithOpts(bo, txnlock.ResolveLocksOptions{
CallerStartTS: startTS + 1,
Locks: []*txnlock.Lock{pessimisticLock},
Lite: false,
ForRead: false,
Detail: nil,
PessimisticRegionResolve: true,
})
s.NoError(err)
time.Sleep(time.Millisecond * 100)
s.mustLockNum(ctx, numKeys/2, startTS+1, []byte("k"), []byte("l"))
// Cleanup.
err = txn1.Rollback()
s.NoError(err)
}
test(false)
test(true)
}