2 Star 2 Fork 1

cockroachdb/cockroach

加入 Gitee
与超过 1200万 开发者一起发现、参与优秀开源项目,私有仓库也完全免费 :)
免费加入
文件
克隆/下载
txn.go 44.21 KB
一键复制 编辑 原始数据 按行查看 历史
Andrei Matei 提交于 2017-09-29 18:54 . sql: fix stale txn deadline
12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223
// Copyright 2015 The Cockroach Authors.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
// implied. See the License for the specific language governing
// permissions and limitations under the License.
package client
import (
"fmt"
"github.com/gogo/protobuf/proto"
opentracing "github.com/opentracing/opentracing-go"
"github.com/pkg/errors"
"golang.org/x/net/context"
"github.com/cockroachdb/cockroach/pkg/keys"
"github.com/cockroachdb/cockroach/pkg/roachpb"
"github.com/cockroachdb/cockroach/pkg/storage/engine/enginepb"
"github.com/cockroachdb/cockroach/pkg/util/hlc"
"github.com/cockroachdb/cockroach/pkg/util/log"
"github.com/cockroachdb/cockroach/pkg/util/syncutil"
"github.com/cockroachdb/cockroach/pkg/util/tracing"
"github.com/cockroachdb/cockroach/pkg/util/uuid"
)
// Txn is an in-progress distributed database transaction. A Txn is safe for
// concurrent use by multiple goroutines.
type Txn struct {
db *DB
// gatewayNodeID, if != 0, is the ID of the node on whose behalf this
// transaction is running. Normally this is the current node, but in the case
// of Txns created on remote nodes by DistSQL this will be the gateway.
// It will be attached to all requests sent through this transaction.
gatewayNodeID roachpb.NodeID
// The following fields are not safe for concurrent modification.
// They should be set before operating on the transaction.
// commitTriggers are run upon successful commit.
commitTriggers []func()
// systemConfigTrigger is set to true when modifying keys from the SystemConfig
// span. This sets the SystemConfigTrigger on EndTransactionRequest.
systemConfigTrigger bool
// The txn has to be committed by this deadline. A nil value indicates no
// deadline.
deadline *hlc.Timestamp
// mu holds fields that need to be synchronized for concurrent request execution.
mu struct {
syncutil.Mutex
Proto roachpb.Transaction
// UserPriority is the transaction's priority. If not set,
// NormalUserPriority will be used.
// TODO(andrei): Can this go away now that UserPriority and Proto.Priority
// are initialized at the same time?
UserPriority roachpb.UserPriority
// active is set whenever the transaction is actively running. It will
// be initially set when the transaction sends its first batch, but is
// reset if the transaction is aborted.
active bool
// txnAnchorKey is the key at which to anchor the transaction record. If
// unset, the first key written in the transaction will be used.
txnAnchorKey roachpb.Key
// writingTxnRecord is set when the Txn is in the middle of writing
// its transaction record. It is used to assure that even in the presence
// of concurrent requests, only one sends a BeginTxnRequest.
writingTxnRecord bool
// see IsFinalized()
finalized bool
// previousIDs holds the set of all previous IDs that the Txn's Proto has
// had across transaction aborts. This allows us to determine if a given
// response was meant for any incarnation of this transaction.
//
// TODO(andrei): This concept of the history of IDs seems problematic to me:
// if we get a retryable error for a really old incarnation of a
// transaction, a client (or Txn.Exec) probably doesn't want to retry.
// If Txn stays multi-threaded, I think restarting a transaction should
// become an explicit client operation that doesn't allow more requests to
// be sent for the old incarnation, and also doesn't let results for
// requests sent through old incarnations to be processed.
// If Txn becomes single-threaded, then the point is moot and this can again
// go away.
previousIDs map[uuid.UUID]struct{}
// commandCount indicates how many requests have been sent through
// this transaction. Reset on retryable txn errors.
// TODO(andrei): This is broken for DistSQL, which doesn't account for the
// requests it uses the transaction for.
commandCount int
}
// Set for DistSQL transactions that get errors that would otherwise be
// handled by the TxnCoordSender.
acceptUnhandledRetryableErrors bool
}
// NewTxn returns a new txn.
//
// gatewayNodeID: If != 0, this is the ID of the node on whose behalf this
// transaction is running. Normally this is the current node, but in the case
// of Txns created on remote nodes by DistSQL this will be the gateway.
// If 0 is passed, then no value is going to be filled in the batches sent
// through this txn. This will have the effect that the DistSender will fill
// in the batch with the current node's ID.
func NewTxn(db *DB, gatewayNodeID roachpb.NodeID) *Txn {
return NewTxnWithProto(db, gatewayNodeID, roachpb.MakeTransaction(
"unnamed",
nil, // baseKey
roachpb.NormalUserPriority,
enginepb.SERIALIZABLE,
db.clock.Now(),
db.clock.MaxOffset().Nanoseconds(),
))
}
// NewTxnWithProto is like NewTxn, except it returns a new txn with the provided
// Transaction proto. This allows a client.Txn to be created with an already
// initialized proto.
func NewTxnWithProto(db *DB, gatewayNodeID roachpb.NodeID, proto roachpb.Transaction) *Txn {
if db == nil {
log.Fatalf(context.TODO(), "attempting to create txn with nil db for Transaction: %s", proto)
}
proto.AssertInitialized(context.TODO())
txn := &Txn{db: db, gatewayNodeID: gatewayNodeID}
txn.mu.Proto = proto
return txn
}
// ID returns the current ID of the transaction.
func (txn *Txn) ID() uuid.UUID {
txn.mu.Lock()
defer txn.mu.Unlock()
return txn.mu.Proto.ID
}
// AcceptUnhandledRetryableErrors is used by DistSQL to make the client.Txn not
// freak out on errors that should be handled by the TxnCoordSender.
func (txn *Txn) AcceptUnhandledRetryableErrors() {
txn.acceptUnhandledRetryableErrors = true
}
// CommandCount returns the count of commands executed through this txn.
// Retryable errors on the transaction will reset the count to 0.
func (txn *Txn) CommandCount() int {
txn.mu.Lock()
defer txn.mu.Unlock()
return txn.mu.commandCount
}
// IsFinalized returns true if this Txn has been finalized and should therefore
// not be used for any more KV operations.
// A Txn is considered finalized if it successfully committed or if a rollback
// was attempted (successful or not).
// Note that Commit() always leaves the transaction finalized, since it attempts
// to rollback on error.
func (txn *Txn) IsFinalized() bool {
txn.mu.Lock()
defer txn.mu.Unlock()
return txn.mu.finalized
}
// status returns the txn proto status field.
func (txn *Txn) status() roachpb.TransactionStatus {
txn.mu.Lock()
defer txn.mu.Unlock()
return txn.mu.Proto.Status
}
// IsCommitted returns true if the transaction has the committed status.
func (txn *Txn) IsCommitted() bool {
return txn.status() == roachpb.COMMITTED
}
// IsAborted returns true if the transaction has the aborted status.
func (txn *Txn) IsAborted() bool {
return txn.status() == roachpb.ABORTED
}
// SetUserPriority sets the transaction's user priority. Transactions default to
// normal user priority. The user priority must be set before any operations are
// performed on the transaction.
func (txn *Txn) SetUserPriority(userPriority roachpb.UserPriority) error {
txn.mu.Lock()
defer txn.mu.Unlock()
if txn.mu.UserPriority == userPriority {
return nil
}
if txn.mu.active {
return errors.Errorf("cannot change the user priority of a running transaction")
}
if userPriority < roachpb.MinUserPriority || userPriority > roachpb.MaxUserPriority {
return errors.Errorf("the given user priority %f is out of the allowed range [%f, %d]",
userPriority, roachpb.MinUserPriority, roachpb.MaxUserPriority)
}
txn.mu.UserPriority = userPriority
txn.mu.Proto.Priority = roachpb.MakePriority(userPriority)
return nil
}
// InternalSetPriority sets the transaction priority. It is intended for
// internal (testing) use only.
func (txn *Txn) InternalSetPriority(priority int32) {
txn.mu.Lock()
// The negative user priority is translated on the server into a positive,
// non-randomized, priority for the transaction.
txn.mu.UserPriority = roachpb.UserPriority(-priority)
txn.mu.Proto.Priority = roachpb.MakePriority(txn.mu.UserPriority)
txn.mu.Unlock()
}
// UserPriority returns the transaction's user priority.
func (txn *Txn) UserPriority() roachpb.UserPriority {
txn.mu.Lock()
defer txn.mu.Unlock()
return txn.mu.UserPriority
}
// SetDebugName sets the debug name associated with the transaction which will
// appear in log files and the web UI.
func (txn *Txn) SetDebugName(name string) {
txn.mu.Lock()
defer txn.mu.Unlock()
if txn.mu.Proto.Name == name {
return
}
if txn.mu.active {
panic("cannot change the debug name of a running transaction")
}
txn.mu.Proto.Name = name
}
// DebugName returns the debug name associated with the transaction.
func (txn *Txn) DebugName() string {
txn.mu.Lock()
defer txn.mu.Unlock()
return fmt.Sprintf("%s (id: %s)", txn.mu.Proto.Name, txn.mu.Proto.ID)
}
// SetIsolation sets the transaction's isolation type. Transactions default to
// serializable isolation. The isolation must be set before any operations are
// performed on the transaction.
func (txn *Txn) SetIsolation(isolation enginepb.IsolationType) error {
txn.mu.Lock()
defer txn.mu.Unlock()
if txn.mu.Proto.Isolation == isolation {
return nil
}
if txn.mu.active {
return errors.Errorf("cannot change the isolation level of a running transaction")
}
txn.mu.Proto.Isolation = isolation
return nil
}
// Isolation returns the transaction's isolation type.
func (txn *Txn) Isolation() enginepb.IsolationType {
txn.mu.Lock()
defer txn.mu.Unlock()
return txn.mu.Proto.Isolation
}
// OrigTimestamp returns the transaction's starting timestamp.
func (txn *Txn) OrigTimestamp() hlc.Timestamp {
txn.mu.Lock()
defer txn.mu.Unlock()
return txn.mu.Proto.OrigTimestamp
}
// AnchorKey returns the transaction's anchor key. The caller should treat the
// returned byte slice as immutable.
func (txn *Txn) AnchorKey() []byte {
txn.mu.Lock()
defer txn.mu.Unlock()
return txn.mu.Proto.Key
}
// SetTxnAnchorKey sets the key at which to anchor the transaction record. The
// transaction anchor key defaults to the first key written in a transaction.
func (txn *Txn) SetTxnAnchorKey(key roachpb.Key) error {
txn.mu.Lock()
defer txn.mu.Unlock()
if txn.mu.Proto.Writing || txn.mu.writingTxnRecord {
return errors.Errorf("transaction anchor key already set")
}
txn.mu.txnAnchorKey = key
return nil
}
// SetSystemConfigTrigger sets the system db trigger to true on this transaction.
// This will impact the EndTransactionRequest.
//
// NOTE: The system db trigger will only execute correctly if the transaction
// record is located on the range that contains the system span. If a
// transaction is created which modifies both system *and* non-system data, it
// should be ensured that the transaction record itself is on the system span.
// This can be done by making sure a system key is the first key touched in the
// transaction.
func (txn *Txn) SetSystemConfigTrigger() error {
if !txn.systemConfigTrigger {
txn.systemConfigTrigger = true
// The system-config trigger must be run on the system-config range which
// means any transaction with the trigger set needs to be anchored to the
// system-config range.
return txn.SetTxnAnchorKey(keys.SystemConfigSpan.Key)
}
return nil
}
// Proto returns the transactions underlying protocol buffer. It is not thread-safe,
// only use if you know that no requests are executing concurrently.
//
// A thread-safe alternative would be to clone the Proto under lock and return
// this clone, but we currently have no situations where this is needed.
func (txn *Txn) Proto() *roachpb.Transaction {
return &txn.mu.Proto
}
// IsSerializableRestart returns true if the transaction is serializable and
// its timestamp has been pushed. Used to detect whether the txn will be
// allowed to commit.
//
// Note that this method allows for false negatives: sometimes the client only
// figures out that it's been pushed when it sends an EndTransaction - i.e. it's
// possible for the txn to have been pushed asynchoronously by some other
// operation (usually, but not exclusively, by a high-priority txn with
// conflicting writes).
func (txn *Txn) IsSerializableRestart() bool {
txn.mu.Lock()
defer txn.mu.Unlock()
// TODO(andrei): The Walltime != 0 test is necessary but it feels like it
// shouldn't be. Hopefully the proto initialization can be improved such that
// Timestamp is always set.
isTxnPushed := txn.Proto().Timestamp.WallTime != 0 &&
txn.Proto().Timestamp != txn.Proto().OrigTimestamp
return txn.Proto().Isolation == enginepb.SERIALIZABLE && isTxnPushed
}
// NewBatch creates and returns a new empty batch object for use with the Txn.
func (txn *Txn) NewBatch() *Batch {
return &Batch{txn: txn}
}
// Get retrieves the value for a key, returning the retrieved key/value or an
// error. It is not considered an error for the key to not exist.
//
// r, err := db.Get("a")
// // string(r.Key) == "a"
//
// key can be either a byte slice or a string.
func (txn *Txn) Get(ctx context.Context, key interface{}) (KeyValue, error) {
b := txn.NewBatch()
b.Get(key)
return getOneRow(txn.Run(ctx, b), b)
}
// GetProto retrieves the value for a key and decodes the result as a proto
// message. If the key doesn't exist, the proto will simply be reset.
//
// key can be either a byte slice or a string.
func (txn *Txn) GetProto(ctx context.Context, key interface{}, msg proto.Message) error {
r, err := txn.Get(ctx, key)
if err != nil {
return err
}
return r.ValueProto(msg)
}
// Put sets the value for a key
//
// key can be either a byte slice or a string. value can be any key type, a
// proto.Message or any Go primitive type (bool, int, etc).
func (txn *Txn) Put(ctx context.Context, key, value interface{}) error {
b := txn.NewBatch()
b.Put(key, value)
return getOneErr(txn.Run(ctx, b), b)
}
// CPut conditionally sets the value for a key if the existing value is equal
// to expValue. To conditionally set a value only if there is no existing entry
// pass nil for expValue. Note that this must be an interface{}(nil), not a
// typed nil value (e.g. []byte(nil)).
//
// Returns an error if the existing value is not equal to expValue.
//
// key can be either a byte slice or a string. value can be any key type, a
// proto.Message or any Go primitive type (bool, int, etc).
func (txn *Txn) CPut(ctx context.Context, key, value, expValue interface{}) error {
b := txn.NewBatch()
b.CPut(key, value, expValue)
return getOneErr(txn.Run(ctx, b), b)
}
// InitPut sets the first value for a key to value. An error is reported if a
// value already exists for the key and it's not equal to the value passed in.
// If failOnTombstones is set to true, tombstones count as mismatched values
// and will cause a ConditionFailedError.
//
// key can be either a byte slice or a string. value can be any key type, a
// proto.Message or any Go primitive type (bool, int, etc). It is illegal to
// set value to nil.
func (txn *Txn) InitPut(ctx context.Context, key, value interface{}, failOnTombstones bool) error {
b := txn.NewBatch()
b.InitPut(key, value, failOnTombstones)
return getOneErr(txn.Run(ctx, b), b)
}
// Inc increments the integer value at key. If the key does not exist it will
// be created with an initial value of 0 which will then be incremented. If the
// key exists but was set using Put or CPut an error will be returned.
//
// The returned Result will contain a single row and Result.Err will indicate
// success or failure.
//
// key can be either a byte slice or a string.
func (txn *Txn) Inc(ctx context.Context, key interface{}, value int64) (KeyValue, error) {
b := txn.NewBatch()
b.Inc(key, value)
return getOneRow(txn.Run(ctx, b), b)
}
func (txn *Txn) scan(
ctx context.Context, begin, end interface{}, maxRows int64, isReverse bool,
) ([]KeyValue, error) {
b := txn.NewBatch()
if maxRows > 0 {
b.Header.MaxSpanRequestKeys = maxRows
}
if !isReverse {
b.Scan(begin, end)
} else {
b.ReverseScan(begin, end)
}
r, err := getOneResult(txn.Run(ctx, b), b)
return r.Rows, err
}
// Scan retrieves the rows between begin (inclusive) and end (exclusive) in
// ascending order.
//
// The returned []KeyValue will contain up to maxRows elements (or all results
// when zero is supplied).
//
// key can be either a byte slice or a string.
func (txn *Txn) Scan(
ctx context.Context, begin, end interface{}, maxRows int64,
) ([]KeyValue, error) {
return txn.scan(ctx, begin, end, maxRows, false)
}
// ReverseScan retrieves the rows between begin (inclusive) and end (exclusive)
// in descending order.
//
// The returned []KeyValue will contain up to maxRows elements (or all results
// when zero is supplied).
//
// key can be either a byte slice or a string.
func (txn *Txn) ReverseScan(
ctx context.Context, begin, end interface{}, maxRows int64,
) ([]KeyValue, error) {
return txn.scan(ctx, begin, end, maxRows, true)
}
// Del deletes one or more keys.
//
// key can be either a byte slice or a string.
func (txn *Txn) Del(ctx context.Context, keys ...interface{}) error {
b := txn.NewBatch()
b.Del(keys...)
return getOneErr(txn.Run(ctx, b), b)
}
// DelRange deletes the rows between begin (inclusive) and end (exclusive).
//
// The returned Result will contain 0 rows and Result.Err will indicate success
// or failure.
//
// key can be either a byte slice or a string.
func (txn *Txn) DelRange(ctx context.Context, begin, end interface{}) error {
b := txn.NewBatch()
b.DelRange(begin, end, false)
return getOneErr(txn.Run(ctx, b), b)
}
// Run executes the operations queued up within a batch. Before executing any
// of the operations the batch is first checked to see if there were any errors
// during its construction (e.g. failure to marshal a proto message).
//
// The operations within a batch are run in parallel and the order is
// non-deterministic. It is an unspecified behavior to modify and retrieve the
// same key within a batch.
//
// Upon completion, Batch.Results will contain the results for each
// operation. The order of the results matches the order the operations were
// added to the batch.
func (txn *Txn) Run(ctx context.Context, b *Batch) error {
tracing.AnnotateTrace()
defer tracing.AnnotateTrace()
if err := b.prepare(); err != nil {
return err
}
return sendAndFill(ctx, txn.Send, b)
}
func (txn *Txn) commit(ctx context.Context) error {
pErr := txn.sendEndTxnReq(ctx, true /* commit */, txn.deadline)
if pErr == nil {
for _, t := range txn.commitTriggers {
t()
}
}
return pErr.GoError()
}
// CleanupOnError cleans up the transaction as a result of an error.
func (txn *Txn) CleanupOnError(ctx context.Context, err error) {
if err == nil {
log.Fatal(ctx, "CleanupOnError called with nil error")
}
// This may race with a concurrent EndTxnRequests. That's fine though because
// we're just trying to clean up and will happily log the failed Rollback error
// if someone beat us.
if txn.status() == roachpb.PENDING {
// We don't need to send a rollback if no requests have been sent.
txn.mu.Lock()
if !txn.mu.active {
// Simulate the effect of sending a rollback.
txn.mu.finalized = true
// Let's set the status to ABORTED; unclear if this is necessary, but
// can't hurt.
txn.mu.Proto.Status = roachpb.ABORTED
txn.mu.Unlock()
return
}
txn.mu.Unlock()
if replyErr := txn.rollback(ctx); replyErr != nil {
if _, ok := replyErr.GetDetail().(*roachpb.TransactionStatusError); ok || txn.status() == roachpb.ABORTED {
log.Eventf(ctx, "failure aborting transaction: %s; abort caused by: %s", replyErr, err)
} else {
log.Warningf(ctx, "failure aborting transaction: %s; abort caused by: %s", replyErr, err)
}
}
}
}
// Commit is the same as CommitOrCleanup but will not attempt to clean
// up on failure. This can be used when the caller is prepared to do proper
// cleanup.
func (txn *Txn) Commit(ctx context.Context) error {
return txn.commit(ctx)
}
// CommitInBatch executes the operations queued up within a batch and
// commits the transaction. Explicitly committing a transaction is
// optional, but more efficient than relying on the implicit commit
// performed when the transaction function returns without error.
// The batch must be created by this transaction.
// If the command completes successfully, the txn is considered finalized. On
// error, no attempt is made to clean up the (possibly still pending)
// transaction.
func (txn *Txn) CommitInBatch(ctx context.Context, b *Batch) error {
if txn != b.txn {
return errors.Errorf("a batch b can only be committed by b.txn")
}
b.AddRawRequest(endTxnReq(true /* commit */, txn.deadline, txn.systemConfigTrigger))
return txn.Run(ctx, b)
}
// CommitOrCleanup sends an EndTransactionRequest with Commit=true.
// If that fails, an attempt to rollback is made.
// txn should not be used to send any more commands after this call.
func (txn *Txn) CommitOrCleanup(ctx context.Context) error {
err := txn.commit(ctx)
if err != nil {
txn.CleanupOnError(ctx, err)
}
if !txn.IsFinalized() {
log.Fatal(ctx, "Commit() failed to move txn to a final state")
}
return err
}
// UpdateDeadlineMaybe sets the transactions deadline to the lower of the
// current one (if any) and the passed value.
//
// The deadline cannot be lower than txn.OrigTimestamp.
func (txn *Txn) UpdateDeadlineMaybe(ctx context.Context, deadline hlc.Timestamp) bool {
if txn.deadline == nil || deadline.Less(*txn.deadline) {
if deadline.Less(txn.OrigTimestamp()) {
log.Fatalf(ctx, "deadline below txn.OrigTimestamp is nonsensical; "+
"txn has would have no change to commit. Deadline: %s, txn: %s",
deadline, txn.Proto())
}
txn.deadline = &deadline
return true
}
return false
}
// ResetDeadline resets the deadline.
func (txn *Txn) ResetDeadline() {
txn.deadline = nil
}
// Rollback sends an EndTransactionRequest with Commit=false.
// txn is considered finalized and cannot be used to send any more commands.
func (txn *Txn) Rollback(ctx context.Context) error {
return txn.rollback(ctx).GoError()
}
func (txn *Txn) rollback(ctx context.Context) *roachpb.Error {
log.VEventf(ctx, 2, "rolling back transaction")
return txn.sendEndTxnReq(ctx, false /* commit */, nil)
}
// AddCommitTrigger adds a closure to be executed on successful commit
// of the transaction.
func (txn *Txn) AddCommitTrigger(trigger func()) {
txn.commitTriggers = append(txn.commitTriggers, trigger)
}
// maybeFinishReadonly provides a fast-path for finishing a read-only
// transaction without going through the overhead of creating an
// EndTransactionRequest only to not send it.
//
// NB: The logic here must be kept in sync with the logic in txn.Send.
//
// TODO(andrei): Can we share this code with txn.Send?
func (txn *Txn) maybeFinishReadonly(commit bool, deadline *hlc.Timestamp) (bool, *roachpb.Error) {
txn.mu.Lock()
defer txn.mu.Unlock()
if txn.mu.Proto.Writing || txn.mu.writingTxnRecord {
return false, nil
}
txn.mu.finalized = true
// Check that read only transactions do not violate their deadline. This can NOT
// happen since the txn deadline is normally updated when it is about to expire
// or expired. We will just keep the code for safety (see TestReacquireLeaseOnRestart).
if deadline != nil && deadline.Less(txn.mu.Proto.Timestamp) {
// NB: The returned error contains a pointer to txn.mu.Proto, but that's ok
// because we can't have concurrent operations going on while
// committing/aborting.
//
// TODO(andrei): What is happening in this case?
//
// 1. our txn starts at ts1
// 2. catches uncertainty read error
// 3. updates its timestamp
// 4. new timestamp violates deadline
// 5. txn retries the read
// 6. commit fails - only thanks to this code path?
return false, roachpb.NewErrorWithTxn(roachpb.NewTransactionAbortedError(), &txn.mu.Proto)
}
if commit {
txn.mu.Proto.Status = roachpb.COMMITTED
} else {
txn.mu.Proto.Status = roachpb.ABORTED
}
return true, nil
}
func (txn *Txn) sendEndTxnReq(
ctx context.Context, commit bool, deadline *hlc.Timestamp,
) *roachpb.Error {
if ok, err := txn.maybeFinishReadonly(commit, deadline); ok || err != nil {
return err
}
var ba roachpb.BatchRequest
ba.Add(endTxnReq(commit, deadline, txn.systemConfigTrigger))
_, pErr := txn.Send(ctx, ba)
return pErr
}
func endTxnReq(commit bool, deadline *hlc.Timestamp, hasTrigger bool) roachpb.Request {
req := &roachpb.EndTransactionRequest{
Commit: commit,
Deadline: deadline,
}
if hasTrigger {
req.InternalCommitTrigger = &roachpb.InternalCommitTrigger{
ModifiedSpanTrigger: &roachpb.ModifiedSpanTrigger{
SystemConfigSpan: true,
},
}
}
return req
}
// TxnExecOptions controls how Exec() runs a transaction and the corresponding
// closure.
type TxnExecOptions struct {
// If set, the transaction is automatically aborted if the closure returns any
// error aside from recoverable internal errors, in which case the closure is
// retried. The retryable function should have no side effects which could
// cause problems in the event it must be run more than once.
// If not set, all errors cause the txn to be aborted.
AutoRetry bool
// If set, then the txn is automatically committed if no errors are
// encountered. If not set, committing or leaving open the txn is the
// responsibility of the client.
AutoCommit bool
}
// AutoCommitError wraps a non-retryable error coming from auto-commit.
type AutoCommitError struct {
cause error
}
func (e *AutoCommitError) Error() string {
return e.cause.Error()
}
// Exec executes fn in the context of a distributed transaction.
// Execution is controlled by opt (see comments in TxnExecOptions).
//
// opt is passed to fn, and it's valid for fn to modify opt as it sees
// fit during each execution attempt.
//
// It's valid for txn to be nil (meaning the txn has already aborted) if fn
// can handle that. This is useful for continuing transactions that have been
// aborted because of an error in a previous batch of statements in the hope
// that a ROLLBACK will reset the state. Neither opt.AutoRetry not opt.AutoCommit
// can be set in this case.
//
// It is not permitted to call Commit concurrently with any call to Exec. Since
// Exec with the AutoCommitflag is equivalent to an Exec possibly followed by a
// Commit, it must not be called concurrently with any other call to Exec or
// Commit.
//
// When this method returns, txn might be in any state; Exec does not attempt
// to clean up the transaction before returning an error. In case of
// TransactionAbortedError, txn is reset to a fresh transaction, ready to be
// used.
//
// TODO(andrei): The SQL Executor was the most complex user of this interface.
// It needed fine control by using TxnExecOptions. Now SQL no longer uses this
// interface, so it's time to see how it can be simplified. TxnExecOptions can
// probably go away, and so can AutoCommitError. The method should also be
// documented to not allow calls concurrent with any other txn use, so that the
// Commit() call inside it is clearly correct (as in, it won't run concurrently
// with other txn calls).
func (txn *Txn) Exec(
ctx context.Context, opt TxnExecOptions, fn func(context.Context, *Txn, *TxnExecOptions) error,
) (err error) {
// Run fn in a retry loop until we encounter a success or
// error condition this loop isn't capable of handling.
if txn == nil && (opt.AutoRetry || opt.AutoCommit) {
log.Fatal(ctx, "asked to retry or commit a txn that is already aborted")
}
for {
err = fn(ctx, txn, &opt)
if err == nil && opt.AutoCommit {
status := txn.status()
switch status {
case roachpb.ABORTED:
// TODO(andrei): Until 7881 is fixed.
log.Errorf(ctx, "#7881: no err but aborted txn proto. opt: %+v, txn: %+v",
opt, txn)
case roachpb.PENDING:
// fn succeeded, but didn't commit.
err = txn.Commit(ctx)
log.Eventf(ctx, "client.Txn did AutoCommit. err: %v\ntxn: %+v", err, txn.Proto())
if err != nil {
if _, retryable := err.(*roachpb.HandledRetryableTxnError); !retryable {
// We can't retry, so let the caller know we tried to
// autocommit.
err = &AutoCommitError{cause: err}
}
}
}
}
if _, ok := err.(*roachpb.UnhandledRetryableError); ok {
// We sent transactional requests, so the TxnCoordSender was supposed to
// turn retryable errors into HandledRetryableTxnError.
log.Fatalf(ctx, "unexpected UnhandledRetryableError at the txn.Exec level: %s", err)
}
retErr, retryable := err.(*roachpb.HandledRetryableTxnError)
if retryable && !txn.IsRetryableErrMeantForTxn(*retErr) {
// Make sure the txn record that err carries is for this txn.
// If it's not, we terminate the "retryable" character of the error. We
// might get a HandledRetryableTxnError if the closure ran another
// transaction internally and let the error propagate upwards.
return errors.Wrapf(
retErr,
"retryable error from another txn. Current txn ID: %v", txn.Proto().ID)
}
if !opt.AutoRetry || !retryable {
break
}
txn.PrepareForRetry(ctx, err)
}
return err
}
// PrepareForRetry needs to be called before an retry to perform some
// book-keeping.
//
// TODO(andrei): I think this is called in the wrong place. See #18170.
func (txn *Txn) PrepareForRetry(ctx context.Context, err error) {
txn.commitTriggers = nil
log.VEventf(ctx, 2, "automatically retrying transaction: %s because of error: %s",
txn.DebugName(), err)
}
// IsRetryableErrMeantForTxn returns true if err is a retryable
// error meant to restart this client transaction.
func (txn *Txn) IsRetryableErrMeantForTxn(retryErr roachpb.HandledRetryableTxnError) bool {
txn.mu.Lock()
defer txn.mu.Unlock()
return txn.isRetryableErrMeantForTxnLocked(retryErr)
}
func (txn *Txn) isRetryableErrMeantForTxnLocked(retryErr roachpb.HandledRetryableTxnError) bool {
errTxnID := retryErr.TxnID
// Make sure the txn record that err carries is for this txn.
// First check if the error was meant for a previous incarnation
// of the transaction.
if _, ok := txn.mu.previousIDs[errTxnID]; ok {
return true
}
// If not, make sure it was meant for this transaction.
return errTxnID == txn.mu.Proto.ID
}
// Send runs the specified calls synchronously in a single batch and
// returns any errors. If the transaction is read-only or has already
// been successfully committed or aborted, a potential trailing
// EndTransaction call is silently dropped, allowing the caller to
// always commit or clean-up explicitly even when that may not be
// required (or even erroneous). Returns (nil, nil) for an empty batch.
func (txn *Txn) Send(
ctx context.Context, ba roachpb.BatchRequest,
) (*roachpb.BatchResponse, *roachpb.Error) {
// It doesn't make sense to use inconsistent reads in a transaction. However,
// we still need to accept it as a parameter for this to compile.
if ba.ReadConsistency != roachpb.CONSISTENT {
return nil, roachpb.NewErrorf("cannot use %s ReadConsistency in txn",
ba.ReadConsistency)
}
// Fill in the GatewayNodeID on the batch if the txn knows it.
// NOTE(andrei): It seems a bit ugly that we're filling in the batches here as
// opposed to the point where the requests are being created, but
// unfortunately requests are being created in many ways and this was the best
// place I found to set this field.
if txn.gatewayNodeID != 0 {
ba.Header.GatewayNodeID = txn.gatewayNodeID
}
lastIndex := len(ba.Requests) - 1
if lastIndex < 0 {
return nil, nil
}
firstWriteIdx, pErr := firstWriteIndex(ba)
if pErr != nil {
return nil, pErr
}
haveTxnWrite := firstWriteIdx != -1
endTxnRequest, haveEndTxn := ba.Requests[lastIndex].GetInner().(*roachpb.EndTransactionRequest)
var needBeginTxn, elideEndTxn bool
lockedPrelude := func() *roachpb.Error {
txn.mu.Lock()
defer txn.mu.Unlock()
if txn.mu.Proto.Status != roachpb.PENDING || txn.mu.finalized {
return roachpb.NewErrorf(
"attempting to use transaction with wrong status or finalized: %s %v",
txn.mu.Proto.Status, txn.mu.finalized)
}
// For testing purposes, txn.UserPriority can be a negative value (see
// roachpb.MakePriority).
if txn.mu.UserPriority != 0 {
ba.UserPriority = txn.mu.UserPriority
}
if !txn.mu.active {
user := roachpb.MakePriority(ba.UserPriority)
if txn.mu.Proto.Priority < user {
txn.mu.Proto.Priority = user
}
txn.mu.active = true
}
needBeginTxn = !(txn.mu.Proto.Writing || txn.mu.writingTxnRecord) && haveTxnWrite
needEndTxn := txn.mu.Proto.Writing || txn.mu.writingTxnRecord || haveTxnWrite
elideEndTxn = haveEndTxn && !needEndTxn
// If we're not yet writing in this txn, but intend to, insert a
// begin transaction request before the first write command and update
// transaction state accordingly.
if needBeginTxn {
// Set txn key based on the key of the first transactional write if
// not already set. If the transaction already has a key (we're in a
// restart), make sure we keep the anchor key the same.
if len(txn.mu.Proto.Key) == 0 {
txnAnchorKey := txn.mu.txnAnchorKey
if len(txnAnchorKey) == 0 {
txnAnchorKey = ba.Requests[0].GetInner().Header().Key
}
txn.mu.Proto.Key = txnAnchorKey
}
// Set the key in the begin transaction request to the txn's anchor key.
bt := &roachpb.BeginTransactionRequest{
Span: roachpb.Span{
Key: txn.mu.Proto.Key,
},
}
// Inject the new request before position firstWriteIdx, taking
// care to avoid unnecessary allocations.
oldRequests := ba.Requests
ba.Requests = make([]roachpb.RequestUnion, len(ba.Requests)+1)
copy(ba.Requests, oldRequests[:firstWriteIdx])
ba.Requests[firstWriteIdx].MustSetInner(bt)
copy(ba.Requests[firstWriteIdx+1:], oldRequests[firstWriteIdx:])
// We're going to be writing the transaction record by sending the
// begin transaction request.
txn.mu.writingTxnRecord = true
}
if elideEndTxn {
ba.Requests = ba.Requests[:lastIndex]
}
// Increment the statement count sent through this transaction.
txn.mu.commandCount += len(ba.Requests)
// Clone the Txn's Proto so that future modifications can be made without
// worrying about synchronization.
newTxn := txn.mu.Proto.Clone()
ba.Txn = &newTxn
return nil
}
if pErr := lockedPrelude(); pErr != nil {
return nil, pErr
}
// Send call through the DB.
requestTxnID := ba.Txn.ID
br, pErr := txn.db.send(ctx, ba)
// Lock for the entire response postlude.
txn.mu.Lock()
defer txn.mu.Unlock()
// If we inserted a begin transaction request, remove it here. We also
// unset the flag writingTxnRecord flag in case another ever needs to
// be sent again (for instance, if we're aborted and need to restart).
if needBeginTxn {
if br != nil && br.Responses != nil {
br.Responses = append(br.Responses[:firstWriteIdx], br.Responses[firstWriteIdx+1:]...)
}
// Handle case where inserted begin txn confused an indexed error.
if pErr != nil && pErr.Index != nil {
idx := pErr.Index.Index
if idx == int32(firstWriteIdx) {
// An error was encountered on begin txn; disallow the indexing.
pErr.Index = nil
} else if idx > int32(firstWriteIdx) {
// An error was encountered after begin txn; decrement index.
pErr.SetErrorIndex(idx - 1)
}
}
txn.mu.writingTxnRecord = false
}
if haveEndTxn {
if pErr == nil || !endTxnRequest.Commit {
// Finalize the transaction if either we sent a successful commit
// EndTxnRequest, or sent a rollback EndTxnRequest (regardless of
// if it succeeded).
txn.mu.finalized = true
}
}
if pErr != nil {
if log.V(1) {
log.Infof(ctx, "failed batch: %s", pErr)
}
if retryErr, ok := pErr.GetDetail().(*roachpb.HandledRetryableTxnError); ok {
txn.updateStateOnRetryableErrLocked(ctx, *retryErr, requestTxnID)
}
if pErr.TransactionRestart != roachpb.TransactionRestart_NONE &&
!txn.acceptUnhandledRetryableErrors {
log.Fatalf(ctx,
"unexpected retryable error at the client.Txn level: (%T) %s",
pErr.GetDetail(), pErr)
}
return nil, pErr
}
if br != nil {
if br.Error != nil {
panic(roachpb.ErrorUnexpectedlySet(txn.db.sender, br))
}
if br.Txn != nil && br.Txn.ID != txn.mu.Proto.ID {
return nil, roachpb.NewError(&roachpb.TxnPrevAttemptError{})
}
if len(br.CollectedSpans) != 0 {
span := opentracing.SpanFromContext(ctx)
if span == nil {
return nil, roachpb.NewErrorf(
"trying to ingest remote spans but there is no recording span set up",
)
}
if err := tracing.ImportRemoteSpans(span, br.CollectedSpans); err != nil {
return nil, roachpb.NewErrorf("error ingesting remote spans: %s", err)
}
}
// Only successful requests can carry an updated Txn in their response
// header. Some errors (e.g. a restart) have a Txn attached to them as
// well; these errors have been handled above.
txn.mu.Proto.Update(br.Txn)
}
if elideEndTxn {
// Check that read only transactions do not violate their deadline. This can NOT
// happen since the txn deadline is normally updated when it is about to expire
// or expired. We will just keep the code for safety (see TestReacquireLeaseOnRestart).
if endTxnRequest.Deadline != nil {
if endTxnRequest.Deadline.Less(txn.mu.Proto.Timestamp) {
// NB: The returned error contains a pointer to txn.mu.Proto, but
// that's ok because we can't have concurrent operations going on while
// committing/aborting.
return nil, roachpb.NewErrorWithTxn(roachpb.NewTransactionAbortedError(), &txn.mu.Proto)
}
}
// This normally happens on the server and sent back in response
// headers, but this transaction was optimized away. The caller may
// still inspect the transaction struct, so we manually update it
// here to emulate a true transaction.
if endTxnRequest.Commit {
txn.mu.Proto.Status = roachpb.COMMITTED
} else {
txn.mu.Proto.Status = roachpb.ABORTED
}
}
return br, nil
}
// firstWriteIndex returns the index of the first transactional write in the
// BatchRequest. Returns -1 if the batch has not intention to write. It also
// verifies that if an EndTransactionRequest is included, then it is the last
// request in the batch.
func firstWriteIndex(ba roachpb.BatchRequest) (int, *roachpb.Error) {
firstWriteIdx := -1
for i, ru := range ba.Requests {
args := ru.GetInner()
if i < len(ba.Requests)-1 /* if not last*/ {
if _, ok := args.(*roachpb.EndTransactionRequest); ok {
return -1, roachpb.NewErrorf("%s sent as non-terminal call", args.Method())
}
}
if roachpb.IsTransactionWrite(args) {
if firstWriteIdx == -1 {
firstWriteIdx = i
}
}
}
return firstWriteIdx, nil
}
// UpdateStateOnRemoteRetryableErr updates the Txn, and the Transaction proto
// inside it, in response to an error encountered when running a request through
// the txn. If the error is not a RetryableTxnError, then this is a no-op. For a
// retryable error, the Transaction proto is either initialized with the updated
// proto from the error, or a new Transaction proto is initialized.
func (txn *Txn) UpdateStateOnRemoteRetryableErr(ctx context.Context, pErr roachpb.Error) {
txn.mu.Lock()
defer txn.mu.Unlock()
if pErr.TransactionRestart == roachpb.TransactionRestart_NONE {
log.Fatalf(ctx, "unexpected non-retryable error: %s", pErr)
}
if pErr.GetTxn() == nil {
// DistSQL requests (like all SQL requests) are always supposed to be done
// in a transaction.
log.Fatalf(ctx, "unexpected retryable error with no txn ran through DistSQL: %s", pErr)
}
// Assert that the TxnCoordSender doesn't have any state for this transaction
// (and it shouldn't, since DistSQL isn't supposed to do any works in
// transaction that had performed writes and hence started being tracked). If
// the TxnCoordSender were to have state, it'd be a bad thing that we're not
// updating it.
txnID := pErr.GetTxn().ID
if _, ok := txn.db.GetSender().(SenderWithDistSQLBackdoor).GetTxnState(txnID); ok {
log.Fatalf(ctx, "unexpected state in TxnCoordSender for transaction in error: %s", pErr)
}
// Emulate the processing that the TxnCoordSender would have done on this
// error.
newTxn := roachpb.PrepareTransactionForRetry(ctx, &pErr, txn.mu.UserPriority, txn.db.clock)
newErr := roachpb.NewHandledRetryableTxnError(pErr.Message, pErr.GetTxn().ID, newTxn)
txn.updateStateOnRetryableErrLocked(
ctx, *newErr,
// We're passing the current ID as the "request"'s. In doing so, we're
// assuming that the Txn hasn't changed asynchronously since we started
// executing the query; we're relying on DistSQL queries not being
// executed concurrently with anything else using this txn.
txn.mu.Proto.ID)
}
// updateStateOnRetryableErrLocked updates the Transaction proto inside txn.
//
// requestTxnID identifies the state of the transaction at the time when the
// request that generated retryErr was sent. It is used to see if the information
// in the error is obsolete by now.
//
// This method is safe to call repeatedly for requests from the same txn epoch.
// The first such update will move the Transaction forward (either create a new
// one or increment the epoch), and next calls will be no-ops.
func (txn *Txn) updateStateOnRetryableErrLocked(
ctx context.Context, retryErr roachpb.HandledRetryableTxnError, requestTxnID uuid.UUID,
) {
if requestTxnID != retryErr.TxnID {
// KV should not return errors for transactions other than the one that sent
// the request.
log.Fatalf(ctx, "retryable error for the wrong txn. "+
"requestTxnID: %s, retryErr.TxnID: %s. retryErr: %s",
requestTxnID, retryErr.TxnID, retryErr)
}
newTxn := &retryErr.Transaction
if requestTxnID != txn.mu.Proto.ID {
// We were already aborted, so ignore the retry error for the previous
// Txn incarnation.
return
}
// Reset the statement count as this is a retryable txn error.
txn.mu.commandCount = 0
abortErr := requestTxnID != newTxn.ID
if abortErr {
// This means that the cause was a TransactionAbortedError;
// we've created a new Transaction that we're about to start using, so we
// save the old transaction ID so that concurrent requests or delayed
// responses that that throw errors know that these errors were sent to
// the correct transaction, even once the proto is reset.
txn.recordPreviousTxnIDLocked(txn.mu.Proto.ID)
// Overwrite the transaction proto with the one to be used for the next
// attempt. The txn inside pErr was correctly prepared for this by
// TxnCoordSender.
txn.mu.Proto = *newTxn
} else {
// Update the transaction proto with the one to be used for the next
// attempt. The txn inside pErr was correctly prepared for this by
// TxnCoordSender. However, we can't blindly replace the proto, because
// multiple retryable errors might come back here out-of-order. Instead,
// we rely on the associativity of Transaction.Update to sort out this
// lack of ordering guarantee.
txn.mu.Proto.Update(newTxn)
}
}
func (txn *Txn) recordPreviousTxnIDLocked(prevTxnID uuid.UUID) {
if txn.mu.previousIDs == nil {
txn.mu.previousIDs = make(map[uuid.UUID]struct{})
}
txn.mu.previousIDs[txn.mu.Proto.ID] = struct{}{}
}
// SetFixedTimestamp makes the transaction run in an unusual way, at a "fixed
// timestamp": Timestamp and OrigTimestamp are set to ts, there's no clock
// uncertainty, and the txn's deadline is set to ts such that the transaction
// can't be pushed to a different timestamp.
//
// This is used to support historical queries (AS OF SYSTEM TIME queries and
// backups). This method must be called on every transaction retry (but note
// that retries should be rare for read-only queries with no clock uncertainty).
func (txn *Txn) SetFixedTimestamp(ctx context.Context, ts hlc.Timestamp) {
txn.mu.Lock()
txn.mu.Proto.Timestamp = ts
txn.mu.Proto.OrigTimestamp = ts
txn.mu.Proto.MaxTimestamp = ts
txn.mu.Unlock()
// The deadline-checking code checks that the `Timestamp` field of the proto
// hasn't exceeded the deadline. Since we set the Timestamp field each retry,
// it won't ever exceed the deadline, and thus setting the deadline here is
// not strictly needed. However, it doesn't do anything incorrect and it will
// possibly find problems if things change in the future, so it is left in.
txn.UpdateDeadlineMaybe(ctx, ts)
}
// GenerateForcedRetryableError returns a HandledRetryableTxnError that will
// cause the txn to be retried.
func (txn *Txn) GenerateForcedRetryableError(msg string) error {
return roachpb.NewHandledRetryableTxnError(
msg,
txn.ID(),
roachpb.MakeTransaction(
txn.DebugName(),
nil, // baseKey
txn.UserPriority(),
txn.Isolation(),
txn.db.clock.Now(),
txn.db.clock.MaxOffset().Nanoseconds(),
))
}
Loading...
马建仓 AI 助手
尝试更多
代码解读
代码找茬
代码优化
1
https://gitee.com/mirrors_cockroachdb/cockroach.git
git@gitee.com:mirrors_cockroachdb/cockroach.git
mirrors_cockroachdb
cockroach
cockroach
v1.1.1

搜索帮助