2019-05-23 21:05:29 +03:00
|
|
|
package routing
|
|
|
|
|
|
|
|
import (
|
2020-04-01 01:13:26 +03:00
|
|
|
"fmt"
|
|
|
|
"sync"
|
2019-05-23 21:05:29 +03:00
|
|
|
"time"
|
|
|
|
|
|
|
|
"github.com/davecgh/go-spew/spew"
|
|
|
|
sphinx "github.com/lightningnetwork/lightning-onion"
|
2019-05-23 21:05:29 +03:00
|
|
|
"github.com/lightningnetwork/lnd/channeldb"
|
2019-05-23 21:05:29 +03:00
|
|
|
"github.com/lightningnetwork/lnd/htlcswitch"
|
2020-04-01 01:13:22 +03:00
|
|
|
"github.com/lightningnetwork/lnd/lntypes"
|
2019-05-23 21:05:29 +03:00
|
|
|
"github.com/lightningnetwork/lnd/lnwire"
|
|
|
|
"github.com/lightningnetwork/lnd/routing/route"
|
2021-04-12 16:21:59 +03:00
|
|
|
"github.com/lightningnetwork/lnd/routing/shards"
|
2019-05-23 21:05:29 +03:00
|
|
|
)
|
|
|
|
|
2020-11-24 16:15:12 +03:00
|
|
|
// errShardHandlerExiting is returned from the shardHandler when it exits.
|
|
|
|
var errShardHandlerExiting = fmt.Errorf("shard handler exiting")
|
|
|
|
|
2019-05-23 21:05:29 +03:00
|
|
|
// paymentLifecycle holds all information about the current state of a payment
|
|
|
|
// needed to resume if from any point.
|
|
|
|
type paymentLifecycle struct {
|
2020-04-01 01:13:22 +03:00
|
|
|
router *ChannelRouter
|
2020-04-01 01:13:22 +03:00
|
|
|
totalAmount lnwire.MilliSatoshi
|
|
|
|
feeLimit lnwire.MilliSatoshi
|
2021-03-31 13:23:08 +03:00
|
|
|
identifier lntypes.Hash
|
2020-04-01 01:13:22 +03:00
|
|
|
paySession PaymentSession
|
2021-04-12 16:21:59 +03:00
|
|
|
shardTracker shards.ShardTracker
|
2020-04-01 01:13:22 +03:00
|
|
|
timeoutChan <-chan time.Time
|
|
|
|
currentHeight int32
|
2019-05-23 21:05:29 +03:00
|
|
|
}
|
|
|
|
|
2020-04-01 01:13:26 +03:00
|
|
|
// payemntState holds a number of key insights learned from a given MPPayment
|
|
|
|
// that we use to determine what to do on each payment loop iteration.
|
|
|
|
type paymentState struct {
|
|
|
|
numShardsInFlight int
|
|
|
|
remainingAmt lnwire.MilliSatoshi
|
|
|
|
remainingFees lnwire.MilliSatoshi
|
|
|
|
terminate bool
|
|
|
|
}
|
|
|
|
|
|
|
|
// paymentState uses the passed payment to find the latest information we need
|
|
|
|
// to act on every iteration of the payment loop.
|
|
|
|
func (p *paymentLifecycle) paymentState(payment *channeldb.MPPayment) (
|
|
|
|
*paymentState, error) {
|
|
|
|
|
|
|
|
// Fetch the total amount and fees that has already been sent in
|
|
|
|
// settled and still in-flight shards.
|
|
|
|
sentAmt, fees := payment.SentAmt()
|
|
|
|
|
|
|
|
// Sanity check we haven't sent a value larger than the payment amount.
|
|
|
|
if sentAmt > p.totalAmount {
|
|
|
|
return nil, fmt.Errorf("amount sent %v exceeds "+
|
|
|
|
"total amount %v", sentAmt, p.totalAmount)
|
|
|
|
}
|
|
|
|
|
|
|
|
// We'll subtract the used fee from our fee budget, but allow the fees
|
|
|
|
// of the already sent shards to exceed our budget (can happen after
|
|
|
|
// restarts).
|
|
|
|
feeBudget := p.feeLimit
|
|
|
|
if fees <= feeBudget {
|
|
|
|
feeBudget -= fees
|
|
|
|
} else {
|
|
|
|
feeBudget = 0
|
|
|
|
}
|
|
|
|
|
|
|
|
// Get any terminal info for this payment.
|
|
|
|
settle, failure := payment.TerminalInfo()
|
|
|
|
|
|
|
|
// If either an HTLC settled, or the payment has a payment level
|
|
|
|
// failure recorded, it means we should terminate the moment all shards
|
|
|
|
// have returned with a result.
|
|
|
|
terminate := settle != nil || failure != nil
|
|
|
|
|
|
|
|
activeShards := payment.InFlightHTLCs()
|
|
|
|
return &paymentState{
|
|
|
|
numShardsInFlight: len(activeShards),
|
|
|
|
remainingAmt: p.totalAmount - sentAmt,
|
|
|
|
remainingFees: feeBudget,
|
|
|
|
terminate: terminate,
|
|
|
|
}, nil
|
|
|
|
}
|
|
|
|
|
2019-05-23 21:05:29 +03:00
|
|
|
// resumePayment resumes the paymentLifecycle from the current state.
|
|
|
|
func (p *paymentLifecycle) resumePayment() ([32]byte, *route.Route, error) {
|
2020-04-01 01:13:24 +03:00
|
|
|
shardHandler := &shardHandler{
|
2021-04-12 16:21:59 +03:00
|
|
|
router: p.router,
|
2021-03-31 13:23:08 +03:00
|
|
|
identifier: p.identifier,
|
2021-04-12 16:21:59 +03:00
|
|
|
shardTracker: p.shardTracker,
|
|
|
|
shardErrors: make(chan error),
|
|
|
|
quit: make(chan struct{}),
|
2020-04-01 01:13:24 +03:00
|
|
|
}
|
|
|
|
|
2020-04-01 01:13:26 +03:00
|
|
|
// When the payment lifecycle loop exits, we make sure to signal any
|
|
|
|
// sub goroutine of the shardHandler to exit, then wait for them to
|
|
|
|
// return.
|
|
|
|
defer shardHandler.stop()
|
|
|
|
|
|
|
|
// If we had any existing attempts outstanding, we'll start by spinning
|
|
|
|
// up goroutines that'll collect their results and deliver them to the
|
|
|
|
// lifecycle loop below.
|
2020-04-01 01:13:25 +03:00
|
|
|
payment, err := p.router.cfg.Control.FetchPayment(
|
2021-03-31 13:23:08 +03:00
|
|
|
p.identifier,
|
2020-04-01 01:13:25 +03:00
|
|
|
)
|
|
|
|
if err != nil {
|
|
|
|
return [32]byte{}, nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
for _, a := range payment.InFlightHTLCs() {
|
|
|
|
a := a
|
|
|
|
|
2021-03-31 13:23:08 +03:00
|
|
|
log.Infof("Resuming payment shard %v for payment %v",
|
|
|
|
a.AttemptID, p.identifier)
|
2020-04-01 01:13:26 +03:00
|
|
|
|
|
|
|
shardHandler.collectResultAsync(&a.HTLCAttemptInfo)
|
2020-04-01 01:13:25 +03:00
|
|
|
}
|
|
|
|
|
2019-05-23 21:05:29 +03:00
|
|
|
// We'll continue until either our payment succeeds, or we encounter a
|
|
|
|
// critical error during path finding.
|
2021-04-23 09:51:07 +03:00
|
|
|
lifecycle:
|
2019-05-23 21:05:29 +03:00
|
|
|
for {
|
2020-04-01 01:13:26 +03:00
|
|
|
// Start by quickly checking if there are any outcomes already
|
|
|
|
// available to handle before we reevaluate our state.
|
|
|
|
if err := shardHandler.checkShards(); err != nil {
|
|
|
|
return [32]byte{}, nil, err
|
|
|
|
}
|
|
|
|
|
2020-04-01 01:13:24 +03:00
|
|
|
// We start every iteration by fetching the lastest state of
|
|
|
|
// the payment from the ControlTower. This ensures that we will
|
|
|
|
// act on the latest available information, whether we are
|
|
|
|
// resuming an existing payment or just sent a new attempt.
|
|
|
|
payment, err := p.router.cfg.Control.FetchPayment(
|
2021-03-31 13:23:08 +03:00
|
|
|
p.identifier,
|
2020-04-01 01:13:24 +03:00
|
|
|
)
|
|
|
|
if err != nil {
|
|
|
|
return [32]byte{}, nil, err
|
|
|
|
}
|
|
|
|
|
2020-04-01 01:13:26 +03:00
|
|
|
// Using this latest state of the payment, calculate
|
|
|
|
// information about our active shards and terminal conditions.
|
|
|
|
state, err := p.paymentState(payment)
|
|
|
|
if err != nil {
|
|
|
|
return [32]byte{}, nil, err
|
2020-04-01 01:13:24 +03:00
|
|
|
}
|
|
|
|
|
2020-04-01 01:13:26 +03:00
|
|
|
log.Debugf("Payment %v in state terminate=%v, "+
|
|
|
|
"active_shards=%v, rem_value=%v, fee_limit=%v",
|
2021-03-31 13:23:08 +03:00
|
|
|
p.identifier, state.terminate, state.numShardsInFlight,
|
2020-04-01 01:13:26 +03:00
|
|
|
state.remainingAmt, state.remainingFees)
|
|
|
|
|
|
|
|
switch {
|
|
|
|
|
|
|
|
// We have a terminal condition and no active shards, we are
|
|
|
|
// ready to exit.
|
|
|
|
case state.terminate && state.numShardsInFlight == 0:
|
|
|
|
// Find the first successful shard and return
|
|
|
|
// the preimage and route.
|
|
|
|
for _, a := range payment.HTLCs {
|
|
|
|
if a.Settle != nil {
|
|
|
|
return a.Settle.Preimage, &a.Route, nil
|
|
|
|
}
|
|
|
|
}
|
2019-05-23 21:05:29 +03:00
|
|
|
|
2020-04-01 01:13:26 +03:00
|
|
|
// Payment failed.
|
2020-04-01 01:13:25 +03:00
|
|
|
return [32]byte{}, nil, *payment.FailureReason
|
|
|
|
|
2020-04-01 01:13:26 +03:00
|
|
|
// If we either reached a terminal error condition (but had
|
|
|
|
// active shards still) or there is no remaining value to send,
|
|
|
|
// we'll wait for a shard outcome.
|
|
|
|
case state.terminate || state.remainingAmt == 0:
|
|
|
|
// We still have outstanding shards, so wait for a new
|
|
|
|
// outcome to be available before re-evaluating our
|
|
|
|
// state.
|
|
|
|
if err := shardHandler.waitForShard(); err != nil {
|
|
|
|
return [32]byte{}, nil, err
|
|
|
|
}
|
2021-04-23 09:51:07 +03:00
|
|
|
continue lifecycle
|
2020-04-01 01:13:26 +03:00
|
|
|
}
|
2020-04-01 01:13:23 +03:00
|
|
|
|
2020-04-01 01:13:26 +03:00
|
|
|
// Before we attempt any new shard, we'll check to see if
|
|
|
|
// either we've gone past the payment attempt timeout, or the
|
|
|
|
// router is exiting. In either case, we'll stop this payment
|
|
|
|
// attempt short. If a timeout is not applicable, timeoutChan
|
|
|
|
// will be nil.
|
|
|
|
select {
|
|
|
|
case <-p.timeoutChan:
|
|
|
|
log.Warnf("payment attempt not completed before " +
|
|
|
|
"timeout")
|
|
|
|
|
|
|
|
// By marking the payment failed with the control
|
|
|
|
// tower, no further shards will be launched and we'll
|
|
|
|
// return with an error the moment all active shards
|
|
|
|
// have finished.
|
|
|
|
saveErr := p.router.cfg.Control.Fail(
|
2021-03-31 13:23:08 +03:00
|
|
|
p.identifier, channeldb.FailureReasonTimeout,
|
2020-04-01 01:13:26 +03:00
|
|
|
)
|
|
|
|
if saveErr != nil {
|
|
|
|
return [32]byte{}, nil, saveErr
|
|
|
|
}
|
2020-04-01 01:13:23 +03:00
|
|
|
|
2021-04-23 09:51:07 +03:00
|
|
|
continue lifecycle
|
2020-04-01 01:13:23 +03:00
|
|
|
|
2020-04-01 01:13:26 +03:00
|
|
|
case <-p.router.quit:
|
|
|
|
return [32]byte{}, nil, ErrRouterShuttingDown
|
2020-04-01 01:13:23 +03:00
|
|
|
|
2020-04-01 01:13:26 +03:00
|
|
|
// Fall through if we haven't hit our time limit.
|
|
|
|
default:
|
|
|
|
}
|
2020-04-01 01:13:23 +03:00
|
|
|
|
2020-04-01 01:13:26 +03:00
|
|
|
// Create a new payment attempt from the given payment session.
|
|
|
|
rt, err := p.paySession.RequestRoute(
|
|
|
|
state.remainingAmt, state.remainingFees,
|
|
|
|
uint32(state.numShardsInFlight), uint32(p.currentHeight),
|
|
|
|
)
|
|
|
|
if err != nil {
|
2020-04-06 13:18:50 +03:00
|
|
|
log.Warnf("Failed to find route for payment %v: %v",
|
2021-03-31 13:23:08 +03:00
|
|
|
p.identifier, err)
|
2020-04-01 01:13:26 +03:00
|
|
|
|
2020-04-01 01:13:27 +03:00
|
|
|
routeErr, ok := err.(noRouteError)
|
|
|
|
if !ok {
|
|
|
|
return [32]byte{}, nil, err
|
|
|
|
}
|
|
|
|
|
2020-04-01 01:13:26 +03:00
|
|
|
// There is no route to try, and we have no active
|
|
|
|
// shards. This means that there is no way for us to
|
|
|
|
// send the payment, so mark it failed with no route.
|
|
|
|
if state.numShardsInFlight == 0 {
|
2020-04-01 01:13:27 +03:00
|
|
|
failureCode := routeErr.FailureReason()
|
2020-04-01 01:13:26 +03:00
|
|
|
log.Debugf("Marking payment %v permanently "+
|
|
|
|
"failed with no route: %v",
|
2021-03-31 13:23:08 +03:00
|
|
|
p.identifier, failureCode)
|
2020-04-01 01:13:23 +03:00
|
|
|
|
|
|
|
saveErr := p.router.cfg.Control.Fail(
|
2021-03-31 13:23:08 +03:00
|
|
|
p.identifier, failureCode,
|
2020-04-01 01:13:23 +03:00
|
|
|
)
|
|
|
|
if saveErr != nil {
|
|
|
|
return [32]byte{}, nil, saveErr
|
|
|
|
}
|
|
|
|
|
2021-04-23 09:51:07 +03:00
|
|
|
continue lifecycle
|
2020-04-01 01:13:23 +03:00
|
|
|
}
|
|
|
|
|
2020-04-01 01:13:26 +03:00
|
|
|
// We still have active shards, we'll wait for an
|
|
|
|
// outcome to be available before retrying.
|
|
|
|
if err := shardHandler.waitForShard(); err != nil {
|
2019-05-23 21:05:29 +03:00
|
|
|
return [32]byte{}, nil, err
|
2019-05-23 21:05:29 +03:00
|
|
|
}
|
2021-04-23 09:51:07 +03:00
|
|
|
continue lifecycle
|
2020-04-01 01:13:26 +03:00
|
|
|
}
|
2020-04-01 01:13:23 +03:00
|
|
|
|
2021-04-12 16:21:59 +03:00
|
|
|
// If this route will consume the last remeining amount to send
|
|
|
|
// to the receiver, this will be our last shard (for now).
|
|
|
|
lastShard := rt.ReceiverAmt() == state.remainingAmt
|
|
|
|
|
2020-04-01 01:13:26 +03:00
|
|
|
// We found a route to try, launch a new shard.
|
2021-04-12 16:21:59 +03:00
|
|
|
attempt, outcome, err := shardHandler.launchShard(rt, lastShard)
|
2021-04-23 09:39:46 +03:00
|
|
|
switch {
|
|
|
|
// We may get a terminal error if we've processed a shard with
|
|
|
|
// a terminal state (settled or permanent failure), while we
|
|
|
|
// were pathfinding. We know we're in a terminal state here,
|
|
|
|
// so we can continue and wait for our last shards to return.
|
|
|
|
case err == channeldb.ErrPaymentTerminal:
|
2021-03-31 13:23:08 +03:00
|
|
|
log.Infof("Payment %v in terminal state, abandoning "+
|
|
|
|
"shard", p.identifier)
|
2021-04-23 09:39:46 +03:00
|
|
|
|
2021-04-23 09:51:07 +03:00
|
|
|
continue lifecycle
|
2021-04-23 09:39:46 +03:00
|
|
|
|
|
|
|
case err != nil:
|
2020-04-01 01:13:26 +03:00
|
|
|
return [32]byte{}, nil, err
|
|
|
|
}
|
2019-05-23 21:05:29 +03:00
|
|
|
|
2020-04-01 01:13:26 +03:00
|
|
|
// If we encountered a non-critical error when launching the
|
|
|
|
// shard, handle it.
|
|
|
|
if outcome.err != nil {
|
|
|
|
log.Warnf("Failed to launch shard %v for "+
|
|
|
|
"payment %v: %v", attempt.AttemptID,
|
2021-03-31 13:23:08 +03:00
|
|
|
p.identifier, outcome.err)
|
2020-04-01 01:13:26 +03:00
|
|
|
|
|
|
|
// We must inspect the error to know whether it was
|
|
|
|
// critical or not, to decide whether we should
|
|
|
|
// continue trying.
|
|
|
|
err := shardHandler.handleSendError(
|
|
|
|
attempt, outcome.err,
|
|
|
|
)
|
2020-04-01 01:13:24 +03:00
|
|
|
if err != nil {
|
2019-05-23 21:05:29 +03:00
|
|
|
return [32]byte{}, nil, err
|
2019-05-23 21:05:29 +03:00
|
|
|
}
|
|
|
|
|
2020-04-01 01:13:26 +03:00
|
|
|
// Error was handled successfully, continue to make a
|
|
|
|
// new attempt.
|
2021-04-23 09:51:07 +03:00
|
|
|
continue lifecycle
|
2019-05-23 21:05:29 +03:00
|
|
|
}
|
2020-04-01 01:13:26 +03:00
|
|
|
|
|
|
|
// Now that the shard was successfully sent, launch a go
|
|
|
|
// routine that will handle its result when its back.
|
|
|
|
shardHandler.collectResultAsync(attempt)
|
2019-05-23 21:05:29 +03:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-04-01 01:13:24 +03:00
|
|
|
// shardHandler holds what is necessary to send and collect the result of
|
|
|
|
// shards.
|
|
|
|
type shardHandler struct {
|
2021-03-31 13:23:08 +03:00
|
|
|
identifier lntypes.Hash
|
2021-04-12 16:21:59 +03:00
|
|
|
router *ChannelRouter
|
|
|
|
shardTracker shards.ShardTracker
|
2020-04-01 01:13:26 +03:00
|
|
|
|
|
|
|
// shardErrors is a channel where errors collected by calling
|
|
|
|
// collectResultAsync will be delivered. These results are meant to be
|
|
|
|
// inspected by calling waitForShard or checkShards, and the channel
|
|
|
|
// doesn't need to be initiated if the caller is using the sync
|
|
|
|
// collectResult directly.
|
|
|
|
shardErrors chan error
|
|
|
|
|
|
|
|
// quit is closed to signal the sub goroutines of the payment lifecycle
|
|
|
|
// to stop.
|
|
|
|
quit chan struct{}
|
|
|
|
wg sync.WaitGroup
|
|
|
|
}
|
|
|
|
|
|
|
|
// stop signals any active shard goroutine to exit and waits for them to exit.
|
|
|
|
func (p *shardHandler) stop() {
|
|
|
|
close(p.quit)
|
|
|
|
p.wg.Wait()
|
|
|
|
}
|
|
|
|
|
|
|
|
// waitForShard blocks until any of the outstanding shards return.
|
|
|
|
func (p *shardHandler) waitForShard() error {
|
|
|
|
select {
|
|
|
|
case err := <-p.shardErrors:
|
|
|
|
return err
|
|
|
|
|
|
|
|
case <-p.quit:
|
2020-11-24 16:15:12 +03:00
|
|
|
return errShardHandlerExiting
|
2020-04-01 01:13:26 +03:00
|
|
|
|
|
|
|
case <-p.router.quit:
|
|
|
|
return ErrRouterShuttingDown
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// checkShards is a non-blocking method that check if any shards has finished
|
|
|
|
// their execution.
|
|
|
|
func (p *shardHandler) checkShards() error {
|
|
|
|
for {
|
|
|
|
select {
|
|
|
|
case err := <-p.shardErrors:
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
case <-p.quit:
|
2020-11-24 16:15:12 +03:00
|
|
|
return errShardHandlerExiting
|
2020-04-01 01:13:26 +03:00
|
|
|
|
|
|
|
case <-p.router.quit:
|
|
|
|
return ErrRouterShuttingDown
|
|
|
|
|
|
|
|
default:
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
}
|
2020-04-01 01:13:24 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
// launchOutcome is a type returned from launchShard that indicates whether the
|
|
|
|
// shard was successfully send onto the network.
|
|
|
|
type launchOutcome struct {
|
|
|
|
// err is non-nil if a non-critical error was encountered when trying
|
|
|
|
// to send the shard, and we successfully updated the control tower to
|
|
|
|
// reflect this error. This can be errors like not enough local
|
|
|
|
// balance for the given route etc.
|
|
|
|
err error
|
2020-05-06 16:44:36 +03:00
|
|
|
|
|
|
|
// attempt is the attempt structure as recorded in the database.
|
|
|
|
attempt *channeldb.HTLCAttempt
|
2020-04-01 01:13:24 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
// launchShard creates and sends an HTLC attempt along the given route,
|
2021-04-12 16:21:59 +03:00
|
|
|
// registering it with the control tower before sending it. The lastShard
|
|
|
|
// argument should be true if this shard will consume the remainder of the
|
|
|
|
// amount to send. It returns the HTLCAttemptInfo that was created for the
|
|
|
|
// shard, along with a launchOutcome. The launchOutcome is used to indicate
|
|
|
|
// whether the attempt was successfully sent. If the launchOutcome wraps a
|
|
|
|
// non-nil error, it means that the attempt was not sent onto the network, so
|
|
|
|
// no result will be available in the future for it.
|
|
|
|
func (p *shardHandler) launchShard(rt *route.Route,
|
|
|
|
lastShard bool) (*channeldb.HTLCAttemptInfo, *launchOutcome, error) {
|
2020-04-01 01:13:24 +03:00
|
|
|
|
|
|
|
// Using the route received from the payment session, create a new
|
|
|
|
// shard to send.
|
|
|
|
firstHop, htlcAdd, attempt, err := p.createNewPaymentAttempt(
|
2021-04-12 16:21:59 +03:00
|
|
|
rt, lastShard,
|
2020-04-01 01:13:24 +03:00
|
|
|
)
|
|
|
|
if err != nil {
|
|
|
|
return nil, nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
// Before sending this HTLC to the switch, we checkpoint the fresh
|
|
|
|
// paymentID and route to the DB. This lets us know on startup the ID
|
|
|
|
// of the payment that we attempted to send, such that we can query the
|
|
|
|
// Switch for its whereabouts. The route is needed to handle the result
|
|
|
|
// when it eventually comes back.
|
2021-03-31 13:23:08 +03:00
|
|
|
err = p.router.cfg.Control.RegisterAttempt(p.identifier, attempt)
|
2020-04-01 01:13:24 +03:00
|
|
|
if err != nil {
|
|
|
|
return nil, nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
// Now that the attempt is created and checkpointed to the DB, we send
|
|
|
|
// it.
|
|
|
|
sendErr := p.sendPaymentAttempt(attempt, firstHop, htlcAdd)
|
|
|
|
if sendErr != nil {
|
|
|
|
// TODO(joostjager): Distinguish unexpected internal errors
|
|
|
|
// from real send errors.
|
2020-05-06 16:44:36 +03:00
|
|
|
htlcAttempt, err := p.failAttempt(attempt, sendErr)
|
2020-04-01 01:13:24 +03:00
|
|
|
if err != nil {
|
|
|
|
return nil, nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
// Return a launchOutcome indicating the shard failed.
|
|
|
|
return attempt, &launchOutcome{
|
2020-05-06 16:44:36 +03:00
|
|
|
attempt: htlcAttempt,
|
|
|
|
err: sendErr,
|
2020-04-01 01:13:24 +03:00
|
|
|
}, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
return attempt, &launchOutcome{}, nil
|
|
|
|
}
|
|
|
|
|
2020-04-01 01:13:24 +03:00
|
|
|
// shardResult holds the resulting outcome of a shard sent.
|
|
|
|
type shardResult struct {
|
2020-05-06 16:44:36 +03:00
|
|
|
// attempt is the attempt structure as recorded in the database.
|
|
|
|
attempt *channeldb.HTLCAttempt
|
2020-04-01 01:13:24 +03:00
|
|
|
|
|
|
|
// err indicates that the shard failed.
|
|
|
|
err error
|
|
|
|
}
|
|
|
|
|
2020-04-01 01:13:26 +03:00
|
|
|
// collectResultAsync launches a goroutine that will wait for the result of the
|
|
|
|
// given HTLC attempt to be available then handle its result. Note that it will
|
|
|
|
// fail the payment with the control tower if a terminal error is encountered.
|
|
|
|
func (p *shardHandler) collectResultAsync(attempt *channeldb.HTLCAttemptInfo) {
|
|
|
|
p.wg.Add(1)
|
|
|
|
go func() {
|
|
|
|
defer p.wg.Done()
|
|
|
|
|
|
|
|
// Block until the result is available.
|
|
|
|
result, err := p.collectResult(attempt)
|
|
|
|
if err != nil {
|
|
|
|
if err != ErrRouterShuttingDown &&
|
2020-11-24 16:15:12 +03:00
|
|
|
err != htlcswitch.ErrSwitchExiting &&
|
|
|
|
err != errShardHandlerExiting {
|
2020-04-01 01:13:26 +03:00
|
|
|
|
|
|
|
log.Errorf("Error collecting result for "+
|
|
|
|
"shard %v for payment %v: %v",
|
2021-03-31 13:23:08 +03:00
|
|
|
attempt.AttemptID, p.identifier, err)
|
2020-04-01 01:13:26 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
select {
|
|
|
|
case p.shardErrors <- err:
|
|
|
|
case <-p.router.quit:
|
|
|
|
case <-p.quit:
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
// If a non-critical error was encountered handle it and mark
|
|
|
|
// the payment failed if the failure was terminal.
|
|
|
|
if result.err != nil {
|
|
|
|
err := p.handleSendError(attempt, result.err)
|
|
|
|
if err != nil {
|
|
|
|
select {
|
|
|
|
case p.shardErrors <- err:
|
|
|
|
case <-p.router.quit:
|
|
|
|
case <-p.quit:
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
select {
|
|
|
|
case p.shardErrors <- nil:
|
|
|
|
case <-p.router.quit:
|
|
|
|
case <-p.quit:
|
|
|
|
}
|
|
|
|
}()
|
|
|
|
}
|
|
|
|
|
2020-04-01 01:13:24 +03:00
|
|
|
// collectResult waits for the result for the given attempt to be available
|
|
|
|
// from the Switch, then records the attempt outcome with the control tower. A
|
|
|
|
// shardResult is returned, indicating the final outcome of this HTLC attempt.
|
|
|
|
func (p *shardHandler) collectResult(attempt *channeldb.HTLCAttemptInfo) (
|
|
|
|
*shardResult, error) {
|
|
|
|
|
2021-04-12 16:21:59 +03:00
|
|
|
// We'll retrieve the hash specific to this shard from the
|
|
|
|
// shardTracker, since it will be needed to regenerate the circuit
|
|
|
|
// below.
|
|
|
|
hash, err := p.shardTracker.GetHash(attempt.AttemptID)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2020-04-01 01:13:24 +03:00
|
|
|
// Regenerate the circuit for this attempt.
|
|
|
|
_, circuit, err := generateSphinxPacket(
|
2021-05-19 10:03:46 +03:00
|
|
|
&attempt.Route, hash[:], attempt.SessionKey(),
|
2020-04-01 01:13:24 +03:00
|
|
|
)
|
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
// Using the created circuit, initialize the error decrypter so we can
|
|
|
|
// parse+decode any failures incurred by this payment within the
|
|
|
|
// switch.
|
|
|
|
errorDecryptor := &htlcswitch.SphinxErrorDecrypter{
|
|
|
|
OnionErrorDecrypter: sphinx.NewOnionErrorDecrypter(circuit),
|
|
|
|
}
|
|
|
|
|
|
|
|
// Now ask the switch to return the result of the payment when
|
|
|
|
// available.
|
|
|
|
resultChan, err := p.router.cfg.Payer.GetPaymentResult(
|
2021-03-31 13:23:08 +03:00
|
|
|
attempt.AttemptID, p.identifier, errorDecryptor,
|
2020-04-01 01:13:24 +03:00
|
|
|
)
|
|
|
|
switch {
|
|
|
|
|
|
|
|
// If this attempt ID is unknown to the Switch, it means it was never
|
|
|
|
// checkpointed and forwarded by the switch before a restart. In this
|
|
|
|
// case we can safely send a new payment attempt, and wait for its
|
|
|
|
// result to be available.
|
|
|
|
case err == htlcswitch.ErrPaymentIDNotFound:
|
2021-03-31 13:23:08 +03:00
|
|
|
log.Debugf("Attempt ID %v for payment %v not found in "+
|
2020-04-01 01:13:24 +03:00
|
|
|
"the Switch, retrying.", attempt.AttemptID,
|
2021-03-31 13:23:08 +03:00
|
|
|
p.identifier)
|
2020-04-01 01:13:24 +03:00
|
|
|
|
2020-05-06 16:44:36 +03:00
|
|
|
attempt, cErr := p.failAttempt(attempt, err)
|
2020-04-01 01:13:24 +03:00
|
|
|
if cErr != nil {
|
|
|
|
return nil, cErr
|
|
|
|
}
|
|
|
|
|
|
|
|
return &shardResult{
|
2020-05-06 16:44:36 +03:00
|
|
|
attempt: attempt,
|
|
|
|
err: err,
|
2020-04-01 01:13:24 +03:00
|
|
|
}, nil
|
|
|
|
|
|
|
|
// A critical, unexpected error was encountered.
|
|
|
|
case err != nil:
|
|
|
|
log.Errorf("Failed getting result for attemptID %d "+
|
|
|
|
"from switch: %v", attempt.AttemptID, err)
|
|
|
|
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
// The switch knows about this payment, we'll wait for a result to be
|
|
|
|
// available.
|
|
|
|
var (
|
|
|
|
result *htlcswitch.PaymentResult
|
|
|
|
ok bool
|
|
|
|
)
|
|
|
|
|
|
|
|
select {
|
|
|
|
case result, ok = <-resultChan:
|
|
|
|
if !ok {
|
|
|
|
return nil, htlcswitch.ErrSwitchExiting
|
|
|
|
}
|
|
|
|
|
|
|
|
case <-p.router.quit:
|
|
|
|
return nil, ErrRouterShuttingDown
|
2020-04-01 01:13:26 +03:00
|
|
|
|
|
|
|
case <-p.quit:
|
2020-11-24 16:15:12 +03:00
|
|
|
return nil, errShardHandlerExiting
|
2020-04-01 01:13:24 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
// In case of a payment failure, fail the attempt with the control
|
|
|
|
// tower and return.
|
|
|
|
if result.Error != nil {
|
2020-05-06 16:44:36 +03:00
|
|
|
attempt, err := p.failAttempt(attempt, result.Error)
|
2020-04-01 01:13:24 +03:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
return &shardResult{
|
2020-05-06 16:44:36 +03:00
|
|
|
attempt: attempt,
|
|
|
|
err: result.Error,
|
2020-04-01 01:13:24 +03:00
|
|
|
}, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// We successfully got a payment result back from the switch.
|
2020-04-06 13:18:50 +03:00
|
|
|
log.Debugf("Payment %v succeeded with pid=%v",
|
2021-03-31 13:23:08 +03:00
|
|
|
p.identifier, attempt.AttemptID)
|
2020-04-01 01:13:24 +03:00
|
|
|
|
|
|
|
// Report success to mission control.
|
|
|
|
err = p.router.cfg.MissionControl.ReportPaymentSuccess(
|
|
|
|
attempt.AttemptID, &attempt.Route,
|
|
|
|
)
|
|
|
|
if err != nil {
|
|
|
|
log.Errorf("Error reporting payment success to mc: %v",
|
|
|
|
err)
|
|
|
|
}
|
|
|
|
|
|
|
|
// In case of success we atomically store settle result to the DB move
|
|
|
|
// the shard to the settled state.
|
2020-05-06 16:44:36 +03:00
|
|
|
htlcAttempt, err := p.router.cfg.Control.SettleAttempt(
|
2021-03-31 13:23:08 +03:00
|
|
|
p.identifier, attempt.AttemptID,
|
2020-04-01 01:13:24 +03:00
|
|
|
&channeldb.HTLCSettleInfo{
|
|
|
|
Preimage: result.Preimage,
|
|
|
|
SettleTime: p.router.cfg.Clock.Now(),
|
|
|
|
},
|
|
|
|
)
|
|
|
|
if err != nil {
|
|
|
|
log.Errorf("Unable to succeed payment attempt: %v", err)
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
return &shardResult{
|
2020-05-06 16:44:36 +03:00
|
|
|
attempt: htlcAttempt,
|
2020-04-01 01:13:24 +03:00
|
|
|
}, nil
|
|
|
|
}
|
|
|
|
|
2020-04-01 01:13:23 +03:00
|
|
|
// createNewPaymentAttempt creates a new payment attempt from the given route.
|
2021-04-12 16:21:59 +03:00
|
|
|
func (p *shardHandler) createNewPaymentAttempt(rt *route.Route, lastShard bool) (
|
2020-04-01 01:13:23 +03:00
|
|
|
lnwire.ShortChannelID, *lnwire.UpdateAddHTLC,
|
|
|
|
*channeldb.HTLCAttemptInfo, error) {
|
2019-05-23 21:05:29 +03:00
|
|
|
|
|
|
|
// Generate a new key to be used for this attempt.
|
|
|
|
sessionKey, err := generateNewSessionKey()
|
|
|
|
if err != nil {
|
2020-04-01 01:13:23 +03:00
|
|
|
return lnwire.ShortChannelID{}, nil, nil, err
|
2019-05-23 21:05:29 +03:00
|
|
|
}
|
|
|
|
|
2021-04-12 16:21:59 +03:00
|
|
|
// We generate a new, unique payment ID that we will use for
|
|
|
|
// this HTLC.
|
|
|
|
attemptID, err := p.router.cfg.NextPaymentID()
|
|
|
|
if err != nil {
|
|
|
|
return lnwire.ShortChannelID{}, nil, nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
// Requesst a new shard from the ShardTracker. If this is an AMP
|
|
|
|
// payment, and this is the last shard, the outstanding shards together
|
|
|
|
// with ths one will be enough for the receiver to derive all HTLC
|
|
|
|
// preimages. If this a non-AMP payment, the ShardTracker will return a
|
|
|
|
// simple shard with the payment's static payment hash.
|
|
|
|
shard, err := p.shardTracker.NewShard(attemptID, lastShard)
|
|
|
|
if err != nil {
|
|
|
|
return lnwire.ShortChannelID{}, nil, nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
// It this shard carries MPP or AMP options, add them to the last hop
|
|
|
|
// on the route.
|
|
|
|
hop := rt.Hops[len(rt.Hops)-1]
|
|
|
|
if shard.MPP() != nil {
|
|
|
|
hop.MPP = shard.MPP()
|
|
|
|
}
|
|
|
|
|
|
|
|
if shard.AMP() != nil {
|
|
|
|
hop.AMP = shard.AMP()
|
|
|
|
}
|
|
|
|
|
2019-05-23 21:05:29 +03:00
|
|
|
// Generate the raw encoded sphinx packet to be included along
|
|
|
|
// with the htlcAdd message that we send directly to the
|
|
|
|
// switch.
|
2021-04-12 16:21:59 +03:00
|
|
|
hash := shard.Hash()
|
|
|
|
onionBlob, _, err := generateSphinxPacket(rt, hash[:], sessionKey)
|
2019-05-23 21:05:29 +03:00
|
|
|
if err != nil {
|
2020-04-01 01:13:23 +03:00
|
|
|
return lnwire.ShortChannelID{}, nil, nil, err
|
2019-05-23 21:05:29 +03:00
|
|
|
}
|
|
|
|
|
2019-05-23 21:05:29 +03:00
|
|
|
// Craft an HTLC packet to send to the layer 2 switch. The
|
|
|
|
// metadata within this packet will be used to route the
|
|
|
|
// payment through the network, starting with the first-hop.
|
|
|
|
htlcAdd := &lnwire.UpdateAddHTLC{
|
2019-12-11 10:41:59 +03:00
|
|
|
Amount: rt.TotalAmount,
|
|
|
|
Expiry: rt.TotalTimeLock,
|
2021-04-12 16:21:59 +03:00
|
|
|
PaymentHash: hash,
|
2019-05-23 21:05:29 +03:00
|
|
|
}
|
|
|
|
copy(htlcAdd.OnionBlob[:], onionBlob)
|
|
|
|
|
|
|
|
// Attempt to send this payment through the network to complete
|
|
|
|
// the payment. If this attempt fails, then we'll continue on
|
|
|
|
// to the next available route.
|
|
|
|
firstHop := lnwire.NewShortChanIDFromInt(
|
2019-12-11 10:41:59 +03:00
|
|
|
rt.Hops[0].ChannelID,
|
2019-05-23 21:05:29 +03:00
|
|
|
)
|
|
|
|
|
2021-05-19 10:03:46 +03:00
|
|
|
// We now have all the information needed to populate the current
|
|
|
|
// attempt information.
|
|
|
|
attempt := channeldb.NewHtlcAttemptInfo(
|
|
|
|
attemptID, sessionKey, *rt, p.router.cfg.Clock.Now(), &hash,
|
|
|
|
)
|
2019-05-23 21:05:29 +03:00
|
|
|
|
2020-04-01 01:13:23 +03:00
|
|
|
return firstHop, htlcAdd, attempt, nil
|
2019-05-23 21:05:29 +03:00
|
|
|
}
|
2019-05-23 21:05:29 +03:00
|
|
|
|
2019-05-23 21:05:29 +03:00
|
|
|
// sendPaymentAttempt attempts to send the current attempt to the switch.
|
2020-04-01 01:13:24 +03:00
|
|
|
func (p *shardHandler) sendPaymentAttempt(
|
2020-04-01 01:13:24 +03:00
|
|
|
attempt *channeldb.HTLCAttemptInfo, firstHop lnwire.ShortChannelID,
|
2019-05-23 21:05:29 +03:00
|
|
|
htlcAdd *lnwire.UpdateAddHTLC) error {
|
|
|
|
|
2020-04-06 13:18:50 +03:00
|
|
|
log.Tracef("Attempting to send payment %v (pid=%v), "+
|
2021-03-31 13:23:08 +03:00
|
|
|
"using route: %v", p.identifier, attempt.AttemptID,
|
2019-05-23 21:05:29 +03:00
|
|
|
newLogClosure(func() string {
|
2020-04-01 01:13:24 +03:00
|
|
|
return spew.Sdump(attempt.Route)
|
2019-05-23 21:05:29 +03:00
|
|
|
}),
|
|
|
|
)
|
|
|
|
|
|
|
|
// Send it to the Switch. When this method returns we assume
|
|
|
|
// the Switch successfully has persisted the payment attempt,
|
|
|
|
// such that we can resume waiting for the result after a
|
|
|
|
// restart.
|
|
|
|
err := p.router.cfg.Payer.SendHTLC(
|
2020-04-01 01:13:24 +03:00
|
|
|
firstHop, attempt.AttemptID, htlcAdd,
|
2019-05-23 21:05:29 +03:00
|
|
|
)
|
|
|
|
if err != nil {
|
|
|
|
log.Errorf("Failed sending attempt %d for payment "+
|
2020-04-06 13:18:50 +03:00
|
|
|
"%v to switch: %v", attempt.AttemptID,
|
2021-03-31 13:23:08 +03:00
|
|
|
p.identifier, err)
|
2019-05-23 21:05:29 +03:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2020-04-06 13:18:50 +03:00
|
|
|
log.Debugf("Payment %v (pid=%v) successfully sent to switch, route: %v",
|
2021-03-31 13:23:08 +03:00
|
|
|
p.identifier, attempt.AttemptID, &attempt.Route)
|
2019-05-23 21:05:29 +03:00
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
2019-05-23 21:05:29 +03:00
|
|
|
|
2019-05-23 21:05:29 +03:00
|
|
|
// handleSendError inspects the given error from the Switch and determines
|
2020-04-01 01:13:25 +03:00
|
|
|
// whether we should make another payment attempt, or if it should be
|
|
|
|
// considered a terminal error. Terminal errors will be recorded with the
|
|
|
|
// control tower.
|
2020-04-01 01:13:24 +03:00
|
|
|
func (p *shardHandler) handleSendError(attempt *channeldb.HTLCAttemptInfo,
|
2020-04-01 01:13:24 +03:00
|
|
|
sendErr error) error {
|
2019-05-23 22:17:16 +03:00
|
|
|
|
2019-08-05 13:13:58 +03:00
|
|
|
reason := p.router.processSendError(
|
2020-04-01 01:13:24 +03:00
|
|
|
attempt.AttemptID, &attempt.Route, sendErr,
|
2019-06-19 12:12:10 +03:00
|
|
|
)
|
2019-08-05 13:13:58 +03:00
|
|
|
if reason == nil {
|
2019-06-19 12:12:10 +03:00
|
|
|
return nil
|
2019-06-04 12:22:23 +03:00
|
|
|
}
|
|
|
|
|
2020-11-24 16:16:03 +03:00
|
|
|
log.Infof("Payment %v failed: final_outcome=%v, raw_err=%v",
|
2021-03-31 13:23:08 +03:00
|
|
|
p.identifier, *reason, sendErr)
|
2019-05-23 21:05:29 +03:00
|
|
|
|
2021-03-31 13:23:08 +03:00
|
|
|
err := p.router.cfg.Control.Fail(p.identifier, *reason)
|
2019-06-04 12:22:23 +03:00
|
|
|
if err != nil {
|
|
|
|
return err
|
2019-05-23 21:05:29 +03:00
|
|
|
}
|
|
|
|
|
2020-04-01 01:13:25 +03:00
|
|
|
return nil
|
2019-05-23 21:05:29 +03:00
|
|
|
}
|
2020-02-20 20:08:01 +03:00
|
|
|
|
|
|
|
// failAttempt calls control tower to fail the current payment attempt.
|
2020-04-01 01:13:24 +03:00
|
|
|
func (p *shardHandler) failAttempt(attempt *channeldb.HTLCAttemptInfo,
|
2020-05-06 16:44:36 +03:00
|
|
|
sendError error) (*channeldb.HTLCAttempt, error) {
|
2020-04-01 01:13:24 +03:00
|
|
|
|
2020-04-01 01:13:26 +03:00
|
|
|
log.Warnf("Attempt %v for payment %v failed: %v", attempt.AttemptID,
|
2021-03-31 13:23:08 +03:00
|
|
|
p.identifier, sendError)
|
2020-04-01 01:13:26 +03:00
|
|
|
|
2020-02-20 20:08:01 +03:00
|
|
|
failInfo := marshallError(
|
|
|
|
sendError,
|
|
|
|
p.router.cfg.Clock.Now(),
|
|
|
|
)
|
2020-02-20 20:08:01 +03:00
|
|
|
|
2021-04-12 16:21:59 +03:00
|
|
|
// Now that we are failing this payment attempt, cancel the shard with
|
|
|
|
// the ShardTracker such that it can derive the correct hash for the
|
|
|
|
// next attempt.
|
|
|
|
if err := p.shardTracker.CancelShard(attempt.AttemptID); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
2020-02-20 20:08:01 +03:00
|
|
|
return p.router.cfg.Control.FailAttempt(
|
2021-03-31 13:23:08 +03:00
|
|
|
p.identifier, attempt.AttemptID,
|
2020-02-20 20:08:01 +03:00
|
|
|
failInfo,
|
|
|
|
)
|
|
|
|
}
|
2020-02-20 20:08:01 +03:00
|
|
|
|
|
|
|
// marshallError marshall an error as received from the switch to a structure
|
|
|
|
// that is suitable for database storage.
|
|
|
|
func marshallError(sendError error, time time.Time) *channeldb.HTLCFailInfo {
|
|
|
|
response := &channeldb.HTLCFailInfo{
|
|
|
|
FailTime: time,
|
|
|
|
}
|
|
|
|
|
|
|
|
switch sendError {
|
|
|
|
|
|
|
|
case htlcswitch.ErrPaymentIDNotFound:
|
|
|
|
response.Reason = channeldb.HTLCFailInternal
|
|
|
|
return response
|
|
|
|
|
|
|
|
case htlcswitch.ErrUnreadableFailureMessage:
|
|
|
|
response.Reason = channeldb.HTLCFailUnreadable
|
|
|
|
return response
|
|
|
|
}
|
|
|
|
|
|
|
|
rtErr, ok := sendError.(htlcswitch.ClearTextError)
|
|
|
|
if !ok {
|
|
|
|
response.Reason = channeldb.HTLCFailInternal
|
|
|
|
return response
|
|
|
|
}
|
|
|
|
|
|
|
|
message := rtErr.WireMessage()
|
|
|
|
if message != nil {
|
|
|
|
response.Reason = channeldb.HTLCFailMessage
|
|
|
|
response.Message = message
|
|
|
|
} else {
|
|
|
|
response.Reason = channeldb.HTLCFailUnknown
|
|
|
|
}
|
|
|
|
|
|
|
|
// If the ClearTextError received is a ForwardingError, the error
|
|
|
|
// originated from a node along the route, not locally on our outgoing
|
|
|
|
// link. We set failureSourceIdx to the index of the node where the
|
|
|
|
// failure occurred. If the error is not a ForwardingError, the failure
|
|
|
|
// occurred at our node, so we leave the index as 0 to indicate that
|
|
|
|
// we failed locally.
|
|
|
|
fErr, ok := rtErr.(*htlcswitch.ForwardingError)
|
|
|
|
if ok {
|
|
|
|
response.FailureSourceIndex = uint32(fErr.FailureSourceIdx)
|
|
|
|
}
|
|
|
|
|
|
|
|
return response
|
|
|
|
}
|