Track actions to execute after a `ChannelMonitor` is updated
[rust-lightning] / lightning / src / ln / channelmanager.rs
index a1148b692b102b15754386bfc620a116f4d5fb8d..9b277ff1e4691cd462d75f2b9f0abc97751e59d1 100644
@@ -65,12 +65,14 @@ use crate::util::ser::{BigSize, FixedLengthReader, Readable, ReadableArgs, Maybe
 use crate::util::logger::{Level, Logger};
 use crate::util::errors::APIError;
 
+use alloc::collections::BTreeMap;
+
 use crate::io;
 use crate::prelude::*;
 use core::{cmp, mem};
 use core::cell::RefCell;
 use crate::io::Read;
-use crate::sync::{Arc, Mutex, RwLock, RwLockReadGuard, FairRwLock};
+use crate::sync::{Arc, Mutex, RwLock, RwLockReadGuard, FairRwLock, LockTestExt, LockHeldState};
 use core::sync::atomic::{AtomicUsize, Ordering};
 use core::time::Duration;
 use core::ops::Deref;
@@ -474,6 +476,11 @@ pub(crate) enum MonitorUpdateCompletionAction {
        EmitEvent { event: events::Event },
 }
 
+impl_writeable_tlv_based_enum_upgradable!(MonitorUpdateCompletionAction,
+       (0, PaymentClaimed) => { (0, payment_hash, required) },
+       (2, EmitEvent) => { (0, event, ignorable) },
+);
+
 /// State we hold per-peer.
 pub(super) struct PeerState<Signer: ChannelSigner> {
        /// `temporary_channel_id` or `channel_id` -> `channel`.
@@ -487,6 +494,21 @@ pub(super) struct PeerState<Signer: ChannelSigner> {
        /// Messages to send to the peer - pushed to in the same lock that they are generated in (except
        /// for broadcast messages, where ordering isn't as strict).
        pub(super) pending_msg_events: Vec<MessageSendEvent>,
+       /// Map from a specific channel to some action(s) that should be taken when all pending
+       /// [`ChannelMonitorUpdate`]s for the channel complete updating.
+       ///
+       /// Note that, because we generally only have one entry here, a HashMap is pretty overkill. A
+       /// BTreeMap currently stores more than ten elements per leaf node, so even with up to a few
+       /// channels per peer this will just be one allocation and will amount to a linear list of
+       /// channels to walk, avoiding the whole hashing rigmarole.
+       ///
+       /// Note that the channel may no longer exist. For example, if a channel was closed but we
+       /// later needed to claim an HTLC which is pending on-chain, we may generate a monitor update
+       /// for a missing channel. While a malicious peer could construct a second channel with the
+       /// same `temporary_channel_id` (or final `channel_id` in the case of 0conf channels or prior
+       /// to funding appearing on-chain), the downstream `ChannelMonitor` set is required to ensure
+       /// duplicates do not occur, so such channels should fail without a monitor update completing.
+       monitor_update_blocked_actions: BTreeMap<[u8; 32], Vec<MonitorUpdateCompletionAction>>,
        /// The peer is currently connected (i.e. we've seen a
        /// [`ChannelMessageHandler::peer_connected`] and no corresponding
        /// [`ChannelMessageHandler::peer_disconnected`]).
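
The `monitor_update_blocked_actions` map introduced above is keyed by channel ID and is meant to be drained once the channel's pending `ChannelMonitorUpdate`s complete. A minimal sketch of that queue-then-drain pattern over a plain `BTreeMap`; the `PeerStateSketch` type, its methods, and the `CompletionAction` stand-in are illustrative only, not LDK's actual code:

    use std::collections::BTreeMap;

    // Illustrative stand-in for MonitorUpdateCompletionAction.
    enum CompletionAction {
        EmitEvent { description: String },
    }

    #[derive(Default)]
    struct PeerStateSketch {
        // Channel id -> actions to run once that channel's monitor updates finish.
        monitor_update_blocked_actions: BTreeMap<[u8; 32], Vec<CompletionAction>>,
    }

    impl PeerStateSketch {
        // While a ChannelMonitorUpdate is still in flight, queue the follow-up work.
        fn block_action(&mut self, channel_id: [u8; 32], action: CompletionAction) {
            self.monitor_update_blocked_actions
                .entry(channel_id)
                .or_insert_with(Vec::new)
                .push(action);
        }

        // When the last pending update for the channel completes, take the queued
        // actions (in insertion order) so the caller can execute them.
        fn take_completed_actions(&mut self, channel_id: &[u8; 32]) -> Vec<CompletionAction> {
            self.monitor_update_blocked_actions.remove(channel_id).unwrap_or_default()
        }
    }
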
@@ -501,7 +523,7 @@ impl <Signer: ChannelSigner> PeerState<Signer> {
                if require_disconnected && self.is_connected {
                        return false
                }
-               self.channel_by_id.len() == 0
+               self.channel_by_id.is_empty() && self.monitor_update_blocked_actions.is_empty()
        }
 }
 
@@ -1190,9 +1212,9 @@ pub enum RecentPaymentDetails {
                /// made before LDK version 0.0.104.
                payment_hash: Option<PaymentHash>,
        },
-       /// After a payment is explicitly abandoned by calling [`ChannelManager::abandon_payment`], it
-       /// is marked as abandoned until an [`Event::PaymentFailed`] is generated. A payment could also
-       /// be marked as abandoned if pathfinding fails repeatedly or retries have been exhausted.
+       /// After a payment's retries are exhausted per the provided [`Retry`], or it is explicitly
+       /// abandoned via [`ChannelManager::abandon_payment`], it is marked as abandoned until all
+       /// pending HTLCs for this payment resolve and an [`Event::PaymentFailed`] is generated.
        Abandoned {
                /// Hash of the payment that we have given up trying to send.
                payment_hash: PaymentHash,
@@ -1218,13 +1240,10 @@ macro_rules! handle_error {
                match $internal {
                        Ok(msg) => Ok(msg),
                        Err(MsgHandleErrInternal { err, chan_id, shutdown_finish }) => {
-                               #[cfg(any(feature = "_test_utils", test))]
-                               {
-                                       // In testing, ensure there are no deadlocks where the lock is already held upon
-                                       // entering the macro.
-                                       debug_assert!($self.pending_events.try_lock().is_ok());
-                                       debug_assert!($self.per_peer_state.try_write().is_ok());
-                               }
+                               // In testing, ensure there are no deadlocks where the lock is already held upon
+                               // entering the macro.
+                               debug_assert_ne!($self.pending_events.held_by_thread(), LockHeldState::HeldByThread);
+                               debug_assert_ne!($self.per_peer_state.held_by_thread(), LockHeldState::HeldByThread);
 
                                let mut msg_events = Vec::with_capacity(2);
 
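
The assertions above swap the `try_lock`-based checks (which only ran under the test features) for `LockTestExt::held_by_thread`, which can answer "does this thread already hold the lock?" without taking it. A rough, self-contained sketch of how such per-thread lock tracking can be layered over `std::sync::Mutex`; the `TestMutex` type and helpers here are hypothetical, not the crate's internal `debug_sync` implementation:

    use std::cell::RefCell;
    use std::collections::HashSet;
    use std::ops::Deref;
    use std::sync::{Mutex, MutexGuard};

    #[derive(Debug, PartialEq)]
    enum LockHeldState { HeldByThread, NotHeldByThread }

    thread_local! {
        // Addresses of the locks this thread currently holds (debug-only bookkeeping).
        static LOCKS_HELD: RefCell<HashSet<usize>> = RefCell::new(HashSet::new());
    }

    struct TestMutex<T>(Mutex<T>);

    struct TestGuard<'a, T> {
        guard: MutexGuard<'a, T>,
        key: usize,
    }

    impl<T> TestMutex<T> {
        fn new(inner: T) -> Self { TestMutex(Mutex::new(inner)) }
        fn key(&self) -> usize { self as *const Self as usize }

        fn lock(&self) -> TestGuard<'_, T> {
            let guard = self.0.lock().unwrap();
            let key = self.key();
            LOCKS_HELD.with(|held| { held.borrow_mut().insert(key); });
            TestGuard { guard, key }
        }

        // Answers "does *this thread* already hold the lock?" without locking it.
        fn held_by_thread(&self) -> LockHeldState {
            if LOCKS_HELD.with(|held| held.borrow().contains(&self.key())) {
                LockHeldState::HeldByThread
            } else {
                LockHeldState::NotHeldByThread
            }
        }
    }

    impl<'a, T> Deref for TestGuard<'a, T> {
        type Target = T;
        fn deref(&self) -> &T { &*self.guard }
    }

    impl<'a, T> Drop for TestGuard<'a, T> {
        fn drop(&mut self) {
            LOCKS_HELD.with(|held| { held.borrow_mut().remove(&self.key); });
        }
    }

    fn assert_not_held<T>(lock: &TestMutex<T>) {
        // Mirrors the diff's pattern: fail fast in debug builds if the current
        // thread already holds a lock it must not hold here.
        debug_assert_ne!(lock.held_by_thread(), LockHeldState::HeldByThread);
    }
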
@@ -1718,7 +1737,7 @@ where
        ///
        /// This can be useful for payments that may have been prepared, but ultimately not sent, as a
        /// result of a crash. If such a payment exists, is not listed here, and an
-       /// [`Event::PaymentSent`] has not been received, you may consider retrying the payment.
+       /// [`Event::PaymentSent`] has not been received, you may consider resending the payment.
        ///
        /// [`Event::PaymentSent`]: events::Event::PaymentSent
        pub fn list_recent_payments(&self) -> Vec<RecentPaymentDetails> {
@@ -2393,10 +2412,10 @@ where
                        let mut peer_state_lock = peer_state_mutex.lock().unwrap();
                        let peer_state = &mut *peer_state_lock;
                        if let hash_map::Entry::Occupied(mut chan) = peer_state.channel_by_id.entry(id) {
+                               if !chan.get().is_live() {
+                                       return Err(APIError::ChannelUnavailable{err: "Peer for first hop currently disconnected".to_owned()});
+                               }
                                match {
-                                       if !chan.get().is_live() {
-                                               return Err(APIError::ChannelUnavailable{err: "Peer for first hop currently disconnected/pending monitor update!".to_owned()});
-                                       }
                                        break_chan_entry!(self, chan.get_mut().send_htlc_and_commit(
                                                htlc_msat, payment_hash.clone(), htlc_cltv, HTLCSource::OutboundRoute {
                                                        path: path.clone(),
@@ -2475,8 +2494,8 @@ where
        /// If a pending payment is currently in-flight with the same [`PaymentId`] provided, this
        /// method will error with an [`APIError::InvalidRoute`]. Note, however, that once a payment
        /// is no longer pending (either via [`ChannelManager::abandon_payment`], or handling of an
-       /// [`Event::PaymentSent`]) LDK will not stop you from sending a second payment with the same
-       /// [`PaymentId`].
+       /// [`Event::PaymentSent`] or [`Event::PaymentFailed`]) LDK will not stop you from sending a
+       /// second payment with the same [`PaymentId`].
        ///
        /// Thus, in order to ensure duplicate payments are not sent, you should implement your own
        /// tracking of payments, including state to indicate once a payment has completed. Because you
@@ -2521,6 +2540,7 @@ where
        /// [`Route`], we assume the invoice had the basic_mpp feature set.
        ///
        /// [`Event::PaymentSent`]: events::Event::PaymentSent
+       /// [`Event::PaymentFailed`]: events::Event::PaymentFailed
        /// [`PeerManager::process_events`]: crate::ln::peer_handler::PeerManager::process_events
        /// [`ChannelMonitorUpdateStatus::InProgress`]: crate::chain::ChannelMonitorUpdateStatus::InProgress
        pub fn send_payment(&self, route: &Route, payment_hash: PaymentHash, payment_secret: &Option<PaymentSecret>, payment_id: PaymentId) -> Result<(), PaymentSendFailure> {
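The updated `send_payment` docs push duplicate-payment protection onto the caller: once a payment is no longer pending, LDK will accept the same `PaymentId` again. A hedged sketch of the caller-side tracking this implies, deriving the `PaymentId` from the payment hash and refusing to start the same payment twice; only `PaymentId`, `PaymentHash`, and `ChannelManager::send_payment` come from the crate, while `PaymentStore` and its methods are hypothetical:

    use std::collections::HashMap;

    use lightning::ln::channelmanager::PaymentId;
    use lightning::ln::PaymentHash;

    // Hypothetical caller-side record of every payment ever initiated. Persist
    // this alongside your other data so it survives restarts.
    #[derive(Clone, Copy, PartialEq)]
    enum PaymentStatus { Pending, Succeeded, Failed }

    #[derive(Default)]
    struct PaymentStore {
        payments: HashMap<PaymentId, PaymentStatus>,
    }

    impl PaymentStore {
        // Derive a deterministic PaymentId from the payment hash so a retry of the
        // same invoice maps onto the same entry.
        fn id_for(payment_hash: &PaymentHash) -> PaymentId {
            PaymentId(payment_hash.0)
        }

        // Returns Some(id) only if this payment has never been attempted; hand the
        // id to ChannelManager::send_payment, then record completion from the
        // PaymentSent / PaymentFailed events via `mark`.
        fn begin(&mut self, payment_hash: &PaymentHash) -> Option<PaymentId> {
            let id = Self::id_for(payment_hash);
            if self.payments.contains_key(&id) { return None; }
            self.payments.insert(id, PaymentStatus::Pending);
            Some(id)
        }

        fn mark(&mut self, id: PaymentId, status: PaymentStatus) {
            self.payments.insert(id, status);
        }
    }
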
@@ -2558,48 +2578,25 @@ where
        }
 
 
-       /// Retries a payment along the given [`Route`].
-       ///
-       /// Errors returned are a superset of those returned from [`send_payment`], so see
-       /// [`send_payment`] documentation for more details on errors. This method will also error if the
-       /// retry amount puts the payment more than 10% over the payment's total amount, if the payment
-       /// for the given `payment_id` cannot be found (likely due to timeout or success), or if
-       /// further retries have been disabled with [`abandon_payment`].
+       /// Signals that no further retries for the given payment should occur. Useful if you have a
+       /// pending outbound payment with retries remaining, but wish to stop retrying the payment before
+       /// retries are exhausted.
        ///
-       /// [`send_payment`]: [`ChannelManager::send_payment`]
-       /// [`abandon_payment`]: [`ChannelManager::abandon_payment`]
-       pub fn retry_payment(&self, route: &Route, payment_id: PaymentId) -> Result<(), PaymentSendFailure> {
-               let best_block_height = self.best_block.read().unwrap().height();
-               self.pending_outbound_payments.retry_payment_with_route(route, payment_id, &self.entropy_source, &self.node_signer, best_block_height,
-                       |path, payment_params, payment_hash, payment_secret, total_value, cur_height, payment_id, keysend_preimage, session_priv|
-                       self.send_payment_along_path(path, payment_params, payment_hash, payment_secret, total_value, cur_height, payment_id, keysend_preimage, session_priv))
-       }
-
-       /// Signals that no further retries for the given payment will occur.
-       ///
-       /// After this method returns, no future calls to [`retry_payment`] for the given `payment_id`
-       /// are allowed. If no [`Event::PaymentFailed`] event had been generated before, one will be
-       /// generated as soon as there are no remaining pending HTLCs for this payment.
+       /// If no [`Event::PaymentFailed`] event had been generated before, one will be generated as soon
+       /// as there are no remaining pending HTLCs for this payment.
        ///
        /// Note that calling this method does *not* prevent a payment from succeeding. You must still
        /// wait until you receive either a [`Event::PaymentFailed`] or [`Event::PaymentSent`] event to
        /// determine the ultimate status of a payment.
        ///
        /// If an [`Event::PaymentFailed`] event is generated and we restart without this
-       /// [`ChannelManager`] having been persisted, the payment may still be in the pending state
-       /// upon restart. This allows further calls to [`retry_payment`] (and requiring a second call
-       /// to [`abandon_payment`] to mark the payment as failed again). Otherwise, future calls to
-       /// [`retry_payment`] will fail with [`PaymentSendFailure::ParameterError`].
+       /// [`ChannelManager`] having been persisted, another [`Event::PaymentFailed`] may be generated.
        ///
-       /// [`abandon_payment`]: Self::abandon_payment
-       /// [`retry_payment`]: Self::retry_payment
        /// [`Event::PaymentFailed`]: events::Event::PaymentFailed
        /// [`Event::PaymentSent`]: events::Event::PaymentSent
        pub fn abandon_payment(&self, payment_id: PaymentId) {
                let _persistence_guard = PersistenceNotifierGuard::notify_on_drop(&self.total_consistency_lock, &self.persistence_notifier);
-               if let Some(payment_failed_ev) = self.pending_outbound_payments.abandon_payment(payment_id) {
-                       self.pending_events.lock().unwrap().push(payment_failed_ev);
-               }
+               self.pending_outbound_payments.abandon_payment(payment_id, &self.pending_events);
        }
 
        /// Send a spontaneous payment, which is a payment that does not require the recipient to have
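
With this change `abandon_payment` queues any resulting `Event::PaymentFailed` internally rather than returning it, so after calling it the caller simply keeps processing events. A small sketch of the event-side handling this implies, assuming an event loop already exists in the application; the handler function is hypothetical, the `Event` variants and fields are those referenced in the docs above, and the import path assumes the `lightning::util::events` module layout in use at the time of this change:

    use lightning::util::events::Event;

    // After calling ChannelManager::abandon_payment(payment_id), keep draining
    // events as usual; the payment is only final once one of these fires.
    fn handle_payment_event(event: &Event) {
        match event {
            Event::PaymentSent { payment_id, payment_hash, .. } => {
                // Abandoning does not prevent success: the payment went through.
                println!("payment {:?} ({:?}) succeeded", payment_id, payment_hash);
            },
            Event::PaymentFailed { payment_id, payment_hash, .. } => {
                // All pending HTLCs have resolved; it is now safe to forget this
                // payment_id or to re-send with a fresh one.
                println!("payment {:?} ({:?}) permanently failed", payment_id, payment_hash);
            },
            _ => {},
        }
    }
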
@@ -3372,7 +3369,8 @@ where
 
                let best_block_height = self.best_block.read().unwrap().height();
                self.pending_outbound_payments.check_retry_payments(&self.router, || self.list_usable_channels(),
-                       || self.compute_inflight_htlcs(), &self.entropy_source, &self.node_signer, best_block_height, &self.logger,
+                       || self.compute_inflight_htlcs(), &self.entropy_source, &self.node_signer, best_block_height,
+                       &self.pending_events, &self.logger,
                        |path, payment_params, payment_hash, payment_secret, total_value, cur_height, payment_id, keysend_preimage, session_priv|
                        self.send_payment_along_path(path, payment_params, payment_hash, payment_secret, total_value, cur_height, payment_id, keysend_preimage, session_priv));
 
@@ -3743,17 +3741,12 @@ where
        /// Fails an HTLC backwards to the sender of it to us.
        /// Note that we do not assume that channels corresponding to failed HTLCs are still available.
        fn fail_htlc_backwards_internal(&self, source: &HTLCSource, payment_hash: &PaymentHash, onion_error: &HTLCFailReason, destination: HTLCDestination) {
-               #[cfg(any(feature = "_test_utils", test))]
-               {
-                       // Ensure that the peer state channel storage lock is not held when calling this
-                       // function.
-                       // This ensures that future code doesn't introduce a lock_order requirement for
-                       // `forward_htlcs` to be locked after the `per_peer_state` peer locks, which calling
-                       // this function with any `per_peer_state` peer lock aquired would.
-                       let per_peer_state = self.per_peer_state.read().unwrap();
-                       for (_, peer) in per_peer_state.iter() {
-                               debug_assert!(peer.try_lock().is_ok());
-                       }
+               // Ensure that no peer state channel storage lock is held when calling this function.
+               // This ensures that future code doesn't introduce a lock-order requirement for
+               // `forward_htlcs` to be locked after the `per_peer_state` peer locks, which calling
+               // this function with any `per_peer_state` peer lock acquired would.
+               for (_, peer) in self.per_peer_state.read().unwrap().iter() {
+                       debug_assert_ne!(peer.held_by_thread(), LockHeldState::HeldByThread);
                }
 
                //TODO: There is a timing attack here where if a node fails an HTLC back to us they can
@@ -6348,6 +6341,7 @@ where
                                                channel_by_id: HashMap::new(),
                                                latest_features: init_msg.features.clone(),
                                                pending_msg_events: Vec::new(),
+                                               monitor_update_blocked_actions: BTreeMap::new(),
                                                is_connected: true,
                                        }));
                                },
@@ -6975,10 +6969,14 @@ where
                        htlc_purposes.push(purpose);
                }
 
+               let mut monitor_update_blocked_actions_per_peer = None;
+               let mut peer_states = Vec::new();
+               for (_, peer_state_mutex) in per_peer_state.iter() {
+                       peer_states.push(peer_state_mutex.lock().unwrap());
+               }
+
                (serializable_peer_count).write(writer)?;
-               for (peer_pubkey, peer_state_mutex) in per_peer_state.iter() {
-                       let peer_state_lock = peer_state_mutex.lock().unwrap();
-                       let peer_state = &*peer_state_lock;
+               for ((peer_pubkey, _), peer_state) in per_peer_state.iter().zip(peer_states.iter()) {
                        // Peers which we have no channels to should be dropped once disconnected. As we
                        // disconnect all peers when shutting down and serializing the ChannelManager, we
                        // consider all peers as disconnected here. There's therefore no need to write peers with
@@ -6986,6 +6984,11 @@ where
                        if !peer_state.ok_to_remove(false) {
                                peer_pubkey.write(writer)?;
                                peer_state.latest_features.write(writer)?;
+                               if !peer_state.monitor_update_blocked_actions.is_empty() {
+                                       monitor_update_blocked_actions_per_peer
+                                               .get_or_insert_with(Vec::new)
+                                               .push((*peer_pubkey, &peer_state.monitor_update_blocked_actions));
+                               }
                        }
                }
 
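
Serialization now takes every per-peer lock up front, holds the guards in a `Vec`, and then re-walks the map zipped against those guards, so both passes (the peer count written earlier and the peer bodies, plus the gathered blocked actions) see one consistent snapshot. A stripped-down sketch of that lock-all-then-zip pattern over plain `std` types; every name here is a placeholder, not the crate's API:

    use std::collections::HashMap;
    use std::sync::Mutex;

    // Placeholder for the per-peer state the real code serializes.
    struct PeerData {
        blocked_actions: Vec<String>,
    }

    fn snapshot_blocked_actions(
        per_peer_state: &HashMap<[u8; 33], Mutex<PeerData>>,
    ) -> Vec<([u8; 33], Vec<String>)> {
        // Pass 1: take every peer lock, in map iteration order, and keep the
        // guards alive so the state cannot change while we serialize it.
        let mut peer_guards = Vec::new();
        for (_, peer_mutex) in per_peer_state.iter() {
            peer_guards.push(peer_mutex.lock().unwrap());
        }

        // Pass 2: zip the keys with the held guards. Iterating the same HashMap
        // twice without mutating it yields the same order, so keys and guards
        // stay lined up. The real code also writes each peer entry here.
        let mut blocked_actions_per_peer = Vec::new();
        for ((peer_pubkey, _), peer) in per_peer_state.iter().zip(peer_guards.iter()) {
            if !peer.blocked_actions.is_empty() {
                blocked_actions_per_peer.push((*peer_pubkey, peer.blocked_actions.clone()));
            }
        }
        blocked_actions_per_peer
    }
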
@@ -7073,6 +7076,7 @@ where
                        (3, pending_outbound_payments, required),
                        (4, pending_claiming_payments, option),
                        (5, self.our_network_pubkey, required),
+                       (6, monitor_update_blocked_actions_per_peer, option),
                        (7, self.fake_scid_rand_bytes, required),
                        (9, htlc_purposes, vec_type),
                        (11, self.probing_cookie_secret, required),
@@ -7385,6 +7389,7 @@ where
                                channel_by_id: peer_channels.remove(&peer_pubkey).unwrap_or(HashMap::new()),
                                latest_features: Readable::read(reader)?,
                                pending_msg_events: Vec::new(),
+                               monitor_update_blocked_actions: BTreeMap::new(),
                                is_connected: false,
                        };
                        per_peer_state.insert(peer_pubkey, Mutex::new(peer_state));
@@ -7441,12 +7446,14 @@ where
                let mut probing_cookie_secret: Option<[u8; 32]> = None;
                let mut claimable_htlc_purposes = None;
                let mut pending_claiming_payments = Some(HashMap::new());
+               let mut monitor_update_blocked_actions_per_peer = Some(Vec::new());
                read_tlv_fields!(reader, {
                        (1, pending_outbound_payments_no_retry, option),
                        (2, pending_intercepted_htlcs, option),
                        (3, pending_outbound_payments, option),
                        (4, pending_claiming_payments, option),
                        (5, received_network_pubkey, option),
+                       (6, monitor_update_blocked_actions_per_peer, option),
                        (7, fake_scid_rand_bytes, option),
                        (9, claimable_htlc_purposes, vec_type),
                        (11, probing_cookie_secret, option),
@@ -7712,6 +7719,15 @@ where
                        }
                }
 
+               for (node_id, monitor_update_blocked_actions) in monitor_update_blocked_actions_per_peer.unwrap() {
+                       if let Some(peer_state) = per_peer_state.get_mut(&node_id) {
+                               peer_state.lock().unwrap().monitor_update_blocked_actions = monitor_update_blocked_actions;
+                       } else {
+                               log_error!(args.logger, "Got blocked actions without a per-peer-state for {}", node_id);
+                               return Err(DecodeError::InvalidValue);
+                       }
+               }
+
                let channel_manager = ChannelManager {
                        genesis_hash,
                        fee_estimator: bounded_fee_estimator,
@@ -7723,7 +7739,7 @@ where
 
                        inbound_payment_key: expanded_inbound_key,
                        pending_inbound_payments: Mutex::new(pending_inbound_payments),
-                       pending_outbound_payments: OutboundPayments { pending_outbound_payments: Mutex::new(pending_outbound_payments.unwrap()) },
+                       pending_outbound_payments: OutboundPayments { pending_outbound_payments: Mutex::new(pending_outbound_payments.unwrap()), retry_lock: Mutex::new(()), },
                        pending_intercepted_htlcs: Mutex::new(pending_intercepted_htlcs.unwrap()),
 
                        forward_htlcs: Mutex::new(forward_htlcs),