Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

[XCM] Treat recursion limit error as transient in the MQ #4202

Merged
merged 9 commits into from
Apr 25, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
46 changes: 45 additions & 1 deletion polkadot/xcm/xcm-builder/src/process_xcm_message.rs
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,12 @@ impl<
target: LOG_TARGET,
"XCM message execution error: {error:?}",
);
(required, Err(ProcessMessageError::Unsupported))
let error = match error {
xcm::latest::Error::ExceedsStackLimit => ProcessMessageError::StackLimitReached,
_ => ProcessMessageError::Unsupported,
};

(required, Err(error))
},
};
meter.consume(consumed);
Expand Down Expand Up @@ -148,6 +153,45 @@ mod tests {
}
}

#[test]
fn process_message_exceeds_limits_fails() {
struct MockedExecutor;
impl ExecuteXcm<()> for MockedExecutor {
type Prepared = xcm_executor::WeighedMessage<()>;
fn prepare(
message: xcm::latest::Xcm<()>,
) -> core::result::Result<Self::Prepared, xcm::latest::Xcm<()>> {
Ok(xcm_executor::WeighedMessage::new(Weight::zero(), message))
}
fn execute(
_: impl Into<Location>,
_: Self::Prepared,
_: &mut XcmHash,
_: Weight,
) -> Outcome {
Outcome::Error { error: xcm::latest::Error::ExceedsStackLimit }
}
fn charge_fees(_location: impl Into<Location>, _fees: Assets) -> xcm::latest::Result {
unreachable!()
}
}

type Processor = ProcessXcmMessage<Junction, MockedExecutor, ()>;

let xcm = VersionedXcm::V4(xcm::latest::Xcm::<()>(vec![
xcm::latest::Instruction::<()>::ClearOrigin,
]));
assert_err!(
Processor::process_message(
&xcm.encode(),
ORIGIN,
&mut WeightMeter::new(),
&mut [0; 32]
),
ProcessMessageError::StackLimitReached,
);
}

#[test]
fn process_message_overweight_fails() {
for msg in [v3_xcm(true), v3_xcm(false), v3_xcm(false), v2_xcm(false)] {
Expand Down
7 changes: 7 additions & 0 deletions polkadot/xcm/xcm-executor/src/lib.rs
Original file line number Diff line number Diff line change
Expand Up @@ -182,6 +182,13 @@ impl<C> PreparedMessage for WeighedMessage<C> {
}
}

#[cfg(any(test, feature = "std"))]
impl<C> WeighedMessage<C> {
pub fn new(weight: Weight, message: Xcm<C>) -> Self {
Self(weight, message)
}
}

impl<Config: config::Config> ExecuteXcm<Config::RuntimeCall> for XcmExecutor<Config> {
type Prepared = WeighedMessage<Config::RuntimeCall>;
fn prepare(
Expand Down
16 changes: 16 additions & 0 deletions prdoc/pr_4202.prdoc
Original file line number Diff line number Diff line change
@@ -0,0 +1,16 @@
title: "Treat XCM ExceedsStackLimit errors as transient in the MQ pallet"

doc:
- audience: Runtime User
description: |
Fixes an issue where the MessageQueue can incorrectly assume that a message will permanently fail to process and disallow retrial of it.

crates:
- name: frame-support
bump: major
- name: pallet-message-queue
bump: patch
- name: staging-xcm-builder
bump: patch
ggwpez marked this conversation as resolved.
Show resolved Hide resolved
- name: staging-xcm-executor
bump: patch
16 changes: 14 additions & 2 deletions substrate/frame/message-queue/src/lib.rs
Original file line number Diff line number Diff line change
Expand Up @@ -765,6 +765,13 @@ enum MessageExecutionStatus {
Processed,
/// The message was processed and resulted in a, possibly permanent, error.
Unprocessable { permanent: bool },
/// The stack depth limit was reached.
///
/// We cannot just return `Unprocessable` in this case, because the processability of the
/// message depends on how the function was called. This may be a permanent error if it was
/// called by a top-level function, or a transient error if it was already called in a nested
/// function.
StackLimitReached,
}

impl<T: Config> Pallet<T> {
Expand Down Expand Up @@ -984,7 +991,8 @@ impl<T: Config> Pallet<T> {
// additional overweight event being deposited.
) {
Overweight | InsufficientWeight => Err(Error::<T>::InsufficientWeight),
Unprocessable { permanent: false } => Err(Error::<T>::TemporarilyUnprocessable),
StackLimitReached | Unprocessable { permanent: false } =>
Err(Error::<T>::TemporarilyUnprocessable),
Unprocessable { permanent: true } | Processed => {
page.note_processed_at_pos(pos);
book_state.message_count.saturating_dec();
Expand Down Expand Up @@ -1250,7 +1258,7 @@ impl<T: Config> Pallet<T> {
let is_processed = match res {
InsufficientWeight => return ItemExecutionStatus::Bailed,
Unprocessable { permanent: false } => return ItemExecutionStatus::NoProgress,
Processed | Unprocessable { permanent: true } => true,
Processed | Unprocessable { permanent: true } | StackLimitReached => true,
Overweight => false,
};

Expand Down Expand Up @@ -1461,6 +1469,10 @@ impl<T: Config> Pallet<T> {
Self::deposit_event(Event::<T>::ProcessingFailed { id: id.into(), origin, error });
MessageExecutionStatus::Unprocessable { permanent: true }
},
Err(error @ StackLimitReached) => {
Self::deposit_event(Event::<T>::ProcessingFailed { id: id.into(), origin, error });
MessageExecutionStatus::StackLimitReached
},
Ok(success) => {
// Success
let weight_used = meter.consumed().saturating_sub(prev_consumed);
Expand Down
3 changes: 3 additions & 0 deletions substrate/frame/message-queue/src/mock.rs
Original file line number Diff line number Diff line change
Expand Up @@ -198,6 +198,7 @@ impl ProcessMessage for RecordingMessageProcessor {

parameter_types! {
pub static Callback: Box<fn (&MessageOrigin, u32)> = Box::new(|_, _| {});
pub static IgnoreStackOvError: bool = false;
}

/// Processed a mocked message. Messages that end with `badformat`, `corrupt`, `unsupported` or
Expand All @@ -216,6 +217,8 @@ fn processing_message(msg: &[u8], origin: &MessageOrigin) -> Result<(), ProcessM
Err(ProcessMessageError::Unsupported)
} else if msg.ends_with("yield") {
Err(ProcessMessageError::Yield)
} else if msg.ends_with("stacklimitreached") && !IgnoreStackOvError::get() {
Err(ProcessMessageError::StackLimitReached)
} else {
Ok(())
}
Expand Down
101 changes: 98 additions & 3 deletions substrate/frame/message-queue/src/tests.rs
Original file line number Diff line number Diff line change
Expand Up @@ -174,9 +174,10 @@ fn service_queues_failing_messages_works() {
MessageQueue::enqueue_message(msg("badformat"), Here);
MessageQueue::enqueue_message(msg("corrupt"), Here);
MessageQueue::enqueue_message(msg("unsupported"), Here);
MessageQueue::enqueue_message(msg("stacklimitreached"), Here);
MessageQueue::enqueue_message(msg("yield"), Here);
// Starts with four pages.
assert_pages(&[0, 1, 2, 3]);
assert_pages(&[0, 1, 2, 3, 4]);

assert_eq!(MessageQueue::service_queues(1.into_weight()), 1.into_weight());
assert_last_event::<Test>(
Expand Down Expand Up @@ -206,9 +207,9 @@ fn service_queues_failing_messages_works() {
.into(),
);
assert_eq!(MessageQueue::service_queues(1.into_weight()), 1.into_weight());
assert_eq!(System::events().len(), 3);
assert_eq!(System::events().len(), 4);
// Last page with the `yield` stays in.
assert_pages(&[3]);
assert_pages(&[4]);
});
}

Expand Down Expand Up @@ -1880,3 +1881,97 @@ fn process_enqueued_on_idle_requires_enough_weight() {
assert_eq!(MessagesProcessed::take(), vec![]);
})
}

/// A message that reports `StackLimitReached` will not be put into the overweight queue when
/// executed from the top level.
#[test]
fn process_discards_stack_ov_message() {
use MessageOrigin::*;
build_and_execute::<Test>(|| {
MessageQueue::enqueue_message(msg("stacklimitreached"), Here);

MessageQueue::service_queues(10.into_weight());

assert_last_event::<Test>(
Event::ProcessingFailed {
id: blake2_256(b"stacklimitreached").into(),
origin: MessageOrigin::Here,
error: ProcessMessageError::StackLimitReached,
}
.into(),
);

assert!(MessagesProcessed::take().is_empty());
// Message is gone and not overweight:
assert_pages(&[]);
});
}

/// A message that reports `StackLimitReached` will stay in the overweight queue when it is executed
/// by `execute_overweight`.
#[test]
fn execute_overweight_keeps_stack_ov_message() {
use MessageOrigin::*;
build_and_execute::<Test>(|| {
// We need to create a mocked message that first reports insufficient weight, and then
// `StackLimitReached`:
IgnoreStackOvError::set(true);
MessageQueue::enqueue_message(msg("stacklimitreached"), Here);
MessageQueue::service_queues(0.into_weight());

assert_last_event::<Test>(
Event::OverweightEnqueued {
id: blake2_256(b"stacklimitreached"),
origin: MessageOrigin::Here,
message_index: 0,
page_index: 0,
}
.into(),
);
// Does not count as 'processed':
assert!(MessagesProcessed::take().is_empty());
assert_pages(&[0]);

// Now let it return `StackLimitReached`. Note that this case would normally not happen,
// since we assume that the top-level execution is the one with the most remaining stack
// depth.
IgnoreStackOvError::set(false);
// Ensure that trying to execute the message does not change any state (besides events).
System::reset_events();
let storage_noop = StorageNoopGuard::new();
assert_eq!(
<MessageQueue as ServiceQueues>::execute_overweight(3.into_weight(), (Here, 0, 0)),
Err(ExecuteOverweightError::Other)
);
assert_last_event::<Test>(
Event::ProcessingFailed {
id: blake2_256(b"stacklimitreached").into(),
origin: MessageOrigin::Here,
error: ProcessMessageError::StackLimitReached,
}
.into(),
);
System::reset_events();
drop(storage_noop);

// Now let's process it normally:
IgnoreStackOvError::set(true);
assert_eq!(
<MessageQueue as ServiceQueues>::execute_overweight(1.into_weight(), (Here, 0, 0))
.unwrap(),
1.into_weight()
);

assert_last_event::<Test>(
Event::Processed {
id: blake2_256(b"stacklimitreached").into(),
origin: MessageOrigin::Here,
weight_used: 1.into_weight(),
success: true,
}
.into(),
);
assert_pages(&[]);
System::reset_events();
});
}
4 changes: 4 additions & 0 deletions substrate/frame/support/src/traits/messages.rs
Original file line number Diff line number Diff line change
Expand Up @@ -46,6 +46,8 @@ pub enum ProcessMessageError {
/// the case that a queue is re-serviced within the same block after *yielding*. A queue is
/// not required to *yield* again when it is being re-serviced withing the same block.
Yield,
/// The message could not be processed for reaching the stack depth limit.
StackLimitReached,
}

/// Can process messages from a specific origin.
Expand Down Expand Up @@ -96,6 +98,8 @@ pub trait ServiceQueues {
/// - `weight_limit`: The maximum amount of dynamic weight that this call can use.
///
/// Returns the dynamic weight used by this call; is never greater than `weight_limit`.
/// Should only be called in top-level runtime entry points like `on_initialize` or `on_idle`.
/// Otherwise, stack depth limit errors may be miss-handled.
fn service_queues(weight_limit: Weight) -> Weight;

/// Executes a message that could not be executed by [`Self::service_queues()`] because it was
Expand Down
Loading