RasaHQ · dakshvar22 · Jul 12, 2021 · Jul 8, 2021 · Jul 8, 2021 · Jul 9, 2021
diff --git a/rasa/core/test.py b/rasa/core/test.py
@@ -26,6 +26,9 @@
 from rasa.shared.core.training_data.story_writer.yaml_story_writer import (
     YAMLStoryWriter,
 )
+from rasa.shared.core.training_data.structures import (
+    StoryStep,
+)
 from rasa.shared.core.domain import Domain
 from rasa.nlu.constants import (
     RESPONSE_SELECTOR_DEFAULT_INTENT,
@@ -680,9 +683,7 @@ def _collect_action_executed_predictions(
             action_predictions=[predicted_action], action_targets=[expected_action]
         )
 
-    if action_executed_eval_store.has_prediction_target_mismatch() or (
-        predicted_action_unlikely_intent and predicted_action != expected_action
-    ):
+    if action_executed_eval_store.has_prediction_target_mismatch():
         partial_tracker.update(
             WronglyPredictedAction(
                 expected_action_name,
@@ -698,7 +699,7 @@ def _collect_action_executed_predictions(
         if (
             fail_on_prediction_errors
             and predicted_action != ACTION_UNLIKELY_INTENT_NAME
-            and expected_action != ACTION_UNLIKELY_INTENT_NAME
+            and predicted_action != expected_action
         ):
             story_dump = YAMLStoryWriter().dumps(partial_tracker.as_story().story_steps)
             error_msg = (
@@ -972,6 +973,20 @@ async def _collect_story_predictions(
     )
 
 
+def _filter_step_events(step: StoryStep) -> StoryStep:
+    """Removes correctly predicted `action_unlikely_intent` events from a step.
+
+    A `WronglyPredictedAction` event whose expected and predicted action names
+    both equal `ACTION_UNLIKELY_INTENT_NAME` is left out; every other event is
+    kept in its original order.
+
+    Args:
+        step: The story step whose events should be filtered.
+
+    Returns:
+        A copy of `step` (created with `use_new_id=False`) that holds only the
+        events that were kept.
+    """
+    # `isinstance` instead of an exact `type(...) ==` comparison, so subclasses
+    # of `WronglyPredictedAction` are treated the same way.
+    events = [
+        event
+        for event in step.events
+        if not (
+            isinstance(event, WronglyPredictedAction)
+            and event.action_name == ACTION_UNLIKELY_INTENT_NAME
+            and event.action_name_prediction == ACTION_UNLIKELY_INTENT_NAME
+        )
+    ]
+    updated_step = step.create_copy(use_new_id=False)
+    updated_step.events = events
+    return updated_step
+
+
 def _log_stories(
     trackers: List[DialogueStateTracker], file_path: Text, message_if_no_trackers: Text
 ) -> None:
@@ -981,7 +996,7 @@ def _log_stories(
             f.write(f"# {message_if_no_trackers}")
         else:
             stories = [tracker.as_story(include_source=True) for tracker in trackers]
-            steps = [step for story in stories for step in story.story_steps]
+            steps = [_filter_step_events(step) for story in stories for step in story.story_steps]
             f.write(YAMLStoryWriter().dumps(steps))
 
 

diff --git a/tests/core/test_test.py b/tests/core/test_test.py
@@ -256,13 +256,54 @@ async def test_action_unlikely_intent_correctly_predicted(
     )
 
     result = await rasa.core.test.test(
-        str(file_name), agent, out_directory=str(tmp_path),
+        str(file_name), agent, out_directory=str(tmp_path), fail_on_prediction_errors = True
     )
     assert "report" in result.keys()
     assert result["report"]["conversation_accuracy"]["correct"] == 1
     assert result["report"]["conversation_accuracy"]["with_warnings"] == 0
 
 
+async def test_action_unlikely_intent_fail_on_prediction_errors(
+    monkeypatch: MonkeyPatch, tmp_path: Path, moodbot_domain: Domain
+):
+    """Checks that `rasa.core.test.test` raises with `fail_on_prediction_errors`.
+
+    The story written below serves as both the training data and the test
+    story. Evaluating it with `fail_on_prediction_errors=True` is expected to
+    raise `WrongPredictionException`.
+    """
+    # Presumably forces the ensemble to predict `action_unlikely_intent` after
+    # the `mood_unhappy` intent - confirm against the helper's definition.
+    monkeypatch.setattr(
+        SimplePolicyEnsemble,
+        "probabilities_using_best_policy",
+        _probabilities_with_action_unlikely_intent_for(["mood_unhappy"]),
+    )
+
+    file_name = tmp_path / "test_action_unlikely_intent_2.yml"
+    file_name.write_text(
+        """
+        version: "2.0"
+        stories:
+          - story: unlikely path (with action_unlikely_intent)
+            steps:
+              - user: |
+                  very terrible
+                intent: mood_unhappy
+              - action: utter_cheer_up
+              - action: action_unlikely_intent
+              - action: utter_did_that_help
+              - intent: affirm
+              - action: utter_happy
+        """
+    )
+
+    # We train on the above story so that RulePolicy can memorize
+    # it and we don't have to worry about other actions being
+    # predicted correctly.
+    agent = await _train_rule_based_agent(
+        moodbot_domain, file_name, monkeypatch, ignore_action_unlikely_intent=False
+    )
+
+    # The return value is irrelevant here: the call itself must raise.
+    with pytest.raises(rasa.core.test.WrongPredictionException):
+        await rasa.core.test.test(
+            str(file_name),
+            agent,
+            out_directory=str(tmp_path),
+            fail_on_prediction_errors=True,
+        )
+
+
+
 async def test_wrong_action_after_action_unlikely_intent(
     monkeypatch: MonkeyPatch, tmp_path: Path, moodbot_domain: Domain
 ):