Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Add verify stories and rules actions in domain to rasa data validate #8645

Merged
merged 16 commits into from
May 18, 2021
Merged
Show file tree
Hide file tree
Changes from 14 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions changelog/7799.improvement.md
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
Updated validator used by `rasa data validate` to verify that actions used in stories and rules are present in the domain and that form slots match domain slots.
6 changes: 5 additions & 1 deletion rasa/cli/data.py
Original file line number Diff line number Diff line change
Expand Up @@ -273,7 +273,11 @@ def validate_stories(args: argparse.Namespace) -> None:


def _validate_domain(validator: "Validator") -> bool:
return validator.verify_domain_validity()
return (
validator.verify_domain_validity()
and validator.verify_actions_in_stories_rules()
and validator.verify_form_slots()
)


def _validate_nlu(validator: "Validator", args: argparse.Namespace) -> bool:
Expand Down
49 changes: 49 additions & 0 deletions rasa/validator.py
Original file line number Diff line number Diff line change
Expand Up @@ -192,6 +192,35 @@ def verify_utterances_in_stories(self, ignore_warnings: bool = True) -> bool:

return everything_is_alright

def verify_actions_in_stories_rules(self) -> bool:
"""Verifies that actions used in stories and rules are present in the domain."""
everything_is_alright = True
visited = set()

for story in self.story_graph.story_steps:
for event in story.events:
if not isinstance(event, ActionExecuted):
continue

if not event.action_name.startswith("action_"):
wochinge marked this conversation as resolved.
Show resolved Hide resolved
continue

if event.action_name in visited:
# we already processed this one before, we only want to warn once
continue

if event.action_name not in self.domain.action_names_or_texts:
rasa.shared.utils.io.raise_warning(
f"The action '{event.action_name}' is used in your stories or rules, but it "
f"is not listed in the domain file. You should add it to your "
f"domain file!",
docs=DOCS_URL_DOMAINS,
)
everything_is_alright = False
visited.add(event.action_name)

return everything_is_alright

def verify_story_structure(
self, ignore_warnings: bool = True, max_history: Optional[int] = None
) -> bool:
Expand Down Expand Up @@ -244,6 +273,26 @@ def verify_nlu(self, ignore_warnings: bool = True) -> bool:
stories_are_valid = self.verify_utterances_in_stories(ignore_warnings)
return intents_are_valid and stories_are_valid and there_is_no_duplication

def verify_form_slots(self) -> bool:
"""Verifies that form slots match the slot mappings in domain."""
domain_slot_names = [slot.name for slot in self.domain.slots]
everything_is_alright = True

for form in self.domain.form_names:
form_slots = self.domain.slot_mapping_for_form(form)
for slot in form_slots.keys():
if slot in domain_slot_names:
continue
else:
rasa.shared.utils.io.raise_warning(
f"The form slot '{slot}' in form '{form}' is not present in the domain slots."
wochinge marked this conversation as resolved.
Show resolved Hide resolved
f"Please add the correct slot or check for typos.",
docs=DOCS_URL_DOMAINS,
)
everything_is_alright = False

return everything_is_alright

def verify_domain_validity(self) -> bool:
"""Checks whether the domain returned by the importer is empty.

Expand Down
55 changes: 55 additions & 0 deletions tests/cli/test_rasa_data.py
Original file line number Diff line number Diff line change
Expand Up @@ -144,6 +144,61 @@ async def mock_from_importer(importer: TrainingDataImporter) -> Validator:
data.validate_files(args)


@pytest.mark.parametrize(
("file_type", "data_type"), [("stories", "story"), ("rules", "rule")]
)
def test_validate_files_action_not_found_invalid_domain(
file_type: Text, data_type: Text, tmp_path: Path
):
file_name = tmp_path / f"{file_type}.yml"
file_name.write_text(
f"""
version: "2.0"
{file_type}:
- {data_type}: test path
steps:
- intent: goodbye
- action: action_test
"""
)
args = {
"domain": "data/test_moodbot/domain.yml",
"data": [file_name],
"max_history": None,
"config": None,
}
with pytest.raises(SystemExit):
data.validate_files(namedtuple("Args", args.keys())(*args.values()))


def test_validate_files_form_slots_not_matching(tmp_path: Path):
domain_file_name = tmp_path / "domain.yml"
domain_file_name.write_text(
"""
version: "2.0"
forms:
name_form:
first_name:
- type: from_text
last_name:
- type: from_text
slots:
first_name:
type: text
last_nam:
type: text
"""
)
args = {
"domain": domain_file_name,
"data": None,
"max_history": None,
"config": None,
}
with pytest.raises(SystemExit):
data.validate_files(namedtuple("Args", args.keys())(*args.values()))


def test_validate_files_exit_early():
with pytest.raises(SystemExit) as pytest_e:
args = {
Expand Down
171 changes: 171 additions & 0 deletions tests/test_validator.py
Original file line number Diff line number Diff line change
Expand Up @@ -259,9 +259,180 @@ async def test_verify_there_is_not_example_repetition_in_intents():
assert validator.verify_example_repetition_in_intents(False)


async def test_verify_actions_in_stories_not_in_domain(
tmp_path: Path, domain_path: Text
):
story_file_name = tmp_path / "stories.yml"
story_file_name.write_text(
"""
version: "2.0"
stories:
- story: story path 1
steps:
- intent: greet
- action: action_test_1
"""
)

importer = RasaFileImporter(
domain_path=domain_path, training_data_paths=[story_file_name],
)
validator = await Validator.from_importer(importer)
with pytest.warns(UserWarning) as warning:
validity = validator.verify_actions_in_stories_rules()
assert validity is False

assert (
"The action 'action_test_1' is used in your stories or rules, "
"but it is not listed in the domain file." in warning[0].message.args[0]
)


async def test_verify_actions_in_rules_not_in_domain(tmp_path: Path, domain_path: Text):
rules_file_name = tmp_path / "rules.yml"
rules_file_name.write_text(
"""
version: "2.0"
rules:
- rule: rule path 1
steps:
- intent: goodbye
- action: action_test_2
"""
)
importer = RasaFileImporter(
domain_path=domain_path, training_data_paths=[rules_file_name],
)
validator = await Validator.from_importer(importer)
with pytest.warns(UserWarning) as warning:
validity = validator.verify_actions_in_stories_rules()
assert validity is False

assert (
"The action 'action_test_2' is used in your stories or rules, "
"but it is not listed in the domain file." in warning[0].message.args[0]
)


async def test_verify_form_slots_invalid_domain(tmp_path: Path):
domain = tmp_path / "domain.yml"
domain.write_text(
"""
version: "2.0"
forms:
name_form:
first_name:
- type: from_text
last_name:
- type: from_text
slots:
first_name:
type: text
last_nam:
type: text
"""
)
importer = RasaFileImporter(domain_path=domain)
validator = await Validator.from_importer(importer)
with pytest.warns(UserWarning) as w:
validity = validator.verify_form_slots()
assert validity is False

assert (
w[0].message.args[0]
== "The form slot 'last_name' in form 'name_form' is not present in the domain slots."
"Please add the correct slot or check for typos."
)


async def test_invalid_domain_mapping_policy():
importer = RasaFileImporter(
domain_path="data/test_domains/default_with_mapping.yml"
)
validator = await Validator.from_importer(importer)
assert validator.verify_domain_validity() is False


@pytest.mark.parametrize(
("file_name", "data_type"), [("stories", "story"), ("rules", "rule")]
)
async def test_valid_stories_rules_actions_in_domain(
file_name: Text, data_type: Text, tmp_path: Path
):
domain = tmp_path / "domain.yml"
domain.write_text(
"""
version: "2.0"
intents:
- greet
actions:
- action_greet
"""
)
file_name = tmp_path / f"{file_name}.yml"
file_name.write_text(
f"""
version: "2.0"
{file_name}:
- {data_type}: test path
steps:
- intent: greet
- action: action_greet
"""
)
importer = RasaFileImporter(domain_path=domain, training_data_paths=[file_name],)
validator = await Validator.from_importer(importer)
assert validator.verify_actions_in_stories_rules()


@pytest.mark.parametrize(
("file_name", "data_type"), [("stories", "story"), ("rules", "rule")]
)
async def test_valid_stories_rules_default_actions(
file_name: Text, data_type: Text, tmp_path: Path
):
domain = tmp_path / "domain.yml"
domain.write_text(
"""
version: "2.0"
intents:
- greet
"""
)
file_name = tmp_path / f"{file_name}.yml"
file_name.write_text(
f"""
version: "2.0"
{file_name}:
- {data_type}: test path
steps:
- intent: greet
- action: action_restart
"""
)
importer = RasaFileImporter(domain_path=domain, training_data_paths=[file_name],)
validator = await Validator.from_importer(importer)
assert validator.verify_actions_in_stories_rules()


async def test_valid_form_slots_in_domain(tmp_path: Path):
domain = tmp_path / "domain.yml"
domain.write_text(
"""
version: "2.0"
forms:
name_form:
first_name:
- type: from_text
last_name:
- type: from_text
slots:
first_name:
type: text
last_name:
type: text
"""
)
importer = RasaFileImporter(domain_path=domain)
validator = await Validator.from_importer(importer)
assert validator.verify_form_slots()