Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

GOTH - Power outage test #668

Merged
merged 4 commits into from
Sep 27, 2021
Merged
Changes from 2 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
112 changes: 112 additions & 0 deletions tests/goth_tests/test_power_outage.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,112 @@
import logging
import os
from pathlib import Path
from typing import List

import pytest

from goth.assertions import EventStream
from goth.configuration import load_yaml, Override
from goth.runner.log import configure_logging
from goth.runner import Runner
from goth.runner.probe import RequestorProbe, ProviderProbe

from yapapi.log import SummaryLogger

from .assertions import assert_no_errors, assert_tasks_processed


logger = logging.getLogger("goth.test.power_outage")

ALL_TASKS = {"0", "10", "20", "30", "40", "50"}


# Temporal assertions expressing properties of sequences of "events". In this case, each "event"
# is just a line of output from `blender.py`.


async def assert_all_tasks_started(output_lines: EventStream[str]):
"""Assert that for every task a line with `Task started on provider` will appear."""
await assert_tasks_processed(ALL_TASKS, "started on provider", output_lines)


async def assert_all_tasks_computed(output_lines: EventStream[str]):
"""Assert that for every task a line with `Task computed by provider` will appear."""
await assert_tasks_processed(ALL_TASKS, "finished by provider", output_lines)


""" Test when provider has a power outage.

Start a regular blender task, when the first task is started on the provider it gets
shut down. The requestor is supposed to send all tasks to the other machine and complete
the task. The invoice for the power-outage provider will not be paid. """


@pytest.mark.asyncio
async def test_power_outage(
project_dir: Path, log_dir: Path, goth_config_path: Path, config_overrides: List[Override]
) -> None:

# This is the default configuration with 2 wasm/VM providers
goth_config = load_yaml(goth_config_path, config_overrides)

blender_path = project_dir / "examples" / "blender" / "blender.py"

configure_logging(log_dir)

runner = Runner(
base_log_dir=log_dir,
compose_config=goth_config.compose_config,
)

async with runner(goth_config.containers):

requestor = runner.get_probes(probe_type=RequestorProbe)[0]
provider_1 = runner.get_probes(probe_type=ProviderProbe)[0]

async with requestor.run_command_on_host(
f"{blender_path} --subnet-tag goth",
env=os.environ,
) as (_cmd_task, cmd_monitor):

# Add assertions to the command output monitor `cmd_monitor`:
cmd_monitor.add_assertion(assert_no_errors)
all_sent = cmd_monitor.add_assertion(assert_all_tasks_started)
all_computed = cmd_monitor.add_assertion(assert_all_tasks_computed)

await cmd_monitor.wait_for_pattern(".*Received proposals from 2 ", timeout=20)
logger.info("Received proposals")

await cmd_monitor.wait_for_pattern(".*Agreement proposed ", timeout=10)
logger.info("Agreement proposed")

await cmd_monitor.wait_for_pattern(".*Agreement confirmed ", timeout=10)
logger.info("Agreement confirmed")

await cmd_monitor.wait_for_pattern(
".*Task started on provider 'provider-1'.*", timeout=10
)

logger.debug("Stopping provider 1")
await provider_1.stop()
provider_1.container.stop()
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Since goth version 0.7.2 (latest patch release) Container.stop gets called as part of Probe.stop, so this line is no longer necessary. :)

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

awesome, goth keeps getting better :D

logger.info("Provider 1 stopped.")
provider_1.container.restart()
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

And this shouldn't be necessary with goth version 0.7.3. :D

Copy link
Contributor Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

great! can update this in a cleanup PR if needed :)


await cmd_monitor.wait_for_pattern(".*Terminated agreement with provider-1")
logger.info("Agreement properly terminated")

await all_sent.wait_for_result(timeout=120)
logger.info("All tasks sent")

await all_computed.wait_for_result(timeout=120)
logger.info("All tasks computed, waiting for Golem shutdown")

await cmd_monitor.wait_for_pattern(".*Unpaid agreements: .*")
logger.info("Expected 1 unpaid agreement")
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Suggested change
logger.info("Expected 1 unpaid agreement")
logger.info("Found expected unpaid agreement")


await cmd_monitor.wait_for_pattern(
f".*{SummaryLogger.GOLEM_SHUTDOWN_SUCCESSFUL_MESSAGE}", timeout=120
)

logger.info("Requestor script finished")