Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

feat: rely on rabbitmq dlq for computation errors handling #575

Merged
merged 7 commits into from
Jan 8, 2025
Merged
Original file line number Diff line number Diff line change
@@ -0,0 +1,17 @@
/*
* Copyright (c) 2024, RTE (http://www.rte-france.com)
* This Source Code Form is subject to the terms of the Mozilla Public
* License, v. 2.0. If a copy of the MPL was not distributed with this
* file, You can obtain one at http://mozilla.org/MPL/2.0/.
*/

package org.gridsuite.modification.server;

/**
 * Unchecked exception signalling that a build could not be carried out.
 *
 * <p>It carries a description and the underlying cause only; no state or behaviour
 * is added on top of {@link RuntimeException}.
 *
 * @author Joris Mancini <joris.mancini_externe at rte-france.com>
 */
public class BuildException extends RuntimeException {

    /**
     * Creates a build exception wrapping the failure that triggered it.
     *
     * @param message description of what failed
     * @param cause the underlying failure, retrievable through {@link #getCause()}
     */
    public BuildException(String message, Throwable cause) {
        super(message, cause);
    }
}

This file was deleted.

Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,7 @@
import com.fasterxml.jackson.databind.ObjectMapper;
import com.google.common.collect.Sets;
import lombok.NonNull;
import org.gridsuite.modification.server.BuildException;
import org.gridsuite.modification.server.dto.BuildInfos;
import org.gridsuite.modification.server.dto.NetworkModificationResult;
import org.slf4j.Logger;
Expand Down Expand Up @@ -46,8 +47,6 @@ public class BuildWorkerService {

private final BuildStoppedPublisherService stoppedPublisherService;

private final BuildFailedPublisherService failedPublisherService;

private final Map<String, CompletableFuture<NetworkModificationResult>> futures = new ConcurrentHashMap<>();

private final Map<String, BuildCancelContext> cancelBuildRequests = new ConcurrentHashMap<>();
Expand All @@ -61,12 +60,10 @@ public class BuildWorkerService {

public BuildWorkerService(@NonNull NetworkModificationService networkModificationService,
@NonNull ObjectMapper objectMapper,
@NonNull BuildStoppedPublisherService stoppedPublisherService,
@NonNull BuildFailedPublisherService failedPublisherService) {
@NonNull BuildStoppedPublisherService stoppedPublisherService) {
this.networkModificationService = networkModificationService;
this.objectMapper = objectMapper;
this.stoppedPublisherService = stoppedPublisherService;
this.failedPublisherService = failedPublisherService;
}

private CompletableFuture<NetworkModificationResult> execBuildVariant(BuildExecContext execContext, BuildInfos buildInfos) {
Expand Down Expand Up @@ -98,11 +95,11 @@ private CompletableFuture<NetworkModificationResult> execBuildVariant(BuildExecC
@Bean
public Consumer<Message<String>> consumeBuild() {
return message -> {
BuildExecContext execContext = null;
BuildExecContext execContext;
try {
execContext = BuildExecContext.fromMessage(message, objectMapper);
} catch (Exception e) {
LOGGER.error("Error retrieving message in consumeBuild", e);
throw new BuildException("Failed to read build message", e);
}
startBuild(Objects.requireNonNull(execContext));
};
Expand All @@ -113,7 +110,7 @@ private void startBuild(BuildExecContext execContext) {
BuildInfos buildInfos = execContext.getBuildInfos();
CompletableFuture<NetworkModificationResult> future = execBuildVariant(execContext, buildInfos);
NetworkModificationResult result;
if (future != null && (result = future.get()) != null) { // result available
if (future != null && (result = future.join()) != null) { // result available
notificationService.emitBuildResultMessage(result, execContext.getReceiver());
LOGGER.info("Build complete on node '{}'", execContext.getReceiver());
} else { // result not available : stop build request
Expand All @@ -123,13 +120,8 @@ private void startBuild(BuildExecContext execContext) {
}
} catch (CancellationException e) {
stoppedPublisherService.publishCancel(execContext.getReceiver(), CANCEL_MESSAGE);
} catch (InterruptedException e) {
LOGGER.error(FAIL_MESSAGE, e);
failedPublisherService.publishFail(execContext.getReceiver(), FAIL_MESSAGE + " : " + e.getMessage());
Thread.currentThread().interrupt();
} catch (Exception e) {
LOGGER.error(FAIL_MESSAGE, e);
failedPublisherService.publishFail(execContext.getReceiver(), FAIL_MESSAGE + " : " + e.getMessage());
throw new BuildException("Node build failed", e);
} finally {
futures.remove(execContext.getReceiver());
cancelBuildRequests.remove(execContext.getReceiver());
Expand Down
16 changes: 13 additions & 3 deletions src/main/resources/config/application.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -21,6 +21,7 @@ spring:
group: buildGroup
consumer:
concurrency: 2
max-attempts: 1
publishBuild-out-0:
destination: ${powsybl-ws.rabbitmq.destination.prefix:}build.run
publishResultBuild-out-0:
Expand All @@ -31,9 +32,18 @@ spring:
destination: ${powsybl-ws.rabbitmq.destination.prefix:}build.cancel
publishStoppedBuild-out-0:
destination: ${powsybl-ws.rabbitmq.destination.prefix:}build.stopped
publishFailedBuild-out-0:
destination: ${powsybl-ws.rabbitmq.destination.prefix:}build.failed
output-bindings: publishBuild-out-0;publishResultBuild-out-0;publishCancelBuild-out-0;publishStoppedBuild-out-0;publishFailedBuild-out-0
output-bindings: publishBuild-out-0;publishResultBuild-out-0;publishCancelBuild-out-0;publishStoppedBuild-out-0
rabbit:
bindings:
consumeBuild-in-0:
consumer:
auto-bind-dlq: true
dead-letter-exchange: ${powsybl-ws.rabbitmq.destination.prefix:}build.run.dlx
dead-letter-queue-name: ${powsybl-ws.rabbitmq.destination.prefix:}build.run.dlx.dlq
dead-letter-exchange-type: topic
quorum:
enabled: true
delivery-limit: 2

powsybl-ws:
database:
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -72,9 +72,6 @@
import static com.powsybl.iidm.network.ReactiveLimitsKind.MIN_MAX;
import static org.gridsuite.modification.server.impacts.TestImpactUtils.*;
import static org.gridsuite.modification.server.service.BuildWorkerService.CANCEL_MESSAGE;
import static org.gridsuite.modification.server.service.BuildWorkerService.FAIL_MESSAGE;
import static org.hamcrest.MatcherAssert.assertThat;
import static org.hamcrest.Matchers.startsWith;
import static org.junit.jupiter.api.Assertions.*;
import static org.mockito.ArgumentMatchers.any;
import static org.mockito.ArgumentMatchers.eq;
Expand Down Expand Up @@ -127,9 +124,6 @@ class BuildTest {
@Value("${spring.cloud.stream.bindings.publishStoppedBuild-out-0.destination}")
private String buildStoppedDestination;

@Value("${spring.cloud.stream.bindings.publishFailedBuild-out-0.destination}")
private String buildFailedDestination;

@Autowired
private OutputDestination output;

Expand Down Expand Up @@ -910,9 +904,6 @@ void runBuildWithReportErrorTest(final MockWebServer server) throws Exception {
assertTrue(TestUtils.getRequestsDone(1, server).stream().anyMatch(r -> r.matches("/v1/reports/.*")));

assertNull(output.receive(TIMEOUT, buildResultDestination));
Message<byte[]> message = output.receive(TIMEOUT * 3, buildFailedDestination);
assertEquals("me", message.getHeaders().get("receiver"));
assertThat((String) message.getHeaders().get("message"), startsWith(FAIL_MESSAGE));
TheMaskedTurtle marked this conversation as resolved.
Show resolved Hide resolved
Message<byte[]> buildMessage = output.receive(TIMEOUT, consumeBuildDestination);
assertNotNull(buildMessage);
assertEquals("me", buildMessage.getHeaders().get("receiver"));
Expand Down Expand Up @@ -970,7 +961,7 @@ private void testNetworkModificationsCount(UUID groupUuid, int actualSize) {

@AfterEach
void tearDown(final MockWebServer server) {
List<String> destinations = List.of(consumeBuildDestination, cancelBuildDestination, buildResultDestination, buildStoppedDestination, buildFailedDestination);
List<String> destinations = List.of(consumeBuildDestination, cancelBuildDestination, buildResultDestination, buildStoppedDestination);
TestUtils.assertQueuesEmptyThenClear(destinations, output);
try {
TestUtils.assertServerRequestsEmptyThenShutdown(server);
Expand Down
Loading