diff --git a/.github/workflows/dockerimage-clang-3.9-ubuntu-mpich.yml b/.github/workflows/dockerimage-clang-3.9-ubuntu-mpich.yml index bc835d2f77..ff1fd7e498 100644 --- a/.github/workflows/dockerimage-clang-3.9-ubuntu-mpich.yml +++ b/.github/workflows/dockerimage-clang-3.9-ubuntu-mpich.yml @@ -32,7 +32,7 @@ jobs: steps: - name: Setup Build Root - uses: allenevans/set-env@v1.0.0 + uses: allenevans/set-env@v2.0.1 with: BUILD_ROOT: "~/.local/cache/${{ env.ARCH }}-ubuntu-${{ env.UBUNTU }}-${{ env.COMPILER }}-cache/" - name: Prepare caching timestamp diff --git a/.github/workflows/dockerimage-clang-5.0-ubuntu-mpich.yml b/.github/workflows/dockerimage-clang-5.0-ubuntu-mpich.yml index c0a7c2ec5c..67947049b3 100644 --- a/.github/workflows/dockerimage-clang-5.0-ubuntu-mpich.yml +++ b/.github/workflows/dockerimage-clang-5.0-ubuntu-mpich.yml @@ -32,7 +32,7 @@ jobs: steps: - name: Setup Build Root - uses: allenevans/set-env@v1.0.0 + uses: allenevans/set-env@v2.0.1 with: BUILD_ROOT: "~/.local/cache/${{ env.ARCH }}-ubuntu-${{ env.UBUNTU }}-${{ env.COMPILER }}-cache/" - name: Prepare caching timestamp diff --git a/.github/workflows/dockerimage-clang-8-alpine-mpich.yml b/.github/workflows/dockerimage-clang-8-alpine-mpich.yml index 59262f1295..e39622cab5 100644 --- a/.github/workflows/dockerimage-clang-8-alpine-mpich.yml +++ b/.github/workflows/dockerimage-clang-8-alpine-mpich.yml @@ -25,7 +25,7 @@ jobs: steps: - name: Setup Build Root - uses: allenevans/set-env@v1.0.0 + uses: allenevans/set-env@v2.0.1 with: BUILD_ROOT: "~/.local/cache/${{ env.ARCH }}-alpine-${{ env.COMPILER }}-cache/" - name: Prepare caching timestamp diff --git a/.github/workflows/dockerimage-gcc-5-ubuntu-mpich.yml b/.github/workflows/dockerimage-gcc-5-ubuntu-mpich.yml index cc83907f81..ecfd8bbfcc 100644 --- a/.github/workflows/dockerimage-gcc-5-ubuntu-mpich.yml +++ b/.github/workflows/dockerimage-gcc-5-ubuntu-mpich.yml @@ -32,7 +32,7 @@ jobs: steps: - name: Setup Build Root - uses: allenevans/set-env@v1.0.0 + uses: allenevans/set-env@v2.0.1 with: BUILD_ROOT: "~/.local/cache/${{ env.ARCH }}-ubuntu-${{ env.UBUNTU }}-${{ env.COMPILER }}-cache/" - name: Prepare caching timestamp diff --git a/.github/workflows/dockerimage-gcc-6-ubuntu-mpich.yml b/.github/workflows/dockerimage-gcc-6-ubuntu-mpich.yml index fc1aa72b73..40c9bd90b6 100644 --- a/.github/workflows/dockerimage-gcc-6-ubuntu-mpich.yml +++ b/.github/workflows/dockerimage-gcc-6-ubuntu-mpich.yml @@ -32,7 +32,7 @@ jobs: steps: - name: Setup Build Root - uses: allenevans/set-env@v1.0.0 + uses: allenevans/set-env@v2.0.1 with: BUILD_ROOT: "~/.local/cache/${{ env.ARCH }}-ubuntu-${{ env.UBUNTU }}-${{ env.COMPILER }}-cache/" - name: Prepare caching timestamp diff --git a/.github/workflows/dockerimage-gcc-7-ubuntu-mpich.yml b/.github/workflows/dockerimage-gcc-7-ubuntu-mpich.yml index 5e00b71282..6fbcce3926 100644 --- a/.github/workflows/dockerimage-gcc-7-ubuntu-mpich.yml +++ b/.github/workflows/dockerimage-gcc-7-ubuntu-mpich.yml @@ -31,7 +31,7 @@ jobs: steps: - name: Setup Build Root - uses: allenevans/set-env@v1.0.0 + uses: allenevans/set-env@v2.0.1 with: BUILD_ROOT: "~/.local/cache/${{ env.ARCH }}-ubuntu-${{ env.UBUNTU }}-${{ env.COMPILER }}-cache/" - name: Prepare caching timestamp diff --git a/.github/workflows/dockerimage-gcc-8-ubuntu-mpich.yml b/.github/workflows/dockerimage-gcc-8-ubuntu-mpich.yml index 8f7f5a2f93..1864bb5b2b 100644 --- a/.github/workflows/dockerimage-gcc-8-ubuntu-mpich.yml +++ b/.github/workflows/dockerimage-gcc-8-ubuntu-mpich.yml @@ -32,7 +32,7 @@ jobs: steps: - name: Setup Build Root - uses: allenevans/set-env@v1.0.0 + uses: allenevans/set-env@v2.0.1 with: BUILD_ROOT: "~/.local/cache/${{ env.ARCH }}-ubuntu-${{ env.UBUNTU }}-${{ env.COMPILER }}-cache/" - name: Prepare caching timestamp diff --git a/.github/workflows/dockerimage-intel-18-ubuntu-mpich.yml b/.github/workflows/dockerimage-intel-18-ubuntu-mpich.yml index 2a6e56da92..8e8d79e376 100644 --- a/.github/workflows/dockerimage-intel-18-ubuntu-mpich.yml +++ b/.github/workflows/dockerimage-intel-18-ubuntu-mpich.yml @@ -32,7 +32,7 @@ jobs: steps: - name: Setup Build Root - uses: allenevans/set-env@v1.0.0 + uses: allenevans/set-env@v2.0.1 with: BUILD_ROOT: "~/.local/cache/${{ env.ARCH }}-ubuntu-${{ env.UBUNTU }}-${{ env.COMPILER }}-cache/" - name: Prepare caching timestamp diff --git a/ci/azure/azure-intel-19-ubuntu-mpich.yml b/ci/azure/azure-intel-19-ubuntu-mpich.yml new file mode 100644 index 0000000000..0e28d769dc --- /dev/null +++ b/ci/azure/azure-intel-19-ubuntu-mpich.yml @@ -0,0 +1,145 @@ +############################################################################### +############## Warning this is a generated file---do not modify ############### +############################################################################### + +name: PR tests (intel 19, ubuntu, mpich) + +trigger: + branches: + include: + - develop + - 1.0.0* + +pr: + branches: + include: + - '*' + + +resources: +- repo: self + +variables: + tag: '$(Build.BuildId)' + REPO: lifflander1/vt + ARCH: amd64 + UBUNTU: 18.04 + COMPILER_TYPE: intel + COMPILER: icc-19 + BUILD_TYPE: release + ULIMIT_CORE: 0 + CODE_COVERAGE: 0 + VT_LB: 1 + VT_TRACE: 1 + VT_TRACE_RT: 0 + VT_MIMALLOC: 0 + VT_DOCS: 0 + VT_ASAN: 0 + VT_POOL: 0 + VT_EXTENDED_TESTS: 0 + VT_UNITY_BUILD: 1 + VT_ZOLTAN: 0 + VT_CI_BUILD: 1 + VT_DIAGNOSTICS: 1 + CACHE: "$(Agent.TempDirectory)/cache/" + cache_name: ubuntu-intel-19-cache + build_root: "$(CACHE)/$(ARCH)-ubuntu-$(UBUNTU)-$(COMPILER)-cache/" + TS: 0 + TS_YEAR: 0 + TS_MONTH: 0 + TS_DAY: 0 + +stages: +- stage: Build + displayName: Build image + jobs: + - job: Build + displayName: Build + pool: + vmImage: 'ubuntu-18.04' + timeoutInMinutes: 180 + steps: + - task: Bash@3 + displayName: Job setup + inputs: + targetType: 'inline' + script: | + echo setup + - task: Bash@3 + displayName: Build timestep for caching + inputs: + targetType: 'inline' + script: | + echo 'string(TIMESTAMP current_date "%H;%M;%S" UTC)' > script + echo 'execute_process(COMMAND ${CMAKE_COMMAND} -E echo "${current_date}")' >> script + val=$(cmake -P script) + echo "##vso[task.setvariable variable=TS]$val" + echo 'string(TIMESTAMP current_date "%Y" UTC)' > script + echo 'execute_process(COMMAND ${CMAKE_COMMAND} -E echo "${current_date}")' >> script + val=$(cmake -P script) + echo "##vso[task.setvariable variable=TS_YEAR]$val" + echo 'string(TIMESTAMP current_date "%m" UTC)' > script + echo 'execute_process(COMMAND ${CMAKE_COMMAND} -E echo "${current_date}")' >> script + val=$(cmake -P script) + echo "##vso[task.setvariable variable=TS_MONTH]$val" + echo 'string(TIMESTAMP current_date "%d" UTC)' > script + echo 'execute_process(COMMAND ${CMAKE_COMMAND} -E echo "${current_date}")' >> script + val=$(cmake -P script) + echo "##vso[task.setvariable variable=TS_DAY]$val" + - task: Bash@3 + displayName: Output timestamp for caching + inputs: + targetType: 'inline' + script: 'echo "my pipeline variable is $(TS) $(TS_YEAR) $(TS_MONTH) $(TS_DAY)"' + - task: Cache@2 + displayName: Update cache + inputs: + securityNamespace: cache + key: $(Agent.OS) | "$(cache_name)" | $(TS_YEAR) | $(TS_MONTH) | $(TS_DAY) | $(TS) + path: '$(build_root)/ccache' + restoreKeys: | + $(Agent.OS) | "$(cache_name)" | $(TS_YEAR) | $(TS_MONTH) | $(TS_DAY) + $(Agent.OS) | "$(cache_name)" | $(TS_YEAR) | $(TS_MONTH) + $(Agent.OS) | "$(cache_name)" | $(TS_YEAR) + $(Agent.OS) | "$(cache_name)" + - task: DockerCompose@0 + displayName: Pull container + inputs: + containerregistrytype: 'Container Registry' + dockerComposeFile: '**/docker-compose.yml' + action: 'Run a Docker Compose command' + dockerComposeCommand: 'pull --ignore-pull-failures ubuntu-cpp-clean' + - task: DockerCompose@0 + displayName: Build container + inputs: + containerregistrytype: 'Container Registry' + dockerComposeFile: '**/docker-compose.yml' + action: 'Run a Docker Compose command' + dockerComposeCommand: 'run ubuntu-cpp-clean' + - task: DockerCompose@0 + displayName: Push container to registry + inputs: + containerregistrytype: 'Container Registry' + dockerRegistryEndpoint: 'dockerRegistryConnection1' + dockerComposeFile: '**/docker-compose.yml' + action: 'Run a Docker Compose command' + dockerComposeCommand: 'push ubuntu-cpp-clean' + - task: Bash@3 + displayName: Create artifacts + inputs: + targetType: 'inline' + script: | + zip -j $(Agent.TempDirectory)/LastTest.log.gz $(build_root)/vt/Testing/Temporary/LastTest.log + zip -j $(Agent.TempDirectory)/cmake-output.log.gz $(build_root)/vt/cmake-output.log + - task: PublishPipelineArtifact@1 + displayName: Upload CMake test output artifact + inputs: + targetPath: '$(Agent.TempDirectory)/LastTest.log.gz' + artifact: 'CMakeLastTestLog' + publishLocation: 'pipeline' + - task: PublishPipelineArtifact@1 + displayName: Upload CMake full output artifact + inputs: + targetPath: '$(Agent.TempDirectory)/cmake-output.log.gz' + artifact: 'CMakeOutputLog' + publishLocation: 'pipeline' diff --git a/ci/azure/azure-nvidia-10-ubuntu-mpich.yml b/ci/azure/azure-nvidia-10-ubuntu-mpich.yml new file mode 100644 index 0000000000..4cd8460b45 --- /dev/null +++ b/ci/azure/azure-nvidia-10-ubuntu-mpich.yml @@ -0,0 +1,145 @@ +############################################################################### +############## Warning this is a generated file---do not modify ############### +############################################################################### + +name: PR tests (nvidia cuda 10.1, ubuntu, mpich) + +trigger: + branches: + include: + - develop + - 1.0.0* + +pr: + branches: + include: + - '*' + + +resources: +- repo: self + +variables: + tag: '$(Build.BuildId)' + REPO: lifflander1/vt + ARCH: amd64 + UBUNTU: 18.04 + COMPILER_TYPE: nvidia + COMPILER: nvcc-10 + BUILD_TYPE: release + ULIMIT_CORE: 0 + CODE_COVERAGE: 0 + VT_LB: 1 + VT_TRACE: 1 + VT_TRACE_RT: 0 + VT_MIMALLOC: 0 + VT_DOCS: 0 + VT_ASAN: 0 + VT_POOL: 0 + VT_EXTENDED_TESTS: 0 + VT_UNITY_BUILD: 1 + VT_ZOLTAN: 0 + VT_CI_BUILD: 1 + VT_DIAGNOSTICS: 0 + CACHE: "$(Agent.TempDirectory)/cache/" + cache_name: ubuntu-nvidia-10-cache + build_root: "$(CACHE)/$(ARCH)-ubuntu-$(UBUNTU)-$(COMPILER)-cache/" + TS: 0 + TS_YEAR: 0 + TS_MONTH: 0 + TS_DAY: 0 + +stages: +- stage: Build + displayName: Build image + jobs: + - job: Build + displayName: Build + pool: + vmImage: 'ubuntu-18.04' + timeoutInMinutes: 180 + steps: + - task: Bash@3 + displayName: Job setup + inputs: + targetType: 'inline' + script: | + echo setup + - task: Bash@3 + displayName: Build timestep for caching + inputs: + targetType: 'inline' + script: | + echo 'string(TIMESTAMP current_date "%H;%M;%S" UTC)' > script + echo 'execute_process(COMMAND ${CMAKE_COMMAND} -E echo "${current_date}")' >> script + val=$(cmake -P script) + echo "##vso[task.setvariable variable=TS]$val" + echo 'string(TIMESTAMP current_date "%Y" UTC)' > script + echo 'execute_process(COMMAND ${CMAKE_COMMAND} -E echo "${current_date}")' >> script + val=$(cmake -P script) + echo "##vso[task.setvariable variable=TS_YEAR]$val" + echo 'string(TIMESTAMP current_date "%m" UTC)' > script + echo 'execute_process(COMMAND ${CMAKE_COMMAND} -E echo "${current_date}")' >> script + val=$(cmake -P script) + echo "##vso[task.setvariable variable=TS_MONTH]$val" + echo 'string(TIMESTAMP current_date "%d" UTC)' > script + echo 'execute_process(COMMAND ${CMAKE_COMMAND} -E echo "${current_date}")' >> script + val=$(cmake -P script) + echo "##vso[task.setvariable variable=TS_DAY]$val" + - task: Bash@3 + displayName: Output timestamp for caching + inputs: + targetType: 'inline' + script: 'echo "my pipeline variable is $(TS) $(TS_YEAR) $(TS_MONTH) $(TS_DAY)"' + - task: Cache@2 + displayName: Update cache + inputs: + securityNamespace: cache + key: $(Agent.OS) | "$(cache_name)" | $(TS_YEAR) | $(TS_MONTH) | $(TS_DAY) | $(TS) + path: '$(build_root)/ccache' + restoreKeys: | + $(Agent.OS) | "$(cache_name)" | $(TS_YEAR) | $(TS_MONTH) | $(TS_DAY) + $(Agent.OS) | "$(cache_name)" | $(TS_YEAR) | $(TS_MONTH) + $(Agent.OS) | "$(cache_name)" | $(TS_YEAR) + $(Agent.OS) | "$(cache_name)" + - task: DockerCompose@0 + displayName: Pull container + inputs: + containerregistrytype: 'Container Registry' + dockerComposeFile: '**/docker-compose.yml' + action: 'Run a Docker Compose command' + dockerComposeCommand: 'pull --ignore-pull-failures ubuntu-cpp-clean' + - task: DockerCompose@0 + displayName: Build container + inputs: + containerregistrytype: 'Container Registry' + dockerComposeFile: '**/docker-compose.yml' + action: 'Run a Docker Compose command' + dockerComposeCommand: 'run ubuntu-cpp-clean' + - task: DockerCompose@0 + displayName: Push container to registry + inputs: + containerregistrytype: 'Container Registry' + dockerRegistryEndpoint: 'dockerRegistryConnection1' + dockerComposeFile: '**/docker-compose.yml' + action: 'Run a Docker Compose command' + dockerComposeCommand: 'push ubuntu-cpp-clean' + - task: Bash@3 + displayName: Create artifacts + inputs: + targetType: 'inline' + script: | + zip -j $(Agent.TempDirectory)/LastTest.log.gz $(build_root)/vt/Testing/Temporary/LastTest.log + zip -j $(Agent.TempDirectory)/cmake-output.log.gz $(build_root)/vt/cmake-output.log + - task: PublishPipelineArtifact@1 + displayName: Upload CMake test output artifact + inputs: + targetPath: '$(Agent.TempDirectory)/LastTest.log.gz' + artifact: 'CMakeLastTestLog' + publishLocation: 'pipeline' + - task: PublishPipelineArtifact@1 + displayName: Upload CMake full output artifact + inputs: + targetPath: '$(Agent.TempDirectory)/cmake-output.log.gz' + artifact: 'CMakeOutputLog' + publishLocation: 'pipeline' diff --git a/ci/azure/azure-nvidia-11-ubuntu-mpich.yml b/ci/azure/azure-nvidia-11-ubuntu-mpich.yml new file mode 100644 index 0000000000..ccd27e71f4 --- /dev/null +++ b/ci/azure/azure-nvidia-11-ubuntu-mpich.yml @@ -0,0 +1,145 @@ +############################################################################### +############## Warning this is a generated file---do not modify ############### +############################################################################### + +name: PR tests (nvidia cuda 11.0, ubuntu, mpich) + +trigger: + branches: + include: + - develop + - 1.0.0* + +pr: + branches: + include: + - '*' + + +resources: +- repo: self + +variables: + tag: '$(Build.BuildId)' + REPO: lifflander1/vt + ARCH: amd64 + UBUNTU: 18.04 + COMPILER_TYPE: nvidia + COMPILER: nvcc-11 + BUILD_TYPE: release + ULIMIT_CORE: 0 + CODE_COVERAGE: 0 + VT_LB: 1 + VT_TRACE: 1 + VT_TRACE_RT: 0 + VT_MIMALLOC: 0 + VT_DOCS: 0 + VT_ASAN: 0 + VT_POOL: 0 + VT_EXTENDED_TESTS: 0 + VT_UNITY_BUILD: 1 + VT_ZOLTAN: 0 + VT_CI_BUILD: 1 + VT_DIAGNOSTICS: 0 + CACHE: "$(Agent.TempDirectory)/cache/" + cache_name: ubuntu-nvidia-11-cache + build_root: "$(CACHE)/$(ARCH)-ubuntu-$(UBUNTU)-$(COMPILER)-cache/" + TS: 0 + TS_YEAR: 0 + TS_MONTH: 0 + TS_DAY: 0 + +stages: +- stage: Build + displayName: Build image + jobs: + - job: Build + displayName: Build + pool: + vmImage: 'ubuntu-18.04' + timeoutInMinutes: 180 + steps: + - task: Bash@3 + displayName: Job setup + inputs: + targetType: 'inline' + script: | + echo setup + - task: Bash@3 + displayName: Build timestep for caching + inputs: + targetType: 'inline' + script: | + echo 'string(TIMESTAMP current_date "%H;%M;%S" UTC)' > script + echo 'execute_process(COMMAND ${CMAKE_COMMAND} -E echo "${current_date}")' >> script + val=$(cmake -P script) + echo "##vso[task.setvariable variable=TS]$val" + echo 'string(TIMESTAMP current_date "%Y" UTC)' > script + echo 'execute_process(COMMAND ${CMAKE_COMMAND} -E echo "${current_date}")' >> script + val=$(cmake -P script) + echo "##vso[task.setvariable variable=TS_YEAR]$val" + echo 'string(TIMESTAMP current_date "%m" UTC)' > script + echo 'execute_process(COMMAND ${CMAKE_COMMAND} -E echo "${current_date}")' >> script + val=$(cmake -P script) + echo "##vso[task.setvariable variable=TS_MONTH]$val" + echo 'string(TIMESTAMP current_date "%d" UTC)' > script + echo 'execute_process(COMMAND ${CMAKE_COMMAND} -E echo "${current_date}")' >> script + val=$(cmake -P script) + echo "##vso[task.setvariable variable=TS_DAY]$val" + - task: Bash@3 + displayName: Output timestamp for caching + inputs: + targetType: 'inline' + script: 'echo "my pipeline variable is $(TS) $(TS_YEAR) $(TS_MONTH) $(TS_DAY)"' + - task: Cache@2 + displayName: Update cache + inputs: + securityNamespace: cache + key: $(Agent.OS) | "$(cache_name)" | $(TS_YEAR) | $(TS_MONTH) | $(TS_DAY) | $(TS) + path: '$(build_root)/ccache' + restoreKeys: | + $(Agent.OS) | "$(cache_name)" | $(TS_YEAR) | $(TS_MONTH) | $(TS_DAY) + $(Agent.OS) | "$(cache_name)" | $(TS_YEAR) | $(TS_MONTH) + $(Agent.OS) | "$(cache_name)" | $(TS_YEAR) + $(Agent.OS) | "$(cache_name)" + - task: DockerCompose@0 + displayName: Pull container + inputs: + containerregistrytype: 'Container Registry' + dockerComposeFile: '**/docker-compose.yml' + action: 'Run a Docker Compose command' + dockerComposeCommand: 'pull --ignore-pull-failures ubuntu-cpp-clean' + - task: DockerCompose@0 + displayName: Build container + inputs: + containerregistrytype: 'Container Registry' + dockerComposeFile: '**/docker-compose.yml' + action: 'Run a Docker Compose command' + dockerComposeCommand: 'run ubuntu-cpp-clean' + - task: DockerCompose@0 + displayName: Push container to registry + inputs: + containerregistrytype: 'Container Registry' + dockerRegistryEndpoint: 'dockerRegistryConnection1' + dockerComposeFile: '**/docker-compose.yml' + action: 'Run a Docker Compose command' + dockerComposeCommand: 'push ubuntu-cpp-clean' + - task: Bash@3 + displayName: Create artifacts + inputs: + targetType: 'inline' + script: | + zip -j $(Agent.TempDirectory)/LastTest.log.gz $(build_root)/vt/Testing/Temporary/LastTest.log + zip -j $(Agent.TempDirectory)/cmake-output.log.gz $(build_root)/vt/cmake-output.log + - task: PublishPipelineArtifact@1 + displayName: Upload CMake test output artifact + inputs: + targetPath: '$(Agent.TempDirectory)/LastTest.log.gz' + artifact: 'CMakeLastTestLog' + publishLocation: 'pipeline' + - task: PublishPipelineArtifact@1 + displayName: Upload CMake full output artifact + inputs: + targetPath: '$(Agent.TempDirectory)/cmake-output.log.gz' + artifact: 'CMakeOutputLog' + publishLocation: 'pipeline' diff --git a/scripts/workflows-azure.ini b/scripts/workflows-azure.ini new file mode 100644 index 0000000000..8ae15a42ba --- /dev/null +++ b/scripts/workflows-azure.ini @@ -0,0 +1,189 @@ + +test_type = "PR tests" +vt_lb = 1 +vt_trace = 0 +vt_trace_rt = 0 +vt_mimalloc = 0 +vt_docs = 0 +vt_asan = 0 +vt_pool = 1 +vt_extended_tests = 1 +vt_unity_build = 1 +vt_zoltan = 0 +vt_ci_build = 1 +ulimit_core = 0 +code_coverage = 0 +build_type = release +repo = lifflander1/vt +arch = amd64 +is_ubuntu = 1 +distro = 18.04 +linux = ubuntu +cache_dir = "~/.local/cache/" +cache_name = "[% linux %]-[% compiler %]-cache" +docker_target = "[% linux %]-cpp-clean" +triggers = "trigger:\\n branches:\\n include:\\n - develop\\n - 1.0.0*" +warning = "###############################################################################\\n############## Warning this is a generated file---do not modify ###############\\n###############################################################################" +job_name = build +workflow_runs_on = "vmImage: 'ubuntu-18.04'" +build_root = $(ARCH)-[% linux %]-$(UBUNTU)-$(COMPILER)-cache +linux_env = " UBUNTU: [% distro %]" +vt_diagnostics = 1 +pr_pattern = "pr:\\n branches:\\n include:\\n - '*'\\n" +job_setup = "echo setup" + +[PR-tests-intel-18-03] +test_configuration = "intel 18.03, ubuntu, mpich" +compiler_type = intel +compiler = icc-18 +cache_name = ubuntu-intel-18-cache +output_name = ci/azure/azure-intel-18-ubuntu-mpich.yml +vt_trace = 1 +vt_pool = 0 +vt_extended_tests = 0 + +[PR-tests-intel-19] +test_configuration = "intel 19, ubuntu, mpich" +compiler_type = intel +compiler = icc-19 +cache_name = ubuntu-intel-19-cache +output_name = ci/azure/azure-intel-19-ubuntu-mpich.yml +vt_trace = 1 +vt_pool = 0 +vt_extended_tests = 0 + +[PR-tests-intel-18-03-extended] +test_type = "PR tests extended" +test_configuration = "intel 18.03, ubuntu, mpich" +compiler_type = intel +compiler = icc-18 +cache_name = ubuntu-intel-18-cache +output_name = ci/azure/azure-intel-18-ubuntu-mpich-extended.yml +pr_pattern = "\\n" +triggers = "\\n" +job_name = build_optional +vt_trace = 1 +vt_pool = 0 + +[PR-tests-nvcc-10-1] +test_configuration = "nvidia cuda 10.1, ubuntu, mpich" +compiler_type = nvidia +compiler = nvcc-10 +cache_name = ubuntu-nvidia-10-cache +output_name = ci/azure/azure-nvidia-10-ubuntu-mpich.yml +vt_extended_tests = 0 +job_name = build_optional +vt_trace = 1 +vt_pool = 0 +vt_diagnostics = 0 + +[PR-tests-nvcc-10-1-extended] +test_type = "PR tests extended" +test_configuration = "nvidia cuda 10.1, ubuntu, mpich" +compiler_type = nvidia +compiler = nvcc-10 +cache_name = ubuntu-nvidia-10-cache +output_name = ci/azure/azure-nvidia-10-ubuntu-mpich-extended.yml +pr_pattern = "\\n" +triggers = "\\n" +job_name = build_optional +vt_trace = 1 +vt_pool = 0 + +[PR-tests-nvcc-11-0] +test_configuration = "nvidia cuda 11.0, ubuntu, mpich" +compiler_type = nvidia +compiler = nvcc-11 +cache_name = ubuntu-nvidia-11-cache +output_name = ci/azure/azure-nvidia-11-ubuntu-mpich.yml +vt_extended_tests = 0 +job_name = build_optional +vt_diagnostics = 0 +vt_trace = 1 +vt_pool = 0 + +[PR-tests-nvcc-11-0-extended] +test_type = "PR tests extended" +test_configuration = "nvidia cuda 11.0, ubuntu, mpich" +compiler_type = nvidia +compiler = nvcc-11 +cache_name = ubuntu-nvidia-11-cache +output_name = ci/azure/azure-nvidia-11-ubuntu-mpich-extended.yml +pr_pattern = "\\n" +triggers = "\\n" +job_name = build_optional +vt_trace = 1 +vt_pool = 0 + +[PR-tests-gcc-5] +test_configuration = "gcc-5, ubuntu, mpich" +compiler_type = gnu +compiler = gcc-5 +output_name = ci/azure/azure-gcc-5-ubuntu-mpich.yml +cache_name = "[% linux %]-[% compiler %]-cache" + +[PR-tests-gcc-6] +test_configuration = "gcc-6, ubuntu, mpich" +compiler_type = gnu +compiler = gcc-6 +output_name = ci/azure/azure-gcc-6-ubuntu-mpich.yml + +[PR-tests-gcc-7] +test_configuration = "gcc-7, ubuntu, mpich, trace runtime, LB" +compiler_type = gnu +compiler = gcc-7 +vt_trace = 1 +vt_trace_rt = 1 +code_coverage = 1 +output_name = ci/azure/azure-gcc-7-ubuntu-mpich.yml +workflow_runs_on = "name: 'vt-agent-pool'" +job_setup = "source /etc/docker-setup.sh" + +[PR-tests-gcc-8] +test_configuration = "gcc-8, ubuntu, mpich, address sanitizer" +compiler_type = gnu +compiler = gcc-8 +vt_trace = 1 +vt_pool = 0 +vt_asan = 1 +output_name = ci/azure/azure-gcc-8-ubuntu-mpich.yml + +[PR-tests-gcc-9] +test_configuration = "gcc-9, ubuntu, mpich, zoltan" +compiler_type = gnu +compiler = gcc-9 +distro = 20.04 +output_name = ci/azure/azure-gcc-9-ubuntu-mpich.yml +vt_zoltan = 1 + +[PR-tests-gcc-10] +test_configuration = "gcc-10, ubuntu, openmpi, no LB" +compiler_type = gnu +compiler = gcc-10 +distro = 20.04 +docker_target = "[% linux %]-cpp-clean-openmpi" +output_name = ci/azure/azure-gcc-10-ubuntu-openmpi.yml +vt_lb = 0 + +[PR-tests-clang-39] +test_configuration = "clang-3.9, ubuntu, mpich" +compiler_type = clang +compiler = clang-3.9 +output_name = ci/azure/azure-clang-3.9-ubuntu-mpich.yml + +[PR-tests-clang-5] +test_configuration = "clang-5.0, ubuntu, mpich" +compiler_type = clang +compiler = clang-5.0 +output_name = ci/azure/azure-clang-5.0-ubuntu-mpich.yml +vt_trace = 1 + +[PR-tests-clang-8] +test_configuration = "clang-8, alpine, mpich" +compiler_type = clang +compiler = clang-8 +is_ubuntu = 0 +linux = alpine +linux_env ="" +output_name = ci/azure/azure-clang-8-alpine-mpich.yml +build_root = $(ARCH)-[% linux %]-$(COMPILER)-cache diff --git a/src/vt/collective/reduce/reduce.h b/src/vt/collective/reduce/reduce.h index 64c93e3626..a9a06205c6 100644 --- a/src/vt/collective/reduce/reduce.h +++ b/src/vt/collective/reduce/reduce.h @@ -87,9 +87,7 @@ struct Reduce : virtual collective::tree::Tree { template < typename OpT, typename MsgT, - ActiveTypedFnType *f = MsgT::template msgHandler< - MsgT, OpT, collective::reduce::operators::ReduceCallback - > + ActiveTypedFnType *f > SequentialIDType reduce( NodeType const& root, MsgT* msg, Callback cb, @@ -98,18 +96,58 @@ struct Reduce : virtual collective::tree::Tree { VirtualProxyType const& proxy = no_vrt_proxy, ObjGroupProxyType objgroup = no_obj_group ); + template < + typename OpT, + typename MsgT + > + SequentialIDType reduce( + NodeType const& root, MsgT* msg, Callback cb, + TagType const& tag = no_tag, SequentialIDType const& seq = no_seq_id, + ReduceNumType const& num_contrib = 1, + VirtualProxyType const& proxy = no_vrt_proxy, + ObjGroupProxyType objgroup = no_obj_group + ) + { + return reduce< + OpT, + MsgT, + &MsgT::template msgHandler< + MsgT, + OpT, + collective::reduce::operators::ReduceCallback + > + >(root, msg, cb, tag, seq, num_contrib, proxy, objgroup); + } template < typename OpT, typename FunctorT, typename MsgT, - ActiveTypedFnType *f = MsgT::template msgHandler + ActiveTypedFnType *f > SequentialIDType reduce( NodeType const& root, MsgT* msg, TagType const& tag = no_tag, SequentialIDType const& seq = no_seq_id, ReduceNumType const& num_contrib = 1, VirtualProxyType const& proxy = no_vrt_proxy ); + template < + typename OpT, + typename FunctorT, + typename MsgT + > + SequentialIDType reduce( + NodeType const& root, MsgT* msg, TagType const& tag = no_tag, + SequentialIDType const& seq = no_seq_id, ReduceNumType const& num_contrib = 1, + VirtualProxyType const& proxy = no_vrt_proxy + ) + { + return reduce< + OpT, + FunctorT, + MsgT, + &MsgT::template msgHandler + >(root, msg, tag, seq, num_contrib, proxy); + } template void reduceAddMsg( diff --git a/src/vt/collective/startup.cc b/src/vt/collective/startup.cc index 607dfc9912..e0a8ed6d71 100644 --- a/src/vt/collective/startup.cc +++ b/src/vt/collective/startup.cc @@ -52,23 +52,20 @@ namespace vt { // vt::{initialize,finalize} for main ::vt namespace RuntimePtrType initialize( - int& argc, char**& argv, WorkerCountType const num_workers, - bool is_interop, MPI_Comm* comm + int argc, char** argv, WorkerCountType const num_workers, + bool is_interop /* = false */, MPI_Comm* comm /* = nullptr */ ) { return CollectiveOps::initialize(argc,argv,num_workers,is_interop,comm); } -RuntimePtrType initialize(int& argc, char**& argv, MPI_Comm* comm) { +RuntimePtrType initialize( + int argc /* = 0 */, char** argv /* = nullptr */, + MPI_Comm* comm /* = nullptr */ +) { bool const is_interop = comm != nullptr; return CollectiveOps::initialize(argc,argv,no_workers,is_interop,comm); } -RuntimePtrType initialize(MPI_Comm* comm) { - int argc = 0; - char** argv = nullptr; - return CollectiveOps::initialize(argc,argv,no_workers,true,comm); -} - void finalize(RuntimePtrType in_rt) { if (in_rt) { return CollectiveOps::finalize(std::move(in_rt)); diff --git a/src/vt/collective/startup.h b/src/vt/collective/startup.h index c7a05d53e8..fc5bb9a743 100644 --- a/src/vt/collective/startup.h +++ b/src/vt/collective/startup.h @@ -51,11 +51,12 @@ namespace vt { RuntimePtrType initialize( - int& argc, char**& argv, WorkerCountType const num_workers, + int argc, char** argv, WorkerCountType const num_workers, bool is_interop = false, MPI_Comm* comm = nullptr ); -RuntimePtrType initialize(int& argc, char**& argv, MPI_Comm* comm = nullptr); -RuntimePtrType initialize(MPI_Comm* comm = nullptr); +RuntimePtrType initialize( + int argc = 0, char** argv = nullptr, MPI_Comm* comm = nullptr +); void finalize(RuntimePtrType in_rt); void finalize(); diff --git a/src/vt/configs/arguments/args.cc b/src/vt/configs/arguments/args.cc index 598e93099a..c627da1a0e 100644 --- a/src/vt/configs/arguments/args.cc +++ b/src/vt/configs/arguments/args.cc @@ -165,6 +165,8 @@ namespace vt { namespace arguments { /*static*/ bool ArgConfig::parsed = false; +/*static*/ std::size_t ArgConfig::vt_max_mpi_send_size = 1ull << 30; + static std::unique_ptr new_argv = nullptr; /*static*/ int ArgConfig::parse(int& argc, char**& argv) { @@ -549,6 +551,18 @@ static std::unique_ptr new_argv = nullptr; hca->group(schedulerGroup); kca->group(schedulerGroup); + /* + * Options for configuring the runtime + */ + auto max_size = "Maximum MPI send size (causes larger messages to be split " + "into multiple MPI sends)"; + auto a1x = app.add_option( + "--vt_max_mpi_send_size", vt_max_mpi_send_size, max_size, true + ); + + auto configRuntime = "Runtime"; + a1x->group(configRuntime); + /* * Run the parser! */ diff --git a/src/vt/configs/arguments/args.h b/src/vt/configs/arguments/args.h index 5b209facc3..c42cbd85bd 100644 --- a/src/vt/configs/arguments/args.h +++ b/src/vt/configs/arguments/args.h @@ -154,6 +154,7 @@ struct ArgConfig { static bool vt_debug_objgroup; static bool vt_debug_print_flush; + static std::size_t vt_max_mpi_send_size; static bool vt_user_1; static bool vt_user_2; diff --git a/src/vt/configs/types/types_type.h b/src/vt/configs/types/types_type.h index eb589d7738..2670eaa7cd 100644 --- a/src/vt/configs/types/types_type.h +++ b/src/vt/configs/types/types_type.h @@ -77,7 +77,7 @@ using VirtualElmOnlyProxyType = uint64_t; using VirtualElmCountType = int64_t; using UniqueIndexBitType = uint64_t; using GroupType = uint64_t; -using MsgSizeType = int32_t; +using MsgSizeType = int64_t; using PhaseType = uint64_t; using PipeType = uint64_t; using ObjGroupProxyType = uint64_t; diff --git a/src/vt/messaging/active.cc b/src/vt/messaging/active.cc index 7cce284871..c14031c022 100644 --- a/src/vt/messaging/active.cc +++ b/src/vt/messaging/active.cc @@ -159,9 +159,9 @@ EventType ActiveMessenger::sendMsgBytesWithPut( } else { auto const& env_tag = envelopeGetPutTag(msg->env); auto const& ret = sendData( - RDMA_GetType{put_ptr,put_size}, dest, env_tag + PtrLenPairType{put_ptr,put_size}, dest, env_tag ); - auto const& ret_tag = std::get<1>(ret); + auto const& ret_tag = ret.getTag(); if (ret_tag != env_tag) { envelopeSetPutTag(msg->env, ret_tag); } @@ -177,6 +177,127 @@ EventType ActiveMessenger::sendMsgBytesWithPut( return no_event; } +struct MultiMsg : vt::Message { + MultiMsg() = default; + MultiMsg(SendInfo in_info, NodeType in_from, MsgSizeType in_size) + : info(in_info), + from(in_from), + size(in_size) + { } + + SendInfo getInfo() const { return info; } + NodeType getFrom() const { return from; } + MsgSizeType getSize() const { return size; } + +private: + SendInfo info; + NodeType from = uninitialized_destination; + MsgSizeType size = 0; +}; + +/*static*/ void ActiveMessenger::chunkedMultiMsg(MultiMsg* msg) { + theMsg()->handleChunkedMultiMsg(msg); +} + +void ActiveMessenger::handleChunkedMultiMsg(MultiMsg* msg) { + auto buf = +#if vt_check_enabled(memory_pool) + static_cast(thePool()->alloc(msg->getSize())); +#else + static_cast(std::malloc(msg->getSize())); +#endif + + auto const size = msg->getSize(); + auto const info = msg->getInfo(); + auto const sender = msg->getFrom(); + auto const nchunks = info.getNumChunks(); + auto const tag = info.getTag(); + + auto fn = [buf,sender,size,tag,this](PtrLenPairType,ActionType){ + debug_print( + active, node, + "handleChunkedMultiMsg: all chunks arrived tag={}, size={}, from={}\n", + tag, size, sender + ); + InProgressIRecv irecv(buf, size, sender); + finishPendingActiveMsgAsyncRecv(&irecv); + }; + + recvDataDirect(nchunks, buf, tag, sender, size, 0, nullptr, fn, false); +} + +EventType ActiveMessenger::sendMsgMPI( + NodeType const& dest, MsgSharedPtr const& base, + MsgSizeType const& msg_size, TagType const& send_tag +) { + BaseMsgType* base_typed_msg = base.get(); + + char* untyped_msg = reinterpret_cast(base_typed_msg); + + debug_print( + active, node, + "sendMsgMPI: dest={}, msg_size={}, send_tag={}\n", + dest, msg_size, send_tag + ); + + auto const max_per_send = ArgType::vt_max_mpi_send_size; + if (static_cast(msg_size) < max_per_send) { + auto const event_id = theEvent()->createMPIEvent(this_node_); + auto& holder = theEvent()->getEventHolder(event_id); + auto mpi_event = holder.get_event(); + + mpi_event->setManagedMessage(base.to()); + + int small_msg_size = static_cast(msg_size); + { + VT_ALLOW_MPI_CALLS; + #if vt_check_enabled(trace_enabled) + double tr_begin = 0; + if (ArgType::vt_trace_mpi) { + tr_begin = vt::timing::Timing::getCurrentTime(); + } + #endif + int const ret = MPI_Isend( + untyped_msg, small_msg_size, MPI_BYTE, dest, send_tag, + theContext()->getComm(), mpi_event->getRequest() + ); + vtAssertMPISuccess(ret, "MPI_Isend"); + + #if vt_check_enabled(trace_enabled) + if (ArgType::vt_trace_mpi) { + auto tr_end = vt::timing::Timing::getCurrentTime(); + auto tr_note = fmt::format("Isend(AM): dest={}, bytes={}", dest, msg_size); + trace::addUserBracketedNote(tr_begin, tr_end, tr_note, trace_isend); + } + #endif + } + + return event_id; + } else { + debug_print( + active, node, + "sendMsgMPI: (multi): size={}\n", msg_size + ); + auto tag = allocateNewTag(); + auto this_node = theContext()->getNode(); + + // Send the actual data in multiple chunks + PtrLenPairType tup = std::make_tuple(untyped_msg, msg_size); + SendInfo info = sendData(tup, dest, tag); + + auto event_id = info.getEvent(); + auto& holder = theEvent()->getEventHolder(event_id); + auto mpi_event = holder.get_event(); + mpi_event->setManagedMessage(base.to()); + + // Send the control message to receive the multiple chunks of data + auto m = makeMessage(info, this_node, msg_size); + sendMsg(dest, m.get()); + + return event_id; + } +} + EventType ActiveMessenger::sendMsgBytes( NodeType const& dest, MsgSharedPtr const& base, MsgSizeType const& msg_size, TagType const& send_tag @@ -185,14 +306,9 @@ EventType ActiveMessenger::sendMsgBytes( auto const epoch = envelopeIsEpochType(msg->env) ? envelopeGetEpoch(msg->env) : term::any_epoch_sentinel; - auto const is_shared = isSharedMessage(msg); auto const is_term = envelopeIsTerm(msg->env); auto const is_bcast = envelopeIsBcast(msg->env); - auto const event_id = theEvent()->createMPIEvent(this_node_); - auto& holder = theEvent()->getEventHolder(event_id); - auto mpi_event = holder.get_event(); - if (!is_term || backend_check_enabled(print_term_msgs)) { debug_print( active, node, @@ -200,10 +316,6 @@ EventType ActiveMessenger::sendMsgBytes( ); } - if (is_shared) { - mpi_event->setManagedMessage(base.to()); - } - vtWarnIf( !(dest != theContext()->getNode() || is_bcast), "Destination {} should != this node" @@ -212,29 +324,12 @@ EventType ActiveMessenger::sendMsgBytes( dest >= theContext()->getNumNodes() || dest < 0, "Invalid destination: {}" ); - { - VT_ALLOW_MPI_CALLS; - #if backend_check_enabled(trace_enabled) - double tr_begin = 0; - if (ArgType::vt_trace_mpi) { - tr_begin = vt::timing::Timing::getCurrentTime(); - } - #endif - - const int ret = MPI_Isend( - msg, msg_size, MPI_BYTE, dest, send_tag, theContext()->getComm(), - mpi_event->getRequest() - ); - vtAssertMPISuccess(ret, "MPI_Isend"); - - #if backend_check_enabled(trace_enabled) - if (ArgType::vt_trace_mpi) { - auto tr_end = vt::timing::Timing::getCurrentTime(); - auto tr_note = fmt::format("Isend(AM): dest={}, bytes={}", dest, msg_size); - trace::addUserBracketedNote(tr_begin, tr_end, tr_note, trace_isend); - } - #endif + if (is_term) { + // tdSentCount.increment(1); } + // amSentCounterGauge.incrementUpdate(msg_size, 1); + + EventType const event_id = sendMsgMPI(dest, base, msg_size, send_tag); if (not is_term) { theTerm()->produce(epoch,1,dest); @@ -311,8 +406,19 @@ EventType ActiveMessenger::sendMsgSized( return ret_event; } -ActiveMessenger::SendDataRetType ActiveMessenger::sendData( - RDMA_GetType const& ptr, NodeType const& dest, TagType const& tag +MPI_TagType ActiveMessenger::allocateNewTag() { + auto const max_tag = util::MPI_Attr::getMaxTag(); + + if (cur_direct_buffer_tag_ == max_tag) { + cur_direct_buffer_tag_ = starting_direct_buffer_tag; + } + auto const ret_tag = cur_direct_buffer_tag_++; + + return ret_tag; +} + +SendInfo ActiveMessenger::sendData( + PtrLenPairType const& ptr, NodeType const& dest, TagType const& tag ) { auto const& data_ptr = std::get<0>(ptr); auto const& num_bytes = std::get<1>(ptr); @@ -321,19 +427,9 @@ ActiveMessenger::SendDataRetType ActiveMessenger::sendData( if (tag != no_tag) { send_tag = tag; } else { - auto const max_tag = util::MPI_Attr::getMaxTag(); - - if (cur_direct_buffer_tag_ == max_tag) { - cur_direct_buffer_tag_ = starting_direct_buffer_tag; - } - send_tag = cur_direct_buffer_tag_++; + send_tag = allocateNewTag(); } - auto const event_id = theEvent()->createMPIEvent(this_node_); - auto& holder = theEvent()->getEventHolder(event_id); - - auto mpi_event = holder.get_event(); - debug_print( active, node, "sendData: ptr={}, num_bytes={} dest={}, tag={}, send_tag={}\n", @@ -349,29 +445,9 @@ ActiveMessenger::SendDataRetType ActiveMessenger::sendData( "Invalid destination: {}" ); - { - VT_ALLOW_MPI_CALLS; - #if backend_check_enabled(trace_enabled) - double tr_begin = 0; - if (ArgType::vt_trace_mpi) { - tr_begin = vt::timing::Timing::getCurrentTime(); - } - #endif - - const int ret = MPI_Isend( - data_ptr, num_bytes, MPI_BYTE, dest, send_tag, theContext()->getComm(), - mpi_event->getRequest() - ); - vtAssertMPISuccess(ret, "MPI_Isend"); - - #if backend_check_enabled(trace_enabled) - if (ArgType::vt_trace_mpi) { - auto tr_end = vt::timing::Timing::getCurrentTime(); - auto tr_note = fmt::format("Isend(Data): dest={}, bytes={}", dest, num_bytes); - trace::addUserBracketedNote(tr_begin, tr_end, tr_note, trace_isend); - } - #endif - } + auto ret = sendDataMPI(ptr, dest, send_tag); + EventType event_id = std::get<0>(ret); + int num = std::get<1>(ret); // Assume that any raw data send/recv is paired with a message with an epoch // if required to inhibit early termination of that epoch @@ -382,20 +458,87 @@ ActiveMessenger::SendDataRetType ActiveMessenger::sendData( l->send(dest, num_bytes, false); } - return SendDataRetType{event_id,send_tag}; + return SendInfo{event_id, send_tag, num}; +} + +std::tuple ActiveMessenger::sendDataMPI( + PtrLenPairType const& payload, NodeType const& dest, TagType const& tag +) { + auto ptr = static_cast(std::get<0>(payload)); + auto remainder = std::get<1>(payload); + int num_sends = 0; + std::vector events; + EventType ret_event = no_event; + auto const max_per_send = ArgType::vt_max_mpi_send_size; + while (remainder > 0) { + auto const event_id = theEvent()->createMPIEvent(this_node_); + auto& holder = theEvent()->getEventHolder(event_id); + auto mpi_event = holder.get_event(); + auto subsize = static_cast( + std::min(static_cast(remainder), max_per_send) + ); + { + #if vt_check_enabled(trace_enabled) + double tr_begin = 0; + if (ArgType::vt_trace_mpi) { + tr_begin = vt::timing::Timing::getCurrentTime(); + } + #endif + + debug_print( + active, node, + "sendDataMPI: remainder={}, node={}, tag={}, num_sends={}, subsize={}," + "total size={}\n", + remainder, dest, tag, num_sends, subsize, std::get<1>(payload) + ); + + VT_ALLOW_MPI_CALLS; + int const ret = MPI_Isend( + ptr, subsize, MPI_BYTE, dest, tag, theContext()->getComm(), + mpi_event->getRequest() + ); + vtAssertMPISuccess(ret, "MPI_Isend"); + + #if vt_check_enabled(trace_enabled) + if (ArgType::vt_trace_mpi) { + auto tr_end = vt::timing::Timing::getCurrentTime(); + auto tr_note = fmt::format("Isend(Data): dest={}, bytes={}", dest, subsize); + trace::addUserBracketedNote(tr_begin, tr_end, tr_note, trace_isend); + } + #endif + } + ptr += subsize; + remainder -= subsize; + num_sends++; + events.push_back(event_id); + } + + if (events.size() > 1) { + ret_event = theEvent()->createParentEvent(theContext()->getNode()); + auto& holder = theEvent()->getEventHolder(ret_event); + for (auto&& child_event : events) { + holder.get_event()->addEventToList(child_event); + } + } else { + vtAssert(events.size() > 0, "Must contain at least one event"); + ret_event = events.back(); + } + + return std::make_tuple(ret_event, num_sends); } bool ActiveMessenger::recvDataMsgPriority( - PriorityType priority, TagType const& tag, NodeType const& node, - RDMA_ContinuationDeleteType next + int nchunks, PriorityType priority, TagType const& tag, NodeType const& node, + ContinuationDeleterType next ) { - return recvDataMsg(priority, tag, node, true, next); + return recvDataMsg(nchunks, priority, tag, node, true, next); } bool ActiveMessenger::recvDataMsg( - TagType const& tag, NodeType const& node, RDMA_ContinuationDeleteType next + int nchunks, TagType const& tag, NodeType const& node, + ContinuationDeleterType next ) { - return recvDataMsg(default_priority, tag, node, true, next); + return recvDataMsg(nchunks, default_priority, tag, node, true, next); } bool ActiveMessenger::tryProcessDataMsgRecv() { @@ -403,10 +546,10 @@ bool ActiveMessenger::tryProcessDataMsgRecv() { auto iter = pending_recvs_.begin(); for (; iter != pending_recvs_.end(); ++iter) { + auto& elm = iter->second; auto const done = recvDataMsgBuffer( - iter->second.user_buf, iter->second.priority, iter->first, - iter->second.recv_node, false, iter->second.dealloc_user_buf, - iter->second.cont + elm.nchunks, elm.user_buf, elm.priority, iter->first, elm.sender, false, + elm.dealloc_user_buf, elm.cont, elm.is_user_buf ); if (done) { erase = true; @@ -423,17 +566,20 @@ bool ActiveMessenger::tryProcessDataMsgRecv() { } bool ActiveMessenger::recvDataMsgBuffer( - void* const user_buf, TagType const& tag, + int nchunks, void* const user_buf, TagType const& tag, NodeType const& node, bool const& enqueue, ActionType dealloc, - RDMA_ContinuationDeleteType next + ContinuationDeleterType next, bool is_user_buf ) { - return recvDataMsgBuffer(user_buf, no_priority, tag, node, enqueue, dealloc, next); + return recvDataMsgBuffer( + nchunks, user_buf, no_priority, tag, node, enqueue, dealloc, next, + is_user_buf + ); } bool ActiveMessenger::recvDataMsgBuffer( - void* const user_buf, PriorityType priority, TagType const& tag, + int nchunks, void* const user_buf, PriorityType priority, TagType const& tag, NodeType const& node, bool const& enqueue, ActionType dealloc_user_buf, - RDMA_ContinuationDeleteType next + ContinuationDeleterType next, bool is_user_buf ) { if (not enqueue) { CountType num_probe_bytes; @@ -465,53 +611,10 @@ bool ActiveMessenger::recvDataMsgBuffer( NodeType const sender = stat.MPI_SOURCE; - MPI_Request req; - - { - VT_ALLOW_MPI_CALLS; - - #if backend_check_enabled(trace_enabled) - double tr_begin = 0; - if (ArgType::vt_trace_mpi) { - tr_begin = vt::timing::Timing::getCurrentTime(); - } - #endif - - const int recv_ret = MPI_Irecv( - buf, num_probe_bytes, MPI_BYTE, stat.MPI_SOURCE, stat.MPI_TAG, - theContext()->getComm(), &req - ); - vtAssertMPISuccess(recv_ret, "MPI_Irecv"); - - #if backend_check_enabled(trace_enabled) - if (ArgType::vt_trace_mpi) { - auto tr_end = vt::timing::Timing::getCurrentTime(); - auto tr_note = fmt::format( - "Irecv(Data): from={}, bytes={}", - stat.MPI_SOURCE, num_probe_bytes - ); - trace::addUserBracketedNote(tr_begin, tr_end, tr_note, trace_irecv); - } - #endif - } - - InProgressDataIRecv recv_holder{ - buf, num_probe_bytes, sender, req, user_buf, dealloc_user_buf, next, - priority - }; - - int recv_flag = 0; - { - VT_ALLOW_MPI_CALLS; - MPI_Status recv_stat; - MPI_Test(&recv_holder.req, &recv_flag, &recv_stat); - } - - if (recv_flag == 1) { - finishPendingDataMsgAsyncRecv(&recv_holder); - } else { - in_progress_data_irecv.emplace(std::move(recv_holder)); - } + recvDataDirect( + nchunks, buf, tag, sender, num_probe_bytes, priority, dealloc_user_buf, + next, is_user_buf + ); return true; } else { @@ -520,21 +623,105 @@ bool ActiveMessenger::recvDataMsgBuffer( } else { debug_print( active, node, - "recvDataMsgBuffer: node={}, tag={}, enqueue={}, priority={:x}\n", - node, tag, print_bool(enqueue), priority + "recvDataMsgBuffer: nchunks={}, node={}, tag={}, enqueue={}, " + "priority={:x} buffering, is_user_buf={}\n", + nchunks, node, tag, print_bool(enqueue), priority, is_user_buf ); pending_recvs_.emplace( std::piecewise_construct, std::forward_as_tuple(tag), std::forward_as_tuple( - PendingRecvType{user_buf,next,dealloc_user_buf,node,priority} + PendingRecvType{ + nchunks, user_buf, next, dealloc_user_buf, node, priority, + is_user_buf + } ) ); return false; } } +void ActiveMessenger::recvDataDirect( + int nchunks, TagType const tag, NodeType const from, MsgSizeType len, + ContinuationDeleterType next +) { + char* buf = + #if vt_check_enabled(memory_pool) + static_cast(thePool()->alloc(len)); + #else + static_cast(std::malloc(len)); + #endif + + recvDataDirect( + nchunks, buf, tag, from, len, default_priority, nullptr, next, false + ); +} + +void ActiveMessenger::recvDataDirect( + int nchunks, void* const buf, TagType const tag, NodeType const from, + MsgSizeType len, PriorityType prio, ActionType dealloc, + ContinuationDeleterType next, bool is_user_buf +) { + vtAssert(nchunks > 0, "Must have at least one chunk"); + + std::vector reqs; + reqs.resize(nchunks); + + char* cbuf = static_cast(buf); + MsgSizeType remainder = len; + auto const max_per_send = ArgType::vt_max_mpi_send_size; + for (int i = 0; i < nchunks; i++) { + auto sublen = static_cast( + std::min(static_cast(remainder), max_per_send) + ); + + #if vt_check_enabled(trace_enabled) + double tr_begin = 0; + if (ArgType::vt_trace_mpi) { + tr_begin = vt::timing::Timing::getCurrentTime(); + } + #endif + + { + VT_ALLOW_MPI_CALLS; + int const ret = MPI_Irecv( + cbuf+(i*max_per_send), sublen, MPI_BYTE, from, tag, + theContext()->getComm(), &reqs[i] + ); + vtAssertMPISuccess(ret, "MPI_Irecv"); + } + + // dmPostedCounterGauge.incrementUpdate(len, 1); + + #if vt_check_enabled(trace_enabled) + if (ArgType::vt_trace_mpi) { + auto tr_end = vt::timing::Timing::getCurrentTime(); + auto tr_note = fmt::format( + "Irecv(Data): from={}, bytes={}", + from, sublen + ); + trace::addUserBracketedNote(tr_begin, tr_end, tr_note, trace_irecv); + } + #endif + + remainder -= sublen; + } + + InProgressDataIRecv recv{ + cbuf, len, from, std::move(reqs), is_user_buf ? buf : nullptr, dealloc, + next, prio + }; + + bool done = recv.test(); + + if (done) { + finishPendingDataMsgAsyncRecv(&recv); + } else { + in_progress_data_irecv.emplace(std::move(recv)); + } +} + void ActiveMessenger::finishPendingDataMsgAsyncRecv(InProgressDataIRecv* irecv) { auto buf = irecv->buf; auto num_probe_bytes = irecv->probe_bytes; @@ -575,7 +762,7 @@ void ActiveMessenger::finishPendingDataMsgAsyncRecv(InProgressDataIRecv* irecv) } else { // If we have a continuation, schedule to run later auto run = [=]{ - next(RDMA_GetType{buf,num_probe_bytes}, dealloc_buf); + next(PtrLenPairType{buf,num_probe_bytes}, dealloc_buf); theTerm()->consume(term::any_epoch_sentinel,1,sender); theTerm()->hangDetectRecv(); }; @@ -584,11 +771,12 @@ void ActiveMessenger::finishPendingDataMsgAsyncRecv(InProgressDataIRecv* irecv) } bool ActiveMessenger::recvDataMsg( - PriorityType priority, TagType const& tag, NodeType const& recv_node, - bool const& enqueue, RDMA_ContinuationDeleteType next + int nchunks, PriorityType priority, TagType const& tag, + NodeType const& sender, bool const& enqueue, + ContinuationDeleterType next ) { return recvDataMsgBuffer( - nullptr, priority, tag, recv_node, enqueue, nullptr, next + nchunks, nullptr, priority, tag, sender, enqueue, nullptr, next ); } @@ -776,16 +964,18 @@ bool ActiveMessenger::deliverActiveMsg( } bool ActiveMessenger::tryProcessIncomingActiveMsg() { - VT_ALLOW_MPI_CALLS; // MPI_Iprove, MPI_Irecv, MPI_Test - CountType num_probe_bytes; MPI_Status stat; int flag; - MPI_Iprobe( - MPI_ANY_SOURCE, static_cast(MPITag::ActiveMsgTag), - theContext()->getComm(), &flag, &stat - ); + { + VT_ALLOW_MPI_CALLS; + + MPI_Iprobe( + MPI_ANY_SOURCE, static_cast(MPITag::ActiveMsgTag), + theContext()->getComm(), &flag, &stat + ); + } if (flag == 1) { MPI_Get_count(&stat, MPI_BYTE, &num_probe_bytes); @@ -808,6 +998,7 @@ bool ActiveMessenger::tryProcessIncomingActiveMsg() { } #endif + VT_ALLOW_MPI_CALLS; MPI_Irecv( buf, num_probe_bytes, MPI_BYTE, sender, stat.MPI_TAG, theContext()->getComm(), &req @@ -827,10 +1018,9 @@ bool ActiveMessenger::tryProcessIncomingActiveMsg() { InProgressIRecv recv_holder{buf, num_probe_bytes, sender, req}; - int recv_flag = 0; - MPI_Status recv_stat; - MPI_Test(&recv_holder.req, &recv_flag, &recv_stat); - if (recv_flag == 1) { + auto done = recv_holder.test(); + + if (done) { finishPendingActiveMsgAsyncRecv(&recv_holder); } else { in_progress_active_msg_irecv.emplace(std::move(recv_holder)); @@ -896,8 +1086,8 @@ void ActiveMessenger::finishPendingActiveMsgAsyncRecv(InProgressIRecv* irecv) { put_finished = true; } else { /*bool const put_delivered = */recvDataMsg( - put_tag, sender, - [=](RDMA_GetType ptr, ActionType deleter){ + 1, put_tag, sender, + [=](PtrLenPairType ptr, ActionType deleter){ envelopeSetPutPtr(base->env, std::get<0>(ptr), std::get<1>(ptr)); scheduleActiveMsg(base, sender, num_probe_bytes, true, deleter); } diff --git a/src/vt/messaging/active.h b/src/vt/messaging/active.h index 02fadf97b4..d8c8d8b865 100644 --- a/src/vt/messaging/active.h +++ b/src/vt/messaging/active.h @@ -57,6 +57,7 @@ #include "vt/messaging/pending_send.h" #include "vt/messaging/listener.h" #include "vt/messaging/irecv_holder.h" +#include "vt/messaging/send_info.h" #include "vt/event/event.h" #include "vt/registry/registry.h" #include "vt/registry/auto/auto_registry_interface.h" @@ -74,6 +75,17 @@ #include #include +namespace vt { + +/// A pair of a void* and number of bytes (length) for sending data +using PtrLenPairType = std::tuple; + +/// A continuation function with an allocated pointer with a deleter function +using ContinuationDeleterType = + std::function; + +} /* end namespace vt */ + namespace vt { namespace messaging { using MPI_TagType = int; @@ -90,55 +102,96 @@ static constexpr TagType const starting_direct_buffer_tag = 1000; static constexpr MsgSizeType const max_pack_direct_size = 512; struct PendingRecv { + int nchunks = 0; void* user_buf = nullptr; - RDMA_ContinuationDeleteType cont = nullptr; + ContinuationDeleterType cont = nullptr; ActionType dealloc_user_buf = nullptr; - NodeType recv_node = uninitialized_destination; + NodeType sender = uninitialized_destination; PriorityType priority = no_priority; + bool is_user_buf = false; PendingRecv( - void* in_user_buf, RDMA_ContinuationDeleteType in_cont, + int in_nchunks, void* in_user_buf, ContinuationDeleterType in_cont, ActionType in_dealloc_user_buf, NodeType node, - PriorityType in_priority - ) : user_buf(in_user_buf), cont(in_cont), - dealloc_user_buf(in_dealloc_user_buf), recv_node(node), - priority(in_priority) + PriorityType in_priority, bool in_is_user_buf + ) : nchunks(in_nchunks), user_buf(in_user_buf), cont(in_cont), + dealloc_user_buf(in_dealloc_user_buf), sender(node), + priority(in_priority), is_user_buf(in_is_user_buf) { } }; -struct InProgressIRecv { - using CountType = int32_t; - - InProgressIRecv( - char* in_buf, CountType in_probe_bytes, NodeType in_sender, - MPI_Request in_req +struct InProgressBase { + InProgressBase( + char* in_buf, MsgSizeType in_probe_bytes, NodeType in_sender ) : buf(in_buf), probe_bytes(in_probe_bytes), sender(in_sender), - req(in_req), valid(true) + valid(true) { } char* buf = nullptr; - CountType probe_bytes = 0; + MsgSizeType probe_bytes = 0; NodeType sender = uninitialized_destination; - MPI_Request req; bool valid = false; }; -struct InProgressDataIRecv : public InProgressIRecv { +struct InProgressIRecv : InProgressBase { + + InProgressIRecv( + char* in_buf, MsgSizeType in_probe_bytes, NodeType in_sender, + MPI_Request in_req = MPI_REQUEST_NULL + ) : InProgressBase(in_buf, in_probe_bytes, in_sender), + req(in_req) + { } + + bool test() { + VT_ALLOW_MPI_CALLS; // MPI_Test + + int flag = 0; + MPI_Status stat; + MPI_Test(&req, &flag, &stat); + return flag; + } + +private: + MPI_Request req = MPI_REQUEST_NULL; +}; + +struct InProgressDataIRecv : InProgressBase { InProgressDataIRecv( - char* in_buf, CountType in_probe_bytes, NodeType in_sender, - MPI_Request in_req, void* const in_user_buf, + char* in_buf, MsgSizeType in_probe_bytes, NodeType in_sender, + std::vector in_reqs, void* const in_user_buf, ActionType in_dealloc_user_buf, - RDMA_ContinuationDeleteType in_next, + ContinuationDeleterType in_next, PriorityType in_priority - ) : InProgressIRecv{in_buf, in_probe_bytes, in_sender, in_req}, + ) : InProgressBase{in_buf, in_probe_bytes, in_sender}, user_buf(in_user_buf), dealloc_user_buf(in_dealloc_user_buf), - next(in_next), priority(in_priority) + next(in_next), priority(in_priority), reqs(std::move(in_reqs)) { } + bool test() { + int flag = 0; + MPI_Status stat; + for ( ; cur < reqs.size(); cur++) { + VT_ALLOW_MPI_CALLS; // MPI_Test + + MPI_Test(&reqs[cur], &flag, &stat); + + if (flag == 0) { + return false; + } + } + + return true; + } + +public: void* user_buf = nullptr; ActionType dealloc_user_buf = nullptr; - RDMA_ContinuationDeleteType next = nullptr; + ContinuationDeleterType next = nullptr; PriorityType priority = no_priority; + +private: + std::size_t cur = 0; + std::vector reqs; }; struct BufferedActiveMsg { @@ -155,16 +208,16 @@ struct BufferedActiveMsg { { } }; +// forward-declare for header +struct MultiMsg; + struct ActiveMessenger { using BufferedMsgType = BufferedActiveMsg; using MessageType = ShortMessage*; using CountType = int32_t; using PendingRecvType = PendingRecv; using EventRecordType = event::AsyncEvent::EventRecordType; - using SendDataRetType = std::tuple; - using SendFnType = std::function< - SendDataRetType(RDMA_GetType,NodeType,TagType) - >; + using SendFnType = std::function; using UserSendFnType = std::function; using ContainerPendingType = std::unordered_map; using MsgContType = std::list; @@ -489,37 +542,75 @@ struct ActiveMessenger { MsgSizeType const& ptr_bytes ); - SendDataRetType sendData( - RDMA_GetType const& ptr, NodeType const& dest, TagType const& tag + SendInfo sendData( + PtrLenPairType const& ptr, NodeType const& dest, TagType const& tag + ); + + std::tuple sendDataMPI( + PtrLenPairType const& ptr, NodeType const& dest, TagType const& tag ); bool recvDataMsgPriority( - PriorityType priority, TagType const& tag, NodeType const& node, - RDMA_ContinuationDeleteType next = nullptr + int nchunks, PriorityType priority, TagType const& tag, + NodeType const& node, ContinuationDeleterType next = nullptr ); bool recvDataMsg( - TagType const& tag, NodeType const& node, - RDMA_ContinuationDeleteType next = nullptr + int nchunks, TagType const& tag, NodeType const& node, + ContinuationDeleterType next = nullptr ); bool recvDataMsg( - PriorityType priority, TagType const& tag, NodeType const& recv_node, - bool const& enqueue, RDMA_ContinuationDeleteType next = nullptr + int nchunks, PriorityType priority, TagType const& tag, + NodeType const& sender, bool const& enqueue, + ContinuationDeleterType next = nullptr ); bool recvDataMsgBuffer( - void* const user_buf, PriorityType priority, TagType const& tag, + int nchunks, void* const user_buf, PriorityType priority, TagType const& tag, NodeType const& node = uninitialized_destination, bool const& enqueue = true, ActionType dealloc_user_buf = nullptr, - RDMA_ContinuationDeleteType next = nullptr + ContinuationDeleterType next = nullptr, bool is_user_buf = false ); bool recvDataMsgBuffer( - void* const user_buf, TagType const& tag, + int nchunks, void* const user_buf, TagType const& tag, NodeType const& node = uninitialized_destination, bool const& enqueue = true, ActionType dealloc_user_buf = nullptr, - RDMA_ContinuationDeleteType next = nullptr + ContinuationDeleterType next = nullptr, bool is_user_buf = false + ); + + /** + * \brief Receive data from MPI in multiple chunks + * + * \param[in] nchunks the number of chunks to receive + * \param[in] buf the receive buffer + * \param[in] tag the MPI tag + * \param[in] from the sender + * \param[in] len the total length + * \param[in] prio the priority for the continuation + * \param[in] dealloc the action to deallocate the buffer + * \param[in] next the continuation that gets passed the data when ready + * \param[in] is_user_buf is a user buffer that require user deallocation + */ + void recvDataDirect( + int nchunks, void* const buf, TagType const tag, NodeType const from, + MsgSizeType len, PriorityType prio, ActionType dealloc = nullptr, + ContinuationDeleterType next = nullptr, bool is_user_buf = false + ); + + /** + * \brief Receive data from MPI in multiple chunks + * + * \param[in] nchunks the number of chunks to receive + * \param[in] tag the MPI tag + * \param[in] from the sender + * \param[in] len the total length + * \param[in] next the continuation that gets passed the data when ready + */ + void recvDataDirect( + int nchunks, TagType const tag, NodeType const from, + MsgSizeType len, ContinuationDeleterType next ); EventType sendMsgSized( @@ -585,6 +676,23 @@ struct ActiveMessenger { MsgSizeType const& msg_size, TagType const& send_tag ); + /** + * \internal + * \brief Send already-packed message bytes with MPI using multiple + * sends if necessary + * + * \param[in] dest the destination of the message + * \param[in] base the message base pointer + * \param[in] msg_size the size of the message + * \param[in] send_tag the send tag on the message + * + * \return the event to test/wait for completion + */ + EventType sendMsgMPI( + NodeType const& dest, MsgSharedPtr const& base, + MsgSizeType const& msg_size, TagType const& send_tag + ); + /* * setGlobalEpoch() is a shortcut for both pushing and popping epochs on the * stack depending on the value of the `epoch' passed as an argument. @@ -642,6 +750,32 @@ struct ActiveMessenger { } private: + /** + * \internal \brief Allocate a new, unused tag. + * + * \note Wraps around when reaching max tag, determined by the MPI + * implementation. + * + * \return a new MPI tag + */ + MPI_TagType allocateNewTag(); + + /** + * \internal \brief Handle a control message that coordinates multiple + * payloads arriving that constitute a contiguous payload + * + * \param[in] msg the message with control data + */ + void handleChunkedMultiMsg(MultiMsg* msg); + + /** + * \internal \brief Handle a control message; immediately calls + * \c handleChunkedMultiMsg + * + * \param[in] msg the message with control data + */ + static void chunkedMultiMsg(MultiMsg* msg); + bool testPendingActiveMsgAsyncRecv(); bool testPendingDataMsgAsyncRecv(); void finishPendingActiveMsgAsyncRecv(InProgressIRecv* irecv); diff --git a/src/vt/messaging/irecv_holder.h b/src/vt/messaging/irecv_holder.h index 679ff4ac5c..226fcda791 100644 --- a/src/vt/messaging/irecv_holder.h +++ b/src/vt/messaging/irecv_holder.h @@ -94,11 +94,9 @@ struct IRecvHolder { auto& e = holder_[i]; vtAssert(e.valid, "Must be valid"); - int flag = 0; - MPI_Status stat; - MPI_Test(&e.req, &flag, &stat); + auto done = e.test(); - if (flag == 0) { + if (not done) { ++i; continue; } diff --git a/src/vt/messaging/send_info.h b/src/vt/messaging/send_info.h new file mode 100644 index 0000000000..4aaf6d2399 --- /dev/null +++ b/src/vt/messaging/send_info.h @@ -0,0 +1,103 @@ +/* +//@HEADER +// ***************************************************************************** +// +// send_info.h +// DARMA Toolkit v. 1.0.0 +// DARMA/vt => Virtual Transport +// +// Copyright 2019 National Technology & Engineering Solutions of Sandia, LLC +// (NTESS). Under the terms of Contract DE-NA0003525 with NTESS, the U.S. +// Government retains certain rights in this software. +// +// Redistribution and use in source and binary forms, with or without +// modification, are permitted provided that the following conditions are met: +// +// * Redistributions of source code must retain the above copyright notice, +// this list of conditions and the following disclaimer. +// +// * Redistributions in binary form must reproduce the above copyright notice, +// this list of conditions and the following disclaimer in the documentation +// and/or other materials provided with the distribution. +// +// * Neither the name of the copyright holder nor the names of its +// contributors may be used to endorse or promote products derived from this +// software without specific prior written permission. +// +// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" +// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE +// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE +// ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE +// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR +// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF +// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS +// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN +// CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) +// ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE +// POSSIBILITY OF SUCH DAMAGE. +// +// Questions? Contact darma@sandia.gov +// +// ***************************************************************************** +//@HEADER +*/ + +#if !defined INCLUDED_VT_MESSAGING_SEND_INFO_H +#define INCLUDED_VT_MESSAGING_SEND_INFO_H + +#include "vt/config.h" + +namespace vt { namespace messaging { + +/** + * \struct SendInfo + * + * \brief Returned from a data send to be used to receive the data + */ +struct SendInfo { + + /** + * \internal + * \brief Construct a SendInfo + * + * \param[in] in_event the send event (parent event if multiple sends) + * \param[in] in_tag the MPI tag it was sent with + * \param[in] in_nchunks the number of send chunks for the entire payload + */ + SendInfo(EventType in_event, TagType in_tag, int in_nchunks) + : event(in_event), + tag(in_tag), + nchunks(in_nchunks) + { } + + /** + * \brief Get the send event (either an MPI event or a parent event containing + * multiple MPI events) + * + * \return the send event + */ + EventType getEvent() const { return event; } + + /** + * \brief The MPI tag that it was sent with + * + * \return the tag + */ + TagType getTag() const { return tag; } + + /** + * \brief The number of Isend chunks that make up the entire payload + * + * \return the number of chunks + */ + int getNumChunks() const { return nchunks; } + +private: + EventType const event = no_event; /**< The event for the send */ + TagType const tag = no_tag; /**< The MPI tag for the send */ + int const nchunks = 0; /**< The number of send chunks to receive */ +}; + +}} /* end namespace vt::messaging */ + +#endif /*INCLUDED_VT_MESSAGING_SEND_INFO_H*/ diff --git a/src/vt/objgroup/proxy/proxy_objgroup.h b/src/vt/objgroup/proxy/proxy_objgroup.h index 5772125b74..76a78a72c1 100644 --- a/src/vt/objgroup/proxy/proxy_objgroup.h +++ b/src/vt/objgroup/proxy/proxy_objgroup.h @@ -89,26 +89,61 @@ struct Proxy { template < typename OpT = collective::None, typename MsgPtrT, - typename MsgT = typename util::MsgPtrType::MsgType, - ActiveTypedFnType *f = MsgT::template msgHandler< - MsgT, OpT, collective::reduce::operators::ReduceCallback - > + typename MsgT, + ActiveTypedFnType *f > EpochType reduce( MsgPtrT msg, Callback cb, EpochType epoch = no_epoch, TagType tag = no_tag ) const; + template < + typename OpT = collective::None, + typename MsgPtrT, + typename MsgT = typename util::MsgPtrType::MsgType + > + EpochType reduce( + MsgPtrT msg, Callback cb, EpochType epoch = no_epoch, + TagType tag = no_tag + ) const + { + return reduce< + OpT, + MsgPtrT, + MsgT, + &MsgT::template msgHandler< + MsgT, OpT, collective::reduce::operators::ReduceCallback + > + >(msg, cb, epoch, tag); + } template < typename OpT = collective::None, typename FunctorT, typename MsgPtrT, typename MsgT = typename util::MsgPtrType::MsgType, - ActiveTypedFnType *f = MsgT::template msgHandler + ActiveTypedFnType *f > EpochType reduce( MsgPtrT msg, EpochType epoch = no_epoch, TagType tag = no_tag ) const; + template < + typename OpT = collective::None, + typename FunctorT, + typename MsgPtrT, + typename MsgT = typename util::MsgPtrType::MsgType + > + EpochType reduce( + MsgPtrT msg, EpochType epoch = no_epoch, TagType tag = no_tag + ) const + { + return reduce< + OpT, + FunctorT, + MsgPtrT, + MsgT, + &MsgT::template msgHandler + >(msg, epoch, tag); + } template < typename MsgPtrT, diff --git a/src/vt/rdma/collection/rdma_collection.cc b/src/vt/rdma/collection/rdma_collection.cc index 15dea098f6..66f6660911 100644 --- a/src/vt/rdma/collection/rdma_collection.cc +++ b/src/vt/rdma/collection/rdma_collection.cc @@ -197,7 +197,8 @@ namespace vt { namespace rdma { auto send_payload = [&](Active::SendFnType send){ auto ret = send(put_ret, put_node, no_tag); - msg->mpi_tag_to_recv = std::get<1>(ret); + msg->mpi_tag_to_recv = ret.getTag(); + msg->nchunks = ret.getNumChunks(); }; if (tag != no_tag) { diff --git a/src/vt/rdma/rdma.cc b/src/vt/rdma/rdma.cc index dde4cc6e6c..99f2afae89 100644 --- a/src/vt/rdma/rdma.cc +++ b/src/vt/rdma/rdma.cc @@ -87,7 +87,8 @@ RDMAManager::RDMAManager() auto send_payload = [&](Active::SendFnType send){ auto ret = send(data, recv_node, no_tag); - new_msg->mpi_tag_to_recv = std::get<1>(ret); + new_msg->mpi_tag_to_recv = ret.getTag(); + new_msg->nchunks = ret.getNumChunks(); debug_print( rdma, node, "data is sending: tag={}, node={}\n", @@ -125,7 +126,7 @@ RDMAManager::RDMAManager() if (get_ptr == nullptr) { theMsg()->recvDataMsg( - msg->mpi_tag_to_recv, msg->send_back, + msg->nchunks, msg->mpi_tag_to_recv, msg->send_back, [=](RDMA_GetType ptr, ActionType deleter){ theRDMA()->triggerGetRecvData( op_id, msg_tag, std::get<0>(ptr), std::get<1>(ptr), deleter @@ -134,7 +135,8 @@ RDMAManager::RDMAManager() ); } else { theMsg()->recvDataMsgBuffer( - get_ptr, msg->mpi_tag_to_recv, msg->send_back, true, [get_ptr_action]{ + msg->nchunks, get_ptr, msg->mpi_tag_to_recv, msg->send_back, true, + [get_ptr_action]{ debug_print( rdma, node, "recv_data_msg_buffer finished\n" @@ -142,7 +144,8 @@ RDMAManager::RDMAManager() if (get_ptr_action) { get_ptr_action(); } - } + }, + nullptr, true ); } } @@ -208,6 +211,7 @@ RDMAManager::RDMAManager() if (put_ptr == nullptr) { theMsg()->recvDataMsg( + msg->nchunks, recv_tag, recv_node, [=](RDMA_GetType ptr, ActionType deleter){ debug_print( rdma, node, @@ -237,7 +241,7 @@ RDMAManager::RDMAManager() msg->offset != no_byte ? static_cast(put_ptr) + msg->offset : put_ptr; // do a direct recv into the user buffer theMsg()->recvDataMsgBuffer( - put_ptr_offset, recv_tag, recv_node, true, []{}, + msg->nchunks, put_ptr_offset, recv_tag, recv_node, true, []{}, [=](RDMA_GetType ptr, ActionType deleter){ debug_print( rdma, node, @@ -685,7 +689,8 @@ void RDMAManager::putData( auto send_payload = [&](Active::SendFnType send){ auto ret = send(RDMA_GetType{ptr, num_bytes}, put_node, no_tag); - msg->mpi_tag_to_recv = std::get<1>(ret); + msg->mpi_tag_to_recv = ret.getTag(); + msg->nchunks = ret.getNumChunks(); }; if (tag != no_tag) { diff --git a/src/vt/rdma/rdma_msg.h b/src/vt/rdma/rdma_msg.h index 8e46310d18..2a985abe6d 100644 --- a/src/vt/rdma/rdma_msg.h +++ b/src/vt/rdma/rdma_msg.h @@ -82,12 +82,13 @@ struct SendDataMessage : ActiveMessage { NodeType const& back = uninitialized_destination, NodeType const& in_recv_node = uninitialized_destination, bool const in_packed_direct = false - ) : ActiveMessage(), - rdma_handle(in_han), send_back(back), recv_node(in_recv_node), - mpi_tag_to_recv(in_mpi_tag), op_id(in_op), num_bytes(in_num_bytes), - offset(in_offset), packed_direct(in_packed_direct) + ) : rdma_handle(in_han), send_back(back), + recv_node(in_recv_node), mpi_tag_to_recv(in_mpi_tag), op_id(in_op), + num_bytes(in_num_bytes), offset(in_offset), + packed_direct(in_packed_direct) { } + int nchunks = 0; RDMA_HandleType rdma_handle = no_rdma_handle; NodeType send_back = uninitialized_destination; NodeType recv_node = uninitialized_destination; diff --git a/src/vt/runtime/runtime.cc b/src/vt/runtime/runtime.cc index fda9441086..44f8805f3c 100644 --- a/src/vt/runtime/runtime.cc +++ b/src/vt/runtime/runtime.cc @@ -874,6 +874,23 @@ void Runtime::printStartupBanner() { } } + // Limit to between 256 B and 1 GiB. If its too small a VT envelope won't fit; + // if its too large we overflow an integer passed to MPI. + if (ArgType::vt_max_mpi_send_size < 256) { + vtAbort("Max size for MPI send must be greater than 256 B"); + } else if (ArgType::vt_max_mpi_send_size > 1ull << 30) { + vtAbort("Max size for MPI send must not be greater than 1 GiB (overflow)"); + } else { + auto const bytes = ArgType::vt_max_mpi_send_size; + auto const ret = util::memory::getBestMemoryUnit(bytes); + auto f_max = fmt::format( + "Splitting messages greater than {} {}", + std::get<1>(ret), std::get<0>(ret) + ); + auto f_max_arg = opt_on("--vt_max_mpi_send_size", f_max); + fmt::print("{}\t{}{}", vt_pre, f_max_arg, reset); + } + if (ArgType::vt_debug_all) { auto f11 = fmt::format("All debug prints are on (if enabled compile-time)"); auto f12 = opt_on("--vt_debug_all", f11); diff --git a/src/vt/serialization/messaging/serialized_data_msg.h b/src/vt/serialization/messaging/serialized_data_msg.h index c3dd8800eb..54abc563ef 100644 --- a/src/vt/serialization/messaging/serialized_data_msg.h +++ b/src/vt/serialization/messaging/serialized_data_msg.h @@ -64,6 +64,7 @@ struct SerializedDataMsgAny : MessageT { HandlerType handler = uninitialized_handler; TagType data_recv_tag = no_tag; NodeType from_node = uninitialized_destination; + int nchunks = 0; }; template diff --git a/src/vt/serialization/messaging/serialized_messenger.impl.h b/src/vt/serialization/messaging/serialized_messenger.impl.h index ad8ebb9b48..dbd5c2d581 100644 --- a/src/vt/serialization/messaging/serialized_messenger.impl.h +++ b/src/vt/serialization/messaging/serialized_messenger.impl.h @@ -91,6 +91,8 @@ template ) { auto const handler = sys_msg->handler; auto const& recv_tag = sys_msg->data_recv_tag; + auto const& nchunks = sys_msg->nchunks; + auto const& len = sys_msg->ptr_size; auto const epoch = envelopeGetEpoch(sys_msg->env); debug_print( @@ -107,8 +109,8 @@ template } auto node = sys_msg->from_node; - theMsg()->recvDataMsg( - recv_tag, sys_msg->from_node, + theMsg()->recvDataDirect( + nchunks, recv_tag, sys_msg->from_node, len, [handler,recv_tag,node,epoch,is_valid_epoch] (RDMA_GetType ptr, ActionType action){ // be careful here not to use "msg", it is no longer valid @@ -352,9 +354,11 @@ template auto sys_msg = makeMessage>(); auto send_serialized = [=](Active::SendFnType send){ auto ret = send(RDMA_GetType{ptr, ptr_size}, dest, no_tag); - EventType event = std::get<0>(ret); + EventType event = ret.getEvent(); theEvent()->attachAction(event, [=]{ std::free(ptr); }); - sys_msg->data_recv_tag = std::get<1>(ret); + sys_msg->data_recv_tag = ret.getTag(); + sys_msg->nchunks = ret.getNumChunks(); + sys_msg->ptr_size = ptr_size; }; auto cur_ref = envelopeGetRef(sys_msg->env); sys_msg->env = msg->env; diff --git a/src/vt/utils/memory/memory_units.cc b/src/vt/utils/memory/memory_units.cc index d952d79755..391814e7c0 100644 --- a/src/vt/utils/memory/memory_units.cc +++ b/src/vt/utils/memory/memory_units.cc @@ -69,4 +69,33 @@ MemoryUnitEnum getUnitFromString(std::string const& unit) { return MemoryUnitEnum::Bytes; } +std::tuple getBestMemoryUnit(std::size_t bytes) { + auto multiplier = static_cast(MemoryUnitEnum::Yottabytes); + for ( ; multiplier > 0; multiplier--) { + auto value_tmp = static_cast(bytes); + for (int8_t i = 0; i < static_cast(multiplier); i++) { + value_tmp /= 1024.0; + } + if (value_tmp >= 1.) { + break; + } + } + + // We found a multiplier that results in a value over 1.0, use it + vtAssert( + multiplier <= static_cast(MemoryUnitEnum::Yottabytes) and + multiplier >= 0, + "Must be a valid memory unit" + ); + + auto unit_name = getMemoryUnitName(static_cast(multiplier)); + + auto new_value = static_cast(bytes); + for (int8_t i = 0; i < static_cast(multiplier); i++) { + new_value /= 1024.0; + } + + return std::make_tuple(unit_name, new_value); +} + }}} /* end namespace vt::util::memory */ diff --git a/src/vt/utils/memory/memory_units.h b/src/vt/utils/memory/memory_units.h index c1699c5b7f..1fe2266d4f 100644 --- a/src/vt/utils/memory/memory_units.h +++ b/src/vt/utils/memory/memory_units.h @@ -52,14 +52,20 @@ namespace vt { namespace util { namespace memory { enum struct MemoryUnitEnum : int8_t { - Bytes = 0, - Kilobytes = 1, - Megabytes = 2, - Gigabytes = 3 + Bytes = 0, + Kilobytes = 1, + Megabytes = 2, + Gigabytes = 3, + Terabytes = 4, + Petabytes = 5, + Exabytes = 6, + Zettabytes = 7, + Yottabytes = 8 }; std::string getMemoryUnitName(MemoryUnitEnum unit); MemoryUnitEnum getUnitFromString(std::string const& unit); +std::tuple getBestMemoryUnit(std::size_t bytes); }}} /* end namespace vt::util::memory */ diff --git a/src/vt/vrt/collection/balance/elm_stats.cc b/src/vt/vrt/collection/balance/elm_stats.cc index cd3133a1e9..ae5a84571a 100644 --- a/src/vt/vrt/collection/balance/elm_stats.cc +++ b/src/vt/vrt/collection/balance/elm_stats.cc @@ -137,6 +137,10 @@ void ElementStats::updatePhase(PhaseType const& inc) { cur_phase_ += inc; } +void ElementStats::resetPhase() { + cur_phase_ = fst_lb_phase; +} + PhaseType ElementStats::getPhase() const { return cur_phase_; } diff --git a/src/vt/vrt/collection/balance/elm_stats.h b/src/vt/vrt/collection/balance/elm_stats.h index 3301043f8f..4113de51c8 100644 --- a/src/vt/vrt/collection/balance/elm_stats.h +++ b/src/vt/vrt/collection/balance/elm_stats.h @@ -88,6 +88,7 @@ struct ElementStats { ); void setModelWeight(TimeType const& time); void updatePhase(PhaseType const& inc = 1); + void resetPhase(); PhaseType getPhase() const; TimeType getLoad(PhaseType const& phase) const; TimeType getLoad(PhaseType phase, SubphaseType subphase) const; diff --git a/src/vt/vrt/collection/manager.h b/src/vt/vrt/collection/manager.h index 4a96e6c6b6..5d964f59c4 100644 --- a/src/vt/vrt/collection/manager.h +++ b/src/vt/vrt/collection/manager.h @@ -901,6 +901,8 @@ struct CollectionManager { /** * \brief Restore the collection (collective) from file. * + * \note Resets the phase to 0 for every element. + * * \param[in] range the range of the collection to restart * \param[in] file_base the base file name for the files to read * diff --git a/src/vt/vrt/collection/manager.impl.h b/src/vt/vrt/collection/manager.impl.h index 84fe1fef73..cf48254554 100644 --- a/src/vt/vrt/collection/manager.impl.h +++ b/src/vt/vrt/collection/manager.impl.h @@ -3343,6 +3343,7 @@ CollectionManager::restoreFromFile( // @todo: error check the file read with bytes in directory auto col_ptr = checkpoint::deserializeFromFile(file_name); + col_ptr->stats_.resetPhase(); token[idx].insertPtr(std::move(col_ptr)); } diff --git a/src/vt/vrt/collection/reducable/reducable.h b/src/vt/vrt/collection/reducable/reducable.h index f77e6e1e2b..415365a44c 100644 --- a/src/vt/vrt/collection/reducable/reducable.h +++ b/src/vt/vrt/collection/reducable/reducable.h @@ -70,25 +70,57 @@ struct Reducable : BaseProxyT { template < typename OpT = collective::None, typename MsgT, - ActiveTypedFnType *f = MsgT::template msgHandler< - MsgT, OpT, collective::reduce::operators::ReduceCallback - > + ActiveTypedFnType *f > EpochType reduce( MsgT *const msg, Callback cb, EpochType const& epoch = no_epoch, TagType const& tag = no_tag ) const; + template < + typename OpT = collective::None, + typename MsgT + > + EpochType reduce( + MsgT *const msg, Callback cb, EpochType const& epoch = no_epoch, + TagType const& tag = no_tag + ) const + { + return reduce< + OpT, + MsgT, + &MsgT::template msgHandler< + MsgT, OpT, collective::reduce::operators::ReduceCallback + > + >(msg, cb, epoch, tag); + } template < typename OpT, typename FunctorT, typename MsgT, - ActiveTypedFnType *f = MsgT::template msgHandler + ActiveTypedFnType *f > EpochType reduce( MsgT *const msg, EpochType const& epoch = no_epoch, TagType const& tag = no_tag ) const; + template < + typename OpT, + typename FunctorT, + typename MsgT + > + EpochType reduce( + MsgT *const msg, EpochType const& epoch = no_epoch, + TagType const& tag = no_tag + ) const + { + return reduce< + OpT, + FunctorT, + MsgT, + &MsgT::template msgHandler + >(msg, epoch, tag); + } template *f> EpochType reduce( diff --git a/tests/perf/ping_pong.cc b/tests/perf/ping_pong.cc index 1f0d4efd28..acd4a6f548 100644 --- a/tests/perf/ping_pong.cc +++ b/tests/perf/ping_pong.cc @@ -105,7 +105,7 @@ static void finishedPing(FinishedPingMsg* msg) { if (num_bytes != max_bytes) { auto pmsg = makeSharedMessage>(); - theMsg()->sendMsg, pingPong>( + theMsg()->sendMsg, pingPong>( pong_node, pmsg ); } @@ -133,7 +133,7 @@ static void pingPong(PingMsg* in_msg) { if (cnt >= num_pings) { auto msg = makeSharedMessage>(num_bytes); - theMsg()->sendMsg, finishedPing>( + theMsg()->sendMsg, finishedPing>( 0, msg ); } else { @@ -141,12 +141,12 @@ static void pingPong(PingMsg* in_msg) { theContext()->getNode() == ping_node ? pong_node : ping_node; #if REUSE_MESSAGE_PING_PONG // @todo: fix this memory allocation problem - theMsg()->sendMsg, pingPong>( + theMsg()->sendMsg, pingPong>( next, in_msg, [=]{ /*delete in_msg;*/ } ); #else auto m = makeSharedMessage>(cnt + 1); - theMsg()->sendMsg, pingPong>(next, m); + theMsg()->sendMsg, pingPong>(next, m); #endif } } @@ -169,7 +169,7 @@ int main(int argc, char** argv) { if (my_node == 0) { auto m = makeSharedMessage>(); - theMsg()->sendMsg, pingPong>(pong_node, m); + theMsg()->sendMsg, pingPong>(pong_node, m); } while (!rt->isTerminated()) { diff --git a/tests/unit/active/test_active_send_large.cc b/tests/unit/active/test_active_send_large.cc new file mode 100644 index 0000000000..17460b9a8d --- /dev/null +++ b/tests/unit/active/test_active_send_large.cc @@ -0,0 +1,174 @@ +/* +//@HEADER +// ***************************************************************************** +// +// test_active_send_large.cc +// DARMA Toolkit v. 1.0.0 +// DARMA/vt => Virtual Transport +// +// Copyright 2019 National Technology & Engineering Solutions of Sandia, LLC +// (NTESS). Under the terms of Contract DE-NA0003525 with NTESS, the U.S. +// Government retains certain rights in this software. +// +// Redistribution and use in source and binary forms, with or without +// modification, are permitted provided that the following conditions are met: +// +// * Redistributions of source code must retain the above copyright notice, +// this list of conditions and the following disclaimer. +// +// * Redistributions in binary form must reproduce the above copyright notice, +// this list of conditions and the following disclaimer in the documentation +// and/or other materials provided with the distribution. +// +// * Neither the name of the copyright holder nor the names of its +// contributors may be used to endorse or promote products derived from this +// software without specific prior written permission. +// +// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" +// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE +// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE +// ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE +// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR +// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF +// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS +// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN +// CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) +// ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE +// POSSIBILITY OF SUCH DAMAGE. +// +// Questions? Contact darma@sandia.gov +// +// ***************************************************************************** +//@HEADER +*/ + +#include +#include + +#include "test_parallel_harness.h" +#include "data_message.h" + +namespace vt { namespace tests { namespace unit { namespace large { + +struct SerializedTag {}; +struct NonSerializedTag {}; + +using RecvMsg = vt::Message; + +struct CallbackMsg : vt::Message { + vt::Callback cb_; +}; + +template +struct LargeMsg; + +template +struct LargeMsg< + nbytes, + T, + typename std::enable_if_t::value> +> : TestStaticSerialBytesMsg { }; + +template +struct LargeMsg< + nbytes, + T, + typename std::enable_if_t::value> +> : TestStaticBytesMsg { }; + +template +void fillMsg(T msg) { + auto arr = reinterpret_cast(&msg->payload[0]); + for (std::size_t i = 0; i < msg->bytes / sizeof(int64_t); i++) { + arr[i] = i; + } +} + +template +void checkMsg(T msg) { + auto arr = reinterpret_cast(&msg->payload[0]); + for (std::size_t i = 0; i < msg->bytes / sizeof(int64_t); i++) { + EXPECT_EQ(arr[i], i); + } +} + +template +void myHandler(MsgT* m) { + checkMsg(m); + auto msg = makeMessage(); + m->cb_.send(msg.get()); +} + +template +struct TestActiveSendLarge : TestParallelHarness { + using TagType = typename std::tuple_element<1,T>::type; + + // Set max size to 16 KiB for testing + void addAdditionalArgs() override { + new_arg = fmt::format("--vt_max_mpi_send_size=16384"); + addArgs(new_arg); + } + +private: + std::string new_arg; +}; + +TYPED_TEST_SUITE_P(TestActiveSendLarge); + +TYPED_TEST_P(TestActiveSendLarge, test_large_bytes_msg) { + using IntegralType = typename std::tuple_element<0,TypeParam>::type; + using TagType = typename std::tuple_element<1,TypeParam>::type; + + static constexpr NumBytesType const nbytes = 1ll << IntegralType::value; + + using LargeMsgType = LargeMsg; + + NodeType const this_node = theContext()->getNode(); + NodeType const num_nodes = theContext()->getNumNodes(); + + // over two nodes will allocate a lot of memory for the run + if (num_nodes != 2) { + return; + } + + int counter = 0; + auto e = pipe::LifetimeEnum::Once; + auto cb = theCB()->makeFunc(e, [&counter](RecvMsg*){ counter++; }); + + NodeType next_node = (this_node + 1) % num_nodes; + + vt::runInEpochCollective([&]{ + auto msg = makeMessage(); + fillMsg(msg); + msg->cb_ = cb; + theMsg()->sendMsg>(next_node, msg.get()); + }); + + EXPECT_EQ(counter, 1); +} + +REGISTER_TYPED_TEST_SUITE_P(TestActiveSendLarge, test_large_bytes_msg); + +using NonSerTestTypes = testing::Types< + std::tuple, NonSerializedTag>, + std::tuple, NonSerializedTag> + // std::tuple, NonSerializedTag> +>; + +using SerTestTypes = testing::Types< + std::tuple, SerializedTag>, + std::tuple, SerializedTag> + // std::tuple, SerializedTag> +>; + +INSTANTIATE_TYPED_TEST_SUITE_P( + test_large_bytes_serialized, TestActiveSendLarge, NonSerTestTypes, + DEFAULT_NAME_GEN +); + +INSTANTIATE_TYPED_TEST_SUITE_P( + test_large_bytes_nonserialized, TestActiveSendLarge, SerTestTypes, + DEFAULT_NAME_GEN +); + +}}}} // end namespace vt::tests::unit::large diff --git a/tests/unit/pool/test_pool_message_sizes.cc b/tests/unit/pool/test_pool_message_sizes.cc index 69bc114d02..d0746f419b 100644 --- a/tests/unit/pool/test_pool_message_sizes.cc +++ b/tests/unit/pool/test_pool_message_sizes.cc @@ -102,12 +102,12 @@ void TestPoolMessageSizes::testPoolFun(TestMsg* prev_msg) { if (count < max_test_count) { auto msg = makeSharedMessage>(); - theMsg()->sendMsg, testPoolFun>( + theMsg()->sendMsg, testPoolFun>( next, msg ); } else { auto msg = makeSharedMessage>(); - theMsg()->sendMsg, testPoolFun>( + theMsg()->sendMsg, testPoolFun>( next, msg ); count = 0; diff --git a/tests/unit/runtime/test_initialization.nompi.cc b/tests/unit/runtime/test_initialization.nompi.cc new file mode 100644 index 0000000000..b04cd35cab --- /dev/null +++ b/tests/unit/runtime/test_initialization.nompi.cc @@ -0,0 +1,60 @@ +/* +//@HEADER +// ***************************************************************************** +// +// test_initialization.nompi.cc +// DARMA Toolkit v. 1.0.0 +// DARMA/vt => Virtual Transport +// +// Copyright 2020 National Technology & Engineering Solutions of Sandia, LLC +// (NTESS). Under the terms of Contract DE-NA0003525 with NTESS, the U.S. +// Government retains certain rights in this software. +// +// Redistribution and use in source and binary forms, with or without +// modification, are permitted provided that the following conditions are met: +// +// * Redistributions of source code must retain the above copyright notice, +// this list of conditions and the following disclaimer. +// +// * Redistributions in binary form must reproduce the above copyright notice, +// this list of conditions and the following disclaimer in the documentation +// and/or other materials provided with the distribution. +// +// * Neither the name of the copyright holder nor the names of its +// contributors may be used to endorse or promote products derived from this +// software without specific prior written permission. +// +// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" +// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE +// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE +// ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE +// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR +// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF +// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS +// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN +// CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) +// ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE +// POSSIBILITY OF SUCH DAMAGE. +// +// Questions? Contact darma@sandia.gov +// +// ***************************************************************************** +//@HEADER +*/ + +#include + +#include "test_harness.h" + +#include + +namespace vt { namespace tests { namespace unit { + +using TestInitialization = TestHarness; + +TEST_F(TestInitialization, test_initialize_no_args) { + vt::initialize(); + vt::finalize(); +} + +}}} // end namespace vt::tests::unit diff --git a/tests/unit/test_parallel_harness.h b/tests/unit/test_parallel_harness.h index 6d98f10df0..985900fcfd 100644 --- a/tests/unit/test_parallel_harness.h +++ b/tests/unit/test_parallel_harness.h @@ -75,6 +75,9 @@ struct MPISingletonMultiTest { MPI_Finalize(); } +public: + MPI_Comm getComm() { return comm_; } + private: MPI_Comm comm_; }; @@ -119,6 +122,41 @@ struct TestParallelHarnessAny : TestHarnessAny { TestHarnessAny::TearDown(); } + +protected: + template + void addArgs(Arg& arg) { + this->additional_args_.emplace_back(&arg[0]); + } + + template + void addArgs(Arg& arg, Args&... args) { + this->additional_args_.emplace_back(&arg[0]); + addArgs(args...); + } + +private: + /** + * \internal \brief Add additional arguments used during initialization of vt + * components + * + * To add additional arguments override this function in your class and add + * needed arguments to `additional_args_` vector. + * + * Example: + * struct TestParallelHarnessWithStatsDumping : TestParallelHarnessParam { + * virtual void addAdditionalArgs() override { + * static char vt_lb_stats[]{"--vt_lb_stats"}; + * static char vt_lb_stats_dir[]{"--vt_lb_stats_dir=test_stats_dir"}; + * static char vt_lb_stats_file[]{"--vt_lb_stats_file=test_stats_outfile"}; + * + * addArgs(vt_lb_stats, vt_lb_stats_dir, vt_lb_stats_file); + * } + * }; + */ + virtual void addAdditionalArgs() {} + + std::vector additional_args_; }; using TestParallelHarness = TestParallelHarnessAny;