Skip to content

Commit

Permalink
Update hpc slurm gromacs example and references to use Slurm V6
Browse files Browse the repository at this point in the history
  • Loading branch information
harshthakkar01 committed Jan 22, 2024
1 parent 214fcbd commit 29d96fa
Show file tree
Hide file tree
Showing 3 changed files with 49 additions and 34 deletions.
72 changes: 43 additions & 29 deletions community/examples/hpc-slurm-gromacs.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -29,7 +29,7 @@ deployment_groups:
- group: primary
modules:
- id: network1
source: modules/network/pre-existing-vpc
source: modules/network/vpc

## Filesystems
- id: appsfs
Expand All @@ -49,6 +49,7 @@ deployment_groups:
source: community/modules/scripts/spack-setup
settings:
install_dir: /sw/spack
spack_ref: v0.20.0

- id: spack-execute
source: community/modules/scripts/spack-execute
Expand All @@ -68,11 +69,11 @@ deployment_groups:
projections:
all: '{name}/{version}-{compiler.name}-{compiler.version}'
commands: |
# Un-comment and update mirror_url to install from spack cache
# if ! spack mirror list | grep -q gcs_cache; then
# spack mirror add --scope site gcs_cache gs://optionally_set_spack_cache_bucket
# fi
# spack buildcache keys --install --trust
## Un-comment and update mirror_url to install from spack cache
## if ! spack mirror list | grep -q gcs_cache; then
## spack mirror add --scope site gcs_cache gs://optionally_set_spack_cache_bucket
## fi
## spack buildcache keys --install --trust
spack config --scope defaults add config:build_stage:/sw/spack/spack-stage
spack config --scope defaults add -f /tmp/projections-config.yaml
Expand All @@ -82,38 +83,51 @@ deployment_groups:
spack compiler find --scope site
spack install [email protected]%[email protected]
spack install [email protected] %[email protected] ^[email protected] ^[email protected] %gcc@4.8.5
spack install [email protected] %[email protected] ^[email protected] ^[email protected] %[email protected].0
- id: compute_partition
source: community/modules/compute/SchedMD-slurm-on-gcp-partition
use:
- network1
- homefs
- appsfs
- id: script
source: modules/scripts/startup-script
settings:
partition_name: compute
max_node_count: 20
runners:
# Temporarily remove the Lustre client repo file to avoid a startup failure
# caused by a known issue.
- type: shell
destination: remove_lustre_client.sh
content: |
#!/bin/bash
rm /etc/yum.repos.d/lustre-client.repo
- $(spack-execute.spack_runner)

- id: compute_nodeset
source: community/modules/compute/schedmd-slurm-gcp-v6-nodeset
use: [network1]
settings:
node_count_dynamic_max: 20
bandwidth_tier: gvnic_enabled

- id: slurm_controller
source: community/modules/scheduler/SchedMD-slurm-on-gcp-controller
use:
- network1
- homefs
- appsfs
- compute_partition
- id: compute_partition
source: community/modules/compute/schedmd-slurm-gcp-v6-partition
use: [compute_nodeset, homefs, appsfs]
settings:
login_node_count: 1
partition_name: compute

- id: slurm_login
source: community/modules/scheduler/SchedMD-slurm-on-gcp-login-node
source: community/modules/scheduler/schedmd-slurm-gcp-v6-login
use: [network1]
settings:
name_prefix: login
machine_type: n2-standard-4
disable_login_public_ips: false

- id: slurm_controller
source: community/modules/scheduler/schedmd-slurm-gcp-v6-controller
use:
- network1
- compute_partition
- slurm_login
- homefs
- appsfs
- slurm_controller
- spack-execute
settings:
login_machine_type: c2-standard-4
login_scopes:
- https://www.googleapis.com/auth/cloud-platform
disable_controller_public_ips: false
login_startup_script: $(script.startup_script)
login_startup_scripts_timeout: 21600
Original file line number Diff line number Diff line change
Expand Up @@ -18,7 +18,7 @@
ansible.builtin.include_tasks: "tasks/wait-for-startup-script.yml"
vars:
vm_name: "{{ login_node }}"
timeout_seconds: 7200
timeout_seconds: 21600
- name: Ensure spack is installed
ansible.builtin.command: spack --version
changed_when: False
Expand Down
9 changes: 5 additions & 4 deletions tools/cloud-build/daily-tests/tests/spack-gromacs.yml
Original file line number Diff line number Diff line change
Expand Up @@ -15,14 +15,15 @@
---

test_name: hpc-slurm-gromacs
deployment_name: "spack-gromacs-{{ build }}"
deployment_name: "groma-{{ build }}"
slurm_cluster_name: "groma{{ build[0:5] }}"
zone: us-central1-c
workspace: /workspace
blueprint_yaml: "{{ workspace }}/community/examples/hpc-slurm-gromacs.yaml"
network: "default"
network: "{{ deployment_name }}-net"
max_nodes: 5
login_node: slurm-{{ deployment_name }}-login0
controller_node: slurm-{{ deployment_name }}-controller
login_node: "{{ slurm_cluster_name }}-login-*"
controller_node: "{{ slurm_cluster_name }}-controller"
post_deploy_tests:
- test-validation/test-spack.yml
custom_vars:
Expand Down

0 comments on commit 29d96fa

Please sign in to comment.