Skip to content

Commit

Permalink
Disable reservation for larger jobs
Browse files Browse the repository at this point in the history
This commit disables the clima reservation for some of the larger CI
jobs. This increases the throughput for all the other jobs because Slurm
will not try to hold onto the reserved node to run the larger jobs.
  • Loading branch information
Sbozzolo committed Feb 3, 2025
1 parent 30c7357 commit c9f1652
Show file tree
Hide file tree
Showing 2 changed files with 11 additions and 0 deletions.
9 changes: 9 additions & 0 deletions .buildkite/longruns/pipeline.yml
Original file line number Diff line number Diff line change
Expand Up @@ -145,6 +145,7 @@ steps:
slurm_ntasks_per_node: 16
slurm_nodes: 4
slurm_mem_per_cpu: 16G
slurm_reservation: "false"
soft_fail: true

- label: "TARGET IDEALIZED: new target aqua - fixed ocean T, nocouple, atmos flux calc"
Expand All @@ -158,6 +159,7 @@ steps:
slurm_ntasks_per_node: 16
slurm_nodes: 4
slurm_mem_per_cpu: 16G
slurm_reservation: "false"
soft_fail: true

- label: "TARGET IDEALIZED: new target aqua - fixed ocean T, coupler flux calc"
Expand All @@ -171,6 +173,7 @@ steps:
slurm_ntasks_per_node: 16
slurm_nodes: 4
slurm_mem_per_cpu: 16G
slurm_reservation: "false"
soft_fail: true

- label: "TARGET IDEALIZED: new target aqua - evolving slab ocean T"
Expand All @@ -184,6 +187,7 @@ steps:
slurm_ntasks_per_node: 16
slurm_nodes: 4
slurm_mem_per_cpu: 16G
slurm_reservation: "false"
soft_fail: true

- label: "TARGET IDEALIZED: new target slab - fixed ocean T, bucket"
Expand All @@ -197,6 +201,7 @@ steps:
slurm_ntasks_per_node: 16
slurm_nodes: 4
slurm_mem_per_cpu: 16G
slurm_reservation: "false"
soft_fail: true

- label: "TARGET IDEALIZED: new target slab - evolving slab ocean T, bucket"
Expand All @@ -210,6 +215,7 @@ steps:
slurm_ntasks_per_node: 16
slurm_nodes: 4
slurm_mem_per_cpu: 16G
slurm_reservation: "false"
soft_fail: true

- group: "Current target tests: AMIP surfaces"
Expand All @@ -227,6 +233,7 @@ steps:
slurm_ntasks_per_node: 16
slurm_nodes: 4
slurm_mem_per_cpu: 16G
slurm_reservation: "false"
soft_fail: true

- label: "MPI AMIP FINE: new target amip: topo"
Expand All @@ -240,6 +247,7 @@ steps:
slurm_ntasks_per_node: 16
slurm_nodes: 4
slurm_mem_per_cpu: 16G
slurm_reservation: "false"
soft_fail: true

- label: "MPI AMIP FINE: new target amip: topo + diagedmf"
Expand All @@ -253,6 +261,7 @@ steps:
slurm_ntasks_per_node: 16
slurm_nodes: 4
slurm_mem_per_cpu: 20G
slurm_reservation: "false"
soft_fail: true

- group: "Current target tests on GPU: AMIP surface"
Expand Down
2 changes: 2 additions & 0 deletions .buildkite/pipeline.yml
Original file line number Diff line number Diff line change
Expand Up @@ -37,6 +37,7 @@ steps:
- "julia --project=experiments/ClimaCore/ -e 'using Pkg; Pkg.add(\"MPI\"); Pkg.add(\"CUDA\")'"
- "julia --project=experiments/ClimaCore/ -e 'using Pkg; Pkg.precompile()'"
- "julia --project=experiments/ClimaCore/ -e 'using Pkg; Pkg.status()'"
- "julia --project=experiments/ClimaCore/ -e 'using CUDA; CUDA.precompile_runtime()'"

- echo "--- Instantiate ClimaEarth experiments env"
- "julia --project=experiments/ClimaEarth/ -e 'using Pkg; Pkg.develop(path=\".\")'"
Expand Down Expand Up @@ -206,6 +207,7 @@ steps:
agents:
slurm_ntasks: 4
slurm_mem: 48GB
slurm_reservation: "false"

# short high-res performance test
- label: "Unthreaded AMIP FINE" # also reported by longruns with a flame graph
Expand Down

0 comments on commit c9f1652

Please sign in to comment.