From f75d8017bb3c0c401d6db61c22898451ebf19505 Mon Sep 17 00:00:00 2001
From: Harsh Thakkar
Date: Wed, 2 Oct 2024 18:07:00 +0000
Subject: [PATCH] Increase resume-timeout for TPU partition in blueprint

---
 community/examples/hpc-slurm6-tpu.yaml | 1 +
 1 file changed, 1 insertion(+)

diff --git a/community/examples/hpc-slurm6-tpu.yaml b/community/examples/hpc-slurm6-tpu.yaml
index 606dae3246..5f9e9c3edd 100644
--- a/community/examples/hpc-slurm6-tpu.yaml
+++ b/community/examples/hpc-slurm6-tpu.yaml
@@ -49,6 +49,7 @@ deployment_groups:
     use: [tpu_nodeset]
     settings:
       partition_name: tpu
+      resume_timeout: 600
 
   - id: slurm_login
     source: community/modules/scheduler/schedmd-slurm-gcp-v6-login