From 281dba57ab0219fdf804d30c3a8921c3a1f6b533 Mon Sep 17 00:00:00 2001 From: atalman Date: Fri, 22 Nov 2024 09:21:32 -0800 Subject: [PATCH 1/2] Use ephemeral runners for linux jobs --- .github/scale-config.yml | 12 ++++++++++++ tools/scripts/generate_binary_build_matrix.py | 4 ++-- 2 files changed, 14 insertions(+), 2 deletions(-) diff --git a/.github/scale-config.yml b/.github/scale-config.yml index 9f908af70e..6b2b105847 100644 --- a/.github/scale-config.yml +++ b/.github/scale-config.yml @@ -95,6 +95,12 @@ runner_types: is_ephemeral: false os: linux ami: al2023-ami-2023.5.202*-kernel-6.1-x86_64 + linux.2xlarge.ephemeral: + disk_size: 150 + instance_type: c5.2xlarge + is_ephemeral: true + os: linux + ami: al2023-ami-2023.5.202*-kernel-6.1-x86_64 linux.4xlarge: disk_size: 150 instance_type: c5.4xlarge @@ -143,6 +149,12 @@ runner_types: is_ephemeral: false os: linux ami: al2023-ami-2023.5.202*-kernel-6.1-x86_64 + linux.g5.4xlarge.nvidia.gpu.ephemeral: + disk_size: 150 + instance_type: g5.4xlarge + is_ephemeral: true + os: linux + ami: al2023-ami-2023.5.202*-kernel-6.1-x86_64 linux.g6.4xlarge.experimental.nvidia.gpu: disk_size: 150 instance_type: g6.4xlarge diff --git a/tools/scripts/generate_binary_build_matrix.py b/tools/scripts/generate_binary_build_matrix.py index 65d7e6f334..59c9dc1767 100644 --- a/tools/scripts/generate_binary_build_matrix.py +++ b/tools/scripts/generate_binary_build_matrix.py @@ -79,8 +79,8 @@ LIBTORCH_CONTAINER_IMAGES: Dict[Tuple[str, str], str] WHEEL_CONTAINER_IMAGES: Dict[str, str] -LINUX_GPU_RUNNER = "linux.g5.4xlarge.nvidia.gpu" -LINUX_CPU_RUNNER = "linux.2xlarge" +LINUX_GPU_RUNNER = "linux.g5.4xlarge.nvidia.gpu.ephemeral" +LINUX_CPU_RUNNER = "linux.2xlarge.ephemeral" LINUX_AARCH64_RUNNER = "linux.arm64.2xlarge" LINUX_AARCH64_GPU_RUNNER = "linux.arm64.m7g.4xlarge" WIN_GPU_RUNNER = "windows.g4dn.xlarge" From 6e0333504aee045bc445900af34ea4fdb7ae00e6 Mon Sep 17 00:00:00 2001 From: atalman Date: Fri, 22 Nov 2024 09:30:29 -0800 Subject: 
[PATCH 2/2] Add ephemeral linux runner types to LF scale configs --- .github/lf-canary-scale-config.yml | 12 ++++++++++++ .github/lf-scale-config.yml | 12 ++++++++++++ 2 files changed, 24 insertions(+) diff --git a/.github/lf-canary-scale-config.yml b/.github/lf-canary-scale-config.yml index 8e2ea2f198..0fe5778f57 100644 --- a/.github/lf-canary-scale-config.yml +++ b/.github/lf-canary-scale-config.yml @@ -99,6 +99,12 @@ runner_types: is_ephemeral: false os: linux ami: al2023-ami-2023.5.202*-kernel-6.1-x86_64 + lf.c.linux.2xlarge.ephemeral: + disk_size: 150 + instance_type: c5.2xlarge + is_ephemeral: true + os: linux + ami: al2023-ami-2023.5.202*-kernel-6.1-x86_64 lf.c.linux.4xlarge: disk_size: 150 instance_type: c5.4xlarge @@ -147,6 +153,12 @@ runner_types: is_ephemeral: false os: linux ami: al2023-ami-2023.5.202*-kernel-6.1-x86_64 + lf.c.linux.g5.4xlarge.nvidia.gpu.ephemeral: + disk_size: 150 + instance_type: g5.4xlarge + is_ephemeral: true + os: linux + ami: al2023-ami-2023.5.202*-kernel-6.1-x86_64 lf.c.linux.g6.4xlarge.experimental.nvidia.gpu: disk_size: 150 instance_type: g6.4xlarge diff --git a/.github/lf-scale-config.yml b/.github/lf-scale-config.yml index b1577768e6..f0876ad8fb 100644 --- a/.github/lf-scale-config.yml +++ b/.github/lf-scale-config.yml @@ -99,6 +99,12 @@ runner_types: is_ephemeral: false os: linux ami: al2023-ami-2023.5.202*-kernel-6.1-x86_64 + lf.linux.2xlarge.ephemeral: + disk_size: 150 + instance_type: c5.2xlarge + is_ephemeral: true + os: linux + ami: al2023-ami-2023.5.202*-kernel-6.1-x86_64 lf.linux.4xlarge: disk_size: 150 instance_type: c5.4xlarge @@ -147,6 +153,12 @@ runner_types: is_ephemeral: false os: linux ami: al2023-ami-2023.5.202*-kernel-6.1-x86_64 + lf.linux.g5.4xlarge.nvidia.gpu.ephemeral: + disk_size: 150 + instance_type: g5.4xlarge + is_ephemeral: true + os: linux + ami: al2023-ami-2023.5.202*-kernel-6.1-x86_64 lf.linux.g6.4xlarge.experimental.nvidia.gpu: disk_size: 150 instance_type: g6.4xlarge