From b40008d6c3afed0fe11523dcf0b27a3d3da69d59 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?David=20Test=C3=A9?= Date: Thu, 25 May 2023 16:03:34 +0200 Subject: [PATCH 1/7] test: aws fallback region --- ci/slab.toml | 8 +++++++- 1 file changed, 7 insertions(+), 1 deletion(-) diff --git a/ci/slab.toml b/ci/slab.toml index b206d62..8bcbd83 100644 --- a/ci/slab.toml +++ b/ci/slab.toml @@ -1,9 +1,15 @@ [profile.cpu] region = "eu-west-3" image_id = "ami-05e8e219ac7e82eba" # ubuntu 22.04 -instance_type = "t3.micro" +#instance_type = "t3.micro" +instance_type = "m6g.large" subnet_id = "subnet-0e042c7621461f754" +[profile.cpu_fallback] +region = "us-east-1" +image_id = "ami-0c4773f5626d919b6" +instance_type = "p3.2xlarge" + [profile.gpu] region = "eu-west-1" # Ireland image_id = "ami-0261faf04cf54fe0a" # GPU image in eu-west-1 to test auto retry From 086fe2c37969f7c76544d73140ebd0ba03d275fd Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?David=20Test=C3=A9?= Date: Wed, 21 Feb 2024 12:23:51 +0100 Subject: [PATCH 2/7] test: provision spot instance --- ci/slab.toml | 12 +++++++++--- 1 file changed, 9 insertions(+), 3 deletions(-) diff --git a/ci/slab.toml b/ci/slab.toml index 8bcbd83..fc69e31 100644 --- a/ci/slab.toml +++ b/ci/slab.toml @@ -1,8 +1,8 @@ [profile.cpu] region = "eu-west-3" image_id = "ami-05e8e219ac7e82eba" # ubuntu 22.04 -#instance_type = "t3.micro" -instance_type = "m6g.large" +instance_type = "t3.micro" +#instance_type = "m6g.large" subnet_id = "subnet-0e042c7621461f754" [profile.cpu_fallback] @@ -15,6 +15,12 @@ region = "eu-west-1" # Ireland image_id = "ami-0261faf04cf54fe0a" # GPU image in eu-west-1 to test auto retry instance_type = "p3.2xlarge" +[profile.gpu-bench] +region = "us-west-2" +image_id = "ami-02ae9b9b4fffdf66f" +instance_type = "p5.48xlarge" +max_spot_price = "200.49" + [command.cpu_test] workflow = "main.yml" profile = "cpu" @@ -24,6 +30,6 @@ check_run_name = "AWS tests (Slab)" [command.gpu_test] workflow = "main.yml" -profile = "gpu" +profile = "gpu-bench" check_run_name = "AWS tests spawn GPU (Slab)" From 7a4e7299daeeea8916c14ad5dc4828165c47ef22 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?David=20Test=C3=A9?= Date: Thu, 29 Feb 2024 16:14:52 +0100 Subject: [PATCH 3/7] test: add new backend handling --- ci/slab.toml | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/ci/slab.toml b/ci/slab.toml index fc69e31..9f251a9 100644 --- a/ci/slab.toml +++ b/ci/slab.toml @@ -5,6 +5,12 @@ instance_type = "t3.micro" #instance_type = "m6g.large" subnet_id = "subnet-0e042c7621461f754" +# Handling backends +[backend.aws.cpu] +region = "eu-west-3" +image_id = "ami-05e8e219ac7e82eba" # ubuntu 22.04 +instance_type = "t3.xlarge" + [profile.cpu_fallback] region = "us-east-1" image_id = "ami-0c4773f5626d919b6" From 121f2aa571f6b9a31f155ece2d46d4dfbf6a0cda Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?David=20Test=C3=A9?= Date: Fri, 1 Mar 2024 18:03:07 +0100 Subject: [PATCH 4/7] test: add fallback for backend handling --- ci/slab.toml | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/ci/slab.toml b/ci/slab.toml index 9f251a9..b2d4efb 100644 --- a/ci/slab.toml +++ b/ci/slab.toml @@ -9,6 +9,11 @@ subnet_id = "subnet-0e042c7621461f754" [backend.aws.cpu] region = "eu-west-3" image_id = "ami-05e8e219ac7e82eba" # ubuntu 22.04 +instance_type = "t345.xlarge" # Non existing instance type + +[backend.aws.cpu_fallback] +region = "eu-west-3" +image_id = "ami-05e8e219ac7e82eba" # ubuntu 22.04 instance_type = "t3.xlarge" [profile.cpu_fallback] From 670d7068efc07c0698c4f3919ea882681f99c753 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?David=20Test=C3=A9?= Date: Thu, 7 Mar 2024 09:49:47 +0100 Subject: [PATCH 5/7] test: return to primary backend working --- ci/slab.toml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/ci/slab.toml b/ci/slab.toml index b2d4efb..6f7aab2 100644 --- a/ci/slab.toml +++ b/ci/slab.toml @@ -9,7 +9,8 @@ subnet_id = "subnet-0e042c7621461f754" [backend.aws.cpu] region = "eu-west-3" image_id = "ami-05e8e219ac7e82eba" # ubuntu 22.04 -instance_type = "t345.xlarge" # Non existing instance type +instance_type = "t3.xlarge" +#instance_type = "t345.xlarge" # Non existing instance type [backend.aws.cpu_fallback] region = "eu-west-3" From ffb9a73b805b4b22e9e98171ec98afc6ee1438d3 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?David=20Test=C3=A9?= Date: Thu, 4 Apr 2024 15:28:26 +0200 Subject: [PATCH 6/7] WIP: test hyperstack backend provider --- ci/slab.toml | 10 ++++++++++ 1 file changed, 10 insertions(+) diff --git a/ci/slab.toml b/ci/slab.toml index 6f7aab2..750b1aa 100644 --- a/ci/slab.toml +++ b/ci/slab.toml @@ -22,6 +22,16 @@ region = "us-east-1" image_id = "ami-0c4773f5626d919b6" instance_type = "p3.2xlarge" +#[backend.hyperstack.gpu] +#environment_name = "norway" +#image_name = "Ubuntu Server 22.04 LTS R535 CUDA 12.2" +#flavor_name = "n1-cpu-small" + +[backend.hyperstack.gpu] +environment_name = "canada" +image_name = "Ubuntu Server 22.04 LTS R535 CUDA 12.2" +flavor_name = "m" + [profile.gpu] region = "eu-west-1" # Ireland image_id = "ami-0261faf04cf54fe0a" # GPU image in eu-west-1 to test auto retry From f717c8e6a32547a33023ae982dd1daae44e99a21 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?David=20Test=C3=A9?= Date: Fri, 12 Apr 2024 15:50:51 +0200 Subject: [PATCH 7/7] test: test github architecture runners --- ci/slab.toml | 2 ++ 1 file changed, 2 insertions(+) diff --git a/ci/slab.toml b/ci/slab.toml index 750b1aa..05bc3a0 100644 --- a/ci/slab.toml +++ b/ci/slab.toml @@ -9,7 +9,9 @@ subnet_id = "subnet-0e042c7621461f754" [backend.aws.cpu] region = "eu-west-3" image_id = "ami-05e8e219ac7e82eba" # ubuntu 22.04 +#image_id = "ami-00232bbfe70330a10" # ubuntu 22.04 ARM64 instance_type = "t3.xlarge" +#instance_type = "t4g.medium" # ARM machine #instance_type = "t345.xlarge" # Non existing instance type [backend.aws.cpu_fallback]