From 2dbcc46a92349cc4d5fb1a10d73eeea2638509a1 Mon Sep 17 00:00:00 2001 From: Boris Popov Date: Thu, 12 Sep 2024 11:53:42 +0200 Subject: [PATCH] configured tests to run --- .github/workflows/terraform.yml | 2 +- k8s-training/tests/main.tftest.hcl | 1 + slurm/gpu_cluster.tf | 2 +- slurm/tests/main.tftest.hcl | 1 + slurm/variables.tf | 7 +++++++ 5 files changed, 11 insertions(+), 2 deletions(-) diff --git a/.github/workflows/terraform.yml b/.github/workflows/terraform.yml index 3b68b6d1..ba234aed 100644 --- a/.github/workflows/terraform.yml +++ b/.github/workflows/terraform.yml @@ -19,7 +19,7 @@ jobs: name: project-e00pjzzrtk1fs3yavy runs-on: ubuntu-latest strategy: - max-parallel: 2 + max-parallel: 3 matrix: solution: - name: k8s-inference diff --git a/k8s-training/tests/main.tftest.hcl b/k8s-training/tests/main.tftest.hcl index 6238e7bb..5ab20487 100644 --- a/k8s-training/tests/main.tftest.hcl +++ b/k8s-training/tests/main.tftest.hcl @@ -4,6 +4,7 @@ run "create_cluster" { variables { enable_loki = false # TODO: Disabling Loki since not possible to delete non-empty storage bucket test_mode = true + infiniband_fabric = "fabric-4" } assert { diff --git a/slurm/gpu_cluster.tf b/slurm/gpu_cluster.tf index 71639a63..08df678c 100644 --- a/slurm/gpu_cluster.tf +++ b/slurm/gpu_cluster.tf @@ -2,5 +2,5 @@ resource "nebius_compute_v1_gpu_cluster" "gpu-cluster-slurm" { parent_id = var.parent_id name = "gpu-cluster-slurm" - infiniband_fabric = "fabric-3" + infiniband_fabric = var.infiniband_fabric } diff --git a/slurm/tests/main.tftest.hcl b/slurm/tests/main.tftest.hcl index 66d45c39..ef2b2af3 100644 --- a/slurm/tests/main.tftest.hcl +++ b/slurm/tests/main.tftest.hcl @@ -4,5 +4,6 @@ run "create_cluster" { variables { cluster_workers_count = 2 test_mode = true + infiniband_fabric = "fabric-4" } } diff --git a/slurm/variables.tf b/slurm/variables.tf index 2acc651a..bfbb7cc3 100644 --- a/slurm/variables.tf +++ b/slurm/variables.tf @@ -93,3 +93,10 @@ variable "test_mode" { type = bool default = false } + + +variable "infiniband_fabric" { + description = "Infiniband's fabric name." + type = string + default = "fabric-4" +}