From 05e5846b5c6e32769ba3d4cb22ea8a8dc9da6667 Mon Sep 17 00:00:00 2001 From: XaverStiensmeier Date: Wed, 13 Dec 2023 15:32:58 +0100 Subject: [PATCH] Tried to fix temps and tried update to 23.11 but has errors so commented that part out --- .../playbook/roles/bibigrid/files/slurm/cgroup.conf | 1 + resources/playbook/roles/bibigrid/tasks/042-slurm.yml | 9 +++++++++ .../roles/bibigrid/templates/slurm/job_container.conf | 4 ++-- .../playbook/roles/bibigrid/templates/slurm/slurm.conf | 1 + 4 files changed, 13 insertions(+), 2 deletions(-) diff --git a/resources/playbook/roles/bibigrid/files/slurm/cgroup.conf b/resources/playbook/roles/bibigrid/files/slurm/cgroup.conf index 657a243d..2705699f 100644 --- a/resources/playbook/roles/bibigrid/files/slurm/cgroup.conf +++ b/resources/playbook/roles/bibigrid/files/slurm/cgroup.conf @@ -1,3 +1,4 @@ +# maybe this causes errors when using 23.11 https://slurm.schedmd.com/faq.html#cgroupv2 CgroupMountpoint="/sys/fs/cgroup" CgroupAutomount=yes ConstrainCores=no diff --git a/resources/playbook/roles/bibigrid/tasks/042-slurm.yml b/resources/playbook/roles/bibigrid/tasks/042-slurm.yml index f965d264..33c25bff 100644 --- a/resources/playbook/roles/bibigrid/tasks/042-slurm.yml +++ b/resources/playbook/roles/bibigrid/tasks/042-slurm.yml @@ -15,6 +15,15 @@ - slurm-full - munge +#- name: Download Slurm (TEMPORARY) +# get_url: +# url: "https://docs.cebitec.uni-bielefeld.de/s/FjCP3xQPPnBwSy9/download?path=%2F&files=slurm-full_23.11.0-0_amd64.deb" # Replace with your package link +# dest: "/tmp/package.deb" # Destination where the package will be saved +#- name: Install Slurm package +# apt: +# deb: "/tmp/package.deb" +# state: present # Install the package if not already installed + - name: Create new secret (Munge) copy: content: '{{ slurm_conf.munge_key }}' diff --git a/resources/playbook/roles/bibigrid/templates/slurm/job_container.conf b/resources/playbook/roles/bibigrid/templates/slurm/job_container.conf index 2b51ed11..caa6a91c 100644 --- a/resources/playbook/roles/bibigrid/templates/slurm/job_container.conf +++ b/resources/playbook/roles/bibigrid/templates/slurm/job_container.conf @@ -1,5 +1,5 @@ NodeName={{ name }} AutoBasePath=true BasePath={{ '/vol/scratch/storage' if flavor.ephemeral else '/var/local/storage' }} {% for worker_group in groups | select('match', '^bibigrid_worker_*') %} - {% set first_worker = groups[worker_group] | first %} - NodeName={{ hostvars[first_worker].name }} AutoBasePath=true BasePath={{ '/vol/scratch/storage' if hostvars[first_worker].flavor.ephemeral else '/var/local/storage' }} +{% set first_worker = groups[worker_group] | first %} +NodeName={{ hostvars[first_worker].name }} AutoBasePath=true BasePath={{ '/vol/scratch/storage' if hostvars[first_worker].flavor.ephemeral else '/var/local/storage' }} {% endfor %} \ No newline at end of file diff --git a/resources/playbook/roles/bibigrid/templates/slurm/slurm.conf b/resources/playbook/roles/bibigrid/templates/slurm/slurm.conf index e2e1b9cd..767aa8ca 100644 --- a/resources/playbook/roles/bibigrid/templates/slurm/slurm.conf +++ b/resources/playbook/roles/bibigrid/templates/slurm/slurm.conf @@ -111,5 +111,6 @@ PrivateData=cloud ResumeFailProgram=/opt/slurm/fail.sh # job container +# TO BE TESTED JobContainerType=job_container/tmpfs PrologFlags=Contain \ No newline at end of file