From 5b07269e3d0703f2dab4e7272f454c7fb48a4e20043c73cdba0bcd418626685e Mon Sep 17 00:00:00 2001 From: Christian Goll Date: Mon, 27 Sep 2021 09:23:35 +0000 Subject: [PATCH] Accepting request 919668 from home:mslacken:branches:network:cluster - updated to 21.08.1 with the following bug fixes: * Fix potential memory leak if a problem happens while allocating GRES for a job. * If an overallocation of GRES happens, terminate the creation of a job. * AutoDetect=nvml: Fatal if no devices found in MIG mode. * Print federation and cluster sacctmgr error messages to stderr. * Fix off-by-one error in --gpu-bind=mask_gpu. * Add --gpu-bind=none to disable gpu binding when using --gpus-per-task. * Handle the burst buffer state "alloc-revoke" which previously would not display in the job correctly. * Fix issue in the slurmstepd SPANK prolog/epilog handler where configuration values were used before being initialized. * Restore a step's ability to utilize all of an allocation's memory if --mem=0. * Fix --cpu-bind=verbose garbage taskid. * Fix cgroup task affinity issues from garbage taskid info. * Make gres_job_state_validate() client logging behavior as before 44466a4641. * Fix steps with --hint overriding an allocation with --threads-per-core. * Require requesting a GPU if --mem-per-gpu is requested. * Return error early if a job is requesting --ntasks-per-gpu and no gpus or task count. * Properly clear out pending step if unavailable to run with available resources. * Kill all processes spawned by burst_buffer.lua including descendants. * openapi/v0.0.{35,36,37} - Avoid setting default values of min_cpus, job name, cwd, mail_type, and contiguous on job update. * openapi/v0.0.{35,36,37} - Clear user hold on job update if hold=false. * Prevent CRON_JOB flag from being cleared when loading job state. * sacctmgr - Fix deleting WCKeys when not specifying a cluster. * Fix getting memory for a step when the first node in the step isn't the first node in the allocation. 
OBS-URL: https://build.opensuse.org/request/show/919668 OBS-URL: https://build.opensuse.org/package/show/network:cluster/slurm?expand=0&rev=186 --- ...t-condition-in-netloc-autoconf-macro.patch | 42 ---------------- slurm-21.08.0.tar.bz2 | 3 -- slurm-21.08.1.tar.bz2 | 3 ++ slurm.changes | 50 ++++++++++++++++++- slurm.spec | 6 +-- 5 files changed, 54 insertions(+), 50 deletions(-) delete mode 100644 Fix-statement-condition-in-netloc-autoconf-macro.patch delete mode 100644 slurm-21.08.0.tar.bz2 create mode 100644 slurm-21.08.1.tar.bz2 diff --git a/Fix-statement-condition-in-netloc-autoconf-macro.patch b/Fix-statement-condition-in-netloc-autoconf-macro.patch deleted file mode 100644 index f8f2c29..0000000 --- a/Fix-statement-condition-in-netloc-autoconf-macro.patch +++ /dev/null @@ -1,42 +0,0 @@ -From 1f8be9ffb586b8bc3e5c7bf45cef16db5bf9b479 Mon Sep 17 00:00:00 2001 -From: Tim McMullan -Date: Thu, 26 Aug 2021 16:58:37 -0600 -Subject: [PATCH] Fix statement condition in netloc autoconf macro. - -Includes output of running 'autoreconf -i'. -Continuation of d7c089ec63. 
- -Bug 12370 ---- - NEWS | 1 + - auxdir/x_ac_netloc.m4 | 2 +- - configure | 2 +- - 3 files changed, 3 insertions(+), 2 deletions(-) - ---- a/auxdir/x_ac_netloc.m4 -+++ b/auxdir/x_ac_netloc.m4 -@@ -21,7 +21,7 @@ AC_DEFUN([X_AC_NETLOC], - [AS_IF([test "x$with_netloc" != xno && test "x$with_netloc" != xyes], - [_x_ac_netloc_dirs="$with_netloc"])]) - -- if [test "$with_netloc" = xno]; then -+ if [test "x$with_netloc" = xno]; then - AC_MSG_WARN([support for netloc disabled]) - else - AC_CACHE_CHECK( -diff --git a/configure b/configure -index 3dbe39b9b8..d563cfcd56 100755 ---- a/configure -+++ b/configure -@@ -24168,7 +24168,7 @@ fi - fi - - -- if test "$with_netloc" = xno; then -+ if test "x$with_netloc" = xno; then - { $as_echo "$as_me:${as_lineno-$LINENO}: WARNING: support for netloc disabled" >&5 - $as_echo "$as_me: WARNING: support for netloc disabled" >&2;} - else --- -2.26.2 - diff --git a/slurm-21.08.0.tar.bz2 b/slurm-21.08.0.tar.bz2 deleted file mode 100644 index cf57f45..0000000 --- a/slurm-21.08.0.tar.bz2 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:08e0ef2448c4c6178044907b1eebe698aafe043c91adea52667acf75c0cefce7 -size 6731503 diff --git a/slurm-21.08.1.tar.bz2 b/slurm-21.08.1.tar.bz2 new file mode 100644 index 0000000..bedddaf --- /dev/null +++ b/slurm-21.08.1.tar.bz2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b648864036477f5c188c750b9bdaefaa429b04c36912d4db2a86ced2a8e0c04 +size 6736996 diff --git a/slurm.changes b/slurm.changes index 3767013..32ebb86 100644 --- a/slurm.changes +++ b/slurm.changes @@ -1,3 +1,51 @@ +------------------------------------------------------------------- +Fri Sep 17 07:22:44 UTC 2021 - Christian Goll + +- updated to 21.08.1 with following bug fixes: + * Fix potential memory leak if a problem happens while allocating GRES for + a job. + * If an overallocation of GRES happens terminate the creation of a job. 
+ * AutoDetect=nvml: Fatal if no devices found in MIG mode. + * Print federation and cluster sacctmgr error messages to stderr. + * Fix off-by-one error in --gpu-bind=mask_gpu. + * Add --gpu-bind=none to disable gpu binding when using --gpus-per-task. + * Handle the burst buffer state "alloc-revoke" which previously would not + display in the job correctly. + * Fix issue in the slurmstepd SPANK prolog/epilog handler where configuration + values were used before being initialized. + * Restore a step's ability to utilize all of an allocation's memory if --mem=0. + * Fix --cpu-bind=verbose garbage taskid. + * Fix cgroup task affinity issues from garbage taskid info. + * Make gres_job_state_validate() client logging behavior as before 44466a4641. + * Fix steps with --hint overriding an allocation with --threads-per-core. + * Require requesting a GPU if --mem-per-gpu is requested. + * Return error early if a job is requesting --ntasks-per-gpu and no gpus or + task count. + * Properly clear out pending step if unavailable to run with available + resources. + * Kill all processes spawned by burst_buffer.lua including descendants. + * openapi/v0.0.{35,36,37} - Avoid setting default values of min_cpus, + job name, cwd, mail_type, and contiguous on job update. + * openapi/v0.0.{35,36,37} - Clear user hold on job update if hold=false. + * Prevent CRON_JOB flag from being cleared when loading job state. + * sacctmgr - Fix deleting WCKeys when not specifying a cluster. + * Fix getting memory for a step when the first node in the step isn't the + first node in the allocation. + * Make SelectTypeParameters=CR_Core_Memory default for cons_tres and cons_res. + * Correctly handle mutex unlocks in the gres code if failures happen. + * Give better error message if -m plane is given with no size. + * Fix --distribution=arbitrary for salloc. + * Fix jobcomp/script regression introduced in 21.08.0rc1 0c75b9ac9d. + * Only send the batch node in the step_hostlist in the job credential. 
+ * When setting affinity for the batch step don't assume the batch host is node + 0. + * In task/affinity better checking for node existence when laying out + affinity. + * slurmrestd - fix job submission with auth/jwt. + +- removed Fix-statement-condition-in-netloc-autoconf-macro.patch + issue was fixed upstream + ------------------------------------------------------------------- Mon Sep 6 15:34:06 UTC 2021 - Egbert Eich @@ -9,7 +57,7 @@ Mon Sep 6 15:34:06 UTC 2021 - Egbert Eich ------------------------------------------------------------------- Thu Sep 2 13:19:33 UTC 2021 - Christian Goll -- updated to 21.08.1, major changes: +- updated to 21.08.0, major changes: * A new "AccountingStoreFlags=job_script" option to store the job scripts directly in SlurmDBD. * Added "sacct -o SubmitLine" format option to get the submit line diff --git a/slurm.spec b/slurm.spec index d98797e..d603adf 100644 --- a/slurm.spec +++ b/slurm.spec @@ -1,5 +1,5 @@ # -# spec file for package slurm +# spec file # # Copyright (c) 2021 SUSE LLC # @@ -18,7 +18,7 @@ # Check file META in sources: update so_version to (API_CURRENT - API_AGE) %define so_version 37 -%define ver 21.08.0 +%define ver 21.08.1 %define _ver _21_08 %define dl_ver %{ver} # so-version is 0 and seems to be stable @@ -135,7 +135,6 @@ Patch0: Remove-rpath-from-build.patch Patch1: slurm-2.4.4-init.patch Patch2: pam_slurm-Initialize-arrays-and-pass-sizes.patch Patch3: load-pmix-major-version.patch -Patch100: Fix-statement-condition-in-netloc-autoconf-macro.patch %{?upgrade:Provides: %{pname} = %{version}} %{?upgrade:Conflicts: %{pname}} @@ -547,7 +546,6 @@ Contains also cray specific documentation. %patch1 -p1 %patch2 -p1 %patch3 -p1 -%patch100 -p1 %if 0%{?python_ver} < 3 # Workaround for wrongly flagged python3 to keep SLE-11-SP4 building mkdir -p mybin; ln -s /usr/bin/python2 mybin/python3