forked from ROCm/rocblas
377 lines
11 KiB
RPMSpec
377 lines
11 KiB
RPMSpec
#
|
|
# spec file for package rocblas
|
|
#
|
|
# Copyright Fedora Project Authors.
|
|
#
|
|
# Permission is hereby granted, free of charge, to any person obtaining a copy
|
|
# of this software and associated documentation files (the "Software"), to
|
|
# deal in the Software without restriction, including without limitation the
|
|
# rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
|
|
# sell copies of the Software, and to permit persons to whom the Software is
|
|
# furnished to do so, subject to the following conditions:
|
|
#
|
|
# The above copyright notice and this permission notice shall be included in
|
|
# all copies or substantial portions of the Software.
|
|
#
|
|
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
|
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
|
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
|
# THE SOFTWARE.
|
|
#
|
|
# Copyright (c) 2025 SUSE LLC and contributors
|
|
#
|
|
# All modifications and additions to the file contributed by third parties
|
|
# remain the property of their copyright owners, unless otherwise agreed
|
|
# upon. The license for this file, and modifications and additions to the
|
|
# file, is the same license as for the pristine package itself (unless the
|
|
# license for the pristine package is not an Open Source License, in which
|
|
# case the license is the MIT License). An "Open Source License" is a
|
|
# license that conforms to the Open Source Definition (Version 1.9)
|
|
# published by the Open Source Initiative.
|
|
|
|
# Please submit bugfixes or comments via https://bugs.opensuse.org/
|
|
#
|
|
|
|
|
|
%if 0%{?suse_version}
|
|
%global rocblas_name librocblas4
|
|
%else
|
|
%global rocblas_name rocblas
|
|
%endif
|
|
|
|
%global upstreamname rocBLAS
|
|
%global rocm_release 6.4
|
|
%global rocm_patch 2
|
|
%global rocm_version %{rocm_release}.%{rocm_patch}
|
|
|
|
%global toolchain rocm
|
|
# hipcc does not support some clang flags
|
|
%global build_cxxflags %(echo %{optflags} | sed -e 's/-fstack-protector-strong/-Xarch_host -fstack-protector-strong/' -e 's/-fcf-protection/-Xarch_host -fcf-protection/' -e 's/-mtls-dialect=gnu2//')
|
|
|
|
%bcond_with debug
|
|
%if %{with debug}
|
|
%global build_type DEBUG
|
|
%else
|
|
%global build_type RelWithDebInfo
|
|
%endif
|
|
|
|
%bcond_without compress
|
|
%if %{with compress}
|
|
%global build_compress ON
|
|
%else
|
|
%global build_compress OFF
|
|
%endif
|
|
|
|
%bcond_with test
|
|
%if %{with test}
|
|
%global build_test ON
|
|
%global __brp_check_rpaths %{nil}
|
|
%else
|
|
%global build_test OFF
|
|
%endif
|
|
|
|
# Option to test suite for testing on real HW:
|
|
# May have to set gpu under test with
|
|
# export HIP_VISIBLE_DEVICES=<num> - 0, 1 etc.
|
|
%bcond_with check
|
|
|
|
# Tensile in 6.4 does not support generics
|
|
# https://github.com/ROCm/Tensile/issues/2124
|
|
%if 0%{?suse_version}
|
|
# not in tw
|
|
%bcond_with tensile
|
|
%else
|
|
%bcond_without tensile
|
|
%endif
|
|
|
|
%if %{with tensile}
|
|
%global build_tensile ON
|
|
%else
|
|
%global build_tensile OFF
|
|
%endif
|
|
|
|
# Compression type and level for source/binary package payloads.
|
|
# "w7T0.xzdio" xz level 7 using %%{getncpus} threads
|
|
%global _source_payload w7T0.xzdio
|
|
%global _binary_payload w7T0.xzdio
|
|
|
|
# SUSE/OSB times out because -O is added to the make args
|
|
# This accumulates all the output from the long running tensile
|
|
# jobs.
|
|
%global _make_output_sync %{nil}
|
|
|
|
# OracleLinux 9 has a problem with it's strip not recognizing *.co's
|
|
%global __strip %rocmllvm_bindir/llvm-strip
|
|
|
|
# Use ninja if it is available
|
|
# Ninja is available on suse but obs times out with ninja build, make doesn't
|
|
%if 0%{?fedora}
|
|
%bcond_without ninja
|
|
%else
|
|
%bcond_with ninja
|
|
%endif
|
|
|
|
%if %{with ninja}
|
|
%global cmake_generator -G Ninja
|
|
%else
|
|
%global cmake_generator %{nil}
|
|
%endif
|
|
|
|
%global cmake_config \\\
|
|
-DBLAS_INCLUDE_DIR=%{_includedir}/%{blaslib} \\\
|
|
-DBLAS_LIBRARY=%{blaslib} \\\
|
|
-DCMAKE_CXX_COMPILER=hipcc \\\
|
|
-DCMAKE_C_COMPILER=hipcc \\\
|
|
-DCMAKE_LINKER=%rocmllvm_bindir/ld.lld \\\
|
|
-DCMAKE_AR=%rocmllvm_bindir/llvm-ar \\\
|
|
-DCMAKE_RANLIB=%rocmllvm_bindir/llvm-ranlib \\\
|
|
-DCMAKE_BUILD_TYPE=%{build_type} \\\
|
|
-DCMAKE_PREFIX_PATH=%{rocmllvm_cmakedir}/.. \\\
|
|
-DCMAKE_SKIP_RPATH=ON \\\
|
|
-DCMAKE_VERBOSE_MAKEFILE=ON \\\
|
|
-DBUILD_FILE_REORG_BACKWARD_COMPATIBILITY=OFF \\\
|
|
-DROCM_SYMLINK_LIBS=OFF \\\
|
|
-DHIP_PLATFORM=amd \\\
|
|
-DBUILD_CLIENTS_BENCHMARKS=%{build_test} \\\
|
|
-DBUILD_CLIENTS_TESTS=%{build_test} \\\
|
|
-DBUILD_CLIENTS_TESTS_OPENMP=OFF \\\
|
|
-DBUILD_FORTRAN_CLIENTS=OFF \\\
|
|
-DBUILD_OFFLOAD_COMPRESS=%{build_compress} \\\
|
|
-DBUILD_WITH_HIPBLASLT=OFF \\\
|
|
-DTensile_COMPILER=hipcc \\\
|
|
-DTensile_CPU_THREADS=${CORES} \\\
|
|
-DTensile_LIBRARY_FORMAT=%{tensile_library_format} \\\
|
|
-DTensile_VERBOSE=%{tensile_verbose} \\\
|
|
-DTensile_DIR=${TP}/cmake \\\
|
|
-DBUILD_WITH_PIP=OFF
|
|
|
|
%bcond_with generic
|
|
%global rocm_gpu_list_generic "gfx9-generic;gfx9-4-generic;gfx10-1-generic;gfx10-3-generic;gfx11-generic;gfx12-generic"
|
|
%if %{with generic}
|
|
%global gpu_list %{rocm_gpu_list_generic}
|
|
%else
|
|
%global gpu_list %{rocm_gpu_list_default}
|
|
%endif
|
|
|
|
Name: rocblas
|
|
Version: %{rocm_version}
|
|
Release: 10%{?dist}
|
|
Summary: BLAS implementation for ROCm
|
|
URL: https://github.com/ROCmSoftwarePlatform/%{upstreamname}
|
|
License: BSD-3-Clause AND MIT
|
|
|
|
Source0: %{url}/archive/refs/tags/rocm-%{rocm_version}.tar.gz#/%{upstreamname}-%{rocm_version}.tar.gz
|
|
Patch2: 0001-fixup-install-of-tensile-output.patch
|
|
Patch4: 0001-offload-compress-option.patch
|
|
Patch6: 0001-rocblas-remove-roctracer.patch
|
|
|
|
BuildRequires: cmake
|
|
BuildRequires: gcc-c++
|
|
BuildRequires: rocm-cmake
|
|
BuildRequires: rocm-comgr-devel
|
|
BuildRequires: rocm-compilersupport-macros
|
|
BuildRequires: rocm-hip-devel
|
|
BuildRequires: rocm-rpm-macros
|
|
BuildRequires: rocm-runtime-devel
|
|
|
|
%if %{with tensile}
|
|
%if 0%{?suse_version}
|
|
BuildRequires: msgpack-cxx-devel
|
|
%global tensile_library_format msgpack
|
|
# OBS vm times out without console output
|
|
%global tensile_verbose 2
|
|
BuildRequires: python3-joblib
|
|
BuildRequires: python3-tensile-devel
|
|
%else
|
|
BuildRequires: python3dist(tensile)
|
|
%if 0%{?rhel}
|
|
%global tensile_verbose 2
|
|
%global tensile_library_format yaml
|
|
%else
|
|
BuildRequires: msgpack-devel
|
|
%global tensile_verbose 1
|
|
%global tensile_library_format msgpack
|
|
%endif
|
|
%endif # suse_version
|
|
%else
|
|
%global tensile_verbose %{nil}
|
|
%global tensile_library_format %{nil}
|
|
%endif # tensile
|
|
|
|
%if %{with compress}
|
|
BuildRequires: pkgconfig(libzstd)
|
|
%endif
|
|
|
|
%if %{with test}
|
|
|
|
BuildRequires: libomp-devel
|
|
BuildRequires: rocm-smi-devel
|
|
BuildRequires: rocminfo
|
|
|
|
%if 0%{?suse_version}
|
|
BuildRequires: python3-PyYAML
|
|
BuildRequires: gcc-fortran
|
|
BuildRequires: gtest
|
|
BuildRequires: openblas-devel
|
|
%global blaslib openblas
|
|
%else
|
|
BuildRequires: gcc-gfortran
|
|
BuildRequires: gtest-devel
|
|
BuildRequires: python3dist(pyyaml)
|
|
%if 0%{?rhel}
|
|
BuildRequires: flexiblas-devel
|
|
%global blaslib flexiblas
|
|
%else
|
|
BuildRequires: blas-devel
|
|
%global blaslib cblas
|
|
%endif
|
|
%endif
|
|
%endif
|
|
|
|
%if %{with ninja}
|
|
%if 0%{?fedora} || 0%{?rhel}
|
|
BuildRequires: ninja-build
|
|
%endif
|
|
%if 0%{?suse_version}
|
|
BuildRequires: ninja
|
|
%define __builder ninja
|
|
%endif
|
|
%endif
|
|
|
|
Provides: rocblas = %{version}-%{release}
|
|
|
|
# Only x86_64 works right now:
|
|
ExclusiveArch: x86_64
|
|
|
|
%description
|
|
rocBLAS is the AMD library for Basic Linear Algebra Subprograms
|
|
(BLAS) on the ROCm platform. It is implemented in the HIP
|
|
programming language and optimized for AMD GPUs.
|
|
|
|
%if 0%{?suse_version}
|
|
%package -n %{rocblas_name}
|
|
Summary: Shared libraries for %{name}
|
|
|
|
%description -n %{rocblas_name}
|
|
%{summary}
|
|
|
|
%ldconfig_scriptlets -n %{rocblas_name}
|
|
%endif
|
|
|
|
%package devel
|
|
Summary: Libraries and headers for %{name}
|
|
Requires: %{rocblas_name}%{?_isa} = %{version}-%{release}
|
|
Requires: cmake(hip)
|
|
|
|
%description devel
|
|
%{summary}
|
|
|
|
%if %{with test}
|
|
%package test
|
|
Summary: Tests for %{name}
|
|
Requires: %{name}%{?_isa} = %{version}-%{release}
|
|
Requires: diffutils
|
|
|
|
%description test
|
|
%{summary}
|
|
%endif
|
|
|
|
%prep
|
|
%autosetup -p1 -n %{upstreamname}-rocm-%{version}
|
|
sed -i -e 's@set( BLAS_LIBRARY "blas" )@set( BLAS_LIBRARY "%blaslib" )@' clients/CMakeLists.txt
|
|
sed -i -e 's@target_link_libraries( rocblas-test PRIVATE ${BLAS_LIBRARY} ${GTEST_BOTH_LIBRARIES} roc::rocblas )@target_link_libraries( rocblas-test PRIVATE %blaslib ${GTEST_BOTH_LIBRARIES} roc::rocblas )@' clients/gtest/CMakeLists.txt
|
|
|
|
# no git in this build
|
|
sed -i -e 's@find_package(Git REQUIRED)@find_package(Git)@' library/CMakeLists.txt
|
|
|
|
# On Tumbleweed Q2,2025
|
|
# /usr/include/gtest/internal/gtest-port.h:279:2: error: C++ versions less than C++14 are not supported.
|
|
# 279 | #error C++ versions less than C++14 are not supported.
|
|
# Convert the c++11's to c++14
|
|
sed -i -e 's@CXX_STANDARD 11@CXX_STANDARD 14@' clients/samples/CMakeLists.txt
|
|
|
|
%if 0%{?suse_version}
|
|
# Suse's libgfortran.so for gcc 14 is here
|
|
# /usr/lib64/gcc/x86_64-suse-linux/14/libgfortran.so
|
|
# Without adding this path with -L, it isn't found, but thankfully it isn't really needed
|
|
sed -i -e 's@list( APPEND COMMON_LINK_LIBS "-lgfortran")@#list( APPEND COMMON_LINK_LIBS "-lgfortran")@' clients/{benchmarks,gtest}/CMakeLists.txt
|
|
%endif
|
|
|
|
%build
|
|
|
|
# With compat llvm the system clang is wrong
|
|
CLANG_PATH=`hipconfig --hipclangpath`
|
|
export TENSILE_ROCM_ASSEMBLER_PATH=${CLANG_PATH}/clang++
|
|
export TENSILE_ROCM_OFFLOAD_BUNDLER_PATH=${CLANG_PATH}/clang-offload-bundler
|
|
# Work around problem with koji's ld
|
|
export HIPCC_LINK_FLAGS_APPEND=-fuse-ld=lld
|
|
|
|
%if %{with tensile}
|
|
TP=`/usr/bin/TensileGetPath`
|
|
%endif
|
|
|
|
CORES=`lscpu | grep 'Core(s)' | awk '{ print $4 }'`
|
|
if [ ${CORES}x = x ]; then
|
|
CORES=1
|
|
fi
|
|
# Try again..
|
|
if [ ${CORES} = 1 ]; then
|
|
CORES=`lscpu | grep '^CPU(s)' | awk '{ print $2 }'`
|
|
if [ ${CORES}x = x ]; then
|
|
CORES=4
|
|
fi
|
|
fi
|
|
|
|
%cmake %{cmake_generator} %{cmake_config} \
|
|
-DGPU_TARGETS=%{gpu_list} \
|
|
-DBUILD_WITH_TENSILE=%{build_tensile} \
|
|
-DCMAKE_INSTALL_LIBDIR=%_libdir \
|
|
|
|
%cmake_build
|
|
|
|
%install
|
|
%cmake_install
|
|
|
|
rm -f %{buildroot}%{_prefix}/share/doc/rocblas/LICENSE.md
|
|
|
|
%check
|
|
%if %{with test}
|
|
%if %{with check}
|
|
%if 0%{?suse_version}
|
|
export LD_LIBRARY_PATH=%{__builddir}/library/src:$LD_LIBRARY_PATH
|
|
%{__builddir}/clients/staging/rocblas-test --gtest_brief=1
|
|
%else
|
|
export LD_LIBRARY_PATH=%{_vpath_builddir}/library/src:$LD_LIBRARY_PATH
|
|
%{_vpath_builddir}/clients/staging/rocblas-test --gtest_brief=1
|
|
%endif
|
|
%endif
|
|
%endif
|
|
|
|
%files -n %{rocblas_name}
|
|
%license LICENSE.md
|
|
%{_libdir}/librocblas.so.4{,.*}
|
|
%if %{with tensile}
|
|
%dir %{_libdir}/rocblas
|
|
%dir %{_libdir}/rocblas/library
|
|
%{_libdir}/rocblas/library/Kernels*
|
|
%{_libdir}/rocblas/library/Tensile*
|
|
%endif
|
|
|
|
%files devel
|
|
%doc README.md
|
|
%dir %{_libdir}/cmake/rocblas
|
|
%dir %{_includedir}/rocblas
|
|
%{_includedir}/rocblas/*
|
|
%{_libdir}/cmake/rocblas/*.cmake
|
|
%{_libdir}/librocblas.so
|
|
|
|
%if %{with test}
|
|
%files test
|
|
%{_bindir}/rocblas*
|
|
%endif
|
|
|
|
%changelog
|