Skip to content

Commit 745b744

Browse files
authored
Merge pull request #296 from daineAMD/master
ROCm 4.1 merge staging into master
2 parents 705cea6 + 7874dc0 commit 745b744

File tree

117 files changed

+11636
-4079
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

117 files changed

+11636
-4079
lines changed

.githooks/pre-commit

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -29,6 +29,7 @@ fi
2929

3030
# Change the copyright date at the top of any text files
3131
for file in $files; do
32+
[[ -L $file ]] && continue
3233
echo "Processing copyright dates in $file"
3334
if [[ -e $file ]]; then
3435
/usr/bin/perl -pi -e 'INIT { exit 1 if !-f $ARGV[0] || -B $ARGV[0]; $year = (localtime)[5] + 1900 }
@@ -39,6 +40,7 @@ done
3940

4041
# do the formatting
4142
for file in $files; do
43+
[[ -L $file ]] && continue
4244
if [[ -e $file ]] && echo $file | grep -Eq '\.c$|\.h$|\.hpp$|\.cpp$|\.cl$|\.in$|\.txt$|\.yaml$|\.yml$|\.sh$|\.py$|\.pl$|\.cmake$|\.md$|\.rst$|\.groovy$|\.ini$|\.awk$|\.csv$'; then
4345
echo "Processing line endings in $file"
4446
sed -i -e 's/[[:space:]]*$//' "$file" # Remove whitespace at end of lines
@@ -58,6 +60,7 @@ done
5860
# if clang-format exists, run it on C/C++ files
5961
if command -v clang-format >/dev/null; then
6062
for file in $files; do
63+
[[ -L $file ]] && continue
6164
if [[ -e $file ]] && echo $file | grep -Eq '\.c$|\.h$|\.hpp$|\.cpp$|\.cl$|\.h\.in$|\.hpp\.in$|\.cpp\.in$'; then
6265
echo "clang-format $file"
6366
clang-format -i -style=file "$file"

CHANGELOG.md

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,17 @@
11
# Change Log for hipBLAS
22

3+
## [hipBLAS 0.42.0 for ROCm 4.1.0]
4+
### Added
5+
- Added the following functions. All added functions include batched and strided-batched support with rocBLAS backend:
6+
- axpy_ex
7+
- dot_ex
8+
- nrm2_ex
9+
- rot_ex
10+
- scal_ex
11+
12+
### Fixed
13+
- Fixed complex unit test bug caused by incorrect caxpy and zaxpy function signatures
14+
315
## [hipBLAS 0.40.0 for ROCm 4.0.0]
416
### Added
517
- Added changelog

CMakeLists.txt

Lines changed: 19 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -49,12 +49,18 @@ include( ROCMInstallTargets )
4949
include( ROCMPackageConfigHelpers )
5050
include( ROCMInstallSymlinks )
5151

52-
set ( VERSION_STRING "0.40.0" )
52+
set ( VERSION_STRING "0.42.0" )
5353
rocm_setup_version( VERSION ${VERSION_STRING} )
5454

55+
if( NOT DEFINED $ENV{HIP_PATH})
56+
set( HIP_PATH "/opt/rocm/hip" )
57+
else( )
58+
set (HIP_PATH $ENV{HIP_PATH} )
59+
endif( )
60+
5561
# Append our library helper cmake path and the cmake path for hip (for convenience)
5662
# Users may override HIP path by specifying their own in CMAKE_MODULE_PATH
57-
list( APPEND CMAKE_MODULE_PATH ${CMAKE_CURRENT_SOURCE_DIR}/cmake )
63+
list( APPEND CMAKE_MODULE_PATH ${CMAKE_CURRENT_SOURCE_DIR}/cmake ${HIP_PATH}/cmake)
5864

5965
# NOTE: workaround until hip cmake modules fixes symlink logic in their config files; remove when fixed
6066
list( APPEND CMAKE_PREFIX_PATH /opt/rocm /opt/rocm/llvm /opt/rocm/hip )
@@ -70,17 +76,24 @@ endif( )
7076
# BUILD_SHARED_LIBS is a cmake built-in; we make it an explicit option such that it shows in cmake-gui
7177
option( BUILD_SHARED_LIBS "Build hipBLAS as a shared library" ON )
7278

73-
74-
# Hip headers required of all clients; clients use hip to allocate device memory
75-
find_package( hip REQUIRED CONFIG PATHS ${ROCM_PATH} /opt/rocm)
76-
7779
# Quietly look for CUDA, but if not found it's not an error
7880
# The presence of hip is not sufficient to determine if we want a rocm or cuda backend
7981
option(USE_CUDA "Look for CUDA and use that as a backend if found" ON)
8082
if(USE_CUDA)
8183
find_package( CUDA QUIET )
8284
endif()
8385

86+
# Hip headers required of all clients; clients use hip to allocate device memory
87+
if( USE_CUDA)
88+
find_package( HIP REQUIRED )
89+
else( )
90+
find_package(hip REQUIRED CONFIG PATHS ${ROCM_PATH} /opt/rocm)
91+
endif( )
92+
93+
if( USE_CUDA )
94+
list( APPEND HIP_INCLUDE_DIRS "${HIP_ROOT_DIR}/include" )
95+
endif( )
96+
8497
# CMake list of machine targets
8598
set( AMDGPU_TARGETS gfx803;gfx900;gfx906;gfx908 CACHE STRING "List of specific machine types for library to target" )
8699

bump_develop_version.sh

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -5,11 +5,11 @@
55
# - run this script in master branch
66
# - after running this script merge master into develop
77

8-
OLD_HIPBLAS_VERSION="0.40.0"
9-
NEW_HIPBLAS_VERSION="0.41.0"
8+
OLD_HIPBLAS_VERSION="0.42.0"
9+
NEW_HIPBLAS_VERSION="0.43.0"
1010

11-
OLD_MINIMUM_ROCBLAS_VERSION="2.34.0"
12-
NEW_MINIMUM_ROCBLAS_VERSION="2.35.0"
11+
OLD_MINIMUM_ROCBLAS_VERSION="2.36.0"
12+
NEW_MINIMUM_ROCBLAS_VERSION="2.37.0"
1313

1414
OLD_MINIMUM_ROCSOLVER_VERSION="3.10.0"
1515
NEW_MINIMUM_ROCSOLVER_VERSION="3.11.0"

bump_master_version.sh

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -6,11 +6,11 @@
66
# - after running this script and merging develop into master, run bump_develop_version.sh in master and
77
# merge master into develop
88

9-
OLD_HIPBLAS_VERSION="0.39.0"
10-
NEW_HIPBLAS_VERSION="0.40.0"
9+
OLD_HIPBLAS_VERSION="0.41.0"
10+
NEW_HIPBLAS_VERSION="0.42.0"
1111

12-
OLD_MINIMUM_ROCBLAS_VERSION="2.33.0"
13-
NEW_MINIMUM_ROCBLAS_VERSION="2.34.0"
12+
OLD_MINIMUM_ROCBLAS_VERSION="2.35.0"
13+
NEW_MINIMUM_ROCBLAS_VERSION="2.36.0"
1414

1515
OLD_MINIMUM_ROCSOLVER_VERSION="3.10.0"
1616
NEW_MINIMUM_ROCSOLVER_VERSION="3.11.0"

clients/benchmarks/CMakeLists.txt

Lines changed: 3 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -20,6 +20,9 @@ if( NOT TARGET hipblas )
2020
endif( )
2121
endif( )
2222

23+
find_package( GTest REQUIRED )
24+
include_directories(${GTEST_INCLUDE_DIRS})
25+
2326
set( hipblas_benchmark_common
2427
../common/utility.cpp
2528
../common/cblas_interface.cpp

clients/benchmarks/client.cpp

Lines changed: 6 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -1073,32 +1073,32 @@ try
10731073
"Leading dimension of matrix D, is only applicable to BLAS-EX ")
10741074

10751075
("stride_a",
1076-
value<hipblas_int>(&arg.stride_a)->default_value(128*128),
1076+
value<hipblasStride>(&arg.stride_a)->default_value(128*128),
10771077
"Specific stride of strided_batched matrix A, is only applicable to strided batched"
10781078
"BLAS-2 and BLAS-3: second dimension * leading dimension.")
10791079

10801080
("stride_b",
1081-
value<hipblas_int>(&arg.stride_b)->default_value(128*128),
1081+
value<hipblasStride>(&arg.stride_b)->default_value(128*128),
10821082
"Specific stride of strided_batched matrix B, is only applicable to strided batched"
10831083
"BLAS-2 and BLAS-3: second dimension * leading dimension.")
10841084

10851085
("stride_c",
1086-
value<hipblas_int>(&arg.stride_c)->default_value(128*128),
1086+
value<hipblasStride>(&arg.stride_c)->default_value(128*128),
10871087
"Specific stride of strided_batched matrix C, is only applicable to strided batched"
10881088
"BLAS-2 and BLAS-3: second dimension * leading dimension.")
10891089

10901090
("stride_d",
1091-
value<hipblas_int>(&arg.stride_d)->default_value(128*128),
1091+
value<hipblasStride>(&arg.stride_d)->default_value(128*128),
10921092
"Specific stride of strided_batched matrix D, is only applicable to strided batched"
10931093
"BLAS_EX: second dimension * leading dimension.")
10941094

10951095
("stride_x",
1096-
value<hipblas_int>(&arg.stride_x)->default_value(128),
1096+
value<hipblasStride>(&arg.stride_x)->default_value(128),
10971097
"Specific stride of strided_batched vector x, is only applicable to strided batched"
10981098
"BLAS_2: second dimension.")
10991099

11001100
("stride_y",
1101-
value<hipblas_int>(&arg.stride_y)->default_value(128),
1101+
value<hipblasStride>(&arg.stride_y)->default_value(128),
11021102
"Specific stride of strided_batched vector y, is only applicable to strided batched"
11031103
"BLAS_2: leading dimension.")
11041104

0 commit comments

Comments
 (0)