Skip to content

Commit d19db5d

Browse files
committed
Merge branch 'develop'
2 parents 1f135e5 + 01b407c commit d19db5d

File tree

65 files changed

+84702
-35049
lines changed

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

65 files changed

+84702
-35049
lines changed

CMakeLists.txt

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -126,7 +126,7 @@ include( ROCMInstallTargets )
126126
include( ROCMPackageConfigHelpers )
127127
include( ROCMInstallSymlinks )
128128

129-
rocm_setup_version( VERSION 0.14.2.5 NO_GIT_TAG_VERSION )
129+
rocm_setup_version( VERSION 0.14.3.0 NO_GIT_TAG_VERSION )
130130

131131
# Append our library helper cmake path and the cmake path for hip (for convenience)
132132
# Users may override HIP path by specifying their own in CMAKE_MODULE_PATH
@@ -164,7 +164,7 @@ if( BUILD_WITH_TENSILE )
164164
else()
165165
# Use the virtual-env setup and download package from specified repo:
166166
set( tensile_fork "ROCmSoftwarePlatform" CACHE STRING "Tensile fork to use" )
167-
set( tensile_tag v4.5.1 CACHE STRING "Tensile tag to download" )
167+
set( tensile_tag v4.6.0 CACHE STRING "Tensile tag to download" )
168168
virtualenv_install("git+https://github.com/ROCmSoftwarePlatform/Tensile.git@${tensile_tag}")
169169
message (STATUS "using GIT Tensile fork=${tensile_fork} from branch=${tensile_tag}")
170170
endif()

Jenkinsfile

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@
44
// Mostly generated from snippet generator 'properties; set job properties'
55
// Time-based triggers added to execute nightly tests, e.g. '30 2 * * *' means 2:30 AM
66
properties([
7-
pipelineTriggers([cron('0 3 * * *'), [$class: 'PeriodicFolderTrigger', interval: '5m']]),
7+
pipelineTriggers([cron('0 1 * * *'), [$class: 'PeriodicFolderTrigger', interval: '5m']]),
88
buildDiscarder(logRotator(
99
artifactDaysToKeepStr: '',
1010
artifactNumToKeepStr: '',

bump_develop_version.sh

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -5,10 +5,10 @@
55
# - run this script in master branch
66
# - after running this script merge master into develop
77

8-
OLD_ROCBLAS_VERSION="14.1.2"
9-
NEW_ROCBLAS_VERSION="15.1.2"
8+
OLD_ROCBLAS_VERSION="14.3.0"
9+
NEW_ROCBLAS_VERSION="15.3.0"
1010

11-
OLD_TENSILE_VERSION="tensile_tag v4.5.0"
11+
OLD_TENSILE_VERSION="tensile_tag v4.6.0"
1212
NEW_TENSILE_VERSION="tensile_tag \"develop\""
1313

1414
sed -i "s/${OLD_ROCBLAS_VERSION}/${NEW_ROCBLAS_VERSION}/g" CMakeLists.txt

bump_master_version.sh

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -6,14 +6,14 @@
66
# - after running this script and merging develop into master, run bump_develop_version.sh in master and
77
# merge master into develop
88

9-
OLD_ROCBLAS_VERSION="15.1.1"
10-
NEW_ROCBLAS_VERSION="14.1.2"
9+
OLD_ROCBLAS_VERSION="15.1.3"
10+
NEW_ROCBLAS_VERSION="14.3.0"
1111

1212
OLD_TENSILE_VERSION="tensile_tag \"develop\""
13-
NEW_TENSILE_VERSION="tensile_tag v4.5.0"
13+
NEW_TENSILE_VERSION="tensile_tag v4.6.0"
1414

15-
OLD_MINIMUM_REQUIRED_VERSION="MinimumRequiredVersion: 4.4.0"
16-
NEW_MINIMUM_REQUIRED_VERSION="MinimumRequiredVersion: 4.5.0"
15+
OLD_MINIMUM_REQUIRED_VERSION="MinimumRequiredVersion: 4.5.0"
16+
NEW_MINIMUM_REQUIRED_VERSION="MinimumRequiredVersion: 4.6.0"
1717

1818
sed -i "s/${OLD_ROCBLAS_VERSION}/${NEW_ROCBLAS_VERSION}/g" CMakeLists.txt
1919
sed -i "s/${OLD_TENSILE_VERSION}/${NEW_TENSILE_VERSION}/g" CMakeLists.txt

clients/benchmarks/client.cpp

Lines changed: 34 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -33,6 +33,7 @@
3333
#include "testing_gemm_strided_batched_kernel_name.hpp"
3434
#include "testing_trsm.hpp"
3535
#include "testing_gemm_ex.hpp"
36+
#include "testing_gemm_strided_batched_ex.hpp"
3637
#endif
3738

3839
namespace po = boost::program_options;
@@ -114,7 +115,7 @@ int main(int argc, char* argv[])
114115
"BLAS-2 and BLAS-3: second dimension * leading dimension.")
115116

116117
("stride_d",
117-
po::value<rocblas_int>(&argus.stride_c)->default_value(128*128),
118+
po::value<rocblas_int>(&argus.stride_d)->default_value(128*128),
118119
"Specific stride of strided_batched matrix D, is only applicable to strided batched"
119120
"BLAS_EX: second dimension * leading dimension.")
120121

@@ -500,6 +501,38 @@ int main(int argc, char* argv[])
500501
else if(precision == 'd')
501502
testing_gemm_strided_batched<double>(argus);
502503
}
504+
else if(function == "gemm_strided_batched_ex")
505+
{
506+
// adjust dimension for GEMM routines
507+
rocblas_int min_lda = argus.transA_option == 'N' ? argus.M : argus.K;
508+
rocblas_int min_ldb = argus.transB_option == 'N' ? argus.K : argus.N;
509+
rocblas_int min_ldc = argus.M;
510+
if(argus.lda < min_lda)
511+
{
512+
std::cout << "rocblas-bench INFO: lda < min_lda, set lda = " << min_lda << std::endl;
513+
argus.lda = min_lda;
514+
}
515+
if(argus.ldb < min_ldb)
516+
{
517+
std::cout << "rocblas-bench INFO: ldb < min_ldb, set ldb = " << min_ldb << std::endl;
518+
argus.ldb = min_ldb;
519+
}
520+
if(argus.ldc < min_ldc)
521+
{
522+
std::cout << "rocblas-bench INFO: ldc < min_ldc, set ldc = " << min_ldc << std::endl;
523+
argus.ldc = min_ldc;
524+
}
525+
526+
rocblas_int min_stride_c = argus.ldc * argus.N;
527+
if(argus.stride_c < min_stride_c)
528+
{
529+
std::cout << "rocblas-bench INFO: stride_c < min_stride_c, set stride_c = "
530+
<< min_stride_c << std::endl;
531+
argus.stride_c = min_stride_c;
532+
}
533+
534+
testing_gemm_strided_batched_ex(argus);
535+
}
503536
else if(function == "gemm_kernel_name")
504537
{
505538
// adjust dimension for GEMM routines

clients/common/norm.cpp

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -210,15 +210,15 @@ double norm_check_general<rocblas_half>(char norm_type,
210210
// use triangle inequality ||a+b|| <= ||a|| + ||b|| to calculate upper limit for Frobenius norm
211211
// of strided batched matrix
212212

213-
std::unique_ptr<float[]> hCPU_float(new float[N * lda]() + (batch_count - 1) * stride_a);
214-
std::unique_ptr<float[]> hGPU_float(new float[N * lda]() + (batch_count - 1) * stride_a);
213+
std::unique_ptr<float[]> hCPU_float(new float[N * lda + (batch_count - 1) * stride_a]());
214+
std::unique_ptr<float[]> hGPU_float(new float[N * lda + (batch_count - 1) * stride_a]());
215215
for(int i_batch = 0; i_batch < batch_count; i_batch++)
216216
{
217217
for(int i = 0; i < N * lda; i++)
218218
{
219219
int index = i + i_batch * stride_a;
220-
hCPU_float[index] = static_cast<float>(hCPU[index]);
221-
hGPU_float[index] = static_cast<float>(hGPU[index]);
220+
hCPU_float[index] = half_to_float(hCPU[index]);
221+
hGPU_float[index] = half_to_float(hGPU[index]);
222222
}
223223
}
224224

clients/gtest/CMakeLists.txt

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -37,6 +37,7 @@ if( BUILD_WITH_TENSILE )
3737
gemm_gtest.cpp
3838
gemm_strided_batched_gtest.cpp
3939
gemm_ex_gtest.cpp
40+
gemm_strided_batched_ex_gtest.cpp
4041
trsm_gtest.cpp
4142
)
4243
endif( )

0 commit comments

Comments
 (0)