[clblas] 26/61: changing the heuristic to detect the small matrices
Ghislain Vaillant
ghisvail-guest at moszumanska.debian.org
Fri Jul 24 22:49:45 UTC 2015
This is an automated email from the git hooks/post-receive script.
ghisvail-guest pushed a commit to branch master
in repository clblas.
commit aa972ecacecdfeb5dd6669239b52841c380073e6
Author: BenjaminCoquelle <benjamin.coquelle at amd.com>
Date: Fri May 8 19:17:48 2015 +0100
changing the heuristic to detect the small matrices
---
src/library/blas/functor/hawaii.cc | 2 +-
src/library/blas/functor/hawaii_sgemmSplitKernel.cc | 2 +-
2 files changed, 2 insertions(+), 2 deletions(-)
diff --git a/src/library/blas/functor/hawaii.cc b/src/library/blas/functor/hawaii.cc
index 3824b91..a499024 100644
--- a/src/library/blas/functor/hawaii.cc
+++ b/src/library/blas/functor/hawaii.cc
@@ -101,7 +101,7 @@ clblasSgemmFunctor * FunctorSelectorHawaii::select_sgemm_specific(clblasSgemmFun
//TODO: the logic below is complicated; Needs cleanup;
clblasSgemmFunctor * functor;
bool Not_TT = ((args.transA==clblasNoTrans && args.transB==clblasTrans ) || ( args.transA==clblasNoTrans && args.transB==clblasNoTrans ) || ( args.transA==clblasTrans && args.transB==clblasNoTrans ));
- bool SmallMatrices = args.M/6*args.N/6<180*180 || ((args.M%64!=0 && args.N%64!=0 && args.M<1900 &&args.N<1900 ) && (args.M%96!=0 && args.N%96!=0 && args.M<1900 &&args.N<1900 ));
+ bool SmallMatrices = args.M/6*args.N/6<100*100 || (args.M/6*args.N/6<180*180 && (args.M%32!=0||args.N%32!=0) || ((args.M%64!=0 && args.N%64!=0 && args.M<1900 &&args.N<1900 ) && (args.M%96!=0 && args.N%96!=0 && args.M<1900 &&args.N<1900 ));
bool SmallMatricesMod32= (SmallMatrices && (args.M%32==0&&args.N%32==0)) ;
SmallMatricesMod32 = SmallMatricesMod32&&Not_TT&&args.K % 16 == 0;
//SmallMatrices= false;
diff --git a/src/library/blas/functor/hawaii_sgemmSplitKernel.cc b/src/library/blas/functor/hawaii_sgemmSplitKernel.cc
index 06eab3c..07eb674 100644
--- a/src/library/blas/functor/hawaii_sgemmSplitKernel.cc
+++ b/src/library/blas/functor/hawaii_sgemmSplitKernel.cc
@@ -1,4 +1,4 @@
-#if !defined CLBLAS_HAWAII_DYNAMIC_KERNEL && !defined CLBLAS_BONAIRE_DYNAMIC_KERNEL
+#if !defined CLBLAS_HAWAII_DYNAMIC_KERNEL || !defined CLBLAS_BONAIRE_DYNAMIC_KERNEL
#include <stdio.h>
#include <string.h>
--
Alioth's /usr/local/bin/git-commit-notice on /srv/git.debian.org/git/debian-science/packages/clblas.git
More information about the debian-science-commits
mailing list