[clblas] 69/75: Merge tag 'v2.12' into debian/master
Ghislain Vaillant
ghisvail-guest at moszumanska.debian.org
Tue Jan 24 23:30:48 UTC 2017
This is an automated email from the git hooks/post-receive script.
ghisvail-guest pushed a commit to branch debian/master
in repository clblas.
commit 219575eea12d4ee1ae7eb34a044692d8c03c820b
Merge: 40ea8f8 1f3de2a
Author: Ghislain Antony Vaillant <ghisvail at gmail.com>
Date: Sat Jan 21 13:18:26 2017 +0000
Merge tag 'v2.12' into debian/master
bugfix rollup release
.gitignore | 4 +-
.travis.yml | 16 +-
CONTRIBUTING.md | 4 +-
README.md | 19 +-
appveyor.yml | 17 +-
src/CMakeLists.txt | 79 +-
src/FindNetlib.cmake | 19 +
src/FindOpenCL.cmake | 143 ++-
src/clBLAS.h | 2 +-
src/client/CMakeLists.txt | 9 +-
src/client/clfunc_common.hpp | 100 ++-
src/client/clfunc_xgemm.hpp | 579 +++++++-----
src/client/clfunc_xsyrk.hpp | 6 +-
src/client/clfunc_xtrmm.hpp | 266 ++++--
src/client/client.cpp | 967 +++++++++++----------
src/include/defbool.h | 5 +
src/include/kerngen.h | 2 +-
src/library/CMakeLists.txt | 58 +-
src/library/blas/AutoGemm/Includes.py | 8 +-
src/library/blas/AutoGemm/KernelOpenCL.py | 12 +-
src/library/blas/AutoGemm/KernelParameters.py | 4 +-
.../dgemm_Col_NN_B0_MX048_NX048_KX08_src.cpp | 4 +-
.../dgemm_Col_NN_B1_MX048_NX048_KX08_src.cpp | 4 +-
.../dgemm_Col_NT_B0_MX048_NX048_KX08_src.cpp | 4 +-
.../dgemm_Col_NT_B1_MX048_NX048_KX08_src.cpp | 4 +-
.../dgemm_Col_TN_B0_MX048_NX048_KX08_src.cpp | 4 +-
.../dgemm_Col_TN_B1_MX048_NX048_KX08_src.cpp | 4 +-
.../sgemm_Col_NN_B0_MX032_NX032_KX16_src.cpp | 2 +-
.../sgemm_Col_NN_B0_MX064_NX064_KX16_src.cpp | 2 +-
.../sgemm_Col_NN_B0_MX096_NX096_KX16_src.cpp | 74 +-
...sgemm_Col_NN_B1_MX032_NX032_KX16_BRANCH_src.cpp | 72 +-
.../sgemm_Col_NN_B1_MX032_NX032_KX16_src.cpp | 4 +-
.../sgemm_Col_NN_B1_MX064_NX064_KX16_src.cpp | 2 +-
.../sgemm_Col_NN_B1_MX096_NX096_KX16_src.cpp | 2 +-
.../sgemm_Col_NT_B0_MX032_NX032_KX16_src.cpp | 2 +-
.../sgemm_Col_NT_B0_MX064_NX064_KX16_src.cpp | 2 +-
.../sgemm_Col_NT_B0_MX096_NX096_KX16_src.cpp | 74 +-
...sgemm_Col_NT_B1_MX032_NX032_KX16_BRANCH_src.cpp | 70 +-
...sgemm_Col_NT_B1_MX032_NX032_KX16_SINGLE_src.cpp | 35 +-
.../sgemm_Col_NT_B1_MX032_NX032_KX16_src.cpp | 2 +-
.../sgemm_Col_NT_B1_MX032_NX064_KX16_ROW_src.cpp | 22 +-
.../sgemm_Col_NT_B1_MX064_NX032_KX16_COL_src.cpp | 20 +-
.../sgemm_Col_NT_B1_MX064_NX064_KX16_src.cpp | 2 +-
.../sgemm_Col_NT_B1_MX096_NX096_KX16_src.cpp | 2 +-
.../sgemm_Col_NT_B1_MX128_NX128_KX16_src.cpp | 6 +-
.../sgemm_Col_TN_B0_MX032_NX032_KX16_src.cpp | 2 +-
.../sgemm_Col_TN_B0_MX064_NX064_KX16_src.cpp | 2 +-
.../sgemm_Col_TN_B0_MX096_NX096_KX16_src.cpp | 74 +-
...sgemm_Col_TN_B1_MX032_NX032_KX16_BRANCH_src.cpp | 60 +-
.../sgemm_Col_TN_B1_MX032_NX032_KX16_src.cpp | 2 +-
.../sgemm_Col_TN_B1_MX064_NX064_KX16_src.cpp | 2 +-
.../sgemm_Col_TN_B1_MX096_NX096_KX16_src.cpp | 2 +-
src/library/blas/functor/functor_xscal.cc | 2 +-
src/library/blas/generic/solution_seq_make.c | 6 +-
src/library/blas/gens/asum.cpp | 6 +-
src/library/blas/gens/axpy_reg.cpp | 8 +-
src/library/blas/gens/clTemplates/gemm.cl | 8 +-
src/library/blas/gens/clTemplates/her2.cl | 8 +-
src/library/blas/gens/clTemplates/symm.cl | 36 +-
src/library/blas/gens/clTemplates/syr2.cl | 6 +-
src/library/blas/gens/clTemplates/syr2_her2.cl | 8 +-
src/library/blas/gens/clTemplates/trmv.cl | 4 +-
src/library/blas/gens/copy_reg.cpp | 8 +-
src/library/blas/gens/dot.cpp | 8 +-
src/library/blas/gens/gbmv.cpp | 4 +-
src/library/blas/gens/gemv.c | 10 +-
src/library/blas/gens/ger_lds.cpp | 4 +-
src/library/blas/gens/her2_lds.cpp | 4 +-
src/library/blas/gens/her_lds.cpp | 2 +-
src/library/blas/gens/iamax.cpp | 8 +-
src/library/blas/gens/kprintf.cpp | 4 +-
src/library/blas/gens/nrm2.cpp | 6 +-
src/library/blas/gens/rotm_reg.cpp | 8 +-
src/library/blas/gens/scal_reg.cpp | 4 +-
src/library/blas/gens/swap_reg.cpp | 8 +-
src/library/blas/gens/symv.c | 10 +-
src/library/blas/gens/syr2_lds.cpp | 4 +-
src/library/blas/gens/syr_lds.cpp | 2 +-
src/library/blas/gens/trmm.c | 2 +-
src/library/blas/gens/trmv_reg.cpp | 4 +-
src/library/blas/gens/trsv_gemv.cpp | 4 +-
src/library/blas/gens/trsv_trtri.cpp | 2 +-
src/library/blas/include/clblas-internal.h | 2 +-
src/library/blas/include/kprintf.hpp | 2 +-
src/library/blas/ixamax.c | 2 +-
src/library/blas/trtri/TrtriKernelSourceIncludes.h | 6 +-
.../blas/trtri/diag_dtrtri_lower_128_16.cpp | 3 +-
.../blas/trtri/diag_dtrtri_upper_128_16.cpp | 17 +-
.../blas/trtri/diag_dtrtri_upper_192_12.cpp | 11 +-
.../trtri/triple_dgemm_update_128_16_PART1_L.cpp | 9 +-
.../trtri/triple_dgemm_update_128_16_PART2_L.cpp | 1 -
.../blas/trtri/triple_dgemm_update_128_16_R.cpp | 11 +-
.../trtri/triple_dgemm_update_128_32_PART1_L.cpp | 7 +-
.../trtri/triple_dgemm_update_128_32_PART1_R.cpp | 7 +-
.../trtri/triple_dgemm_update_128_32_PART2_L.cpp | 1 -
.../trtri/triple_dgemm_update_128_32_PART2_R.cpp | 1 -
.../trtri/triple_dgemm_update_128_64_PART1_L.cpp | 7 +-
.../trtri/triple_dgemm_update_128_64_PART1_R.cpp | 5 +-
.../trtri/triple_dgemm_update_128_64_PART2_L.cpp | 1 -
.../trtri/triple_dgemm_update_128_64_PART2_R.cpp | 1 -
.../triple_dgemm_update_128_ABOVE64_PART1_L.cpp | 7 +-
.../triple_dgemm_update_128_ABOVE64_PART1_R.cpp | 5 +-
.../triple_dgemm_update_128_ABOVE64_PART2_L.cpp | 1 -
.../triple_dgemm_update_128_ABOVE64_PART2_R.cpp | 1 -
.../triple_dgemm_update_128_ABOVE64_PART3_L.cpp | 1 -
.../triple_dgemm_update_128_ABOVE64_PART3_R.cpp | 1 -
.../blas/trtri/triple_dgemm_update_192_12_R.cpp | 5 +-
.../trtri/triple_dgemm_update_192_24_PART1_R.cpp | 1 -
.../trtri/triple_dgemm_update_192_24_PART2_R.cpp | 1 -
.../trtri/triple_dgemm_update_192_48_PART1_R.cpp | 3 +-
.../trtri/triple_dgemm_update_192_48_PART2_R.cpp | 1 -
.../trtri/triple_dgemm_update_192_96_PART1_R.cpp | 3 +-
.../trtri/triple_dgemm_update_192_96_PART2_R.cpp | 1 -
src/library/blas/xasum.c | 2 +-
src/library/blas/xaxpy.c | 4 +-
src/library/blas/xcopy.c | 4 +-
src/library/blas/xdot.c | 4 +-
src/library/blas/xgbmv.c | 4 +-
src/library/blas/xgemm.cc | 275 ++++--
src/library/blas/xgemv.c | 4 +-
src/library/blas/xger.c | 4 +-
src/library/blas/xhemv.c | 4 +-
src/library/blas/xher.c | 2 +-
src/library/blas/xher2.c | 8 +-
src/library/blas/xhpmv.c | 4 +-
src/library/blas/xnrm2.c | 2 +-
src/library/blas/xrot.c | 4 +-
src/library/blas/xrotm.c | 4 +-
src/library/blas/xscal.c | 2 +-
src/library/blas/xshbmv.c | 4 +-
src/library/blas/xspmv.c | 4 +-
src/library/blas/xswap.c | 4 +-
src/library/blas/xsymv.c | 4 +-
src/library/blas/xsyr.c | 2 +-
src/library/blas/xsyr2.c | 4 +-
src/library/blas/xtbmv.c | 4 +-
src/library/blas/xtbsv.c | 44 +-
src/library/blas/xtrmv.c | 4 +-
src/library/blas/xtrsm.cc | 7 +-
src/library/blas/xtrsv.c | 6 +-
src/library/common/kerngen_core.c | 2 +-
src/library/tools/ktest/config.cpp | 4 +-
src/library/tools/ktest/steps/gemv.cpp | 12 +-
src/library/tools/ktest/steps/symv.cpp | 12 +-
src/samples/CMakeLists.txt | 34 +-
src/samples/example_ctrsm.c | 177 ++++
src/samples/example_strsm.cpp | 188 ++++
src/tests/BlasBase.cpp | 94 +-
src/tests/CMakeLists.txt | 26 +-
src/tests/cmdline.c | 43 +-
src/tests/correctness/blas-lapack.c | 8 +-
src/tests/correctness/blas-lapack.h | 8 +-
src/tests/correctness/corr-asum.cpp | 17 +-
src/tests/correctness/corr-axpy.cpp | 19 +-
src/tests/correctness/corr-copy.cpp | 18 +-
src/tests/correctness/corr-dot.cpp | 17 +-
src/tests/correctness/corr-dotc.cpp | 17 +-
src/tests/correctness/corr-gbmv.cpp | 19 +-
src/tests/correctness/corr-gemm.cpp | 19 +-
src/tests/correctness/corr-gemm2.cpp | 16 +-
src/tests/correctness/corr-gemv.cpp | 18 +-
src/tests/correctness/corr-ger.cpp | 21 +-
src/tests/correctness/corr-gerc.cpp | 21 +-
src/tests/correctness/corr-hbmv.cpp | 19 +-
src/tests/correctness/corr-hemm.cpp | 18 +-
src/tests/correctness/corr-hemv.cpp | 19 +-
src/tests/correctness/corr-her.cpp | 18 +-
src/tests/correctness/corr-her2.cpp | 18 +-
src/tests/correctness/corr-her2k.cpp | 15 +-
src/tests/correctness/corr-herk.cpp | 15 +-
src/tests/correctness/corr-hpmv.cpp | 10 -
src/tests/correctness/corr-hpr.cpp | 10 -
src/tests/correctness/corr-hpr2.cpp | 9 -
src/tests/correctness/corr-iamax.cpp | 16 +-
src/tests/correctness/corr-nrm2.cpp | 16 +-
src/tests/correctness/corr-rot.cpp | 18 +-
src/tests/correctness/corr-rotg.cpp | 34 +-
src/tests/correctness/corr-rotm.cpp | 17 +-
src/tests/correctness/corr-rotmg.cpp | 16 +-
src/tests/correctness/corr-sbmv.cpp | 19 +-
src/tests/correctness/corr-scal.cpp | 16 +-
src/tests/correctness/corr-spmv.cpp | 19 +-
src/tests/correctness/corr-spr.cpp | 12 -
src/tests/correctness/corr-spr2.cpp | 9 -
src/tests/correctness/corr-swap.cpp | 19 +-
src/tests/correctness/corr-symm.cpp | 17 +-
src/tests/correctness/corr-symv.cpp | 19 +-
src/tests/correctness/corr-syr.cpp | 21 +-
src/tests/correctness/corr-syr2.cpp | 18 +-
src/tests/correctness/corr-syr2k.cpp | 17 +-
src/tests/correctness/corr-syrk.cpp | 17 +-
src/tests/correctness/corr-tbmv.cpp | 18 +-
src/tests/correctness/corr-tbsv.cpp | 18 +-
src/tests/correctness/corr-tpmv.cpp | 11 -
src/tests/correctness/corr-tpsv.cpp | 9 -
src/tests/correctness/corr-trmm.cpp | 18 +-
src/tests/correctness/corr-trmv.cpp | 20 +-
src/tests/correctness/corr-trsm.cpp | 22 +-
src/tests/correctness/corr-trsv.cpp | 17 +-
src/tests/correctness/test-correctness.cpp | 102 +--
src/tests/functional/func-error.cpp | 4 +-
src/tests/functional/test-functional.cpp | 100 ++-
src/tests/include/BlasBase.h | 11 +-
src/tests/include/asum.h | 4 -
src/tests/include/axpy.h | 3 -
src/tests/include/cmdline.h | 6 +-
src/tests/include/copy.h | 3 -
src/tests/include/dot.h | 4 -
src/tests/include/dotc.h | 4 -
src/tests/include/gbmv.h | 5 -
src/tests/include/gemm-2.h | 6 -
src/tests/include/gemm.h | 5 -
src/tests/include/gemv.h | 5 -
src/tests/include/ger.h | 8 -
src/tests/include/gerc.h | 6 -
src/tests/include/hbmv.h | 5 -
src/tests/include/hemm.h | 5 -
src/tests/include/hemv.h | 5 -
src/tests/include/her.h | 6 -
src/tests/include/her2.h | 5 -
src/tests/include/her2k.h | 5 -
src/tests/include/herk.h | 5 -
src/tests/include/iamax.h | 3 -
src/tests/include/matrix.h | 118 +--
src/tests/include/nrm2.h | 4 -
src/tests/include/rot.h | 3 -
src/tests/include/rotg.h | 3 -
src/tests/include/rotm.h | 3 -
src/tests/include/rotmg.h | 3 -
src/tests/include/sbmv.h | 5 -
src/tests/include/scal.h | 4 -
src/tests/include/spmv.h | 5 -
src/tests/include/swap.h | 3 -
src/tests/include/symm.h | 5 -
src/tests/include/symv.h | 5 -
src/tests/include/syr.h | 5 -
src/tests/include/syr2.h | 5 -
src/tests/include/syr2k.h | 5 -
src/tests/include/syrk.h | 5 -
src/tests/include/tbmv.h | 5 -
src/tests/include/tbsv.h | 5 -
src/tests/include/trmm.h | 5 -
src/tests/include/trmv.h | 4 -
src/tests/include/trsm.h | 5 -
src/tests/include/trsv.h | 4 -
245 files changed, 3102 insertions(+), 2459 deletions(-)
--
Alioth's /usr/local/bin/git-commit-notice on /srv/git.debian.org/git/debian-science/packages/clblas.git
More information about the debian-science-commits mailing list