[clblas] 61/61: Merge pull request #119 from TimmyLiu/master

Ghislain Vaillant ghisvail-guest at moszumanska.debian.org
Fri Jul 24 22:49:50 UTC 2015


This is an automated email from the git hooks/post-receive script.

ghisvail-guest pushed a commit to branch master
in repository clblas.

commit 9731ea2a270509211a47bf6cf9df4de2069ccc52
Merge: a6b3f9d 3f032e7
Author: David Tanner <david.tanner at amd.com>
Date:   Wed Jul 1 15:00:31 2015 -0500

    Merge pull request #119 from TimmyLiu/master
    
    Merge develop branch into master branch. Bump the version number to 2.6.

 .gitignore                                         |    3 +
 .travis.yml                                        |   22 +-
 LICENSE                                            |   25 -
 README.md                                          |   65 +-
 doc/README-BinaryCacheOnDisk.txt                   |   69 +
 doc/README-FunctorConcepts.txt                     |  100 +
 doc/README-HowToIntroduceFunctors.txt              |  402 ++
 doc/README-TransformASolverIntoAFunctor.txt        |  382 ++
 doc/performance/clBLAS_2.6.0/S9150/README.txt      |   35 +
 doc/performance/clBLAS_2.6.0/S9150/dgemm_32.csv    |  181 +
 doc/performance/clBLAS_2.6.0/S9150/dgemm_96.csv    |   61 +
 doc/performance/clBLAS_2.6.0/S9150/dtrsm_192.csv   |   31 +
 .../clBLAS_2.6.0/S9150/generate_graphs.sh          |   92 +
 doc/performance/clBLAS_2.6.0/S9150/peak_dp.csv     |  181 +
 doc/performance/clBLAS_2.6.0/S9150/peak_sp.csv     |  181 +
 doc/performance/clBLAS_2.6.0/S9150/sgemm_32.csv    |  181 +
 doc/performance/clBLAS_2.6.0/S9150/zgemm_32.csv    |  181 +
 doc/performance/clBLAS_2.6.0/S9150/zgemm_64.csv    |   91 +
 doc/performance/cuBLAS_7.0/Tesla_K40/README.txt    |   35 +
 doc/performance/cuBLAS_7.0/Tesla_K40/dgemm.csv     |  181 +
 doc/performance/cuBLAS_7.0/Tesla_K40/dtrsm.csv     |   31 +
 doc/performance/cuBLAS_7.0/Tesla_K40/peak_dp.csv   |  181 +
 doc/performance/cuBLAS_7.0/Tesla_K40/peak_sp.csv   |  181 +
 doc/performance/cuBLAS_7.0/Tesla_K40/sgemm.csv     |  181 +
 doc/performance/cuBLAS_7.0/Tesla_K40/zgemm.csv     |  181 +
 src/CMakeLists.txt                                 |   83 +-
 src/FindOpenCL.cmake                               |    3 +-
 src/clBLAS.def                                     |   28 +
 src/clBLAS.h                                       |  622 ++
 src/client/clfunc_common.hpp                       |    1 +
 src/client/clfunc_xgemm.hpp                        |   53 +-
 src/client/clfunc_xtrsm.hpp                        |   14 +-
 src/client/client.cpp                              |   21 +-
 src/flags_public.txt                               |    4 +
 src/include/binary_lookup.h                        |  273 +
 src/include/devinfo.h                              |    2 +
 src/include/md5sum.h                               |   50 +
 src/include/rwlock.h                               |  117 +
 src/library/CMakeLists.txt                         |  282 +-
 src/library/bingen.cmake                           |  144 +
 src/library/blas/fill.cc                           |  272 +
 src/library/blas/functor/bonaire.cc                |   90 +
 src/library/blas/functor/functor.cc                |  117 +
 src/library/blas/functor/functor_fill.cc           |  156 +
 src/library/blas/functor/functor_selector.cc       |  344 ++
 src/library/blas/functor/functor_xgemm.cc          |  323 +
 src/library/blas/functor/functor_xscal.cc          |  410 ++
 src/library/blas/functor/functor_xscal_generic.cc  |  439 ++
 src/library/blas/functor/functor_xtrsm.cc          |  336 ++
 src/library/blas/functor/gcn_dgemm.cc              | 1035 ++++
 src/library/blas/functor/gcn_dgemmCommon.cc        |  997 +++
 src/library/blas/functor/gcn_dgemmSmallMatrices.cc |  654 ++
 src/library/blas/functor/gcn_sgemm.cc              |  556 ++
 src/library/blas/functor/gcn_sgemmSmallMatrices.cc |  558 ++
 src/library/blas/functor/gcn_zgemm.cc              |  354 ++
 src/library/blas/functor/gpu_dtrsm.cc              |  823 +++
 src/library/blas/functor/gpu_dtrsm192.cc           |  596 ++
 src/library/blas/functor/hawaii.cc                 |  223 +
 .../blas/functor/hawaii_dgemmChannelConflict.cc    |  159 +
 .../blas/functor/hawaii_dgemmSplitKernel.cc        |  670 ++
 .../blas/functor/hawaii_sgemmBranchKernel.cc       |  442 ++
 src/library/blas/functor/hawaii_sgemmSplit64_32.cc |  423 ++
 .../blas/functor/hawaii_sgemmSplitKernel.cc        |  858 +++
 src/library/blas/functor/include/BinaryBuild.h     |   10 +
 src/library/blas/functor/include/atomic_counter.h  |  173 +
 src/library/blas/functor/include/bonaire.h         |   41 +
 src/library/blas/functor/include/functor.h         |  496 ++
 src/library/blas/functor/include/functor_fill.h    |   99 +
 .../functor/include/functor_hawaii_dgemm_NT_MN48.h |  210 +
 .../blas/functor/include/functor_selector.h        |  149 +
 src/library/blas/functor/include/functor_utils.h   |  116 +
 src/library/blas/functor/include/functor_xgemm.h   |  213 +
 src/library/blas/functor/include/functor_xscal.h   |  207 +
 .../blas/functor/include/functor_xscal_generic.h   |  173 +
 src/library/blas/functor/include/functor_xtrsm.h   |  203 +
 src/library/blas/functor/include/gcn_dgemm.h       |   59 +
 src/library/blas/functor/include/gcn_dgemmCommon.h |   22 +
 .../blas/functor/include/gcn_dgemmSmallMatrices.h  |   27 +
 src/library/blas/functor/include/gcn_sgemm.h       |   62 +
 .../blas/functor/include/gcn_sgemmSmallMatrices.h  |   27 +
 src/library/blas/functor/include/gcn_zgemm.h       |   62 +
 src/library/blas/functor/include/gpu_dtrsm.h       |   28 +
 src/library/blas/functor/include/gpu_dtrsm192.h    |   28 +
 src/library/blas/functor/include/hawaii.h          |   42 +
 .../functor/include/hawaii_dgemmChannelConflict.h  |   22 +
 .../blas/functor/include/hawaii_dgemmSplitKernel.h |   46 +
 .../functor/include/hawaii_sgemmBranchKernel.h     |   50 +
 .../blas/functor/include/hawaii_sgemmSplit64_32.h  |   46 +
 .../blas/functor/include/hawaii_sgemmSplitKernel.h |   46 +
 src/library/blas/functor/include/tahiti.h          |   41 +
 src/library/blas/functor/tahiti.cc                 |  120 +
 src/library/blas/generic/binary_lookup.cc          |  685 +++
 src/library/blas/generic/common.c                  |   25 +-
 src/library/blas/generic/common2.cc                |   98 +
 src/library/blas/generic/functor_cache.cc          |   80 +
 src/library/blas/generic/solution_seq_make.c       |    4 +-
 src/library/blas/gens/blas_kgen.h                  |    3 -
 src/library/blas/gens/blas_subgroup.c              |    6 +-
 src/library/blas/gens/clTemplates/dgemm_NT_MN48.cl |  347 ++
 .../gens/clTemplates/dgemm_gcn_SmallMatrices.cl    | 1159 ++++
 src/library/blas/gens/clTemplates/dgemm_hawai.cl   | 6371 ++++++++++++++++++++
 .../clTemplates/dgemm_hawaiiChannelConfilct.cl     |  152 +
 .../gens/clTemplates/dgemm_hawaiiSplitKernel.cl    | 5043 ++++++++++++++++
 src/library/blas/gens/clTemplates/dtrsm_gpu.cl     | 2004 ++++++
 src/library/blas/gens/clTemplates/dtrsm_gpu192.cl  | 1031 ++++
 src/library/blas/gens/clTemplates/sgemm_gcn.cl     | 2083 +++++++
 .../gens/clTemplates/sgemm_gcn_SmallMatrices.cl    | 1036 ++++
 .../gens/clTemplates/sgemm_hawaiiSplit64_32.cl     |  530 ++
 .../gens/clTemplates/sgemm_hawaiiSplitKernel.cl    | 6179 +++++++++++++++++++
 src/library/blas/gens/clTemplates/zgemm_gcn.cl     |  319 +
 src/library/blas/include/clblas-internal.h         |   28 +
 src/library/blas/init.c                            |   12 +
 src/library/blas/matrix.c                          |  979 +++
 src/library/blas/xgemm.c                           |  783 ---
 src/library/blas/xgemm.cc                          |  328 +
 src/library/blas/xscal.cc                          |  340 ++
 src/library/blas/xtrsm.c                           |  249 -
 src/library/blas/xtrsm.cc                          |  333 +
 src/library/common/devinfo.c                       |    6 +
 src/library/common/md5sum.c                        |  378 ++
 src/library/common/rwlock.c                        |  172 +
 .../perf => library/tools/bingen}/CMakeLists.txt   |   23 +-
 src/library/tools/bingen/bingen.cpp                |  512 ++
 src/library/tools/ktest/CMakeLists.txt             |   34 +-
 src/library/tools/tplgen/tplgen.cpp                |   85 +-
 src/library/tools/tune/CMakeLists.txt              |   33 +-
 src/library/tools/tune/tune.c                      |    5 +-
 src/samples/CMakeLists.txt                         |   21 +-
 src/samples/example_csscal.c                       |    3 +-
 src/scripts/perf/CMakeLists.txt                    |    6 +-
 src/scripts/perf/blasPerformanceTesting.py         |    4 +-
 src/tests/CMakeLists.txt                           |   28 +-
 src/tests/correctness/test-correctness.cpp         |    3 +-
 src/tests/performance/test-performance.cpp         |    5 +-
 134 files changed, 48858 insertions(+), 1271 deletions(-)

-- 
Alioth's /usr/local/bin/git-commit-notice on /srv/git.debian.org/git/debian-science/packages/clblas.git



More information about the debian-science-commits mailing list