[beignet] 02/07: Merge tag 'upstream/1.2.0'

Rebecca Palmer rnpalmer-guest at moszumanska.debian.org
Tue Sep 6 21:32:55 UTC 2016


This is an automated email from the git hooks/post-receive script.

rnpalmer-guest pushed a commit to branch master
in repository beignet.

commit 8d9b115bb5bde8781dbaa745900a2dfde7949800
Merge: c9a3c2c 8435b1d
Author: Rebecca N. Palmer <rebecca_palmer at zoho.com>
Date:   Sun Sep 4 17:51:23 2016 +0100

    Merge tag 'upstream/1.2.0'
    
    Upstream version 1.2.0

 Android.common.mk                                  |   30 +
 Android.mk                                         |   14 +
 CMake/FindLLVM.cmake                               |    6 +-
 CMakeLists.txt                                     |   67 +-
 GetGenID.sh                                        |   18 +-
 backend/src/Android.mk                             |  288 +++
 backend/src/CMakeLists.txt                         |   11 +-
 backend/src/backend/context.cpp                    |  120 +-
 backend/src/backend/context.hpp                    |   25 +-
 backend/src/backend/gen/gen_mesa_disasm.c          |  219 +-
 backend/src/backend/gen75_context.cpp              |   42 +-
 backend/src/backend/gen75_encoder.cpp              |   66 -
 backend/src/backend/gen75_encoder.hpp              |    6 -
 backend/src/backend/gen7_encoder.cpp               |   62 +-
 backend/src/backend/gen7_encoder.hpp               |    8 +-
 backend/src/backend/gen7_instruction.hpp           |   31 +
 backend/src/backend/gen8_context.cpp               |  864 ++++++-
 backend/src/backend/gen8_context.hpp               |    8 +
 backend/src/backend/gen8_encoder.cpp               |  277 ++-
 backend/src/backend/gen8_encoder.hpp               |   16 +-
 backend/src/backend/gen8_instruction.hpp           |  102 +
 backend/src/backend/gen9_context.cpp               |    5 +
 backend/src/backend/gen9_context.hpp               |   15 +-
 backend/src/backend/gen_context.cpp                | 1939 +++++++++++++--
 backend/src/backend/gen_context.hpp                |   29 +-
 backend/src/backend/gen_defs.hpp                   |   70 +
 backend/src/backend/gen_encoder.cpp                |  289 ++-
 backend/src/backend/gen_encoder.hpp                |   37 +-
 backend/src/backend/gen_insn_compact.cpp           |  427 +++-
 .../src/backend/gen_insn_gen7_schedule_info.hxx    |   11 +
 backend/src/backend/gen_insn_scheduling.cpp        |  156 +-
 backend/src/backend/gen_insn_selection.cpp         | 2570 +++++++++++++++-----
 backend/src/backend/gen_insn_selection.hpp         |   63 +-
 backend/src/backend/gen_insn_selection.hxx         |   14 +-
 .../src/backend/gen_insn_selection_optimize.cpp    |  288 +++
 backend/src/backend/gen_insn_selection_output.cpp  |  172 ++
 backend/src/backend/gen_insn_selection_output.hpp  |   13 +
 backend/src/backend/gen_program.cpp                |  234 +-
 backend/src/backend/gen_program.hpp                |   10 +-
 backend/src/backend/gen_reg_allocation.cpp         |  609 +++--
 backend/src/backend/gen_reg_allocation.hpp         |    2 +
 backend/src/backend/gen_register.hpp               |  122 +-
 backend/src/backend/program.cpp                    |  242 +-
 backend/src/backend/program.h                      |   49 +-
 backend/src/backend/program.hpp                    |   51 +-
 backend/src/gbe_bin_generater.cpp                  |   10 +-
 backend/src/gbe_bin_interpreter.cpp                |    6 +-
 backend/src/ir/constant.cpp                        |   51 +-
 backend/src/ir/constant.hpp                        |    4 +-
 backend/src/ir/context.cpp                         |    8 +-
 backend/src/ir/context.hpp                         |   30 +-
 backend/src/ir/function.cpp                        |   41 +-
 backend/src/ir/function.hpp                        |   98 +-
 backend/src/ir/image.cpp                           |   23 +-
 backend/src/ir/image.hpp                           |    4 +-
 backend/src/ir/immediate.cpp                       |    1 +
 backend/src/ir/immediate.hpp                       |    2 +-
 backend/src/ir/instruction.cpp                     | 1090 +++++++--
 backend/src/ir/instruction.hpp                     |  225 +-
 backend/src/ir/instruction.hxx                     |   10 +
 backend/src/ir/liveness.cpp                        |  149 +-
 backend/src/ir/liveness.hpp                        |    9 +-
 backend/src/ir/lowering.cpp                        |   22 +-
 backend/src/ir/printf.cpp                          |  290 +--
 backend/src/ir/printf.hpp                          |  104 +-
 backend/src/ir/profile.cpp                         |   72 +-
 backend/src/ir/profile.hpp                         |   17 +-
 backend/src/ir/profiling.cpp                       |   74 +
 backend/src/ir/profiling.hpp                       |  132 +
 backend/src/ir/register.cpp                        |    8 +
 backend/src/ir/register.hpp                        |   79 +-
 backend/src/ir/sampler.cpp                         |   16 +-
 backend/src/ir/sampler.hpp                         |    4 +-
 backend/src/ir/structurizer.cpp                    |    9 +-
 backend/src/ir/type.cpp                            |    6 +-
 backend/src/ir/unit.cpp                            |    7 +-
 backend/src/ir/unit.hpp                            |   15 +
 backend/src/ir/value.cpp                           |  197 ++
 backend/src/ir/value.hpp                           |   16 +
 backend/src/libocl/Android.mk                      |   89 +
 backend/src/libocl/CMakeLists.txt                  |    2 +-
 backend/src/libocl/include/ocl.h                   |    2 +
 backend/src/libocl/include/ocl_float.h             |    1 +
 backend/src/libocl/include/ocl_geometric.h         |    4 +
 backend/src/libocl/include/ocl_misc.h              |   15 +
 backend/src/libocl/include/ocl_sync.h              |    7 +-
 backend/src/libocl/include/ocl_vload.h             |   14 +-
 backend/src/libocl/include/ocl_work_group.h        |  118 +
 backend/src/libocl/include/ocl_workitem.h          |    3 +
 backend/src/libocl/script/gen_vector.py            |    4 +-
 backend/src/libocl/script/ocl_math.def             |   28 +-
 backend/src/libocl/script/ocl_simd.def             |    9 +
 backend/src/libocl/src/ocl_barrier.ll              |    6 +
 backend/src/libocl/src/ocl_geometric.cl            |   12 +
 backend/src/libocl/src/ocl_memset.cl               |    2 +-
 backend/src/libocl/src/ocl_misc.cl                 |   24 +-
 backend/src/libocl/src/ocl_sync.cl                 |    7 +-
 backend/src/libocl/src/ocl_vload.cl                |   22 +-
 backend/src/libocl/src/ocl_work_group.cl           |  126 +
 backend/src/libocl/src/ocl_workitem.cl             |   30 +
 backend/src/libocl/tmpl/ocl_common.tmpl.cl         |    3 +-
 backend/src/libocl/tmpl/ocl_defines.tmpl.h         |    1 +
 backend/src/libocl/tmpl/ocl_integer.tmpl.cl        |    4 +-
 backend/src/libocl/tmpl/ocl_math.tmpl.cl           |  594 ++---
 backend/src/libocl/tmpl/ocl_math.tmpl.h            |   29 +-
 backend/src/libocl/tmpl/ocl_simd.tmpl.cl           |  243 ++
 backend/src/libocl/tmpl/ocl_simd.tmpl.h            |  143 ++
 backend/src/llvm/ExpandConstantExpr.cpp            |    4 +-
 backend/src/llvm/ExpandLargeIntegers.cpp           |    6 +-
 backend/src/llvm/ExpandUtils.cpp                   |    2 +-
 backend/src/llvm/PromoteIntegers.cpp               |    9 +-
 backend/src/llvm/StripAttributes.cpp               |    2 +-
 backend/src/llvm/llvm_bitcode_link.cpp             |   61 +-
 backend/src/llvm/llvm_gen_backend.cpp              | 1374 ++++++++---
 backend/src/llvm/llvm_gen_backend.hpp              |    8 +-
 backend/src/llvm/llvm_gen_ocl_function.hxx         |   72 +-
 backend/src/llvm/llvm_includes.hpp                 |    5 +
 backend/src/llvm/llvm_intrinsic_lowering.cpp       |    6 +-
 backend/src/llvm/llvm_loadstore_optimization.cpp   |  115 +-
 backend/src/llvm/llvm_passes.cpp                   |    7 +-
 backend/src/llvm/llvm_printf_parser.cpp            |  451 +---
 backend/src/llvm/llvm_profiling.cpp                |  214 ++
 backend/src/llvm/llvm_sampler_fix.cpp              |    2 +
 backend/src/llvm/llvm_scalarize.cpp                |  121 +-
 backend/src/llvm/llvm_to_gen.cpp                   |  100 +-
 backend/src/llvm/llvm_to_gen.hpp                   |    3 +-
 backend/src/llvm/llvm_unroll.cpp                   |   33 +-
 backend/src/ocl_common_defines.h                   |   33 +-
 backend/src/sys/alloc.hpp                          |    4 +-
 backend/src/sys/platform.hpp                       |    8 +-
 benchmark/CMakeLists.txt                           |    7 +-
 benchmark/benchmark_copy_buf.cpp                   |    4 +-
 benchmark/benchmark_copy_buffer.cpp                |   57 +
 benchmark/benchmark_copy_buffer_to_image.cpp       |    2 +-
 benchmark/benchmark_copy_image.cpp                 |   72 +
 benchmark/benchmark_copy_image_to_buffer.cpp       |    2 +-
 benchmark/benchmark_math.cpp                       |  126 +
 benchmark/benchmark_read_buffer.cpp                |    3 +-
 benchmark/benchmark_read_image.cpp                 |    3 +-
 benchmark/benchmark_run.cpp                        |    1 +
 benchmark/benchmark_use_host_ptr_buffer.cpp        |    3 +-
 benchmark/benchmark_workgroup.cpp                  |  370 +++
 docs/Beignet.mdwn                                  |  103 +-
 docs/NEWS.mdwn                                     |    3 +
 docs/howto/stand-alone-utest-howto.mdwn            |   45 +
 docs/howto/video-motion-estimation-howto.mdwn      |   71 +
 include/CL/cl_ext.h                                |  103 +
 include/CL/cl_intel.h                              |   64 +
 kernels/bench_copy_buffer.cl                       |   90 +
 kernels/bench_copy_image.cl                        |   52 +
 kernels/bench_math.cl                              |  272 +++
 kernels/bench_workgroup.cl                         |  239 ++
 kernels/builtin_global_linear_id.cl                |    4 +
 kernels/builtin_local_linear_id.cl                 |    6 +
 kernels/builtin_max_sub_group_size.cl              |    7 +
 kernels/builtin_num_sub_groups.cl                  |    7 +
 kernels/builtin_sub_group_id.cl                    |    7 +
 kernels/builtin_sub_group_size.cl                  |    7 +
 kernels/cmrt_utest_genx.isa                        |  Bin 0 -> 847 bytes
 kernels/compiler_bsort.cl                          |   47 +
 kernels/compiler_bswap.cl                          |   14 +-
 kernels/compiler_double_2.cl                       |    9 -
 kernels/compiler_double_4.cl                       |    5 -
 kernels/compiler_double_convert.cl                 |  102 +
 kernels/compiler_double_div.cl                     |   13 +
 kernels/compiler_get_max_sub_group_size.cl         |    5 +
 kernels/compiler_get_sub_group_id.cl               |    8 -
 kernels/compiler_get_sub_group_local_id.cl         |    8 +
 kernels/compiler_get_sub_group_size.cl             |    5 -
 kernels/compiler_half_convert.cl                   |   11 +-
 kernels/compiler_math_3op.cl                       |   20 +-
 kernels/compiler_mix.cl                            |    4 +
 kernels/compiler_sub_group_all.cl                  |   12 -
 kernels/compiler_sub_group_any.cl                  |   15 -
 kernels/compiler_sub_group_shuffle.cl              |    6 +-
 kernels/compiler_sub_group_shuffle_down.cl         |   19 +
 kernels/compiler_sub_group_shuffle_up.cl           |   19 +
 kernels/compiler_sub_group_shuffle_xor.cl          |   19 +
 kernels/compiler_subgroup_broadcast.cl             |   34 +
 kernels/compiler_subgroup_buffer_block_read.cl     |   31 +
 kernels/compiler_subgroup_buffer_block_write.cl    |   27 +
 kernels/compiler_subgroup_image_block_read.cl      |   31 +
 kernels/compiler_subgroup_image_block_write.cl     |   27 +
 kernels/compiler_subgroup_reduce.cl                |  136 ++
 kernels/compiler_subgroup_scan_exclusive.cl        |   98 +
 kernels/compiler_subgroup_scan_inclusive.cl        |   98 +
 kernels/compiler_vector_load_store.cl              |    8 +-
 kernels/compiler_workgroup_broadcast.cl            |  122 +
 kernels/compiler_workgroup_reduce.cl               |  137 ++
 kernels/compiler_workgroup_scan_exclusive.cl       |   98 +
 kernels/compiler_workgroup_scan_inclusive.cl       |   98 +
 kernels/image_1D_buffer.cl                         |    2 +-
 kernels/image_from_buffer.cl                       |   12 +
 kernels/runtime_use_host_ptr_image.cl              |   10 +
 kernels/test_fill_image_2d_array.cl                |    2 +-
 kernels/test_get_arg_info.cl                       |    2 +-
 kernels/test_printf.cl                             |   46 +
 src/Android.mk                                     |  124 +
 src/CMakeLists.txt                                 |   62 +-
 src/OCLConfig.h.in                                 |    1 -
 src/cl_accelerator_intel.c                         |   86 +
 src/cl_accelerator_intel.h                         |   29 +
 src/cl_api.c                                       |  241 +-
 src/cl_cmrt.cpp                                    |  311 +++
 src/cl_cmrt.h                                      |   45 +
 src/cl_command_queue.c                             |   63 +-
 src/cl_command_queue.h                             |    2 +
 src/cl_command_queue_gen7.c                        |  154 +-
 src/cl_context.c                                   |    1 +
 src/cl_context.h                                   |    3 +
 src/cl_device_data.h                               |   71 +-
 src/cl_device_id.c                                 |  405 ++-
 src/cl_device_id.h                                 |   19 +-
 src/cl_driver.h                                    |   55 +-
 src/cl_driver_defs.c                               |    9 +
 src/cl_enqueue.c                                   |   15 +-
 src/cl_event.c                                     |   30 +-
 src/cl_extensions.c                                |   52 +-
 src/cl_extensions.h                                |   17 +-
 src/cl_gbe_loader.cpp                              |   34 +-
 src/cl_gbe_loader.h                                |    5 +-
 src/cl_gen75_device.h                              |    5 +-
 src/cl_gen7_device.h                               |    7 +-
 src/{cl_gen75_device.h => cl_gen8_device.h}        |    8 +-
 src/{cl_gen75_device.h => cl_gen9_device.h}        |    7 +-
 src/cl_gt_device.h                                 |   12 +-
 src/cl_internals.h                                 |    1 +
 src/cl_kernel.c                                    |   80 +-
 src/cl_kernel.h                                    |    8 +-
 src/cl_mem.c                                       |  332 ++-
 src/cl_mem.h                                       |   18 +
 src/cl_mem_gl.c                                    |    2 +-
 src/cl_program.c                                   |  181 +-
 src/cl_program.h                                   |   17 +-
 src/cl_thread.c                                    |   91 +-
 src/cl_utils.h                                     |   43 +
 src/intel/intel_driver.c                           |   91 +-
 src/intel/intel_gpgpu.c                            |  408 +++-
 src/intel/intel_gpgpu.h                            |    7 +-
 src/intel/intel_structs.h                          |  120 +
 .../cl_internal_block_motion_estimate_intel.cl     |  369 +++
 src/performance.c                                  |    3 +
 src/x11/dricommon.c                                |    6 +-
 utests/Android.mk                                  |  248 ++
 utests/CMakeLists.txt                              |  121 +-
 utests/buildin_work_dim.cpp                        |   13 +-
 utests/builtin_acos_asin.cpp                       |   20 +-
 utests/builtin_exp.cpp                             |   22 +-
 utests/builtin_global_id.cpp                       |   16 +-
 ..._global_id.cpp => builtin_global_linear_id.cpp} |   36 +-
 utests/builtin_global_size.cpp                     |    9 +-
 .../builtin_kernel_block_motion_estimate_intel.cpp |  135 +
 utests/builtin_kernel_max_global_size.cpp          |    8 +-
 utests/builtin_lgamma.cpp                          |    2 +-
 utests/builtin_lgamma_r.cpp                        |    2 +-
 utests/builtin_local_id.cpp                        |   16 +-
 ...in_local_id.cpp => builtin_local_linear_id.cpp} |   32 +-
 utests/builtin_local_size.cpp                      |   10 +-
 utests/builtin_max_sub_group_size.cpp              |   62 +
 utests/builtin_num_groups.cpp                      |   10 +-
 utests/builtin_num_sub_groups.cpp                  |   62 +
 utests/builtin_pow.cpp                             |   19 +-
 utests/builtin_sub_group_id.cpp                    |   63 +
 utests/builtin_sub_group_size.cpp                  |   63 +
 utests/builtin_tgamma.cpp                          |    6 +-
 utests/compare_image_2d_and_1d_array.cpp           |    2 +
 utests/compiler_abs.cpp                            |   18 +-
 utests/compiler_abs_diff.cpp                       |   17 +-
 utests/compiler_array1.cpp                         |    2 +-
 utests/compiler_assignment_operation_in_if.cpp     |    2 +-
 utests/compiler_box_blur_float.cpp                 |    3 +
 utests/compiler_bsort.cpp                          |   45 +
 utests/compiler_bswap.cpp                          |   63 +-
 utests/compiler_cl_finish.cpp                      |    8 +-
 utests/compiler_clz.cpp                            |   16 +-
 utests/compiler_copy_image.cpp                     |    8 +-
 utests/compiler_copy_image1.cpp                    |   24 +-
 utests/compiler_copy_image_1d.cpp                  |    8 +-
 utests/compiler_double.cpp                         |    5 +-
 utests/compiler_double_2.cpp                       |   47 -
 utests/compiler_double_4.cpp                       |   40 -
 utests/compiler_double_convert.cpp                 |  621 +++++
 utests/compiler_double_div.cpp                     |   83 +
 utests/compiler_double_precision.cpp               |    3 +
 utests/compiler_fill_image.cpp                     |    4 +-
 utests/compiler_fill_image_1d_array.cpp            |    1 +
 utests/compiler_fill_image_2d_array.cpp            |   18 +-
 utests/compiler_fill_image_3d.cpp                  |    4 +-
 utests/compiler_function_qualifiers.cpp            |    1 +
 ...ize.cpp => compiler_get_max_sub_group_size.cpp} |   10 +-
 ..._id.cpp => compiler_get_sub_group_local_id.cpp} |    8 +-
 utests/compiler_half.cpp                           |  298 ++-
 utests/compiler_mad24.cpp                          |    2 +-
 utests/compiler_math.cpp                           |    8 +-
 utests/compiler_math_2op.cpp                       |    8 +-
 utests/compiler_math_3op.cpp                       |   76 +-
 utests/compiler_mix.cpp                            |   50 +
 utests/compiler_movforphi_undef.cpp                |    8 +-
 utests/compiler_mul24.cpp                          |    2 +-
 utests/compiler_popcount.cpp                       |    2 +-
 utests/compiler_sub_group_all.cpp                  |   43 -
 utests/compiler_sub_group_any.cpp                  |   43 -
 utests/compiler_sub_group_shuffle.cpp              |    2 +
 ...fle.cpp => compiler_sub_group_shuffle_down.cpp} |   19 +-
 ...uffle.cpp => compiler_sub_group_shuffle_up.cpp} |   19 +-
 ...ffle.cpp => compiler_sub_group_shuffle_xor.cpp} |   15 +-
 utests/compiler_subgroup_broadcast.cpp             |  187 ++
 utests/compiler_subgroup_buffer_block_read.cpp     |  202 ++
 utests/compiler_subgroup_buffer_block_write.cpp    |  202 ++
 utests/compiler_subgroup_image_block_read.cpp      |  197 ++
 utests/compiler_subgroup_image_block_write.cpp     |  201 ++
 utests/compiler_subgroup_reduce.cpp                |  425 ++++
 utests/compiler_subgroup_scan_exclusive.cpp        |  381 +++
 utests/compiler_subgroup_scan_inclusive.cpp        |  372 +++
 utests/compiler_time_stamp.cpp                     |    5 +
 utests/compiler_unstructured_branch3.cpp           |    4 +
 utests/compiler_vector_load_store.cpp              |   32 +-
 utests/compiler_workgroup_broadcast.cpp            |  320 +++
 utests/compiler_workgroup_reduce.cpp               |  417 ++++
 utests/compiler_workgroup_scan_exclusive.cpp       |  373 +++
 utests/compiler_workgroup_scan_inclusive.cpp       |  364 +++
 utests/enqueue_copy_buf_unaligned.cpp              |    2 +-
 utests/get_cl_info.cpp                             |  247 +-
 utests/image_1D_buffer.cpp                         |    3 +-
 utests/image_from_buffer.cpp                       |  109 +
 utests/load_program_from_bin_file.cpp              |    4 +
 utests/load_program_from_gen_bin.cpp               |    8 +
 utests/load_program_from_spir.cpp                  |    6 +
 utests/profiling_exec.cpp                          |    8 +-
 utests/runtime_alloc_host_ptr_buffer.cpp           |    6 +-
 utests/runtime_barrier_list.cpp                    |    1 -
 utests/runtime_climage_from_boname.cpp             |   14 +-
 utests/runtime_cmrt.cpp                            |  274 +++
 utests/runtime_compile_link.cpp                    |   25 +-
 utests/runtime_event.cpp                           |    1 -
 utests/runtime_flat_address_space.cpp              |    8 +-
 utests/runtime_marker_list.cpp                     |    1 -
 utests/runtime_use_host_ptr_image.cpp              |   76 +
 utests/sub_buffer.cpp                              |    2 +-
 utests/test_printf.cpp                             |   54 +
 utests/utest.cpp                                   |   92 +-
 utests/utest.hpp                                   |   22 +-
 utests/utest_generator.py                          |   57 +-
 utests/utest_helper.cpp                            |  388 ++-
 utests/utest_helper.hpp                            |   97 +-
 utests/utest_math_gen.py                           |   30 +-
 utests/utest_run.cpp                               |   36 +-
 utests/vload_bench.cpp                             |    2 +-
 348 files changed, 26538 insertions(+), 4796 deletions(-)

-- 
Alioth's /usr/local/bin/git-commit-notice on /srv/git.debian.org/git/pkg-opencl/beignet.git



More information about the Pkg-opencl-commits mailing list