This is an automated email from the ASF dual-hosted git repository.
github-bot pushed a change to branch nightly
in repository https://gitbox.apache.org/repos/asf/tvm.git
from 8cadd1fbc5 [ARITH] Enhance Canonical Simplify for LE (#15471)
add 34cacb0a64 [VM][Textures] Enable OpenCL textures for VM (#15419)
add 9ff71f4a9f [CodeGenC] Handle GlobalVar callee as internal function call (#15103)
No new revisions were added by this update.
Summary of changes:
include/tvm/runtime/ndarray.h | 8 +-
include/tvm/runtime/vm/bytecode.h | 19 +-
include/tvm/runtime/vm/executable.h | 5 +-
.../arm_cpu/mprofile/dsp/micro_kernel/avg_pool.py | 8 +-
.../topi/arm_cpu/mprofile/dsp/micro_kernel/gemm.py | 87 ++++-
.../arm_cpu/mprofile/dsp/micro_kernel/max_pool.py | 13 +-
.../arm_cpu/mprofile/dsp/micro_kernel/tensordot.py | 7 +-
.../backend/contrib/cmsisnn/tir_to_runtime.cc | 28 +-
.../contrib/example_target_hooks/tir_to_runtime.cc | 26 +-
src/relay/backend/contrib/uma/tir_to_runtime.cc | 34 +-
src/relay/backend/vm/compiler.cc | 41 ++-
src/relay/backend/vm/manifest_lifetimes.cc | 4 +-
src/relay/op/memory/memory.cc | 20 +-
src/relay/op/memory/memory.h | 5 +-
src/relay/transforms/annotate_texture_storage.cc | 9 +
src/relay/transforms/device_domains.cc | 7 +-
src/relay/transforms/memory_alloc.cc | 4 +-
src/runtime/c_runtime_api.cc | 2 +-
src/runtime/opencl/opencl_device_api.cc | 2 +-
src/runtime/vm/bytecode.cc | 56 +++-
src/runtime/vm/executable.cc | 34 +-
src/runtime/vm/profiler/vm.cc | 16 +-
src/runtime/vm/vm.cc | 47 ++-
src/target/opt/build_cuda_on.cc | 18 +-
src/target/source/codegen_aocl.cc | 19 +-
src/target/source/codegen_c.cc | 153 ++++++---
src/target/source/codegen_c.h | 59 +++-
src/target/source/codegen_c_host.cc | 93 +++---
src/target/source/codegen_c_host.h | 3 +-
src/target/source/codegen_cuda.cc | 4 +-
src/target/source/codegen_cuda.h | 2 +-
src/target/source/codegen_metal.cc | 77 +++--
src/target/source/codegen_metal.h | 3 +-
src/target/source/codegen_opencl.cc | 24 +-
src/target/source/codegen_vhls.cc | 34 +-
src/target/source/codegen_webgpu.cc | 79 ++---
src/target/source/codegen_webgpu.h | 4 +-
src/target/source/source_module.cc | 6 +-
src/tir/op/op.cc | 26 ++
.../relay/aot/test_crt_forward_declarations.py | 4 +-
.../opencl_texture/test_conv2d_nchw_texture.py | 361 ++++++++++++++++-----
.../opencl_texture/test_conv2d_nhwc_texture.py | 245 ++++++++++----
.../test_depthwise_conv2d_nchw_texture.py | 52 ++-
.../test_depthwise_conv2d_nhwc_texture.py | 50 ++-
.../relay/opencl_texture/test_injection_texture.py | 33 +-
tests/python/relay/opencl_texture/test_network.py | 24 +-
.../relay/opencl_texture/test_pool_texture.py | 63 +++-
.../relay/opencl_texture/test_reduction_texture.py | 87 +++--
.../relay/opencl_texture/utils/adreno_utils.py | 84 +++++
.../relay/test_pass_dead_code_elimination.py | 18 +-
tests/python/relay/test_pass_plan_devices.py | 11 +-
.../topi/python/test_topi_conv2d_tensordot_opts.py | 28 +-
.../python/unittest/test_target_codegen_c_host.py | 48 ++-
.../test_tir_transform_inject_ptx_async_copy.py | 1 +
54 files changed, 1587 insertions(+), 608 deletions(-)