This is an automated email from the ASF dual-hosted git repository.
github-bot pushed a change to branch last-successful
in repository https://gitbox.apache.org/repos/asf/tvm.git.
from 1970223 Fixed additional deprecation warning in file (#10318)
add 174d09e [TE][TIR] Implement layout transformations, non-flat memory buffers (#9727)
No new revisions were added by this update.
Summary of changes:
include/tvm/ir/attrs.h | 41 +
include/tvm/te/operation.h | 1 +
include/tvm/te/schedule.h | 123 +-
include/tvm/tir/buffer.h | 44 +-
include/tvm/tir/builtin.h | 11 +-
include/tvm/tir/expr.h | 16 +
include/tvm/tir/function.h | 44 +-
include/tvm/tir/index_map.h | 140 +
include/tvm/tir/stmt.h | 17 +
include/tvm/topi/transform.h | 8 +-
.../contrib/ethosu/tir/binary_elementwise.py | 6 +-
.../backend/contrib/ethosu/tir/convolution.py | 12 +-
.../relay/backend/contrib/ethosu/tir/depthwise.py | 12 +-
python/tvm/relay/backend/contrib/ethosu/tir/dma.py | 58 +-
.../relay/backend/contrib/ethosu/tir/identity.py | 18 +-
.../tvm/relay/backend/contrib/ethosu/tir/passes.py | 425 +-
.../relay/backend/contrib/ethosu/tir/pooling.py | 4 +-
.../tvm/relay/backend/contrib/ethosu/tir/spec.py | 15 +-
.../relay/backend/contrib/ethosu/tir/transform.py | 11 +-
.../contrib/ethosu/tir/unary_elementwise.py | 6 +-
.../tvm/relay/backend/contrib/ethosu/tir/utils.py | 28 +-
.../backend/contrib/ethosu/tir_to_cs_translator.py | 31 +-
python/tvm/relay/op/_transform.py | 6 +-
python/tvm/relay/op/dyn/_transform.py | 2 +-
python/tvm/relay/op/dyn/nn/_nn.py | 10 +-
python/tvm/script/context_maintainer.py | 3 +
python/tvm/script/parser.py | 65 +-
python/tvm/script/tir/__init__.pyi | 2 +-
python/tvm/script/tir/node.py | 6 +-
python/tvm/script/tir/scope_handler.py | 49 +-
python/tvm/script/tir/special_stmt.py | 54 +
python/tvm/te/__init__.py | 8 +-
python/tvm/te/schedule.py | 152 +-
python/tvm/tir/buffer.py | 38 +
python/tvm/tir/function.py | 37 +-
python/tvm/tir/ir_builder.py | 112 +-
python/tvm/tir/transform/transform.py | 15 +-
python/tvm/topi/cuda/sparse.py | 12 +-
python/tvm/topi/utils.py | 14 +-
src/arith/rewrite_simplify.cc | 6 +-
src/autotvm/feature_visitor.cc | 10 +-
src/autotvm/feature_visitor.h | 4 +-
src/contrib/hybrid/codegen_hybrid.cc | 8 +
src/contrib/hybrid/codegen_hybrid.h | 2 +
src/printer/tir_text_printer.cc | 3 +
src/printer/tvmscript_printer.cc | 127 +-
src/relay/backend/aot_executor_codegen.cc | 14 +-
src/relay/backend/contrib/cmsisnn/relay_to_tir.cc | 2 +-
.../contrib/example_target_hooks/relay_to_tir.cc | 8 +-
src/relay/op/tensor/transform.cc | 6 +-
src/relay/transforms/fold_constant.cc | 1 +
src/target/llvm/codegen_cpu.cc | 6 +-
src/target/llvm/codegen_hexagon.cc | 6 +-
src/target/llvm/codegen_llvm.cc | 182 +-
src/target/llvm/codegen_llvm.h | 7 +-
src/target/source/codegen_c.cc | 199 +-
src/target/source/codegen_c.h | 11 +-
src/target/source/codegen_c_host.cc | 4 +
src/target/source/codegen_cuda.cc | 10 +-
src/target/source/codegen_cuda.h | 3 +-
src/target/source/codegen_metal.cc | 5 +
src/target/source/codegen_opencl.cc | 32 +-
src/target/source/codegen_opencl.h | 7 +-
src/target/source/codegen_source_base.cc | 4 +
src/target/spirv/codegen_spirv.cc | 40 +-
src/target/spirv/codegen_spirv.h | 4 +-
src/target/stackvm/codegen_stackvm.cc | 46 +-
src/target/stackvm/codegen_stackvm.h | 2 +
src/te/operation/cross_thread_reduction.cc | 46 +-
src/te/schedule/message_passing.cc | 130 +
src/te/schedule/schedule_lang.cc | 96 +
src/te/schedule/schedule_ops.cc | 52 +-
src/te/schedule/schedule_postproc_to_primfunc.cc | 276 +-
src/tir/analysis/block_access_region_detector.cc | 10 +-
src/tir/analysis/buffer_access_lca_detector.cc | 21 +-
src/tir/analysis/device_constraint_utils.cc | 27 +-
src/tir/analysis/var_touch.cc | 14 +-
src/tir/analysis/verify_gpu_code.cc | 12 +-
src/tir/analysis/verify_memory.cc | 14 +-
src/tir/ir/buffer.cc | 241 +-
src/tir/ir/expr.cc | 20 +-
src/tir/ir/expr_functor.cc | 12 +-
src/tir/ir/function.cc | 10 +-
src/tir/ir/index_map.cc | 154 +
src/tir/ir/stmt.cc | 17 +-
src/tir/ir/stmt_functor.cc | 82 +-
src/tir/schedule/primitive/cache_read_write.cc | 30 +-
src/tir/schedule/primitive/compute_inline.cc | 42 +-
src/tir/transforms/arg_binder.cc | 77 +-
src/tir/transforms/bf16_legalize.cc | 108 +-
src/tir/transforms/bind_params.cc | 9 +-
src/tir/transforms/bound_checker.cc | 166 +-
src/tir/transforms/compact_buffer_region.cc | 9 +-
src/tir/transforms/coproc_sync.cc | 19 +-
src/tir/transforms/flatten_buffer.cc | 105 +-
src/tir/transforms/inject_copy_intrin.cc | 42 +-
src/tir/transforms/inject_double_buffer.cc | 93 +-
src/tir/transforms/inject_virtual_thread.cc | 160 +-
src/tir/transforms/ir_utils.cc | 128 +-
src/tir/transforms/ir_utils.h | 16 +-
src/tir/transforms/lower_cross_thread_reduction.cc | 2 +-
src/tir/transforms/lower_custom_datatypes.cc | 78 +-
src/tir/transforms/lower_match_buffer.cc | 19 +-
src/tir/transforms/lower_thread_allreduce.cc | 262 +-
src/tir/transforms/lower_tvm_builtin.cc | 183 +-
src/tir/transforms/lower_warp_memory.cc | 107 +-
src/tir/transforms/make_packed_api.cc | 79 +-
.../merge_dynamic_shared_memory_allocations.cc | 87 +-
src/tir/transforms/narrow_datatype.cc | 56 +-
src/tir/transforms/rewrite_unsafe_select.cc | 15 +-
src/tir/transforms/simplify.cc | 34 +-
src/tir/transforms/split_host_device.cc | 26 +-
src/tir/transforms/storage_access.cc | 49 +-
src/tir/transforms/storage_access.h | 9 +-
src/tir/transforms/storage_flatten.cc | 539 ++-
src/tir/transforms/storage_rewrite.cc | 352 +-
src/tir/transforms/thread_storage_sync.cc | 71 +-
src/tir/transforms/unroll_loop.cc | 5 +
src/tir/transforms/update_pointer_storage_scope.cc | 56 +-
src/tir/transforms/update_pointer_storage_scope.h | 8 +
src/tir/transforms/vectorize_loop.cc | 191 +-
src/tir/usmp/analysis/extract_buffer_info.cc | 12 +-
src/tir/usmp/transform/assign_pool_info.cc | 4 +-
.../convert_pool_allocations_to_offsets.cc | 109 +-
tests/cpp/tir_analysis_side_effect.cc | 5 +-
tests/python/contrib/test_ethosu/infra.py | 12 +-
.../contrib/test_ethosu/test_encode_constants.py | 136 +-
.../test_ethosu/test_remove_concatenates.py | 29 +-
.../contrib/test_ethosu/test_replace_conv2d.py | 188 +-
.../contrib/test_ethosu/test_replace_copy.py | 44 +-
.../test_ethosu/test_replace_unary_elementwise.py | 4 +-
tests/python/contrib/test_ethosu/test_scheduler.py | 32 +-
.../test_ethosu/test_tir_to_cs_translator.py | 234 +-
tests/python/contrib/test_ethosu/test_vela_api.py | 26 +-
tests/python/relay/aot/test_crt_aot.py | 19 +-
tests/python/unittest/test_lower_build.py | 36 +-
.../test_meta_schedule_postproc_verify_gpu_code.py | 88 +-
.../test_runtime_module_based_interface.py | 2 +-
tests/python/unittest/test_runtime_module_load.py | 2 +-
tests/python/unittest/test_target_codegen_cuda.py | 48 +-
tests/python/unittest/test_target_codegen_llvm.py | 11 +-
.../python/unittest/test_target_codegen_vulkan.py | 5 +-
.../test_tir_analysis_calculate_workspace.py | 60 +-
.../test_tir_analysis_detect_buffer_access_lca.py | 6 +-
tests/python/unittest/test_tir_buffer.py | 30 +-
tests/python/unittest/test_tir_constructor.py | 25 +-
tests/python/unittest/test_tir_intrin.py | 5 +-
tests/python/unittest/test_tir_ir_builder.py | 4 +-
.../python/unittest/test_tir_lower_match_buffer.py | 4 +-
tests/python/unittest/test_tir_nodes.py | 17 +-
tests/python/unittest/test_tir_ptx_mma.py | 150 +-
.../unittest/test_tir_schedule_cache_read_write.py | 6 +-
.../unittest/test_tir_schedule_compute_inline.py | 20 +-
tests/python/unittest/test_tir_schedule_reorder.py | 4 +-
.../unittest/test_tir_schedule_split_fuse.py | 6 +-
.../test_tir_transform_combine_context_call.py | 6 +-
.../test_tir_transform_common_subexpr_elim.py | 30 +-
.../test_tir_transform_compact_buffer_region.py | 19 +-
.../test_tir_transform_convert_for_loops_serial.py | 20 +-
.../test_tir_transform_extract_constants.py | 6 +-
.../unittest/test_tir_transform_flatten_buffer.py | 56 +-
.../test_tir_transform_inject_double_buffer.py | 4 +-
.../test_tir_transform_inject_rolling_buffer.py | 62 +-
.../test_tir_transform_inject_virtual_thread.py | 41 +-
...test_tir_transform_instrument_bound_checkers.py | 6 +-
.../python/unittest/test_tir_transform_ir_utils.py | 9 +-
.../unittest/test_tir_transform_loop_partition.py | 80 +-
...t_tir_transform_lower_cross_thread_reduction.py | 24 +-
.../test_tir_transform_lower_tvm_builtin.py | 4 +-
.../unittest/test_tir_transform_narrow_datatype.py | 14 +-
.../unittest/test_tir_transform_remove_no_op.py | 2 +-
...test_tir_transform_renormalize_split_pattern.py | 49 +-
.../python/unittest/test_tir_transform_simplify.py | 4 +-
.../unittest/test_tir_transform_storage_flatten.py | 47 +-
.../unittest/test_tir_transform_unroll_loop.py | 27 +-
.../unittest/test_tir_transform_vectorize.py | 9 +-
tests/python/unittest/test_tir_usmp_algo.py | 124 +-
.../test_tir_usmp_analysis_extract_bufferinfo.py | 540 +--
...ransform_convert_pool_allocations_to_offsets.py | 381 +-
tests/python/unittest/test_tir_usmp_utils.py | 40 +-
tests/python/unittest/test_transform_layout.py | 498 ++
tests/python/unittest/test_tvmscript_complete.py | 6 -
.../python/unittest/test_tvmscript_error_report.py | 5 +-
tests/python/unittest/test_tvmscript_roundtrip.py | 4939 ++++++++++----------
vta/python/vta/transform.py | 97 +-
185 files changed, 9634 insertions(+), 5779 deletions(-)
create mode 100644 include/tvm/tir/index_map.h
create mode 100644 src/tir/ir/index_map.cc
create mode 100755 tests/python/unittest/test_transform_layout.py