This is an automated email from the ASF dual-hosted git repository.
junrushao pushed a change to branch ci-docker-staging
in repository https://gitbox.apache.org/repos/asf/tvm.git
discard 8495335179 update image for ci_lint
discard d839db1132 trigger more run
add 91428158f2 [microTVM]Add MLPerfTiny test harness (#14309)
add 10a12bacb8 [CI][EZ] Upgrade CI Lint Image (#14373)
add b56d7f56ab [TIR][Utility] More flexible tir::Substitute arguments
(#14251)
add 3b274aa6c7 [Hexagon] Allow scalar tensors to have null shape during
allocation (#14376)
add 3f56a95b87 [TVMScript] Use new variable frame in If/Then/Else (#14250)
add e5ae4347dd [CUDA][Schedule] Better Layout Transform Schedules (#14167)
add b987556375 [TIR] Remove LoadNode and StoreNode (#14381)
add 67597025e7 [TVMScript][Fix] Fix `bool` printing for roundtrip (#14390)
add ad6fbec066 [TIR] Improved error message in InjectSoftwarePipeline
(#14391)
add b09e72b54b [TIR] Legalize dtype of constants in IndexMap (#14385)
add 4a2a3b5669 [TIR] Improved MakePackedAPI error message (#14387)
add c5075dc30f [TIR] not estimating the flops when there is a default
estimated flops as attr (#14379)
add 0d0d2f0bd3 [CI][microTVM] Enable USE_MICRO for mac and windows CI
builds (#14393)
add 6c34361369 [Hexagon] Adapt some intrinsics for high vector lanes
(#14345)
add 6e70e79162 [microNPU] Upgrade Vela to v3.7.0 (#14374)
add 30bf013e78 [TIR][Schedule] Add unittest for read_write_at (#14395)
add da8335378a [TVMC][microNPU] tvmc option for printing which operators
are offloaded to Ethos-U (#13212)
add a0edf24c60 [TIR] Refactor BF16Legalize (#14405)
add 14ddb37d14 [MetaSchedule][Hexagon] Improve vectorization for
standalone elementwise op (#14408)
add b3a5e18f6f [TVMScript] Improved error message for unexpected top frame
(#14399)
add 0ded2132e6 [skip ci] Replace magic_wand model with micro_speech
(#14414)
add 0e28541149 [microTVM] Update poetry to fix security issues (#14429)
add 9f6ce7cbf9 [relay][frontend][pytorch]Fix a bug in the
_get_pytorch_value_type function (#14421)
add 5cca18bb07 [Frontend] Add ONNX importer for QLinearSoftmax (#14425)
add 4011280b16 [OpenCL][Textures] Always use SSA for texture loading
(#14397)
add a58645352a [CI] Add llvm-15 and enable mlir build for ci_cpu docker
setup.
This update added new revisions after undoing existing revisions.
That is to say, some revisions that were in the old version of the
branch are not in the new version. This situation occurs
when a user force-pushes a change (git push --force) and generates a
repository containing something like this:
 * -- * -- B -- O -- O -- O   (8495335179)
            \
             N -- N -- N   refs/heads/ci-docker-staging (a58645352a)
You should already have received notification emails for all of the O
revisions, and so the following emails describe only the N revisions
from the common base, B.
Any revisions marked "omit" are not gone; other references still
refer to them. Any revisions marked "discard" are gone forever.
No new revisions were added by this update.
Summary of changes:
3rdparty/cutlass | 2 +-
3rdparty/mlperftiny/api/submitter_implemented.h | 2 +-
apps/microtvm/cmsisnn/requirements.txt | 10 +-
apps/microtvm/ethosu/requirements.txt | 10 +-
apps/microtvm/poetry.lock | 3342 ++++++++++----------
apps/microtvm/pyproject.toml | 54 +-
conda/recipe/bld.bat | 1 +
conda/recipe/build.sh | 1 +
docker/Dockerfile.ci_cpu | 3 +
docker/install/ubuntu_install_llvm_from_source.sh | 1 +
docker/install/ubuntu_install_vela.sh | 2 +-
gallery/how_to/work_with_microtvm/micro_ethosu.py | 4 +-
gallery/how_to/work_with_microtvm/micro_tvmc.sh | 14 +-
include/tvm/runtime/container/array.h | 6 +
include/tvm/tir/expr.h | 60 -
include/tvm/tir/expr_functor.h | 4 -
include/tvm/tir/stmt.h | 66 -
include/tvm/tir/stmt_functor.h | 148 +-
include/tvm/tir/transform.h | 10 +-
include/tvm/topi/elemwise.h | 6 +-
include/tvm/topi/transform.h | 10 +-
python/gen_requirements.py | 2 +-
python/tvm/driver/tvmc/compiler.py | 173 +
python/tvm/ir/json_compact.py | 2 -
python/tvm/meta_schedule/schedule/cuda/__init__.py | 2 +
.../schedule/cuda/layout_transform.py | 583 ++++
.../tvm/relay/analysis/operations_distribution.py | 102 +
.../tvm/relay/backend/contrib/ethosu/tir/passes.py | 2 +-
.../backend/contrib/ethosu/tir_to_cs_translator.py | 1 -
python/tvm/relay/frontend/onnx.py | 21 +
python/tvm/relay/frontend/pytorch.py | 2 +-
python/tvm/relay/op/_transform.py | 2 +-
python/tvm/relay/op/strategy/cuda.py | 11 +
python/tvm/relay/op/strategy/generic.py | 36 +-
python/tvm/relay/transform/suffixes.py | 105 +
python/tvm/script/ir_builder/tir/ir.py | 2 -
python/tvm/script/parser/tir/parser.py | 6 +-
python/tvm/tir/__init__.py | 3 +-
python/tvm/tir/analysis/analysis.py | 3 +-
python/tvm/tir/expr.py | 30 -
python/tvm/tir/stmt.py | 38 +-
python/tvm/tir/transform/transform.py | 45 +-
python/tvm/topi/hexagon/tensor_intrin.py | 309 +-
python/tvm/topi/transform.py | 17 +-
src/contrib/hybrid/codegen_hybrid.cc | 6 -
src/contrib/hybrid/codegen_hybrid.h | 2 -
src/driver/driver_api.cc | 3 +-
.../postproc/disallow_async_strided_mem_copy.cc | 2 +-
.../postproc/rewrite_parallel_vectorize_unroll.cc | 81 +-
src/meta_schedule/postproc/verify_gpu_code.cc | 2 +-
.../backend/contrib/cmsisnn/extract_constants.cc | 1 +
src/relay/backend/contrib/cmsisnn/fuse_pads.cc | 3 +-
.../backend/contrib/cmsisnn/generate_constants.cc | 12 +-
.../contrib/cmsisnn/scalar_to_tensor_constant.cc | 5 +-
src/relay/printer/text_printer.h | 2 -
src/relay/printer/tir_text_printer.cc | 19 -
src/relay/printer/tvmscript_printer.cc | 26 -
src/relay/transforms/annotate_target.cc | 1 +
src/runtime/hexagon/hexagon_device_api.cc | 2 +-
src/script/ir_builder/tir/utils.h | 26 +-
src/script/printer/legacy_repr.cc | 27 -
src/script/printer/tir/expr.cc | 6 -
src/script/printer/tir/ir.cc | 3 +-
src/script/printer/tir/stmt.cc | 7 -
src/target/codegen.cc | 1 -
src/target/llvm/codegen_llvm.cc | 12 +-
src/target/llvm/codegen_llvm.h | 2 -
src/target/llvm/llvm_module.cc | 1 -
src/target/source/codegen_c.cc | 8 -
src/target/source/codegen_c.h | 2 -
src/target/source/codegen_opencl.cc | 52 +-
src/target/source/codegen_opencl.h | 6 -
src/target/stackvm/codegen_stackvm.cc | 8 -
src/target/stackvm/codegen_stackvm.h | 2 -
src/te/autodiff/jacobian.cc | 1 -
src/te/operation/create_primfunc.cc | 2 +-
src/te/operation/cross_thread_reduction.cc | 1 +
src/te/operation/hybrid_op.cc | 4 +-
src/te/operation/op_utils.cc | 16 -
src/te/operation/op_utils.h | 16 -
src/tir/analysis/block_access_region_detector.cc | 10 -
src/tir/analysis/buffer_access_lca_detector.cc | 9 -
src/tir/analysis/device_constraint_utils.cc | 18 -
src/tir/analysis/estimate_flops.cc | 11 +-
src/tir/analysis/side_effect.cc | 5 -
src/tir/analysis/var_touch.cc | 8 -
src/tir/analysis/var_use_def_analysis.cc | 8 -
src/tir/analysis/var_use_def_analysis.h | 4 -
src/tir/analysis/verify_gpu_code.cc | 8 -
src/tir/analysis/verify_memory.cc | 8 -
src/tir/ir/expr.cc | 70 +-
src/tir/ir/expr_functor.cc | 8 -
src/tir/ir/index_map.cc | 2 +-
src/tir/ir/stmt.cc | 53 -
src/tir/ir/stmt_functor.cc | 27 -
src/tir/op/op.cc | 2 +
src/tir/schedule/analysis/reducer.cc | 18 -
src/tir/schedule/primitive/blockize_tensorize.cc | 2 +-
src/tir/schedule/primitive/cache_index.cc | 8 +-
src/tir/schedule/primitive/cache_read_write.cc | 16 +-
src/tir/schedule/primitive/compute_inline.cc | 8 -
.../schedule/primitive/layout_transformation.cc | 36 +-
src/tir/schedule/primitive/reduction.cc | 8 +-
src/tir/transforms/arg_binder.cc | 2 +-
src/tir/transforms/bf16_legalize.cc | 696 ++--
src/tir/transforms/bound_checker.cc | 8 -
src/tir/transforms/common_subexpr_elim.cc | 5 +-
src/tir/transforms/compact_buffer_region.cc | 8 -
src/tir/transforms/coproc_sync.cc | 6 -
src/tir/transforms/inject_copy_intrin.cc | 2 +-
src/tir/transforms/inject_double_buffer.cc | 8 -
src/tir/transforms/inject_software_pipeline.cc | 16 +-
src/tir/transforms/inject_virtual_thread.cc | 18 +-
src/tir/transforms/install_debug_spans.h | 1 -
src/tir/transforms/ir_utils.cc | 8 -
src/tir/transforms/lower_cross_thread_reduction.cc | 2 +-
src/tir/transforms/lower_custom_datatypes.cc | 8 -
src/tir/transforms/lower_match_buffer.cc | 14 -
src/tir/transforms/lower_thread_allreduce.cc | 8 -
src/tir/transforms/lower_warp_memory.cc | 12 -
src/tir/transforms/make_packed_api.cc | 10 +-
.../manifest_shared_memory_local_stage.cc | 2 +-
.../merge_dynamic_shared_memory_allocations.cc | 16 -
src/tir/transforms/narrow_datatype.cc | 10 +-
src/tir/transforms/renew_defs.cc | 8 -
src/tir/transforms/rewrite_unsafe_select.cc | 3 -
src/tir/transforms/simplify.cc | 4 -
src/tir/transforms/split_host_device.cc | 2 +-
src/tir/transforms/storage_access.cc | 8 -
src/tir/transforms/storage_access.h | 3 -
src/tir/transforms/storage_flatten.cc | 16 -
src/tir/transforms/storage_rewrite.cc | 44 +-
src/tir/transforms/thread_storage_sync.cc | 7 -
src/tir/transforms/unroll_loop.cc | 4 -
src/tir/transforms/update_pointer_storage_scope.cc | 8 -
src/tir/transforms/update_pointer_storage_scope.h | 2 -
src/tir/transforms/vectorize_loop.cc | 19 +-
src/tir/usmp/analysis/extract_buffer_info.cc | 7 +-
src/tir/usmp/transform/create_io_allocates.cc | 6 -
src/topi/transform.cc | 2 +-
.../hexagon/hexagon_device_api_tests.cc | 3 +
tests/lint/check_file_type.py | 1 +
tests/lint/rat-excludes | 1 +
tests/micro/arduino/test_utils.py | 2 +-
tests/micro/common/test_autotune.py | 2 +-
tests/micro/common/test_mlperftiny.py | 130 +-
tests/micro/common/test_tvmc.py | 2 +-
tests/python/contrib/test_ethosu/infra.py | 11 +-
.../test_pass_operations_distribution.py | 173 +
.../test_hexagon/test_fixed_point_multiply.py | 138 +-
tests/python/driver/tvmc/test_compiler.py | 351 ++
tests/python/frontend/onnx/test_forward.py | 33 +
tests/python/integration/test_reduce.py | 4 +-
.../relay/opencl_texture/test_injection_texture.py | 85 +
...e_postproc_rewrite_parallel_vectorize_unroll.py | 44 +
.../test_meta_schedule_relay_integration.py | 3 +
...meta_schedule_schedule_cuda_layout_transform.py | 466 +++
tests/python/unittest/test_target_codegen_llvm.py | 6 +-
.../python/unittest/test_target_codegen_opencl.py | 6 +-
.../unittest/test_target_texture_codegen_opencl.py | 375 +++
.../test_tir_analysis_estimate_tir_flops.py | 30 +
tests/python/unittest/test_tir_nodes.py | 2 +-
.../unittest/test_tir_schedule_compute_inline.py | 2 +-
.../unittest/test_tir_schedule_read_write_at.py | 221 ++
.../unittest/test_tir_schedule_transform_layout.py | 36 +
.../unittest/test_tir_transform_bf16_legalize.py | 257 +-
.../unittest/test_tir_transform_storage_rewrite.py | 8 +-
.../python/unittest/test_tvmscript_printer_tir.py | 2 +-
tests/python/unittest/test_tvmscript_roundtrip.py | 16 +
tests/scripts/request_hook/request_hook.py | 2 +-
170 files changed, 6079 insertions(+), 3306 deletions(-)
create mode 100644 python/tvm/meta_schedule/schedule/cuda/layout_transform.py
create mode 100644 python/tvm/relay/analysis/operations_distribution.py
create mode 100644 python/tvm/relay/transform/suffixes.py
create mode 100644
tests/python/contrib/test_ethosu/test_pass_operations_distribution.py
create mode 100644 tests/python/relay/opencl_texture/test_injection_texture.py
create mode 100644
tests/python/unittest/test_meta_schedule_schedule_cuda_layout_transform.py
create mode 100644 tests/python/unittest/test_tir_schedule_read_write_at.py