This is an automated email from the ASF dual-hosted git repository.
github-bot pushed a change to branch nightly
in repository https://gitbox.apache.org/repos/asf/tvm.git
from a7a1980480 [CI] Update ci_cpu image and build with llvm-15 (#14466)
add f79e4ebf30 [Bugfix][Topi] Output strides in pack_buffer() utility (#14566)
add e5fc9f6add [skip ci][COMMUNITY] Zihao Ye -> Committer (#14578)
add 515583ce28 [AutoTVM] New rank-binary loss_type for the new xgboost >= 2.0.0 behaviour (#14468)
add 51dcafb4ab [microNPU][ETHOSU] Add restrictions to convert to NHCWB16 layout in LayoutOptimization pass (#14464)
add 3a3118a754 feat: use spot instances for ci with on demand as a backup (#14477)
add b5c71bdab1 [Docs] Fix typo in the Vitis AI Integration docs (#14585)
add 1c5442d2e9 [Codegen][LLVM] Remove cast to i8* in builtin::address_of (#14563)
add 1db4464c08 [Fix][TIR][Analysis] Reduction block checking alloc_buffers (#14589)
add 9fb9fd6898 [TIR] Use String instead of StringImm for AttrStmtNode::node (#14491)
add fb2ae1a676 [Arith] Fix solve inequality of unbound var ranges (#14582)
add f622e7f180 [ARITH][BUGFIX] Fix a bug of iter map floormod(x,2) simplify (#14571)
add 8554e7afb4 [Bugfix] [Relay] fix a bug caused by IncompleteTypeNode in EinsumRel while doing MergeComposite (#14556)
add f28fcd1239 [TensorIR] Fix ComputeAt with perfect symbolic bound (#14592)
add 7766f3c51e [Object] Implemented .as<T> for ObjectRef param, returns Optional<T> (#14522)
add ca7c3d8a14 [LLVM] Expand tvm::Type to DWARF conversion (#14568)
add 40af75b61f [Fix][TIR] UnifyThreadBinding creating unit loop with annotation (#14588)
add 1c52e633c7 [TIR][Schedule] Method returning the function being worked on (#14593)
No new revisions were added by this update.
Summary of changes:
CONTRIBUTORS.md | 1 +
apps/benchmark/adreno/adreno_gpu_bench_clml.py | 36 ++++-
apps/benchmark/adreno/adreno_gpu_bench_texture.py | 36 ++++-
ci/jenkins/generated/arm_jenkinsfile.groovy | 110 +++++++++++---
ci/jenkins/generated/cortexm_jenkinsfile.groovy | 154 +++++++++++++++----
ci/jenkins/generated/cpu_jenkinsfile.groovy | 88 ++++++++---
ci/jenkins/generated/docker_jenkinsfile.groovy | 16 +-
ci/jenkins/generated/gpu_jenkinsfile.groovy | 167 ++++++++++++++++-----
ci/jenkins/generated/hexagon_jenkinsfile.groovy | 110 +++++++++++---
ci/jenkins/generated/i386_jenkinsfile.groovy | 55 +++++--
ci/jenkins/generated/lint_jenkinsfile.groovy | 12 +-
.../generated/minimal_cross_isa_jenkinsfile.groovy | 33 ++--
ci/jenkins/generated/minimal_jenkinsfile.groovy | 33 ++--
ci/jenkins/generated/riscv_jenkinsfile.groovy | 33 ++--
ci/jenkins/generated/wasm_jenkinsfile.groovy | 22 ++-
ci/jenkins/templates/utils/Prepare.groovy.j2 | 4 +-
ci/jenkins/templates/utils/base.groovy.j2 | 6 +-
ci/jenkins/templates/utils/macros.j2 | 23 ++-
docs/how_to/deploy/vitis_ai.rst | 2 +-
.../how_to/deploy_models/deploy_model_on_adreno.py | 38 ++++-
gallery/how_to/tune_with_autotvm/tune_relay_arm.py | 24 ++-
.../how_to/tune_with_autotvm/tune_relay_cuda.py | 24 ++-
.../tune_with_autotvm/tune_relay_mobile_gpu.py | 24 ++-
gallery/how_to/tune_with_autotvm/tune_relay_x86.py | 24 ++-
gallery/tutorial/autotvm_relay_x86.py | 39 ++++-
include/tvm/runtime/container/optional.h | 9 ++
include/tvm/runtime/object.h | 39 ++++-
include/tvm/tir/schedule/schedule.h | 2 +
include/tvm/topi/detail/extern.h | 2 +-
python/tvm/autotvm/testing/tune_relay.py | 2 +-
python/tvm/autotvm/tuner/xgboost_cost_model.py | 45 +++++-
python/tvm/autotvm/tuner/xgboost_tuner.py | 4 +-
python/tvm/contrib/torch/pytorch_tvm.py | 24 ++-
python/tvm/driver/tvmc/autotuner.py | 46 +++++-
python/tvm/relay/backend/contrib/ethosu/codegen.py | 90 +++++++++--
python/tvm/tir/schedule/schedule.py | 7 +-
src/arith/canonical_simplify.cc | 16 +-
src/arith/int_constraints.cc | 25 ++-
src/arith/int_set.cc | 5 +-
src/arith/iter_affine_map.cc | 81 +++++-----
src/arith/rewrite_simplify.cc | 17 ++-
src/contrib/hybrid/codegen_hybrid.cc | 4 +-
src/driver/driver_api.cc | 7 +-
src/ir/expr.cc | 12 +-
src/ir/module.cc | 4 +-
src/ir/type_functor.cc | 8 +-
src/meta_schedule/database/database_utils.cc | 4 +-
src/meta_schedule/postproc/verify_gpu_code.cc | 4 +-
src/meta_schedule/postproc/verify_vtcm_limit.cc | 4 +-
src/meta_schedule/space_generator/schedule_fn.cc | 8 +-
src/relay/analysis/call_graph.cc | 10 +-
src/relay/analysis/get_calibration_data.cc | 11 +-
src/relay/analysis/match_exhaustion.cc | 8 +-
src/relay/analysis/type_solver.cc | 6 +-
src/relay/backend/annotate_used_memory.cc | 5 +-
src/relay/backend/aot/aot_lower_main.cc | 2 +-
src/relay/backend/aot_executor_codegen.cc | 2 +-
.../backend/contrib/cmsisnn/extract_constants.cc | 8 +-
src/relay/backend/contrib/cmsisnn/relay_to_tir.cc | 16 +-
.../contrib/cmsisnn/scalar_to_tensor_constant.cc | 9 +-
src/relay/backend/contrib/ethosu/codegen.cc | 2 +-
src/relay/backend/contrib/ethosu/preprocess.cc | 8 +-
.../contrib/example_target_hooks/relay_to_tir.cc | 13 +-
src/relay/backend/interpreter.cc | 18 +--
src/relay/backend/te_compiler.cc | 21 ++-
src/relay/backend/vm/compiler.cc | 15 +-
src/relay/backend/vm/lambda_lift.cc | 4 +-
src/relay/backend/vm/removed_unused_funcs.cc | 4 +-
src/relay/collage/mock_cost_estimator.cc | 3 +-
src/relay/collage/sub_graph.cc | 4 +-
src/relay/ir/dataflow_matcher.cc | 4 +-
src/relay/ir/expr_functor.cc | 4 +-
src/relay/ir/function.cc | 4 +-
src/relay/op/memory/memory.cc | 4 +-
src/relay/op/tensor/math.cc | 4 +
src/relay/op/type_relations.cc | 4 +-
src/relay/parser/parser.cc | 4 +-
src/relay/printer/relay_text_printer.cc | 24 +--
src/relay/transforms/canonicalize_cast.cc | 4 +-
src/relay/transforms/compiler_function_utils.cc | 4 +-
src/relay/transforms/dead_code.cc | 4 +-
src/relay/transforms/device_planner.cc | 35 ++---
src/relay/transforms/dynamic_to_static.cc | 4 +-
src/relay/transforms/eta_expand.cc | 8 +-
src/relay/transforms/fold_constant.cc | 4 +-
src/relay/transforms/fuse_ops.cc | 4 +-
src/relay/transforms/higher_order_gradient.cc | 16 +-
src/relay/transforms/inline.cc | 8 +-
src/relay/transforms/lazy_gradient_init.cc | 4 +-
src/relay/transforms/partial_eval.cc | 8 +-
src/relay/transforms/partition_graph.cc | 20 +--
src/relay/transforms/simplify_expr.cc | 4 +-
src/relay/transforms/type_infer.cc | 8 +-
src/runtime/debug.cc | 8 +-
src/script/ir_builder/tir/ir.cc | 36 ++---
src/script/printer/doc_printer/base_doc_printer.cc | 96 ++++++------
src/script/printer/ir/ir.cc | 4 +-
src/script/printer/tir/block.cc | 6 +-
src/script/printer/tir/expr.cc | 13 +-
src/target/llvm/codegen_cpu.cc | 28 +++-
src/target/llvm/codegen_llvm.cc | 21 ++-
src/target/source/codegen_c.cc | 4 +-
src/target/source/codegen_cuda.cc | 4 +-
src/target/target.cc | 32 ++--
src/target/target_kind.cc | 7 +-
src/te/operation/create_primfunc.cc | 17 +--
src/tir/analysis/calculate_allocated_memory.cc | 5 +-
src/tir/analysis/control_flow_graph.cc | 8 +-
src/tir/analysis/estimate_flops.cc | 8 +-
src/tir/analysis/identify_memcpy.cc | 8 +-
src/tir/analysis/side_effect.cc | 4 +-
src/tir/analysis/verify_gpu_code.cc | 5 +-
src/tir/analysis/verify_memory.cc | 5 +-
src/tir/analysis/verify_ssa.cc | 5 +-
src/tir/ir/expr.cc | 2 +-
src/tir/ir/stmt_functor.cc | 16 +-
src/tir/schedule/analysis/layout.cc | 4 +-
src/tir/schedule/analysis/reducer.cc | 22 ++-
src/tir/schedule/concrete_schedule.h | 1 +
src/tir/schedule/primitive/annotate.cc | 16 +-
src/tir/schedule/primitive/blockize_tensorize.cc | 8 +-
src/tir/schedule/primitive/cache_read_write.cc | 4 +-
src/tir/schedule/primitive/compute_at.cc | 9 +-
src/tir/schedule/primitive/decompose_padding.cc | 4 +-
src/tir/schedule/primitive/get_block_loop.cc | 8 +-
src/tir/schedule/primitive/loop_transformation.cc | 8 +-
src/tir/schedule/schedule.cc | 78 +++++-----
src/tir/schedule/state.cc | 5 +-
src/tir/schedule/trace.cc | 12 +-
src/tir/transforms/bf16_legalize.cc | 16 +-
src/tir/transforms/extract_constants.cc | 5 +-
src/tir/transforms/hoist_expression.cc | 4 +-
src/tir/transforms/inject_rolling_buffer.cc | 6 +-
src/tir/transforms/lower_custom_datatypes.cc | 4 +-
src/tir/transforms/lower_opaque_block.cc | 8 +-
src/tir/transforms/make_packed_api.cc | 6 +-
src/tir/transforms/make_unpacked_api.cc | 4 +-
src/tir/transforms/profile_instrumentation.cc | 9 +-
.../reduce_branching_through_overcompute.cc | 4 +-
src/tir/transforms/renew_defs.cc | 4 +-
src/tir/transforms/rewrite_unsafe_select.cc | 4 +-
src/tir/transforms/thread_storage_sync.cc | 2 +-
src/tir/transforms/unify_thread_binding.cc | 17 ++-
src/tir/transforms/vectorize_loop.cc | 4 +-
.../test_clml/test_adreno_collage_targets.py | 2 +-
tests/python/contrib/test_ethosu/infra.py | 18 ++-
tests/python/contrib/test_ethosu/test_codegen.py | 56 +++++++
.../contrib/test_ethosu/test_layout_optimizer.py | 38 +++++
tests/python/contrib/test_hexagon/test_autotvm.py | 24 ++-
.../relay/collage/demo_collage_partitioner.py | 2 +-
tests/python/relay/test_pass_merge_composite.py | 47 +++++-
.../unittest/test_arith_canonical_simplify.py | 7 +
.../python/unittest/test_arith_iter_affine_map.py | 10 +-
.../python/unittest/test_arith_rewrite_simplify.py | 22 ++-
.../unittest/test_arith_solve_linear_inequality.py | 15 ++
.../python/unittest/test_autotvm_xgboost_model.py | 4 +-
tests/python/unittest/test_target_codegen_llvm.py | 20 +++
.../unittest/test_tir_schedule_compute_at.py | 41 +++++
.../python/unittest/test_tir_schedule_reduction.py | 54 +++++++
.../python/unittest/test_tir_schedule_utilities.py | 1 +
.../test_tir_transform_inject_software_pipeline.py | 90 +++++------
.../test_tir_transform_unify_thread_binding.py | 25 +++
tests/python/unittest/test_tvmscript_roundtrip.py | 40 +++--
vta/scripts/tune_resnet.py | 24 ++-
vta/tutorials/autotvm/tune_alu_vta.py | 24 ++-
vta/tutorials/autotvm/tune_relay_vta.py | 24 ++-
166 files changed, 2252 insertions(+), 893 deletions(-)