This is an automated email from the ASF dual-hosted git repository.

moreau pushed a change to branch ci-docker-staging in repository https://gitbox.apache.org/repos/asf/tvm.git.
from db93cb8 retrigger CI
add 2b8d113 [TVMC] Allow manual shape specification in tvmc (#7366)
add 0716c2a [AutoScheduler] Add sampling to dispatcher (#7376)
add 2999d03 [ONNX] Add CumSum operator to ONNX frontend (#7391)
add 68b7e71 [Relay][Topi][CPU] Dense with weight transform (#7404)
add 3863e09 [FIX,CMAKE] Only set Clang flags for C++ files (#7424)
add 9175c6d TRT Dynamic Reshape Fix (#7412)
add 12c6b70 Simplify full broadcast (#7423)
add b7808fb [Arith] Fix iter_affine_map with non-const extent (#7437)
add d05d75d Stop running some python testsuites twice (#7430)
add 6b58321 [BYOC][TRT] Fix small bug preventing TRT runtime compilation for versions < 6 (#7372)
add 8b9005f Make the TVM targets list available in Python (#7427)
add c52c176 Replace type punning with memcpy. (#7415)
add 33829b3 Fix double compile of runtime sources for TRT, ACL (#7436)
add d5851dd [TIR][Printer] Fix SelectNode TIRTextPrinter bracket mismatch (#7405)
add c7c54de Update tags with minor fix (#7448)
add d769727 Add ROCm docker (#7422)
add e426c87 [AutoScheduler] Fix distill record (#7439)
add b36bdf6 [Relay][Op][Bug] Fix missing return in scatter_nd cuda strategy (#7447)
add a1260cc Make keras reshape less restrictive (#7446)
add f9ff088 Merge remote-tracking branch 'origin/main' into junit-enable
add 6a77cdd prefix junit results with FFI type

No new revisions were added by this update.
Summary of changes: CMakeLists.txt | 4 +- cmake/modules/ClangFlags.cmake | 19 ++-- cmake/modules/contrib/ArmComputeLib.cmake | 4 +- cmake/modules/contrib/TensorRT.cmake | 4 +- .../{Dockerfile.ci_wasm => Dockerfile.demo_rocm} | 20 +--- docker/bash.sh | 16 ++- docker/install/ubuntu_install_rocm.sh | 6 +- docker/with_the_same_user | 6 ++ include/tvm/relay/attrs/transform.h | 4 + include/tvm/relay/dataflow_pattern.h | 2 + include/tvm/target/target_kind.h | 5 + python/tvm/auto_scheduler/__init__.py | 2 +- python/tvm/auto_scheduler/dispatcher.py | 93 +++++++++++++++- python/tvm/auto_scheduler/measure_record.py | 52 +++++---- python/tvm/driver/tvmc/autotuner.py | 9 +- python/tvm/driver/tvmc/common.py | 39 +++++++ python/tvm/driver/tvmc/compiler.py | 16 ++- python/tvm/driver/tvmc/frontends.py | 47 ++++---- python/tvm/relay/frontend/keras.py | 31 ++---- python/tvm/relay/frontend/onnx.py | 25 ++++- python/tvm/relay/op/_transform.py | 2 +- python/tvm/relay/op/contrib/tensorrt.py | 13 ++- python/tvm/relay/op/nn/_nn.py | 30 ++++++ python/tvm/relay/op/nn/nn.py | 33 ++++++ python/tvm/relay/op/strategy/cuda.py | 1 + python/tvm/relay/op/strategy/generic.py | 15 ++- python/tvm/relay/op/strategy/x86.py | 28 +++-- python/tvm/relay/op/transform.py | 12 ++- python/tvm/target/target.py | 5 + python/tvm/topi/cuda/scan.py | 10 +- python/tvm/topi/cumsum.py | 21 +++- python/tvm/topi/nn/dense.py | 70 ++++++++++++ python/tvm/topi/x86/__init__.py | 1 + python/tvm/topi/x86/dense.py | 120 +++++++++++++++------ python/tvm/topi/x86/dense_alter_op.py | 68 ++++++++++++ src/arith/iter_affine_map.cc | 36 ++++--- src/printer/tir_text_printer.cc | 2 +- src/relay/ir/dataflow_matcher.cc | 8 +- src/relay/ir/dataflow_pattern.cc | 1 + src/relay/op/make_op.h | 6 ++ src/relay/op/nn/nn.cc | 27 +++++ src/relay/op/nn/nn.h | 25 +++++ src/relay/op/tensor/transform.cc | 3 +- src/relay/op/tensor/unary.cc | 6 +- src/relay/transforms/fold_constant.cc | 5 - src/relay/transforms/simplify_expr.cc | 111 ++++++++++++++++--- 
src/runtime/contrib/tensorrt/tensorrt_ops.cc | 2 +- src/runtime/crt/common/ndarray.c | 14 +-- src/runtime/crt/graph_runtime/graph_runtime.c | 10 +- src/target/tag.cc | 13 +-- src/target/target_kind.cc | 9 ++ tests/cpp/target_test.cc | 6 ++ tests/python/contrib/test_tensorrt.py | 101 +++++++++++++++++ tests/python/driver/tvmc/conftest.py | 17 +++ tests/python/driver/tvmc/test_common.py | 33 ++++++ tests/python/driver/tvmc/test_compiler.py | 31 ++++-- tests/python/driver/tvmc/test_frontends.py | 20 +++- tests/python/frontend/keras/test_forward.py | 10 ++ tests/python/frontend/onnx/test_forward.py | 77 +++++++++++++ tests/python/relay/test_auto_scheduler_tuning.py | 17 ++- tests/python/relay/test_autotvm_task_extraction.py | 12 +-- tests/python/relay/test_dataflow_pattern.py | 2 + tests/python/relay/test_op_level3.py | 83 +++++++------- tests/python/relay/test_pass_alter_op_layout.py | 31 +++++- tests/python/relay/test_pass_fold_constant.py | 16 --- tests/python/relay/test_pass_simplify_expr.py | 65 +++++++++++ .../python/unittest/test_arith_iter_affine_map.py | 3 + tests/python/unittest/test_target_target.py | 8 ++ tests/scripts/setup-pytest-env.sh | 18 ++-- tests/scripts/task_python_arm_compute_library.sh | 3 +- tests/scripts/task_python_ethosn_tests.sh | 2 +- tests/scripts/task_python_frontend.sh | 14 +-- tests/scripts/task_python_frontend_cpu.sh | 6 +- tests/scripts/task_python_integration.sh | 18 ++-- tests/scripts/task_python_microtvm.sh | 2 +- tests/scripts/task_python_nightly.sh | 2 +- tests/scripts/task_python_topi.sh | 2 +- tests/scripts/task_python_unittest.sh | 10 +- tests/scripts/task_python_vta_fsim.sh | 6 +- tests/scripts/task_python_vta_tsim.sh | 6 +- tutorials/auto_scheduler/tune_network_arm.py | 2 +- tutorials/auto_scheduler/tune_network_cuda.py | 2 +- tutorials/auto_scheduler/tune_network_mali.py | 2 +- tutorials/auto_scheduler/tune_network_x86.py | 2 +- tutorials/micro/micro_tflite.py | 2 +- 85 files changed, 1409 insertions(+), 333 deletions(-) 
copy docker/{Dockerfile.ci_wasm => Dockerfile.demo_rocm} (70%)
create mode 100644 python/tvm/topi/x86/dense_alter_op.py