This is an automated email from the ASF dual-hosted git repository.
mousius pushed a change to branch ci-docker-staging
in repository https://gitbox.apache.org/repos/asf/tvm.git.
discard d2cf72c Validate tlcpackstaging/ci_cpu:20211102-232503-054fff568
add b8fb438 Fix several typos in pytest_target_parameterization.rst
(#9447)
add 85fd85f [MetaSchedule] Task Extraction (#9382)
add e24c075 [MetaSchedule] Sample-Perfect-Tile (#9449)
add e3a3043 [CI] Pin setuptools to v58.4.0 in CI to circumvent breaking
change in v58.5 (#9446)
add 5527cbf Update TVM ci-cpu docker image to v.079 (#9454)
add 048994b [Bug][Meta Schedule] Fix Infinite Loop Caused When Calling
Methods Not Overrided In PyClass. (#9451)
add e7024fb [PyTorch]Add PyTorchTVM: compile torchscript to tvm and
export as pytorch_op (#8777)
add 4973cd3 [TIR][Schedule] Add get-child-blocks primitive (#9434)
add efb367a Fix typo. (#9462)
add 374e15b [TensorIR] Print TVMScript with prefix T instead of tir
(#9422)
add 7b58e16 [TensorIR] GetProducer, GetConsumer (#506) (#9464)
add 3a9f40c Fix an infinite recompilation loop in tvm-sys. (#9450)
add 5a4526d [TVMC] Re-enable PyTorch test (#9441)
add 01141d4 Support quantised SQRT operator in TFLite (#9258)
add a644e29 [Frontend][PaddlePaddle] Add operators of interploate/flatten
and modify try_infer_value (#9459)
add 811312c [TIR] Make compact buffer and get access region aware of
conditions (#9372)
add bc505fc add is_entry_func tag for device function (#9436)
add 6aa5ba2 Add back-to-back conv2d Hexagon test for stripe scheduling
(#9390)
add 028f4fa [Relay] Non-recursive Dtor for Let (#9461)
add 7ced071 [Frontend][TFlite] Cast MirrorPad paddings to int32 (#9468)
add 7c3283c Fix function annotation (#9474)
add b86aedd [CMSIS-NN] Convert CMSIS-NN to use Target Hooks (#9397)
add 5147442 [TVMC] Add test for quantized pytorch model (#9467)
add 00b0a81 [TIR] Add type hint for TIR (#9432)
add 6549f47 [AOT][Tests] Use pre-built libraries in Reference System
tests (#9271)
add 675f348 Better host handling in CompilationConfig & debug printing
(#9460)
add fc4069b [microNPU] Replace ICHECK with diagnostic context in type
inference (#9470)
add 0fd83eb [MicroTVM][PyTest] Explicitly skip MicroTVM unittests. (#9335)
add 74accec [CMSIS-NN] Assert correct amount of CMSIS-NN artifacts in MLF
(#9480)
add 86781e9 [ETHOSN] Streamline Ethos(TM)-N cross-compile rpc usage
(#9477)
add 0812c07 Change Call with TIRCallAttrs to call_lowered op (#9312)
add dc56eea [Support] Add libinfo into the runtime build (#9310)
add f1c2c5f Fixed some warnings about lambda's closures that are bigger
than necessary (#9481)
add b26ddfe [HOTFIX][TARGET] Change LOG in compilation config to DLOG
(#9486)
add 1e09bb2 Add default for split op (#9489)
add f7b3909 [COMMUNITY] Junru's and Wuwei's PGP key for ASF release
(#9488)
add e81d391 Arm(R) Ethos(TM)-U NPU BinaryElementwise operators support
(#9442)
add e5427b2 [Relay] Use target_host determined at Relay level instead of
recalculating it (#9499)
add 7f3d363 Add LLVM-13 installation to Docker setup (#9498)
add 4bebfd8 Fix repository URL in ubuntu_install_rocm.sh (#9425)
add 6159b8e [Topi][Op][PyTorch][Vitas] Fix inconsistent kernel layout
conventions for conv2d_transpose (#9336)
add 137def8 [TARGET] Move target_host usage to new target style. (#9497)
add 2dad4d1 [BugFix] Fix divide by zero error in TIR pass
lower_warp_memory (#9485)
add 3ad7c4a [Conv2DTransposed] Fix wrong shape check and add new TOPI
module to support groups (#9465)
add be03d62 Switch PlanDevices pass to be w.r.t. SEScopes instead of
DLDeviceTypes. (#9326)
add 67714c6 [1/3][AOT][DeviceAPI] Connecting devices structure to
relevant operators (#9395)
add 856ebb2 Make version.py to rely on repository metadata to generate
version string. (#9472)
add 4c1b66f [ONNX] Unique op should always return int64 indices (#9490)
add e4904c6 Followup from #9312 (Introduce call_lowered op) (#9491)
add 7ea78cc added tests for quantized tflite sin operator (#9478)
add 08898e1 [TensorIR] Cross-Thread Reduction (#9360)
add 13f54e0 [BugFix][TVMScript] Fix printer for dependent loops (#9506)
add 76c78a9 [Topi] Cortex-M DSP support (#9233)
add 3f9b72d [TVMScript] Report error if add attr to implicit root block
(#9507)
add 22ba652 fix compute inline not to over write annotated opaque
accesses (#9509)
add eda12cb [ONNX][Relay] Support "tf_crop_and_resize" in relay Resize
op. (#9475)
add 948641c [2/3][AOT][DeviceAPI] Add Hooks for
Activate/Deactivate/Open/Close (#9500)
add c3a06ee Add the Arm(R) Ethos(TM)-U NPU identity operator (#9457)
add 3f2ae34 [ETHOSN] Cleanup of trademarks and registered trademarks
(#9516)
add 95ff358 [microNPU] Allow constants to be given as input to an
operator (#9515)
add ee23013 [4/10] Code generation for Conv2D via CMSIS-NN (#9331)
add e9b6845 [microNPU] Adding rounding mode attribute to operators (#9514)
add 9454aa4 Add a 'rolling_buffer' scheduling primitive (#9444)
add 65606c9 [ONNX] Normalize axes for Slice (#9517)
add d66a40a [PROFILER,VM] Fix timer device type for reshape_tensor (#9518)
add e276929 cleanup Hexagon conv2d tests (#9473)
add c64e526 Add Chris (#9532)
add 6832309 [AlterLayout] Respect input layout for dense op if explicitly
specified (#9535)
add 53cb5ea [TVMC][microTVM] Add new micro context (#9229)
add 454e956 [TEST] Fix duplicate definition error for gpu export mod
testcase (#9538)
add 3f5dca5 [Docker][Onnx] Upgrade ONNX to latest version (#9519)
add 0cb6337 [TVMC][Relay] Introduce executor and runtime parameters
(#9352)
add 659631d [Relay][Frontend] Prune redundant logging (#9545)
add 328d7c7 remove compile warning complained by macos clang-13.0 (#9522)
add 8e1425d Expose workspace size in tvmgen_default.h (#9510)
add ecd8a9c [CI.Lint.Black] Use "en_US.UTF-8" for Red Hat 6&7
Compatibility (#9537)
add d061d7f [microNPU] Add unary elementwise operator infrastructure with
ABS (#9530)
add cdca84a [TVMScript][Fix] Add type hints for more uncovered cases
(#9505)
add 44fae01 Revert "[CI.Lint.Black] Use "en_US.UTF-8" for Red Hat 6&7
Compatibility (#9537)" (#9548)
add 008367d [3/3][AOT][DeviceAPI] Wire up cpacked Device API context
(#9501)
add 45af5c7 [Frontend][ONNX] Support RandomNormal operator (#9493)
add 34ea319 [Relay] Prepare DeadCodeElimination for running post
LowerTEPass/ManifestAlloc. (#9542)
add 18730c4 [TIR][USMP] Added buffer info extraction pass (#8468)
add 4a6b8c0 Fix Jenkins skip for CPU/GPU (#9549)
add 4bb6f31 [TensorIR][UX] Type annotation-based runtime type checking
(#9559)
add cf17208 [QNN] Fix order of operations in qnn.quantize slightly to
prevent undefined behavior (#9558)
add 9e59e91 [TensorIR][Schedule] Inherit block anotation upon creating
new blocks (#9573)
add e5cbf46 [BUG][TVMScript] fix block range error (#9574)
add 4efec38 Improve the keras frontend to support tflite 2.6 (#9562)
add 9c4e9ff [ONNX] Add MatMulInteger16 contrib op (#9186)
add 289bd90 Prepare for switching VM to LowerTEPass. (#9550)
add 0195afc [Target] enable -arch=sm_xx for assigning cuda target arch
and deprecate autotvm.measure.set_cuda_target_arch api (#9544)
add 3c48cad WithFields for Tuples (#9533)
add 1466e27 ignore 'training_mode' tag from onnx in batch_norm op (#9575)
add 93c2f2d [FIX,PROFILING] Only check if ops duration is nonzero (#9568)
add a63daab Update license file to note libbacktrace (#9579)
add d6fe9a3 Update NEWS to include v0.8 change log (#9580)
add 0754c86 [FIX][TIR] Remove unused code and fix typo in storage_align
(#9583)
add 0e818bb Bump version to 0.9.dev0 (#9581)
add 238958f [microNPU] Fix incorrectly calculated stride when converting
NHWC to NHCWB16 (#9560)
add c3f5271 [microNPU] Change weights and command stream section (#9523)
add 0a4cc89 [microNPU] Support binary elementwise with non-4D inputs
(#9521)
add 8ca8e38 [Relay] WithFields method for Call, Function, Var,
TupleGetItem, If, Let, RefCreate, RefRead, RefWrite, Match, and Clause (#9569)
add f833b4b Add labels to each Jenkins step (#9556)
add 99b9d42 Introduction tutorial formatting fixes (#9539)
add 8712217 [CI] Use correct variable for image name in Jenkinsfile
This update added new revisions after undoing existing revisions.
That is to say, some revisions that were in the old version of the
branch are not in the new version. This situation occurs
when a user --force pushes a change and generates a repository
containing something like this:
 * -- * -- B -- O -- O -- O   (d2cf72c)
            \
             N -- N -- N   refs/heads/ci-docker-staging (8712217)
You should already have received notification emails for all of the O
revisions, and so the following emails describe only the N revisions
from the common base, B.
Any revisions marked "omit" are not gone; other references still
refer to them. Any revisions marked "discard" are gone forever.
No new revisions were added by this update.
Summary of changes:
CMakeLists.txt | 8 +-
CONTRIBUTORS.md | 1 +
Jenkinsfile | 237 ++-
KEYS | 116 ++
LICENSE | 3 +-
NEWS.md | 320 +++-
apps/android_camera/models/prepare_model.py | 2 +-
apps/android_rpc/tests/android_rpc_test.py | 4 +-
apps/benchmark/arm_cpu_imagenet_bench.py | 2 +-
apps/benchmark/mobile_gpu_imagenet_bench.py | 2 +-
apps/bundle_deploy/build_model.py | 35 +-
apps/hexagon_launcher/README.md | 18 +-
apps/ios_rpc/tests/ios_rpc_mobilenet.py | 4 +-
apps/ios_rpc/tests/ios_rpc_test.py | 2 +-
.../template_project/microtvm_api_server.py | 30 +-
apps/microtvm/ethosu/Makefile | 4 +-
apps/microtvm/ethosu/corstone300.ld | 18 +-
.../microtvm/ethosu/include/tvm_ethosu_runtime.h | 32 +-
apps/microtvm/ethosu/run_demo.sh | 8 +-
apps/microtvm/ethosu/src/demo.c | 7 +-
.../microtvm/ethosu/src/tvm_ethosu_runtime.c | 47 +-
.../zephyr/template_project/microtvm_api_server.py | 42 +-
.../env.py => apps/pt_tvmdsoop/CMakeLists.txt | 31 +-
.../pt_tvmdsoop/prepare_and_test_pt_tvm_class.sh | 38 +-
apps/pt_tvmdsoop/tests/test_torch_compile_cpu.py | 68 +
apps/pt_tvmdsoop/tests/test_torch_compile_gpu.py | 63 +
apps/pt_tvmdsoop/tests/test_torch_graph_module.py | 129 ++
apps/pt_tvmdsoop/tests/test_torch_script.py | 116 ++
apps/pt_tvmdsoop/tests/test_torch_vm_module.py | 122 ++
apps/pt_tvmdsoop/tests/test_trace_tvm_module.py | 58 +
apps/topi_recipe/broadcast/test_broadcast_map.py | 4 +-
apps/topi_recipe/conv/depthwise_conv2d_test.py | 4 +-
apps/topi_recipe/conv/test_conv2d_hwcn_map.py | 4 +-
apps/topi_recipe/gemm/android_gemm_square.py | 2 +-
apps/topi_recipe/gemm/cuda_gemm_square.py | 4 +-
apps/topi_recipe/rnn/lstm.py | 4 +-
apps/topi_recipe/rnn/matexp.py | 4 +-
cmake/config.cmake | 3 +
cmake/modules/LibInfo.cmake | 1 +
cmake/modules/contrib/EthosN.cmake | 12 +-
cmake/modules/contrib/PT_TVMDSOOP.cmake | 59 +
cmake/utils/FindEthosN.cmake | 8 +-
conda/recipe/meta.yaml | 2 +-
docker/install/ubuntu1804_install_llvm.sh | 14 +-
docker/install/ubuntu1804_install_python.sh | 4 +-
docker/install/ubuntu1804_install_python_venv.sh | 4 +-
docker/install/ubuntu_install_onnx.sh | 7 +-
docker/install/ubuntu_install_python.sh | 4 +-
docker/install/ubuntu_install_rocm.sh | 6 +-
docker/install/ubuntu_install_vela.sh | 1 -
docs/arch/microtvm_design.rst | 16 +-
docs/dev/how_to/pytest_target_parametrization.rst | 10 +-
docs/how_to/deploy/bnns.rst | 2 +-
docs/how_to/deploy/hls.rst | 5 +-
.../how_to/work_with_microtvm/micro_autotune.py | 10 +-
gallery/how_to/work_with_microtvm/micro_tflite.py | 10 +-
gallery/tutorial/auto_scheduler_matmul_x86.py | 18 +-
gallery/tutorial/autotvm_matmul_x86.py | 2 +-
gallery/tutorial/autotvm_relay_x86.py | 20 +-
gallery/tutorial/install.py | 12 +-
gallery/tutorial/introduction.py | 2 +-
gallery/tutorial/tensor_expr_get_started.py | 21 +-
gallery/tutorial/tvmc_command_line_driver.py | 48 +-
golang/sample/deploy.py | 3 +-
include/tvm/arith/int_set.h | 2 +-
include/tvm/ir/function.h | 12 +-
include/tvm/ir/module.h | 28 +
include/tvm/meta_schedule/builder.h | 1 +
include/tvm/meta_schedule/database.h | 23 +-
include/tvm/meta_schedule/integration.h | 214 +++
include/tvm/meta_schedule/runner.h | 5 +-
include/tvm/meta_schedule/search_strategy.h | 12 +-
include/tvm/meta_schedule/space_generator.h | 4 +
include/tvm/meta_schedule/task_scheduler.h | 68 +-
include/tvm/parser/parser.h | 10 +-
include/tvm/relay/adt.h | 39 +
include/tvm/relay/attrs/annotation.h | 73 -
.../op/vm/vm.h => include/tvm/relay/attrs/call.h | 30 +-
include/tvm/relay/attrs/device_copy.h | 16 +-
include/tvm/relay/attrs/image.h | 24 +
include/tvm/relay/attrs/memory.h | 7 +-
include/tvm/relay/attrs/on_device.h | 101 ++
include/tvm/relay/attrs/random.h | 12 +
include/tvm/relay/executor.h | 24 +-
include/tvm/relay/expr.h | 227 +++
include/tvm/relay/function.h | 29 +
include/tvm/relay/runtime.h | 16 +-
include/tvm/relay/transform.h | 48 +-
include/tvm/runtime/c_runtime_api.h | 2 +-
include/tvm/runtime/vm/bytecode.h | 26 +-
include/tvm/runtime/vm/executable.h | 55 +-
include/tvm/runtime/vm/vm.h | 44 +-
include/tvm/target/compilation_config.h | 22 +-
include/tvm/target/se_scope.h | 6 +
include/tvm/target/target.h | 9 +
include/tvm/te/schedule.h | 7 +
include/tvm/tir/function.h | 7 +
include/tvm/tir/schedule/schedule.h | 34 +
include/tvm/tir/stmt.h | 2 +
include/tvm/tir/transform.h | 7 +
include/tvm/tir/usmp/utils.h | 214 +++
jvm/README.md | 2 +-
jvm/core/src/test/scripts/test_add_cpu.py | 2 +-
jvm/core/src/test/scripts/test_add_gpu.py | 10 +-
python/tvm/__init__.py | 5 +-
python/tvm/_ffi/libinfo.py | 2 +-
python/tvm/auto_scheduler/measure.py | 5 -
python/tvm/auto_scheduler/relay_integration.py | 6 +
python/tvm/autotvm/env.py | 1 -
.../autotvm/graph_tuner/utils/traverse_graph.py | 4 +-
python/tvm/autotvm/measure/measure_methods.py | 54 +-
python/tvm/autotvm/task/relay_integration.py | 8 +-
python/tvm/contrib/nvcc.py | 76 +-
python/tvm/contrib/torch/__init__.py | 51 +
python/tvm/contrib/torch/module.py | 121 ++
python/tvm/contrib/torch/pytorch_tvm.py | 249 ++++
python/tvm/driver/build_module.py | 48 +-
python/tvm/driver/tvmc/__init__.py | 3 +-
python/tvm/driver/tvmc/autotuner.py | 2 +-
python/tvm/driver/tvmc/common.py | 236 ++-
python/tvm/driver/tvmc/compiler.py | 24 +-
python/tvm/driver/tvmc/composite_target.py | 2 +-
python/tvm/driver/tvmc/fmtopt.py | 116 ++
python/tvm/driver/tvmc/main.py | 8 +-
python/tvm/driver/tvmc/micro.py | 300 ++++
python/tvm/driver/tvmc/registry.py | 88 ++
python/tvm/driver/tvmc/runner.py | 332 +++--
python/tvm/driver/tvmc/target.py | 14 +-
python/tvm/ir/module.py | 37 +-
python/tvm/meta_schedule/__init__.py | 1 +
python/tvm/meta_schedule/builder/builder.py | 5 +-
python/tvm/meta_schedule/builder/local_builder.py | 4 -
python/tvm/meta_schedule/database/database.py | 18 +-
python/tvm/meta_schedule/integration.py | 250 ++++
python/tvm/meta_schedule/runner/runner.py | 5 +-
.../search_strategy/search_strategy.py | 27 +-
.../space_generator/space_generator.py | 10 +-
.../meta_schedule/task_scheduler/task_scheduler.py | 122 +-
.../testing}/__init__.py | 3 +
.../{testing.py => testing/local_rpc.py} | 2 +-
python/tvm/meta_schedule/testing/relay_workload.py | 88 ++
python/tvm/meta_schedule/utils.py | 40 +
python/tvm/micro/__init__.py | 7 +-
python/tvm/micro/model_library_format.py | 26 +-
python/tvm/micro/project.py | 11 +
python/tvm/micro/project_api/server.py | 15 +-
python/tvm/micro/session.py | 2 +-
.../tvm/relay/backend/contrib/ethosu/_ffi_api.py | 2 +-
python/tvm/relay/backend/contrib/ethosu/codegen.py | 6 +-
.../tvm/relay/backend/contrib/ethosu/legalize.py | 492 ++++++-
.../relay/backend/contrib/ethosu/op/__init__.py | 3 +
.../contrib/ethosu/op/binary_elementwise.py | 224 +++
.../relay/backend/contrib/ethosu/op/convolution.py | 13 +-
.../relay/backend/contrib/ethosu/op/depthwise.py | 16 +-
.../relay/backend/contrib/ethosu/op/identity.py | 98 ++
.../tvm/relay/backend/contrib/ethosu/op/pooling.py | 15 +-
.../ethosu/op/{pooling.py => unary_elementwise.py} | 105 +-
.../relay/backend/contrib/ethosu/te/__init__.py | 3 +
.../contrib/ethosu/te/binary_elementwise.py | 191 +++
.../relay/backend/contrib/ethosu/te/convolution.py | 8 +
.../relay/backend/contrib/ethosu/te/depthwise.py | 9 +-
python/tvm/relay/backend/contrib/ethosu/te/dma.py | 46 +-
.../relay/backend/contrib/ethosu/te/identity.py | 73 +
.../tvm/relay/backend/contrib/ethosu/te/pooling.py | 7 +
.../ethosu/te/{pooling.py => unary_elementwise.py} | 90 +-
.../tir/{pooling.py => binary_elementwise.py} | 75 +-
.../backend/contrib/ethosu/tir/convolution.py | 1 +
.../relay/backend/contrib/ethosu/tir/depthwise.py | 1 +
python/tvm/relay/backend/contrib/ethosu/tir/dma.py | 12 +-
.../relay/backend/contrib/ethosu/tir/identity.py | 155 ++
.../tvm/relay/backend/contrib/ethosu/tir/passes.py | 15 +-
.../relay/backend/contrib/ethosu/tir/pooling.py | 1 +
.../tvm/relay/backend/contrib/ethosu/tir/spec.py | 48 +
.../tir/{pooling.py => unary_elementwise.py} | 60 +-
.../backend/contrib/ethosu/tir_to_cs_translator.py | 152 +-
python/tvm/relay/backend/contrib/ethosu/util.py | 39 +-
.../tvm/relay/backend/contrib/ethosu/vela_api.py | 2 +-
python/tvm/relay/backend/executor.py | 9 +-
python/tvm/relay/backend/executor_factory.py | 49 +-
python/tvm/relay/backend/graph_executor_codegen.py | 6 +-
python/tvm/relay/backend/runtime.py | 10 +-
python/tvm/relay/backend/vm.py | 17 +
python/tvm/relay/build_module.py | 193 ++-
python/tvm/relay/frontend/caffe.py | 7 +-
python/tvm/relay/frontend/common.py | 20 +-
python/tvm/relay/frontend/keras.py | 28 +-
python/tvm/relay/frontend/mxnet.py | 46 +-
python/tvm/relay/frontend/onnx.py | 344 +++--
python/tvm/relay/frontend/paddlepaddle.py | 147 +-
python/tvm/relay/frontend/pytorch.py | 28 +-
python/tvm/relay/frontend/qnn_torch.py | 12 +-
python/tvm/relay/frontend/tensorflow_ops.py | 9 +-
python/tvm/relay/frontend/tflite.py | 47 +-
python/tvm/relay/op/annotation/annotation.py | 21 +-
python/tvm/relay/op/contrib/cmsisnn.py | 92 +-
python/tvm/relay/op/contrib/ethosn.py | 4 +-
python/tvm/relay/op/contrib/ethosu.py | 532 ++++++-
python/tvm/relay/op/dyn/image/_image.py | 6 +
python/tvm/relay/op/image/_image.py | 12 +
python/tvm/relay/op/image/image.py | 97 +-
python/tvm/relay/op/nn/nn.py | 2 +-
python/tvm/relay/op/random/_kernel.py | 2 +
python/tvm/relay/op/random/kernel.py | 48 +
python/tvm/relay/op/strategy/arm_cpu.py | 93 +-
python/tvm/relay/op/strategy/cuda.py | 4 +-
python/tvm/relay/op/strategy/generic.py | 38 +-
python/tvm/relay/op/strategy/x86.py | 18 +-
python/tvm/relay/op/tensor.py | 36 +-
python/tvm/relay/qnn/op/layout_conversions.py | 2 +-
python/tvm/relay/qnn/op/qnn.py | 8 +-
python/tvm/relay/testing/dcgan.py | 3 +-
python/tvm/relay/transform/transform.py | 33 +-
python/tvm/runtime/vm.py | 21 +-
python/tvm/script/context_maintainer.py | 10 +-
python/tvm/script/parser.py | 21 +-
python/tvm/script/tir/__init__.pyi | 373 +++++
python/tvm/script/tir/scope_handler.py | 1 +
python/tvm/script/tir/special_stmt.py | 37 +-
python/tvm/script/tir/ty.py | 11 +-
python/tvm/target/arm_isa.py | 24 +-
python/tvm/target/codegen.py | 2 +-
python/tvm/target/target.py | 36 +-
python/tvm/te/__init__.py | 2 +-
python/tvm/te/operation.py | 26 +-
python/tvm/te/schedule.py | 8 +
python/tvm/testing/plugin.py | 1 +
python/tvm/testing/utils.py | 16 +-
python/tvm/tir/__init__.py | 1 +
python/tvm/tir/function.py | 2 +-
python/tvm/tir/ir_builder.py | 1 +
python/tvm/tir/schedule/_type_checker.py | 193 +++
python/tvm/tir/schedule/schedule.py | 123 +-
python/tvm/tir/schedule/testing.py | 9 +-
python/tvm/tir/transform/transform.py | 23 +
.../contrib/ethosu/te => tir/usmp}/__init__.py | 8 +-
.../conv2d/__init__.py => tir/usmp/_ffi_api.py} | 6 +-
.../ethosu/te => tir/usmp/analysis}/__init__.py | 7 +-
.../__init__.py => tir/usmp/analysis/_ffi_api.py} | 5 +-
.../tvm/tir/usmp/analysis/analysis.py | 30 +-
python/tvm/tir/usmp/utils.py | 150 ++
python/tvm/topi/arm_cpu/__init__.py | 4 +-
.../tvm/topi/arm_cpu/conv1d.py | 36 +-
python/tvm/topi/arm_cpu/conv2d.py | 23 +-
python/tvm/topi/arm_cpu/cortex_m7/conv2d/direct.py | 186 ---
.../pylint.sh => python/tvm/topi/arm_cpu/dense.py | 10 +-
.../arm_cpu/{cortex_m7 => mprofile}/__init__.py | 5 +-
.../micro_kernel => mprofile/dsp}/__init__.py | 0
.../direct_simd.py => mprofile/dsp/conv1d.py} | 123 +-
.../direct_simd.py => mprofile/dsp/conv2d.py} | 30 +-
python/tvm/topi/arm_cpu/mprofile/dsp/dense.py | 52 +
.../dsp}/micro_kernel/__init__.py | 0
.../arm_cpu/mprofile/dsp/micro_kernel/avg_pool.py | 146 ++
.../arm_cpu/mprofile/dsp/micro_kernel/common.py | 17 +-
.../dsp}/micro_kernel/gemm.py | 91 +-
.../arm_cpu/mprofile/dsp/micro_kernel/max_pool.py | 165 +++
python/tvm/topi/arm_cpu/mprofile/dsp/pool.py | 125 ++
.../tvm/topi/arm_cpu/pooling.py | 10 +-
python/tvm/topi/generic/nn.py | 17 +
python/tvm/topi/image/resize.py | 181 ++-
python/tvm/topi/nn/conv2d_transpose.py | 209 ++-
python/tvm/topi/nn/upsampling.py | 2 +
python/tvm/topi/random/kernel.py | 58 +
python/tvm/topi/testing/conv2d_transpose_python.py | 40 +-
.../tests/test_nn/src/build_test_graph.py | 9 +-
.../tests/test_tvm_basic/src/build_test_lib.py | 4 +-
.../tests/test_wasm32/src/build_test_lib.py | 4 +-
rust/tvm-sys/build.rs | 3 +-
rust/tvm/tests/basics/src/tvm_add.py | 2 +-
src/arith/int_set.cc | 2 +
src/contrib/torch/pt_call_tvm/tvm_class.cc | 686 +++++++++
src/contrib/torch/utils.h | 264 ++++
src/driver/driver_api.cc | 29 +-
src/ir/module.cc | 31 +-
src/meta_schedule/integration.cc | 151 ++
src/meta_schedule/task_scheduler/round_robin.cc | 4 +-
src/meta_schedule/task_scheduler/task_scheduler.cc | 51 +-
src/node/serialization.cc | 34 +-
src/parser/parser.cc | 26 +-
src/printer/relay_text_printer.cc | 185 ++-
src/printer/text_printer.cc | 19 +-
src/printer/text_printer.h | 38 +-
src/printer/tir_text_printer.cc | 3 +
src/printer/tvmscript_printer.cc | 39 +-
src/relay/backend/aot_executor_codegen.cc | 351 +++--
src/relay/backend/build_module.cc | 217 +--
.../backend/contrib/cmsisnn/codegen_cmsisnn.cc | 51 -
.../backend/contrib/cmsisnn/extract_constants.cc | 168 +++
.../backend/contrib/cmsisnn/generate_constants.cc | 244 +++
src/relay/backend/contrib/cmsisnn/relay_to_tir.cc | 293 +++-
.../vm/vm.h => backend/contrib/cmsisnn/target.cc} | 28 +-
.../backend/contrib/cmsisnn/tir_to_runtime.cc | 242 ++-
src/relay/backend/contrib/ethosn/codegen.cc | 4 +-
src/relay/backend/contrib/ethosn/codegen_ethosn.h | 2 +-
src/relay/backend/contrib/ethosn/ethosn_api.cc | 4 +
src/relay/backend/contrib/ethosn/ethosn_api.h | 4 +
.../backend/contrib/ethosn/ethosn_api_version.h | 4 +
src/relay/backend/contrib/ethosu/compiler_attrs.cc | 6 +-
src/relay/backend/contrib/ethosu/preprocess.cc | 4 +-
src/relay/backend/contrib/ethosu/source_module.cc | 37 +-
.../contrib/example_target_hooks/relay_to_tir.cc | 12 +-
.../contrib/example_target_hooks/tir_to_runtime.cc | 2 +
src/relay/backend/executor.cc | 5 +-
src/relay/backend/graph_executor_codegen.cc | 118 +-
src/relay/backend/graph_plan_memory.cc | 103 +-
src/relay/backend/interpreter.cc | 218 +--
src/relay/backend/runtime.cc | 4 +-
src/relay/backend/te_compiler.cc | 385 ++---
src/relay/backend/te_compiler.h | 26 +-
src/relay/backend/te_compiler_cache.cc | 55 +-
src/relay/backend/te_compiler_cache.h | 11 +-
src/relay/backend/utils.cc | 76 +-
src/relay/backend/utils.h | 30 +-
src/relay/backend/vm/compiler.cc | 275 ++--
src/relay/backend/vm/compiler.h | 29 +-
src/relay/backend/vm/lambda_lift.cc | 9 +-
src/relay/ir/adt.cc | 46 +
src/relay/ir/expr.cc | 220 ++-
src/relay/ir/expr_functor.cc | 183 +--
src/relay/ir/function.cc | 51 +
src/relay/op/annotation/annotation.cc | 152 --
src/relay/op/annotation/annotation.h | 106 --
src/relay/op/call/call.cc | 125 ++
src/relay/op/call/call.h | 78 +
src/relay/op/contrib/ethosu/binary_elementwise.cc | 310 ++++
src/relay/op/contrib/ethosu/common.cc | 17 +
src/relay/op/contrib/ethosu/common.h | 10 +
src/relay/op/contrib/ethosu/convolution.cc | 41 +-
src/relay/op/contrib/ethosu/depthwise.cc | 46 +-
src/relay/op/contrib/ethosu/identity.cc | 128 ++
src/relay/op/contrib/ethosu/pooling.cc | 15 +-
.../ethosu/{pooling.cc => unary_elementwise.cc} | 124 +-
src/relay/op/dyn/image/resize.cc | 16 +-
src/relay/op/image/resize.cc | 33 +-
src/relay/op/make_op.h | 7 +-
src/relay/op/memory/device_copy.cc | 55 +-
src/relay/op/memory/device_copy.h | 48 +-
src/relay/op/memory/memory.cc | 21 +-
src/relay/op/memory/memory.h | 6 +-
src/relay/op/memory/on_device.cc | 167 +++
src/relay/op/memory/on_device.h | 144 ++
src/relay/op/nn/convolution.h | 25 +-
src/relay/op/nn/nn.cc | 12 +
src/relay/op/random/kernel.cc | 47 +
src/relay/op/vm/vm.cc | 19 +-
src/relay/op/vm/vm.h | 2 +-
src/relay/qnn/op/quantize.cc | 8 +-
src/relay/transforms/annotate_target.cc | 18 +-
src/relay/transforms/dead_code.cc | 614 ++++++--
src/relay/transforms/device_aware_visitors.cc | 98 +-
src/relay/transforms/device_aware_visitors.h | 81 +-
src/relay/transforms/device_domains.cc | 370 +++--
src/relay/transforms/device_domains.h | 229 +--
src/relay/transforms/device_planner.cc | 446 +++---
src/relay/transforms/dynamic_to_static.cc | 26 +-
src/relay/transforms/first_order_gradient.cc | 12 +-
src/relay/transforms/fold_constant.cc | 52 +-
src/relay/transforms/forward_rewrite.cc | 19 +-
src/relay/transforms/fuse_ops.cc | 12 +-
src/relay/transforms/memory_alloc.cc | 141 +-
src/relay/transforms/partial_eval.cc | 2 +
src/relay/transforms/partition_graph.cc | 15 +-
src/relay/transforms/pass_utils.h | 1 +
src/relay/transforms/pattern_utils.h | 17 +
src/relay/transforms/split_args.cc | 18 +-
src/relay/transforms/to_a_normal_form.cc | 31 +-
src/relay/transforms/to_cps.cc | 9 +-
src/relay/transforms/transform_layout.h | 11 +-
src/runtime/contrib/ethosn/ethosn_device.cc | 2 +-
src/runtime/contrib/ethosn/ethosn_device.h | 2 +-
src/runtime/contrib/ethosn/ethosn_runtime.cc | 2 +-
.../ethosu/bare_metal/tvm_ethosu_runtime.c} | 47 +-
.../ethosu/bare_metal/tvm_ethosu_runtime.h} | 32 +-
src/runtime/crt/common/crt_runtime_api.c | 13 +-
src/runtime/crt/host/microtvm_api_server.py | 5 +-
src/runtime/meta_data.h | 12 +-
src/runtime/vm/bytecode.cc | 33 +-
src/runtime/vm/executable.cc | 97 +-
src/runtime/vm/profiler/vm.cc | 14 +-
src/runtime/vm/serialize_utils.h | 12 +-
src/runtime/vm/vm.cc | 115 +-
src/target/compilation_config.cc | 96 +-
src/target/llvm/llvm_module.cc | 21 +-
src/target/llvm/llvm_module.h | 3 +-
src/target/metadata_module.cc | 23 +-
src/target/metadata_module.h | 18 +-
src/target/opt/build_cuda_on.cc | 4 +
src/target/se_scope.cc | 10 +-
src/target/source/codegen_c_host.cc | 20 +-
src/target/source/codegen_c_host.h | 9 +-
src/target/source/codegen_source_base.h | 23 -
src/target/source/interface_c.cc | 54 +-
src/target/source/source_module.cc | 57 +-
src/target/source/source_module.h | 14 +-
src/target/target.cc | 43 +
src/target/target_kind.cc | 32 +-
src/te/operation/compute_op.cc | 3 +-
src/te/operation/create_primfunc.cc | 38 +-
src/te/schedule/schedule_lang.cc | 9 +
src/te/schedule/schedule_ops.cc | 4 +
src/te/schedule/schedule_postproc_to_primfunc.cc | 3 +-
src/tir/analysis/block_access_region_detector.cc | 34 +
src/tir/schedule/analysis.h | 50 +-
src/tir/schedule/analysis/analysis.cc | 253 +++-
src/tir/schedule/concrete_schedule.cc | 42 +
src/tir/schedule/concrete_schedule.h | 34 +-
src/tir/schedule/error.cc | 2 +-
src/tir/schedule/primitive.h | 62 +-
src/tir/schedule/primitive/block_annotate.cc | 1 -
src/tir/schedule/primitive/compute_inline.cc | 6 +-
src/tir/schedule/primitive/get_block_loop.cc | 132 ++
src/tir/schedule/primitive/reduction.cc | 144 +-
src/tir/schedule/primitive/sampling.cc | 315 +++-
src/tir/schedule/schedule.cc | 18 +
src/tir/schedule/traced_schedule.cc | 60 +
src/tir/schedule/traced_schedule.h | 15 +-
src/tir/schedule/utils.h | 42 +-
src/tir/transforms/compact_buffer_region.cc | 234 +--
src/tir/transforms/inject_rolling_buffer.cc | 317 ++++
src/tir/transforms/ir_utils.cc | 84 ++
src/tir/transforms/ir_utils.h | 39 +
src/tir/transforms/lower_cross_thread_reduction.cc | 645 ++++++++
src/tir/transforms/lower_tvm_builtin.cc | 17 +-
src/tir/transforms/lower_warp_memory.cc | 1 +
src/tir/transforms/make_packed_api.cc | 27 +-
src/tir/transforms/split_host_device.cc | 1 +
src/tir/usmp/analysis/extract_buffer_info.cc | 446 ++++++
src/tir/usmp/utils.cc | 146 ++
tests/cpp/relay/transforms/device_domains_test.cc | 22 +-
tests/cpp/relay_build_module_test.cc | 4 +-
tests/cpp/relay_dismantler_test.cc | 19 +
tests/cpp/runtime_test.cc | 4 +-
tests/cpp/target/compilation_config_test.cc | 66 +-
tests/cpp/target/source/interface_c_test.cc | 129 +-
tests/lint/pylint.sh | 1 +
tests/micro/arduino/conftest.py | 11 +-
tests/micro/arduino/test_arduino_rpc_server.py | 10 +-
tests/micro/zephyr/test_zephyr.py | 25 +-
tests/micro/zephyr/test_zephyr_aot.py | 27 +-
tests/micro/zephyr/test_zephyr_armv7m.py | 31 +-
tests/python/conftest.py | 22 +-
tests/python/contrib/test_bnns/infrastructure.py | 2 +-
.../contrib/test_bnns/test_onnx_topologies.py | 2 +-
.../python/contrib/test_cmsisnn/test_binary_ops.py | 3 +-
tests/python/contrib/test_cmsisnn/test_conv2d.py | 316 ++++
.../contrib/test_cmsisnn/test_extract_constants.py | 179 +++
.../test_cmsisnn/test_generate_constants.py | 229 +++
tests/python/contrib/test_cmsisnn/test_networks.py | 12 +-
tests/python/contrib/test_cmsisnn/test_softmax.py | 8 +-
tests/python/contrib/test_cmsisnn/utils.py | 127 +-
tests/python/contrib/test_ethosn/__init__.py | 2 +-
tests/python/contrib/test_ethosn/infrastructure.py | 18 +-
tests/python/contrib/test_ethosn/test_addition.py | 2 +-
.../python/contrib/test_ethosn/test_concatenate.py | 2 +-
.../test_ethosn/test_constant_duplication.py | 2 +-
tests/python/contrib/test_ethosn/test_conv2d.py | 2 +-
.../contrib/test_ethosn/test_depth_to_space.py | 2 +-
.../contrib/test_ethosn/test_fullyconnected.py | 2 +-
tests/python/contrib/test_ethosn/test_networks.py | 18 +-
.../contrib/test_ethosn/test_partition_params.py | 3 +-
tests/python/contrib/test_ethosn/test_pooling.py | 2 +-
tests/python/contrib/test_ethosn/test_relu.py | 2 +-
tests/python/contrib/test_ethosn/test_reshape.py | 2 +-
tests/python/contrib/test_ethosn/test_sigmoid.py | 2 +-
tests/python/contrib/test_ethosn/test_split.py | 2 +-
.../python/contrib/test_ethosn/test_topologies.py | 3 +-
tests/python/contrib/test_ethosu/infra.py | 162 +-
.../contrib/test_ethosu/test_attr_passing.py | 6 +-
tests/python/contrib/test_ethosu/test_codegen.py | 636 +++++++-
.../contrib/test_ethosu/test_encode_constants.py | 69 +-
tests/python/contrib/test_ethosu/test_legalize.py | 481 +++++-
.../contrib/test_ethosu/test_legalize_no_ops.py | 107 ++
.../python/contrib/test_ethosu/test_preprocess.py | 14 +-
.../test_ethosu/test_replace_binary_elementwise.py | 342 +++++
.../contrib/test_ethosu/test_replace_conv2d.py | 129 +-
.../contrib/test_ethosu/test_replace_copy.py | 6 +-
.../test_ethosu/test_replace_depthwise_conv2d.py | 49 +-
.../contrib/test_ethosu/test_replace_identity.py | 115 ++
.../contrib/test_ethosu/test_replace_pooling.py | 182 ++-
...ooling.py => test_replace_unary_elementwise.py} | 103 +-
.../test_ethosu/test_tir_to_cs_translator.py | 482 +++++-
.../contrib/test_ethosu/test_type_inference.py | 260 +++-
tests/python/contrib/test_ethosu/test_vela_api.py | 2 +
tests/python/contrib/test_hexagon/README.md | 486 +-----
tests/python/contrib/test_hexagon/conftest.py | 11 -
.../python/contrib/test_hexagon/infrastructure.py | 157 +-
.../{README.md => test_conv2d_blocked.md} | 97 +-
.../contrib/test_hexagon/test_conv2d_blocked.py | 500 +------
.../contrib/test_hexagon/test_conv2d_conv2d.md | 986 +++++++++++++
.../contrib/test_hexagon/test_conv2d_conv2d.py | 241 +++
.../contrib/test_hexagon/test_maxpool2d_blocked.py | 10 +-
tests/python/contrib/test_onnx.py | 1 +
.../contrib/test_vitis_ai/test_vitis_ai_codegen.py | 25 +-
tests/python/driver/tvmc/conftest.py | 17 +
tests/python/driver/tvmc/test_compiler.py | 14 +-
tests/python/driver/tvmc/test_frontends.py | 16 +-
tests/python/driver/tvmc/test_mlf.py | 15 +-
tests/python/driver/tvmc/test_registry_options.py | 81 +
tests/python/driver/tvmc/test_target.py | 19 +-
tests/python/driver/tvmc/test_target_options.py | 10 +
tests/python/frontend/caffe/test_forward.py | 3 +-
tests/python/frontend/onnx/test_forward.py | 257 +++-
tests/python/frontend/paddlepaddle/test_forward.py | 89 ++
tests/python/frontend/tensorflow2/common.py | 6 +-
tests/python/frontend/tflite/test_forward.py | 102 +-
tests/python/integration/test_arm_mprofile_dsp.py | 355 +++++
tests/python/integration/test_ewise.py | 4 +-
tests/python/relay/aot/aot_test_utils.py | 164 ++-
tests/python/relay/aot/corstone300.ld | 18 +-
tests/python/relay/aot/corstone300.mk | 26 +-
tests/python/relay/aot/test_c_device_api.py | 255 ++++
tests/python/relay/aot/test_crt_aot.py | 46 +-
tests/python/relay/dyn/test_dynamic_op_level5.py | 2 +-
.../python/relay/op/annotation/test_annotation.py | 27 +-
tests/python/relay/op/test_tensor.py | 52 +
tests/python/relay/test_any.py | 2 +-
tests/python/relay/test_build_module.py | 62 +
tests/python/relay/test_executor.py | 6 +-
tests/python/relay/test_ir_nodes.py | 12 +
tests/python/relay/test_ir_text_printer.py | 2 +-
tests/python/relay/test_op_level10.py | 22 +-
tests/python/relay/test_op_level2.py | 60 +-
tests/python/relay/test_op_level5.py | 12 +-
tests/python/relay/test_op_qnn_conv2_transpose.py | 53 +-
tests/python/relay/test_pass_alter_op_layout.py | 12 +-
tests/python/relay/test_pass_convert_op_layout.py | 16 +-
.../relay/test_pass_dead_code_elimination.py | 181 ++-
tests/python/relay/test_pass_dynamic_to_static.py | 2 +-
tests/python/relay/test_pass_lazy_gradient_init.py | 16 +-
tests/python/relay/test_pass_partial_eval.py | 21 +-
tests/python/relay/test_pass_partition_graph.py | 71 +-
tests/python/relay/test_pass_plan_devices.py | 736 ++++++---
tests/python/relay/test_pass_to_cps.py | 13 +-
tests/python/relay/test_runtime.py | 18 +-
tests/python/relay/test_vm.py | 57 +-
.../python/test_topi_group_conv2d_transpose.py | 156 ++
tests/python/topi/python/test_topi_image.py | 2 +
.../python/unittest/test_auto_scheduler_measure.py | 17 +-
.../unittest/test_auto_scheduler_search_task.py | 4 +-
tests/python/unittest/test_crt.py | 18 +-
tests/python/unittest/test_link_params.py | 32 +-
.../unittest/test_meta_schedule_integration.py | 120 ++
.../unittest/test_meta_schedule_space_generator.py | 8 +-
.../unittest/test_meta_schedule_task_scheduler.py | 75 +-
.../unittest/test_micro_model_library_format.py | 58 +-
tests/python/unittest/test_micro_project_api.py | 165 ++-
tests/python/unittest/test_micro_transport.py | 282 ++--
.../python/unittest/test_runtime_module_export.py | 4 +-
tests/python/unittest/test_runtime_module_load.py | 12 +-
tests/python/unittest/test_runtime_profiling.py | 22 +-
tests/python/unittest/test_runtime_rpc.py | 5 +-
tests/python/unittest/test_runtime_vm_profiler.py | 20 +-
.../python/unittest/test_target_codegen_hexagon.py | 2 +-
tests/python/unittest/test_target_codegen_llvm.py | 11 +-
tests/python/unittest/test_target_target.py | 18 +-
.../test_tir_analysis_get_block_access_region.py | 47 +
.../unittest/test_tir_schedule_compute_inline.py | 65 +
.../python/unittest/test_tir_schedule_reduction.py | 42 +
tests/python/unittest/test_tir_schedule_rfactor.py | 48 +
.../python/unittest/test_tir_schedule_sampling.py | 43 +-
.../python/unittest/test_tir_schedule_utilities.py | 59 +-
.../test_tir_transform_compact_buffer_region.py | 136 ++
.../test_tir_transform_convert_blocks_to_opaque.py | 12 +-
.../test_tir_transform_inject_rolling_buffer.py | 265 ++++
...t_tir_transform_lower_cross_thread_reduction.py | 737 ++++++++++
.../test_tir_transform_lower_warp_memory.py | 32 +-
.../unittest/test_tir_transform_make_packed_api.py | 101 +-
.../test_tir_transform_split_host_device.py | 52 +
.../test_tir_usmp_analysis_extract_bufferinfo.py | 1555 ++++++++++++++++++++
tests/python/unittest/test_tir_usmp_utils.py | 203 +++
.../python/unittest/test_tvmscript_error_report.py | 52 +-
tests/python/unittest/test_tvmscript_roundtrip.py | 29 +
tests/python/unittest/test_tvmscript_type.py | 182 +++
tests/scripts/task_mypy.sh | 4 +
tests/scripts/task_python_integration.sh | 5 +
tests/scripts/task_python_integration_gpuonly.sh | 1 +
version.py | 57 +-
vta/scripts/tune_conv2d_transpose.py | 3 +-
vta/scripts/tune_resnet.py | 11 +-
.../python/integration/test_benchmark_gemm.py | 7 +-
.../integration/test_benchmark_topi_conv2d.py | 10 +-
.../integration/test_benchmark_topi_dense.py | 10 +-
.../test_benchmark_topi_group_conv2d.py | 10 +-
vta/tests/python/unittest/test_vta_insn.py | 16 +-
vta/tutorials/autotvm/tune_alu_vta.py | 3 +-
vta/tutorials/frontend/deploy_classification.py | 4 +-
vta/tutorials/frontend/deploy_detection.py | 4 +-
vta/tutorials/matrix_multiply.py | 4 +-
vta/tutorials/optimize/convolution_opt.py | 4 +-
vta/tutorials/optimize/matrix_multiply_opt.py | 4 +-
vta/tutorials/vta_get_started.py | 4 +-
web/package.json | 2 +-
web/tests/python/prepare_test_libs.py | 6 +-
web/tests/python/webgpu_rpc_test.py | 7 +-
web/tests/python/websock_rpc_test.py | 6 +-
594 files changed, 32982 insertions(+), 7400 deletions(-)
copy src/target/llvm/llvm_module.h =>
apps/microtvm/ethosu/include/tvm_ethosu_runtime.h (53%)
copy src/relay/op/memory/memory.h =>
apps/microtvm/ethosu/src/tvm_ethosu_runtime.c (51%)
copy python/tvm/autotvm/env.py => apps/pt_tvmdsoop/CMakeLists.txt (57%)
copy docker/install/ubuntu_install_python.sh =>
apps/pt_tvmdsoop/prepare_and_test_pt_tvm_class.sh (50%)
create mode 100644 apps/pt_tvmdsoop/tests/test_torch_compile_cpu.py
create mode 100644 apps/pt_tvmdsoop/tests/test_torch_compile_gpu.py
create mode 100644 apps/pt_tvmdsoop/tests/test_torch_graph_module.py
create mode 100644 apps/pt_tvmdsoop/tests/test_torch_script.py
create mode 100644 apps/pt_tvmdsoop/tests/test_torch_vm_module.py
create mode 100644 apps/pt_tvmdsoop/tests/test_trace_tvm_module.py
create mode 100644 cmake/modules/contrib/PT_TVMDSOOP.cmake
create mode 100644 include/tvm/meta_schedule/integration.h
copy src/relay/op/vm/vm.h => include/tvm/relay/attrs/call.h (57%)
create mode 100644 include/tvm/relay/attrs/on_device.h
create mode 100644 include/tvm/tir/usmp/utils.h
create mode 100644 python/tvm/contrib/torch/__init__.py
create mode 100644 python/tvm/contrib/torch/module.py
create mode 100644 python/tvm/contrib/torch/pytorch_tvm.py
create mode 100644 python/tvm/driver/tvmc/fmtopt.py
create mode 100644 python/tvm/driver/tvmc/micro.py
create mode 100644 python/tvm/driver/tvmc/registry.py
create mode 100644 python/tvm/meta_schedule/integration.py
copy python/tvm/{topi/arm_cpu/cortex_m7/micro_kernel =>
meta_schedule/testing}/__init__.py (87%)
rename python/tvm/meta_schedule/{testing.py => testing/local_rpc.py} (97%)
create mode 100644 python/tvm/meta_schedule/testing/relay_workload.py
create mode 100644 python/tvm/relay/backend/contrib/ethosu/op/binary_elementwise.py
create mode 100644 python/tvm/relay/backend/contrib/ethosu/op/identity.py
copy python/tvm/relay/backend/contrib/ethosu/op/{pooling.py =>
unary_elementwise.py} (59%)
create mode 100644 python/tvm/relay/backend/contrib/ethosu/te/binary_elementwise.py
create mode 100644 python/tvm/relay/backend/contrib/ethosu/te/identity.py
copy python/tvm/relay/backend/contrib/ethosu/te/{pooling.py =>
unary_elementwise.py} (56%)
copy python/tvm/relay/backend/contrib/ethosu/tir/{pooling.py =>
binary_elementwise.py} (56%)
create mode 100644 python/tvm/relay/backend/contrib/ethosu/tir/identity.py
copy python/tvm/relay/backend/contrib/ethosu/tir/{pooling.py =>
unary_elementwise.py} (58%)
create mode 100644 python/tvm/script/tir/__init__.pyi
create mode 100644 python/tvm/tir/schedule/_type_checker.py
copy python/tvm/{relay/backend/contrib/ethosu/te => tir/usmp}/__init__.py (83%)
rename python/tvm/{topi/arm_cpu/cortex_m7/conv2d/__init__.py =>
tir/usmp/_ffi_api.py} (89%)
copy python/tvm/{relay/backend/contrib/ethosu/te =>
tir/usmp/analysis}/__init__.py (84%)
copy python/tvm/{topi/arm_cpu/cortex_m7/__init__.py =>
tir/usmp/analysis/_ffi_api.py} (88%)
copy docker/install/ubuntu1804_install_python_venv.sh =>
python/tvm/tir/usmp/analysis/analysis.py (55%)
mode change 100755 => 100644
create mode 100644 python/tvm/tir/usmp/utils.py
copy jvm/core/src/test/scripts/test_add_cpu.py =>
python/tvm/topi/arm_cpu/conv1d.py (52%)
delete mode 100644 python/tvm/topi/arm_cpu/cortex_m7/conv2d/direct.py
copy tests/lint/pylint.sh => python/tvm/topi/arm_cpu/dense.py (72%)
mode change 100755 => 100644
rename python/tvm/topi/arm_cpu/{cortex_m7 => mprofile}/__init__.py (92%)
copy python/tvm/topi/arm_cpu/{cortex_m7/micro_kernel =>
mprofile/dsp}/__init__.py (100%)
copy python/tvm/topi/arm_cpu/{cortex_m7/conv2d/direct_simd.py =>
mprofile/dsp/conv1d.py} (54%)
rename python/tvm/topi/arm_cpu/{cortex_m7/conv2d/direct_simd.py =>
mprofile/dsp/conv2d.py} (88%)
create mode 100644 python/tvm/topi/arm_cpu/mprofile/dsp/dense.py
rename python/tvm/topi/arm_cpu/{cortex_m7 =>
mprofile/dsp}/micro_kernel/__init__.py (100%)
create mode 100644 python/tvm/topi/arm_cpu/mprofile/dsp/micro_kernel/avg_pool.py
copy tests/lint/pylint.sh =>
python/tvm/topi/arm_cpu/mprofile/dsp/micro_kernel/common.py (72%)
mode change 100755 => 100644
rename python/tvm/topi/arm_cpu/{cortex_m7 =>
mprofile/dsp}/micro_kernel/gemm.py (89%)
create mode 100644 python/tvm/topi/arm_cpu/mprofile/dsp/micro_kernel/max_pool.py
create mode 100644 python/tvm/topi/arm_cpu/mprofile/dsp/pool.py
copy tests/lint/pylint.sh => python/tvm/topi/arm_cpu/pooling.py (74%)
mode change 100755 => 100644
create mode 100644 src/contrib/torch/pt_call_tvm/tvm_class.cc
create mode 100644 src/contrib/torch/utils.h
create mode 100644 src/meta_schedule/integration.cc
delete mode 100644 src/relay/backend/contrib/cmsisnn/codegen_cmsisnn.cc
create mode 100644 src/relay/backend/contrib/cmsisnn/extract_constants.cc
create mode 100644 src/relay/backend/contrib/cmsisnn/generate_constants.cc
copy src/relay/{op/vm/vm.h => backend/contrib/cmsisnn/target.cc} (67%)
create mode 100644 src/relay/op/call/call.cc
create mode 100644 src/relay/op/call/call.h
create mode 100644 src/relay/op/contrib/ethosu/binary_elementwise.cc
create mode 100644 src/relay/op/contrib/ethosu/identity.cc
copy src/relay/op/contrib/ethosu/{pooling.cc => unary_elementwise.cc} (52%)
create mode 100644 src/relay/op/memory/on_device.cc
create mode 100644 src/relay/op/memory/on_device.h
copy src/{relay/op/memory/memory.h =>
runtime/contrib/ethosu/bare_metal/tvm_ethosu_runtime.c} (51%)
copy src/{target/llvm/llvm_module.h =>
runtime/contrib/ethosu/bare_metal/tvm_ethosu_runtime.h} (52%)
create mode 100644 src/tir/transforms/inject_rolling_buffer.cc
create mode 100644 src/tir/transforms/lower_cross_thread_reduction.cc
create mode 100644 src/tir/usmp/analysis/extract_buffer_info.cc
create mode 100644 src/tir/usmp/utils.cc
create mode 100644 tests/python/contrib/test_cmsisnn/test_conv2d.py
create mode 100644 tests/python/contrib/test_cmsisnn/test_extract_constants.py
create mode 100644 tests/python/contrib/test_cmsisnn/test_generate_constants.py
create mode 100644 tests/python/contrib/test_ethosu/test_legalize_no_ops.py
create mode 100644 tests/python/contrib/test_ethosu/test_replace_binary_elementwise.py
create mode 100644 tests/python/contrib/test_ethosu/test_replace_identity.py
copy tests/python/contrib/test_ethosu/{test_replace_pooling.py =>
test_replace_unary_elementwise.py} (59%)
copy tests/python/contrib/test_hexagon/{README.md => test_conv2d_blocked.md} (88%)
create mode 100644 tests/python/contrib/test_hexagon/test_conv2d_conv2d.md
create mode 100644 tests/python/contrib/test_hexagon/test_conv2d_conv2d.py
create mode 100644 tests/python/driver/tvmc/test_registry_options.py
create mode 100644 tests/python/integration/test_arm_mprofile_dsp.py
create mode 100644 tests/python/relay/aot/test_c_device_api.py
create mode 100644 tests/python/relay/op/test_tensor.py
create mode 100644 tests/python/relay/test_build_module.py
create mode 100644 tests/python/topi/python/test_topi_group_conv2d_transpose.py
create mode 100644 tests/python/unittest/test_meta_schedule_integration.py
create mode 100644 tests/python/unittest/test_tir_transform_inject_rolling_buffer.py
create mode 100644 tests/python/unittest/test_tir_transform_lower_cross_thread_reduction.py
create mode 100644 tests/python/unittest/test_tir_transform_split_host_device.py
create mode 100644 tests/python/unittest/test_tir_usmp_analysis_extract_bufferinfo.py
create mode 100644 tests/python/unittest/test_tir_usmp_utils.py
create mode 100644 tests/python/unittest/test_tvmscript_type.py