This is an automated email from the ASF dual-hosted git repository.

github-bot pushed a change to branch nightly
in repository https://gitbox.apache.org/repos/asf/tvm.git


    from 84d05e9a24 [LLVM][Codegen] Cast NaN to bool gives true (#18772)
     add 82b01c9486 [REFACTOR][S-TIR] More migrations to s-tir (#18776)
     add 2a448ce4bb [CI] Update Pillow, pytest-rerunfailures, junitparser, xgboost, onnx and pytorch (#18777)
     add f8dbbdaf5c [REFACTOR] Phase out dmlc dep (#18779)

No new revisions were added by this update.

Summary of changes:
 3rdparty/nvbench/l2_cache_flush.h                  |   2 +-
 CMakeLists.txt                                     |  16 +-
 Makefile                                           |   5 +-
 apps/android_rpc/app/src/main/jni/Android.mk       |   1 -
 apps/android_rpc/app/src/main/jni/tvm_runtime.h    |   1 -
 apps/cpp_rpc/CMakeLists.txt                        |   1 -
 apps/cpp_rpc/main.cc                               |   3 -
 apps/cpp_rpc/rpc_env.cc                            |   2 +-
 apps/cpp_rpc/rpc_server.cc                         |   2 -
 apps/hexagon_launcher/cmake/HexagonLauncher.cmake  |   1 -
 apps/hexagon_launcher/cmake/android/CMakeLists.txt |   1 -
 apps/hexagon_launcher/cmake/hexagon/CMakeLists.txt |   2 -
 apps/hexagon_launcher/launcher_core.cc             |  88 ++--
 apps/hexagon_launcher/launcher_core.h              |  10 +-
 apps/ios_rpc/tvmrpc.xcodeproj/project.pbxproj      |   4 -
 cmake/modules/CUDA.cmake                           |   1 -
 cmake/modules/LLVM.cmake                           |   4 +-
 cmake/modules/LibInfo.cmake                        |   1 -
 cmake/modules/contrib/CUTLASS.cmake                |   2 -
 cmake/modules/contrib/MSCCLPP.cmake                |   1 -
 docker/install/ubuntu_install_onnx.sh              |  65 +--
 docker/install/ubuntu_install_python_package.sh    |   6 +-
 docker/install/ubuntu_install_redis.sh             |   2 +-
 docs/Doxyfile                                      |   2 +-
 include/tvm/ir/attrs.h                             |   1 -
 include/tvm/ir/op.h                                |   2 +-
 include/tvm/runtime/disco/session.h                |   2 +
 include/tvm/runtime/logging.h                      |  20 +-
 include/tvm/runtime/module.h                       |   2 +-
 include/tvm/runtime/serializer.h                   |  49 +-
 include/tvm/runtime/tensor.h                       |  29 +-
 include/tvm/runtime/vm/executable.h                |  39 +-
 include/tvm/s_tir/analysis.h                       | 121 +++++
 .../tvm/{tir => s_tir}/backend/adreno/transform.h  |  23 +-
 include/tvm/s_tir/schedule/instruction.h           |   2 +-
 include/tvm/s_tir/transform.h                      |  41 ++
 include/tvm/support/io.h                           | 129 +++++
 include/tvm/support/serializer.h                   | 232 +++++++++
 include/tvm/support/with.h                         |   4 +-
 include/tvm/target/tag.h                           |   2 +-
 include/tvm/target/target_info.h                   |  77 ---
 include/tvm/target/target_kind.h                   |   2 +-
 include/tvm/tir/analysis.h                         | 145 ------
 include/tvm/tir/builtin.h                          |  13 -
 include/tvm/tir/stmt_functor.h                     |   9 -
 include/tvm/tir/transform.h                        | 163 -------
 python/tvm/contrib/hexagon/meta_schedule.py        |   2 +-
 python/tvm/contrib/hexagon/tools.py                |   2 -
 python/tvm/contrib/msc/core/runtime/runner.py      |   2 +-
 .../contrib/msc/framework/tvm/runtime/runner.py    |   4 +-
 python/tvm/libinfo.py                              |   5 -
 python/tvm/relax/frontend/nn/extern.py             |   7 -
 python/tvm/s_tir/__init__.py                       |  19 +
 python/tvm/s_tir/analysis/__init__.py              |  96 +++-
 python/tvm/s_tir/backend/adreno/__init__.py        |   1 +
 python/tvm/s_tir/backend/adreno/pipeline.py        |   4 +-
 .../backend/adreno/transform/__init__.py           |   0
 .../backend/adreno/transform/_ffi_api.py}          |   5 +-
 .../backend/adreno/transform/transform.py          |   0
 .../s_tir/meta_schedule/builder/local_builder.py   |   2 +-
 python/tvm/s_tir/pipeline.py                       |   2 -
 python/tvm/s_tir/transform/transform.py            |  60 +++
 python/tvm/tir/analysis/analysis.py                | 100 +---
 python/tvm/tir/backend/adreno/__init__.py          |   2 -
 .../tvm/tir/backend/adreno/transform/_ffi_api.py   |  21 -
 python/tvm/tir/pipeline.py                         |   3 -
 python/tvm/tir/stmt_functor.py                     |  19 -
 python/tvm/tir/transform/transform.py              | 349 +------------
 src/arith/solve_linear_equation.cc                 |   2 +
 src/contrib/msc/core/codegen/base_codegen.h        |   7 +-
 src/contrib/msc/core/codegen/codegen_json.cc       |   2 +-
 src/contrib/msc/core/codegen/codegen_json.h        |  25 +-
 src/contrib/msc/core/codegen/codegen_utils.h       |  60 ++-
 src/contrib/msc/core/codegen/cpp_codegen.h         |   1 -
 src/contrib/msc/core/codegen/py_codegen.h          |   1 -
 src/contrib/msc/core/ir/graph.cc                   |  48 +-
 src/contrib/msc/core/ir/graph.h                    | 537 ++++++++++++++-------
 src/contrib/msc/core/ir/graph_builder.h            |  88 ++--
 src/contrib/msc/core/ir/plugin.cc                  |  22 +-
 src/contrib/msc/core/ir/plugin.h                   | 326 ++++++++-----
 src/contrib/msc/core/printer/msc_base_printer.h    |  34 +-
 src/contrib/msc/core/transform/set_expr_name.cc    |   2 +
 .../msc/framework/tensorflow/codegen_utils.h       |   8 +-
 src/contrib/msc/framework/tensorflow/config.h      |  13 +-
 src/contrib/msc/framework/tensorrt/codegen_utils.h |  66 +--
 .../msc/framework/tensorrt/transform_tensorrt.cc   |  28 +-
 src/contrib/msc/framework/torch/codegen_utils.h    |   8 +-
 src/contrib/msc/framework/torch/config.h           |  13 +-
 src/contrib/msc/framework/tvm/codegen_utils.h      |  18 +-
 src/contrib/msc/framework/tvm/config.h             |  18 +-
 src/contrib/msc/plugin/base_codegen.h              |   7 +-
 src/contrib/msc/plugin/codegen_utils.h             |  81 +++-
 src/contrib/msc/plugin/tensorrt_codegen.h          |  13 +-
 src/contrib/msc/plugin/torch_codegen.h             |  18 +-
 src/contrib/msc/plugin/tvm_codegen.cc              |   1 -
 src/contrib/msc/plugin/tvm_codegen.h               |  18 +-
 src/ir/instrument.cc                               |  17 +-
 src/ir/transform.cc                                |  12 +-
 src/node/structural_hash.cc                        |  11 +-
 src/relax/analysis/var2value.cc                    |   2 +
 src/relax/backend/contrib/clml/codegen.cc          |  10 +-
 .../backend/contrib/codegen_json/codegen_json.h    |  52 +-
 src/relax/backend/contrib/cublas/codegen.cc        |   2 +-
 src/relax/backend/contrib/cudnn/codegen.cc         |   4 +-
 src/relax/backend/contrib/nnapi/codegen.cc         |  20 +-
 src/relax/backend/contrib/tensorrt/codegen.cc      |   2 +-
 src/relax/backend/vm/exec_builder.cc               |   1 +
 .../transform/lower_global_view_to_local_view.cc   |   3 +-
 src/relax/ir/transform.cc                          |   1 -
 .../transform/attach_attr_layout_free_buffers.cc   |   3 +-
 src/relax/transform/compute_prim_value.cc          |   3 +-
 src/relax/transform/fuse_tir.cc                    |   5 +-
 src/relax/transform/split_call_tir_by_pattern.cc   |   5 +-
 .../transform/split_layout_rewrite_preproc.cc      |   5 +-
 src/runtime/const_loader_module.cc                 |  38 +-
 src/runtime/contrib/clml/clml_runtime.cc           |  50 +-
 src/runtime/contrib/coreml/coreml_runtime.mm       |  23 +-
 src/runtime/contrib/cublas/cublas_utils.cc         |  11 +-
 src/runtime/contrib/cudnn/cudnn_json_runtime.cc    |   1 +
 src/runtime/contrib/cudnn/cudnn_utils.cc           |   6 +-
 src/runtime/contrib/hipblas/hipblas_utils.cc       |  11 +-
 src/runtime/contrib/json/json_node.h               | 292 +++++------
 src/runtime/contrib/json/json_runtime.h            |  72 ++-
 src/runtime/contrib/miopen/miopen_utils.cc         |   6 +-
 src/runtime/contrib/mps/mps_utils.h                |   1 -
 src/runtime/contrib/mps/mps_utils.mm               |   7 +-
 src/runtime/contrib/mrvl/mrvl_hw_runtime.cc        |  35 +-
 src/runtime/contrib/mrvl/mrvl_runtime.cc           |  23 +-
 src/runtime/contrib/msc/tensorrt_runtime.cc        |   1 -
 src/runtime/contrib/random/random.cc               |   6 +-
 src/runtime/contrib/rocblas/rocblas.cc             |  12 +-
 src/runtime/contrib/tensorrt/tensorrt_runtime.cc   |  76 +--
 src/runtime/cpu_device_api.cc                      |  10 +-
 src/runtime/cuda/cuda_device_api.cc                |   8 +-
 src/runtime/cuda/cuda_module.cc                    |  25 +-
 src/runtime/cuda/l2_cache_flush.cc                 |   8 +-
 src/runtime/device_api.cc                          |   1 +
 src/runtime/disco/loader.cc                        |   1 +
 src/runtime/disco/message_queue.h                  |  16 +-
 src/runtime/disco/protocol.h                       |  11 +-
 src/runtime/disco/threaded_session.cc              |  12 +-
 src/runtime/file_utils.cc                          | 138 +++---
 src/runtime/file_utils.h                           |   6 +-
 src/runtime/hexagon/hexagon_device_api.cc          |  10 +-
 src/runtime/hexagon/hexagon_module.cc              |  16 +-
 src/runtime/logging.cc                             |   4 +-
 src/runtime/meta_data.h                            |  27 +-
 src/runtime/metal/metal_device_api.mm              |   8 +-
 src/runtime/metal/metal_module.mm                  |  42 +-
 src/runtime/opencl/opencl_device_api.cc            |  12 +-
 src/runtime/opencl/opencl_module.cc                |  48 +-
 src/runtime/opencl/opencl_module_spirv.cc          |  14 +-
 .../opencl/opencl_wrapper/opencl_wrapper.cc        |   1 -
 src/runtime/pack_args.h                            |   1 +
 src/runtime/profiling.cc                           |  90 ++--
 src/runtime/rocm/rocm_device_api.cc                |   8 +-
 src/runtime/rocm/rocm_module.cc                    |  25 +-
 src/runtime/rpc/rpc_endpoint.cc                    |  30 +-
 src/runtime/rpc/rpc_pipe_impl.cc                   |   6 +-
 src/runtime/rpc/rpc_socket_impl.cc                 |  14 +-
 src/runtime/spirv/spirv_shader.h                   |  24 +-
 src/runtime/static_library.cc                      |  22 +-
 src/runtime/thread_pool.cc                         |  11 +-
 src/runtime/thread_storage_scope.h                 |   1 +
 src/runtime/vm/executable.cc                       |  37 +-
 src/runtime/vm/tensor_cache_support.cc             |   2 +-
 src/runtime/vulkan/vulkan_device.cc                |   4 +-
 src/runtime/vulkan/vulkan_module.cc                |  19 +-
 src/runtime/vulkan/vulkan_wrapped_func.cc          |  27 +-
 src/s_tir/analysis/calculate_allocated_memory.cc   |  12 +-
 src/{tir => s_tir}/analysis/estimate_flops.cc      |   7 +-
 src/s_tir/analysis/find_anchor_sblock.cc           |   3 +-
 src/{tir => s_tir}/analysis/identify_memcpy.cc     |   7 +-
 src/{tir => s_tir}/analysis/is_pure_function.cc    |   9 +-
 src/{tir => s_tir}/analysis/oob_checker.cc         |  15 +-
 .../analysis/sblock_access_region_detector.cc      |   1 +
 src/{tir => s_tir}/analysis/verify_gpu_code.cc     |  15 +-
 .../backend/adreno/inject_texture_alloc.cc         |  14 +-
 .../backend/adreno/texture_flatten.cc              |  12 +-
 src/s_tir/meta_schedule/arg_info.cc                |   4 +-
 .../feature_extractor/per_store_feature.cc         |   2 +-
 src/s_tir/meta_schedule/mutator/mutate_parallel.cc |   1 +
 .../postproc/disallow_async_strided_mem_copy.cc    |   2 +-
 .../meta_schedule/postproc/verify_gpu_code.cc      |   6 +-
 .../meta_schedule/postproc/verify_vtcm_limit.cc    |   6 +-
 .../search_strategy/evolutionary_search.cc         |   2 +
 .../meta_schedule/task_scheduler/task_scheduler.cc |   3 +-
 src/s_tir/meta_schedule/utils.h                    |  16 +-
 src/s_tir/schedule/primitive/hide_buffer_access.cc |   2 +
 .../schedule/primitive/reorder_block_iter_var.cc   |   2 +
 .../transform/decorate_device_scope.cc             |  15 +-
 .../transform/default_gpu_schedule.cc              |  21 +-
 src/s_tir/transform/inject_software_pipeline.cc    |   1 +
 src/s_tir/transform/lower_async_dma.cc             |   6 +-
 .../transform/merge_shared_memory_allocations.cc   |   2 +
 src/{tir => s_tir}/transform/remove_store_undef.cc |  22 +-
 .../remove_weight_layout_rewrite_block.cc          |  13 +-
 src/{tir => s_tir}/transform/renew_defs.cc         |  11 +-
 src/s_tir/transform/storage_access.cc              |   1 -
 .../transform/using_assume_to_reduce_branches.cc   |  13 +-
 .../printer/doc_printer/python_doc_printer.cc      |   1 +
 src/support/base64.h                               |  21 +-
 src/support/bytes_io.h                             | 103 ++++
 src/support/env.h                                  |  63 +++
 src/support/libinfo.cc                             |   1 -
 src/support/pipe.h                                 |   4 +-
 src/support/socket.h                               |   4 +-
 src/target/codegen.cc                              |  31 +-
 src/target/intrin_rule.cc                          |  20 +
 src/target/llvm/codegen_hexagon.cc                 |   2 +-
 src/target/llvm/llvm_instance.cc                   |   3 +-
 src/target/llvm/llvm_module.cc                     |   2 +-
 src/target/source/codegen_webgpu.cc                |  25 +-
 src/target/source/source_module.cc                 |  42 +-
 src/target/spirv/spirv_utils.cc                    |   4 +-
 src/target/target.cc                               |  12 +-
 src/target/target_info.cc                          |  52 --
 src/tir/ir/buffer.cc                               |   1 +
 src/tir/ir/function.cc                             |   4 +-
 src/tir/op/builtin.cc                              |   4 -
 src/tir/transform/bind_target.cc                   |   3 +-
 src/tir/transform/combine_context_call.cc          | 123 -----
 src/tir/transform/convert_for_loops_serial.cc      |  78 ---
 .../transform/lower_device_storage_access_info.cc  | 141 ------
 src/tir/transform/lower_intrin.cc                  |   1 +
 src/tir/transform/make_unpacked_api.cc             | 210 --------
 .../reduce_branching_through_overcompute.cc        | 187 -------
 src/tir/transform/storage_rewrite.cc               |  26 +-
 src/topi/einsum.cc                                 |   3 +
 tests/lint/cpplint.sh                              |  11 +-
 tests/lint/jnilint.sh                              |   3 +-
 tests/python/contrib/test_msc/test_plugin.py       |   2 +-
 .../contrib/test_msc/test_translate_tensorrt.py    |   2 +-
 tests/python/relax/test_codegen_cublas.py          |   2 +-
 tests/python/relax/test_codegen_cutlass.py         |   6 +-
 tests/python/relax/test_contrib_vllm.py            |   2 +-
 ...eliminate_pad_branch_using_buffer_assumption.py |   6 +-
 .../python/relax/test_frontend_nn_extern_module.py |   2 -
 tests/python/relax/test_frontend_nn_op.py          |   8 +-
 tests/python/relax/test_transform_codegen_pass.py  |   4 +-
 .../relax/test_transform_meta_schedule_tuning.py   |   2 +-
 tests/python/relax/test_vm_cuda_graph.py           |   2 +-
 tests/python/relax/test_vm_multi_device.py         |   2 +-
 ...t_s_tir_analysis_calculate_allocated_memory.py} |   6 +-
 .../test_s_tir_analysis_estimate_tir_flops.py}     |   2 +-
 .../test_s_tir_analysis_identify_memcpy.py}        |   2 +-
 .../test_s_tir_analysis_is_pure_function.py}       |   2 +-
 .../analysis/test_s_tir_analysis_oob.py}           |  10 +-
 .../test_s_tir_renew_defs.py}                      |  12 +-
 .../test_s_tir_transform_decorate_device_scope.py} |   2 +-
 .../test_s_tir_transform_default_gpu_schedule.py}  |   2 +-
 .../test_s_tir_transform_inject_double_buffer.py   |   2 +-
 .../test_s_tir_transform_remove_undef.py}          |  12 +-
 ...ransform_remove_weight_layout_rewrite_block.py} |   2 +-
 .../test_tir_transform_combine_context_call.py     | 113 -----
 .../test_tir_transform_convert_for_loops_serial.py |  62 ---
 ...r_transform_lower_device_storage_access_info.py | 155 ------
 .../test_tir_transform_make_unpacked_api.py        | 306 ------------
 ...ansform_reduce_branching_through_overcompute.py | 280 -----------
 .../test_tir_transform_storage_rewrite.py          |  19 -
 web/Makefile                                       |   2 +-
 web/emcc/tvmjs_support.cc                          |   3 +-
 web/emcc/wasm_runtime.cc                           |   1 -
 web/emcc/webgpu_runtime.cc                         |  32 +-
 264 files changed, 3085 insertions(+), 4481 deletions(-)
 rename include/tvm/{tir => s_tir}/backend/adreno/transform.h (73%)
 create mode 100644 include/tvm/support/io.h
 create mode 100644 include/tvm/support/serializer.h
 delete mode 100644 include/tvm/target/target_info.h
 rename python/tvm/{tir => s_tir}/backend/adreno/transform/__init__.py (100%)
 copy python/tvm/{ir/_ffi_analysis_api.py => s_tir/backend/adreno/transform/_ffi_api.py} (87%)
 rename python/tvm/{tir => s_tir}/backend/adreno/transform/transform.py (100%)
 delete mode 100644 python/tvm/tir/backend/adreno/transform/_ffi_api.py
 rename src/{tir => s_tir}/analysis/estimate_flops.cc (98%)
 rename src/{tir => s_tir}/analysis/identify_memcpy.cc (98%)
 rename src/{tir => s_tir}/analysis/is_pure_function.cc (94%)
 rename src/{tir => s_tir}/analysis/oob_checker.cc (92%)
 rename src/{tir => s_tir}/analysis/verify_gpu_code.cc (96%)
 rename src/{tir => s_tir}/backend/adreno/inject_texture_alloc.cc (90%)
 rename src/{tir => s_tir}/backend/adreno/texture_flatten.cc (94%)
 rename src/{tir => s_tir}/transform/decorate_device_scope.cc (79%)
 rename src/{tir => s_tir}/transform/default_gpu_schedule.cc (91%)
 rename src/{tir => s_tir}/transform/remove_store_undef.cc (88%)
 rename src/{tir => s_tir}/transform/remove_weight_layout_rewrite_block.cc (93%)
 rename src/{tir => s_tir}/transform/renew_defs.cc (98%)
 rename src/{tir => s_tir}/transform/using_assume_to_reduce_branches.cc (98%)
 create mode 100644 src/support/bytes_io.h
 create mode 100644 src/support/env.h
 delete mode 100644 src/target/target_info.cc
 delete mode 100644 src/tir/transform/combine_context_call.cc
 delete mode 100644 src/tir/transform/convert_for_loops_serial.cc
 delete mode 100644 src/tir/transform/lower_device_storage_access_info.cc
 delete mode 100644 src/tir/transform/make_unpacked_api.cc
 delete mode 100644 src/tir/transform/reduce_branching_through_overcompute.cc
 rename tests/python/{tir-analysis/test_tir_analysis_calculate_allocated_memory.py => s_tir/analysis/test_s_tir_analysis_calculate_allocated_memory.py} (96%)
 rename tests/python/{tir-analysis/test_tir_analysis_estimate_tir_flops.py => s_tir/analysis/test_s_tir_analysis_estimate_tir_flops.py} (98%)
 rename tests/python/{tir-analysis/test_tir_analysis_identify_memcpy.py => s_tir/analysis/test_s_tir_analysis_identify_memcpy.py} (99%)
 rename tests/python/{tir-analysis/test_tir_analysis_is_pure_function.py => s_tir/analysis/test_s_tir_analysis_is_pure_function.py} (97%)
 rename tests/python/{tir-analysis/test_tir_analysis_oob.py => s_tir/analysis/test_s_tir_analysis_oob.py} (84%)
 rename tests/python/{tir-base/test_tir_renew_defs.py => s_tir/test_s_tir_renew_defs.py} (96%)
 rename tests/python/{tir-transform/test_tir_transform_decorate_device_scope.py => s_tir/transform/test_s_tir_transform_decorate_device_scope.py} (93%)
 rename tests/python/{tir-transform/test_transform_default_gpu_schedule.py => s_tir/transform/test_s_tir_transform_default_gpu_schedule.py} (99%)
 rename tests/python/{tir-transform/test_tir_transform_remove_undef.py => s_tir/transform/test_s_tir_transform_remove_undef.py} (90%)
 rename tests/python/{tir-transform/test_tir_transform_remove_weight_layout_rewrite_block.py => s_tir/transform/test_s_tir_transform_remove_weight_layout_rewrite_block.py} (97%)
 delete mode 100644 tests/python/tir-transform/test_tir_transform_combine_context_call.py
 delete mode 100644 tests/python/tir-transform/test_tir_transform_convert_for_loops_serial.py
 delete mode 100644 tests/python/tir-transform/test_tir_transform_lower_device_storage_access_info.py
 delete mode 100644 tests/python/tir-transform/test_tir_transform_make_unpacked_api.py
 delete mode 100644 tests/python/tir-transform/test_tir_transform_reduce_branching_through_overcompute.py

Reply via email to