This is an automated email from the ASF dual-hosted git repository.

github-bot pushed a change to branch nightly
in repository https://gitbox.apache.org/repos/asf/tvm.git


    from 00ae64744e [FFI][ABI] Refactor the naming of DLPack speed converter (#18308)
     add 678984f62d [FFI][ABI] Better String and Nested Container handling (#18311)
     add 5ddc5bc6c3 [FFI][REFACTOR] Update TVM_FFI_STATIC_INIT_BLOCK to fn style (#18312)

No new revisions were added by this update.

Summary of changes:
 3rdparty/cutlass_fpA_intB_gemm                     |   2 +-
 apps/cpp_rpc/rpc_server.cc                         |   4 +-
 apps/ios_rpc/tvmrpc/TVMRuntime.mm                  |   8 +-
 docs/arch/device_target_interactions.rst           |   8 +-
 docs/arch/pass_infra.rst                           |   4 +-
 docs/arch/runtime.rst                              |  10 +-
 ffi/docs/guides/packaging.md                       |   4 +-
 ffi/docs/guides/python_guide.md                    |   4 +-
 ffi/examples/packaging/src/extension.cc            |   4 +-
 ffi/include/tvm/ffi/base_details.h                 |  40 ++-
 ffi/include/tvm/ffi/c_api.h                        |  19 ++
 ffi/pyproject.toml                                 |   2 +-
 ffi/python/tvm_ffi/_convert.py                     |  11 +-
 ffi/python/tvm_ffi/_optional_torch_c_dlpack.py     |   1 -
 ffi/python/tvm_ffi/cython/base.pxi                 |  11 +
 ffi/python/tvm_ffi/cython/function.pxi             | 267 ++++++++++++++++-----
 ffi/python/tvm_ffi/cython/object.pxi               |  11 +-
 ffi/python/tvm_ffi/cython/string.pxi               |   5 -
 ffi/python/tvm_ffi/cython/tvm_ffi_python_helpers.h | 101 +++++++-
 ffi/src/ffi/container.cc                           |   4 +-
 ffi/src/ffi/extra/json_parser.cc                   |   4 +-
 ffi/src/ffi/extra/json_writer.cc                   |   4 +-
 ffi/src/ffi/extra/library_module_dynamic_lib.cc    |   4 +-
 ffi/src/ffi/extra/library_module_system_lib.cc     |   4 +-
 ffi/src/ffi/extra/module.cc                        |   4 +-
 ffi/src/ffi/extra/reflection_extra.cc              |   4 +-
 ffi/src/ffi/extra/serialization.cc                 |   4 +-
 ffi/src/ffi/extra/structural_equal.cc              |   4 +-
 ffi/src/ffi/extra/structural_hash.cc               |   4 +-
 ffi/src/ffi/extra/testing.cc                       |   8 +-
 ffi/src/ffi/function.cc                            |   4 +-
 ffi/src/ffi/object.cc                              |  18 ++
 ffi/src/ffi/tensor.cc                              |   4 +-
 ffi/tests/cpp/test_reflection.cc                   |   8 +-
 ffi/tests/python/test_function.py                  |  33 +++
 ffi/tests/python/test_load_inline.py               |  13 +-
 include/tvm/runtime/profiling.h                    |   4 +-
 python/tvm/contrib/msc/plugin/codegen/sources.py   |  13 +-
 src/arith/analyzer.cc                              |   4 +-
 src/arith/bound_deducer.cc                         |   4 +-
 src/arith/const_int_bound.cc                       |   6 +-
 src/arith/detect_common_subexpr.cc                 |   4 +-
 src/arith/detect_linear_equation.cc                |   4 +-
 src/arith/domain_touched.cc                        |   4 +-
 src/arith/int_constraints.cc                       |  16 +-
 src/arith/int_set.cc                               |  10 +-
 src/arith/iter_affine_map.cc                       |  40 +--
 src/arith/modular_set.cc                           |   6 +-
 src/arith/narrow_predicate_expression.cc           |   4 +-
 src/arith/presburger_set.cc                        |   6 +-
 src/arith/rewrite_simplify.cc                      |   2 +-
 src/arith/solve_linear_equation.cc                 |   4 +-
 src/arith/solve_linear_inequality.cc               |   4 +-
 src/contrib/msc/core/ir/graph.cc                   |  16 +-
 src/contrib/msc/core/ir/graph_builder.cc           |   4 +-
 src/contrib/msc/core/ir/plugin.cc                  |   8 +-
 src/contrib/msc/core/printer/msc_doc.cc            |   4 +-
 .../msc/core/transform/bind_named_params.cc        |   4 +-
 src/contrib/msc/core/transform/bind_shape.cc       |   4 +-
 src/contrib/msc/core/transform/fuse_tuple.cc       |   4 +-
 src/contrib/msc/core/transform/inline_params.cc    |   4 +-
 src/contrib/msc/core/transform/set_byoc_attrs.cc   |   4 +-
 src/contrib/msc/core/transform/set_expr_layout.cc  |   4 +-
 src/contrib/msc/core/transform/set_expr_name.cc    |   4 +-
 src/contrib/msc/core/utils.cc                      |   4 +-
 src/contrib/msc/framework/tensorflow/codegen.cc    |   4 +-
 src/contrib/msc/framework/tensorrt/codegen.cc      |   8 +-
 .../msc/framework/tensorrt/transform_tensorrt.cc   |   4 +-
 src/contrib/msc/framework/torch/codegen.cc         |   4 +-
 src/contrib/msc/framework/tvm/codegen.cc           |   4 +-
 src/contrib/msc/plugin/tensorrt_codegen.cc         |   4 +-
 src/contrib/msc/plugin/torch_codegen.cc            |   4 +-
 src/contrib/msc/plugin/tvm_codegen.cc              |   4 +-
 src/ir/analysis.cc                                 |   4 +-
 src/ir/apply_pass_to_function.cc                   |   4 +-
 src/ir/attrs.cc                                    |  10 +-
 src/ir/diagnostic.cc                               |  32 +--
 src/ir/env_func.cc                                 |   6 +-
 src/ir/expr.cc                                     |  20 +-
 src/ir/function.cc                                 |   4 +-
 src/ir/global_info.cc                              |  12 +-
 src/ir/global_var_supply.cc                        |   6 +-
 src/ir/instrument.cc                               |  10 +-
 src/ir/module.cc                                   |   6 +-
 src/ir/name_supply.cc                              |   4 +-
 src/ir/op.cc                                       |   6 +-
 src/ir/replace_global_vars.cc                      |   8 +-
 src/ir/source_map.cc                               |  16 +-
 src/ir/transform.cc                                |  28 +--
 src/ir/type.cc                                     |  20 +-
 src/meta_schedule/arg_info.cc                      |   6 +-
 src/meta_schedule/builder/builder.cc               |   8 +-
 src/meta_schedule/cost_model/cost_model.cc         |   4 +-
 src/meta_schedule/database/database.cc             |   8 +-
 src/meta_schedule/database/json_database.cc        |   6 +-
 src/meta_schedule/database/memory_database.cc      |   6 +-
 .../database/ordered_union_database.cc             |   6 +-
 src/meta_schedule/database/schedule_fn_database.cc |   6 +-
 src/meta_schedule/database/union_database.cc       |   6 +-
 src/meta_schedule/extracted_task.cc                |   6 +-
 .../feature_extractor/feature_extractor.cc         |   8 +-
 .../feature_extractor/per_store_feature.cc         |   6 +-
 .../measure_callback/add_to_database.cc            |   4 +-
 .../measure_callback/measure_callback.cc           |   8 +-
 .../measure_callback/remove_build_artifact.cc      |   4 +-
 .../measure_callback/update_cost_model.cc          |   4 +-
 .../mutator/mutate_compute_location.cc             |   6 +-
 src/meta_schedule/mutator/mutate_parallel.cc       |   6 +-
 src/meta_schedule/mutator/mutate_thread_binding.cc |   6 +-
 src/meta_schedule/mutator/mutate_tile_size.cc      |   6 +-
 src/meta_schedule/mutator/mutate_unroll.cc         |   6 +-
 src/meta_schedule/mutator/mutator.cc               |   8 +-
 .../postproc/disallow_async_strided_mem_copy.cc    |   4 +-
 .../postproc/disallow_dynamic_loop.cc              |   4 +-
 src/meta_schedule/postproc/postproc.cc             |   8 +-
 .../postproc/rewrite_cooperative_fetch.cc          |   6 +-
 src/meta_schedule/postproc/rewrite_layout.cc       |   4 +-
 .../postproc/rewrite_parallel_vectorize_unroll.cc  |   4 +-
 .../postproc/rewrite_reduction_block.cc            |   6 +-
 src/meta_schedule/postproc/rewrite_tensorize.cc    |   6 +-
 .../postproc/rewrite_unbound_block.cc              |   6 +-
 src/meta_schedule/postproc/verify_gpu_code.cc      |   4 +-
 src/meta_schedule/postproc/verify_vtcm_limit.cc    |   4 +-
 src/meta_schedule/profiler.cc                      |   6 +-
 src/meta_schedule/runner/runner.cc                 |   8 +-
 src/meta_schedule/schedule/cpu/winograd.cc         |   4 +-
 src/meta_schedule/schedule/cuda/winograd.cc        |   4 +-
 src/meta_schedule/schedule_rule/add_rfactor.cc     |   6 +-
 .../schedule_rule/apply_custom_rule.cc             |   6 +-
 src/meta_schedule/schedule_rule/auto_bind.cc       |   6 +-
 src/meta_schedule/schedule_rule/auto_inline.cc     |  12 +-
 .../schedule_rule/cross_thread_reduction.cc        |   6 +-
 .../schedule_rule/multi_level_tiling.cc            |   6 +-
 .../multi_level_tiling_tensor_core.cc              |   4 +-
 .../multi_level_tiling_wide_vector.cc              |   4 +-
 .../multi_level_tiling_with_intrin.cc              |   4 +-
 .../schedule_rule/parallel_vectorize_unroll.cc     |   6 +-
 .../schedule_rule/random_compute_location.cc       |   6 +-
 src/meta_schedule/schedule_rule/schedule_rule.cc   |   8 +-
 .../search_strategy/evolutionary_search.cc         |   6 +-
 src/meta_schedule/search_strategy/replay_func.cc   |   6 +-
 src/meta_schedule/search_strategy/replay_trace.cc  |   6 +-
 .../search_strategy/search_strategy.cc             |   8 +-
 .../space_generator/post_order_apply.cc            |   6 +-
 src/meta_schedule/space_generator/schedule_fn.cc   |   6 +-
 .../space_generator/space_generator.cc             |   8 +-
 .../space_generator/space_generator_union.cc       |   6 +-
 src/meta_schedule/task_scheduler/gradient_based.cc |   6 +-
 src/meta_schedule/task_scheduler/round_robin.cc    |   6 +-
 src/meta_schedule/task_scheduler/task_scheduler.cc |   8 +-
 src/meta_schedule/trace_apply.cc                   |   4 +-
 src/meta_schedule/tune_context.cc                  |   6 +-
 src/node/reflection.cc                             |   4 +-
 src/node/repr_printer.cc                           |   4 +-
 src/node/script_printer.cc                         |   6 +-
 src/node/serialization.cc                          |   4 +-
 src/node/structural_equal.cc                       |   4 +-
 src/node/structural_hash.cc                        |  14 +-
 src/relax/analysis/analysis.cc                     |   4 +-
 src/relax/analysis/computable_at_compile_time.cc   |   4 +-
 src/relax/analysis/detect_recursion.cc             |   4 +-
 src/relax/analysis/layout_transformation.cc        |   4 +-
 src/relax/analysis/struct_info_analysis.cc         |  38 +--
 src/relax/analysis/tir_op_pattern_kind.cc          |   4 +-
 src/relax/analysis/udchain.cc                      |   4 +-
 src/relax/analysis/var2value.cc                    |   8 +-
 src/relax/analysis/well_formed.cc                  |   4 +-
 src/relax/backend/contrib/clml/codegen.cc          |  10 +-
 src/relax/backend/contrib/cublas/codegen.cc        |   4 +-
 src/relax/backend/contrib/cudnn/codegen.cc         |   4 +-
 src/relax/backend/contrib/cutlass/codegen.cc       |  10 +-
 src/relax/backend/contrib/dnnl/codegen.cc          |   4 +-
 src/relax/backend/contrib/hipblas/codegen.cc       |   4 +-
 src/relax/backend/contrib/nnapi/codegen.cc         |   4 +-
 src/relax/backend/contrib/tensorrt/codegen.cc      |  10 +-
 src/relax/backend/contrib/utils.cc                 |   4 +-
 src/relax/backend/pattern_registry.cc              |   4 +-
 src/relax/backend/task_extraction.cc               |   4 +-
 src/relax/backend/vm/codegen_vm.cc                 |   8 +-
 src/relax/backend/vm/codegen_vm_tir.cc             |   4 +-
 src/relax/backend/vm/exec_builder.cc               |   6 +-
 src/relax/backend/vm/lower_runtime_builtin.cc      |   4 +-
 src/relax/backend/vm/vm_shape_lower.cc             |   4 +-
 src/relax/distributed/global_info.cc               |   6 +-
 src/relax/distributed/struct_info.cc               |  16 +-
 .../distributed/transform/legalize_redistribute.cc |   4 +-
 src/relax/distributed/transform/lower_distir.cc    |   4 +-
 .../transform/lower_global_view_to_local_view.cc   |   4 +-
 .../distributed/transform/propagate_sharding.cc    |   4 +-
 src/relax/ir/binding_rewrite.cc                    |  32 +--
 src/relax/ir/block_builder.cc                      |   4 +-
 src/relax/ir/dataflow_block_rewriter.cc            |  10 +-
 src/relax/ir/dataflow_expr_rewriter.cc             |  35 +--
 src/relax/ir/dataflow_pattern.cc                   | 100 ++++----
 src/relax/ir/emit_te.cc                            |   6 +-
 src/relax/ir/expr.cc                               |  88 +++----
 src/relax/ir/expr_functor.cc                       |   4 +-
 src/relax/ir/py_expr_functor.cc                    |   8 +-
 src/relax/ir/struct_info.cc                        |  32 +--
 src/relax/ir/tir_pattern.cc                        |   2 +-
 src/relax/ir/transform.cc                          |  12 +-
 src/relax/ir/type.cc                               |  20 +-
 src/relax/op/ccl/ccl.cc                            |  20 +-
 src/relax/op/distributed/distributed.cc            |  18 +-
 src/relax/op/image/resize.cc                       |   6 +-
 src/relax/op/memory/view.cc                        |  12 +-
 src/relax/op/nn/attention.cc                       |   6 +-
 src/relax/op/nn/convolution.cc                     |  24 +-
 src/relax/op/nn/nn.cc                              |  64 ++---
 src/relax/op/nn/nn.h                               |   4 +-
 src/relax/op/nn/pooling.cc                         |  40 +--
 src/relax/op/op.cc                                 | 116 ++++-----
 src/relax/op/op_common.h                           |  15 +-
 src/relax/op/tensor/binary.h                       |   5 +-
 src/relax/op/tensor/create.cc                      |  36 +--
 src/relax/op/tensor/datatype.cc                    |  12 +-
 src/relax/op/tensor/grad.cc                        |  28 +--
 src/relax/op/tensor/index.cc                       |  16 +-
 src/relax/op/tensor/linear_algebra.cc              |  16 +-
 src/relax/op/tensor/manipulate.cc                  | 100 ++++----
 src/relax/op/tensor/qdq.cc                         |  10 +-
 src/relax/op/tensor/sampling.cc                    |   6 +-
 src/relax/op/tensor/search.cc                      |  17 +-
 src/relax/op/tensor/set.cc                         |   8 +-
 src/relax/op/tensor/sorting.cc                     |  16 +-
 src/relax/op/tensor/statistical.cc                 |  12 +-
 src/relax/op/tensor/statistical.h                  |   5 +-
 src/relax/op/tensor/ternary.cc                     |   4 +-
 src/relax/op/tensor/unary.cc                       |   4 +-
 src/relax/op/tensor/unary.h                        |   2 +-
 src/relax/testing/transform.cc                     |   4 +-
 src/relax/training/utils.cc                        |   4 +-
 src/relax/transform/adjust_matmul_order.cc         |   4 +-
 src/relax/transform/allocate_workspace.cc          |   4 +-
 src/relax/transform/alter_op_impl.cc               |   4 +-
 src/relax/transform/annotate_tir_op_pattern.cc     |   4 +-
 .../transform/attach_attr_layout_free_buffers.cc   |   4 +-
 src/relax/transform/attach_global_symbol.cc        |   4 +-
 src/relax/transform/bind_params.cc                 |   8 +-
 src/relax/transform/bind_symbolic_vars.cc          |   8 +-
 src/relax/transform/bundle_model_params.cc         |   4 +-
 src/relax/transform/call_tir_rewrite.cc            |   4 +-
 src/relax/transform/canonicalize_bindings.cc       |   4 +-
 src/relax/transform/combine_parallel_matmul.cc     |   4 +-
 src/relax/transform/compute_prim_value.cc          |   4 +-
 src/relax/transform/convert_dataflow.cc            |   4 +-
 src/relax/transform/convert_layout.cc              |   4 +-
 src/relax/transform/dataflow_inplace.cc            |  10 +-
 src/relax/transform/dead_code_elimination.cc       |   4 +-
 src/relax/transform/decompose_ops.cc               |   4 +-
 src/relax/transform/eliminate_common_subexpr.cc    |   4 +-
 src/relax/transform/expand_matmul_of_sum.cc        |   4 +-
 src/relax/transform/expand_tuple_arguments.cc      |   4 +-
 src/relax/transform/few_shot_tuning.cc             |   4 +-
 src/relax/transform/fold_constant.cc               |   4 +-
 src/relax/transform/fuse_ops.cc                    |  16 +-
 src/relax/transform/fuse_tir.cc                    |   4 +-
 src/relax/transform/gradient.cc                    |   4 +-
 src/relax/transform/infer_layout_utils.cc          |   4 +-
 src/relax/transform/inline_functions.cc            |   8 +-
 src/relax/transform/kill_after_last_use.cc         |   4 +-
 src/relax/transform/lambda_lift.cc                 |   4 +-
 src/relax/transform/lazy_transform_params.cc       |   8 +-
 src/relax/transform/legalize_ops.cc                |   4 +-
 src/relax/transform/lift_transform_params.cc       |   4 +-
 src/relax/transform/lower_alloc_tensor.cc          |   4 +-
 src/relax/transform/merge_composite_functions.cc   |   4 +-
 src/relax/transform/meta_schedule.cc               |   4 +-
 src/relax/transform/normalize.cc                   |   8 +-
 src/relax/transform/realize_vdevice.cc             |   4 +-
 src/relax/transform/remove_purity_checking.cc      |   4 +-
 src/relax/transform/remove_unused_outputs.cc       |   4 +-
 src/relax/transform/remove_unused_parameters.cc    |   4 +-
 .../transform/reorder_permute_dims_after_concat.cc |   4 +-
 src/relax/transform/reorder_take_after_matmul.cc   |   4 +-
 src/relax/transform/rewrite_cuda_graph.cc          |   4 +-
 src/relax/transform/rewrite_dataflow_reshape.cc    |   4 +-
 src/relax/transform/run_codegen.cc                 |   4 +-
 src/relax/transform/split_call_tir_by_pattern.cc   |   4 +-
 .../transform/split_layout_rewrite_preproc.cc      |   4 +-
 src/relax/transform/static_plan_block_memory.cc    |   4 +-
 src/relax/transform/to_mixed_precision.cc          |   4 +-
 src/relax/transform/to_non_dataflow.cc             |   4 +-
 src/relax/transform/topological_sort.cc            |   4 +-
 src/relax/transform/update_param_struct_info.cc    |   4 +-
 src/relax/transform/update_vdevice.cc              |   4 +-
 src/relax/utils.cc                                 |   4 +-
 src/runtime/const_loader_module.cc                 |   4 +-
 src/runtime/contrib/amx/amx_config.cc              |   8 +-
 src/runtime/contrib/arm_compute_lib/acl_runtime.cc |   4 +-
 src/runtime/contrib/bnns/bnns_json_runtime.cc      |   4 +-
 src/runtime/contrib/cblas/cblas.cc                 |   4 +-
 src/runtime/contrib/cblas/dnnl_blas.cc             |   4 +-
 src/runtime/contrib/cblas/mkl.cc                   |   8 +-
 src/runtime/contrib/clml/clml_runtime.cc           |   4 +-
 src/runtime/contrib/coreml/coreml_runtime.mm       |   8 +-
 src/runtime/contrib/cublas/cublas.cc               |  12 +-
 src/runtime/contrib/cublas/cublas_json_runtime.cc  |   4 +-
 src/runtime/contrib/cudnn/conv_backward.cc         |   4 +-
 src/runtime/contrib/cudnn/conv_forward.cc          |   4 +-
 src/runtime/contrib/cudnn/cudnn_json_runtime.cc    |   4 +-
 src/runtime/contrib/cudnn/cudnn_utils.cc           |   4 +-
 src/runtime/contrib/cudnn/softmax.cc               |   4 +-
 src/runtime/contrib/curand/curand.cc               |   4 +-
 .../contrib/cutlass/fp16_group_gemm_sm100.cu       |   4 +-
 .../contrib/cutlass/fp16_group_gemm_sm90.cu        |   4 +-
 src/runtime/contrib/cutlass/fp8_gemm.cu            |   4 +-
 src/runtime/contrib/cutlass/fp8_group_gemm_sm90.cu |   4 +-
 .../cutlass/fp8_groupwise_scaled_gemm_sm100.cu     |   4 +-
 .../cutlass/fp8_groupwise_scaled_gemm_sm90.cu      |   4 +-
 .../fp8_groupwise_scaled_group_gemm_sm100.cu       |   4 +-
 src/runtime/contrib/cutlass/weight_preprocess.cc   |   4 +-
 src/runtime/contrib/dnnl/dnnl.cc                   |   4 +-
 src/runtime/contrib/dnnl/dnnl_json_runtime.cc      |   4 +-
 src/runtime/contrib/edgetpu/edgetpu_runtime.cc     |   4 +-
 src/runtime/contrib/hipblas/hipblas.cc             |   4 +-
 .../contrib/hipblas/hipblas_json_runtime.cc        |   4 +-
 src/runtime/contrib/miopen/conv_forward.cc         |   4 +-
 src/runtime/contrib/miopen/softmax.cc              |   4 +-
 src/runtime/contrib/mps/conv.mm                    |   4 +-
 src/runtime/contrib/mps/gemm.mm                    |   4 +-
 src/runtime/contrib/mrvl/mrvl_hw_runtime.cc        |   4 +-
 src/runtime/contrib/mrvl/mrvl_runtime.cc           |   4 +-
 src/runtime/contrib/msc/tensorrt_runtime.cc        |   4 +-
 src/runtime/contrib/nnapi/nnapi_runtime.cc         |   4 +-
 src/runtime/contrib/nvshmem/init.cc                |   4 +-
 src/runtime/contrib/nvshmem/kv_transfer.cu         |   4 +-
 src/runtime/contrib/nvshmem/memory_allocator.cc    |   8 +-
 src/runtime/contrib/papi/papi.cc                   |   4 +-
 src/runtime/contrib/random/random.cc               |   4 +-
 src/runtime/contrib/rocblas/rocblas.cc             |   4 +-
 src/runtime/contrib/sort/sort.cc                   |   4 +-
 src/runtime/contrib/tensorrt/tensorrt_runtime.cc   |   4 +-
 src/runtime/contrib/tflite/tflite_runtime.cc       |   4 +-
 src/runtime/contrib/thrust/thrust.cu               |  12 +-
 src/runtime/contrib/vllm/attention_kernels.cu      |   8 +-
 src/runtime/contrib/vllm/cache_alloc.cc            |   4 +-
 src/runtime/contrib/vllm/cache_kernels.cu          |   4 +-
 src/runtime/cpu_device_api.cc                      |   4 +-
 src/runtime/cuda/cuda_device_api.cc                |  20 +-
 src/runtime/cuda/cuda_module.cc                    |   4 +-
 src/runtime/cuda/l2_cache_flush.cc                 |   4 +-
 src/runtime/device_api.cc                          |   8 +-
 src/runtime/disco/builtin.cc                       |   4 +-
 src/runtime/disco/cuda_ipc/cuda_ipc_memory.cc      |   4 +-
 src/runtime/disco/cuda_ipc/custom_allreduce.cc     |   4 +-
 src/runtime/disco/distributed/socket_session.cc    |   8 +-
 src/runtime/disco/loader.cc                        |   4 +-
 src/runtime/disco/nccl/nccl.cc                     |   4 +-
 src/runtime/disco/process_session.cc               |   4 +-
 src/runtime/disco/protocol.h                       |   6 +-
 src/runtime/disco/session.cc                       |   4 +-
 src/runtime/file_utils.cc                          |   4 +-
 src/runtime/hexagon/hexagon_common.cc              |   8 +-
 src/runtime/hexagon/hexagon_device_api.cc          |   4 +-
 src/runtime/hexagon/rpc/android/session.cc         |   4 +-
 src/runtime/hexagon/rpc/hexagon/rpc_server.cc      |   8 +-
 src/runtime/hexagon/rpc/simulator/rpc_server.cc    |   8 +-
 src/runtime/hexagon/rpc/simulator/session.cc       |   4 +-
 src/runtime/memory/memory_manager.cc               |   4 +-
 src/runtime/metal/metal_device_api.mm              |   8 +-
 src/runtime/metal/metal_module.mm                  |   8 +-
 src/runtime/minrpc/rpc_reference.h                 |   4 +-
 src/runtime/module.cc                              |   4 +-
 src/runtime/opencl/opencl_device_api.cc            |  12 +-
 src/runtime/opencl/opencl_module.cc                |   4 +-
 src/runtime/profiling.cc                           |  20 +-
 src/runtime/rocm/rocm_device_api.cc                |   8 +-
 src/runtime/rocm/rocm_module.cc                    |   4 +-
 src/runtime/rpc/rpc_device_api.cc                  |   4 +-
 src/runtime/rpc/rpc_endpoint.cc                    |  44 +++-
 src/runtime/rpc/rpc_event_impl.cc                  |   4 +-
 src/runtime/rpc/rpc_local_session.cc               |   4 +-
 src/runtime/rpc/rpc_module.cc                      |  12 +-
 src/runtime/rpc/rpc_pipe_impl.cc                   |   4 +-
 src/runtime/rpc/rpc_server_env.cc                  |   4 +-
 src/runtime/rpc/rpc_socket_impl.cc                 |   8 +-
 src/runtime/static_library.cc                      |   4 +-
 src/runtime/tensor.cc                              |   4 +-
 src/runtime/thread_pool.cc                         |   4 +-
 src/runtime/threading_backend.cc                   |   4 +-
 src/runtime/vm/builtin.cc                          |  64 ++---
 src/runtime/vm/cuda/cuda_graph_builtin.cc          |   4 +-
 src/runtime/vm/executable.cc                       |   8 +-
 src/runtime/vm/hexagon/builtin.cc                  |   4 +-
 src/runtime/vm/kv_state.cc                         |  12 +-
 src/runtime/vm/lm_support.cc                       |  56 ++---
 src/runtime/vm/paged_kv_cache.cc                   |   4 +-
 src/runtime/vm/rnn_state.cc                        |   4 +-
 src/runtime/vm/tensor_cache_support.cc             |   8 +-
 src/runtime/vulkan/vulkan_device_api.cc            |   4 +-
 src/runtime/vulkan/vulkan_module.cc                |   4 +-
 src/script/ir_builder/base.cc                      |   8 +-
 src/script/ir_builder/ir/frame.cc                  |   2 +-
 src/script/ir_builder/ir/ir.cc                     |   4 +-
 src/script/ir_builder/relax/distributed.cc         |   4 +-
 src/script/ir_builder/relax/frame.cc               |   4 +-
 src/script/ir_builder/relax/ir.cc                  |  20 +-
 src/script/ir_builder/tir/frame.cc                 |   4 +-
 src/script/ir_builder/tir/ir.cc                    |  56 ++---
 src/script/printer/doc.cc                          | 112 ++++-----
 .../printer/doc_printer/python_doc_printer.cc      |   4 +-
 src/script/printer/ir/ir.cc                        |   2 +-
 src/script/printer/ir_docsifier.cc                 |   4 +-
 src/script/printer/relax/function.cc               |   2 +-
 src/script/printer/relax/type.cc                   |   4 +-
 src/script/printer/tir/ir.cc                       |   2 +-
 src/support/ffi_testing.cc                         |  18 +-
 src/support/libinfo.cc                             |   4 +-
 src/target/codegen.cc                              |   8 +-
 src/target/datatype/registry.cc                    |   4 +-
 src/target/llvm/codegen_aarch64.cc                 |   4 +-
 src/target/llvm/codegen_amdgpu.cc                  |   4 +-
 src/target/llvm/codegen_arm.cc                     |   4 +-
 src/target/llvm/codegen_cpu.cc                     |   4 +-
 src/target/llvm/codegen_hexagon.cc                 |   4 +-
 src/target/llvm/codegen_llvm.cc                    |   2 +-
 src/target/llvm/codegen_nvptx.cc                   |   4 +-
 src/target/llvm/codegen_x86_64.cc                  |   4 +-
 src/target/llvm/llvm_module.cc                     |   2 +-
 src/target/opt/build_cuda_on.cc                    |   4 +-
 src/target/source/codegen_c_host.cc                |   4 +-
 src/target/source/codegen_metal.cc                 |   4 +-
 src/target/source/codegen_opencl.cc                |   8 +-
 src/target/source/codegen_webgpu.cc                |   4 +-
 src/target/source/source_module.cc                 |   8 +-
 src/target/spirv/build_vulkan.cc                   |   4 +-
 src/target/tag.cc                                  |   6 +-
 src/target/target.cc                               |   6 +-
 src/target/target_info.cc                          |   2 +-
 src/target/target_kind.cc                          |   8 +-
 src/target/virtual_device.cc                       |   6 +-
 src/te/operation/compute_op.cc                     |   8 +-
 src/te/operation/create_primfunc.cc                |   4 +-
 src/te/operation/extern_op.cc                      |   6 +-
 src/te/operation/graph.cc                          |   4 +-
 src/te/operation/placeholder_op.cc                 |   6 +-
 src/te/operation/scan_op.cc                        |   6 +-
 src/te/tensor.cc                                   |  10 +-
 src/tir/analysis/block_access_region_detector.cc   |   4 +-
 src/tir/analysis/buffer_access_lca_detector.cc     |   4 +-
 src/tir/analysis/calculate_allocated_memory.cc     |  12 +-
 src/tir/analysis/deep_equal.cc                     |   4 +-
 src/tir/analysis/estimate_flops.cc                 |   4 +-
 src/tir/analysis/identify_memcpy.cc                |   4 +-
 src/tir/analysis/is_pure_function.cc               |   4 +-
 src/tir/analysis/oob_checker.cc                    |   4 +-
 src/tir/analysis/stmt_finding.cc                   |   4 +-
 src/tir/analysis/var_use_def_analysis.cc           |   4 +-
 src/tir/analysis/verify_gpu_code.cc                |   8 +-
 src/tir/analysis/verify_memory.cc                  |   8 +-
 src/tir/analysis/verify_ssa.cc                     |   8 +-
 src/tir/analysis/verify_well_formed.cc             |   4 +-
 src/tir/ir/block_dependence_info.cc                |   6 +-
 src/tir/ir/block_scope.cc                          |   8 +-
 src/tir/ir/buffer.cc                               |   6 +-
 src/tir/ir/data_layout.cc                          |   8 +-
 src/tir/ir/expr.cc                                 | 140 +++++------
 src/tir/ir/function.cc                             |   8 +-
 src/tir/ir/index_map.cc                            |   6 +-
 src/tir/ir/py_functor.cc                           |  16 +-
 src/tir/ir/script/script_complete.cc               |   4 +-
 src/tir/ir/specialize.cc                           |   4 +-
 src/tir/ir/stmt.cc                                 |  72 +++---
 src/tir/ir/stmt_functor.cc                         |   4 +-
 src/tir/ir/transform.cc                            |   6 +-
 src/tir/op/op.cc                                   |  20 +-
 src/tir/schedule/analysis/analysis.cc              |  24 +-
 src/tir/schedule/analysis/layout.cc                |   4 +-
 src/tir/schedule/instruction.cc                    |   8 +-
 src/tir/schedule/primitive/decompose_padding.cc    |   4 +-
 src/tir/schedule/primitive/reduction.cc            |   4 +-
 src/tir/schedule/schedule.cc                       |  80 +++---
 src/tir/schedule/state.cc                          |   6 +-
 src/tir/schedule/trace.cc                          |   6 +-
 src/tir/schedule/transform.cc                      |   8 +-
 src/tir/transforms/annotate_device_regions.cc      |   4 +-
 src/tir/transforms/bind_target.cc                  |   4 +-
 src/tir/transforms/bound_checker.cc                |   4 +-
 src/tir/transforms/combine_context_call.cc         |   4 +-
 src/tir/transforms/common_subexpr_elim.cc          |   4 +-
 src/tir/transforms/compact_buffer_region.cc        |   4 +-
 src/tir/transforms/convert_blocks_to_opaque.cc     |   4 +-
 src/tir/transforms/convert_for_loops_serial.cc     |   4 +-
 src/tir/transforms/decorate_device_scope.cc        |   4 +-
 src/tir/transforms/default_gpu_schedule.cc         |   4 +-
 src/tir/transforms/extract_constants.cc            |   4 +-
 src/tir/transforms/flatten_buffer.cc               |   4 +-
 src/tir/transforms/force_narrow_index_to_i32.cc    |   4 +-
 src/tir/transforms/hoist_expression.cc             |  16 +-
 src/tir/transforms/inject_double_buffer.cc         |   6 +-
 src/tir/transforms/inject_permuted_layout.cc       |   4 +-
 src/tir/transforms/inject_ptx_async_copy.cc        |   4 +-
 src/tir/transforms/inject_ptx_ldg32.cc             |   4 +-
 src/tir/transforms/inject_rolling_buffer.cc        |   4 +-
 src/tir/transforms/inject_software_pipeline.cc     |   4 +-
 src/tir/transforms/inject_virtual_thread.cc        |   4 +-
 src/tir/transforms/inline_private_functions.cc     |   4 +-
 src/tir/transforms/ir_utils.cc                     |   4 +-
 src/tir/transforms/lift_thread_binding.cc          |   4 +-
 src/tir/transforms/loop_partition.cc               |   6 +-
 src/tir/transforms/lower_async_dma.cc              |   4 +-
 src/tir/transforms/lower_cross_thread_reduction.cc |   4 +-
 src/tir/transforms/lower_custom_datatypes.cc       |   4 +-
 src/tir/transforms/lower_device_kernel_launch.cc   |   4 +-
 .../transforms/lower_device_storage_access_info.cc |   4 +-
 src/tir/transforms/lower_init_block.cc             |   4 +-
 src/tir/transforms/lower_intrin.cc                 |   4 +-
 src/tir/transforms/lower_match_buffer.cc           |   4 +-
 src/tir/transforms/lower_opaque_block.cc           |   4 +-
 src/tir/transforms/lower_thread_allreduce.cc       |   4 +-
 src/tir/transforms/lower_tvm_builtin.cc            |   4 +-
 src/tir/transforms/lower_vtcm_alloc.cc             |   4 +-
 src/tir/transforms/lower_warp_memory.cc            |   4 +-
 src/tir/transforms/make_packed_api.cc              |   4 +-
 src/tir/transforms/make_unpacked_api.cc            |   4 +-
 .../manifest_shared_memory_local_stage.cc          |   4 +-
 src/tir/transforms/memhammer_lower_auto_copy.cc    |   4 +-
 .../transforms/merge_shared_memory_allocations.cc  |   4 +-
 src/tir/transforms/narrow_datatype.cc              |   4 +-
 .../plan_update_buffer_allocation_location.cc      |   4 +-
 src/tir/transforms/primfunc_utils.cc               |   4 +-
 src/tir/transforms/profile_instrumentation.cc      |   4 +-
 .../reduce_branching_through_overcompute.cc        |   6 +-
 src/tir/transforms/remap_thread_axis.cc            |   4 +-
 src/tir/transforms/remove_assume.cc                |   4 +-
 src/tir/transforms/remove_no_op.cc                 |   6 +-
 src/tir/transforms/remove_store_undef.cc           |   4 +-
 .../remove_weight_layout_rewrite_block.cc          |   4 +-
 src/tir/transforms/renew_defs.cc                   |   4 +-
 src/tir/transforms/renormalize_split_pattern.cc    |   4 +-
 src/tir/transforms/rewrite_unsafe_select.cc        |   4 +-
 src/tir/transforms/simplify.cc                     |   6 +-
 src/tir/transforms/skip_assert.cc                  |   4 +-
 src/tir/transforms/split_host_device.cc            |   4 +-
 src/tir/transforms/storage_rewrite.cc              |   8 +-
 src/tir/transforms/tensorcore_infer_fragment.cc    |   4 +-
 src/tir/transforms/thread_storage_sync.cc          |   4 +-
 src/tir/transforms/transform_mma_buffer_layout.cc  |   4 +-
 src/tir/transforms/unify_thread_binding.cc         |   4 +-
 src/tir/transforms/unroll_loop.cc                  |   6 +-
 src/tir/transforms/unsupported_dtype_legalize.cc   |  16 +-
 .../transforms/using_assume_to_reduce_branches.cc  |   4 +-
 src/tir/transforms/vectorize_loop.cc               |   4 +-
 src/topi/broadcast.cc                              |   4 +-
 src/topi/einsum.cc                                 |   4 +-
 src/topi/elemwise.cc                               |   4 +-
 src/topi/nn.cc                                     |  52 ++--
 src/topi/reduction.cc                              |   4 +-
 src/topi/transform.cc                              |   4 +-
 src/topi/utils.cc                                  |   4 +-
 src/topi/vision.cc                                 |   4 +-
 tests/cpp-runtime/hexagon/run_all_tests.cc         |   4 +-
 tests/cpp-runtime/hexagon/run_unit_tests.cc        |   4 +-
 tests/python/contrib/test_hexagon/README_RPC.md    |   8 +-
 web/emcc/tvmjs_support.cc                          |   4 +-
 web/emcc/wasm_runtime.cc                           |  16 +-
 web/emcc/webgpu_runtime.cc                         |   4 +-
 558 files changed, 2673 insertions(+), 2323 deletions(-)

Reply via email to