This is an automated email from the ASF dual-hosted git repository.

github-bot pushed a change to branch nightly
in repository https://gitbox.apache.org/repos/asf/tvm.git


    from ada7c7c7cc [Relax][Frontend][ONNX] Fix: bitwise_not misclassified as binary (is … (#18001)
     add 2d964b4133 [REFACTOR][FFI] Phase out legacy C API (#18010)

No new revisions were added by this update.

Summary of changes:
 3rdparty/cutlass_fpA_intB_gemm                     |   2 +-
 apps/android_rpc/app/src/main/jni/tvm_runtime.h    |   4 +-
 apps/cpp_rpc/rpc_env.cc                            |   4 +-
 apps/cpp_rpc/rpc_env.h                             |   2 +-
 apps/cpp_rpc/rpc_server.cc                         |   4 +-
 apps/cpp_rpc/rpc_server.h                          |   2 +-
 apps/hexagon_launcher/launcher_core.cc             |   2 +-
 apps/ios_rpc/tvmrpc/RPCServer.mm                   |   2 +-
 apps/ios_rpc/tvmrpc/TVMRuntime.mm                  |   8 +-
 docs/arch/device_target_interactions.rst           |  10 +-
 docs/arch/pass_infra.rst                           |   2 +-
 docs/arch/runtime.rst                              |   8 +-
 ffi/include/tvm/ffi/c_api.h                        |   7 +
 ffi/include/tvm/ffi/function.h                     |   2 +-
 include/tvm/ir/op.h                                |   2 +-
 include/tvm/ir/source_map.h                        |   2 +-
 include/tvm/node/node.h                            |   2 +-
 include/tvm/node/reflection.h                      |   2 +-
 include/tvm/node/serialization.h                   |   2 +-
 include/tvm/relax/exec_builder.h                   |   2 +-
 include/tvm/relax/type.h                           |   2 +-
 .../tvm/runtime/base.h                             |  46 +-
 include/tvm/runtime/builtin_fp16.h                 |   2 +-
 include/tvm/runtime/c_backend_api.h                |  34 +-
 include/tvm/runtime/c_runtime_api.h                | 732 -------------------
 include/tvm/runtime/data_type.h                    |   5 +-
 include/tvm/runtime/device_api.h                   |  42 +-
 include/tvm/runtime/disco/cuda_ipc_memory.h        |   2 +-
 include/tvm/runtime/logging.h                      |   2 +-
 include/tvm/runtime/memory/memory_manager.h        |   2 +-
 include/tvm/runtime/module.h                       |   2 +-
 include/tvm/runtime/ndarray.h                      |  48 +-
 include/tvm/runtime/nvtx.h                         |   2 +-
 include/tvm/runtime/object.h                       |   2 +-
 include/tvm/runtime/packed_func.h                  | 282 +------
 include/tvm/runtime/profiling.h                    |   6 +-
 include/tvm/runtime/registry.h                     | 102 ---
 include/tvm/runtime/relax_vm/executable.h          |   2 +-
 .../tvm/runtime/relax_vm/ndarray_cache_support.h   |   2 +-
 include/tvm/runtime/serializer.h                   |   2 +-
 include/tvm/support/parallel_for.h                 |   2 +-
 include/tvm/tir/builtin.h                          |  20 +-
 include/tvm/tir/expr.h                             |   2 +-
 include/tvm/tir/transform.h                        |   4 +-
 python/tvm/contrib/cutlass/gen_tensor_op.py        |   2 +-
 python/tvm/relax/frontend/nn/op.py                 |   2 +-
 python/tvm/runtime/_ffi_api.py                     |   4 +-
 python/tvm/runtime/_ffi_node_api.py                |   6 +-
 src/arith/analyzer.cc                              |   4 +-
 src/arith/bound_deducer.cc                         |   4 +-
 src/arith/const_int_bound.cc                       |   4 +-
 src/arith/detect_common_subexpr.cc                 |   2 +-
 src/arith/detect_linear_equation.cc                |   6 +-
 src/arith/domain_touched.cc                        |   6 +-
 src/arith/int_constraints.cc                       |  13 +-
 src/arith/int_set.cc                               |  30 +-
 src/arith/iter_affine_map.cc                       |  18 +-
 src/arith/modular_set.cc                           |   4 +-
 src/arith/narrow_predicate_expression.cc           |   5 +-
 src/arith/presburger_set.cc                        |   4 +-
 src/arith/solve_linear_equation.cc                 |   4 +-
 src/arith/solve_linear_inequality.cc               |   8 +-
 src/contrib/msc/core/ir/graph.cc                   | 101 +--
 src/contrib/msc/core/ir/graph_builder.cc           |   4 +-
 src/contrib/msc/core/ir/plugin.cc                  |   8 +-
 .../msc/core/transform/bind_named_params.cc        |   2 +-
 src/contrib/msc/core/transform/bind_shape.cc       |   2 +-
 src/contrib/msc/core/transform/fuse_tuple.cc       |   2 +-
 src/contrib/msc/core/transform/inline_params.cc    |   2 +-
 src/contrib/msc/core/transform/set_byoc_attrs.cc   |   2 +-
 src/contrib/msc/core/transform/set_expr_layout.cc  |   2 +-
 src/contrib/msc/core/transform/set_expr_name.cc    |   2 +-
 src/contrib/msc/core/utils.cc                      |  12 +-
 src/contrib/msc/framework/tensorflow/codegen.cc    |   2 +-
 src/contrib/msc/framework/tensorrt/codegen.cc      |   6 +-
 .../msc/framework/tensorrt/transform_tensorrt.cc   |   2 +-
 src/contrib/msc/framework/torch/codegen.cc         |   2 +-
 src/contrib/msc/framework/tvm/codegen.cc           |   2 +-
 src/contrib/msc/plugin/tensorrt_codegen.cc         |   2 +-
 src/contrib/msc/plugin/torch_codegen.cc            |   2 +-
 src/contrib/msc/plugin/tvm_codegen.cc              |   8 +-
 src/ir/analysis.cc                                 |   2 +-
 src/ir/apply_pass_to_function.cc                   |   4 +-
 src/ir/attrs.cc                                    |   6 +-
 src/ir/diagnostic.cc                               |  22 +-
 src/ir/env_func.cc                                 |   8 +-
 src/ir/expr.cc                                     |  14 +-
 src/ir/function.cc                                 |  14 +-
 src/ir/global_info.cc                              |   9 +-
 src/ir/global_var_supply.cc                        |  17 +-
 src/ir/instrument.cc                               |   8 +-
 src/ir/module.cc                                   |  46 +-
 src/ir/name_supply.cc                              |  11 +-
 src/ir/op.cc                                       |  26 +-
 src/ir/replace_global_vars.cc                      |   4 +-
 src/ir/source_map.cc                               |  23 +-
 src/ir/transform.cc                                |  46 +-
 src/ir/type.cc                                     |  15 +-
 src/meta_schedule/arg_info.cc                      |  11 +-
 src/meta_schedule/builder/builder.cc               |   8 +-
 src/meta_schedule/cost_model/cost_model.cc         |  11 +-
 src/meta_schedule/database/database.cc             |  45 +-
 src/meta_schedule/database/json_database.cc        |   3 +-
 src/meta_schedule/database/memory_database.cc      |   2 +-
 .../database/ordered_union_database.cc             |   2 +-
 src/meta_schedule/database/schedule_fn_database.cc |   2 +-
 src/meta_schedule/database/union_database.cc       |   3 +-
 src/meta_schedule/extracted_task.cc                |   2 +-
 .../feature_extractor/feature_extractor.cc         |   4 +-
 .../feature_extractor/per_store_feature.cc         |   2 +-
 .../measure_callback/add_to_database.cc            |   2 +-
 .../measure_callback/measure_callback.cc           |   6 +-
 .../measure_callback/remove_build_artifact.cc      |   2 +-
 .../measure_callback/update_cost_model.cc          |   2 +-
 .../mutator/mutate_compute_location.cc             |   2 +-
 src/meta_schedule/mutator/mutate_parallel.cc       |   3 +-
 src/meta_schedule/mutator/mutate_thread_binding.cc |   2 +-
 src/meta_schedule/mutator/mutate_tile_size.cc      |   3 +-
 src/meta_schedule/mutator/mutate_unroll.cc         |   2 +-
 src/meta_schedule/mutator/mutator.cc               |  17 +-
 .../postproc/disallow_async_strided_mem_copy.cc    |   2 +-
 .../postproc/disallow_dynamic_loop.cc              |   2 +-
 src/meta_schedule/postproc/postproc.cc             |  16 +-
 .../postproc/rewrite_cooperative_fetch.cc          |   2 +-
 src/meta_schedule/postproc/rewrite_layout.cc       |   3 +-
 .../postproc/rewrite_parallel_vectorize_unroll.cc  |   2 +-
 .../postproc/rewrite_reduction_block.cc            |   2 +-
 src/meta_schedule/postproc/rewrite_tensorize.cc    |   2 +-
 .../postproc/rewrite_unbound_block.cc              |   2 +-
 src/meta_schedule/postproc/verify_gpu_code.cc      |   3 +-
 src/meta_schedule/postproc/verify_vtcm_limit.cc    |   2 +-
 src/meta_schedule/profiler.cc                      |  14 +-
 src/meta_schedule/runner/runner.cc                 |  15 +-
 src/meta_schedule/schedule/cpu/winograd.cc         |   8 +-
 src/meta_schedule/schedule/cuda/winograd.cc        |   8 +-
 src/meta_schedule/schedule_rule/add_rfactor.cc     |   2 +-
 .../schedule_rule/apply_custom_rule.cc             |   2 +-
 src/meta_schedule/schedule_rule/auto_bind.cc       |   3 +-
 src/meta_schedule/schedule_rule/auto_inline.cc     |   4 +-
 .../schedule_rule/cross_thread_reduction.cc        |   2 +-
 .../schedule_rule/multi_level_tiling.cc            |   2 +-
 .../multi_level_tiling_tensor_core.cc              |   2 +-
 .../multi_level_tiling_wide_vector.cc              |   2 +-
 .../multi_level_tiling_with_intrin.cc              |   2 +-
 .../schedule_rule/parallel_vectorize_unroll.cc     |   2 +-
 .../schedule_rule/random_compute_location.cc       |   2 +-
 src/meta_schedule/schedule_rule/schedule_rule.cc   |  20 +-
 .../search_strategy/evolutionary_search.cc         |   6 +-
 src/meta_schedule/search_strategy/replay_func.cc   |   2 +-
 src/meta_schedule/search_strategy/replay_trace.cc  |   2 +-
 .../search_strategy/search_strategy.cc             |  16 +-
 .../space_generator/post_order_apply.cc            |   2 +-
 src/meta_schedule/space_generator/schedule_fn.cc   |   2 +-
 .../space_generator/space_generator.cc             |   8 +-
 .../space_generator/space_generator_union.cc       |   2 +-
 src/meta_schedule/task_scheduler/gradient_based.cc |   2 +-
 src/meta_schedule/task_scheduler/round_robin.cc    |   2 +-
 src/meta_schedule/task_scheduler/task_scheduler.cc |  15 +-
 src/meta_schedule/trace_apply.cc                   |   2 +-
 src/meta_schedule/tune_context.cc                  |   8 +-
 src/node/container_printing.cc                     |   2 +-
 src/node/object_path.cc                            |  24 +-
 src/node/reflection.cc                             |   8 +-
 src/node/repr_printer.cc                           |   6 +-
 src/node/script_printer.cc                         |   6 +-
 src/node/serialization.cc                          |   7 +-
 src/node/structural_equal.cc                       |  10 +-
 src/node/structural_hash.cc                        |   4 +-
 src/relax/analysis/analysis.cc                     |  10 +-
 src/relax/analysis/computable_at_compile_time.cc   |   2 +-
 src/relax/analysis/detect_recursion.cc             |   2 +-
 src/relax/analysis/layout_transformation.cc        |   2 +-
 src/relax/analysis/struct_info_analysis.cc         |  22 +-
 src/relax/analysis/tir_op_pattern_kind.cc          |   2 +-
 src/relax/analysis/udchain.cc                      |   2 +-
 src/relax/analysis/var2value.cc                    |   4 +-
 src/relax/analysis/well_formed.cc                  |   2 +-
 src/relax/backend/contrib/clml/codegen.cc          |   7 +-
 src/relax/backend/contrib/cublas/codegen.cc        |   2 +-
 src/relax/backend/contrib/cudnn/codegen.cc         |   2 +-
 src/relax/backend/contrib/cutlass/codegen.cc       |   4 +-
 src/relax/backend/contrib/dnnl/codegen.cc          |   2 +-
 src/relax/backend/contrib/hipblas/codegen.cc       |   2 +-
 src/relax/backend/contrib/nnapi/codegen.cc         |   4 +-
 src/relax/backend/contrib/tensorrt/codegen.cc      |   7 +-
 src/relax/backend/contrib/utils.cc                 |   2 +-
 src/relax/backend/pattern_registry.cc              |   9 +-
 src/relax/backend/task_extraction.cc               |   2 +-
 src/relax/backend/vm/codegen_vm.cc                 |   4 +-
 src/relax/backend/vm/codegen_vm_tir.cc             |   2 +-
 src/relax/backend/vm/exec_builder.cc               |  44 +-
 src/relax/backend/vm/lower_runtime_builtin.cc      |   2 +-
 src/relax/backend/vm/vm_shape_lower.cc             |   2 +-
 src/relax/distributed/global_info.cc               |   2 +-
 src/relax/distributed/struct_info.cc               |  10 +-
 .../distributed/transform/legalize_redistribute.cc |   2 +-
 src/relax/distributed/transform/lower_distir.cc    |   2 +-
 .../transform/lower_global_view_to_local_view.cc   |   2 +-
 .../distributed/transform/propagate_sharding.cc    |   2 +-
 src/relax/ir/binding_rewrite.cc                    |  16 +-
 src/relax/ir/block_builder.cc                      |  40 +-
 src/relax/ir/dataflow_block_rewriter.cc            |   4 +-
 src/relax/ir/dataflow_expr_rewriter.cc             |  21 +-
 src/relax/ir/dataflow_pattern.cc                   |  74 +-
 src/relax/ir/emit_te.cc                            |   2 +-
 src/relax/ir/expr.cc                               |  62 +-
 src/relax/ir/expr_functor.cc                       |   2 +-
 src/relax/ir/py_expr_functor.cc                    |  50 +-
 src/relax/ir/struct_info.cc                        |  31 +-
 src/relax/ir/transform.cc                          |   6 +-
 src/relax/ir/type.cc                               |  12 +-
 src/relax/op/ccl/ccl.cc                            |   9 +-
 src/relax/op/distributed/distributed.cc            |   8 +-
 src/relax/op/image/resize.cc                       |   2 +-
 src/relax/op/memory/view.cc                        |   7 +-
 src/relax/op/nn/attention.cc                       |   4 +-
 src/relax/op/nn/convolution.cc                     |  10 +-
 src/relax/op/nn/nn.cc                              |  28 +-
 src/relax/op/nn/pooling.cc                         |  18 +-
 src/relax/op/op.cc                                 |  56 +-
 src/relax/op/op_common.h                           |   2 +-
 src/relax/op/tensor/binary.h                       |   2 +-
 src/relax/op/tensor/create.cc                      |  22 +-
 src/relax/op/tensor/datatype.cc                    |   4 +-
 src/relax/op/tensor/grad.cc                        |  14 +-
 src/relax/op/tensor/index.cc                       |   6 +-
 src/relax/op/tensor/linear_algebra.cc              |   6 +-
 src/relax/op/tensor/manipulate.cc                  |  46 +-
 src/relax/op/tensor/qdq.cc                         |   4 +-
 src/relax/op/tensor/sampling.cc                    |   3 +-
 src/relax/op/tensor/search.cc                      |   4 +-
 src/relax/op/tensor/set.cc                         |   4 +-
 src/relax/op/tensor/sorting.cc                     |   6 +-
 src/relax/op/tensor/statistical.cc                 |   4 +-
 src/relax/op/tensor/statistical.h                  |   2 +-
 src/relax/op/tensor/ternary.cc                     |   2 +-
 src/relax/op/tensor/unary.cc                       |   2 +-
 src/relax/testing/transform.cc                     |   2 +-
 src/relax/training/utils.cc                        |   2 +-
 src/relax/transform/adjust_matmul_order.cc         |   2 +-
 src/relax/transform/allocate_workspace.cc          |   2 +-
 src/relax/transform/alter_op_impl.cc               |   2 +-
 src/relax/transform/annotate_tir_op_pattern.cc     |   3 +-
 .../transform/attach_attr_layout_free_buffers.cc   |   2 +-
 src/relax/transform/attach_global_symbol.cc        |   2 +-
 src/relax/transform/bind_params.cc                 |   4 +-
 src/relax/transform/bind_symbolic_vars.cc          |   4 +-
 src/relax/transform/bundle_model_params.cc         |   2 +-
 src/relax/transform/call_tir_rewrite.cc            |   2 +-
 src/relax/transform/canonicalize_bindings.cc       |   3 +-
 src/relax/transform/combine_parallel_matmul.cc     |   3 +-
 src/relax/transform/compute_prim_value.cc          |   2 +-
 src/relax/transform/convert_dataflow.cc            |   2 +-
 src/relax/transform/convert_layout.cc              |   2 +-
 src/relax/transform/dataflow_inplace.cc            |  10 +-
 src/relax/transform/dead_code_elimination.cc       |   2 +-
 src/relax/transform/decompose_ops.cc               |   4 +-
 src/relax/transform/eliminate_common_subexpr.cc    |   2 +-
 src/relax/transform/expand_matmul_of_sum.cc        |   2 +-
 src/relax/transform/expand_tuple_arguments.cc      |   3 +-
 src/relax/transform/few_shot_tuning.cc             |   2 +-
 src/relax/transform/fold_constant.cc               |   2 +-
 src/relax/transform/fuse_ops.cc                    |   6 +-
 src/relax/transform/fuse_tir.cc                    |   2 +-
 src/relax/transform/gradient.cc                    |   2 +-
 src/relax/transform/inline_functions.cc            |   4 +-
 src/relax/transform/kill_after_last_use.cc         |   2 +-
 src/relax/transform/lambda_lift.cc                 |   2 +-
 src/relax/transform/lazy_transform_params.cc       |   4 +-
 src/relax/transform/legalize_ops.cc                |   2 +-
 src/relax/transform/lift_transform_params.cc       |   2 +-
 src/relax/transform/lower_alloc_tensor.cc          |   2 +-
 src/relax/transform/merge_composite_functions.cc   |   2 +-
 src/relax/transform/meta_schedule.cc               |   7 +-
 src/relax/transform/normalize.cc                   |   4 +-
 src/relax/transform/realize_vdevice.cc             |   2 +-
 src/relax/transform/remove_purity_checking.cc      |   3 +-
 src/relax/transform/remove_unused_outputs.cc       |   2 +-
 src/relax/transform/remove_unused_parameters.cc    |   2 +-
 .../transform/reorder_permute_dims_after_concat.cc |   2 +-
 src/relax/transform/reorder_take_after_matmul.cc   |   2 +-
 src/relax/transform/rewrite_cuda_graph.cc          |   2 +-
 src/relax/transform/rewrite_dataflow_reshape.cc    |   2 +-
 src/relax/transform/run_codegen.cc                 |   2 +-
 src/relax/transform/split_call_tir_by_pattern.cc   |   3 +-
 .../transform/split_layout_rewrite_preproc.cc      |   2 +-
 src/relax/transform/static_plan_block_memory.cc    |   3 +-
 src/relax/transform/to_mixed_precision.cc          |   2 +-
 src/relax/transform/to_non_dataflow.cc             |   2 +-
 src/relax/transform/topological_sort.cc            |   2 +-
 src/relax/transform/tuning_api/database.cc         |  26 +-
 src/relax/transform/tuning_api/primitives.cc       |  39 +-
 src/relax/transform/update_param_struct_info.cc    |   3 +-
 src/relax/transform/update_vdevice.cc              |   2 +-
 src/relax/utils.cc                                 |   2 +-
 src/runtime/builtin_fp16.cc                        |   8 +-
 src/runtime/c_runtime_api.cc                       | 807 ---------------------
 src/runtime/const_loader_module.cc                 |   6 +-
 src/runtime/container.cc                           | 101 ---
 src/runtime/contrib/amx/amx_config.cc              |   6 +-
 .../contrib/arm_compute_lib/acl_allocator.h        |   2 +-
 src/runtime/contrib/arm_compute_lib/acl_runtime.cc |   6 +-
 src/runtime/contrib/bnns/bnns_json_runtime.cc      |   6 +-
 src/runtime/contrib/cblas/cblas.cc                 |   8 +-
 src/runtime/contrib/cblas/dnnl_blas.cc             |   4 +-
 src/runtime/contrib/cblas/gemm_common.h            |   2 +-
 src/runtime/contrib/cblas/mkl.cc                   |  10 +-
 src/runtime/contrib/clml/clml_runtime.cc           |   4 +-
 src/runtime/contrib/clml/clml_runtime.h            |   2 +-
 src/runtime/contrib/coreml/coreml_runtime.mm       |   7 +-
 src/runtime/contrib/cublas/cublas.cc               |   8 +-
 src/runtime/contrib/cublas/cublas_json_runtime.cc  |   6 +-
 src/runtime/contrib/cublas/cublas_utils.cc         |   2 +-
 src/runtime/contrib/cudnn/conv_backward.cc         |  10 +-
 src/runtime/contrib/cudnn/conv_forward.cc          |  10 +-
 .../contrib/cudnn/cudnn_frontend/attention.cc      |   2 +-
 .../contrib/cudnn/cudnn_frontend/attention.h       |   2 +-
 src/runtime/contrib/cudnn/cudnn_json_runtime.cc    |   6 +-
 src/runtime/contrib/cudnn/cudnn_utils.cc           |   4 +-
 src/runtime/contrib/cudnn/softmax.cc               |   6 +-
 src/runtime/contrib/curand/curand.cc               |   6 +-
 src/runtime/contrib/curand/helper_cuda_kernels.h   |   2 +-
 src/runtime/contrib/cutlass/fp16_group_gemm.cu     |   4 +-
 .../contrib/cutlass/fp8_blockwise_scaled_gemm.cu   |   6 +-
 src/runtime/contrib/cutlass/fp8_gemm.cu            |   8 +-
 src/runtime/contrib/cutlass/fp8_group_gemm.cu      |   8 +-
 src/runtime/contrib/cutlass/weight_preprocess.cc   |   4 +-
 src/runtime/contrib/dnnl/dnnl.cc                   |   2 +-
 src/runtime/contrib/dnnl/dnnl_json_runtime.cc      |   6 +-
 src/runtime/contrib/dnnl/dnnl_kernel.h             |   4 +-
 src/runtime/contrib/edgetpu/edgetpu_runtime.cc     |   4 +-
 src/runtime/contrib/hipblas/hipblas.cc             |   6 +-
 .../contrib/hipblas/hipblas_json_runtime.cc        |   7 +-
 src/runtime/contrib/hipblas/hipblas_utils.cc       |   2 +-
 src/runtime/contrib/miopen/conv_forward.cc         |   6 +-
 src/runtime/contrib/miopen/miopen_utils.cc         |   2 +-
 src/runtime/contrib/miopen/softmax.cc              |   6 +-
 src/runtime/contrib/mps/conv.mm                    |   6 +-
 src/runtime/contrib/mps/gemm.mm                    |   2 +-
 src/runtime/contrib/mps/mps_utils.h                |   2 +-
 src/runtime/contrib/mrvl/mrvl_hw_runtime.cc        |   6 +-
 src/runtime/contrib/mrvl/mrvl_runtime.cc           |   6 +-
 src/runtime/contrib/mrvl/mrvl_sw_runtime_lib.cc    |   2 +-
 src/runtime/contrib/msc/tensorrt_runtime.cc        |   7 +-
 src/runtime/contrib/mscclpp/allreduce.cu           |   2 +-
 src/runtime/contrib/nnapi/nnapi_runtime.cc         |   6 +-
 src/runtime/contrib/nvshmem/init.cc                |   8 +-
 src/runtime/contrib/nvshmem/kv_transfer.cu         |   6 +-
 src/runtime/contrib/nvshmem/memory_allocator.cc    |   6 +-
 src/runtime/contrib/papi/papi.cc                   |   2 +-
 src/runtime/contrib/random/random.cc               |  12 +-
 src/runtime/contrib/rocblas/rocblas.cc             |   6 +-
 src/runtime/contrib/sort/sort.cc                   |  21 +-
 src/runtime/contrib/tensorrt/tensorrt_runtime.cc   |   6 +-
 src/runtime/contrib/tflite/tflite_runtime.cc       |   6 +-
 src/runtime/contrib/thrust/thrust.cu               |   8 +-
 src/runtime/contrib/vllm/attention_kernels.cu      |   8 +-
 src/runtime/contrib/vllm/cache_alloc.cc            |   4 +-
 src/runtime/contrib/vllm/cache_kernels.cu          |   8 +-
 src/runtime/cpu_device_api.cc                      |   4 +-
 src/runtime/cuda/cuda_device_api.cc                |  21 +-
 src/runtime/cuda/cuda_module.cc                    |   8 +-
 src/runtime/cuda/l2_cache_flush.cc                 |  13 +-
 src/runtime/debug_compile.cc                       |   6 +-
 src/runtime/device_api.cc                          | 271 +++++++
 src/runtime/disco/bcast_session.cc                 |   2 +-
 src/runtime/disco/builtin.cc                       |  48 +-
 src/runtime/disco/cuda_ipc/cuda_ipc_memory.cc      |   9 +-
 src/runtime/disco/cuda_ipc/custom_allreduce.cc     |   4 +-
 src/runtime/disco/disco_worker.cc                  |   2 +-
 src/runtime/disco/distributed/socket_session.cc    |   8 +-
 src/runtime/disco/loader.cc                        |  25 +-
 src/runtime/disco/nccl/nccl.cc                     |  35 +-
 src/runtime/disco/nccl/nccl_context.h              |   4 +-
 src/runtime/disco/process_session.cc               |   8 +-
 src/runtime/disco/protocol.h                       |   4 +-
 src/runtime/disco/session.cc                       |  24 +-
 src/runtime/disco/threaded_session.cc              |   2 +-
 src/runtime/dso_library.cc                         |   4 +-
 src/runtime/file_utils.cc                          |  17 +-
 src/runtime/hexagon/hexagon_buffer.h               |   2 +-
 src/runtime/hexagon/hexagon_common.cc              |   6 +-
 src/runtime/hexagon/hexagon_device_api.cc          |  31 +-
 src/runtime/hexagon/hexagon_module.cc              |   2 +-
 src/runtime/hexagon/hexagon_thread_manager.h       |   2 +-
 src/runtime/hexagon/hexagon_vtcm_pool.h            |   2 +-
 src/runtime/hexagon/ops/conv2d.h                   |   2 +-
 src/runtime/hexagon/ops/conv2d_fp16_hvx.cc         |  30 +-
 src/runtime/hexagon/ops/conv2d_quant_hvx.cc        |  49 +-
 src/runtime/hexagon/rpc/android/session.cc         |   4 +-
 src/runtime/hexagon/rpc/hexagon/rpc_server.cc      |   8 +-
 src/runtime/hexagon/rpc/simulator/rpc_server.cc    |   8 +-
 src/runtime/hexagon/rpc/simulator/session.cc       |   4 +-
 src/runtime/library_module.cc                      |   2 +-
 src/runtime/library_module.h                       |   2 +-
 src/runtime/logging.cc                             |   2 +-
 src/runtime/memory/memory_manager.cc               |   4 +-
 src/runtime/meta_data.h                            |   2 -
 src/runtime/metal/metal_common.h                   |   2 +-
 src/runtime/metal/metal_device_api.mm              |   8 +-
 src/runtime/metal/metal_module.mm                  |   6 +-
 src/runtime/minrpc/minrpc_server.h                 |   2 +-
 src/runtime/module.cc                              |  28 +-
 src/runtime/ndarray.cc                             | 101 +--
 src/runtime/object.cc                              |  92 ---
 src/runtime/object_internal.h                      |  96 ---
 src/runtime/opencl/opencl_common.h                 |   2 +-
 src/runtime/opencl/opencl_device_api.cc            |  19 +-
 src/runtime/opencl/opencl_module.cc                |  10 +-
 src/runtime/opencl/opencl_module_spirv.cc          |   2 +-
 src/runtime/pack_args.h                            |   9 +-
 src/runtime/packed_func.cc                         |   2 +-
 src/runtime/profiling.cc                           |  32 +-
 src/runtime/regex.cc                               |  11 +-
 src/runtime/registry.cc                            | 266 -------
 src/runtime/relax_vm/builtin.cc                    | 129 ++--
 src/runtime/relax_vm/cuda/cuda_graph_builtin.cc    |   6 +-
 src/runtime/relax_vm/executable.cc                 |   8 +-
 src/runtime/relax_vm/hexagon/builtin.cc            |   6 +-
 src/runtime/relax_vm/kv_state.cc                   |  52 +-
 src/runtime/relax_vm/kv_state.h                    |   2 +-
 src/runtime/relax_vm/lm_support.cc                 |  32 +-
 src/runtime/relax_vm/ndarray_cache_support.cc      |  28 +-
 src/runtime/relax_vm/paged_kv_cache.cc             |   4 +-
 src/runtime/relax_vm/rnn_state.cc                  |   2 +-
 src/runtime/relax_vm/vm.cc                         |   7 -
 src/runtime/rocm/rocm_device_api.cc                |  17 +-
 src/runtime/rocm/rocm_module.cc                    |  10 +-
 src/runtime/rpc/rpc_device_api.cc                  |   4 +-
 src/runtime/rpc/rpc_endpoint.cc                    |   5 +-
 src/runtime/rpc/rpc_event_impl.cc                  |   4 +-
 src/runtime/rpc/rpc_local_session.cc               |   4 +-
 src/runtime/rpc/rpc_module.cc                      |  32 +-
 src/runtime/rpc/rpc_pipe_impl.cc                   |  17 +-
 src/runtime/rpc/rpc_server_env.cc                  |   8 +-
 src/runtime/rpc/rpc_socket_impl.cc                 |   8 +-
 src/runtime/runtime_base.h                         |  67 --
 src/runtime/spirv/spirv_shader.h                   |   2 +-
 src/runtime/static_library.cc                      |   6 +-
 src/runtime/system_library.cc                      |  17 +-
 src/runtime/thread_pool.cc                         |   8 +-
 src/runtime/threading_backend.cc                   |   5 +-
 src/runtime/vulkan/vulkan_common.h                 |   4 +-
 src/runtime/vulkan/vulkan_device_api.cc            |  11 +-
 src/runtime/vulkan/vulkan_module.cc                |   6 +-
 src/runtime/vulkan/vulkan_wrapped_func.cc          |   2 +-
 src/script/ir_builder/base.cc                      |  26 +-
 src/script/ir_builder/ir/frame.cc                  |   2 +-
 src/script/ir_builder/ir/ir.cc                     |  18 +-
 src/script/ir_builder/relax/distributed.cc         |   2 +-
 src/script/ir_builder/relax/ir.cc                  |  33 +-
 src/script/ir_builder/tir/ir.cc                    | 180 ++---
 src/script/printer/doc.cc                          |  76 +-
 .../printer/doc_printer/python_doc_printer.cc      |   4 +-
 src/script/printer/ir_docsifier.cc                 |   2 +-
 src/script/printer/relax/type.cc                   |   2 +-
 src/support/ffi_testing.cc                         | 101 +--
 src/support/libinfo.cc                             |   4 +-
 src/support/socket.h                               |   3 +-
 src/target/build_common.h                          |   2 +-
 src/target/codegen.cc                              |  14 +-
 src/target/datatype/myfloat/myfloat.cc             |   2 +-
 src/target/datatype/posit/posit-wrapper.cc         |   2 +-
 src/target/datatype/registry.cc                    |  10 +-
 src/target/datatype/registry.h                     |   4 +-
 src/target/intrin_rule.h                           |   2 +-
 src/target/llvm/codegen_aarch64.cc                 |   4 +-
 src/target/llvm/codegen_amdgpu.cc                  |   8 +-
 src/target/llvm/codegen_arm.cc                     |   4 +-
 src/target/llvm/codegen_cpu.cc                     |   8 +-
 src/target/llvm/codegen_hexagon.cc                 |   4 +-
 src/target/llvm/codegen_llvm.cc                    |  13 +-
 src/target/llvm/codegen_nvptx.cc                   |   4 +-
 src/target/llvm/codegen_x86_64.cc                  |   4 +-
 src/target/llvm/intrin_rule_llvm.h                 |   2 +-
 src/target/llvm/intrin_rule_nvptx.cc               |   2 +-
 src/target/llvm/intrin_rule_rocm.cc                |   2 +-
 src/target/llvm/llvm_module.cc                     |  59 +-
 src/target/opt/build_cuda_on.cc                    |   2 +-
 src/target/source/codegen_c.cc                     |  17 +-
 src/target/source/codegen_c_host.cc                |  16 +-
 src/target/source/codegen_cuda.cc                  |   2 +-
 src/target/source/codegen_metal.cc                 |   2 +-
 src/target/source/codegen_opencl.cc                |   4 +-
 src/target/source/codegen_webgpu.cc                |   2 +-
 src/target/source/source_module.cc                 |   8 +-
 src/target/spirv/build_vulkan.cc                   |   2 +-
 src/target/spirv/intrin_rule_spirv.cc              |   2 +-
 src/target/tag.cc                                  |   6 +-
 src/target/target.cc                               |  20 +-
 src/target/target_info.cc                          |   2 +-
 src/target/target_kind.cc                          |  11 +-
 src/target/virtual_device.cc                       |   2 +-
 src/te/operation/compute_op.cc                     |   4 +-
 src/te/operation/create_primfunc.cc                |  21 +-
 src/te/operation/extern_op.cc                      |   4 +-
 src/te/operation/graph.cc                          |   6 +-
 src/te/operation/placeholder_op.cc                 |   4 +-
 src/te/operation/scan_op.cc                        |   4 +-
 src/te/tensor.cc                                   |  14 +-
 src/tir/analysis/block_access_region_detector.cc   |   5 +-
 src/tir/analysis/buffer_access_lca_detector.cc     |   3 +-
 src/tir/analysis/calculate_allocated_memory.cc     |   6 +-
 src/tir/analysis/control_flow_graph.cc             |   2 +-
 src/tir/analysis/deep_equal.cc                     |   4 +-
 src/tir/analysis/estimate_flops.cc                 |  23 +-
 src/tir/analysis/identify_memcpy.cc                |   2 +-
 src/tir/analysis/is_pure_function.cc               |   2 +-
 src/tir/analysis/oob_checker.cc                    |   2 +-
 src/tir/analysis/stmt_finding.cc                   |   2 +-
 src/tir/analysis/var_use_def_analysis.cc           |   2 +-
 src/tir/analysis/verify_gpu_code.cc                |   6 +-
 src/tir/analysis/verify_memory.cc                  |   6 +-
 src/tir/analysis/verify_ssa.cc                     |   6 +-
 src/tir/analysis/verify_well_formed.cc             |   4 +-
 src/tir/ir/block_dependence_info.cc                |   6 +-
 src/tir/ir/block_scope.cc                          |  19 +-
 src/tir/ir/buffer.cc                               |  17 +-
 src/tir/ir/data_layout.cc                          |  34 +-
 src/tir/ir/expr.cc                                 |  83 ++-
 src/tir/ir/function.cc                             |  10 +-
 src/tir/ir/index_map.cc                            |  19 +-
 src/tir/ir/script/script_complete.cc               |   2 +-
 src/tir/ir/script/script_complete.h                |   2 +-
 src/tir/ir/specialize.cc                           |   4 +-
 src/tir/ir/stmt.cc                                 |  47 +-
 src/tir/ir/stmt_functor.cc                         |  10 +-
 src/tir/ir/transform.cc                            |   4 +-
 src/tir/op/builtin.cc                              |   2 +-
 src/tir/op/op.cc                                   |  72 +-
 src/tir/schedule/analysis/analysis.cc              |  27 +-
 src/tir/schedule/analysis/layout.cc                |   2 +-
 src/tir/schedule/instruction.cc                    |   4 +-
 src/tir/schedule/primitive/decompose_padding.cc    |   2 +-
 src/tir/schedule/primitive/reduction.cc            |   2 +-
 src/tir/schedule/schedule.cc                       | 136 ++--
 src/tir/schedule/state.cc                          |  10 +-
 src/tir/schedule/trace.cc                          |  20 +-
 src/tir/schedule/transform.cc                      |   4 +-
 src/tir/transforms/annotate_device_regions.cc      |   5 +-
 src/tir/transforms/bind_params.cc                  |   2 +-
 src/tir/transforms/bound_checker.cc                |   4 +-
 src/tir/transforms/combine_context_call.cc         |   4 +-
 src/tir/transforms/common_subexpr_elim.cc          |   2 +-
 src/tir/transforms/compact_buffer_region.cc        |   2 +-
 src/tir/transforms/convert_blocks_to_opaque.cc     |   3 +-
 src/tir/transforms/convert_for_loops_serial.cc     |   2 +-
 src/tir/transforms/decorate_device_scope.cc        |   4 +-
 src/tir/transforms/default_gpu_schedule.cc         |   2 +-
 src/tir/transforms/extract_constants.cc            |   4 +-
 src/tir/transforms/flatten_buffer.cc               |   2 +-
 src/tir/transforms/force_narrow_index_to_i32.cc    |   2 +-
 src/tir/transforms/hoist_expression.cc             |   8 +-
 src/tir/transforms/inject_double_buffer.cc         |   4 +-
 src/tir/transforms/inject_permuted_layout.cc       |   2 +-
 src/tir/transforms/inject_ptx_async_copy.cc        |   2 +-
 src/tir/transforms/inject_ptx_ldg32.cc             |   4 +-
 src/tir/transforms/inject_rolling_buffer.cc        |   4 +-
 src/tir/transforms/inject_software_pipeline.cc     |   3 +-
 src/tir/transforms/inject_virtual_thread.cc        |   4 +-
 src/tir/transforms/inline_private_functions.cc     |   5 +-
 src/tir/transforms/ir_utils.cc                     |   2 +-
 src/tir/transforms/lift_thread_binding.cc          |   2 +-
 src/tir/transforms/loop_partition.cc               |   4 +-
 src/tir/transforms/lower_async_dma.cc              |   2 +-
 src/tir/transforms/lower_cross_thread_reduction.cc |   2 +-
 src/tir/transforms/lower_custom_datatypes.cc       |   4 +-
 src/tir/transforms/lower_device_kernel_launch.cc   |   4 +-
 .../transforms/lower_device_storage_access_info.cc |   4 +-
 src/tir/transforms/lower_init_block.cc             |   2 +-
 src/tir/transforms/lower_intrin.cc                 |   4 +-
 src/tir/transforms/lower_match_buffer.cc           |   2 +-
 src/tir/transforms/lower_opaque_block.cc           |   2 +-
 src/tir/transforms/lower_thread_allreduce.cc       |   4 +-
 src/tir/transforms/lower_tvm_builtin.cc            |   4 +-
 src/tir/transforms/lower_vtcm_alloc.cc             |   2 +-
 src/tir/transforms/lower_warp_memory.cc            |   4 +-
 src/tir/transforms/make_packed_api.cc              |   6 +-
 src/tir/transforms/make_unpacked_api.cc            |   4 +-
 .../manifest_shared_memory_local_stage.cc          |   2 +-
 src/tir/transforms/memhammer_lower_auto_copy.cc    |   4 +-
 src/tir/transforms/memhammer_rewrite_rule.h        |   2 +-
 .../transforms/merge_shared_memory_allocations.cc  |   4 +-
 src/tir/transforms/narrow_datatype.cc              |   4 +-
 .../plan_update_buffer_allocation_location.cc      |   2 +-
 src/tir/transforms/primfunc_utils.cc               |   6 +-
 src/tir/transforms/profile_instrumentation.cc      |   2 +-
 .../reduce_branching_through_overcompute.cc        |   2 +-
 src/tir/transforms/remap_thread_axis.cc            |   4 +-
 src/tir/transforms/remove_assume.cc                |   4 +-
 src/tir/transforms/remove_no_op.cc                 |   4 +-
 src/tir/transforms/remove_store_undef.cc           |   4 +-
 .../remove_weight_layout_rewrite_block.cc          |   2 +-
 src/tir/transforms/renew_defs.cc                   |   2 +-
 src/tir/transforms/renormalize_split_pattern.cc    |   4 +-
 src/tir/transforms/rewrite_unsafe_select.cc        |   4 +-
 src/tir/transforms/simplify.cc                     |   4 +-
 src/tir/transforms/skip_assert.cc                  |   4 +-
 src/tir/transforms/split_host_device.cc            |   4 +-
 src/tir/transforms/storage_rewrite.cc              |   6 +-
 src/tir/transforms/tensorcore_infer_fragment.cc    |   4 +-
 src/tir/transforms/thread_storage_sync.cc          |   4 +-
 src/tir/transforms/transform_mma_buffer_layout.cc  |   2 +-
 src/tir/transforms/unify_thread_binding.cc         |   2 +-
 src/tir/transforms/unroll_loop.cc                  |   4 +-
 src/tir/transforms/unsupported_dtype_legalize.cc   |  10 +-
 .../transforms/using_assume_to_reduce_branches.cc  |   2 +-
 src/tir/transforms/vectorize_loop.cc               |   4 +-
 src/topi/broadcast.cc                              |  35 +-
 src/topi/einsum.cc                                 |   2 +-
 src/topi/elemwise.cc                               |  75 +-
 src/topi/nn.cc                                     | 116 +--
 src/topi/reduction.cc                              |  25 +-
 src/topi/transform.cc                              | 169 ++---
 src/topi/utils.cc                                  |   8 +-
 src/topi/vision.cc                                 |   9 +-
 tests/cpp-runtime/hexagon/run_all_tests.cc         |   4 +-
 tests/cpp-runtime/hexagon/run_unit_tests.cc        |   4 +-
 tests/cpp-runtime/opencl/texture_copy_test.cc      |   2 +-
 tests/cpp/llvm_codegen_registry_test.cc            |   2 +-
 tests/python/contrib/test_hexagon/README_RPC.md    |   4 +-
 tests/python/runtime/test_runtime_rpc.py           |   6 +-
 version.py                                         |   4 +-
 web/emcc/tvmjs_support.cc                          |   4 +-
 web/emcc/wasm_runtime.cc                           |   5 +-
 625 files changed, 3189 insertions(+), 5392 deletions(-)
 copy ffi/tests/cpp/test_c_ffi_abi.cc => include/tvm/runtime/base.h (51%)
 delete mode 100644 include/tvm/runtime/c_runtime_api.h
 delete mode 100644 include/tvm/runtime/registry.h
 delete mode 100644 src/runtime/c_runtime_api.cc
 delete mode 100644 src/runtime/container.cc
 create mode 100644 src/runtime/device_api.cc
 delete mode 100644 src/runtime/object.cc
 delete mode 100644 src/runtime/object_internal.h
 delete mode 100644 src/runtime/registry.cc
 delete mode 100644 src/runtime/runtime_base.h


Reply via email to