This is an automated email from the ASF dual-hosted git repository.
github-bot pushed a change to branch nightly
in repository https://gitbox.apache.org/repos/asf/tvm.git
from c655f14e03 [3rdparty] Bump cutlass_fpA_intB_gemm to fix SM90 build (#18291)
add abc8ae802f [FFI][REFACTOR] Streamline Object Declare Macros (#18289)
add cf80a824d1 [Fix] Set DRefObj and CUDAIPCMemoryObj as mutable (#18294)
add 73b6851a54 [FFI][ABI] Introduce generic stream exchange protocol (#18295)
add bf71ef4a0c [FFI] Temp skip windows tests (#18297)
add 3ff16e8253 [Fix] Add libxml2 dependency to fix Windows CI build failure (#18296)
add 485a309dcd [FFI] Fix system library symbol lookup (#18298)
No new revisions were added by this update.
Summary of changes:
.github/workflows/main.yml | 2 +-
cmake/utils/FindLLVM.cmake | 4 +
conda/build-environment.yaml | 1 +
docs/arch/pass_infra.rst | 2 +-
docs/arch/runtime.rst | 4 +-
ffi/docs/guides/cpp_guide.md | 6 +-
ffi/docs/guides/python_guide.md | 5 +-
ffi/include/tvm/ffi/container/array.h | 3 +-
ffi/include/tvm/ffi/container/map.h | 3 +-
ffi/include/tvm/ffi/container/shape.h | 5 +-
ffi/include/tvm/ffi/container/tensor.h | 5 +-
ffi/include/tvm/ffi/error.h | 5 +-
ffi/include/tvm/ffi/extra/c_env_api.h | 6 +-
ffi/include/tvm/ffi/extra/module.h | 6 +-
ffi/include/tvm/ffi/function.h | 5 +-
ffi/include/tvm/ffi/object.h | 106 ++++++------
ffi/include/tvm/ffi/reflection/access_path.h | 10 +-
ffi/include/tvm/ffi/string.h | 6 +-
ffi/pyproject.toml | 2 +-
ffi/python/tvm_ffi/cython/base.pxi | 91 ++++++----
ffi/python/tvm_ffi/cython/function.pxi | 29 +++-
ffi/python/tvm_ffi/cython/tensor.pxi | 24 +++
ffi/scripts/benchmark_dlpack.py | 26 ++-
ffi/src/ffi/extra/library_module_system_lib.cc | 15 +-
ffi/src/ffi/extra/stream_context.cc | 4 +-
ffi/src/ffi/extra/testing.cc | 11 +-
ffi/tests/cpp/test_example.cc | 5 +-
ffi/tests/cpp/test_reflection.cc | 7 +-
ffi/tests/cpp/testing_object.h | 36 ++--
ffi/tests/python/test_load_inline.py | 4 +
include/tvm/arith/analyzer.h | 10 +-
include/tvm/arith/int_set.h | 6 +-
include/tvm/arith/int_solver.h | 20 +--
include/tvm/arith/iter_affine_map.h | 25 +--
include/tvm/ir/attrs.h | 17 +-
include/tvm/ir/diagnostic.h | 18 +-
include/tvm/ir/env_func.h | 4 +-
include/tvm/ir/expr.h | 47 ++----
include/tvm/ir/function.h | 5 +-
include/tvm/ir/global_info.h | 16 +-
include/tvm/ir/global_var_supply.h | 8 +-
include/tvm/ir/instrument.h | 6 +-
include/tvm/ir/module.h | 3 +-
include/tvm/ir/name_supply.h | 6 +-
include/tvm/ir/op.h | 5 +-
include/tvm/ir/source_map.h | 27 ++-
include/tvm/ir/transform.h | 22 +--
include/tvm/ir/type.h | 36 ++--
include/tvm/meta_schedule/arg_info.h | 11 +-
include/tvm/meta_schedule/builder.h | 25 ++-
include/tvm/meta_schedule/cost_model.h | 10 +-
include/tvm/meta_schedule/database.h | 25 ++-
include/tvm/meta_schedule/extracted_task.h | 10 +-
include/tvm/meta_schedule/feature_extractor.h | 11 +-
include/tvm/meta_schedule/measure_callback.h | 11 +-
include/tvm/meta_schedule/measure_candidate.h | 6 +-
include/tvm/meta_schedule/mutator.h | 10 +-
include/tvm/meta_schedule/postproc.h | 10 +-
include/tvm/meta_schedule/profiler.h | 6 +-
include/tvm/meta_schedule/runner.h | 33 ++--
include/tvm/meta_schedule/schedule_rule.h | 11 +-
include/tvm/meta_schedule/search_strategy.h | 11 +-
include/tvm/meta_schedule/space_generator.h | 11 +-
include/tvm/meta_schedule/task_scheduler.h | 17 +-
include/tvm/meta_schedule/tune_context.h | 6 +-
include/tvm/node/script_printer.h | 8 +-
include/tvm/relax/attrs/ccl.h | 13 +-
include/tvm/relax/attrs/create.h | 8 +-
include/tvm/relax/attrs/datatype.h | 8 +-
include/tvm/relax/attrs/distributed.h | 5 +-
include/tvm/relax/attrs/image.h | 4 +-
include/tvm/relax/attrs/index.h | 9 +-
include/tvm/relax/attrs/linear_algebra.h | 8 +-
include/tvm/relax/attrs/manipulate.h | 77 +++------
include/tvm/relax/attrs/nn.h | 107 ++++--------
include/tvm/relax/attrs/op.h | 24 +--
include/tvm/relax/attrs/qdq.h | 4 +-
include/tvm/relax/attrs/sampling.h | 5 +-
include/tvm/relax/attrs/search.h | 9 +-
include/tvm/relax/attrs/sorting.h | 12 +-
include/tvm/relax/attrs/statistical.h | 9 +-
include/tvm/relax/binding_rewrite.h | 7 +-
include/tvm/relax/block_builder.h | 6 +-
include/tvm/relax/dataflow_pattern.h | 158 +++++++-----------
include/tvm/relax/distributed/global_info.h | 6 +-
include/tvm/relax/distributed/struct_info.h | 19 +--
include/tvm/relax/exec_builder.h | 6 +-
include/tvm/relax/expr.h | 127 +++++---------
include/tvm/relax/struct_info.h | 36 ++--
include/tvm/relax/tir_pattern.h | 6 +-
include/tvm/relax/transform.h | 15 +-
include/tvm/relax/type.h | 24 +--
include/tvm/runtime/disco/cuda_ipc_memory.h | 6 +-
include/tvm/runtime/disco/session.h | 13 +-
include/tvm/runtime/memory/memory_manager.h | 6 +-
include/tvm/runtime/object.h | 37 ++---
include/tvm/runtime/profiling.h | 42 ++---
include/tvm/runtime/vm/vm.h | 11 +-
include/tvm/script/ir_builder/base.h | 13 +-
include/tvm/script/ir_builder/ir/frame.h | 8 +-
include/tvm/script/ir_builder/relax/frame.h | 48 +++---
include/tvm/script/ir_builder/tir/frame.h | 115 +++++--------
include/tvm/script/printer/doc.h | 185 ++++++---------------
include/tvm/script/printer/ir_docsifier.h | 14 +-
include/tvm/target/tag.h | 7 +-
include/tvm/target/target.h | 5 +-
include/tvm/target/target_info.h | 7 +-
include/tvm/target/target_kind.h | 5 +-
include/tvm/target/virtual_device.h | 6 +-
include/tvm/te/operation.h | 38 ++---
include/tvm/te/tensor.h | 5 +-
include/tvm/tir/block_dependence_info.h | 8 +-
include/tvm/tir/block_scope.h | 21 +--
include/tvm/tir/buffer.h | 11 +-
include/tvm/tir/data_layout.h | 12 +-
include/tvm/tir/expr.h | 127 ++++++--------
include/tvm/tir/function.h | 12 +-
include/tvm/tir/index_map.h | 5 +-
include/tvm/tir/schedule/instruction.h | 13 +-
include/tvm/tir/schedule/schedule.h | 18 +-
include/tvm/tir/schedule/state.h | 9 +-
include/tvm/tir/schedule/trace.h | 6 +-
include/tvm/tir/stmt.h | 106 ++++--------
include/tvm/tir/var.h | 11 +-
python/tvm/contrib/nvcc.py | 7 +-
src/arith/canonical_simplify.cc | 14 +-
src/arith/interval_set.h | 6 +-
src/arith/presburger_set.h | 10 +-
src/arith/rewrite_simplify.h | 8 +-
src/contrib/msc/core/ir/graph.h | 44 ++---
src/contrib/msc/core/ir/plugin.h | 20 +--
src/contrib/msc/core/printer/msc_doc.h | 44 ++---
src/ir/instrument.cc | 8 +-
src/ir/transform.cc | 6 +-
src/meta_schedule/database/json_database.cc | 4 +-
src/meta_schedule/database/memory_database.cc | 5 +-
.../database/ordered_union_database.cc | 5 +-
src/meta_schedule/database/schedule_fn_database.cc | 5 +-
src/meta_schedule/database/union_database.cc | 4 +-
.../feature_extractor/per_store_feature.cc | 5 +-
.../measure_callback/add_to_database.cc | 5 +-
.../measure_callback/remove_build_artifact.cc | 5 +-
.../measure_callback/update_cost_model.cc | 5 +-
.../mutator/mutate_compute_location.cc | 5 +-
src/meta_schedule/mutator/mutate_parallel.cc | 5 +-
src/meta_schedule/mutator/mutate_thread_binding.cc | 5 +-
src/meta_schedule/mutator/mutate_tile_size.cc | 5 +-
src/meta_schedule/mutator/mutate_unroll.cc | 4 +-
.../postproc/disallow_async_strided_mem_copy.cc | 5 +-
.../postproc/disallow_dynamic_loop.cc | 5 +-
.../postproc/rewrite_cooperative_fetch.cc | 5 +-
src/meta_schedule/postproc/rewrite_layout.cc | 4 +-
.../postproc/rewrite_parallel_vectorize_unroll.cc | 5 +-
.../postproc/rewrite_reduction_block.cc | 5 +-
src/meta_schedule/postproc/rewrite_tensorize.cc | 5 +-
.../postproc/rewrite_unbound_block.cc | 5 +-
src/meta_schedule/postproc/verify_gpu_code.cc | 4 +-
src/meta_schedule/postproc/verify_vtcm_limit.cc | 5 +-
src/meta_schedule/schedule_rule/add_rfactor.cc | 4 +-
.../schedule_rule/apply_custom_rule.cc | 5 +-
src/meta_schedule/schedule_rule/auto_bind.cc | 4 +-
src/meta_schedule/schedule_rule/auto_inline.cc | 9 +-
.../schedule_rule/cross_thread_reduction.cc | 5 +-
.../schedule_rule/multi_level_tiling.h | 11 +-
.../multi_level_tiling_tensor_core.cc | 11 +-
.../multi_level_tiling_wide_vector.cc | 5 +-
.../multi_level_tiling_with_intrin.cc | 5 +-
.../schedule_rule/parallel_vectorize_unroll.cc | 5 +-
.../schedule_rule/random_compute_location.cc | 5 +-
.../search_strategy/evolutionary_search.cc | 9 +-
src/meta_schedule/search_strategy/replay_func.cc | 4 +-
src/meta_schedule/search_strategy/replay_trace.cc | 5 +-
.../space_generator/post_order_apply.cc | 4 +-
src/meta_schedule/space_generator/schedule_fn.cc | 4 +-
.../space_generator/space_generator_union.cc | 5 +-
src/meta_schedule/task_scheduler/gradient_based.cc | 5 +-
src/meta_schedule/task_scheduler/round_robin.cc | 4 +-
src/relax/backend/contrib/clml/codegen.cc | 9 +-
src/relax/backend/contrib/cutlass/codegen.cc | 6 +-
src/relax/backend/contrib/tensorrt/codegen.cc | 9 +-
src/relax/ir/dataflow_block_rewriter.cc | 9 +-
src/relax/ir/dataflow_rewriter.h | 31 ++--
src/relax/ir/emit_te.h | 5 +-
src/relax/ir/py_expr_functor.cc | 12 +-
src/relax/ir/transform.cc | 12 +-
src/relax/transform/dataflow_inplace.cc | 6 +-
src/relax/transform/infer_layout_utils.h | 12 +-
src/relax/transform/static_plan_block_memory.cc | 6 +-
.../contrib/cudnn/cudnn_frontend/attention.h | 4 +-
src/runtime/contrib/papi/papi.cc | 13 +-
src/runtime/cuda/cuda_device_api.cc | 4 +-
src/runtime/device_api.cc | 3 +-
src/runtime/disco/bcast_session.h | 2 +-
src/runtime/disco/distributed/socket_session.cc | 5 +-
src/runtime/disco/loader.cc | 4 +-
src/runtime/disco/process_session.cc | 4 +-
src/runtime/disco/protocol.h | 4 +-
src/runtime/disco/threaded_session.cc | 5 +-
src/runtime/hexagon/hexagon_common.cc | 5 +-
src/runtime/metal/metal_device_api.mm | 4 +-
src/runtime/opencl/opencl_common.h | 3 +-
src/runtime/profiling.cc | 7 +-
src/runtime/rocm/rocm_device_api.cc | 4 +-
src/runtime/rpc/rpc_session.h | 5 +-
src/runtime/vm/cuda/cuda_graph_builtin.cc | 16 +-
src/runtime/vm/kv_state.h | 18 +-
src/runtime/vm/lm_support.cc | 9 +-
src/runtime/vm/paged_kv_cache.cc | 5 +-
src/runtime/vm/rnn_state.cc | 3 +-
src/script/printer/ir/utils.h | 6 +-
src/script/printer/relax/utils.h | 6 +-
src/script/printer/tir/utils.h | 6 +-
src/support/ffi_testing.cc | 4 +-
src/tir/ir/py_functor.cc | 16 +-
src/tir/ir/transform.cc | 6 +-
src/tir/schedule/analysis.h | 15 +-
src/tir/transforms/hoist_expression.cc | 18 +-
src/tir/transforms/inject_double_buffer.cc | 9 +-
src/tir/transforms/loop_partition.cc | 8 +-
.../reduce_branching_through_overcompute.cc | 9 +-
src/tir/transforms/remove_no_op.cc | 7 +-
src/tir/transforms/simplify.cc | 7 +-
src/tir/transforms/unroll_loop.cc | 7 +-
tests/cpp/object_protocol_test.cc | 12 +-
224 files changed, 1340 insertions(+), 2024 deletions(-)