This is an automated email from the ASF dual-hosted git repository.
ruihangl pushed a change to branch metal-ci
in repository https://gitbox.apache.org/repos/asf/tvm.git
discard 3b8f2c3a78 [CI] Enable Metal support in TVM build process
omit abc8ae802f [FFI][REFACTOR] Streamline Object Declare Macros (#18289)
add c457400bab [CI] Enable Metal support in TVM build process
This update added new revisions after undoing existing revisions.
That is to say, some revisions that were in the old version of the
branch are not in the new version. This situation occurs
when a user --force pushes a change and generates a repository
containing something like this:
 * -- * -- B -- O -- O -- O   (3b8f2c3a78)
            \
             N -- N -- N   refs/heads/metal-ci (c457400bab)
You should already have received notification emails for all of the O
revisions, and so the following emails describe only the N revisions
from the common base, B.
Any revisions marked "omit" are not gone; other references still
refer to them. Any revisions marked "discard" are gone forever.
No new revisions were added by this update.
Summary of changes:
docs/arch/pass_infra.rst | 2 +-
docs/arch/runtime.rst | 4 +-
ffi/docs/guides/cpp_guide.md | 6 +-
ffi/docs/guides/python_guide.md | 5 +-
ffi/include/tvm/ffi/container/array.h | 3 +-
ffi/include/tvm/ffi/container/map.h | 3 +-
ffi/include/tvm/ffi/container/shape.h | 5 +-
ffi/include/tvm/ffi/container/tensor.h | 5 +-
ffi/include/tvm/ffi/error.h | 5 +-
ffi/include/tvm/ffi/extra/module.h | 6 +-
ffi/include/tvm/ffi/function.h | 5 +-
ffi/include/tvm/ffi/object.h | 106 ++++++------
ffi/include/tvm/ffi/reflection/access_path.h | 10 +-
ffi/include/tvm/ffi/string.h | 6 +-
ffi/src/ffi/extra/testing.cc | 11 +-
ffi/tests/cpp/test_example.cc | 5 +-
ffi/tests/cpp/test_reflection.cc | 7 +-
ffi/tests/cpp/testing_object.h | 36 ++--
include/tvm/arith/analyzer.h | 10 +-
include/tvm/arith/int_set.h | 6 +-
include/tvm/arith/int_solver.h | 20 ++-
include/tvm/arith/iter_affine_map.h | 25 ++-
include/tvm/ir/attrs.h | 17 +-
include/tvm/ir/diagnostic.h | 18 +-
include/tvm/ir/env_func.h | 4 +-
include/tvm/ir/expr.h | 47 ++++--
include/tvm/ir/function.h | 5 +-
include/tvm/ir/global_info.h | 16 +-
include/tvm/ir/global_var_supply.h | 8 +-
include/tvm/ir/instrument.h | 6 +-
include/tvm/ir/module.h | 3 +-
include/tvm/ir/name_supply.h | 6 +-
include/tvm/ir/op.h | 5 +-
include/tvm/ir/source_map.h | 27 +--
include/tvm/ir/transform.h | 22 ++-
include/tvm/ir/type.h | 36 ++--
include/tvm/meta_schedule/arg_info.h | 11 +-
include/tvm/meta_schedule/builder.h | 25 +--
include/tvm/meta_schedule/cost_model.h | 10 +-
include/tvm/meta_schedule/database.h | 25 +--
include/tvm/meta_schedule/extracted_task.h | 10 +-
include/tvm/meta_schedule/feature_extractor.h | 11 +-
include/tvm/meta_schedule/measure_callback.h | 11 +-
include/tvm/meta_schedule/measure_candidate.h | 6 +-
include/tvm/meta_schedule/mutator.h | 10 +-
include/tvm/meta_schedule/postproc.h | 10 +-
include/tvm/meta_schedule/profiler.h | 6 +-
include/tvm/meta_schedule/runner.h | 33 ++--
include/tvm/meta_schedule/schedule_rule.h | 11 +-
include/tvm/meta_schedule/search_strategy.h | 11 +-
include/tvm/meta_schedule/space_generator.h | 11 +-
include/tvm/meta_schedule/task_scheduler.h | 17 +-
include/tvm/meta_schedule/tune_context.h | 6 +-
include/tvm/node/script_printer.h | 8 +-
include/tvm/relax/attrs/ccl.h | 13 +-
include/tvm/relax/attrs/create.h | 8 +-
include/tvm/relax/attrs/datatype.h | 8 +-
include/tvm/relax/attrs/distributed.h | 5 +-
include/tvm/relax/attrs/image.h | 4 +-
include/tvm/relax/attrs/index.h | 9 +-
include/tvm/relax/attrs/linear_algebra.h | 8 +-
include/tvm/relax/attrs/manipulate.h | 77 ++++++---
include/tvm/relax/attrs/nn.h | 107 ++++++++----
include/tvm/relax/attrs/op.h | 24 ++-
include/tvm/relax/attrs/qdq.h | 4 +-
include/tvm/relax/attrs/sampling.h | 5 +-
include/tvm/relax/attrs/search.h | 9 +-
include/tvm/relax/attrs/sorting.h | 12 +-
include/tvm/relax/attrs/statistical.h | 9 +-
include/tvm/relax/binding_rewrite.h | 7 +-
include/tvm/relax/block_builder.h | 6 +-
include/tvm/relax/dataflow_pattern.h | 158 +++++++++++-------
include/tvm/relax/distributed/global_info.h | 6 +-
include/tvm/relax/distributed/struct_info.h | 19 ++-
include/tvm/relax/exec_builder.h | 6 +-
include/tvm/relax/expr.h | 127 +++++++++-----
include/tvm/relax/struct_info.h | 36 ++--
include/tvm/relax/tir_pattern.h | 6 +-
include/tvm/relax/transform.h | 15 +-
include/tvm/relax/type.h | 24 ++-
include/tvm/runtime/disco/cuda_ipc_memory.h | 6 +-
include/tvm/runtime/disco/session.h | 12 +-
include/tvm/runtime/memory/memory_manager.h | 6 +-
include/tvm/runtime/object.h | 37 +++--
include/tvm/runtime/profiling.h | 42 +++--
include/tvm/runtime/vm/vm.h | 11 +-
include/tvm/script/ir_builder/base.h | 13 +-
include/tvm/script/ir_builder/ir/frame.h | 8 +-
include/tvm/script/ir_builder/relax/frame.h | 48 +++---
include/tvm/script/ir_builder/tir/frame.h | 115 ++++++++-----
include/tvm/script/printer/doc.h | 185 +++++++++++++++------
include/tvm/script/printer/ir_docsifier.h | 14 +-
include/tvm/target/tag.h | 7 +-
include/tvm/target/target.h | 5 +-
include/tvm/target/target_info.h | 7 +-
include/tvm/target/target_kind.h | 5 +-
include/tvm/target/virtual_device.h | 6 +-
include/tvm/te/operation.h | 38 +++--
include/tvm/te/tensor.h | 5 +-
include/tvm/tir/block_dependence_info.h | 8 +-
include/tvm/tir/block_scope.h | 21 ++-
include/tvm/tir/buffer.h | 11 +-
include/tvm/tir/data_layout.h | 12 +-
include/tvm/tir/expr.h | 127 ++++++++------
include/tvm/tir/function.h | 12 +-
include/tvm/tir/index_map.h | 5 +-
include/tvm/tir/schedule/instruction.h | 13 +-
include/tvm/tir/schedule/schedule.h | 18 +-
include/tvm/tir/schedule/state.h | 9 +-
include/tvm/tir/schedule/trace.h | 6 +-
include/tvm/tir/stmt.h | 106 ++++++++----
include/tvm/tir/var.h | 11 +-
python/tvm/contrib/nvcc.py | 7 +-
src/arith/canonical_simplify.cc | 14 +-
src/arith/interval_set.h | 6 +-
src/arith/presburger_set.h | 10 +-
src/arith/rewrite_simplify.h | 8 +-
src/contrib/msc/core/ir/graph.h | 44 +++--
src/contrib/msc/core/ir/plugin.h | 20 ++-
src/contrib/msc/core/printer/msc_doc.h | 44 +++--
src/ir/instrument.cc | 8 +-
src/ir/transform.cc | 6 +-
src/meta_schedule/database/json_database.cc | 4 +-
src/meta_schedule/database/memory_database.cc | 5 +-
.../database/ordered_union_database.cc | 5 +-
src/meta_schedule/database/schedule_fn_database.cc | 5 +-
src/meta_schedule/database/union_database.cc | 4 +-
.../feature_extractor/per_store_feature.cc | 5 +-
.../measure_callback/add_to_database.cc | 5 +-
.../measure_callback/remove_build_artifact.cc | 5 +-
.../measure_callback/update_cost_model.cc | 5 +-
.../mutator/mutate_compute_location.cc | 5 +-
src/meta_schedule/mutator/mutate_parallel.cc | 5 +-
src/meta_schedule/mutator/mutate_thread_binding.cc | 5 +-
src/meta_schedule/mutator/mutate_tile_size.cc | 5 +-
src/meta_schedule/mutator/mutate_unroll.cc | 4 +-
.../postproc/disallow_async_strided_mem_copy.cc | 5 +-
.../postproc/disallow_dynamic_loop.cc | 5 +-
.../postproc/rewrite_cooperative_fetch.cc | 5 +-
src/meta_schedule/postproc/rewrite_layout.cc | 4 +-
.../postproc/rewrite_parallel_vectorize_unroll.cc | 5 +-
.../postproc/rewrite_reduction_block.cc | 5 +-
src/meta_schedule/postproc/rewrite_tensorize.cc | 5 +-
.../postproc/rewrite_unbound_block.cc | 5 +-
src/meta_schedule/postproc/verify_gpu_code.cc | 4 +-
src/meta_schedule/postproc/verify_vtcm_limit.cc | 5 +-
src/meta_schedule/schedule_rule/add_rfactor.cc | 4 +-
.../schedule_rule/apply_custom_rule.cc | 5 +-
src/meta_schedule/schedule_rule/auto_bind.cc | 4 +-
src/meta_schedule/schedule_rule/auto_inline.cc | 9 +-
.../schedule_rule/cross_thread_reduction.cc | 5 +-
.../schedule_rule/multi_level_tiling.h | 11 +-
.../multi_level_tiling_tensor_core.cc | 11 +-
.../multi_level_tiling_wide_vector.cc | 5 +-
.../multi_level_tiling_with_intrin.cc | 5 +-
.../schedule_rule/parallel_vectorize_unroll.cc | 5 +-
.../schedule_rule/random_compute_location.cc | 5 +-
.../search_strategy/evolutionary_search.cc | 9 +-
src/meta_schedule/search_strategy/replay_func.cc | 4 +-
src/meta_schedule/search_strategy/replay_trace.cc | 5 +-
.../space_generator/post_order_apply.cc | 4 +-
src/meta_schedule/space_generator/schedule_fn.cc | 4 +-
.../space_generator/space_generator_union.cc | 5 +-
src/meta_schedule/task_scheduler/gradient_based.cc | 5 +-
src/meta_schedule/task_scheduler/round_robin.cc | 4 +-
src/relax/backend/contrib/clml/codegen.cc | 9 +-
src/relax/backend/contrib/cutlass/codegen.cc | 6 +-
src/relax/backend/contrib/tensorrt/codegen.cc | 9 +-
src/relax/ir/dataflow_block_rewriter.cc | 9 +-
src/relax/ir/dataflow_rewriter.h | 31 ++--
src/relax/ir/emit_te.h | 5 +-
src/relax/ir/py_expr_functor.cc | 12 +-
src/relax/ir/transform.cc | 12 +-
src/relax/transform/dataflow_inplace.cc | 6 +-
src/relax/transform/infer_layout_utils.h | 12 +-
src/relax/transform/static_plan_block_memory.cc | 6 +-
.../contrib/cudnn/cudnn_frontend/attention.h | 4 +-
src/runtime/contrib/papi/papi.cc | 13 +-
src/runtime/cuda/cuda_device_api.cc | 4 +-
src/runtime/disco/bcast_session.h | 2 +-
src/runtime/disco/distributed/socket_session.cc | 5 +-
src/runtime/disco/loader.cc | 4 +-
src/runtime/disco/process_session.cc | 4 +-
src/runtime/disco/protocol.h | 4 +-
src/runtime/disco/threaded_session.cc | 5 +-
src/runtime/hexagon/hexagon_common.cc | 5 +-
src/runtime/metal/metal_device_api.mm | 4 +-
src/runtime/opencl/opencl_common.h | 3 +-
src/runtime/profiling.cc | 7 +-
src/runtime/rocm/rocm_device_api.cc | 4 +-
src/runtime/rpc/rpc_session.h | 5 +-
src/runtime/vm/cuda/cuda_graph_builtin.cc | 9 +-
src/runtime/vm/kv_state.h | 18 +-
src/runtime/vm/lm_support.cc | 9 +-
src/runtime/vm/paged_kv_cache.cc | 5 +-
src/runtime/vm/rnn_state.cc | 3 +-
src/script/printer/ir/utils.h | 6 +-
src/script/printer/relax/utils.h | 6 +-
src/script/printer/tir/utils.h | 6 +-
src/support/ffi_testing.cc | 4 +-
src/tir/ir/py_functor.cc | 16 +-
src/tir/ir/transform.cc | 6 +-
src/tir/schedule/analysis.h | 15 +-
src/tir/transforms/hoist_expression.cc | 18 +-
src/tir/transforms/inject_double_buffer.cc | 9 +-
src/tir/transforms/loop_partition.cc | 8 +-
.../reduce_branching_through_overcompute.cc | 9 +-
src/tir/transforms/remove_no_op.cc | 7 +-
src/tir/transforms/simplify.cc | 7 +-
src/tir/transforms/unroll_loop.cc | 7 +-
tests/cpp/object_protocol_test.cc | 12 +-
tests/python/codegen/test_gpu_codegen_allreduce.py | 13 +-
212 files changed, 1975 insertions(+), 1183 deletions(-)