This is an automated email from the ASF dual-hosted git repository.
github-actions[bot] pushed a change to branch nightly
in repository https://gitbox.apache.org/repos/asf/tvm.git
from 81e62ecbb2 [TIRx][LLVM] Support scalable Ramp lowering (#19866)
add 120812e9ac [REFACTOR][Relax] Phase out PrimValue and Relax expression wrappers (#19891)
add 08f7d9b984 [Relax] Use optional dtype for absent Relax dtype fields (#19890)
add acb65f79c6 [ONNX] Use structural checks for composite frontend tests (#19880)
add b00b85b30b [Frontend][ONNX] Fix structural tests for TVMScript checks (#19894)
add 46a9a00c8e [DOCS][TIRX] Add in-kernel profiling (CudaProfiler) tutorial (#19895)
No new revisions were added by this update.
Summary of changes:
docs/deep_dive/relax/tutorials/relax_creation.py | 2 +-
docs/get_started/tutorials/ir_module.py | 4 +-
docs/how_to/tutorials/cross_compilation_and_rpc.py | 4 +-
docs/how_to/tutorials/optimize_llm.py | 2 +-
docs/reference/api/python/ir.rst | 1 +
docs/reference/api/python/relax/op.rst | 10 +
docs/tirx/native_basics.rst | 1 +
docs/tirx/native_basics/cuda/profiling.rst | 310 +
include/tvm/ir/base_expr.h | 18 +-
include/tvm/ir/expr.h | 57 +-
include/tvm/ir/function.h | 8 +-
include/tvm/ir/module.h | 2 +-
include/tvm/ir/op.h | 14 +-
include/tvm/relax/attrs/create.h | 2 +-
include/tvm/relax/attrs/image.h | 4 +-
include/tvm/relax/attrs/linear_algebra.h | 2 +-
include/tvm/relax/attrs/manipulate.h | 6 +-
include/tvm/relax/attrs/nn.h | 12 +-
include/tvm/relax/attrs/sorting.h | 10 +-
include/tvm/relax/attrs/statistical.h | 2 +-
include/tvm/relax/expr.h | 109 +-
include/tvm/relax/expr_functor.h | 51 +-
include/tvm/relax/type.h | 18 +-
include/tvm/tirx/expr.h | 6 +-
python/tvm/backend/cuda/op.py | 7 +-
python/tvm/ir/__init__.py | 2 +-
python/tvm/ir/expr.py | 28 +-
python/tvm/ir/function.py | 4 +-
python/tvm/ir/module.py | 5 +-
python/tvm/ir/op.py | 4 +-
python/tvm/relax/__init__.py | 2 +-
python/tvm/relax/backend/metal/coreml.py | 5 +-
python/tvm/relax/expr.py | 57 +-
python/tvm/relax/expr_functor.py | 40 +-
python/tvm/relax/frontend/nn/extern.py | 6 +-
python/tvm/relax/frontend/nn/llm/kv_cache.py | 48 +-
python/tvm/relax/frontend/nn/modules.py | 4 +-
python/tvm/relax/frontend/nn/op.py | 12 +-
python/tvm/relax/frontend/onnx/onnx_frontend.py | 61 +-
.../tvm/relax/frontend/tflite/tflite_frontend.py | 12 +-
.../frontend/torch/base_fx_graph_translator.py | 26 +-
.../frontend/torch/exported_program_translator.py | 4 +-
python/tvm/relax/frontend/torch/fx_translator.py | 4 +-
python/tvm/relax/op/base.py | 2 +-
python/tvm/relax/op/builtin/builtin.py | 4 +-
python/tvm/relax/op/create.py | 73 +-
python/tvm/relax/op/manipulate.py | 34 +-
python/tvm/relax/op/memory/memory.py | 8 +-
python/tvm/relax/op/memory/view.py | 12 +-
python/tvm/relax/op/set.py | 12 +-
python/tvm/relax/op/vm/vm.py | 8 +-
python/tvm/relax/relax_to_pyfunc_converter.py | 8 +-
python/tvm/relax/script/builder/ir.py | 18 +-
python/tvm/relax/script/parser/parser.py | 27 +-
python/tvm/relax/testing/ast_printer.py | 3 -
.../fold_batch_norm_to_conv2d_for_inference.py | 2 +-
.../tvm/relax/transform/ipc_allreduce_rewrite.py | 2 +-
.../tvm/relax/transform/lazy_transform_params.py | 6 +-
python/tvm/relax/transform/legalize_ops/binary.py | 10 +-
python/tvm/relax/transform/legalize_ops/common.py | 6 +-
python/tvm/relax/transform/legalize_ops/create.py | 18 +-
.../tvm/relax/transform/legalize_ops/datatype.py | 4 +-
python/tvm/relax/transform/legalize_ops/index.py | 6 +-
.../relax/transform/legalize_ops/linear_algebra.py | 2 +-
.../tvm/relax/transform/legalize_ops/manipulate.py | 5 +-
.../relax/transform/lower_gpu_ipc_alloc_storage.py | 2 +-
python/tvm/relax/type.py | 2 +
python/tvm/relax/utils.py | 28 +-
src/arith/canonical_simplify.cc | 12 +-
src/arith/const_fold.h | 4 +-
src/arith/iter_affine_map.cc | 8 +-
src/backend/trn/transform/lower_trainium_layout.cc | 2 +-
src/ir/expr.cc | 7 +-
src/ir/module.cc | 4 +-
src/relax/analysis/type_analysis.cc | 35 +-
src/relax/backend/contrib/codegen_c/codegen_c.h | 2 +-
.../backend/contrib/codegen_json/codegen_json.h | 4 +-
src/relax/backend/contrib/cutlass/codegen.cc | 4 +-
src/relax/backend/contrib/tensorrt/codegen.cc | 11 +-
src/relax/backend/vm/codegen_vm.cc | 15 +-
src/relax/backend/vm/codegen_vm_tir.cc | 10 +-
src/relax/backend/vm/lower_runtime_builtin.cc | 10 +-
src/relax/backend/vm/vm_shape_lower.cc | 60 +-
src/relax/ir/block_builder.cc | 2 +-
src/relax/ir/dataflow_expr_rewriter.cc | 4 +-
src/relax/ir/dataflow_matcher.cc | 2 +-
src/relax/ir/dependent_type.cc | 11 +-
src/relax/ir/emit_te.cc | 2 +-
src/relax/ir/expr.cc | 19 -
src/relax/ir/expr_functor.cc | 21 +-
src/relax/ir/py_expr_functor.cc | 26 +-
src/relax/op/ccl/ccl.cc | 4 +-
src/relax/op/distributed/binary.h | 2 +-
src/relax/op/distributed/distributed.cc | 2 +-
src/relax/op/distributed/linear_algebra.cc | 6 +-
src/relax/op/distributed/nn.cc | 4 +-
src/relax/op/distributed/unary.h | 5 +-
src/relax/op/image/resize.cc | 20 +-
src/relax/op/memory/view.cc | 70 +-
src/relax/op/nn/convolution.cc | 48 +-
src/relax/op/nn/convolution.h | 2 +-
src/relax/op/nn/nn.cc | 18 +-
src/relax/op/op.cc | 58 +-
src/relax/op/op_common.h | 37 +-
src/relax/op/tensor/binary.cc | 5 +-
src/relax/op/tensor/create.cc | 99 +-
src/relax/op/tensor/create.h | 8 +-
src/relax/op/tensor/index.cc | 43 +-
src/relax/op/tensor/inspect.cc | 26 +-
src/relax/op/tensor/linear_algebra.cc | 10 +-
src/relax/op/tensor/manipulate.cc | 86 +-
src/relax/op/tensor/manipulate.h | 6 +-
src/relax/op/tensor/qdq.cc | 24 +-
src/relax/op/tensor/sampling.cc | 10 +-
src/relax/op/tensor/search.cc | 5 +-
src/relax/op/tensor/set.cc | 37 +-
src/relax/op/tensor/set.h | 4 +-
src/relax/op/tensor/sorting.cc | 15 +-
src/relax/op/tensor/sorting.h | 5 +-
src/relax/op/tensor/statistical.cc | 9 +-
src/relax/op/tensor/ternary.cc | 4 +-
src/relax/op/tensor/unary.cc | 12 +-
src/relax/script/printer/dependent_type.cc | 3 +-
src/relax/script/printer/distributed.cc | 5 +-
src/relax/script/printer/expr.cc | 8 -
src/relax/transform/adjust_matmul_order.cc | 12 +-
src/relax/transform/allocate_workspace.cc | 2 +-
src/relax/transform/alter_op_impl.cc | 2 +-
src/relax/transform/call_tir_rewrite.cc | 8 +-
src/relax/transform/combine_parallel_matmul.cc | 3 +-
src/relax/transform/compute_prim_value.cc | 19 +-
src/relax/transform/dataflow_inplace.cc | 4 +-
src/relax/transform/decompose_ops.cc | 8 +-
src/relax/transform/expand_matmul_of_sum.cc | 3 +-
src/relax/transform/fold_constant.cc | 4 +-
src/relax/transform/fuse_ops.cc | 10 +-
src/relax/transform/fuse_tir.cc | 10 +-
src/relax/transform/gradient.cc | 8 +-
src/relax/transform/infer_amp_utils.cc | 8 +-
src/relax/transform/lazy_transform_params.cc | 6 +-
src/relax/transform/lift_transform_params.cc | 2 +-
src/relax/transform/lower_alloc_tensor.cc | 8 +-
src/relax/transform/merge_composite_functions.cc | 2 +-
src/relax/transform/remove_unused_outputs.cc | 3 +-
src/relax/transform/remove_unused_parameters.cc | 2 +-
src/relax/transform/reorder_take_after_matmul.cc | 4 +-
src/relax/transform/rewrite_cuda_graph.cc | 10 +-
.../specialize_primfunc_based_on_callsite.cc | 8 +-
src/relax/transform/static_plan_block_memory.cc | 26 +-
src/relax/transform/to_mixed_precision.cc | 10 +-
src/relax/utils.cc | 10 +-
src/runtime/extra/contrib/tensorrt/tensorrt_ops.cc | 2 +-
src/runtime/vm/builtin.cc | 20 +-
src/s_tir/transform/inject_virtual_thread.cc | 2 +-
src/tirx/ir/expr.cc | 68 +-
src/tirx/ir/expr_functor.cc | 4 +-
src/tirx/op/op.cc | 4 +-
src/tirx/transform/flatten_buffer.cc | 2 +-
src/tirx/transform/lower_tirx_cleanup.cc | 2 +-
.../relax/backend/adreno/test_texture_network.py | 24 +-
...est_distributed_transform_propagate_sharding.py | 136 +-
.../test_distributed_tvmscript_printer.py | 2 +-
tests/python/relax/test_analysis_type_analysis.py | 2 +-
tests/python/relax/test_ast_printer.py | 11 +-
.../relax/test_backend_transform_shape_lower.py | 5 +-
tests/python/relax/test_bind_params.py | 2 +-
tests/python/relax/test_blockbuilder_core.py | 4 +-
tests/python/relax/test_codegen_cutlass.py | 2 +-
tests/python/relax/test_codegen_tensorrt.py | 2 +-
tests/python/relax/test_dataflow_inplace.py | 12 +-
tests/python/relax/test_dataflow_pattern.py | 23 +-
tests/python/relax/test_dataflow_rewriter.py | 4 +-
tests/python/relax/test_expr.py | 52 +-
tests/python/relax/test_expr_functor.py | 16 +-
tests/python/relax/test_frontend_dynamo.py | 2 +-
.../relax/test_frontend_from_exported_program.py | 23 +-
tests/python/relax/test_frontend_from_fx.py | 21 +-
tests/python/relax/test_frontend_nn_exporter.py | 2 +-
tests/python/relax/test_frontend_nn_modules.py | 29 +-
tests/python/relax/test_frontend_nn_op.py | 12 +-
tests/python/relax/test_frontend_onnx.py | 8949 +++++++++++++++-----
tests/python/relax/test_frontend_tflite.py | 93 +-
tests/python/relax/test_op_ccl.py | 20 +-
tests/python/relax/test_op_create.py | 66 +-
tests/python/relax/test_op_index.py | 120 +-
tests/python/relax/test_op_manipulate.py | 23 +-
tests/python/relax/test_op_qdq.py | 28 +
tests/python/relax/test_op_search.py | 2 +-
tests/python/relax/test_op_view.py | 12 +
tests/python/relax/test_relax_operators.py | 2 +-
.../python/relax/test_relax_to_pyfunc_converter.py | 4 +-
tests/python/relax/test_runtime_builtin.py | 6 +-
tests/python/relax/test_training_loss.py | 6 +-
.../relax/test_transform_adjust_matmul_order.py | 104 +-
.../relax/test_transform_canonicalize_bindings.py | 6 +-
tests/python/relax/test_transform_codegen_pass.py | 2 +-
.../test_transform_combine_parallel_matmul.py | 8 +-
.../python/relax/test_transform_convert_layout.py | 2 -
.../relax/test_transform_fuse_ops_by_pattern.py | 2 +-
tests/python/relax/test_transform_gradient.py | 10 +-
.../relax/test_transform_lazy_transform_params.py | 2 +-
.../relax/test_transform_lift_transform_params.py | 16 +-
.../test_transform_merge_composite_functions.py | 2 +-
.../relax/test_transform_to_mixed_precision.py | 14 +
tests/python/relax/test_tvmscript_parser.py | 30 +-
tests/python/relax/test_tvmscript_printer_relax.py | 29 +-
tests/python/relax/test_utils.py | 1 -
tests/python/relax/test_vm_build.py | 4 +-
tests/python/relax/test_vm_codegen_only.py | 4 +-
209 files changed, 9009 insertions(+), 3503 deletions(-)
create mode 100644 docs/tirx/native_basics/cuda/profiling.rst