This is an automated email from the ASF dual-hosted git repository.

github-bot pushed a change to branch nightly
in repository https://gitbox.apache.org/repos/asf/tvm.git


    from 38b85c9f61 [Fix][dlight] add an explicit reduction loop check in Reduce (#17711)
     add be8e43814a [Refactor] Migrate build API to `tvm.compile` (#17718)
     add 56bfd72f7b [FFI] Fix dynamic FFI index to ensure compatibility (#17727)
     add e973770932 [DataType] BF16 Support (#17670)

No new revisions were added by this update.

Summary of changes:
 apps/android_rpc/tests/android_rpc_test.py         |   2 +-
 apps/ios_rpc/tests/ios_rpc_test.py                 |   2 +-
 docs/deep_dive/tensor_ir/tutorials/tir_creation.py |   2 +-
 .../tensor_ir/tutorials/tir_transformation.py      |   2 +-
 docs/get_started/tutorials/ir_module.py            |   4 +-
 docs/get_started/tutorials/quick_start.py          |   2 +-
 docs/how_to/tutorials/cross_compilation_and_rpc.py |   4 +-
 docs/how_to/tutorials/customize_opt.py             |   2 +-
 docs/how_to/tutorials/e2e_opt_model.py             |   2 +-
 docs/reference/api/python/driver.rst               |   2 +-
 include/tvm/runtime/data_type.h                    |   2 +
 include/tvm/runtime/object.h                       |   9 +-
 include/tvm/runtime/profiling.h                    |   2 +-
 include/tvm/script/ir_builder/tir/ir.h             |   2 +
 python/tvm/_ffi/runtime_ctypes.py                  |   1 +
 python/tvm/contrib/msc/core/runtime/runner.py      |   4 +-
 .../contrib/msc/framework/tvm/runtime/runner.py    |   8 +-
 python/tvm/dlight/benchmark/bench.py               |   2 +-
 python/tvm/exec/gpu_memory_bandwidth.py            |   4 +-
 python/tvm/ir/instrument.py                        |   2 +-
 .../tvm/meta_schedule/testing/validate_database.py |   2 +-
 python/tvm/relax/frontend/nn/extern.py             |   2 +-
 python/tvm/relax/pipeline.py                       |   4 +-
 python/tvm/relax/training/trainer.py               |   2 +-
 .../transform/tuning_api/default_functions.py      |   2 +-
 python/tvm/relax/vm_build.py                       |   2 +-
 python/tvm/runtime/profiling/__init__.py           |   2 +-
 python/tvm/runtime/relax_vm.py                     |   6 +-
 python/tvm/script/ir_builder/tir/ir.py             |   4 +-
 python/tvm/testing/utils.py                        |   2 +-
 python/tvm/topi/sort.py                            |   2 +-
 .../postproc/disallow_async_strided_mem_copy.cc    |  10 +-
 src/relax/op/nn/nn.cc                              |   3 +-
 src/relax/op/op_common.h                           |   3 +-
 src/script/ir_builder/tir/ir.cc                    |   2 +
 src/target/source/codegen_c_host.cc                |  14 +-
 src/target/source/codegen_cuda.cc                  |   2 +-
 src/target/source/intrin_rule_cuda.cc              |   8 +-
 src/tir/op/op.cc                                   |   2 +-
 src/tir/transforms/unsupported_dtype_legalize.cc   |  48 ++-
 .../test_minimal_target_codegen_llvm.py            |   2 +-
 tests/python/codegen/test_gpu_codegen_allreduce.py |   6 +-
 tests/python/codegen/test_inject_ptx_ldg32.py      |   2 +-
 tests/python/codegen/test_target_codegen.py        |   8 +-
 .../python/codegen/test_target_codegen_aarch64.py  |  40 +--
 tests/python/codegen/test_target_codegen_arm.py    |   8 +-
 tests/python/codegen/test_target_codegen_blob.py   |   4 +-
 tests/python/codegen/test_target_codegen_bool.py   |   2 +-
 tests/python/codegen/test_target_codegen_c_host.py |  12 +-
 .../codegen/test_target_codegen_cross_llvm.py      |   4 +-
 tests/python/codegen/test_target_codegen_cuda.py   |  57 ++--
 .../python/codegen/test_target_codegen_cuda_fp4.py |   8 +-
 .../python/codegen/test_target_codegen_cuda_fp8.py |  24 +-
 tests/python/codegen/test_target_codegen_device.py |   4 +-
 tests/python/codegen/test_target_codegen_extern.py |   6 +-
 .../codegen/test_target_codegen_gpu_common.py      |   2 +-
 .../python/codegen/test_target_codegen_hexagon.py  |   6 +-
 tests/python/codegen/test_target_codegen_llvm.py   |  93 +++---
 tests/python/codegen/test_target_codegen_metal.py  |  14 +-
 tests/python/codegen/test_target_codegen_opencl.py |  23 +-
 tests/python/codegen/test_target_codegen_riscv.py  |   5 +-
 tests/python/codegen/test_target_codegen_rocm.py   |   8 +-
 tests/python/codegen/test_target_codegen_vulkan.py |  18 +-
 tests/python/codegen/test_target_codegen_x86.py    |   7 +-
 tests/python/contrib/test_cblas.py                 |   8 +-
 tests/python/contrib/test_dlpack.py                |   2 +-
 .../python/contrib/test_hexagon/infrastructure.py  |   2 +-
 .../test_hexagon/test_2d_physical_buffers.py       |   4 +-
 .../test_hexagon/test_async_dma_pipeline.py        |   2 +-
 .../test_hexagon/test_benchmark_elemwise_add.py    |   2 +-
 .../test_hexagon/test_benchmark_maxpool2d.py       |   2 +-
 .../contrib/test_hexagon/test_dma_builtin.py       |   2 +-
 .../contrib/test_hexagon/test_memory_alloc.py      |   2 +-
 .../contrib/test_hexagon/test_meta_schedule.py     |   2 +-
 .../contrib/test_hexagon/test_parallel_hvx.py      |   2 +-
 .../test_hexagon/test_parallel_hvx_load_vtcm.py    |   4 +-
 .../contrib/test_hexagon/test_parallel_scalar.py   |   2 +-
 .../test_relax_2d_buffer_allocation.py             |   2 +-
 .../contrib/test_hexagon/test_relax_integration.py |   8 +-
 tests/python/contrib/test_hexagon/test_sigmoid.py  |   2 +-
 .../test_hexagon/test_software_pipeline_async.py   |   2 +-
 tests/python/contrib/test_hexagon/test_take.py     |   2 +-
 .../contrib/test_hexagon/test_thread_pool.py       |   4 +-
 tests/python/contrib/test_hexagon/test_vtcm.py     |   8 +-
 .../contrib/test_hexagon/test_vtcm_bandwidth.py    |   2 +-
 tests/python/contrib/test_hipblas.py               |   4 +-
 tests/python/contrib/test_mps.py                   |   4 +-
 tests/python/contrib/test_msc/test_plugin.py       |   2 +-
 .../contrib/test_msc/test_translate_relax.py       |   2 +-
 .../contrib/test_msc/test_translate_tensorrt.py    |   2 +-
 tests/python/contrib/test_random.py                |   6 +-
 tests/python/contrib/test_rocblas.py               |   4 +-
 tests/python/contrib/test_sort.py                  |   4 +-
 .../python/contrib/test_tir_triton_integration.py  |   2 +-
 tests/python/disco/test_callback.py                |   2 +-
 tests/python/disco/test_ccl.py                     |   4 +-
 tests/python/disco/test_loader.py                  |   2 +-
 tests/python/disco/test_session.py                 |   4 +-
 tests/python/ir/test_datatype_nv_fp8.py            |   2 +-
 tests/python/ir/test_pass_instrument.py            |   2 +-
 .../meta_schedule/test_meta_schedule_tune_tir.py   |   2 +-
 tests/python/nightly/test_nnapi/infrastructure.py  |   2 +-
 tests/python/nightly/test_nnapi/test_network.py    |   2 +-
 tests/python/nightly/test_nnapi/test_ops.py        |   2 +-
 tests/python/relax/backend/clml/utils.py           |   4 +-
 .../test_runtime_builtin_kv_cache_transfer.py      |   2 +-
 .../relax/test_backend_dispatch_sort_scan.py       |   2 +-
 tests/python/relax/test_codegen_coreml.py          |   4 +-
 tests/python/relax/test_codegen_cublas.py          |   2 +-
 tests/python/relax/test_codegen_cudnn.py           |   2 +-
 tests/python/relax/test_codegen_cutlass.py         |  18 +-
 tests/python/relax/test_codegen_dnnl.py            |   2 +-
 tests/python/relax/test_codegen_hipblas.py         |   2 +-
 tests/python/relax/test_codegen_tensorrt.py        |   2 +-
 tests/python/relax/test_codegen_tir_cutlass.py     |  12 +-
 tests/python/relax/test_contrib_vllm.py            |   2 +-
 tests/python/relax/test_dataflow_inplace.py        |   4 +-
 tests/python/relax/test_dataflow_pattern.py        |   4 +-
 tests/python/relax/test_e2e_op_dynamic.py          |   2 +-
 .../python/relax/test_frontend_nn_extern_module.py |   4 +-
 tests/python/relax/test_frontend_nn_op.py          |   8 +-
 tests/python/relax/test_frontend_onnx.py           |   2 +-
 tests/python/relax/test_frontend_stablehlo.py      |   4 +-
 tests/python/relax/test_op_gradient_numeric.py     |   4 +-
 tests/python/relax/test_op_inspect.py              |  18 +-
 tests/python/relax/test_op_take.py                 |  10 +-
 tests/python/relax/test_op_view.py                 |  10 +-
 tests/python/relax/test_pipeline.py                |   4 +-
 ...runtime_builtin_paged_attention_kv_cache_cpu.py |   2 +-
 ..._builtin_paged_attention_kv_cache_flashinfer.py |   2 +-
 ...ltin_paged_attention_kv_cache_mla_flashinfer.py |   2 +-
 ...ime_builtin_paged_attention_kv_cache_mla_tir.py |   2 +-
 ...runtime_builtin_paged_attention_kv_cache_tir.py |   2 +-
 .../python/relax/test_runtime_builtin_rnn_state.py |   2 +-
 tests/python/relax/test_tir_call_source_kernel.py  |   2 +-
 .../relax/test_training_optimizer_numeric.py       |   2 +-
 .../python/relax/test_training_trainer_numeric.py  |   8 +-
 tests/python/relax/test_transform_bind_params.py   |   4 +-
 tests/python/relax/test_transform_codegen_pass.py  |   6 +-
 .../python/relax/test_transform_few_shot_tuning.py |   4 +-
 .../test_transform_fold_batch_norm_to_conv2d.py    |   4 +-
 .../relax/test_transform_gradient_numeric.py       |   2 +-
 .../relax/test_transform_lazy_transform_params.py  |   2 +-
 .../relax/test_vm_alloc_storage_with_scope.py      |   6 +-
 tests/python/relax/test_vm_builtin.py              |   4 +-
 tests/python/relax/test_vm_callback_function.py    |   6 +-
 tests/python/relax/test_vm_cuda_graph.py           |   2 +-
 tests/python/relax/test_vm_execbuilder.py          |   2 +-
 tests/python/relax/test_vm_instrument.py           |   4 +-
 tests/python/relax/test_vm_multi_device.py         |   2 +-
 tests/python/relax/test_vm_profiler.py             |   4 +-
 .../python/runtime/test_evaluator_with_preproc.py  |  10 +-
 tests/python/runtime/test_runtime_dlpack.py        |   2 +-
 tests/python/runtime/test_runtime_extension.py     |   2 +-
 tests/python/runtime/test_runtime_measure.py       |   2 +-
 tests/python/runtime/test_runtime_module_export.py |   4 +-
 tests/python/runtime/test_runtime_module_load.py   |  25 +-
 .../python/runtime/test_runtime_module_property.py |   2 +-
 tests/python/runtime/test_runtime_rpc.py           |  10 +-
 tests/python/runtime/test_runtime_trace.py         |  14 +-
 tests/python/target/test_arm_target.py             |   8 +-
 tests/python/target/test_target_target.py          |   2 +-
 tests/python/te/test_te_create_primfunc.py         |   4 +-
 tests/python/tir-base/test_tir_base.py             |   2 +-
 tests/python/tir-base/test_tir_imm_values.py       |  48 +--
 tests/python/tir-base/test_tir_intrin.py           |  10 +-
 tests/python/tir-base/test_tir_ptx_cp_async.py     |   6 +-
 tests/python/tir-base/test_tir_ptx_ldmatrix.py     |   2 +-
 tests/python/tir-base/test_tir_ptx_mma.py          |  40 ++-
 tests/python/tir-base/test_tir_ptx_mma_sp.py       |   4 +-
 .../python/tir-base/test_tir_te_extern_primfunc.py |   4 +-
 tests/python/tir-base/test_tir_texture_scope.py    |   2 +-
 .../test_tir_schedule_decompose_padding.py         |   4 +-
 .../test_tir_schedule_rolling_buffer.py            |   4 +-
 ..._tir_schedule_tensorize_ldmatrix_mma_numeric.py |   2 +-
 .../test_tir_schedule_tensorize_mfma_numeric.py    |   2 +-
 .../test_tir_transform_bf16_legalize.py            | 364 ++++++++++++++++-----
 .../test_tir_transform_inject_ptx_async_copy.py    |  10 +-
 .../test_tir_transform_inject_software_pipeline.py |   2 +-
 .../test_tir_transform_lower_intrin.py             |   2 +-
 .../test_tir_transform_lower_tvm_builtin.py        |   4 +-
 .../test_tir_transform_make_packed_api.py          |   8 +-
 .../tir-transform/test_tir_transform_vectorize.py  |   6 +-
 tests/python/tvmscript/test_tvmscript_ops.py       |   8 +-
 184 files changed, 869 insertions(+), 619 deletions(-)

Reply via email to