This is an automated email from the ASF dual-hosted git repository.
github-bot pushed a change to branch nightly
in repository https://gitbox.apache.org/repos/asf/tvm.git
from 162d43a997 [Relax][PyTorch] Add support for torch.einsum (#17186)
add e647684775 [MetaSchedule] Replace `xgboost.rabit` with `xgboost.collective` because it's deprecated (#17166)
add bbc97c77fb [Disco] Group-wise operation (#17180)
add 50d1c97dc9 [DLIGHT][GPU] Add OpenCL dequant matmul schedule (#17187)
add 7c9969bbdf Remove and replace deprecated `distutils.util.strtobool()` (#17185)
add 89b91e2b11 [KVCache] Partial layers support (#17192)
No new revisions were added by this update.
Summary of changes:
include/tvm/relax/attrs/ccl.h | 18 ++
include/tvm/runtime/disco/builtin.h | 15 +-
include/tvm/runtime/disco/disco_worker.h | 23 ++-
include/tvm/runtime/disco/session.h | 8 +-
python/tvm/auto_scheduler/testing/tune_onnx.py | 2 +-
python/tvm/auto_scheduler/testing/tune_relay.py | 2 +-
python/tvm/auto_scheduler/testing/tune_te.py | 2 +-
python/tvm/autotvm/testing/tune_relay.py | 2 +-
python/tvm/dlight/gpu/matmul.py | 144 ++++++++++++++--
python/tvm/exec/disco_worker.py | 15 +-
python/tvm/meta_schedule/cost_model/xgb_model.py | 9 +-
python/tvm/meta_schedule/testing/tune_onnx.py | 2 +-
python/tvm/meta_schedule/testing/tune_relay.py | 2 +-
python/tvm/meta_schedule/testing/tune_te.py | 2 +-
.../tvm/meta_schedule/testing/validate_database.py | 2 +-
python/tvm/relax/frontend/nn/op.py | 13 +-
python/tvm/relax/op/ccl/ccl.py | 24 +--
python/tvm/relax/transform/legalize_ops/ccl.py | 10 +-
python/tvm/runtime/disco/process_pool.py | 10 +-
python/tvm/runtime/disco/session.py | 101 ++++++++---
python/tvm/testing/utils.py | 15 ++
src/relax/op/ccl/ccl.cc | 22 ++-
src/relax/op/ccl/ccl.h | 4 +-
src/runtime/disco/builtin.cc | 34 ++--
src/runtime/disco/cuda_ipc/cuda_ipc_memory.cc | 4 +-
src/runtime/disco/cuda_ipc/custom_allreduce.cc | 4 +-
src/runtime/disco/disco_worker.cc | 9 -
src/runtime/disco/disco_worker_thread.h | 4 +-
src/runtime/disco/loader.cc | 8 +-
src/runtime/disco/nccl/nccl.cc | 102 ++++++-----
src/runtime/disco/nccl/nccl_context.h | 13 +-
src/runtime/disco/process_session.cc | 21 ++-
src/runtime/disco/threaded_session.cc | 16 +-
src/runtime/relax_vm/paged_kv_cache.cc | 82 ++++++---
tests/python/disco/test_callback.py | 11 +-
tests/python/disco/test_ccl.py | 168 +++++++++++++++++-
tests/python/disco/test_loader.py | 3 +-
tests/python/disco/test_session.py | 20 +--
tests/python/dlight/test_gpu_matmul.py | 192 +++++++++++++++++----
...ributed_transform_lower_global_to_local_view.py | 4 +-
..._builtin_paged_attention_kv_cache_flashinfer.py | 2 +-
...runtime_builtin_paged_attention_kv_cache_tir.py | 2 +-
.../relax/test_transform_legalize_ops_ccl.py | 18 +-
43 files changed, 886 insertions(+), 278 deletions(-)