This is an automated email from the ASF dual-hosted git repository.

tqchen pushed a change to branch unity-staging
in repository https://gitbox.apache.org/repos/asf/tvm.git


    omit d103ee2070 [Unity][Fix] FX translating dtype (#14201)
    omit f7f24b7d16 [Unity][Frontend] FX translator returning weights with 
`keep_params_as_input` (#14197)
    omit 284b278706 [Unity][Frontend] FX translator supporting more ops (#14196)
    omit 0e98e6e478 [Unity][Op] Legalize `round`, `floor`, `ceil`, `sign` 
(#14198)
    omit 88ab7302ba [Unity][Op] Argmax and argmin (#14195)
    omit 22b65bc6eb [Unity][Op] Group normalization (#14194)
    omit 1f042218d3 [Unity][Transform] LiftTransformParams handling multiple 
functions (#14192)
    omit ed5367d161 [Unity][WEBGPU] Codegen improvements and WebRuntime (#14187)
    omit 38315afbf2 [Unity][OP] Add an operator for fused multi head attention 
(#14150)
    omit 475f3c24fa [Unity][Analysis] Restore Python bindings for var analyses 
(#14180)
    omit 781bfe0a21 [Unity][Op] Full support of Relax op `power` (#14171)
    omit 8423811429 [Unity][BYOC] Add batch matmul support to Relax CUTLASS 
BYOC (#14166)
    omit 6ee79e1e08 [Unity][Analysis] Analysis for detecting recursion in Relax 
(#14149)
    omit 3fa880aeb5 [Unity] Add bind_constants option to FuseOpsByPattern 
(#14151)
    omit e57f59178f [Unity][BYOC] Use Relax legalize + CPU build for reference 
in tests (#14162)
    omit 67659acf34 [Unity][Analysis] Checking function return struct info in 
well-formed check (#14155)
    omit 8a1e623fc1 [Unity][Pass] Support Symbolic Shape Deduction during 
BindParam (#14154)
    omit 4c085d2212 [Unity][Debugging] AST printer (#14152)
    omit c29ac7eef0 [Unity][Pass] Enhance constant folding to fold relax ops by 
evaluating them. (#14146)
    omit 7a5d313068 [Unity][Legalize] Fix Scalar Constant Legalization (#14127)
    omit 63ce37d30b [Unity] Add callback to FuseOpsByPattern to check match 
result is accepted (#14109)
    omit 28c6825655 [Unity][BYOC] Assign group to unused bindings and ignroe 
PrimFunc (#14139)
    omit 4713b527cb [Unity][TVMScript] emit_te sugar (#14123)
    omit 368d9f6193 [Unity][BYOC] Add transposed matmul support to Relax 
CUTLASS BYOC (#14128)
    omit 61c27610c9 [Unity] Add Global info (#14132)
    omit 57c86eb774 [Unity][WEB] Relax vm on web runtime (#14131)
    omit c7d2c38dd9 [Unity][BlockBuilder] Add `name_hint` argument for `emit` 
and `emit_output` (#14126)
    omit 02b3a1f2ff [Unity][Fix] Fix bug in MergeCompositeFunctions (#14117)
    omit 89bb68b0a0 [Unity] Update tests again to adapt to latest TVMScript 
syntax (#14115)
    omit eaaa1fbdcb [Unity][BYOC]Add relax backend pattern registry (#14106)
    omit b755a6f004 [Unity] Remove attributes of relax.print, assert and unique 
(#14101)
    omit 98d0a01bc9 [Unity][Layout] Add layout transformation analysis for 
PrimFunc (#14066)
    omit 74f3007c81 [Unity] Relax Recursive function (#14092)
    omit a8338e6b69 [Unity] Lower `shape_of` to a builtin (#14093)
    omit b1f2d530fc [Unity] Fix typo in the comment (#14096)
    omit cf36b7bdac [Unity][Relax] Set Shape Function to Be Host Function 
(#14090)
    omit 19509408b4 [Unity] Refactor Relax Build JIT UX (#14088)
    omit acd0e0b999 [Unity][Fix][Pass] FoldConstant with DCE in dataflow block 
(#14087)
    omit 6e2d7bbfd4 [Unity][Analysis] TIR pattern kind analysis for 
multi-buffer write block (#14075)
    omit 7645aa7688 [Unity][Op] `log_softmax` and `cross_entropy_with_logits` 
(#14083)
    omit defc15b6f2 [Unity][BYOC] Add DNNL backend (#14082)
    omit b8460ebabc [Unity][BYOC] Add CUTLASS backend (#14081)
    omit 3a64963901 [Unity] Add testcases for `expr_args_converter` (#14080)
    omit 4ad8d64155 [Unity][Pass] Canonicalize Bindings (#14079)
    omit e8a0c4d01f [Unity][BYOC][Pass] RunCodegen and TensorRT  (#14078)
    omit 246c4c13b8 [Unity][Transform] Add LiftTransformParams pass (#14069)
    omit 0d5883539d [Unity][Frontend] Annotate number of non-static input of FX 
function (#14067)
    omit ed2696a595 [Unity][BYOC] Add pass to merge composite functions to 
offload large subgraphs (#14062)
    omit a9032d98e6 [Unity][Pass] Remove Unused Function (#14061)
    omit 06de35ec74 [Unity][Fix][Pass] Fix FuseOps for lack graph edges (#14058)
    omit fada709394 [Unity] Relax op: collapse sum (#14059)
    omit aa55c05560 [Unity][BYOC] Add pattern-based partitioning pass (#14054)
    omit fe528f647c [Unity][VM] Add per-op profiling support  (#14053)
    omit 180bead06b [Unity][TVMScript] Overload `__neg__` for relax expr 
(#14045)
    omit c1439b3adb [Unity][Pass] FuseOps FuseTIR fixes (#14044)
    omit 1b85765d5c [Unity] Statement rewriter for DataflowBlock (#14043)
    omit 782c632604 [Unity] Relax dataflow pattern language (matching) (#14041)
    omit 8039f6a75e [Unity] Update tests to adapt to latest TVMScript syntax 
(#14039)
    omit d8fdd5cdb6 [Unity] Disallow inline prim_func in relax IR (#14040)
    omit fd35d1ef5e [Unity][Pass] Block-level static memory planning (#14038)
    omit 9b5f2148fb [Unity] Initial PyTorch Frontend (#14037)
    omit 449e094e80 [Unity][Op] Add ShapeExpr Tests for Reshape Op (#14035)
    omit b150b1a6ac [Unity][Pass] Operator legalization (#14029)
    omit 596d472a4f [Unity][TVMScript] Move tir/relax import in script out of 
__init__.py (#14033)
    omit 53f800d32f [Unity][Pass] Wellformed Analysis (#14032)
    omit 91adf7b0a4 [Unity][BlockBuilder] CallTE convert PrimValue args  
(#14028)
    omit fc0540cf11 [Unity][Pass] Normalize Pass (#14031)
    omit 24470c95d7 [Unity] Relay -> Relax translator  (#14026)
    omit 88852c1e16 [Unity][Pass][TuningAPI] Introduce TuningAPI and 
MetaSchedule pass (#14014)
    omit 733fc00145 [Unity][Pass] BindParams pass, FoldConstant pass (#14016)
    omit fd5c73d62c [Unity][VM] Supporting "compiled" exec mode. (#14015)
    omit 33c4aabff9 [Unity][Pass] LambdaLift pass (#14012)
    omit 07e0dfb06e [Unity][Pass] Operator Fusion Passes (#14001)
    omit 9317ec8db7 [Unity] NestedMsg Support utility (#13995)
    omit 17cf44657d [Unity] Relax op: manipulation (#13989)
    omit b6818bba6b [Unity] Relax op: search (#13992)
    omit c788135337 [Unity] Relax op: linear algebra (#13988)
    omit 9113fc992d [Unity] Relax op: creation (#13984)
    omit 71437f7488 [Unity] Relax op: neural networks (#13993)
    omit f491b96273 [Unity] Relax op: statistical (#13991)
    omit 72bca0f3ea [Unity] Relax op: arithmetic, comparison (#13983)
    omit 5723ebb2fd [Unity] Relax op: image (#13994)
    omit 68a04a8144 [Unity] Relax op: set (#13990)
    omit 2e08c8c8bc [Unity] Relax op: datatype (#13986)
    omit e8227b91f8 [Unity] Relax op: index (#13987)
    omit ad4185cf07 [Unity][TVMScript] Use explicit `R.shape` in TVMScript 
(#13979)
    omit f735d932f6 [Unity] e2e Relax minimum build flow (#13961)
    omit a966cf115b [Unity] Relax VM shape lowering pass (#13956)
    omit 850d6a4c66 [Unity] Relax VM codegen (#13954)
    omit 846a2c59aa [Unity] Relax TVMScript Printer (#13944)
    omit 1807e6f015 [Unity] Relax TVMScript Parser. (#13932)
    omit bb0c129b7c [Unity] Relax BlockBuilder and ExprMutator (#13926)
    omit ff8bfa2732 [Unity] Basic StructInfo Analysis and Expr construction 
(#13916)
    omit b59ad4839c [Unity][CI] Unity specific jenkins setup (do not upstream 
to main) (#13910)
    omit 4d46290e7b [Unity][IR] First-class StructInfo (#13907)
    omit 9508a18d9e [Unity] Relax expressions and types (#13901)
    omit e7b02f29c1 [Unity] Relax VM (#13878)
     add a15ade30b1 [TVMC] Add option to dump TIR code to file (#14186)
     add 424c749a3d [MetaSchedule] Tile and pack intermediate output for CUDA 
TensorCore (#14108)
     add e1c2ad18e9 [TVMScript] Distinguish LetStmt and Let expression (#14207)
     add 9b9124721c [Frontend][PaddlePaddle] Fix bug in tests for upgrading 
paddlepaddle to 2.4.2 (#14206)
     add 012d6a72f6 [IR] Platform-independent SHash (#14204)
     add 2f2d5d439a [MetaSchedule] preseve global_symbol attached to function 
after applying MS (#14219)
     add be66a7e0e4 [TVMScript] Sugar T.env_thread + T.launch_thread (#14217)
     add 2c4af88563 [TVMScript] Sugar Var Definition in TIR Buffer (#14223)
     add 082c4432fb [Refactor] Move `VarUseDefAnalysis` to header file (#14185)
     add ca48cafae3 [Docker] Add script to build llvm from source (#13823)
     add 56ddd37d78 [TIR] Enhance loop unroll with unroll local access (#14224)
     add e59d1efc68 [Fix][TVMScript]TVMScript BinOP printing refactor  (#14200)
     add 9d732d0faa [TensorIR][Primitive] New schedule primitive 
`reindex_cache_read/write` (#14161)
     add e8576db88b [Fix]Fix function ObjectPath in IRModule SEqual (#14230)
     add 902c2e2db7 [TVMScript] Support SizeVar Roundtripping (#14227)
     add 1453fe0780 [PaddlePaddle Hackathon 4][Frontend][Paddle]Add 
tile/mish/stack/unstack/silu/softshrink/where op for paddle frontend (#14160)
     add 6b4e3d08ea [TEST] Fix division by 0 in llvm codegen test (#14232)
     add 52292cfa60 [TVMC][TRANSFORMS] ToMixedPrecision transform support with 
custom options enabled (#14010)
     add 75f8307c48 [LLVM][BugFix] Fix include Triplet.h bug when LLVM 
version>= 17 (#14235)
     add fd5eae44dc [CI] Update cpu and gpu image (#14245)
     add f3b64b7a67 Update to v0.12.dev0 (#14241)
     add 594bc0fea8 Relay transform for rolling a known pattern into 
batch_matmul (#14210)
     add 422ca2855a [TIR][Schedule] Fix reverse_compute_inline (#14263)
     add 302cee9948 [BYOC] DNNL C_SRC Fix (#14267)
     add 852f97d4b5 [SVE] Adding codegen tests for SVE (#14239)
     add c59bc29512 [Arith] Add simplification rule for `x - max(x+y, z)` 
(#14271)
     add 92de8e9afe [Transform] Use callable() instead of isinstance() for type 
checking (#14248)
     add e3c8f2bc2d [Frontend][Paddle]add take_alone_axis and topk converter 
for paddle frontend (#14170)
     add caf6b0339c [TVMScript][Parser] Add more warp-level builtins and 
`Range` (#14279)
     add 6fa88e38a6 [PaddlePaddle Hackathon 4][Frontend][Paddle]add 
thresholded_relu/index_select/eye/linspace/take_alone_axis/dist for paddle 
frontend (#14172)
     new 99b5cdd22a [Unity] Relax VM (#13878)
     new e9b9218cc4 [Unity] Relax expressions and types (#13901)
     new efd9a8a0ad [Unity][IR] First-class StructInfo (#13907)
     new fff7f9201a [Unity][CI] Unity specific jenkins setup (do not upstream 
to main) (#13910)
     new c1a0907f60 [Unity] Basic StructInfo Analysis and Expr construction 
(#13916)
     new 187d5f87f2 [Unity] Relax BlockBuilder and ExprMutator (#13926)
     new 60ae9aca7f [Unity] Relax TVMScript Parser. (#13932)
     new 974d00c535 [Unity] Relax TVMScript Printer (#13944)
     new 70c466d1fe [Unity] Relax VM codegen (#13954)
     new 84b9b1dd3d [Unity] Relax VM shape lowering pass (#13956)
     new dc52afb470 [Unity] e2e Relax minimum build flow (#13961)
     new 3e8560e4bc [Unity][TVMScript] Use explicit `R.shape` in TVMScript 
(#13979)
     new 57800b3103 [Unity] Relax op: index (#13987)
     new 47106a3250 [Unity] Relax op: datatype (#13986)
     new 20995b420d [Unity] Relax op: set (#13990)
     new ec01577489 [Unity] Relax op: image (#13994)
     new 73e2cb1237 [Unity] Relax op: arithmetic, comparison (#13983)
     new b94c6e4f11 [Unity] Relax op: statistical (#13991)
     new 1525c64151 [Unity] Relax op: neural networks (#13993)
     new 25d66c0b62 [Unity] Relax op: creation (#13984)
     new 8a8674f242 [Unity] Relax op: linear algebra (#13988)
     new f2ae9fc2ce [Unity] Relax op: search (#13992)
     new 6ec3ca0422 [Unity] Relax op: manipulation (#13989)
     new 17b4090846 [Unity] NestedMsg Support utility (#13995)
     new 2b6cc7b35b [Unity][Pass] Operator Fusion Passes (#14001)
     new bfd2ca073c [Unity][Pass] LambdaLift pass (#14012)
     new fb8260aa0d [Unity][VM] Supporting "compiled" exec mode. (#14015)
     new b96dbcec2d [Unity][Pass] BindParams pass, FoldConstant pass (#14016)
     new 6107a8c018 [Unity][Pass][TuningAPI] Introduce TuningAPI and 
MetaSchedule pass (#14014)
     new 4eb8887636 [Unity] Relay -> Relax translator  (#14026)
     new ff44563d87 [Unity][Pass] Normalize Pass (#14031)
     new da584fadc5 [Unity][BlockBuilder] CallTE convert PrimValue args  
(#14028)
     new 2f148e383b [Unity][Pass] Wellformed Analysis (#14032)
     new 286f737481 [Unity][TVMScript] Move tir/relax import in script out of 
__init__.py (#14033)
     new 14f16d5994 [Unity][Pass] Operator legalization (#14029)
     new 080ac05f49 [Unity][Op] Add ShapeExpr Tests for Reshape Op (#14035)
     new a063fa2b6b [Unity] Initial PyTorch Frontend (#14037)
     new 889749014a [Unity][Pass] Block-level static memory planning (#14038)
     new 444e1ee26e [Unity] Disallow inline prim_func in relax IR (#14040)
     new bce1fd0514 [Unity] Update tests to adapt to latest TVMScript syntax 
(#14039)
     new 9166b5c7b6 [Unity] Relax dataflow pattern language (matching) (#14041)
     new 604fd4ce94 [Unity] Statement rewriter for DataflowBlock (#14043)
     new c8455a23e0 [Unity][Pass] FuseOps FuseTIR fixes (#14044)
     new 5a33692494 [Unity][TVMScript] Overload `__neg__` for relax expr 
(#14045)
     new 8432c1ff21 [Unity][VM] Add per-op profiling support  (#14053)
     new 96d21260bf [Unity][BYOC] Add pattern-based partitioning pass (#14054)
     new 3736c5fcdf [Unity] Relax op: collapse sum (#14059)
     new 8efdb5bfe7 [Unity][Fix][Pass] Fix FuseOps for lack graph edges (#14058)
     new f04810b118 [Unity][Pass] Remove Unused Function (#14061)
     new 8a46f67af1 [Unity][BYOC] Add pass to merge composite functions to 
offload large subgraphs (#14062)
     new 680c811b86 [Unity][Frontend] Annotate number of non-static input of FX 
function (#14067)
     new 8700dfc00b [Unity][Transform] Add LiftTransformParams pass (#14069)
     new 2fa1246a6e [Unity][BYOC][Pass] RunCodegen and TensorRT  (#14078)
     new fd2cfc5f2a [Unity][Pass] Canonicalize Bindings (#14079)
     new c6158401ee [Unity] Add testcases for `expr_args_converter` (#14080)
     new 336fb434e5 [Unity][BYOC] Add CUTLASS backend (#14081)
     new 6758d4222f [Unity][BYOC] Add DNNL backend (#14082)
     new 3fafeb2089 [Unity][Op] `log_softmax` and `cross_entropy_with_logits` 
(#14083)
     new 74343978e9 [Unity][Analysis] TIR pattern kind analysis for 
multi-buffer write block (#14075)
     new b7d09e394f [Unity][Fix][Pass] FoldConstant with DCE in dataflow block 
(#14087)
     new 8627e158f3 [Unity] Refactor Relax Build JIT UX (#14088)
     new 58c51b2c50 [Unity][Relax] Set Shape Function to Be Host Function 
(#14090)
     new 8369c84a2b [Unity] Fix typo in the comment (#14096)
     new b070703c44 [Unity] Lower `shape_of` to a builtin (#14093)
     new c281556950 [Unity] Relax Recursive function (#14092)
     new a15cbb31bc [Unity][Layout] Add layout transformation analysis for 
PrimFunc (#14066)
     new 08fb0046d1 [Unity] Remove attributes of relax.print, assert and unique 
(#14101)
     new 4e9223c18c [Unity][BYOC]Add relax backend pattern registry (#14106)
     new 04ee096572 [Unity] Update tests again to adapt to latest TVMScript 
syntax (#14115)
     new d0a8113593 [Unity][Fix] Fix bug in MergeCompositeFunctions (#14117)
     new 8ed0b4d8b8 [Unity][BlockBuilder] Add `name_hint` argument for `emit` 
and `emit_output` (#14126)
     new 48c309e3e3 [Unity][WEB] Relax vm on web runtime (#14131)
     new a54001759d [Unity] Add Global info (#14132)
     new 25b00b9b19 [Unity][BYOC] Add transposed matmul support to Relax 
CUTLASS BYOC (#14128)
     new 055e2adada [Unity][TVMScript] emit_te sugar (#14123)
     new 15d30ba845 [Unity][BYOC] Assign group to unused bindings and ignroe 
PrimFunc (#14139)
     new fbb6fba774 [Unity] Add callback to FuseOpsByPattern to check match 
result is accepted (#14109)
     new 3103bc643e [Unity][Legalize] Fix Scalar Constant Legalization (#14127)
     new 02ce8fa5ae [Unity][Pass] Enhance constant folding to fold relax ops by 
evaluating them. (#14146)
     new c72af8043e [Unity][Debugging] AST printer (#14152)
     new bab52c564f [Unity][Pass] Support Symbolic Shape Deduction during 
BindParam (#14154)
     new d3c9e3c72b [Unity][Analysis] Checking function return struct info in 
well-formed check (#14155)
     new c8ec0ffd47 [Unity][BYOC] Use Relax legalize + CPU build for reference 
in tests (#14162)
     new 1cbc233f35 [Unity] Add bind_constants option to FuseOpsByPattern 
(#14151)
     new 4b681c805e [Unity][Analysis] Analysis for detecting recursion in Relax 
(#14149)
     new 80cba01e4a [Unity][BYOC] Add batch matmul support to Relax CUTLASS 
BYOC (#14166)
     new 5d7adf90c9 [Unity][Op] Full support of Relax op `power` (#14171)
     new 0004320e82 [Unity][Analysis] Restore Python bindings for var analyses 
(#14180)
     new cc9afb3bba [Unity][OP] Add an operator for fused multi head attention 
(#14150)
     new d72f6fc919 [Unity][WEBGPU] Codegen improvements and WebRuntime (#14187)
     new 10df00c36d [Unity][Transform] LiftTransformParams handling multiple 
functions (#14192)
     new 823bedc8ff [Unity][Op] Group normalization (#14194)
     new 0f40563fed [Unity][Op] Argmax and argmin (#14195)
     new 7205c0c255 [Unity][Op] Legalize `round`, `floor`, `ceil`, `sign` 
(#14198)
     new f8a3784815 [Unity][Frontend] FX translator supporting more ops (#14196)
     new bf4359f174 [Unity][Frontend] FX translator returning weights with 
`keep_params_as_input` (#14197)
     new 4b89fa518e [Unity][Fix] FX translating dtype (#14201)
     new 433e126bda [Unity][TIR][Pass] ForceNarrowIndexToInt32 (#14203)
     new f7bc435ad3 [Unity][Frontend] FX translator support torch.baddbmm 
(#14202)
     new 4ae250cb26 [Unity] Introduce Default GPU Schedule Pass (#14182)
     new 7f33052905 [Unity][Frontend] Attach imported model weights, deprecate 
ImporterOutput (#14211)
     new 60ca6b0aca [Unity][Frontend] FX translator supports unwrapping unit 
return tuple (#14212)
     new 02a824a56a [Unity][WEB] Improve webgpu codegen options to skip 
readonly (#14213)
     new 2d03ca5735 [Unity][Frontend] from_fx keeps parameters in order (#14214)
     new 8379ed97ef [Unity][BYOC] Add dynamic shape support to CUTLASS matmul 
(#14216)
     new eb0faae8d3 [Unity][Transform] Memory plan across the IRModule (#14220)
     new 8fbd14d7b1 [Unity][WEB] Simplify WebGPU Codegen per spec (#14225)
     new f055ab90db [Unity] ensure memory.alloc_tensor/storage roundtrippable 
(#14226)
     new 2d6e528e1c [Unity] Improve implementation of FuseOps (#14229)
     new 62bb5b7630 [Unity][Transform] SimplifyNormInference (#14221)
     new 40ca12b6e1 [Unity][Bugfix] Do not include `PrimFunc`s in the 
dependency graph when checking for recursion (#14228)
     new 70ecb435be [Unity][TVMScript] Enable Context-Aware Parsing (#14234)
     new c77caeb65a [Unity][TVMScript] Fix prim_func lost issue in 
relax.emit_te (#14189)
     new e0ec19adfa [Unity][WEB] Update text prompts for syntactical 
correctness (#14237)
     new af1792ebb9 [Unity][WEB] Improve ndarray cache (#14236)
     new 48eb2582e1 [Unity][Op][Tweak] Improve `StructInfo` inference for 
`shape_of` (#14243)
     new 73ab563208 [Unity][Op] Add repeat, tile, conv2d_transpose, avg_pool2d 
(#14238)
     new 229bfaca1b [Unity] Allow user defined func attrs in emit_te (#14255)
     new 2c205e6ea0 [Unity][BYOC] Add conv2d and residual block patterns for 
Relax cutlass BYOC (#14252)
     new e27508de6e [Unity][Frontend] Import `tanh` and fix `layer_norm` 
(#14247)
     new 0e56872c20 [Unity] Consider target context for Relay to Relax 
conversion (#14269)
     new aaf00080e5 [Unity] Introduce call_dps_packed (#14183)
     new 536498b17a [Unity][ci] Use CPU-SMALL instances (#14256)
     new abc474887b [TVMScript][Unity] Improve PyLint Compatibility (#14276)

This update added new revisions after undoing existing revisions.
That is to say, some revisions that were in the old version of the
branch are not in the new version.  This situation occurs
when a user force-pushes a change (`git push --force`) and generates
a repository containing something like this:

 * -- * -- B -- O -- O -- O   (d103ee2070)
            \
             N -- N -- N   refs/heads/unity-staging (abc474887b)

You should already have received notification emails for all of the O
revisions, and so the following emails describe only the N revisions
from the common base, B.

Any revisions marked "omit" are not gone; other references still
refer to them.  Any revisions marked "discard" are gone forever.

The 124 revisions listed above as "new" are entirely new to this
repository and will be described in separate emails.  The revisions
listed as "add" were already present in the repository and have only
been added to this reference.


Summary of changes:
 ci/jenkins/docker-images.ini                       |   4 +-
 ci/jenkins/unity_jenkinsfile.groovy                |   4 +-
 cmake/modules/contrib/DNNL.cmake                   |   1 +
 conda/recipe/meta.yaml                             |   2 +-
 docker/Dockerfile.ci_arm                           |   4 +-
 docker/install/ubuntu_install_llvm_from_source.sh  | 100 +++
 docker/install/ubuntu_install_paddle.sh            |   2 +-
 include/tvm/node/reflection.h                      |   2 +-
 include/tvm/node/script_printer.h                  |  10 +
 include/tvm/node/structural_hash.h                 |  74 +-
 include/tvm/relax/attrs/manipulate.h               |  23 +
 include/tvm/relax/attrs/nn.h                       |  55 +-
 include/tvm/relax/dataflow_pattern.h               |   4 +
 include/tvm/relax/transform.h                      |   9 +-
 include/tvm/runtime/c_runtime_api.h                |   2 +-
 include/tvm/runtime/container/string.h             |  73 +-
 include/tvm/runtime/module.h                       |   4 +
 include/tvm/script/ir_builder/tir/ir.h             |  41 +-
 include/tvm/tir/analysis.h                         |  10 +-
 include/tvm/tir/schedule/schedule.h                |  28 +
 include/tvm/tir/transform.h                        |  20 +
 include/tvm/tir/var.h                              |   7 +
 python/tvm/_ffi/libinfo.py                         |  14 +-
 python/tvm/contrib/cutlass/build.py                |  51 +-
 python/tvm/contrib/cutlass/conv2d_operation.py     |  15 +-
 python/tvm/contrib/cutlass/gen_tensor_op.py        |  66 +-
 python/tvm/contrib/hexagon/transform.py            | 163 +++++
 python/tvm/contrib/tvmjs.py                        | 207 +++++-
 python/tvm/driver/tvmc/autotuner.py                |  67 +-
 python/tvm/driver/tvmc/compiler.py                 |  97 ++-
 python/tvm/driver/tvmc/transform.py                | 203 +++++-
 python/tvm/ir/transform.py                         |   3 +-
 .../tvm/meta_schedule/testing/space_generation.py  |   2 +-
 python/tvm/meta_schedule/tune_context.py           |   3 +-
 python/tvm/relax/__init__.py                       |   3 +-
 python/tvm/relax/backend/contrib/cutlass.py        | 257 ++++---
 python/tvm/relax/backend/patterns.py               |  47 +-
 python/tvm/relax/block_builder.py                  | 176 +----
 python/tvm/relax/dpl/pattern.py                    |  18 +-
 python/tvm/relax/expr.py                           |   4 +-
 python/tvm/relax/frontend/__init__.py              |   3 +-
 python/tvm/relax/frontend/common.py                |  51 +-
 python/tvm/relax/frontend/torch/dynamo.py          |  26 +-
 python/tvm/relax/frontend/torch/fx_translator.py   | 155 +++-
 python/tvm/relax/op/base.py                        |  54 +-
 python/tvm/relax/op/manipulate.py                  |  74 ++
 python/tvm/relax/op/memory/memory.py               |  34 +-
 python/tvm/relax/op/nn/nn.py                       | 182 ++++-
 python/tvm/relax/op/op_attrs.py                    |  19 +-
 python/tvm/relax/op/{memory => vm}/__init__.py     |   4 +-
 python/tvm/relax/op/{ => vm}/_ffi_api.py           |   4 +-
 python/tvm/relax/op/{memory/memory.py => vm/vm.py} |  73 +-
 python/tvm/relax/testing/relay_translator.py       |   2 +-
 python/tvm/relax/transform/legalize_ops/common.py  |   2 +-
 python/tvm/relax/transform/legalize_ops/index.py   |   6 +-
 .../tvm/relax/transform/legalize_ops/manipulate.py |  25 +
 python/tvm/relax/transform/legalize_ops/nn.py      |  58 ++
 python/tvm/relax/transform/transform.py            |  16 +-
 python/tvm/relax/utils.py                          | 188 ++++-
 python/tvm/relay/frontend/paddlepaddle.py          | 231 +++++-
 python/tvm/relay/op/op_attrs.py                    |  10 -
 python/tvm/relay/transform/transform.py            |   2 +-
 python/tvm/runtime/module.py                       |   8 +-
 python/tvm/runtime/script_printer.py               |  15 +
 python/tvm/script/ir_builder/relax/ir.py           |  41 +-
 python/tvm/script/ir_builder/tir/frame.py          |   8 +-
 python/tvm/script/ir_builder/tir/ir.py             | 171 ++++-
 python/tvm/script/parser/core/parser.py            |  42 +-
 python/tvm/script/parser/core/utils.py             |  26 +-
 python/tvm/script/parser/ir/parser.py              |  34 +-
 python/tvm/script/parser/relax/__init__.py         |  13 +-
 python/tvm/script/parser/relax/parser.py           |  45 +-
 python/tvm/script/parser/tir/operation.py          |  20 +-
 python/tvm/script/parser/tir/parser.py             |  14 +-
 python/tvm/te/hybrid/parser.py                     |   3 +-
 python/tvm/tir/op.py                               | 108 ++-
 python/tvm/tir/schedule/schedule.py                | 195 ++++-
 python/tvm/tir/transform/function_pass.py          |   3 +-
 python/tvm/tir/transform/transform.py              |  33 +
 src/arith/rewrite_simplify.cc                      |   2 +
 src/ir/module.cc                                   |  39 +-
 src/meta_schedule/postproc/verify_gpu_code.cc      |   1 +
 .../schedule_rule/multi_level_tiling.cc            |  13 +-
 .../schedule_rule/multi_level_tiling.h             |   8 +-
 .../multi_level_tiling_tensor_core.cc              | 176 ++++-
 .../multi_level_tiling_wide_vector.cc              |  15 +-
 .../space_generator/post_order_apply.cc            |  62 --
 src/meta_schedule/utils.h                          |  62 ++
 src/node/script_printer.cc                         |  26 +
 src/node/structural_hash.cc                        |  82 +--
 src/relax/analysis/detect_recursion.cc             |  13 +-
 src/relax/backend/task_extraction.cc               |   5 -
 src/relax/ir/dataflow_pattern.cc                   |  14 +
 src/relax/op/nn/convolution.cc                     | 144 ++++
 src/relax/op/nn/convolution.h                      |  11 +
 src/relax/op/nn/pooling.cc                         |  44 +-
 src/relax/op/nn/pooling.h                          |   4 +
 src/relax/op/op.cc                                 | 101 ++-
 src/relax/op/tensor/manipulate.cc                  | 126 ++++
 src/relax/op/tensor/manipulate.h                   |  27 +
 src/relax/transform/call_tir_rewrite.cc            |   5 +-
 src/relax/transform/fold_constant.cc               |  12 +-
 src/relax/transform/fuse_ops.cc                    |  38 +-
 src/relax/transform/fuse_tir.cc                    |  23 +-
 src/relax/transform/legalize_ops.cc                |   3 +-
 src/relax/transform/rewrite_dataflow_reshape.cc    |   7 +-
 src/relax/transform/run_codegen.cc                 |   9 +-
 src/relax/transform/simplify_norm_inference.cc     | 131 ++++
 src/relax/transform/static_plan_block_memory.cc    | 101 ++-
 src/relax/transform/utils.h                        | 105 +++
 src/relay/backend/contrib/dnnl/codegen.cc          |  52 +-
 src/relay/backend/utils.h                          |   2 +-
 src/runtime/metal/metal_module.mm                  |   9 +
 src/runtime/module.cc                              |   4 +
 src/script/ir_builder/ir/ir.cc                     |   4 +-
 src/script/ir_builder/ir/utils.h                   |  11 +
 src/script/ir_builder/tir/ir.cc                    |  54 +-
 .../printer/doc_printer/python_doc_printer.cc      |   7 +-
 src/script/printer/ir/ir.cc                        |  14 +-
 src/script/printer/ir_docsifier.cc                 |   4 +
 src/script/printer/relax/call.cc                   |  23 +-
 src/script/printer/relax/function.cc               |   5 +-
 src/script/printer/relax/tir.cc                    |  60 +-
 src/script/printer/relax/utils.h                   |   4 +-
 src/script/printer/tir/buffer.cc                   | 140 +++-
 src/script/printer/tir/expr.cc                     | 116 +--
 src/script/printer/tir/function.cc                 |  10 +-
 src/script/printer/tir/stmt.cc                     | 120 ++--
 src/script/printer/tir/utils.h                     |   9 +
 src/script/printer/utils.h                         |  10 +-
 src/target/llvm/codegen_blob.cc                    |   4 +
 src/target/llvm/codegen_llvm.cc                    |   4 +
 src/target/source/codegen_webgpu.cc                |  60 +-
 src/target/source/codegen_webgpu.h                 |   2 +-
 src/tir/analysis/block_access_region_detector.cc   |   9 +-
 src/tir/analysis/var_use_def_analysis.cc           | 176 +++++
 src/tir/analysis/var_use_def_analysis.h            |  89 +++
 src/tir/ir/expr.cc                                 |   9 +
 src/tir/schedule/concrete_schedule.cc              |  24 +
 src/tir/schedule/concrete_schedule.h               |   4 +
 src/tir/schedule/ir_comparator.cc                  |  10 +-
 src/tir/schedule/ir_comparator.h                   |   7 +-
 src/tir/schedule/primitive.h                       |  33 +
 src/tir/schedule/primitive/cache_read_write.cc     | 716 ++++++++++++++++++-
 src/tir/schedule/primitive/compute_inline.cc       |   4 +-
 src/tir/schedule/schedule.cc                       |   4 +
 src/tir/schedule/traced_schedule.cc                |  32 +
 src/tir/schedule/traced_schedule.h                 |   4 +
 src/tir/transforms/default_gpu_schedule.cc         | 116 +++
 src/tir/transforms/force_narrow_index_to_i32.cc    |  84 +++
 src/tir/transforms/split_host_device.cc            | 229 ++----
 src/tir/transforms/unroll_loop.cc                  |  64 +-
 .../contrib/test_hexagon/test_relay_transforms.py  | 120 ++++
 tests/python/driver/tvmc/test_compiler.py          |  31 +-
 tests/python/driver/tvmc/test_transform.py         | 101 ++-
 tests/python/frontend/paddlepaddle/test_forward.py | 354 +++++++++-
 tests/python/relax/test_analysis.py                |  15 +-
 .../python/relax/test_analysis_detect_recursion.py | 166 +++--
 .../relax/test_analysis_estimate_memory_usage.py   |  11 +-
 tests/python/relax/test_analysis_well_formed.py    |   6 +-
 tests/python/relax/test_ast_printer.py             |  74 +-
 .../relax/test_backend_transform_shape_lower.py    |   7 +-
 tests/python/relax/test_binding_rewrite.py         |  16 +-
 tests/python/relax/test_codegen_cutlass.py         | 288 +++++---
 tests/python/relax/test_dataflow_pattern.py        | 265 +++----
 .../test_frontend_common.py}                       |  27 +-
 tests/python/relax/test_frontend_dynamo.py         |  12 +-
 tests/python/relax/test_frontend_from_fx.py        | 216 +++++-
 tests/python/relax/test_op_manipulate.py           | 246 +++++++
 tests/python/relax/test_op_misc.py                 |   2 +-
 tests/python/relax/test_op_nn_convolution.py       | 385 ++++++++++
 tests/python/relax/test_op_nn_pooling.py           | 228 +++++-
 tests/python/relax/test_relax_operators.py         |  26 +-
 tests/python/relax/test_transform.py               |  46 +-
 .../relax/test_transform_attach_global_symbol.py   |   4 +-
 tests/python/relax/test_transform_bind_params.py   |   6 +-
 tests/python/relax/test_transform_codegen_pass.py  |  13 +-
 tests/python/relax/test_transform_fold_constant.py |  31 +-
 tests/python/relax/test_transform_fuse_ops.py      | 184 ++++-
 .../relax/test_transform_fuse_ops_by_pattern.py    |  65 +-
 tests/python/relax/test_transform_fuse_tir.py      |   6 +-
 tests/python/relax/test_transform_lambda_lift.py   |  17 +-
 tests/python/relax/test_transform_legalize_ops.py  |  27 +-
 .../relax/test_transform_legalize_ops_binary.py    |  72 +-
 .../test_transform_legalize_ops_create_datatype.py |  44 +-
 .../relax/test_transform_legalize_ops_image.py     |   4 +-
 ..._transform_legalize_ops_index_linear_algebra.py |  20 +-
 .../test_transform_legalize_ops_manipulate.py      | 243 ++++++-
 .../python/relax/test_transform_legalize_ops_nn.py | 403 ++++++++++-
 ...st_transform_legalize_ops_search_statistical.py |  40 +-
 .../relax/test_transform_legalize_ops_unary.py     |  62 +-
 .../relax/test_transform_lift_transform_params.py  |   6 +-
 .../test_transform_merge_composite_functions.py    | 111 +--
 .../relax/test_transform_meta_schedule_tuning.py   |   5 +-
 tests/python/relax/test_transform_normalize.py     |   6 +-
 .../relax/test_transform_remove_unused_funcs.py    |   8 +-
 .../test_transform_rewrite_dataflow_reshape.py     |  13 +-
 .../test_transform_simpilify_norm_inference.py     | 153 ++++
 .../test_transform_static_plan_block_memory.py     | 214 +++++-
 tests/python/relax/test_tuning_api.py              |   3 +-
 tests/python/relax/test_tvmscript_ir_builder.py    |  38 +-
 tests/python/relax/test_tvmscript_parser.py        | 256 +++++--
 .../relax/test_tvmscript_parser_op_manipulate.py   |  45 ++
 tests/python/relax/test_tvmscript_parser_op_nn.py  |  37 +
 tests/python/relax/test_tvmscript_printer_relax.py |  97 ++-
 tests/python/relax/test_vm_build.py                |  26 +-
 tests/python/relax/test_vm_codegen_tir.py          |   2 +-
 tests/python/relay/aot/test_pass_aot_lower_main.py |   2 +-
 .../python/unittest/test_arith_rewrite_simplify.py |   4 +
 tests/python/unittest/test_inject_ptx_ldg32.py     |   2 +-
 ...schedule_feature_extractor_per_store_feature.py |   2 +-
 .../test_meta_schedule_schedule_rule_mlt_tc.py     | 783 +++++++++------------
 .../unittest/test_meta_schedule_space_cuda.py      |   6 +-
 .../python/unittest/test_target_codegen_aarch64.py | 480 +++++++++++++
 tests/python/unittest/test_target_codegen_llvm.py  |   4 +-
 .../unittest/test_tir_schedule_cache_read_write.py | 140 ++++
 .../unittest/test_tir_schedule_compute_inline.py   |  24 +
 .../test_tir_transform_common_subexpr_elim.py      |   7 +-
 ...test_tir_transform_force_narrow_index_to_i32.py | 220 ++++++
 .../test_tir_transform_hoist_expression.py         |   9 +-
 .../test_tir_transform_inject_software_pipeline.py |  16 +-
 .../test_tir_transform_inject_virtual_thread.py    |   8 +-
 .../unittest/test_tir_transform_unroll_loop.py     |  42 ++
 ...ransform_convert_pool_allocations_to_offsets.py |  26 +-
 .../test_transform_default_gpu_schedule.py         | 417 +++++++++++
 .../unittest/test_tvmscript_ir_builder_tir.py      |   2 +-
 tests/python/unittest/test_tvmscript_printer_ir.py |  17 +-
 .../test_tvmscript_printer_structural_equal.py     |  40 +-
 .../python/unittest/test_tvmscript_printer_tir.py  |  62 +-
 .../unittest/test_tvmscript_printer_underlining.py |  86 ++-
 tests/python/unittest/test_tvmscript_roundtrip.py  | 140 +++-
 tests/scripts/task_config_build_arm.sh             |   2 +-
 .../scripts/task_config_build_minimal_cross_isa.sh |   2 +-
 version.py                                         |   2 +-
 web/apps/browser/rpc_server.html                   |   3 +-
 web/package.json                                   |   2 +-
 web/src/rpc_server.ts                              |  10 +-
 web/src/runtime.ts                                 |  92 ++-
 web/src/webgpu.ts                                  |  21 +-
 239 files changed, 12398 insertions(+), 2802 deletions(-)
 create mode 100644 docker/install/ubuntu_install_llvm_from_source.sh
 copy python/tvm/relax/op/{memory => vm}/__init__.py (94%)
 copy python/tvm/relax/op/{ => vm}/_ffi_api.py (90%)
 copy python/tvm/relax/op/{memory/memory.py => vm/vm.py} (58%)
 create mode 100644 src/relax/transform/simplify_norm_inference.cc
 create mode 100644 src/tir/analysis/var_use_def_analysis.cc
 create mode 100644 src/tir/analysis/var_use_def_analysis.h
 create mode 100644 src/tir/transforms/default_gpu_schedule.cc
 create mode 100644 src/tir/transforms/force_narrow_index_to_i32.cc
 create mode 100644 tests/python/contrib/test_hexagon/test_relay_transforms.py
 copy tests/python/{unittest/test_arith_simplify.py => relax/test_frontend_common.py} (55%)
 create mode 100644 tests/python/relax/test_transform_simpilify_norm_inference.py
 create mode 100644 tests/python/unittest/test_target_codegen_aarch64.py
 create mode 100644 tests/python/unittest/test_tir_transform_force_narrow_index_to_i32.py
 create mode 100644 tests/python/unittest/test_transform_default_gpu_schedule.py


Reply via email to