This is an automated email from the ASF dual-hosted git repository.
tqchen pushed a commit to branch asf-site
in repository https://gitbox.apache.org/repos/asf/tvm-site.git
The following commit(s) were added to refs/heads/asf-site by this push:
new 03b0e83e31 deploying docs
(apache/tvm@420b84703401d1d9fe99cb42568a3edca644975e)
03b0e83e31 is described below
commit 03b0e83e31c29f20b40fb1daaee0e050a504cdeb
Author: tvm-bot <[email protected]>
AuthorDate: Fri Aug 22 13:49:15 2025 +0000
deploying docs (apache/tvm@420b84703401d1d9fe99cb42568a3edca644975e)
---
.../11c11e53c7dace51a8be968ee169ed0d/ir_module.zip | Bin 23868 -> 23868 bytes
.../tir_transformation.zip | Bin 15563 -> 15563 bytes
.../relax_creation.zip | Bin 22392 -> 22392 bytes
.../relax_transformation.zip | Bin 11460 -> 11460 bytes
.../optimize_llm.zip | Bin 54065 -> 54065 bytes
.../e2e_opt_model.zip | Bin 11213 -> 11213 bytes
.../quick_start.zip | Bin 16274 -> 16274 bytes
.../tir_creation.zip | Bin 24343 -> 24343 bytes
.../cross_compilation_and_rpc.zip | Bin 21652 -> 21652 bytes
.../customize_opt.zip | Bin 19789 -> 19789 bytes
.../relax/tutorials/sg_execution_times.rst.txt | 6 +--
.../tensor_ir/tutorials/sg_execution_times.rst.txt | 6 +--
.../tensor_ir/tutorials/tir_creation.rst.txt | 20 +++++-----
.../tensor_ir/tutorials/tir_transformation.rst.txt | 6 +--
.../get_started/tutorials/ir_module.rst.txt | 8 ++--
.../get_started/tutorials/quick_start.rst.txt | 4 +-
.../tutorials/sg_execution_times.rst.txt | 6 +--
.../tutorials/cross_compilation_and_rpc.rst.txt | 2 +-
.../how_to/tutorials/customize_opt.rst.txt | 4 +-
.../how_to/tutorials/e2e_opt_model.rst.txt | 2 +-
.../_sources/how_to/tutorials/optimize_llm.rst.txt | 5 +++
.../how_to/tutorials/sg_execution_times.rst.txt | 10 ++---
docs/_sources/sg_execution_times.rst.txt | 26 ++++++------
.../relax/tutorials/sg_execution_times.html | 6 +--
.../tensor_ir/tutorials/sg_execution_times.html | 6 +--
.../tensor_ir/tutorials/tir_creation.html | 44 ++++++---------------
.../tensor_ir/tutorials/tir_transformation.html | 23 +++--------
docs/get_started/tutorials/ir_module.html | 8 ++--
docs/get_started/tutorials/quick_start.html | 4 +-
docs/get_started/tutorials/sg_execution_times.html | 6 +--
.../tutorials/cross_compilation_and_rpc.html | 2 +-
docs/how_to/tutorials/customize_opt.html | 4 +-
docs/how_to/tutorials/e2e_opt_model.html | 6 +--
docs/how_to/tutorials/optimize_llm.html | 1 +
docs/how_to/tutorials/sg_execution_times.html | 10 ++---
docs/searchindex.js | 2 +-
docs/sg_execution_times.html | 26 ++++++------
37 files changed, 113 insertions(+), 140 deletions(-)
diff --git a/docs/_downloads/11c11e53c7dace51a8be968ee169ed0d/ir_module.zip
b/docs/_downloads/11c11e53c7dace51a8be968ee169ed0d/ir_module.zip
index 982f0e0afa..2754f6e1a7 100644
Binary files a/docs/_downloads/11c11e53c7dace51a8be968ee169ed0d/ir_module.zip
and b/docs/_downloads/11c11e53c7dace51a8be968ee169ed0d/ir_module.zip differ
diff --git
a/docs/_downloads/18ba0d2ee8120824175aaef66bc9c9bf/tir_transformation.zip
b/docs/_downloads/18ba0d2ee8120824175aaef66bc9c9bf/tir_transformation.zip
index 275dce6767..1b8f9ba466 100644
Binary files
a/docs/_downloads/18ba0d2ee8120824175aaef66bc9c9bf/tir_transformation.zip and
b/docs/_downloads/18ba0d2ee8120824175aaef66bc9c9bf/tir_transformation.zip differ
diff --git
a/docs/_downloads/4753776bbe68e7c9ee4d19117973fc8b/relax_creation.zip
b/docs/_downloads/4753776bbe68e7c9ee4d19117973fc8b/relax_creation.zip
index b2d3501b9b..ec5e0077da 100644
Binary files
a/docs/_downloads/4753776bbe68e7c9ee4d19117973fc8b/relax_creation.zip and
b/docs/_downloads/4753776bbe68e7c9ee4d19117973fc8b/relax_creation.zip differ
diff --git
a/docs/_downloads/7d201684dfa095a5ea48d98e9a2ef7ad/relax_transformation.zip
b/docs/_downloads/7d201684dfa095a5ea48d98e9a2ef7ad/relax_transformation.zip
index 2c026060a1..f4c9816fd8 100644
Binary files
a/docs/_downloads/7d201684dfa095a5ea48d98e9a2ef7ad/relax_transformation.zip and
b/docs/_downloads/7d201684dfa095a5ea48d98e9a2ef7ad/relax_transformation.zip
differ
diff --git a/docs/_downloads/83e85f38cf16f1d926d06615fd54095c/optimize_llm.zip
b/docs/_downloads/83e85f38cf16f1d926d06615fd54095c/optimize_llm.zip
index ddd24d9be7..8fd1199225 100644
Binary files
a/docs/_downloads/83e85f38cf16f1d926d06615fd54095c/optimize_llm.zip and
b/docs/_downloads/83e85f38cf16f1d926d06615fd54095c/optimize_llm.zip differ
diff --git a/docs/_downloads/a7dd7652b2ad50f82d7b739ce3645799/e2e_opt_model.zip
b/docs/_downloads/a7dd7652b2ad50f82d7b739ce3645799/e2e_opt_model.zip
index 10038951fc..7d20d0295f 100644
Binary files
a/docs/_downloads/a7dd7652b2ad50f82d7b739ce3645799/e2e_opt_model.zip and
b/docs/_downloads/a7dd7652b2ad50f82d7b739ce3645799/e2e_opt_model.zip differ
diff --git a/docs/_downloads/bb7db6678496193ed0c55d3b95fa6778/quick_start.zip
b/docs/_downloads/bb7db6678496193ed0c55d3b95fa6778/quick_start.zip
index 4becc2ff5f..56b4a3870f 100644
Binary files a/docs/_downloads/bb7db6678496193ed0c55d3b95fa6778/quick_start.zip
and b/docs/_downloads/bb7db6678496193ed0c55d3b95fa6778/quick_start.zip differ
diff --git a/docs/_downloads/be26483bb70b8468499a01c55e8e866c/tir_creation.zip
b/docs/_downloads/be26483bb70b8468499a01c55e8e866c/tir_creation.zip
index 1d1b65a165..7713c0f7ba 100644
Binary files
a/docs/_downloads/be26483bb70b8468499a01c55e8e866c/tir_creation.zip and
b/docs/_downloads/be26483bb70b8468499a01c55e8e866c/tir_creation.zip differ
diff --git
a/docs/_downloads/f69380821f417ef2210f45503d81bded/cross_compilation_and_rpc.zip
b/docs/_downloads/f69380821f417ef2210f45503d81bded/cross_compilation_and_rpc.zip
index 24a8053ae0..758b7d8f3d 100644
Binary files
a/docs/_downloads/f69380821f417ef2210f45503d81bded/cross_compilation_and_rpc.zip
and
b/docs/_downloads/f69380821f417ef2210f45503d81bded/cross_compilation_and_rpc.zip
differ
diff --git a/docs/_downloads/f69433a4a80715725df90d1386679956/customize_opt.zip
b/docs/_downloads/f69433a4a80715725df90d1386679956/customize_opt.zip
index c692f3181e..18bedbcae1 100644
Binary files
a/docs/_downloads/f69433a4a80715725df90d1386679956/customize_opt.zip and
b/docs/_downloads/f69433a4a80715725df90d1386679956/customize_opt.zip differ
diff --git a/docs/_sources/deep_dive/relax/tutorials/sg_execution_times.rst.txt
b/docs/_sources/deep_dive/relax/tutorials/sg_execution_times.rst.txt
index f148037641..8671dbc744 100644
--- a/docs/_sources/deep_dive/relax/tutorials/sg_execution_times.rst.txt
+++ b/docs/_sources/deep_dive/relax/tutorials/sg_execution_times.rst.txt
@@ -6,7 +6,7 @@
Computation times
=================
-**00:00.210** total execution time for 2 files **from
deep_dive/relax/tutorials**:
+**00:00.268** total execution time for 2 files **from
deep_dive/relax/tutorials**:
.. container::
@@ -33,8 +33,8 @@ Computation times
- Time
- Mem (MB)
* - :ref:`sphx_glr_deep_dive_relax_tutorials_relax_creation.py`
(``relax_creation.py``)
- - 00:00.132
+ - 00:00.176
- 0.0
* - :ref:`sphx_glr_deep_dive_relax_tutorials_relax_transformation.py`
(``relax_transformation.py``)
- - 00:00.079
+ - 00:00.092
- 0.0
diff --git
a/docs/_sources/deep_dive/tensor_ir/tutorials/sg_execution_times.rst.txt
b/docs/_sources/deep_dive/tensor_ir/tutorials/sg_execution_times.rst.txt
index 883b7f6869..0ac02d4dc3 100644
--- a/docs/_sources/deep_dive/tensor_ir/tutorials/sg_execution_times.rst.txt
+++ b/docs/_sources/deep_dive/tensor_ir/tutorials/sg_execution_times.rst.txt
@@ -6,7 +6,7 @@
Computation times
=================
-**00:00.528** total execution time for 2 files **from
deep_dive/tensor_ir/tutorials**:
+**00:00.696** total execution time for 2 files **from
deep_dive/tensor_ir/tutorials**:
.. container::
@@ -33,8 +33,8 @@ Computation times
- Time
- Mem (MB)
* - :ref:`sphx_glr_deep_dive_tensor_ir_tutorials_tir_transformation.py`
(``tir_transformation.py``)
- - 00:00.331
+ - 00:00.422
- 0.0
* - :ref:`sphx_glr_deep_dive_tensor_ir_tutorials_tir_creation.py`
(``tir_creation.py``)
- - 00:00.198
+ - 00:00.273
- 0.0
diff --git a/docs/_sources/deep_dive/tensor_ir/tutorials/tir_creation.rst.txt
b/docs/_sources/deep_dive/tensor_ir/tutorials/tir_creation.rst.txt
index 26ab2b3350..fc397e546a 100644
--- a/docs/_sources/deep_dive/tensor_ir/tutorials/tir_creation.rst.txt
+++ b/docs/_sources/deep_dive/tensor_ir/tutorials/tir_creation.rst.txt
@@ -325,17 +325,17 @@ Now let's check the runtime dynamic shape inference:
.. code-block:: none
- [[1.4639008 0.81149524 1.2469165 0.79718184]
- [1.0503372 0.49676353 0.85672927 0.47976065]
- [1.2796788 0.7559935 0.85851413 0.93546313]
- [0.95638275 0.40652537 0.6003208 0.7082942 ]]
- [[29.328182 29.246191 32.116787 ... 29.927141 29.233265 29.068287]
- [30.687939 31.419153 34.005787 ... 33.354244 32.725533 30.230991]
- [32.0926 32.731964 36.339134 ... 35.212177 31.287153 31.665817]
+ [[0.4997607 0.39404696 0.6161485 0.72112775]
+ [0.48272523 0.7631872 1.0439384 1.1835594 ]
+ [0.76485586 0.6593715 0.6234958 1.0389844 ]
+ [1.0580477 1.3580152 1.3343425 1.9772978 ]]
+ [[35.02986 33.522823 33.989853 ... 31.136143 35.698112 32.371902]
+ [36.67233 34.473907 33.172703 ... 32.911404 37.53281 34.922924]
+ [33.071457 31.164038 29.987707 ... 31.901619 34.543198 31.53511 ]
...
- [27.469896 28.020096 31.106714 ... 29.485088 29.01112 28.66413 ]
- [29.355347 29.80985 33.124912 ... 32.228813 32.64193 31.742935]
- [30.603958 29.392557 32.4566 ... 31.786282 29.480438 31.995554]]
+ [36.057602 32.758816 33.335747 ... 32.881447 37.72857 34.011456]
+ [30.424395 29.545507 29.550253 ... 27.73667 31.73645 31.601265]
+ [31.421236 28.996126 27.744043 ... 31.313503 31.505651 30.765842]]
diff --git
a/docs/_sources/deep_dive/tensor_ir/tutorials/tir_transformation.rst.txt
b/docs/_sources/deep_dive/tensor_ir/tutorials/tir_transformation.rst.txt
index 3d27f5b500..26107d8707 100644
--- a/docs/_sources/deep_dive/tensor_ir/tutorials/tir_transformation.rst.txt
+++ b/docs/_sources/deep_dive/tensor_ir/tutorials/tir_transformation.rst.txt
@@ -123,7 +123,7 @@ original implementation.
Execution time summary:
mean (ms) median (ms) max (ms) min (ms) std (ms)
- 2.3096 2.3096 2.3096 2.3096 0.0000
+ 2.5497 2.5497 2.5497 2.5497 0.0000
@@ -295,7 +295,7 @@ action involves reordering these two loops.
Execution time summary:
mean (ms) median (ms) max (ms) min (ms) std (ms)
- 0.8744 0.8744 0.8744 0.8744 0.0000
+ 0.9417 0.9417 0.9417 0.9417 0.0000
@@ -423,7 +423,7 @@ from the reduction update via the **decompose_reduction**
primitive.
Execution time summary:
mean (ms) median (ms) max (ms) min (ms) std (ms)
- 0.3312 0.3312 0.3312 0.3312 0.0000
+ 0.3378 0.3378 0.3378 0.3378 0.0000
diff --git a/docs/_sources/get_started/tutorials/ir_module.rst.txt
b/docs/_sources/get_started/tutorials/ir_module.rst.txt
index 3eab6677f2..544fe5f418 100644
--- a/docs/_sources/get_started/tutorials/ir_module.rst.txt
+++ b/docs/_sources/get_started/tutorials/ir_module.rst.txt
@@ -698,8 +698,8 @@ We can deploy the IRModule on CPU by specifying the target
as ``llvm``.
.. code-block:: none
- [[ 0.1682995 -0.15936302 -0.1740453 -0.05549686 -0.02969982 0.20223626
- -0.24181096 0.10161518 0.06414028 0.01500236]]
+ [[-0.03393523 0.21668282 -0.055739 -0.38880786 0.058215 -0.12301907
+ 0.14273655 0.34130883 -0.04027858 -0.1037481 ]]
@@ -765,8 +765,8 @@ Now we can compile the IRModule on GPU, the similar way as
we did on CPU.
.. code-block:: none
- [[ 0.16829953 -0.15936302 -0.17404532 -0.05549683 -0.02969979 0.20223626
- -0.24181092 0.10161518 0.06414025 0.01500237]]
+ [[-0.03393522 0.21668276 -0.05573907 -0.38880786 0.05821501 -0.1230191
+ 0.14273658 0.34130886 -0.04027862 -0.10374808]]
diff --git a/docs/_sources/get_started/tutorials/quick_start.rst.txt
b/docs/_sources/get_started/tutorials/quick_start.rst.txt
index 99d00ebc2d..54cbe5a5dc 100644
--- a/docs/_sources/get_started/tutorials/quick_start.rst.txt
+++ b/docs/_sources/get_started/tutorials/quick_start.rst.txt
@@ -230,8 +230,8 @@ different devices.
.. code-block:: none
- [[25847.475 24279.332 24694.084 25823.77 26742.688 24573.928 26191.004
- 24160.408 25489.828 27646.2 ]]
+ [[24768.424 25633.959 24707.258 24859.969 25869.365 26105.26 24190.537
+ 24394.252 25021.393 25690.172]]
diff --git a/docs/_sources/get_started/tutorials/sg_execution_times.rst.txt
b/docs/_sources/get_started/tutorials/sg_execution_times.rst.txt
index 2287016f7a..fd2c736016 100644
--- a/docs/_sources/get_started/tutorials/sg_execution_times.rst.txt
+++ b/docs/_sources/get_started/tutorials/sg_execution_times.rst.txt
@@ -6,7 +6,7 @@
Computation times
=================
-**00:06.766** total execution time for 2 files **from get_started/tutorials**:
+**00:07.595** total execution time for 2 files **from get_started/tutorials**:
.. container::
@@ -33,8 +33,8 @@ Computation times
- Time
- Mem (MB)
* - :ref:`sphx_glr_get_started_tutorials_ir_module.py` (``ir_module.py``)
- - 00:06.570
+ - 00:07.365
- 0.0
* - :ref:`sphx_glr_get_started_tutorials_quick_start.py`
(``quick_start.py``)
- - 00:00.196
+ - 00:00.230
- 0.0
diff --git a/docs/_sources/how_to/tutorials/cross_compilation_and_rpc.rst.txt
b/docs/_sources/how_to/tutorials/cross_compilation_and_rpc.rst.txt
index 4e42be276f..e92bc96512 100644
--- a/docs/_sources/how_to/tutorials/cross_compilation_and_rpc.rst.txt
+++ b/docs/_sources/how_to/tutorials/cross_compilation_and_rpc.rst.txt
@@ -274,7 +274,7 @@ device and returns the measured cost. Network overhead is
excluded.
.. code-block:: none
- 1.251e-07 secs/op
+ 1.3e-07 secs/op
diff --git a/docs/_sources/how_to/tutorials/customize_opt.rst.txt
b/docs/_sources/how_to/tutorials/customize_opt.rst.txt
index 042df740ab..6bcae65120 100644
--- a/docs/_sources/how_to/tutorials/customize_opt.rst.txt
+++ b/docs/_sources/how_to/tutorials/customize_opt.rst.txt
@@ -420,8 +420,8 @@ We can build and deploy the optimized model to the TVM
runtime.
.. code-block:: none
- [[25474.455 24978.242 25313.082 25500.371 26524.494 26827.518 25888.547
- 25291.809 25186.93 25487.4 ]]
+ [[25338.746 24784.14 25818.207 25163.271 25910.93 25604.75 24958.316
+ 24613.84 24797.094 26070.352]]
diff --git a/docs/_sources/how_to/tutorials/e2e_opt_model.rst.txt
b/docs/_sources/how_to/tutorials/e2e_opt_model.rst.txt
index 67b0fe5a96..2d7af8c657 100644
--- a/docs/_sources/how_to/tutorials/e2e_opt_model.rst.txt
+++ b/docs/_sources/how_to/tutorials/e2e_opt_model.rst.txt
@@ -59,7 +59,7 @@ PyTorch.
.. code-block:: none
Downloading: "https://download.pytorch.org/models/resnet18-f37072fd.pth"
to /workspace/.cache/torch/hub/checkpoints/resnet18-f37072fd.pth
- 0%| | 0.00/44.7M [00:00<?, ?B/s] 38%|███▊ |
17.1M/44.7M [00:00<00:00, 179MB/s] 89%|████████▊ | 39.6M/44.7M
[00:00<00:00, 212MB/s] 100%|██████████| 44.7M/44.7M [00:00<00:00, 210MB/s]
+ 0%| | 0.00/44.7M [00:00<?, ?B/s] 30%|██▉ |
13.4M/44.7M [00:00<00:00, 140MB/s] 67%|██████▋ | 30.1M/44.7M
[00:00<00:00, 161MB/s] 100%|██████████| 44.7M/44.7M [00:00<00:00, 163MB/s]
diff --git a/docs/_sources/how_to/tutorials/optimize_llm.rst.txt
b/docs/_sources/how_to/tutorials/optimize_llm.rst.txt
index 28f101414f..a28f540ef2 100644
--- a/docs/_sources/how_to/tutorials/optimize_llm.rst.txt
+++ b/docs/_sources/how_to/tutorials/optimize_llm.rst.txt
@@ -863,6 +863,11 @@ IRModule to generate the token.
+.. rst-class:: sphx-glr-timing
+
+ **Total running time of the script:** (1 minutes 21.675 seconds)
+
+
.. _sphx_glr_download_how_to_tutorials_optimize_llm.py:
.. only:: html
diff --git a/docs/_sources/how_to/tutorials/sg_execution_times.rst.txt
b/docs/_sources/how_to/tutorials/sg_execution_times.rst.txt
index 06ff1f0e17..b87cd7787f 100644
--- a/docs/_sources/how_to/tutorials/sg_execution_times.rst.txt
+++ b/docs/_sources/how_to/tutorials/sg_execution_times.rst.txt
@@ -6,7 +6,7 @@
Computation times
=================
-**00:40.385** total execution time for 4 files **from how_to/tutorials**:
+**01:23.653** total execution time for 4 files **from how_to/tutorials**:
.. container::
@@ -33,14 +33,14 @@ Computation times
- Time
- Mem (MB)
* - :ref:`sphx_glr_how_to_tutorials_optimize_llm.py` (``optimize_llm.py``)
- - 00:38.743
+ - 01:21.675
- 0.0
* - :ref:`sphx_glr_how_to_tutorials_e2e_opt_model.py` (``e2e_opt_model.py``)
- - 00:00.749
+ - 00:00.885
- 0.0
* - :ref:`sphx_glr_how_to_tutorials_customize_opt.py` (``customize_opt.py``)
- - 00:00.677
+ - 00:00.827
- 0.0
* - :ref:`sphx_glr_how_to_tutorials_cross_compilation_and_rpc.py`
(``cross_compilation_and_rpc.py``)
- - 00:00.216
+ - 00:00.266
- 0.0
diff --git a/docs/_sources/sg_execution_times.rst.txt
b/docs/_sources/sg_execution_times.rst.txt
index 2ab8b7a19a..8ceb40ecfa 100644
--- a/docs/_sources/sg_execution_times.rst.txt
+++ b/docs/_sources/sg_execution_times.rst.txt
@@ -6,7 +6,7 @@
Computation times
=================
-**00:47.890** total execution time for 10 files **from all galleries**:
+**01:32.212** total execution time for 10 files **from all galleries**:
.. container::
@@ -33,32 +33,32 @@ Computation times
- Time
- Mem (MB)
* - :ref:`sphx_glr_how_to_tutorials_optimize_llm.py`
(``../how_to/tutorials/optimize_llm.py``)
- - 00:38.743
+ - 01:21.675
- 0.0
* - :ref:`sphx_glr_get_started_tutorials_ir_module.py`
(``../get_started/tutorials/ir_module.py``)
- - 00:06.570
+ - 00:07.365
- 0.0
* - :ref:`sphx_glr_how_to_tutorials_e2e_opt_model.py`
(``../how_to/tutorials/e2e_opt_model.py``)
- - 00:00.749
+ - 00:00.885
- 0.0
* - :ref:`sphx_glr_how_to_tutorials_customize_opt.py`
(``../how_to/tutorials/customize_opt.py``)
- - 00:00.677
+ - 00:00.827
- 0.0
* - :ref:`sphx_glr_deep_dive_tensor_ir_tutorials_tir_transformation.py`
(``../deep_dive/tensor_ir/tutorials/tir_transformation.py``)
- - 00:00.331
- - 0.0
- * - :ref:`sphx_glr_how_to_tutorials_cross_compilation_and_rpc.py`
(``../how_to/tutorials/cross_compilation_and_rpc.py``)
- - 00:00.216
+ - 00:00.422
- 0.0
* - :ref:`sphx_glr_deep_dive_tensor_ir_tutorials_tir_creation.py`
(``../deep_dive/tensor_ir/tutorials/tir_creation.py``)
- - 00:00.198
+ - 00:00.273
+ - 0.0
+ * - :ref:`sphx_glr_how_to_tutorials_cross_compilation_and_rpc.py`
(``../how_to/tutorials/cross_compilation_and_rpc.py``)
+ - 00:00.266
- 0.0
* - :ref:`sphx_glr_get_started_tutorials_quick_start.py`
(``../get_started/tutorials/quick_start.py``)
- - 00:00.196
+ - 00:00.230
- 0.0
* - :ref:`sphx_glr_deep_dive_relax_tutorials_relax_creation.py`
(``../deep_dive/relax/tutorials/relax_creation.py``)
- - 00:00.132
+ - 00:00.176
- 0.0
* - :ref:`sphx_glr_deep_dive_relax_tutorials_relax_transformation.py`
(``../deep_dive/relax/tutorials/relax_transformation.py``)
- - 00:00.079
+ - 00:00.092
- 0.0
diff --git a/docs/deep_dive/relax/tutorials/sg_execution_times.html
b/docs/deep_dive/relax/tutorials/sg_execution_times.html
index 09610d2fa4..d7c0ea9ef0 100644
--- a/docs/deep_dive/relax/tutorials/sg_execution_times.html
+++ b/docs/deep_dive/relax/tutorials/sg_execution_times.html
@@ -299,7 +299,7 @@
<section id="computation-times">
<span
id="sphx-glr-deep-dive-relax-tutorials-sg-execution-times"></span><h1>Computation
times<a class="headerlink" href="#computation-times" title="Link to this
heading"></a></h1>
-<p><strong>00:00.210</strong> total execution time for 2 files <strong>from
deep_dive/relax/tutorials</strong>:</p>
+<p><strong>00:00.268</strong> total execution time for 2 files <strong>from
deep_dive/relax/tutorials</strong>:</p>
<div class="docutils container">
<style scoped>
<link
href="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/5.3.0/css/bootstrap.min.css"
rel="stylesheet" />
@@ -321,11 +321,11 @@ $(document).ready( function () {
</thead>
<tbody>
<tr class="row-even"><td><p><a class="reference internal"
href="relax_creation.html#sphx-glr-deep-dive-relax-tutorials-relax-creation-py"><span
class="std std-ref">Relax Creation</span></a> (<code class="docutils literal
notranslate"><span class="pre">relax_creation.py</span></code>)</p></td>
-<td><p>00:00.132</p></td>
+<td><p>00:00.176</p></td>
<td><p>0.0</p></td>
</tr>
<tr class="row-odd"><td><p><a class="reference internal"
href="relax_transformation.html#sphx-glr-deep-dive-relax-tutorials-relax-transformation-py"><span
class="std std-ref">Transformation</span></a> (<code class="docutils literal
notranslate"><span class="pre">relax_transformation.py</span></code>)</p></td>
-<td><p>00:00.079</p></td>
+<td><p>00:00.092</p></td>
<td><p>0.0</p></td>
</tr>
</tbody>
diff --git a/docs/deep_dive/tensor_ir/tutorials/sg_execution_times.html
b/docs/deep_dive/tensor_ir/tutorials/sg_execution_times.html
index dc4dc15f01..cf9a563b20 100644
--- a/docs/deep_dive/tensor_ir/tutorials/sg_execution_times.html
+++ b/docs/deep_dive/tensor_ir/tutorials/sg_execution_times.html
@@ -299,7 +299,7 @@
<section id="computation-times">
<span
id="sphx-glr-deep-dive-tensor-ir-tutorials-sg-execution-times"></span><h1>Computation
times<a class="headerlink" href="#computation-times" title="Link to this
heading"></a></h1>
-<p><strong>00:00.528</strong> total execution time for 2 files <strong>from
deep_dive/tensor_ir/tutorials</strong>:</p>
+<p><strong>00:00.696</strong> total execution time for 2 files <strong>from
deep_dive/tensor_ir/tutorials</strong>:</p>
<div class="docutils container">
<style scoped>
<link
href="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/5.3.0/css/bootstrap.min.css"
rel="stylesheet" />
@@ -321,11 +321,11 @@ $(document).ready( function () {
</thead>
<tbody>
<tr class="row-even"><td><p><a class="reference internal"
href="tir_transformation.html#sphx-glr-deep-dive-tensor-ir-tutorials-tir-transformation-py"><span
class="std std-ref">Transformation</span></a> (<code class="docutils literal
notranslate"><span class="pre">tir_transformation.py</span></code>)</p></td>
-<td><p>00:00.331</p></td>
+<td><p>00:00.422</p></td>
<td><p>0.0</p></td>
</tr>
<tr class="row-odd"><td><p><a class="reference internal"
href="tir_creation.html#sphx-glr-deep-dive-tensor-ir-tutorials-tir-creation-py"><span
class="std std-ref">TensorIR Creation</span></a> (<code class="docutils
literal notranslate"><span class="pre">tir_creation.py</span></code>)</p></td>
-<td><p>00:00.198</p></td>
+<td><p>00:00.273</p></td>
<td><p>0.0</p></td>
</tr>
</tbody>
diff --git a/docs/deep_dive/tensor_ir/tutorials/tir_creation.html
b/docs/deep_dive/tensor_ir/tutorials/tir_creation.html
index f4c63cfa7a..a4c5e34b65 100644
--- a/docs/deep_dive/tensor_ir/tutorials/tir_creation.html
+++ b/docs/deep_dive/tensor_ir/tutorials/tir_creation.html
@@ -198,29 +198,9 @@
<li class="toctree-l1"><a class="reference internal"
href="../../../how_to/dev/index.html">Development Guides</a></li>
</ul>
<p class="caption" role="heading"><span class="caption-text">Deep
Dive</span></p>
-<ul class="current">
+<ul>
<li class="toctree-l1"><a class="reference internal"
href="../../../arch/index.html">Design and Architecture</a></li>
-<li class="toctree-l1 current"><a class="reference internal"
href="../index.html">TensorIR</a><ul class="current">
-<li class="toctree-l2"><a class="reference internal"
href="../abstraction.html">Tensor Program Abstraction</a></li>
-<li class="toctree-l2"><a class="reference internal"
href="../learning.html">Understand TensorIR Abstraction</a></li>
-<li class="toctree-l2 current"><a class="current reference internal"
href="#">TensorIR Creation</a><ul>
-<li class="toctree-l3"><a class="reference internal"
href="#create-tensorir-using-tvmscript">Create TensorIR using TVMScript</a><ul>
-<li class="toctree-l4"><a class="reference internal"
href="#standard-format">Standard Format</a></li>
-<li class="toctree-l4"><a class="reference internal"
href="#concise-with-syntactic-sugar">Concise with Syntactic Sugar</a></li>
-<li class="toctree-l4"><a class="reference internal"
href="#interactive-with-python-variables">Interactive with Python
Variables</a></li>
-<li class="toctree-l4"><a class="reference internal"
href="#tensorir-function-with-dynamic-shapes">TensorIR Function with Dynamic
Shapes</a></li>
-</ul>
-</li>
-<li class="toctree-l3"><a class="reference internal"
href="#create-tensorir-using-tensor-expression">Create TensorIR using Tensor
Expression</a><ul>
-<li class="toctree-l4"><a class="reference internal"
href="#create-static-shape-functions">Create Static-Shape Functions</a></li>
-<li class="toctree-l4"><a class="reference internal"
href="#create-dynamic-shape-functions">Create Dynamic-Shape Functions</a></li>
-</ul>
-</li>
-</ul>
-</li>
-<li class="toctree-l2"><a class="reference internal"
href="tir_transformation.html">Transformation</a></li>
-</ul>
-</li>
+<li class="toctree-l1"><a class="reference internal"
href="../index.html">TensorIR</a></li>
<li class="toctree-l1"><a class="reference internal"
href="../../relax/index.html">Relax</a></li>
</ul>
<p class="caption" role="heading"><span class="caption-text">API
Reference</span></p>
@@ -517,17 +497,17 @@ be used to ascertain the shape and data type of a
TensorIR.</p>
<span class="nb">print</span><span class="p">(</span><span
class="n">evaluate_dynamic_shape</span><span class="p">(</span><span
class="n">dyn_shape_lib</span><span class="p">,</span> <span
class="n">m</span><span class="o">=</span><span class="mi">64</span><span
class="p">,</span> <span class="n">n</span><span class="o">=</span><span
class="mi">64</span><span class="p">,</span> <a
href="../../../reference/api/python/tir/tir.html#tvm.tir.IterVar"
title="tvm.tir.IterVar" class="sphx-glr-ba [...]
</pre></div>
</div>
-<div class="sphx-glr-script-out highlight-none notranslate"><div
class="highlight"><pre><span></span>[[1.4639008 0.81149524 1.2469165
0.79718184]
- [1.0503372 0.49676353 0.85672927 0.47976065]
- [1.2796788 0.7559935 0.85851413 0.93546313]
- [0.95638275 0.40652537 0.6003208 0.7082942 ]]
-[[29.328182 29.246191 32.116787 ... 29.927141 29.233265 29.068287]
- [30.687939 31.419153 34.005787 ... 33.354244 32.725533 30.230991]
- [32.0926 32.731964 36.339134 ... 35.212177 31.287153 31.665817]
+<div class="sphx-glr-script-out highlight-none notranslate"><div
class="highlight"><pre><span></span>[[0.4997607 0.39404696 0.6161485
0.72112775]
+ [0.48272523 0.7631872 1.0439384 1.1835594 ]
+ [0.76485586 0.6593715 0.6234958 1.0389844 ]
+ [1.0580477 1.3580152 1.3343425 1.9772978 ]]
+[[35.02986 33.522823 33.989853 ... 31.136143 35.698112 32.371902]
+ [36.67233 34.473907 33.172703 ... 32.911404 37.53281 34.922924]
+ [33.071457 31.164038 29.987707 ... 31.901619 34.543198 31.53511 ]
...
- [27.469896 28.020096 31.106714 ... 29.485088 29.01112 28.66413 ]
- [29.355347 29.80985 33.124912 ... 32.228813 32.64193 31.742935]
- [30.603958 29.392557 32.4566 ... 31.786282 29.480438 31.995554]]
+ [36.057602 32.758816 33.335747 ... 32.881447 37.72857 34.011456]
+ [30.424395 29.545507 29.550253 ... 27.73667 31.73645 31.601265]
+ [31.421236 28.996126 27.744043 ... 31.313503 31.505651 30.765842]]
</pre></div>
</div>
</section>
diff --git a/docs/deep_dive/tensor_ir/tutorials/tir_transformation.html
b/docs/deep_dive/tensor_ir/tutorials/tir_transformation.html
index 6b9e3577ca..c71e7f96c1 100644
--- a/docs/deep_dive/tensor_ir/tutorials/tir_transformation.html
+++ b/docs/deep_dive/tensor_ir/tutorials/tir_transformation.html
@@ -197,22 +197,9 @@
<li class="toctree-l1"><a class="reference internal"
href="../../../how_to/dev/index.html">Development Guides</a></li>
</ul>
<p class="caption" role="heading"><span class="caption-text">Deep
Dive</span></p>
-<ul class="current">
+<ul>
<li class="toctree-l1"><a class="reference internal"
href="../../../arch/index.html">Design and Architecture</a></li>
-<li class="toctree-l1 current"><a class="reference internal"
href="../index.html">TensorIR</a><ul class="current">
-<li class="toctree-l2"><a class="reference internal"
href="../abstraction.html">Tensor Program Abstraction</a></li>
-<li class="toctree-l2"><a class="reference internal"
href="../learning.html">Understand TensorIR Abstraction</a></li>
-<li class="toctree-l2"><a class="reference internal"
href="tir_creation.html">TensorIR Creation</a></li>
-<li class="toctree-l2 current"><a class="current reference internal"
href="#">Transformation</a><ul>
-<li class="toctree-l3"><a class="reference internal"
href="#initialization-schedule">Initialization Schedule</a></li>
-<li class="toctree-l3"><a class="reference internal" href="#loop-tiling">Loop
Tiling</a></li>
-<li class="toctree-l3"><a class="reference internal"
href="#leverage-localities">Leverage Localities</a></li>
-<li class="toctree-l3"><a class="reference internal"
href="#rewrite-reduction">Rewrite Reduction</a></li>
-<li class="toctree-l3"><a class="reference internal"
href="#trace-the-transformation">Trace the Transformation</a></li>
-</ul>
-</li>
-</ul>
-</li>
+<li class="toctree-l1"><a class="reference internal"
href="../index.html">TensorIR</a></li>
<li class="toctree-l1"><a class="reference internal"
href="../../relax/index.html">Relax</a></li>
</ul>
<p class="caption" role="heading"><span class="caption-text">API
Reference</span></p>
@@ -389,7 +376,7 @@ original implementation.</p>
</div>
<div class="sphx-glr-script-out highlight-none notranslate"><div
class="highlight"><pre><span></span>Execution time summary:
mean (ms) median (ms) max (ms) min (ms) std (ms)
- 2.3096 2.3096 2.3096 2.3096 0.0000
+ 2.5497 2.5497 2.5497 2.5497 0.0000
</pre></div>
</div>
<section id="initialization-schedule">
@@ -485,7 +472,7 @@ class Module:
Execution time summary:
mean (ms) median (ms) max (ms) min (ms) std (ms)
- 0.8744 0.8744 0.8744 0.8744 0.0000
+ 0.9417 0.9417 0.9417 0.9417 0.0000
</pre></div>
</div>
</section>
@@ -579,7 +566,7 @@ class Module:
Execution time summary:
mean (ms) median (ms) max (ms) min (ms) std (ms)
- 0.3312 0.3312 0.3312 0.3312 0.0000
+ 0.3378 0.3378 0.3378 0.3378 0.0000
</pre></div>
</div>
</section>
diff --git a/docs/get_started/tutorials/ir_module.html
b/docs/get_started/tutorials/ir_module.html
index 830b3edcb1..b88d2a2999 100644
--- a/docs/get_started/tutorials/ir_module.html
+++ b/docs/get_started/tutorials/ir_module.html
@@ -819,8 +819,8 @@ backends.</p>
<span class="nb">print</span><span class="p">(</span><span
class="n">cpu_out</span><span class="p">)</span>
</pre></div>
</div>
-<div class="sphx-glr-script-out highlight-none notranslate"><div
class="highlight"><pre><span></span>[[ 0.1682995 -0.15936302 -0.1740453
-0.05549686 -0.02969982 0.20223626
- -0.24181096 0.10161518 0.06414028 0.01500236]]
+<div class="sphx-glr-script-out highlight-none notranslate"><div
class="highlight"><pre><span></span>[[-0.03393523 0.21668282 -0.055739
-0.38880786 0.058215 -0.12301907
+ 0.14273655 0.34130883 -0.04027858 -0.1037481 ]]
</pre></div>
</div>
</section>
@@ -854,8 +854,8 @@ the details of <code class="docutils literal
notranslate"><span class="pre">DLig
<span class="k">assert</span> <span class="n">np</span><span
class="o">.</span><span class="n">allclose</span><span class="p">(</span><span
class="n">cpu_out</span><span class="p">,</span> <span
class="n">gpu_out</span><span class="p">,</span> <span
class="n">atol</span><span class="o">=</span><span class="mf">1e-3</span><span
class="p">)</span>
</pre></div>
</div>
-<div class="sphx-glr-script-out highlight-none notranslate"><div
class="highlight"><pre><span></span>[[ 0.16829953 -0.15936302 -0.17404532
-0.05549683 -0.02969979 0.20223626
- -0.24181092 0.10161518 0.06414025 0.01500237]]
+<div class="sphx-glr-script-out highlight-none notranslate"><div
class="highlight"><pre><span></span>[[-0.03393522 0.21668276 -0.05573907
-0.38880786 0.05821501 -0.1230191
+ 0.14273658 0.34130886 -0.04027862 -0.10374808]]
</pre></div>
</div>
</section>
diff --git a/docs/get_started/tutorials/quick_start.html
b/docs/get_started/tutorials/quick_start.html
index 4277872183..875a3fd264 100644
--- a/docs/get_started/tutorials/quick_start.html
+++ b/docs/get_started/tutorials/quick_start.html
@@ -465,8 +465,8 @@ different devices.</p>
<span class="nb">print</span><span class="p">(</span><a
href="../../reference/api/python/runtime/vm.html#tvm.runtime.vm.VirtualMachine"
title="tvm.runtime.vm.VirtualMachine"
class="sphx-glr-backref-module-tvm-runtime-vm sphx-glr-backref-type-py-class
sphx-glr-backref-instance"><span class="n">vm</span></a><span
class="p">[</span><span class="s2">"forward"</span><span
class="p">](</span><span class="n">tvm_data</span><span class="p">,</span>
<span class="o">*</span><a href="http [...]
</pre></div>
</div>
-<div class="sphx-glr-script-out highlight-none notranslate"><div
class="highlight"><pre><span></span>[[25847.475 24279.332 24694.084 25823.77
26742.688 24573.928 26191.004
- 24160.408 25489.828 27646.2 ]]
+<div class="sphx-glr-script-out highlight-none notranslate"><div
class="highlight"><pre><span></span>[[24768.424 25633.959 24707.258 24859.969
25869.365 26105.26 24190.537
+ 24394.252 25021.393 25690.172]]
</pre></div>
</div>
<p>Our goal is to bring machine learning to the application with any language
of interest,
diff --git a/docs/get_started/tutorials/sg_execution_times.html
b/docs/get_started/tutorials/sg_execution_times.html
index 0e93d61bbe..22f278bea9 100644
--- a/docs/get_started/tutorials/sg_execution_times.html
+++ b/docs/get_started/tutorials/sg_execution_times.html
@@ -299,7 +299,7 @@
<section id="computation-times">
<span
id="sphx-glr-get-started-tutorials-sg-execution-times"></span><h1>Computation
times<a class="headerlink" href="#computation-times" title="Link to this
heading"></a></h1>
-<p><strong>00:06.766</strong> total execution time for 2 files <strong>from
get_started/tutorials</strong>:</p>
+<p><strong>00:07.595</strong> total execution time for 2 files <strong>from
get_started/tutorials</strong>:</p>
<div class="docutils container">
<style scoped>
<link
href="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/5.3.0/css/bootstrap.min.css"
rel="stylesheet" />
@@ -321,11 +321,11 @@ $(document).ready( function () {
</thead>
<tbody>
<tr class="row-even"><td><p><a class="reference internal"
href="ir_module.html#sphx-glr-get-started-tutorials-ir-module-py"><span
class="std std-ref">IRModule</span></a> (<code class="docutils literal
notranslate"><span class="pre">ir_module.py</span></code>)</p></td>
-<td><p>00:06.570</p></td>
+<td><p>00:07.365</p></td>
<td><p>0.0</p></td>
</tr>
<tr class="row-odd"><td><p><a class="reference internal"
href="quick_start.html#sphx-glr-get-started-tutorials-quick-start-py"><span
class="std std-ref">Quick Start</span></a> (<code class="docutils literal
notranslate"><span class="pre">quick_start.py</span></code>)</p></td>
-<td><p>00:00.196</p></td>
+<td><p>00:00.230</p></td>
<td><p>0.0</p></td>
</tr>
</tbody>
diff --git a/docs/how_to/tutorials/cross_compilation_and_rpc.html
b/docs/how_to/tutorials/cross_compilation_and_rpc.html
index f7851d61fc..c063ae3285 100644
--- a/docs/how_to/tutorials/cross_compilation_and_rpc.html
+++ b/docs/how_to/tutorials/cross_compilation_and_rpc.html
@@ -480,7 +480,7 @@ device and returns the measured cost. Network overhead is
excluded.</p>
<span class="nb">print</span><span class="p">(</span><span
class="s2">"</span><span class="si">%g</span><span class="s2">
secs/op"</span> <span class="o">%</span> <span class="n">cost</span><span
class="p">)</span>
</pre></div>
</div>
-<div class="sphx-glr-script-out highlight-none notranslate"><div
class="highlight"><pre><span></span>1.251e-07 secs/op
+<div class="sphx-glr-script-out highlight-none notranslate"><div
class="highlight"><pre><span></span>1.3e-07 secs/op
</pre></div>
</div>
</section>
diff --git a/docs/how_to/tutorials/customize_opt.html
b/docs/how_to/tutorials/customize_opt.html
index b05378ff24..2a516aee5b 100644
--- a/docs/how_to/tutorials/customize_opt.html
+++ b/docs/how_to/tutorials/customize_opt.html
@@ -614,8 +614,8 @@ pushing the performance to the limit. The current
optimization may not be the be
<span class="nb">print</span><span class="p">(</span><span
class="n">gpu_out</span><span class="p">)</span>
</pre></div>
</div>
-<div class="sphx-glr-script-out highlight-none notranslate"><div
class="highlight"><pre><span></span>[[25474.455 24978.242 25313.082 25500.371
26524.494 26827.518 25888.547
- 25291.809 25186.93 25487.4 ]]
+<div class="sphx-glr-script-out highlight-none notranslate"><div
class="highlight"><pre><span></span>[[25338.746 24784.14 25818.207 25163.271
25910.93 25604.75 24958.316
+ 24613.84 24797.094 26070.352]]
</pre></div>
</div>
</section>
diff --git a/docs/how_to/tutorials/e2e_opt_model.html
b/docs/how_to/tutorials/e2e_opt_model.html
index 391fb9e266..1236bb8522 100644
--- a/docs/how_to/tutorials/e2e_opt_model.html
+++ b/docs/how_to/tutorials/e2e_opt_model.html
@@ -336,9 +336,9 @@ PyTorch.</p>
<div class="sphx-glr-script-out highlight-none notranslate"><div
class="highlight"><pre><span></span>Downloading:
"https://download.pytorch.org/models/resnet18-f37072fd.pth" to
/workspace/.cache/torch/hub/checkpoints/resnet18-f37072fd.pth
0%| | 0.00/44.7M [00:00<?, ?B/s]
- 38%|███▊ | 17.1M/44.7M [00:00<00:00, 179MB/s]
- 89%|████████▊ | 39.6M/44.7M [00:00<00:00, 212MB/s]
-100%|██████████| 44.7M/44.7M [00:00<00:00, 210MB/s]
+ 30%|██▉ | 13.4M/44.7M [00:00<00:00, 140MB/s]
+ 67%|██████▋ | 30.1M/44.7M [00:00<00:00, 161MB/s]
+100%|██████████| 44.7M/44.7M [00:00<00:00, 163MB/s]
</pre></div>
</div>
</section>
diff --git a/docs/how_to/tutorials/optimize_llm.html
b/docs/how_to/tutorials/optimize_llm.html
index 76b261f2c6..57161680cc 100644
--- a/docs/how_to/tutorials/optimize_llm.html
+++ b/docs/how_to/tutorials/optimize_llm.html
@@ -912,6 +912,7 @@ IRModule to generate the token.</p>
<span class="nb">print</span><span class="p">(</span><span
class="n">tokenizer</span><span class="o">.</span><span
class="n">decode</span><span class="p">(</span><span
class="n">output_tokens</span><span class="p">))</span>
</pre></div>
</div>
+<p class="sphx-glr-timing"><strong>Total running time of the script:</strong>
(1 minutes 21.675 seconds)</p>
<div class="sphx-glr-footer sphx-glr-footer-example docutils container"
id="sphx-glr-download-how-to-tutorials-optimize-llm-py">
<div class="sphx-glr-download sphx-glr-download-jupyter docutils container">
<p><a class="reference download internal" download=""
href="../../_downloads/ab03cb35cd7f92b5425a8974fcab921a/optimize_llm.ipynb"><code
class="xref download docutils literal notranslate"><span
class="pre">Download</span> <span class="pre">Jupyter</span> <span
class="pre">notebook:</span> <span
class="pre">optimize_llm.ipynb</span></code></a></p>
diff --git a/docs/how_to/tutorials/sg_execution_times.html
b/docs/how_to/tutorials/sg_execution_times.html
index a94d477bed..23e09656bd 100644
--- a/docs/how_to/tutorials/sg_execution_times.html
+++ b/docs/how_to/tutorials/sg_execution_times.html
@@ -299,7 +299,7 @@
<section id="computation-times">
<span id="sphx-glr-how-to-tutorials-sg-execution-times"></span><h1>Computation
times<a class="headerlink" href="#computation-times" title="Link to this
heading"></a></h1>
-<p><strong>00:40.385</strong> total execution time for 4 files <strong>from
how_to/tutorials</strong>:</p>
+<p><strong>01:23.653</strong> total execution time for 4 files <strong>from
how_to/tutorials</strong>:</p>
<div class="docutils container">
<style scoped>
<link
href="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/5.3.0/css/bootstrap.min.css"
rel="stylesheet" />
@@ -321,19 +321,19 @@ $(document).ready( function () {
</thead>
<tbody>
<tr class="row-even"><td><p><a class="reference internal"
href="optimize_llm.html#sphx-glr-how-to-tutorials-optimize-llm-py"><span
class="std std-ref">Optimize Large Language Model</span></a> (<code
class="docutils literal notranslate"><span
class="pre">optimize_llm.py</span></code>)</p></td>
-<td><p>00:38.743</p></td>
+<td><p>01:21.675</p></td>
<td><p>0.0</p></td>
</tr>
<tr class="row-odd"><td><p><a class="reference internal"
href="e2e_opt_model.html#sphx-glr-how-to-tutorials-e2e-opt-model-py"><span
class="std std-ref">End-to-End Optimize Model</span></a> (<code class="docutils
literal notranslate"><span class="pre">e2e_opt_model.py</span></code>)</p></td>
-<td><p>00:00.749</p></td>
+<td><p>00:00.885</p></td>
<td><p>0.0</p></td>
</tr>
<tr class="row-even"><td><p><a class="reference internal"
href="customize_opt.html#sphx-glr-how-to-tutorials-customize-opt-py"><span
class="std std-ref">Customize Optimization</span></a> (<code class="docutils
literal notranslate"><span class="pre">customize_opt.py</span></code>)</p></td>
-<td><p>00:00.677</p></td>
+<td><p>00:00.827</p></td>
<td><p>0.0</p></td>
</tr>
<tr class="row-odd"><td><p><a class="reference internal"
href="cross_compilation_and_rpc.html#sphx-glr-how-to-tutorials-cross-compilation-and-rpc-py"><span
class="std std-ref">Cross Compilation and RPC</span></a> (<code
class="docutils literal notranslate"><span
class="pre">cross_compilation_and_rpc.py</span></code>)</p></td>
-<td><p>00:00.216</p></td>
+<td><p>00:00.266</p></td>
<td><p>0.0</p></td>
</tr>
</tbody>
diff --git a/docs/searchindex.js b/docs/searchindex.js
index c84fd9ccab..4e6cda2fe6 100644
--- a/docs/searchindex.js
+++ b/docs/searchindex.js
@@ -1 +1 @@
-Search.setIndex({"alltitles": {"1. Cross Compile TVM Runtime": [[40,
"cross-compile-tvm-runtime"]], "1. The lack of numpy on device machine caused
the RPC server can\u2019t be launched.": [[40,
"the-lack-of-numpy-on-device-machine-caused-the-rpc-server-can-t-be-launched"]],
"2. Pack and Deploy to Device Machine": [[40,
"pack-and-deploy-to-device-machine"]], "2. The lack of cloudpickle on device
machine caused the RPC server can\u2019t be launched.": [[40,
"the-lack-of-cloudpickle-on-devi [...]
\ No newline at end of file
+Search.setIndex({"alltitles": {"1. Cross Compile TVM Runtime": [[40,
"cross-compile-tvm-runtime"]], "1. The lack of numpy on device machine caused
the RPC server can\u2019t be launched.": [[40,
"the-lack-of-numpy-on-device-machine-caused-the-rpc-server-can-t-be-launched"]],
"2. Pack and Deploy to Device Machine": [[40,
"pack-and-deploy-to-device-machine"]], "2. The lack of cloudpickle on device
machine caused the RPC server can\u2019t be launched.": [[40,
"the-lack-of-cloudpickle-on-devi [...]
\ No newline at end of file
diff --git a/docs/sg_execution_times.html b/docs/sg_execution_times.html
index b543f5e351..cea96a6a69 100644
--- a/docs/sg_execution_times.html
+++ b/docs/sg_execution_times.html
@@ -299,7 +299,7 @@
<section id="computation-times">
<span id="sphx-glr-sg-execution-times"></span><h1>Computation times<a
class="headerlink" href="#computation-times" title="Link to this
heading"></a></h1>
-<p><strong>00:47.890</strong> total execution time for 10 files <strong>from
all galleries</strong>:</p>
+<p><strong>01:32.212</strong> total execution time for 10 files <strong>from
all galleries</strong>:</p>
<div class="docutils container">
<style scoped>
<link
href="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/5.3.0/css/bootstrap.min.css"
rel="stylesheet" />
@@ -321,43 +321,43 @@ $(document).ready( function () {
</thead>
<tbody>
<tr class="row-even"><td><p><a class="reference internal"
href="how_to/tutorials/optimize_llm.html#sphx-glr-how-to-tutorials-optimize-llm-py"><span
class="std std-ref">Optimize Large Language Model</span></a> (<code
class="docutils literal notranslate"><span
class="pre">../how_to/tutorials/optimize_llm.py</span></code>)</p></td>
-<td><p>00:38.743</p></td>
+<td><p>01:21.675</p></td>
<td><p>0.0</p></td>
</tr>
<tr class="row-odd"><td><p><a class="reference internal"
href="get_started/tutorials/ir_module.html#sphx-glr-get-started-tutorials-ir-module-py"><span
class="std std-ref">IRModule</span></a> (<code class="docutils literal
notranslate"><span
class="pre">../get_started/tutorials/ir_module.py</span></code>)</p></td>
-<td><p>00:06.570</p></td>
+<td><p>00:07.365</p></td>
<td><p>0.0</p></td>
</tr>
<tr class="row-even"><td><p><a class="reference internal"
href="how_to/tutorials/e2e_opt_model.html#sphx-glr-how-to-tutorials-e2e-opt-model-py"><span
class="std std-ref">End-to-End Optimize Model</span></a> (<code
class="docutils literal notranslate"><span
class="pre">../how_to/tutorials/e2e_opt_model.py</span></code>)</p></td>
-<td><p>00:00.749</p></td>
+<td><p>00:00.885</p></td>
<td><p>0.0</p></td>
</tr>
<tr class="row-odd"><td><p><a class="reference internal"
href="how_to/tutorials/customize_opt.html#sphx-glr-how-to-tutorials-customize-opt-py"><span
class="std std-ref">Customize Optimization</span></a> (<code class="docutils
literal notranslate"><span
class="pre">../how_to/tutorials/customize_opt.py</span></code>)</p></td>
-<td><p>00:00.677</p></td>
+<td><p>00:00.827</p></td>
<td><p>0.0</p></td>
</tr>
<tr class="row-even"><td><p><a class="reference internal"
href="deep_dive/tensor_ir/tutorials/tir_transformation.html#sphx-glr-deep-dive-tensor-ir-tutorials-tir-transformation-py"><span
class="std std-ref">Transformation</span></a> (<code class="docutils literal
notranslate"><span
class="pre">../deep_dive/tensor_ir/tutorials/tir_transformation.py</span></code>)</p></td>
-<td><p>00:00.331</p></td>
+<td><p>00:00.422</p></td>
<td><p>0.0</p></td>
</tr>
-<tr class="row-odd"><td><p><a class="reference internal"
href="how_to/tutorials/cross_compilation_and_rpc.html#sphx-glr-how-to-tutorials-cross-compilation-and-rpc-py"><span
class="std std-ref">Cross Compilation and RPC</span></a> (<code
class="docutils literal notranslate"><span
class="pre">../how_to/tutorials/cross_compilation_and_rpc.py</span></code>)</p></td>
-<td><p>00:00.216</p></td>
+<tr class="row-odd"><td><p><a class="reference internal"
href="deep_dive/tensor_ir/tutorials/tir_creation.html#sphx-glr-deep-dive-tensor-ir-tutorials-tir-creation-py"><span
class="std std-ref">TensorIR Creation</span></a> (<code class="docutils
literal notranslate"><span
class="pre">../deep_dive/tensor_ir/tutorials/tir_creation.py</span></code>)</p></td>
+<td><p>00:00.273</p></td>
<td><p>0.0</p></td>
</tr>
-<tr class="row-even"><td><p><a class="reference internal"
href="deep_dive/tensor_ir/tutorials/tir_creation.html#sphx-glr-deep-dive-tensor-ir-tutorials-tir-creation-py"><span
class="std std-ref">TensorIR Creation</span></a> (<code class="docutils
literal notranslate"><span
class="pre">../deep_dive/tensor_ir/tutorials/tir_creation.py</span></code>)</p></td>
-<td><p>00:00.198</p></td>
+<tr class="row-even"><td><p><a class="reference internal"
href="how_to/tutorials/cross_compilation_and_rpc.html#sphx-glr-how-to-tutorials-cross-compilation-and-rpc-py"><span
class="std std-ref">Cross Compilation and RPC</span></a> (<code
class="docutils literal notranslate"><span
class="pre">../how_to/tutorials/cross_compilation_and_rpc.py</span></code>)</p></td>
+<td><p>00:00.266</p></td>
<td><p>0.0</p></td>
</tr>
<tr class="row-odd"><td><p><a class="reference internal"
href="get_started/tutorials/quick_start.html#sphx-glr-get-started-tutorials-quick-start-py"><span
class="std std-ref">Quick Start</span></a> (<code class="docutils literal
notranslate"><span
class="pre">../get_started/tutorials/quick_start.py</span></code>)</p></td>
-<td><p>00:00.196</p></td>
+<td><p>00:00.230</p></td>
<td><p>0.0</p></td>
</tr>
<tr class="row-even"><td><p><a class="reference internal"
href="deep_dive/relax/tutorials/relax_creation.html#sphx-glr-deep-dive-relax-tutorials-relax-creation-py"><span
class="std std-ref">Relax Creation</span></a> (<code class="docutils literal
notranslate"><span
class="pre">../deep_dive/relax/tutorials/relax_creation.py</span></code>)</p></td>
-<td><p>00:00.132</p></td>
+<td><p>00:00.176</p></td>
<td><p>0.0</p></td>
</tr>
<tr class="row-odd"><td><p><a class="reference internal"
href="deep_dive/relax/tutorials/relax_transformation.html#sphx-glr-deep-dive-relax-tutorials-relax-transformation-py"><span
class="std std-ref">Transformation</span></a> (<code class="docutils literal
notranslate"><span
class="pre">../deep_dive/relax/tutorials/relax_transformation.py</span></code>)</p></td>
-<td><p>00:00.079</p></td>
+<td><p>00:00.092</p></td>
<td><p>0.0</p></td>
</tr>
</tbody>