This is an automated email from the ASF dual-hosted git repository.

tqchen pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/tvm.git


The following commit(s) were added to refs/heads/main by this push:
     new 74eae2f59d [3rdparty] Phasing out FlashInfer AOT from 3rdparty (#18046)
74eae2f59d is described below

commit 74eae2f59dd0602953a704043e1e324752576949
Author: Ruihang Lai <[email protected]>
AuthorDate: Fri Jun 6 12:04:54 2025 -0400

    [3rdparty] Phasing out FlashInfer AOT from 3rdparty (#18046)
    
    This PR phases out FlashInfer from 3rdparty, as we are
    moving towards compiling FlashInfer kernels with just-in-time (JIT)
    compilation. The existing 3rdparty submodule served ahead-of-time (AOT)
    kernel compilation in the past, which we do not plan to use
    in the future.
---
 .gitmodules                  |  3 ---
 3rdparty/flashinfer          |  1 -
 CMakeLists.txt               | 23 -----------------------
 cmake/modules/LibInfo.cmake  |  1 -
 docs/install/from_source.rst |  3 +--
 src/support/libinfo.cc       |  1 -
 6 files changed, 1 insertion(+), 31 deletions(-)

diff --git a/.gitmodules b/.gitmodules
index e8a48d99c2..a481df2438 100644
--- a/.gitmodules
+++ b/.gitmodules
@@ -25,9 +25,6 @@
 [submodule "3rdparty/libflash_attn"]
        path = 3rdparty/libflash_attn
        url = https://github.com/tlc-pack/libflash_attn
-[submodule "3rdparty/flashinfer"]
-       path = 3rdparty/flashinfer
-       url = https://github.com/flashinfer-ai/flashinfer.git
 [submodule "3rdparty/zlib"]
        path = 3rdparty/zlib
        url = https://github.com/madler/zlib.git
diff --git a/3rdparty/flashinfer b/3rdparty/flashinfer
deleted file mode 160000
index a76ceedb94..0000000000
--- a/3rdparty/flashinfer
+++ /dev/null
@@ -1 +0,0 @@
-Subproject commit a76ceedb9495d3d05648c29a8e6bb45baa265f6c
diff --git a/CMakeLists.txt b/CMakeLists.txt
index 15a2244f81..c52f3b363a 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -845,26 +845,3 @@ if(USE_ROCM AND USE_RCCL)
   target_link_libraries(tvm PRIVATE rccl)
   target_link_libraries(tvm_runtime PRIVATE rccl)
 endif()
-
-
-option(USE_FLASHINFER "Build TVM with FlashInfer" OFF)
-if (USE_FLASHINFER STREQUAL "ON")
-  message(STATUS "Build with FlashInfer")
-  set(FLASHINFER_TVM_BINDING ON)
-  set(FLASHINFER_TVM_SOURCE_DIR ${PROJECT_SOURCE_DIR})
-  set(FLASHINFER_PREFILL OFF)
-  set(FLASHINFER_DECODE OFF)
-  set(FLASHINFER_PAGE OFF)
-  set(FLASHINFER_CASCADE OFF)
-  set(FLASHINFER_SAMPLING OFF)
-  set(FLASHINFER_NORM OFF)
-  add_subdirectory(3rdparty/flashinfer)
-else ()
-  message(STATUS "Build without FlashInfer")
-endif ()
-
-
-if (USE_FLASHINFER STREQUAL "ON")
-  target_link_libraries(tvm PRIVATE flashinfer_tvm)
-  target_link_libraries(tvm_runtime PRIVATE flashinfer_tvm)
-endif ()
diff --git a/cmake/modules/LibInfo.cmake b/cmake/modules/LibInfo.cmake
index b94bb42b25..14c63f8aa3 100644
--- a/cmake/modules/LibInfo.cmake
+++ b/cmake/modules/LibInfo.cmake
@@ -74,7 +74,6 @@ function(add_lib_info src_file)
     TVM_INFO_USE_CUDNN="${USE_CUDNN}"
     TVM_INFO_USE_CUSTOM_LOGGING="${USE_CUSTOM_LOGGING}"
     TVM_INFO_USE_CUTLASS="${USE_CUTLASS}"
-    TVM_INFO_USE_FLASHINFER="${USE_FLASHINFER}"
     TVM_INFO_USE_AMX="${USE_AMX}"
     TVM_INFO_USE_DNNL="${USE_DNNL}"
     TVM_INFO_USE_FALLBACK_STL_MAP="${USE_FALLBACK_STL_MAP}"
diff --git a/docs/install/from_source.rst b/docs/install/from_source.rst
index cc50f9fec9..55a1bcc09b 100644
--- a/docs/install/from_source.rst
+++ b/docs/install/from_source.rst
@@ -230,8 +230,7 @@ Advanced Build Configuration
 Ccache
 ~~~~~~
 On supported platforms, the `Ccache compiler wrapper <https://ccache.dev/>`_ may be helpful for
-reducing TVM's build time, especially when building with `cutlass <https://github.com/NVIDIA/cutlass>`_
-or `flashinfer <https://github.com/flashinfer-ai/flashinfer>`_.
+reducing TVM's build time, especially when building with `cutlass <https://github.com/NVIDIA/cutlass>`_.
 There are several ways to enable CCache in TVM builds:
 
     - Leave ``USE_CCACHE=AUTO`` in ``build/config.cmake``. CCache will be used if it is found.
diff --git a/src/support/libinfo.cc b/src/support/libinfo.cc
index 01b49bb92e..6723cf0639 100644
--- a/src/support/libinfo.cc
+++ b/src/support/libinfo.cc
@@ -304,7 +304,6 @@ TVM_DLL ffi::Map<ffi::String, ffi::String> GetLibInfo() {
       {"USE_CUDNN", TVM_INFO_USE_CUDNN},
       {"USE_CUSTOM_LOGGING", TVM_INFO_USE_CUSTOM_LOGGING},
       {"USE_CUTLASS", TVM_INFO_USE_CUTLASS},
-      {"USE_FLASHINFER", TVM_INFO_USE_FLASHINFER},
       {"USE_AMX", TVM_INFO_USE_AMX},
       {"USE_DNNL", TVM_INFO_USE_DNNL},
       {"USE_FALLBACK_STL_MAP", TVM_INFO_USE_FALLBACK_STL_MAP},

Reply via email to