This is an automated email from the ASF dual-hosted git repository.
tqchen pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/tvm.git
The following commit(s) were added to refs/heads/main by this push:
new 74eae2f59d [3rdparty] Phasing out FlashInfer AOT from 3rdparty (#18046)
74eae2f59d is described below
commit 74eae2f59dd0602953a704043e1e324752576949
Author: Ruihang Lai <[email protected]>
AuthorDate: Fri Jun 6 12:04:54 2025 -0400
[3rdparty] Phasing out FlashInfer AOT from 3rdparty (#18046)
This PR phases out FlashInfer from 3rdparty, as we are
moving towards compiling FlashInfer kernels with just-in-time (JIT)
compilation. The existing 3rdparty submodule was used for ahead-of-time
(AOT) kernel compilation in the past, which we do not plan to use
in the future.
---
.gitmodules | 3 ---
3rdparty/flashinfer | 1 -
CMakeLists.txt | 23 -----------------------
cmake/modules/LibInfo.cmake | 1 -
docs/install/from_source.rst | 3 +--
src/support/libinfo.cc | 1 -
6 files changed, 1 insertion(+), 31 deletions(-)
diff --git a/.gitmodules b/.gitmodules
index e8a48d99c2..a481df2438 100644
--- a/.gitmodules
+++ b/.gitmodules
@@ -25,9 +25,6 @@
[submodule "3rdparty/libflash_attn"]
path = 3rdparty/libflash_attn
url = https://github.com/tlc-pack/libflash_attn
-[submodule "3rdparty/flashinfer"]
- path = 3rdparty/flashinfer
- url = https://github.com/flashinfer-ai/flashinfer.git
[submodule "3rdparty/zlib"]
path = 3rdparty/zlib
url = https://github.com/madler/zlib.git
diff --git a/3rdparty/flashinfer b/3rdparty/flashinfer
deleted file mode 160000
index a76ceedb94..0000000000
--- a/3rdparty/flashinfer
+++ /dev/null
@@ -1 +0,0 @@
-Subproject commit a76ceedb9495d3d05648c29a8e6bb45baa265f6c
diff --git a/CMakeLists.txt b/CMakeLists.txt
index 15a2244f81..c52f3b363a 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -845,26 +845,3 @@ if(USE_ROCM AND USE_RCCL)
target_link_libraries(tvm PRIVATE rccl)
target_link_libraries(tvm_runtime PRIVATE rccl)
endif()
-
-
-option(USE_FLASHINFER "Build TVM with FlashInfer" OFF)
-if (USE_FLASHINFER STREQUAL "ON")
- message(STATUS "Build with FlashInfer")
- set(FLASHINFER_TVM_BINDING ON)
- set(FLASHINFER_TVM_SOURCE_DIR ${PROJECT_SOURCE_DIR})
- set(FLASHINFER_PREFILL OFF)
- set(FLASHINFER_DECODE OFF)
- set(FLASHINFER_PAGE OFF)
- set(FLASHINFER_CASCADE OFF)
- set(FLASHINFER_SAMPLING OFF)
- set(FLASHINFER_NORM OFF)
- add_subdirectory(3rdparty/flashinfer)
-else ()
- message(STATUS "Build without FlashInfer")
-endif ()
-
-
-if (USE_FLASHINFER STREQUAL "ON")
- target_link_libraries(tvm PRIVATE flashinfer_tvm)
- target_link_libraries(tvm_runtime PRIVATE flashinfer_tvm)
-endif ()
diff --git a/cmake/modules/LibInfo.cmake b/cmake/modules/LibInfo.cmake
index b94bb42b25..14c63f8aa3 100644
--- a/cmake/modules/LibInfo.cmake
+++ b/cmake/modules/LibInfo.cmake
@@ -74,7 +74,6 @@ function(add_lib_info src_file)
TVM_INFO_USE_CUDNN="${USE_CUDNN}"
TVM_INFO_USE_CUSTOM_LOGGING="${USE_CUSTOM_LOGGING}"
TVM_INFO_USE_CUTLASS="${USE_CUTLASS}"
- TVM_INFO_USE_FLASHINFER="${USE_FLASHINFER}"
TVM_INFO_USE_AMX="${USE_AMX}"
TVM_INFO_USE_DNNL="${USE_DNNL}"
TVM_INFO_USE_FALLBACK_STL_MAP="${USE_FALLBACK_STL_MAP}"
diff --git a/docs/install/from_source.rst b/docs/install/from_source.rst
index cc50f9fec9..55a1bcc09b 100644
--- a/docs/install/from_source.rst
+++ b/docs/install/from_source.rst
@@ -230,8 +230,7 @@ Advanced Build Configuration
Ccache
~~~~~~
On supported platforms, the `Ccache compiler wrapper <https://ccache.dev/>`_ may be helpful for
-reducing TVM's build time, especially when building with `cutlass <https://github.com/NVIDIA/cutlass>`_
-or `flashinfer <https://github.com/flashinfer-ai/flashinfer>`_.
+reducing TVM's build time, especially when building with `cutlass <https://github.com/NVIDIA/cutlass>`_.
There are several ways to enable CCache in TVM builds:
- Leave ``USE_CCACHE=AUTO`` in ``build/config.cmake``. CCache will be used if it is found.
diff --git a/src/support/libinfo.cc b/src/support/libinfo.cc
index 01b49bb92e..6723cf0639 100644
--- a/src/support/libinfo.cc
+++ b/src/support/libinfo.cc
@@ -304,7 +304,6 @@ TVM_DLL ffi::Map<ffi::String, ffi::String> GetLibInfo() {
{"USE_CUDNN", TVM_INFO_USE_CUDNN},
{"USE_CUSTOM_LOGGING", TVM_INFO_USE_CUSTOM_LOGGING},
{"USE_CUTLASS", TVM_INFO_USE_CUTLASS},
- {"USE_FLASHINFER", TVM_INFO_USE_FLASHINFER},
{"USE_AMX", TVM_INFO_USE_AMX},
{"USE_DNNL", TVM_INFO_USE_DNNL},
{"USE_FALLBACK_STL_MAP", TVM_INFO_USE_FALLBACK_STL_MAP},