diff --git a/cpp/tensorrt_llm/CMakeLists.txt b/cpp/tensorrt_llm/CMakeLists.txt index 4c97c8c1803..be85ccc9fbe 100644 --- a/cpp/tensorrt_llm/CMakeLists.txt +++ b/cpp/tensorrt_llm/CMakeLists.txt @@ -147,24 +147,6 @@ add_subdirectory(runtime) add_subdirectory(testing) add_subdirectory(executor_worker) -if(ENABLE_CUFILE) - find_library( - CUFILE_LIBRARY cufile HINTS ${CUDAToolkit_LIBRARY_DIR} - /usr/lib/${TARGET_ARCH} /usr/local/lib) - if(NOT CUFILE_LIBRARY) - # FATAL_ERROR if user explicitly requests with GDS if CUDA's libcufile.so is - # not found. - message( - FATAL_ERROR - "cuFile library not found. Set -DENABLE_CUFILE=OFF if cufile isn't required." - ) - else() - message(STATUS "Linking with cufile: ${CUFILE_LIBRARY}") - endif() -else() - message(STATUS "ENABLE_CUFILE=OFF, skipping GDS linkage.") -endif() - set(BATCH_MANAGER_TARGET tensorrt_llm_batch_manager_static) set(BATCH_MANAGER_TARGET_ARCH ${TARGET_ARCH}) add_subdirectory(batch_manager) @@ -263,10 +245,6 @@ set_target_properties( target_link_libraries(${SHARED_TARGET} PUBLIC ${TRTLLM_LINK_LIBS}) -if(ENABLE_CUFILE) - target_link_libraries(${SHARED_TARGET} PUBLIC ${CUFILE_LIBRARY}) -endif() - target_link_libraries( ${SHARED_TARGET} PRIVATE $ diff --git a/cpp/tensorrt_llm/batch_manager/CMakeLists.txt b/cpp/tensorrt_llm/batch_manager/CMakeLists.txt index 4baeba6375e..225de2ee4b2 100644 --- a/cpp/tensorrt_llm/batch_manager/CMakeLists.txt +++ b/cpp/tensorrt_llm/batch_manager/CMakeLists.txt @@ -94,10 +94,6 @@ set(TOP_LEVEL_DIR "${PROJECT_SOURCE_DIR}/..") target_compile_definitions(${BATCH_MANAGER_STATIC_TARGET} PUBLIC TOP_LEVEL_DIR="${TOP_LEVEL_DIR}") -if(ENABLE_CUFILE) - target_link_libraries(${BATCH_MANAGER_STATIC_TARGET} PUBLIC ${CUFILE_LIBRARY}) -endif() - if(ENABLE_UCX) find_package(ucx REQUIRED) find_package(ucxx REQUIRED) diff --git a/cpp/tensorrt_llm/batch_manager/kvCacheTransferManager.cpp b/cpp/tensorrt_llm/batch_manager/kvCacheTransferManager.cpp index 35868b35ac1..fd5758a8368 100644 --- a/cpp/tensorrt_llm/batch_manager/kvCacheTransferManager.cpp +++ b/cpp/tensorrt_llm/batch_manager/kvCacheTransferManager.cpp @@ -28,18 +28,6 @@ #include "tensorrt_llm/runtime/cudaEvent.h" #include "tensorrt_llm/runtime/cudaStream.h" -#ifdef ENABLE_CUFILE -#include -#endif -#include -#include -#include -#include - -#include -#include -#include - namespace tr = tensorrt_llm::runtime; namespace tk = tensorrt_llm::kernels; namespace kvc = tensorrt_llm::executor::kv_cache;