@@ -38,12 +38,13 @@ endif()
3838
# Ensure that dependent libraries are installed. Every lookup is REQUIRED so
# that a missing dependency stops the configure step with a clear message
# instead of leaving a *-NOTFOUND value to reach the compile/link commands.
find_library(MLX5_lib NAMES mlx5 REQUIRED)

# NVSHMEM is looked up in the nvidia/nvshmem directory that sits beside the
# Torch install prefix.
set(NVSHMEM_INSTALL_PREFIX "${TORCH_INSTALL_PREFIX}/../nvidia/nvshmem")

# Header location; consumed through NVSHMEM_INCLUDE_DIR.
find_path(
  NVSHMEM_INCLUDE_DIR nvshmem.h
  HINTS "${NVSHMEM_INSTALL_PREFIX}/include"
  REQUIRED)

# Device-side library.
find_library(
  NVSHMEM_DEVICE_LIBRARY nvshmem_device
  HINTS "${NVSHMEM_INSTALL_PREFIX}/lib"
  REQUIRED)

# Host-side library. The full versioned file name is given, so only that
# exact file (libnvshmem_host.so.3) satisfies the search.
find_library(
  NVSHMEM_HOST_LIBRARY libnvshmem_host.so.3
  HINTS "${NVSHMEM_INSTALL_PREFIX}/lib"
  REQUIRED)
4748
4849
4950# Prepare files
@@ -114,7 +115,7 @@ set_target_properties(
114115 CUDA_SEPARABLE_COMPILATION ON
115116 CUDA_ARCHITECTURES "${DEEP_EP_CUDA_ARCHITECTURES} "
116117 LINK_DEPENDS ${CMAKE_CURRENT_SOURCE_DIR} /deep_ep_cpp_tllm.version
117- INSTALL_RPATH "${TORCH_INSTALL_PREFIX} /lib"
118+ INSTALL_RPATH "${TORCH_INSTALL_PREFIX} /lib; ${NVSHMEM_INSTALL_PREFIX} /lib "
118119 BUILD_WITH_INSTALL_RPATH TRUE )
119120target_compile_options (
120121 deep_ep_cpp_tllm
@@ -125,7 +126,7 @@ target_compile_definitions(
125126 TORCH_EXTENSION_NAME=deep_ep_cpp_tllm)
# NVSHMEM headers are only needed to build this target, hence PRIVATE.
target_include_directories(deep_ep_cpp_tllm PRIVATE "${NVSHMEM_INCLUDE_DIR}")

# Link the NVSHMEM device and host libraries, followed by the Torch libraries
# and the Torch Python library.
target_link_libraries(
  deep_ep_cpp_tllm
  PRIVATE ${NVSHMEM_DEVICE_LIBRARY}
          ${NVSHMEM_HOST_LIBRARY}
          ${TORCH_LIBRARIES}
          ${TORCH_PYTHON_LIB})
130131target_link_options (
131132 deep_ep_cpp_tllm PRIVATE
0 commit comments