Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
105 commits
Select commit Hold shift + click to select a range
a024f61
jit lto interleaved scan
divyegala Oct 2, 2025
45da4aa
fix dependencies.yaml
divyegala Oct 2, 2025
a7c8621
generate files at build time, use tags to avoid compilation of types
divyegala Oct 4, 2025
eb2d74b
passing tests
divyegala Oct 5, 2025
d2318e8
update gitignore
divyegala Oct 6, 2025
5e6afcd
separate out distance function from main kernel
divyegala Oct 6, 2025
6eee4da
fix deps
divyegala Oct 6, 2025
1de8f28
add filters as jit device functions, rework caching logic
divyegala Oct 7, 2025
84c6020
lto post lambda, cleanup files, generate cmake in build dir
divyegala Oct 7, 2025
22680c8
don't read hardcoded kernels, use generator properly
divyegala Oct 8, 2025
37f1163
random cmake changes carried over from 25.10
divyegala Oct 8, 2025
0ae5383
cmake format
divyegala Oct 8, 2025
fe56aec
remove dep on kernel list
divyegala Oct 8, 2025
40c8fd6
attempt to solve overlinking problem
divyegala Oct 9, 2025
e87a8c7
reorder if-else in compiler check
divyegala Oct 9, 2025
179d733
Merge branch 'branch-25.12' into jit-lto-ivf-flat-interleaved
divyegala Oct 9, 2025
32a67bd
use cudart apis
divyegala Oct 9, 2025
c27612e
merge
divyegala Oct 9, 2025
a4b48b1
attempt to link cudart
divyegala Oct 9, 2025
d5d692e
revert cudart link, try all arch build of jit lto fatbin sources
divyegala Oct 9, 2025
1c6dd94
cmake format
divyegala Oct 9, 2025
30f5ab6
missing shared mem setting
divyegala Oct 10, 2025
9674969
separate cuda 12 and 13 compilation
divyegala Oct 22, 2025
24fc47d
merge upstream
divyegala Oct 22, 2025
db9a487
remove bench
divyegala Oct 22, 2025
aa9294f
c include directory
divyegala Oct 22, 2025
2eb77fe
style check
divyegala Oct 22, 2025
6c685fa
merge upstream
divyegala Oct 22, 2025
3e35b99
guard cuda calls and use shared_ptr
divyegala Oct 23, 2025
d0ff62c
add AlgorithmPlanner to main target
divyegala Oct 23, 2025
eb87577
merge upstream
divyegala Oct 23, 2025
445a6c4
remove nvjitlink as cuda 12 dep
divyegala Oct 23, 2025
92a27d4
address review
divyegala Oct 24, 2025
8549172
merge upstream
divyegala Oct 24, 2025
67579f4
add include guard
divyegala Oct 27, 2025
7ad8774
add and remove couple of comments
divyegala Oct 27, 2025
816a480
merge upstream
divyegala Oct 27, 2025
ab35ef3
delete readme
divyegala Oct 27, 2025
cdd4c85
increase warmup time
divyegala Oct 27, 2025
87334b2
merge upstream
divyegala Oct 27, 2025
c1eff9f
use new copyright
divyegala Oct 27, 2025
ece09b8
new copyright
divyegala Oct 27, 2025
4dacc6e
remove one more straggling comment
divyegala Oct 27, 2025
1fd95cd
use raft expects
divyegala Oct 27, 2025
64cde0d
Merge branch 'main' into jit-lto-ivf-flat-interleaved
divyegala Oct 27, 2025
5ac127b
merge upstream
divyegala Dec 12, 2025
78002c6
address review
divyegala Dec 12, 2025
9ad6a0b
pre-commit
divyegala Dec 12, 2025
bf4c4ad
address review
divyegala Dec 12, 2025
18b2af9
Generate kernel files in CMake instead of Python
KyleFromNVIDIA Dec 12, 2025
ece5cad
Merge remote-tracking branch 'refs/remotes/github/divyegala/jit-lto-i…
KyleFromNVIDIA Dec 12, 2025
8ce70c2
Style
KyleFromNVIDIA Dec 12, 2025
fdc4239
Style
KyleFromNVIDIA Dec 12, 2025
be3cf0d
Style
KyleFromNVIDIA Dec 12, 2025
7e644c3
Lint
KyleFromNVIDIA Dec 12, 2025
235938a
Style, lint
KyleFromNVIDIA Dec 12, 2025
e3b749d
Fix nvjitlink_checker
KyleFromNVIDIA Dec 15, 2025
f42ae3f
Style
KyleFromNVIDIA Dec 15, 2025
b606df9
Merge branch 'main' into jit-lto-ivf-flat-interleaved
KyleFromNVIDIA Dec 15, 2025
5ce7aab
Refactor JIT LTO kernel compilation
KyleFromNVIDIA Dec 15, 2025
eaad347
Style
KyleFromNVIDIA Dec 15, 2025
eb3b468
pic
KyleFromNVIDIA Dec 15, 2025
912279c
style
KyleFromNVIDIA Dec 15, 2025
19f1af3
Verbose build
KyleFromNVIDIA Dec 15, 2025
087b943
static
KyleFromNVIDIA Dec 15, 2025
c16e109
style
KyleFromNVIDIA Dec 15, 2025
323b79f
TARGET_OBJECTS
KyleFromNVIDIA Dec 15, 2025
9f13e73
Disable sccache
KyleFromNVIDIA Dec 16, 2025
eaf9d39
Recache
KyleFromNVIDIA Dec 16, 2025
ce40c51
Revert CI debugging
KyleFromNVIDIA Dec 16, 2025
0d0abb9
Install and link object library
KyleFromNVIDIA Dec 17, 2025
84bfa92
Style
KyleFromNVIDIA Dec 17, 2025
21241eb
Alias
KyleFromNVIDIA Dec 17, 2025
7c0ac13
Make cuvs_jit_lto_kernels a static library
KyleFromNVIDIA Dec 17, 2025
880dbf2
Style
KyleFromNVIDIA Dec 17, 2025
d04d7c1
rapids_cuda_init_architectures() for C tests
KyleFromNVIDIA Dec 17, 2025
19581f9
Be more specific about where we search for libclang
KyleFromNVIDIA Dec 17, 2025
a61f019
More libclang updates
KyleFromNVIDIA Dec 17, 2025
2eeb913
Revert "Fix libclang download for Rust, CUDA initialization for C tests"
KyleFromNVIDIA Dec 17, 2025
55ec26c
Merge branch 'main' into jit-lto-ivf-flat-interleaved
KyleFromNVIDIA Dec 18, 2025
10228c5
Merge branch 'main' into jit-lto-ivf-flat-interleaved
KyleFromNVIDIA Dec 18, 2025
031ce21
Merge branch 'main' into jit-lto-ivf-flat-interleaved
KyleFromNVIDIA Jan 14, 2026
088c21e
Copyright
KyleFromNVIDIA Jan 14, 2026
8ca1062
Apply suggestions from code review
divyegala Jan 22, 2026
d5ab5bf
merge upstream
divyegala Jan 22, 2026
b8c0d42
address some review comments
divyegala Jan 22, 2026
17d34ae
remove too many underscores
divyegala Jan 22, 2026
282b376
Simplify
KyleFromNVIDIA Feb 4, 2026
609a4d6
Merge branch 'main' into jit-lto-ivf-flat-interleaved
KyleFromNVIDIA Feb 4, 2026
3115d07
address reviews
divyegala Feb 4, 2026
bb524ae
Merge remote-tracking branch 'origin/main' into jit-lto-ivf-flat-inte…
divyegala Feb 4, 2026
30a8a9f
Merge branch 'jit-lto-ivf-flat-interleaved' of github.com:divyegala/c…
divyegala Feb 4, 2026
72ddb36
Merge branch 'main' into jit-lto-ivf-flat-interleaved
divyegala Feb 5, 2026
4bd2102
add to docs and log about jit
divyegala Feb 10, 2026
fb722f0
Merge branch 'jit-lto-ivf-flat-interleaved' of github.com:divyegala/c…
divyegala Feb 10, 2026
3523b96
Merge remote-tracking branch 'origin/main' into jit-lto-ivf-flat-inte…
divyegala Feb 10, 2026
ba758a2
address review
divyegala Feb 10, 2026
42b78ae
rename inner_product to inner_prod
divyegala Feb 10, 2026
2e3a471
Merge remote-tracking branch 'origin/main' into jit-lto-ivf-flat-inte…
divyegala Feb 10, 2026
f6377fa
include header and form better log
divyegala Feb 10, 2026
533b770
address review and move
divyegala Feb 11, 2026
af23585
Merge remote-tracking branch 'origin/main' into jit-lto-ivf-flat-inte…
divyegala Feb 11, 2026
78c59d9
one more fix
divyegala Feb 11, 2026
7f8802b
correct path
divyegala Feb 11, 2026
27acbb6
merge upstream
divyegala Feb 13, 2026
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions conda/environments/all_cuda-131_arch-aarch64.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -31,6 +31,7 @@ dependencies:
- libcurand-dev
- libcusolver-dev
- libcusparse-dev
- libnvjitlink-dev
- librmm==26.4.*,>=0.0.0a0
- make
- nccl>=2.19
Expand Down
1 change: 1 addition & 0 deletions conda/environments/all_cuda-131_arch-x86_64.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -31,6 +31,7 @@ dependencies:
- libcurand-dev
- libcusolver-dev
- libcusparse-dev
- libnvjitlink-dev
- librmm==26.4.*,>=0.0.0a0
- make
- nccl>=2.19
Expand Down
1 change: 1 addition & 0 deletions conda/environments/bench_ann_cuda-131_arch-aarch64.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -30,6 +30,7 @@ dependencies:
- libcusolver-dev
- libcusparse-dev
- libcuvs==26.4.*,>=0.0.0a0
- libnvjitlink-dev
- librmm==26.4.*,>=0.0.0a0
- matplotlib-base>=3.9
- nccl>=2.19
Expand Down
1 change: 1 addition & 0 deletions conda/environments/bench_ann_cuda-131_arch-x86_64.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -32,6 +32,7 @@ dependencies:
- libcusolver-dev
- libcusparse-dev
- libcuvs==26.4.*,>=0.0.0a0
- libnvjitlink-dev
- librmm==26.4.*,>=0.0.0a0
- matplotlib-base>=3.9
- mkl-devel=2023
Expand Down
1 change: 1 addition & 0 deletions conda/environments/go_cuda-131_arch-aarch64.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -25,6 +25,7 @@ dependencies:
- libcusolver-dev
- libcusparse-dev
- libcuvs==26.4.*,>=0.0.0a0
- libnvjitlink-dev
- libraft==26.4.*,>=0.0.0a0
- nccl>=2.19
- ninja
Expand Down
1 change: 1 addition & 0 deletions conda/environments/go_cuda-131_arch-x86_64.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -25,6 +25,7 @@ dependencies:
- libcusolver-dev
- libcusparse-dev
- libcuvs==26.4.*,>=0.0.0a0
- libnvjitlink-dev
- libraft==26.4.*,>=0.0.0a0
- nccl>=2.19
- ninja
Expand Down
1 change: 1 addition & 0 deletions conda/environments/rust_cuda-131_arch-aarch64.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -22,6 +22,7 @@ dependencies:
- libcusolver-dev
- libcusparse-dev
- libcuvs==26.4.*,>=0.0.0a0
- libnvjitlink-dev
- libraft==26.4.*,>=0.0.0a0
- make
- nccl>=2.19
Expand Down
1 change: 1 addition & 0 deletions conda/environments/rust_cuda-131_arch-x86_64.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -22,6 +22,7 @@ dependencies:
- libcusolver-dev
- libcusparse-dev
- libcuvs==26.4.*,>=0.0.0a0
- libnvjitlink-dev
- libraft==26.4.*,>=0.0.0a0
- make
- nccl>=2.19
Expand Down
41 changes: 40 additions & 1 deletion conda/recipes/libcuvs/recipe.yaml
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
# SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION.
# SPDX-FileCopyrightText: Copyright (c) 2025-2026, NVIDIA CORPORATION.
# SPDX-License-Identifier: Apache-2.0
schema_version: 1

Expand Down Expand Up @@ -72,6 +72,9 @@ cache:
- ninja
- ${{ stdlib("c") }}
host:
- if: cuda_major == "13"
then:
- libnvjitlink-dev
- librmm =${{ minor_version }}
- libraft-headers =${{ minor_version }}
- nccl ${{ nccl_version }}
Expand Down Expand Up @@ -118,6 +121,9 @@ outputs:
- libcurand-dev
- libcusolver-dev
- libcusparse-dev
- if: cuda_major == "13"
then:
- libnvjitlink-dev
run:
- ${{ pin_compatible("cuda-version", upper_bound="x", lower_bound="x") }}
- libraft-headers =${{ minor_version }}
Expand All @@ -128,6 +134,9 @@ outputs:
- libcurand
- libcusolver
- libcusparse
- if: cuda_major == "13"
then:
- libnvjitlink
ignore_run_exports:
by_name:
- cuda-cudart
Expand All @@ -141,6 +150,9 @@ outputs:
- librmm
- mkl
- nccl
- if: cuda_major == "13"
then:
- libnvjitlink
about:
homepage: ${{ load_from_file("python/libcuvs/pyproject.toml").project.urls.Homepage }}
license: ${{ load_from_file("python/libcuvs/pyproject.toml").project.license }}
Expand Down Expand Up @@ -177,6 +189,9 @@ outputs:
- libcurand-dev
- libcusolver-dev
- libcusparse-dev
- if: cuda_major == "13"
then:
- libnvjitlink-dev
run:
- ${{ pin_compatible("cuda-version", upper_bound="x", lower_bound="x") }}
- ${{ pin_subpackage("libcuvs-headers", exact=True) }}
Expand All @@ -188,6 +203,9 @@ outputs:
- libcurand
- libcusolver
- libcusparse
- if: cuda_major == "13"
then:
- libnvjitlink
ignore_run_exports:
by_name:
- cuda-cudart
Expand All @@ -201,6 +219,9 @@ outputs:
- librmm
- mkl
- nccl
- if: cuda_major == "13"
then:
- libnvjitlink
about:
homepage: ${{ load_from_file("python/libcuvs/pyproject.toml").project.urls.Homepage }}
license: ${{ load_from_file("python/libcuvs/pyproject.toml").project.license }}
Expand Down Expand Up @@ -235,6 +256,9 @@ outputs:
- libcurand-dev
- libcusolver-dev
- libcusparse-dev
- if: cuda_major == "13"
then:
- libnvjitlink-dev
run:
- ${{ pin_compatible("cuda-version", upper_bound="x", lower_bound="x") }}
- ${{ pin_subpackage("libcuvs-headers", exact=True) }}
Expand All @@ -246,6 +270,9 @@ outputs:
- libcurand
- libcusolver
- libcusparse
- if: cuda_major == "13"
then:
- libnvjitlink
ignore_run_exports:
by_name:
- cuda-cudart
Expand All @@ -256,6 +283,9 @@ outputs:
- libcurand
- libcusolver
- libcusparse
- if: cuda_major == "13"
then:
- libnvjitlink
- librmm
- mkl
- nccl
Expand Down Expand Up @@ -393,6 +423,9 @@ outputs:
- libcurand-dev
- libcusolver-dev
- libcusparse-dev
- if: cuda_major == "13"
then:
- libnvjitlink-dev
run:
- ${{ pin_subpackage("libcuvs-headers", exact=True) }}
- ${{ pin_subpackage("libcuvs", exact=True) }}
Expand All @@ -403,6 +436,9 @@ outputs:
- libcurand
- libcusolver
- libcusparse
- if: cuda_major == "13"
then:
- libnvjitlink
ignore_run_exports:
by_name:
- cuda-cudart
Expand All @@ -413,6 +449,9 @@ outputs:
- libcurand
- libcusolver
- libcusparse
- if: cuda_major == "13"
then:
- libnvjitlink
- librmm
- mkl
- nccl
Expand Down
76 changes: 63 additions & 13 deletions cpp/CMakeLists.txt
Original file line number Diff line number Diff line change
Expand Up @@ -343,6 +343,29 @@ if(NOT BUILD_CPU_ONLY)
)
endif()

set(JIT_LTO_TARGET_ARCHITECTURE "")
set(JIT_LTO_COMPILATION OFF)
set(JIT_LTO_FILES "")
if(CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL 13.0)
set(JIT_LTO_TARGET_ARCHITECTURE "75-real")
set(JIT_LTO_COMPILATION ON)
endif()

if(JIT_LTO_COMPILATION)
# Generate interleaved scan kernel files at build time
include(cmake/modules/generate_jit_lto_kernels.cmake)
generate_jit_lto_kernels(cuvs_jit_lto_kernels)
add_library(cuvs::cuvs_jit_lto_kernels ALIAS cuvs_jit_lto_kernels)

set(JIT_LTO_FILES
src/detail/jit_lto/AlgorithmLauncher.cu
src/detail/jit_lto/AlgorithmPlanner.cu
src/detail/jit_lto/FragmentDatabase.cu
src/detail/jit_lto/FragmentEntry.cu
src/detail/jit_lto/nvjitlink_checker.cpp
)
endif()

add_library(
cuvs_objs OBJECT
src/cluster/detail/minClusterDistanceCompute.cu
Expand Down Expand Up @@ -556,6 +579,7 @@ if(NOT BUILD_CPU_ONLY)
src/stats/silhouette_score.cu
src/stats/trustworthiness_score.cu
${CUVS_MG_ALGOS}
$<$<BOOL:${JIT_LTO_COMPILATION}>:${JIT_LTO_FILES}>
)

set_target_properties(
Expand All @@ -572,8 +596,10 @@ if(NOT BUILD_CPU_ONLY)
)

target_compile_definitions(
cuvs_objs PRIVATE $<$<BOOL:${BUILD_CAGRA_HNSWLIB}>:CUVS_BUILD_CAGRA_HNSWLIB>
$<$<BOOL:${CUVS_NVTX}>:NVTX_ENABLED>
cuvs_objs
PRIVATE $<$<BOOL:${BUILD_CAGRA_HNSWLIB}>:CUVS_BUILD_CAGRA_HNSWLIB>
$<$<BOOL:${CUVS_NVTX}>:NVTX_ENABLED>
$<$<BOOL:${JIT_LTO_COMPILATION}>:CUVS_ENABLE_JIT_LTO>
)

target_link_libraries(
Expand All @@ -586,6 +612,13 @@ if(NOT BUILD_CPU_ONLY)
$<TARGET_NAME_IF_EXISTS:hnswlib::hnswlib>
)

target_include_directories(
cuvs_objs
PUBLIC "$<BUILD_INTERFACE:${CMAKE_CURRENT_SOURCE_DIR}/include>"
"$<BUILD_INTERFACE:${CMAKE_CURRENT_SOURCE_DIR}/../c/include>"
INTERFACE "$<INSTALL_INTERFACE:include>"
)

# Endian detection
include(TestBigEndian)
test_big_endian(BIG_ENDIAN)
Expand Down Expand Up @@ -640,8 +673,10 @@ if(NOT BUILD_CPU_ONLY)
"$<$<COMPILE_LANGUAGE:CUDA>:${CUVS_CUDA_FLAGS}>"
)
target_compile_definitions(
cuvs PUBLIC $<$<BOOL:${BUILD_CAGRA_HNSWLIB}>:CUVS_BUILD_CAGRA_HNSWLIB>
$<$<BOOL:${CUVS_NVTX}>:NVTX_ENABLED>
cuvs
PUBLIC $<$<BOOL:${BUILD_CAGRA_HNSWLIB}>:CUVS_BUILD_CAGRA_HNSWLIB>
$<$<BOOL:${CUVS_NVTX}>:NVTX_ENABLED>
$<$<BOOL:${JIT_LTO_COMPILATION}>:CUVS_ENABLE_JIT_LTO>
)

target_link_libraries(
Expand All @@ -653,8 +688,12 @@ if(NOT BUILD_CPU_ONLY)
$<BUILD_LOCAL_INTERFACE:$<TARGET_NAME_IF_EXISTS:NCCL::NCCL>>
$<BUILD_LOCAL_INTERFACE:$<TARGET_NAME_IF_EXISTS:hnswlib::hnswlib>>
$<$<BOOL:${CUVS_NVTX}>:CUDA::nvtx3>
PRIVATE $<TARGET_NAME_IF_EXISTS:OpenMP::OpenMP_CXX> $<COMPILE_ONLY:nvidia::cutlass::cutlass>
$<COMPILE_ONLY:cuco::cuco>
PRIVATE
$<TARGET_NAME_IF_EXISTS:OpenMP::OpenMP_CXX>
$<COMPILE_ONLY:nvidia::cutlass::cutlass>
$<COMPILE_ONLY:cuco::cuco>
$<$<BOOL:${JIT_LTO_COMPILATION}>:CUDA::nvJitLink>
$<$<BOOL:${JIT_LTO_COMPILATION}>:$<LINK_LIBRARY:WHOLE_ARCHIVE,cuvs::cuvs_jit_lto_kernels>>
)

# ensure CUDA symbols aren't relocated to the middle of the debug build binaries
Expand Down Expand Up @@ -692,8 +731,10 @@ SECTIONS

target_compile_options(cuvs_static PRIVATE "$<$<COMPILE_LANGUAGE:CXX>:${CUVS_CXX_FLAGS}>")
target_compile_definitions(
cuvs_static PUBLIC $<$<BOOL:${BUILD_CAGRA_HNSWLIB}>:CUVS_BUILD_CAGRA_HNSWLIB>
$<$<BOOL:${CUVS_NVTX}>:NVTX_ENABLED>
cuvs_static
PUBLIC $<$<BOOL:${BUILD_CAGRA_HNSWLIB}>:CUVS_BUILD_CAGRA_HNSWLIB>
$<$<BOOL:${CUVS_NVTX}>:NVTX_ENABLED>
$<$<BOOL:${JIT_LTO_COMPILATION}>:CUVS_ENABLE_JIT_LTO>
)

target_include_directories(cuvs_static INTERFACE "$<INSTALL_INTERFACE:include>")
Expand All @@ -709,8 +750,13 @@ SECTIONS
${CUVS_CTK_MATH_DEPENDENCIES}
$<TARGET_NAME_IF_EXISTS:NCCL::NCCL> # needs to be public for DT_NEEDED
$<BUILD_LOCAL_INTERFACE:$<TARGET_NAME_IF_EXISTS:hnswlib::hnswlib>> # header only
PRIVATE $<TARGET_NAME_IF_EXISTS:OpenMP::OpenMP_CXX> $<$<BOOL:${CUVS_NVTX}>:CUDA::nvtx3>
$<COMPILE_ONLY:nvidia::cutlass::cutlass> $<COMPILE_ONLY:cuco::cuco>
PRIVATE
$<TARGET_NAME_IF_EXISTS:OpenMP::OpenMP_CXX>
$<$<BOOL:${JIT_LTO_COMPILATION}>:CUDA::nvJitLink>
$<$<BOOL:${CUVS_NVTX}>:CUDA::nvtx3>
$<COMPILE_ONLY:nvidia::cutlass::cutlass>
$<COMPILE_ONLY:cuco::cuco>
$<$<BOOL:${JIT_LTO_COMPILATION}>:$<LINK_LIBRARY:WHOLE_ARCHIVE,cuvs::cuvs_jit_lto_kernels>>
)
endif()

Expand Down Expand Up @@ -751,9 +797,11 @@ target_compile_definitions(cuvs::cuvs INTERFACE $<$<BOOL:${CUVS_NVTX}>:NVTX_ENAB
include(GNUInstallDirs)
include(CPack)

set(target_names cuvs cuvs_static cuvs_cpp_headers cuvs_c)
set(component_names cuvs_shared cuvs_static cuvs_cpp_headers c_api)
set(export_names cuvs-shared-exports cuvs-static-exports cuvs-cpp-headers-exports cuvs-c-exports)
set(target_names cuvs cuvs_static cuvs_jit_lto_kernels cuvs_cpp_headers cuvs_c)
set(component_names cuvs_shared cuvs_static cuvs_static cuvs_cpp_headers c_api)
set(export_names cuvs-shared-exports cuvs-static-exports cuvs-static-exports
cuvs-cpp-headers-exports cuvs-c-exports
)
foreach(target component export IN ZIP_LISTS target_names component_names export_names)
if(TARGET ${target})
install(
Expand Down Expand Up @@ -794,6 +842,8 @@ target_compile_definitions(cuvs::cuvs INTERFACE $<$<BOOL:${CUVS_NVTX}>:NVTX_ENAB
)
endif()

list(REMOVE_DUPLICATES cuvs_components)
list(REMOVE_DUPLICATES cuvs_export_sets)
include(cmake/modules/generate_cuvs_export.cmake)
generate_cuvs_export(COMPONENTS ${cuvs_components} EXPORT_SETS ${cuvs_export_sets})

Expand Down
9 changes: 9 additions & 0 deletions cpp/cmake/config.json
Original file line number Diff line number Diff line change
Expand Up @@ -10,6 +10,15 @@
"ADDITIONAL_DEP": "?",
"PATH": "*"
}
},
"embed_jit_lto_fatbin": {
"kwargs": {
"FATBIN_TARGET": 1,
"FATBIN_SOURCE": 1,
"EMBEDDED_TARGET": 1,
"EMBEDDED_HEADER": 1,
"EMBEDDED_ARRAY": 1
}
}
}
},
Expand Down
Loading