NVIDIA · rapids-bot · May 21, 2026 · May 16, 2026 · May 17, 2026 · May 17, 2026
@@ -1072,6 +1072,7 @@ if(NOT BUILD_CPU_ONLY)
                CUDA_STANDARD_REQUIRED ON
                POSITION_INDEPENDENT_CODE ON
                CXX_VISIBILITY_PRESET hidden
+               CUDA_VISIBILITY_PRESET hidden
                VISIBILITY_INLINES_HIDDEN ON
   )
   target_compile_options(

@@ -0,0 +1,18 @@
+/*
+ * SPDX-FileCopyrightText: Copyright (c) 2025-2026, NVIDIA CORPORATION.
+ * SPDX-License-Identifier: Apache-2.0
+ */
+
+#pragma once
+
+// Wrapper for cuda_fp16.h that ensures __half gets default symbol visibility.
+//
+// GCC's "type visibility" rule causes template instantiations over __half to
+// inherit hidden visibility when -fvisibility=hidden is in effect, because
+// __half is a user-defined type first seen under hidden visibility. By
+// including cuda_fp16.h under #pragma GCC visibility push(default), the __half
+// type acquires default visibility, and downstream template instantiations
+// (e.g., index<__half, ...>) will be properly exported from shared libraries.
+#pragma GCC visibility push(default)
+#include <cuda_fp16.h>  // NOLINT
+#pragma GCC visibility pop
@@ -6,7 +6,7 @@
 #pragma once
 
 #include <cstdint>
-#include <cuda_fp16.h>
+#include <cuvs/core/cuda_fp16.hpp>
 #include <cuvs/core/export.hpp>
 #include <raft/core/device_csr_matrix.hpp>
 #include <raft/core/device_mdspan.hpp>

@@ -12,7 +12,7 @@
 #include <raft/core/handle.hpp>
 #include <raft/core/host_mdspan.hpp>
 
-#include <cuda_fp16.h>
+#include <cuvs/core/cuda_fp16.hpp>
 #include <cuvs/core/export.hpp>
 
 namespace CUVS_EXPORT cuvs {
@@ -35,7 +35,7 @@ struct search_params : cuvs::neighbors::search_params {};
  * @tparam T data element type
  */
 template <typename T, typename DistT = T>
-struct index : cuvs::neighbors::index {
+struct CUVS_EXPORT index : cuvs::neighbors::index {
   using index_params_type  = brute_force::index_params;
   using search_params_type = brute_force::search_params;
   using index_type         = int64_t;
@@ -166,6 +166,7 @@ struct index : cuvs::neighbors::index {
   raft::device_matrix_view<const T, int64_t, raft::row_major> dataset_view_;
   DistT metric_arg_;
 };
+
 /**
  * @}
  */

@@ -391,7 +391,7 @@ static_assert(std::is_aggregate_v<search_params>);
  *
  */
 template <typename T, typename IdxT>
-struct index : cuvs::neighbors::index {
+struct CUVS_EXPORT index : cuvs::neighbors::index {
   using index_params_type  = cagra::index_params;
   using search_params_type = cagra::search_params;
   using index_type         = IdxT;
@@ -883,6 +883,7 @@ struct index : cuvs::neighbors::index {
   size_t dim_          = 0;
   size_t graph_degree_ = 0;
 };
+
 /**
  * @}
  */

@@ -19,6 +19,7 @@
 
 #include <cuvs/core/bitmap.hpp>
 #include <cuvs/core/bitset.hpp>
+#include <cuvs/core/export.hpp>
 #include <raft/core/detail/macros.hpp>
 
 #include <memory>
@@ -27,7 +28,6 @@
 
 #ifdef __cpp_lib_bitops
 #include <bit>
-#include <cuvs/core/export.hpp>
 #endif
 
 namespace CUVS_EXPORT cuvs {
@@ -811,11 +811,11 @@ using enable_if_valid_list_t = typename enable_if_valid_list<ListT, T>::type;
  *       `cuvs::neighbors::ivf_pq::helpers::resize_list` which handle type casting internally.
  */
 template <typename ListT>
-void resize_list(raft::resources const& res,
-                 std::shared_ptr<ListT>& orig_list,  // NOLINT
-                 const typename ListT::spec_type& spec,
-                 typename ListT::size_type new_used_size,
-                 typename ListT::size_type old_used_size);
+CUVS_EXPORT void resize_list(raft::resources const& res,
+                             std::shared_ptr<ListT>& orig_list,  // NOLINT
+                             const typename ListT::spec_type& spec,
+                             typename ListT::size_type new_used_size,
+                             typename ListT::size_type old_used_size);
 
 /**
  * Serialize a list to an output stream.

@@ -41,7 +41,7 @@ namespace composite {
  * @endcode
  */
 template <typename T, typename IdxT, typename OutputIdxT = IdxT>
-class composite_index {
+class CUVS_EXPORT composite_index {
  public:
   using value_type        = T;
   using index_type        = IdxT;

@@ -3576,4 +3576,5 @@ __device__ __forceinline__ void compute_dist_udf_impl(AccT& acc, AccT x, AccT y)
 
 }  // namespace ivf_flat
 }  // namespace neighbors
+
 }  // namespace CUVS_EXPORT cuvs
@@ -5,7 +5,7 @@
 
 #pragma once
 
-#include <cuda_fp16.h>
+#include <cuvs/core/cuda_fp16.hpp>
 
 #include <cuvs/neighbors/common.hpp>
 

@@ -16,7 +16,7 @@
 
 #include <cuvs/distance/distance.hpp>
 
-#include <cuda_fp16.h>
+#include <cuvs/core/cuda_fp16.hpp>
 #include <cuvs/core/export.hpp>
 
 namespace CUVS_EXPORT cuvs {

@@ -11,7 +11,7 @@
 #include <raft/core/host_mdarray.hpp>
 #include <raft/core/host_mdspan.hpp>
 
-#include <cuda_fp16.h>
+#include <cuvs/core/cuda_fp16.hpp>
 #include <cuvs/core/export.hpp>
 
 namespace CUVS_EXPORT cuvs {

@@ -11,7 +11,7 @@
 #include <raft/core/host_mdarray.hpp>
 #include <raft/core/host_mdspan.hpp>
 
-#include <cuda_fp16.h>
+#include <cuvs/core/cuda_fp16.hpp>
 #include <cuvs/core/export.hpp>
 
 namespace CUVS_EXPORT cuvs {

@@ -5,7 +5,7 @@
 
 #pragma once
 
-#include <cuda_fp16.h>
+#include <cuvs/core/cuda_fp16.hpp>
 
 #include <raft/core/device_mdspan.hpp>
 #include <raft/core/resources.hpp>

@@ -1,15 +1,19 @@
 /*
- * SPDX-FileCopyrightText: Copyright (c) 2024, NVIDIA CORPORATION.
+ * SPDX-FileCopyrightText: Copyright (c) 2024-2026, NVIDIA CORPORATION.
  * SPDX-License-Identifier: Apache-2.0
  */
 
+#include <cuvs/core/cuda_fp16.hpp>
+
 #include "./detail/knn_brute_force.cuh"
 
 #include <cuvs/neighbors/brute_force.hpp>
 
 #include <raft/core/copy.hpp>
 
-namespace cuvs::neighbors::brute_force {
+namespace CUVS_EXPORT cuvs {
+namespace neighbors {
+namespace brute_force {
 
 template <typename T, typename DistT>
 index<T, DistT>::index(raft::resources const& res)
@@ -227,13 +231,16 @@ void index<T, DistT>::update_dataset(
   {                                                                                             \
     detail::search<T, int64_t, DistT, raft::col_major>(                                         \
       res, idx, queries, neighbors, distances, sample_filter);                                  \
-  }                                                                                             \
-                                                                                                \
-  template struct cuvs::neighbors::brute_force::index<T, DistT>;
+  }
 
 CUVS_INST_BFKNN(float, float);
 CUVS_INST_BFKNN(half, float);
 
+template class cuvs::neighbors::brute_force::index<float, float>;
+template class cuvs::neighbors::brute_force::index<half, float>;
+
 #undef CUVS_INST_BFKNN
 
-}  // namespace cuvs::neighbors::brute_force
+}  // namespace brute_force
+}  // namespace neighbors
+}  // namespace CUVS_EXPORT cuvs
@@ -3,6 +3,8 @@
  * SPDX-License-Identifier: Apache-2.0
  */
 
+#include <cuvs/core/cuda_fp16.hpp>
+
 #include <cuvs/neighbors/cagra.hpp>
 #include <neighbors/cagra.cuh>
 
@@ -39,4 +41,6 @@ auto build(raft::resources const& handle,
   return cuvs::neighbors::cagra::build<data_t, index_t>(handle, params, dataset);
 }
 
+template struct index<data_t, index_t>;
+
 }  // namespace cuvs::neighbors::cagra
@@ -3,6 +3,8 @@
  * SPDX-License-Identifier: Apache-2.0
  */
 
+#include <cuvs/core/cuda_fp16.hpp>
+
 #include <cuvs/neighbors/cagra.hpp>
 #include <neighbors/cagra.cuh>
 

@@ -3,6 +3,8 @@
  * SPDX-License-Identifier: Apache-2.0
  */
 
+#include <cuvs/core/cuda_fp16.hpp>
+
 #include <cuvs/neighbors/cagra.hpp>
 #include <neighbors/cagra.cuh>
 

@@ -3,6 +3,8 @@
  * SPDX-License-Identifier: Apache-2.0
  */
 
+#include <cuvs/core/cuda_fp16.hpp>
+
 #include <neighbors/cagra_serialize.cuh>
 
 namespace {

@@ -111,13 +111,13 @@ void composite_index<T, IdxT, OutputIdxT>::search(
                             cuvs::selection::SelectAlgo::kAuto);
 }
 
-template class composite_index<float, uint32_t, uint32_t>;
-template class composite_index<float, uint32_t, int64_t>;
-template class composite_index<half, uint32_t, uint32_t>;
-template class composite_index<half, uint32_t, int64_t>;
-template class composite_index<int8_t, uint32_t, uint32_t>;
-template class composite_index<int8_t, uint32_t, int64_t>;
-template class composite_index<uint8_t, uint32_t, uint32_t>;
-template class composite_index<uint8_t, uint32_t, int64_t>;
+template class CUVS_EXPORT composite_index<float, uint32_t, uint32_t>;
+template class CUVS_EXPORT composite_index<float, uint32_t, int64_t>;
+template class CUVS_EXPORT composite_index<half, uint32_t, uint32_t>;
+template class CUVS_EXPORT composite_index<half, uint32_t, int64_t>;
+template class CUVS_EXPORT composite_index<int8_t, uint32_t, uint32_t>;
+template class CUVS_EXPORT composite_index<int8_t, uint32_t, int64_t>;
+template class CUVS_EXPORT composite_index<uint8_t, uint32_t, uint32_t>;
+template class CUVS_EXPORT composite_index<uint8_t, uint32_t, int64_t>;
 
 }  // namespace cuvs::neighbors::composite
@@ -151,7 +151,7 @@ class BloomFilter {
 };
 
 template <typename Index_t>
-struct GnndGraph {
+struct CUVS_EXPORT GnndGraph {
   raft::resources const& res;
   static constexpr int segment_size = 32;
   InternalID_t<Index_t>* h_graph;
@@ -192,7 +192,7 @@ struct GnndGraph {
 };
 
 template <typename Data_t = float, typename Index_t = int>
-class GNND {
+class CUVS_EXPORT GNND {
  public:
   GNND(raft::resources const& res, const BuildConfig& build_config);
   GNND(const GNND&)            = delete;

@@ -1,5 +1,5 @@
 /*
- * SPDX-FileCopyrightText: Copyright (c) 2024, NVIDIA CORPORATION.
+ * SPDX-FileCopyrightText: Copyright (c) 2024-2026, NVIDIA CORPORATION.
  * SPDX-License-Identifier: Apache-2.0
  */
 
@@ -21,7 +21,7 @@ namespace cuvs::neighbors::dynamic_batching {
 #define CUVS_INST_DYNAMIC_BATCHING_INDEX(T, IdxT, Namespace, ...)                         \
   template <>                                                                             \
   template <>                                                                             \
-  index<T, IdxT>::index<Namespace ::__VA_ARGS__>(                                         \
+  CUVS_EXPORT index<T, IdxT>::index<Namespace ::__VA_ARGS__>(                             \
     const raft::resources& res,                                                           \
     const cuvs::neighbors::dynamic_batching::index_params& params,                        \
     const Namespace ::__VA_ARGS__& upstream_index,                                        \

@@ -3,6 +3,8 @@
  * SPDX-License-Identifier: Apache-2.0
  */
 
+#include <cuvs/core/cuda_fp16.hpp>
+
 #include <cuvs/neighbors/ivf_flat.hpp>
 
 #include <neighbors/ivf_flat/ivf_flat_build.cuh>
@@ -84,3 +86,14 @@ void extend(raft::resources const& handle,
 }
 
 }  // namespace cuvs::neighbors::ivf_flat
+
+namespace cuvs::neighbors::ivf {
+
+template void resize_list<list<cuvs::neighbors::ivf_flat::list_spec, uint32_t, data_t, index_t>>(
+  raft::resources const&,
+  std::shared_ptr<list<cuvs::neighbors::ivf_flat::list_spec, uint32_t, data_t, index_t>>&,
+  const list<cuvs::neighbors::ivf_flat::list_spec, uint32_t, data_t, index_t>::spec_type&,
+  list<cuvs::neighbors::ivf_flat::list_spec, uint32_t, data_t, index_t>::size_type,
+  list<cuvs::neighbors::ivf_flat::list_spec, uint32_t, data_t, index_t>::size_type);
+
+}  // namespace cuvs::neighbors::ivf
@@ -1,11 +1,12 @@
 /*
- * SPDX-FileCopyrightText: Copyright (c) 2023, NVIDIA CORPORATION.
+ * SPDX-FileCopyrightText: Copyright (c) 2023-2026, NVIDIA CORPORATION.
  * SPDX-License-Identifier: Apache-2.0
  */
 
 #include <cstdint>
 
 #include "../ivf_common.cuh"
+#include "../ivf_list.cuh"
 #include "ivf_flat_helpers.cuh"
 #include <cuvs/neighbors/ivf_flat.hpp>
 
@@ -206,3 +207,15 @@ void recompute_internal_state(const raft::resources& res, index<uint8_t, int64_t
 }
 
 }  // namespace cuvs::neighbors::ivf_flat::helpers
+
+namespace cuvs::neighbors::ivf {
+
+template CUVS_EXPORT void
+resize_list<list<cuvs::neighbors::ivf_flat::list_spec, uint32_t, half, int64_t>>(
+  raft::resources const&,
+  std::shared_ptr<list<cuvs::neighbors::ivf_flat::list_spec, uint32_t, half, int64_t>>&,
+  const list<cuvs::neighbors::ivf_flat::list_spec, uint32_t, half, int64_t>::spec_type&,
+  list<cuvs::neighbors::ivf_flat::list_spec, uint32_t, half, int64_t>::size_type,
+  list<cuvs::neighbors::ivf_flat::list_spec, uint32_t, half, int64_t>::size_type);
+
+}  // namespace cuvs::neighbors::ivf
@@ -62,11 +62,11 @@ list<SpecT, SizeT, SpecExtraArgs...>::list(raft::resources const& res,
 }
 
 template <typename ListT>
-void resize_list(raft::resources const& res,
-                 std::shared_ptr<ListT>& orig_list,  // NOLINT
-                 const typename ListT::spec_type& spec,
-                 typename ListT::size_type new_used_size,
-                 typename ListT::size_type old_used_size)
+CUVS_EXPORT void resize_list(raft::resources const& res,
+                             std::shared_ptr<ListT>& orig_list,  // NOLINT
+                             const typename ListT::spec_type& spec,
+                             typename ListT::size_type new_used_size,
+                             typename ListT::size_type old_used_size)
 {
   bool skip_resize = false;
   if (orig_list) {
Original file line number	Diff line number	Diff line change
Expand Up		@@ -3576,4 +3576,5 @@ __device__ __forceinline__ void compute_dist_udf_impl(AccT& acc, AccT x, AccT y)

		} // namespace ivf_flat
		} // namespace neighbors

		} // namespace CUVS_EXPORT cuvs