rapidsai · rapids-bot · Feb 22, 2022 · Dec 6, 2021 · Dec 7, 2021 · Jan 12, 2022
diff --git a/build.sh b/build.sh
@@ -53,7 +53,7 @@ BUILD_DIRS="${LIBCUGRAPH_BUILD_DIR} ${LIBCUGRAPH_ETL_BUILD_DIR} ${CUGRAPH_BUILD_
 VERBOSE_FLAG=""
 CMAKE_VERBOSE_OPTION=""
 BUILD_TYPE=Release
-INSTALL_TARGET=install
+INSTALL_TARGET="--target install"
 BUILD_CPP_TESTS=ON
 BUILD_CPP_MG_TESTS=OFF
 BUILD_ALL_GPU_ARCH=0
@@ -198,7 +198,7 @@ if buildAll || hasArg libcugraph; then
           -DBUILD_TESTS=${BUILD_CPP_TESTS} \
           -DBUILD_CUGRAPH_MG_TESTS=${BUILD_CPP_MG_TESTS} \
           ${CMAKE_VERBOSE_OPTION}
-    cmake --build "${LIBCUGRAPH_BUILD_DIR}" -j${PARALLEL_LEVEL} --target ${INSTALL_TARGET} ${VERBOSE_FLAG}
+    cmake --build "${LIBCUGRAPH_BUILD_DIR}" -j${PARALLEL_LEVEL} ${INSTALL_TARGET} ${VERBOSE_FLAG}
 fi
 
 # Configure, build, and install libcugraph_etl
@@ -220,7 +220,7 @@ if buildAll || hasArg libcugraph_etl; then
           -DBUILD_CUGRAPH_MG_TESTS=${BUILD_CPP_MG_TESTS} \
           ${CMAKE_VERBOSE_OPTION} \
           ${REPODIR}/cpp/libcugraph_etl
-    cmake --build "${LIBCUGRAPH_ETL_BUILD_DIR}" -j${PARALLEL_LEVEL} --target ${INSTALL_TARGET} ${VERBOSE_FLAG}
+    cmake --build "${LIBCUGRAPH_ETL_BUILD_DIR}" -j${PARALLEL_LEVEL} ${INSTALL_TARGET} ${VERBOSE_FLAG}
 fi
 
 # Build, and install pylibcugraph

@@ -1,5 +1,5 @@
 #!/bin/bash
-# Copyright (c) 2018-2021, NVIDIA CORPORATION.
+# Copyright (c) 2018-2022, NVIDIA CORPORATION.
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
@@ -50,6 +50,7 @@ sed_runner 's/version = .*/version = '"'${NEXT_SHORT_TAG}'"'/g' docs/cugraph/sou
 sed_runner 's/release = .*/release = '"'${NEXT_FULL_TAG}'"'/g' docs/cugraph/source/conf.py
 
 for FILE in conda/environments/*.yml; do
+   sed_runner "s/libcugraphops=${CURRENT_SHORT_TAG}/libcugraphops=${NEXT_SHORT_TAG}/g" ${FILE};
    sed_runner "s/cudf=${CURRENT_SHORT_TAG}/cudf=${NEXT_SHORT_TAG}/g" ${FILE};
    sed_runner "s/rmm=${CURRENT_SHORT_TAG}/rmm=${NEXT_SHORT_TAG}/g" ${FILE};
    sed_runner "s/dask-cuda=${CURRENT_SHORT_TAG}/dask-cuda=${NEXT_SHORT_TAG}/g" ${FILE};

@@ -49,6 +49,7 @@ requirements:
     - {{ pin_compatible('cudatoolkit', max_pin='x', min_pin='x') }}
     - nccl>=2.9.9
     - ucx-proc=*=gpu
+    - libcugraphops {{ minor_version }}.*
     - libcusolver>=11.2.1
 
 about:

@@ -37,7 +37,6 @@ requirements:
     - cmake>=3.20.1
     - doxygen>=1.8.11
     - cudatoolkit {{ cuda_version }}.*
-    - libcugraphops {{ minor_version }}.*  # needed for cmake to find transitive deps
     - libcudf {{ minor_version }}.*
     - libcugraph {{ minor_version }}.*
   run:

@@ -285,6 +285,7 @@ target_include_directories(cugraph
 # - link libraries -------------------------------------------------------------
 target_link_libraries(cugraph
     PUBLIC
+        cugraphops::cugraphops
         raft::raft
     PRIVATE
         cugraph::cuHornet

@@ -24,9 +24,15 @@ function(find_and_configure_cugraphops)
         HEADER_NAMES            graph/sampling.h
         LIBRARY_NAMES           cugraph-ops++
         INCLUDE_SUFFIXES        cugraph-ops
+        BUILD_EXPORT_SET    cugraph-exports
+        INSTALL_EXPORT_SET  cugraph-exports
     )
 
-    rapids_find_package(cugraphops REQUIRED)
+    rapids_find_package(cugraphops
+        REQUIRED
+        BUILD_EXPORT_SET    cugraph-exports
+        INSTALL_EXPORT_SET  cugraph-exports
+    )
 
 endfunction()
 

@@ -1,5 +1,5 @@
 /*
- * Copyright (c) 2020-2021, NVIDIA CORPORATION.
+ * Copyright (c) 2020-2022, NVIDIA CORPORATION.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -24,6 +24,8 @@
 #include <cugraph/internals.hpp>
 #include <cugraph/legacy/graph.hpp>
 
+#include <cugraph-ops/graph/sampling.h>
+
 #include <raft/handle.hpp>
 
 namespace cugraph {
@@ -1416,6 +1418,68 @@ random_walks(raft::handle_t const& handle,
              bool use_padding                                     = false,
              std::unique_ptr<sampling_params_t> sampling_strategy = nullptr);
 
+/**
+ * @brief Generate a sub-sampled graph as an adjacency list (CSR format) given an input graph, a
+ * list of vertices and a sample size per vertex. The output graph consists of the given
+ * vertices, with each vertex having at most `sampling_size` neighbors from the original graph.
+ *
+ * @tparam graph_t Type of input graph/view (typically, graph_view_t, non-transposed and
+ * single-gpu).
+ * @param handle RAFT handle object to encapsulate resources (e.g. CUDA stream, communicator, and
+ * handles to various CUDA libraries) to run graph algorithms.
+ * @param rng The Rng (stateful) instance holding pseudo-random number generator state.
+ * @param graph Graph (view) object to sub-sample.
+ * @param ptr_d_start Device pointer to set of starting vertex indices for the sub-sampling.
+ * @param num_start_vertices Number of starting vertices to use for sub-sampling.
+ * @param sampling_size Maximum number of neighbors per output vertex.
+ * @param sampling_algo The sampling algorithm (algo R/algo L/etc.) used to produce outputs.
+ * @return std::tuple<rmm::device_uvector<typename graph_t::edge_type>,
+ *                    rmm::device_uvector<typename graph_t::vertex_type>>
+ * Tuple consisting of two arrays representing the offsets and indices of
+ * the sub-sampled graph.
+ */
+template <typename graph_t>
+std::tuple<rmm::device_uvector<typename graph_t::edge_type>,
+           rmm::device_uvector<typename graph_t::vertex_type>>
+sample_neighbors_adjacency_list(raft::handle_t const& handle,
+                                ops::gnn::graph::Rng& rng,
+                                graph_t const& graph,
+                                typename graph_t::vertex_type const* ptr_d_start,
+                                size_t num_start_vertices,
+                                size_t sampling_size,
+                                ops::gnn::graph::SamplingAlgoT sampling_algo);
+
+/**
+ * @brief Generate a sub-sampled graph as an edge list (COO format) given an input graph, a
+ * list of vertices and a sample size per vertex. The output graph consists of the given
+ * vertices, with each vertex having at most `sampling_size` neighbors from the original graph.
+ *
+ * @tparam graph_t Type of input graph/view (typically, graph_view_t, non-transposed and
+ * single-gpu).
+ * @param handle RAFT handle object to encapsulate resources (e.g. CUDA stream, communicator, and
+ * handles to various CUDA libraries) to run graph algorithms.
+ * @param rng The Rng (stateful) instance holding pseudo-random number generator state.
+ * @param graph Graph (view) object to sub-sample.
+ * @param ptr_d_start Device pointer to set of starting vertex indices for the sub-sampling.
+ * @param num_start_vertices Number of starting vertices to use for sub-sampling.
+ * @param sampling_size Maximum number of neighbors per output vertex.
+ * @param sampling_algo The sampling algorithm (algo R/algo L/etc.) used to produce outputs.
+ * @return std::tuple<rmm::device_uvector<typename graph_t::vertex_type>,
+ *                    rmm::device_uvector<typename graph_t::vertex_type>>
+ * Tuple consisting of two arrays representing the source and destination nodes of
+ * the sub-sampled graph.
+ */
+template <typename graph_t>
+std::tuple<rmm::device_uvector<typename graph_t::vertex_type>,
+           rmm::device_uvector<typename graph_t::vertex_type>>
+sample_neighbors_edgelist(raft::handle_t const& handle,
+                          ops::gnn::graph::Rng& rng,
+                          graph_t const& graph,
+                          typename graph_t::vertex_type const* ptr_d_start,
+                          size_t num_start_vertices,
+                          size_t sampling_size,
+                          ops::gnn::graph::SamplingAlgoT sampling_algo);
+
 /**
  * @brief Finds (weakly-connected-)component IDs of each vertices in the input graph.
  *

@@ -0,0 +1,109 @@
+/*
+ * Copyright (c) 2021-2022, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+#include <cugraph/algorithms.hpp>
+
+#include <utilities/cugraph_ops_utils.hpp>
+
+#include <cugraph-ops/graph/sampling.h>
+
+namespace cugraph {
+
+/**
+ * @brief Sub-sample `gview` around the given start vertices and return the result as an
+ * adjacency list (CSR); parameters and return value are documented on the declaration.
+ *
+ * Converts the view with detail::get_graph_and_max_degree and forwards every argument,
+ * plus the handle's stream, to ops::gnn::graph::uniform_sample_csr.
+ */
+template <typename graph_t>
+std::tuple<rmm::device_uvector<typename graph_t::edge_type>,
+           rmm::device_uvector<typename graph_t::vertex_type>>
+sample_neighbors_adjacency_list(raft::handle_t const& handle,
+                                ops::gnn::graph::Rng& rng,
+                                graph_t const& gview,
+                                typename graph_t::vertex_type const* ptr_d_start,
+                                size_t num_start_vertices,
+                                size_t sampling_size,
+                                ops::gnn::graph::SamplingAlgoT sampling_algo)
+{
+  const auto [graph, max_degree] = detail::get_graph_and_max_degree(gview);
+  return ops::gnn::graph::uniform_sample_csr(rng,
+                                             graph,
+                                             ptr_d_start,
+                                             num_start_vertices,
+                                             sampling_size,
+                                             sampling_algo,
+                                             max_degree,
+                                             handle.get_stream());
+}
+
+/**
+ * @brief Sub-sample `gview` around the given start vertices and return the result as an
+ * edge list (COO); parameters and return value are documented on the declaration.
+ *
+ * Converts the view with detail::get_graph_and_max_degree and forwards every argument,
+ * plus the handle's stream, to the cugraph-ops COO sampler.
+ *
+ * NOTE(review): this previously called uniform_sample_csr, which contradicts the documented
+ * (sources, destinations) result. Assumes cugraph-ops provides uniform_sample_coo with the
+ * same parameter list -- confirm against cugraph-ops/graph/sampling.h.
+ */
+template <typename graph_t>
+std::tuple<rmm::device_uvector<typename graph_t::vertex_type>,
+           rmm::device_uvector<typename graph_t::vertex_type>>
+sample_neighbors_edgelist(raft::handle_t const& handle,
+                          ops::gnn::graph::Rng& rng,
+                          graph_t const& gview,
+                          typename graph_t::vertex_type const* ptr_d_start,
+                          size_t num_start_vertices,
+                          size_t sampling_size,
+                          ops::gnn::graph::SamplingAlgoT sampling_algo)
+{
+  const auto [graph, max_degree] = detail::get_graph_and_max_degree(gview);
+  return ops::gnn::graph::uniform_sample_coo(rng,
+                                             graph,
+                                             ptr_d_start,
+                                             num_start_vertices,
+                                             sampling_size,
+                                             sampling_algo,
+                                             max_degree,
+                                             handle.get_stream());
+}
+
+// Explicit instantiations for graph_view_t<int32_t, int32_t, float, false, false>.
+// These must follow the definitions above; an explicit instantiation cannot carry a body.
+template std::tuple<rmm::device_uvector<int32_t>, rmm::device_uvector<int32_t>>
+sample_neighbors_adjacency_list<graph_view_t<int32_t, int32_t, float, false, false>>(
+  raft::handle_t const& handle,
+  ops::gnn::graph::Rng& rng,
+  graph_view_t<int32_t, int32_t, float, false, false> const& gview,
+  int32_t const* ptr_d_start,
+  size_t num_start_vertices,
+  size_t sampling_size,
+  ops::gnn::graph::SamplingAlgoT sampling_algo);
+
+template std::tuple<rmm::device_uvector<int32_t>, rmm::device_uvector<int32_t>>
+sample_neighbors_edgelist<graph_view_t<int32_t, int32_t, float, false, false>>(
+  raft::handle_t const& handle,
+  ops::gnn::graph::Rng& rng,
+  graph_view_t<int32_t, int32_t, float, false, false> const& gview,
+  int32_t const* ptr_d_start,
+  size_t num_start_vertices,
+  size_t sampling_size,
+  ops::gnn::graph::SamplingAlgoT sampling_algo);
+
+}  // namespace cugraph
@@ -0,0 +1,77 @@
+/*
+ * Copyright (c) 2021-2022, NVIDIA CORPORATION.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+#pragma once
+
+#include <cugraph/graph_view.hpp>
+
+#include <cugraph-ops/graph/format.h>
+
+#include <limits>
+#include <tuple>
+
+namespace cugraph {
+namespace detail {
+
+/**
+ * @brief Describe a graph view as the CSR struct consumed by cugraph-ops.
+ *
+ * Copies the vertex and edge counts of the view, and the offsets/indices accessors of its
+ * matrix partition view, into a fresh ops::gnn::graph::fg_csr<IdxT>.
+ * NOTE(review): offsets/indices are presumably borrowed device pointers, so the result
+ * should not outlive `gview` -- confirm.
+ *
+ * @tparam IdxT Index type used by the view for both vertices and edges.
+ * @tparam WeightT Edge weight type of the view; weights are not copied.
+ * @param gview Graph view to describe.
+ * @return The populated fg_csr<IdxT>.
+ */
+template <typename IdxT, typename WeightT>
+ops::gnn::graph::fg_csr<IdxT> get_graph(
+  graph_view_t<IdxT, IdxT, WeightT, false, false> const& gview)
+{
+  ops::gnn::graph::fg_csr<IdxT> graph;
+  graph.n_nodes   = gview.get_number_of_vertices();
+  graph.n_indices = gview.get_number_of_edges();
+  graph.offsets   = gview.get_matrix_partition_view().get_offsets();
+  graph.indices   = gview.get_matrix_partition_view().get_indices();
+  return graph;
+}
+
+/**
+ * @brief Build the cugraph-ops CSR description of `gview` together with an upper bound
+ * on its maximum vertex degree.
+ *
+ * @tparam IdxT Index type used by the view for both vertices and edges.
+ * @tparam WeightT Edge weight type of the view.
+ * @param gview Graph view to describe.
+ * @return Tuple of (fg_csr<IdxT>, max-degree bound); the bound is currently the largest
+ * value representable by IdxT rather than the true maximum degree.
+ */
+template <typename IdxT, typename WeightT>
+std::tuple<ops::gnn::graph::fg_csr<IdxT>, IdxT> get_graph_and_max_degree(
+  graph_view_t<IdxT, IdxT, WeightT, false, false> const& gview)
+{
+  // FIXME this is sufficient for now, but if there is a fast (cached) way
+  // of getting max degree, use that instead
+  // The bound uses IdxT (not a fixed int32_t) so it matches the tuple's element type and
+  // stays a valid upper bound when the view uses a wider index type.
+  IdxT max_degree = std::numeric_limits<IdxT>::max();
+  return std::make_tuple(get_graph(gview), max_degree);
+}
+
+}  // namespace detail
+}  // namespace cugraph