Skip to content

Commit

Permalink
[FEA] New Graph Interface and Loaders for Distributed Sampling in DGL (
Browse files Browse the repository at this point in the history
…#4486)

- [x] New Graph class that duck-types `DGLGraph`
- [x] New WholeGraph feature store that implements DGL's `FeatureStorage`
- [x] New Sampler interface
- [x] New Loader interface
- [x] New Sampler for distributed uniform neighbor sampling without dask
- [x] New Loader for distributed uniform neighbor sampling without dask

This PR also adds `pydantic` and `torchdata` as test dependencies of cuGraph-DGL, because they are unlisted runtime dependencies of the latest version of DGL (which we will be testing with in the new `cugraph-gnn` repository).

This PR also changes the test file structure to match the rest of cuGraph, by using the __mg_ suffix to denote multi-GPU tests and moving them to the main directory under "tests".

New examples will be added in a future PR.  This PR is just for basic functionality and tests.

Closes #3805 
Closes rapidsai/cugraph-gnn#4
Closes #4400
Closes #4247
Closes #3303

Authors:
  - Alex Barghi (https://github.com/alexbarghi-nv)
  - Ralph Liu (https://github.com/nv-rliu)

Approvers:
  - Vibhu Jawa (https://github.com/VibhuJawa)
  - Ray Douglass (https://github.com/raydouglass)
  - Rick Ratzel (https://github.com/rlratzel)

URL: #4486
  • Loading branch information
alexbarghi-nv authored Jul 31, 2024
1 parent d77a2d6 commit b38e010
Show file tree
Hide file tree
Showing 39 changed files with 3,464 additions and 376 deletions.
2 changes: 2 additions & 0 deletions conda/environments/all_cuda-118_arch-x86_64.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -46,6 +46,7 @@ dependencies:
- packaging>=21
- pandas
- pre-commit
- pydantic
- pydata-sphinx-theme
- pylibcugraphops==24.8.*,>=0.0.0a0
- pylibraft==24.8.*,>=0.0.0a0
Expand All @@ -72,6 +73,7 @@ dependencies:
- sphinx<6
- sphinxcontrib-websupport
- thriftpy2!=0.5.0,!=0.5.1
- torchdata
- ucx-proc=*=gpu
- ucx-py==0.39.*,>=0.0.0a0
- wget
Expand Down
2 changes: 2 additions & 0 deletions conda/environments/all_cuda-125_arch-x86_64.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -51,6 +51,7 @@ dependencies:
- packaging>=21
- pandas
- pre-commit
- pydantic
- pydata-sphinx-theme
- pylibcugraphops==24.8.*,>=0.0.0a0
- pylibraft==24.8.*,>=0.0.0a0
Expand All @@ -77,6 +78,7 @@ dependencies:
- sphinx<6
- sphinxcontrib-websupport
- thriftpy2!=0.5.0,!=0.5.1
- torchdata
- ucx-proc=*=gpu
- ucx-py==0.39.*,>=0.0.0a0
- wget
Expand Down
4 changes: 3 additions & 1 deletion conda/recipes/cugraph-dgl/meta.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -28,8 +28,10 @@ requirements:
- numba >=0.57
- numpy >=1.23,<2.0a0
- pylibcugraphops ={{ minor_version }}
- tensordict >=0.1.2
- python
- pytorch
- pytorch >=2.0
- cupy >=12.0.0

tests:
imports:
Expand Down
5 changes: 4 additions & 1 deletion dependencies.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -659,6 +659,7 @@ dependencies:
- *cugraph_unsuffixed
- pytorch>=2.0
- pytorch-cuda==11.8
- &tensordict tensordict>=0.1.2
- dgl>=1.1.0.cu*
cugraph_pyg_dev:
common:
Expand All @@ -667,14 +668,16 @@ dependencies:
- *cugraph_unsuffixed
- pytorch>=2.0
- pytorch-cuda==11.8
- &tensordict tensordict>=0.1.2
- *tensordict
- pyg>=2.5,<2.6

depends_on_pytorch:
common:
- output_types: [conda]
packages:
- &pytorch_unsuffixed pytorch>=2.0,<2.2.0a0
- torchdata
- pydantic

specific:
- output_types: [requirements]
Expand Down
1 change: 1 addition & 0 deletions python/cugraph-dgl/conda/cugraph_dgl_dev_cuda-118.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -21,4 +21,5 @@ dependencies:
- pytorch-cuda==11.8
- pytorch>=2.0
- scipy
- tensordict>=0.1.2
name: cugraph_dgl_dev_cuda-118
8 changes: 6 additions & 2 deletions python/cugraph-dgl/cugraph_dgl/__init__.py
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
# Copyright (c) 2019-2023, NVIDIA CORPORATION.
# Copyright (c) 2019-2024, NVIDIA CORPORATION.
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
Expand All @@ -15,8 +15,12 @@

# to prevent rapids context being created when importing cugraph_dgl
os.environ["RAPIDS_NO_INITIALIZE"] = "1"
from cugraph_dgl.graph import Graph
from cugraph_dgl.cugraph_storage import CuGraphStorage
from cugraph_dgl.convert import cugraph_storage_from_heterograph
from cugraph_dgl.convert import (
cugraph_storage_from_heterograph,
cugraph_dgl_graph_from_heterograph,
)
import cugraph_dgl.dataloading
import cugraph_dgl.nn

Expand Down
54 changes: 53 additions & 1 deletion python/cugraph-dgl/cugraph_dgl/convert.py
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
# Copyright (c) 2022-2023, NVIDIA CORPORATION.
# Copyright (c) 2022-2024, NVIDIA CORPORATION.
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
Expand All @@ -12,6 +12,8 @@
# limitations under the License.
from __future__ import annotations
from cugraph.utilities.utils import import_optional

import cugraph_dgl
from cugraph_dgl import CuGraphStorage
from cugraph_dgl.utils.cugraph_conversion_utils import (
get_edges_dict_from_dgl_HeteroGraph,
Expand Down Expand Up @@ -39,3 +41,53 @@ def cugraph_storage_from_heterograph(
add_ndata_from_dgl_HeteroGraph(gs, g)
add_edata_from_dgl_HeteroGraph(gs, g)
return gs


def cugraph_dgl_graph_from_heterograph(
input_graph: dgl.DGLGraph,
single_gpu: bool = True,
ndata_storage: str = "torch",
edata_storage: str = "torch",
**kwargs,
) -> cugraph_dgl.Graph:
"""
Converts a DGL Graph to a cuGraph-DGL Graph.
"""

output_graph = cugraph_dgl.Graph(
is_multi_gpu=(not single_gpu),
ndata_storage=ndata_storage,
edata_storage=edata_storage,
**kwargs,
)

# Calling is_homogeneous does not work here
if len(input_graph.ntypes) <= 1:
output_graph.add_nodes(
input_graph.num_nodes(), data=input_graph.ndata, ntype=input_graph.ntypes[0]
)
else:
for ntype in input_graph.ntypes:
data = {
k: v_dict[ntype]
for k, v_dict in input_graph.ndata.items()
if ntype in v_dict
}
output_graph.add_nodes(input_graph.num_nodes(ntype), data=data, ntype=ntype)

if len(input_graph.canonical_etypes) <= 1:
can_etype = input_graph.canonical_etypes[0]
src_t, dst_t = input_graph.edges(form="uv", etype=can_etype)
output_graph.add_edges(src_t, dst_t, input_graph.edata, etype=can_etype)
else:
for can_etype in input_graph.canonical_etypes:
data = {
k: v_dict[can_etype]
for k, v_dict in input_graph.edata.items()
if can_etype in v_dict
}

src_t, dst_t = input_graph.edges(form="uv", etype=can_etype)
output_graph.add_edges(src_t, dst_t, data=data, etype=can_etype)

return output_graph
20 changes: 18 additions & 2 deletions python/cugraph-dgl/cugraph_dgl/dataloading/__init__.py
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
# Copyright (c) 2019-2023, NVIDIA CORPORATION.
# Copyright (c) 2019-2024, NVIDIA CORPORATION.
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
Expand All @@ -11,9 +11,25 @@
# See the License for the specific language governing permissions and
# limitations under the License.

import warnings

from cugraph_dgl.dataloading.dataset import (
HomogenousBulkSamplerDataset,
HeterogenousBulkSamplerDataset,
)

from cugraph_dgl.dataloading.sampler import Sampler
from cugraph_dgl.dataloading.neighbor_sampler import NeighborSampler
from cugraph_dgl.dataloading.dataloader import DataLoader

from cugraph_dgl.dataloading.dask_dataloader import DaskDataLoader
from cugraph_dgl.dataloading.dataloader import DataLoader as FutureDataLoader


def DataLoader(*args, **kwargs):
warnings.warn(
"DataLoader has been renamed to DaskDataLoader. "
"In Release 24.10, cugraph_dgl.dataloading.FutureDataLoader "
"will take over the DataLoader name.",
FutureWarning,
)
return DaskDataLoader(*args, **kwargs)
Loading

0 comments on commit b38e010

Please sign in to comment.