From b9437ea2cf5f763ae6f9eb0bcf52009d0b8a84cb Mon Sep 17 00:00:00 2001
From: Alexandria Barghi <abarghi@nvidia.com>
Date: Wed, 11 Dec 2024 07:43:19 -0800
Subject: [PATCH] fix bulk sampler tests, re-enable other tests

---
 python/cugraph/cugraph/tests/sampling/test_bulk_sampler.py  | 6 +++---
 .../cugraph/cugraph/tests/sampling/test_bulk_sampler_mg.py  | 6 +++---
 .../cugraph/cugraph/tests/sampling/test_dist_sampler_mg.py  | 2 --
 3 files changed, 6 insertions(+), 8 deletions(-)

diff --git a/python/cugraph/cugraph/tests/sampling/test_bulk_sampler.py b/python/cugraph/cugraph/tests/sampling/test_bulk_sampler.py
index 765c6ef893..54e159012e 100644
--- a/python/cugraph/cugraph/tests/sampling/test_bulk_sampler.py
+++ b/python/cugraph/cugraph/tests/sampling/test_bulk_sampler.py
@@ -282,7 +282,7 @@ def test_bulk_sampler_empty_batches(scratch_dir):
     # [7, 8, 9] have no outgoing edges. The previous implementation returned and
     # offsets array omitting seeds with no outgoing edges from the
     # edge_label_offsets which is no longer the case
-    df = cudf.read_parquet(os.path.join(samples_path, "batch=0-2.parquet"))
+    df = cudf.read_parquet(os.path.join(samples_path, "batch=0-1.parquet"))
 
     assert df[
         (df.batch_id == 0) & (df.hop_id == 0)
@@ -293,12 +293,12 @@ def test_bulk_sampler_empty_batches(scratch_dir):
     ].destinations.sort_values().values_host.tolist() == [2, 3, 7, 8]
 
     assert df[
-        (df.batch_id == 2) & (df.hop_id == 0)
+        (df.batch_id == 1) & (df.hop_id == 0)
     ].destinations.sort_values().values_host.tolist() == [7, 8]
 
     assert len(df[(df.batch_id == 1) & (df.hop_id == 1)]) == 0
 
-    assert df.batch_id.max() == 2
+    assert df.batch_id.max() == 1
 
     shutil.rmtree(samples_path)
 
diff --git a/python/cugraph/cugraph/tests/sampling/test_bulk_sampler_mg.py b/python/cugraph/cugraph/tests/sampling/test_bulk_sampler_mg.py
index 77db37d4b9..f16b78a40a 100644
--- a/python/cugraph/cugraph/tests/sampling/test_bulk_sampler_mg.py
+++ b/python/cugraph/cugraph/tests/sampling/test_bulk_sampler_mg.py
@@ -232,7 +232,7 @@ def test_bulk_sampler_empty_batches(dask_client, scratch_dir):
     # [7, 8, 9] have no outgoing edges. The previous implementation returned and
     # offsets array omitting seeds with no outgoing edges from the
     # edge_label_offsets which is no longer the case
-    df = cudf.read_parquet(os.path.join(samples_path, "batch=0-2.parquet"))
+    df = cudf.read_parquet(os.path.join(samples_path, "batch=0-1.parquet"))
 
     assert df[
         (df.batch_id == 0) & (df.hop_id == 0)
@@ -243,12 +243,12 @@ def test_bulk_sampler_empty_batches(dask_client, scratch_dir):
     ].destinations.sort_values().values_host.tolist() == [2, 3, 7, 8]
 
     assert df[
-        (df.batch_id == 2) & (df.hop_id == 0)
+        (df.batch_id == 1) & (df.hop_id == 0)
     ].destinations.sort_values().values_host.tolist() == [7, 8]
 
     assert len(df[(df.batch_id == 1) & (df.hop_id == 1)]) == 0
 
-    assert df.batch_id.max() == 2
+    assert df.batch_id.max() == 1
 
     shutil.rmtree(samples_path)
 
diff --git a/python/cugraph/cugraph/tests/sampling/test_dist_sampler_mg.py b/python/cugraph/cugraph/tests/sampling/test_dist_sampler_mg.py
index 281c259c2e..ee6f64ef9e 100644
--- a/python/cugraph/cugraph/tests/sampling/test_dist_sampler_mg.py
+++ b/python/cugraph/cugraph/tests/sampling/test_dist_sampler_mg.py
@@ -116,7 +116,6 @@ def run_test_dist_sampler_simple(
 @pytest.mark.parametrize("batch_size", [1, 4])
 @pytest.mark.parametrize("seeds_per_rank", [8, 1])
 @pytest.mark.parametrize("seeds_per_call", [4, 8])
-@pytest.mark.skip("bleh")
 @pytest.mark.skipif(isinstance(torch, MissingModule), reason="torch not installed")
 def test_dist_sampler_simple(
     scratch_dir, batch_size, seeds_per_rank, fanout, equal_input_size, seeds_per_call
@@ -304,7 +303,6 @@ def run_test_dist_sampler_buffered_in_memory(
 @pytest.mark.skipif(isinstance(torch, MissingModule), reason="torch not available")
 @pytest.mark.parametrize("seeds_per_call", [4, 5, 10])
 @pytest.mark.parametrize("compression", ["COO", "CSR"])
-@pytest.mark.skip(reason="bleh")
 def test_dist_sampler_buffered_in_memory(scratch_dir, seeds_per_call, compression):
     uid = cugraph_comms_create_unique_id()