Skip to content

Commit 91e6b92

Browse files
authored
[CI] revert skip and shm size (#7487)
1 parent c74a5c8 commit 91e6b92

File tree

2 files changed: +23 -18 lines changed

2 files changed

+23
-18
lines changed

Jenkinsfile

+1 -1
Original file line number | Diff line number | Diff line change
@@ -575,7 +575,7 @@ pipeline {
575575
docker {
576576
label "dgl-ci-linux-cpu"
577577
image "dgllib/dgl-ci-cpu:v240511_1440"
578-
args "-u root --shm-size=32gb"
578+
args "-u root --shm-size=8gb"
579579
alwaysPull true
580580
}
581581
}

tests/distributed/test_mp_dataloader.py

+22 -17
Original file line number | Diff line number | Diff line change
@@ -3,6 +3,7 @@
33
import tempfile
44
import time
55
import unittest
6+
import uuid
67

78
import backend as F
89
import dgl
@@ -121,8 +122,9 @@ def start_dist_dataloader(
121122
num_nodes_to_sample = 202
122123
batch_size = 32
123124
train_nid = th.arange(num_nodes_to_sample)
125+
graph_name = os.path.splitext(os.path.basename(part_config))[0]
124126
dist_graph = DistGraph(
125-
"test_sampling",
127+
graph_name,
126128
gpb=gpb,
127129
part_config=part_config,
128130
)
@@ -204,17 +206,17 @@ def test_standalone():
204206
print(g.idtype)
205207
num_parts = 1
206208
num_hops = 1
207-
209+
graph_name = f"graph_{uuid.uuid4()}"
208210
orig_nid, orig_eid = partition_graph(
209211
g,
210-
"test_sampling",
212+
graph_name,
211213
num_parts,
212214
test_dir,
213215
num_hops=num_hops,
214216
part_method="metis",
215217
return_mapping=True,
216218
)
217-
part_config = os.path.join(test_dir, "test_sampling.json")
219+
part_config = os.path.join(test_dir, f"{graph_name}.json")
218220
os.environ["DGL_DIST_MODE"] = "standalone"
219221
try:
220222
start_dist_dataloader(
@@ -243,7 +245,8 @@ def start_dist_neg_dataloader(
243245
_, _, _, gpb, _, _, _ = load_partition(part_config, rank)
244246
num_edges_to_sample = 202
245247
batch_size = 32
246-
dist_graph = DistGraph("test_mp", gpb=gpb, part_config=part_config)
248+
graph_name = os.path.splitext(os.path.basename(part_config))[0]
249+
dist_graph = DistGraph(graph_name, gpb=gpb, part_config=part_config)
247250
assert len(dist_graph.ntypes) == len(groundtruth_g.ntypes)
248251
assert len(dist_graph.etypes) == len(groundtruth_g.etypes)
249252
if len(dist_graph.etypes) == 1:
@@ -304,16 +307,17 @@ def check_neg_dataloader(g, num_server, num_workers):
304307

305308
num_parts = num_server
306309
num_hops = 1
310+
graph_name = f"graph_{uuid.uuid4()}"
307311
orig_nid, orig_eid = partition_graph(
308312
g,
309-
"test_sampling",
313+
graph_name,
310314
num_parts,
311315
test_dir,
312316
num_hops=num_hops,
313317
part_method="metis",
314318
return_mapping=True,
315319
)
316-
part_config = os.path.join(test_dir, "test_sampling.json")
320+
part_config = os.path.join(test_dir, f"{graph_name}.json")
317321
if not isinstance(orig_nid, dict):
318322
orig_nid = {g.ntypes[0]: orig_nid}
319323
if not isinstance(orig_eid, dict):
@@ -380,10 +384,10 @@ def test_dist_dataloader(num_server, num_workers, use_graphbolt, return_eids):
380384
g = CitationGraphDataset("cora")[0]
381385
num_parts = num_server
382386
num_hops = 1
383-
387+
graph_name = f"graph_{uuid.uuid4()}"
384388
orig_nid, orig_eid = partition_graph(
385389
g,
386-
"test_sampling",
390+
graph_name,
387391
num_parts,
388392
test_dir,
389393
num_hops=num_hops,
@@ -393,7 +397,7 @@ def test_dist_dataloader(num_server, num_workers, use_graphbolt, return_eids):
393397
store_eids=return_eids,
394398
)
395399

396-
part_config = os.path.join(test_dir, "test_sampling.json")
400+
part_config = os.path.join(test_dir, f"{graph_name}.json")
397401
pserver_list = []
398402
ctx = mp.get_context("spawn")
399403
for i in range(num_server):
@@ -461,8 +465,9 @@ def start_node_dataloader(
461465
_, _, _, gpb, _, _, _ = load_partition(part_config, rank)
462466
num_nodes_to_sample = 202
463467
batch_size = 32
468+
graph_name = os.path.splitext(os.path.basename(part_config))[0]
464469
dist_graph = DistGraph(
465-
"test_sampling",
470+
graph_name,
466471
gpb=gpb,
467472
part_config=part_config,
468473
)
@@ -580,7 +585,8 @@ def start_edge_dataloader(
580585
_, _, _, gpb, _, _, _ = load_partition(part_config, rank)
581586
num_edges_to_sample = 202
582587
batch_size = 32
583-
dist_graph = DistGraph("test_sampling", gpb=gpb, part_config=part_config)
588+
graph_name = os.path.splitext(os.path.basename(part_config))[0]
589+
dist_graph = DistGraph(graph_name, gpb=gpb, part_config=part_config)
584590
assert len(dist_graph.ntypes) == len(groundtruth_g.ntypes)
585591
assert len(dist_graph.etypes) == len(groundtruth_g.etypes)
586592
if len(dist_graph.etypes) == 1:
@@ -767,9 +773,10 @@ def check_dataloader(
767773

768774
num_parts = num_server
769775
num_hops = 1
776+
graph_name = f"graph_{uuid.uuid4()}"
770777
orig_nid, orig_eid = partition_graph(
771778
g,
772-
"test_sampling",
779+
graph_name,
773780
num_parts,
774781
test_dir,
775782
num_hops=num_hops,
@@ -778,7 +785,7 @@ def check_dataloader(
778785
use_graphbolt=use_graphbolt,
779786
store_eids=return_eids,
780787
)
781-
part_config = os.path.join(test_dir, "test_sampling.json")
788+
part_config = os.path.join(test_dir, f"{graph_name}.json")
782789
if not isinstance(orig_nid, dict):
783790
orig_nid = {g.ntypes[0]: orig_nid}
784791
if not isinstance(orig_eid, dict):
@@ -900,7 +907,6 @@ def test_dataloader_homograph(
900907
)
901908

902909

903-
@unittest.skip(reason="Skip due to glitch in CI")
904910
@pytest.mark.parametrize("num_workers", [0])
905911
@pytest.mark.parametrize("use_graphbolt", [False, True])
906912
@pytest.mark.parametrize("exclude", [None, "self", "reverse_id"])
@@ -950,7 +956,6 @@ def test_dataloader_homograph_prob_or_mask(
950956
)
951957

952958

953-
@unittest.skip(reason="Skip due to glitch in CI")
954959
@pytest.mark.parametrize("num_server", [1])
955960
@pytest.mark.parametrize("num_workers", [0, 1])
956961
@pytest.mark.parametrize("dataloader_type", ["node", "edge"])
@@ -1097,7 +1102,7 @@ def test_multiple_dist_dataloaders(
10971102
generate_ip_config(ip_config, num_parts, num_servers)
10981103

10991104
orig_g = dgl.rand_graph(1000, 10000)
1100-
graph_name = "test_multiple_dataloaders"
1105+
graph_name = f"graph_{uuid.uuid4()}"
11011106
partition_graph(
11021107
orig_g,
11031108
graph_name,

0 commit comments

Comments
 (0)