6
6
7
7
import ROOT
8
8
9
+ from collections import namedtuple
10
+
11
+ # Use a dummy execution identifier (exposing only `rdf_uuid`) as the `exec_id` argument when testing both empty-source balanced ranges and TTree-based clustered ranges
12
+ Dummy = namedtuple ("Dummy" , ["rdf_uuid" ])
9
13
10
14
def emptysourceranges_to_tuples (ranges ):
11
15
"""Convert EmptySourceRange objects to tuples with the shape (start, end)"""
@@ -34,11 +38,11 @@ def test_nentries_multipleOf_npartitions(self):
34
38
npartitions_large = 10
35
39
36
40
# First case
37
- rng = Ranges .get_balanced_ranges (nentries_small , npartitions_small , exec_id = None )
41
+ rng = Ranges .get_balanced_ranges (nentries_small , npartitions_small , exec_id = Dummy ( "dummy" ) )
38
42
ranges_small = emptysourceranges_to_tuples (rng )
39
43
40
44
# Second case
41
- rng = Ranges .get_balanced_ranges (nentries_large , npartitions_large , exec_id = None )
45
+ rng = Ranges .get_balanced_ranges (nentries_large , npartitions_large , exec_id = Dummy ( "dummy" ) )
42
46
ranges_large = emptysourceranges_to_tuples (rng )
43
47
44
48
ranges_small_reqd = [(0 , 2 ), (2 , 4 ), (4 , 6 ), (6 , 8 ), (8 , 10 )]
@@ -70,12 +74,12 @@ def test_nentries_not_multipleOf_npartitions(self):
70
74
71
75
# Example in which fractional part of
72
76
# (nentries/npartitions) >= 0.5
73
- rng = Ranges .get_balanced_ranges (nentries_1 , npartitions , exec_id = None )
77
+ rng = Ranges .get_balanced_ranges (nentries_1 , npartitions , exec_id = Dummy ( "dummy" ) )
74
78
ranges_1 = emptysourceranges_to_tuples (rng )
75
79
76
80
# Example in which fractional part of
77
81
# (nentries/npartitions) < 0.5
78
- rng = Ranges .get_balanced_ranges (nentries_2 , npartitions , exec_id = None )
82
+ rng = Ranges .get_balanced_ranges (nentries_2 , npartitions , exec_id = Dummy ( "dummy" ) )
79
83
ranges_2 = emptysourceranges_to_tuples (rng )
80
84
81
85
# Required output pairs
@@ -94,7 +98,7 @@ def test_nentries_greater_than_npartitions(self):
94
98
nentries = 5
95
99
npartitions = 7
96
100
97
- rng = Ranges .get_balanced_ranges (nentries , npartitions , exec_id = None )
101
+ rng = Ranges .get_balanced_ranges (nentries , npartitions , exec_id = Dummy ( "dummy" ) )
98
102
ranges = emptysourceranges_to_tuples (rng )
99
103
100
104
ranges_reqd = [(0 , 1 ), (1 , 2 ), (2 , 3 ), (3 , 4 ), (4 , 5 )]
@@ -157,7 +161,7 @@ def test_clustered_ranges_with_one_cluster(self):
157
161
filenames = ["backend/Slimmed_ntuple.root" ]
158
162
npartitions = 1
159
163
160
- percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = None )
164
+ percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = Dummy ( "dummy" ) )
161
165
clusteredranges = [Ranges .get_clustered_range_from_percs (percrange )[0 ] for percrange in percranges ]
162
166
163
167
ranges = treeranges_to_tuples (clusteredranges )
@@ -180,7 +184,7 @@ def test_npartitions_greater_than_clusters(self):
180
184
filenames = ["backend/Slimmed_ntuple.root" ]
181
185
npartitions = 2
182
186
183
- percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = None )
187
+ percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = Dummy ( "dummy" ) )
184
188
clusteredranges = [Ranges .get_clustered_range_from_percs (percrange )[0 ] for percrange in percranges ]
185
189
186
190
# We return one task per partition
@@ -204,7 +208,7 @@ def test_clustered_ranges_with_two_clusters_two_partitions(self):
204
208
filenames = ["backend/2clusters.root" ]
205
209
npartitions = 2
206
210
207
- percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = None )
211
+ percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = Dummy ( "dummy" ) )
208
212
clusteredranges = [Ranges .get_clustered_range_from_percs (percrange )[0 ] for percrange in percranges ]
209
213
ranges = treeranges_to_tuples (clusteredranges )
210
214
@@ -227,7 +231,7 @@ def test_rdataframe_with_treename_and_filename_with_globbing(self):
227
231
expected_inputfiles = ["backend/2clusters.root" ]
228
232
extracted_inputfiles = rdf .inputfiles
229
233
230
- percranges = Ranges .get_percentage_ranges ([treename ], extracted_inputfiles , npartitions , friendinfo = None , exec_id = None )
234
+ percranges = Ranges .get_percentage_ranges ([treename ], extracted_inputfiles , npartitions , friendinfo = None , exec_id = Dummy ( "dummy" ) )
231
235
clusteredranges = [Ranges .get_clustered_range_from_percs (percrange )[0 ] for percrange in percranges ]
232
236
ranges = treeranges_to_tuples (clusteredranges )
233
237
@@ -258,7 +262,7 @@ def test_rdataframe_with_notreename_and_chain_with_subtrees(self):
258
262
extracted_filenames = rdf .inputfiles
259
263
260
264
percranges = Ranges .get_percentage_ranges (
261
- extracted_subtreenames , extracted_filenames , npartitions , friendinfo = None , exec_id = None )
265
+ extracted_subtreenames , extracted_filenames , npartitions , friendinfo = None , exec_id = Dummy ( "dummy" ) )
262
266
clusteredranges = [Ranges .get_clustered_range_from_percs (percrange )[0 ] for percrange in percranges ]
263
267
ranges = treeranges_to_tuples (clusteredranges )
264
268
@@ -281,7 +285,7 @@ def test_clustered_ranges_with_four_clusters_four_partitions(self):
281
285
filenames = ["backend/4clusters.root" ]
282
286
npartitions = 4
283
287
284
- percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = None )
288
+ percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = Dummy ( "dummy" ) )
285
289
clusteredranges = [Ranges .get_clustered_range_from_percs (percrange )[0 ] for percrange in percranges ]
286
290
287
291
ranges = treeranges_to_tuples (clusteredranges )
@@ -304,7 +308,7 @@ def test_clustered_ranges_with_many_clusters_four_partitions(self):
304
308
filenames = ["backend/1000clusters.root" ]
305
309
npartitions = 4
306
310
307
- percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = None )
311
+ percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = Dummy ( "dummy" ) )
308
312
clusteredranges = [Ranges .get_clustered_range_from_percs (percrange )[0 ] for percrange in percranges ]
309
313
310
314
ranges = treeranges_to_tuples (clusteredranges )
@@ -327,7 +331,7 @@ def test_clustered_ranges_with_many_clusters_many_partitions(self):
327
331
filenames = ["backend/1000clusters.root" ]
328
332
npartitions = 1000
329
333
330
- percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = None )
334
+ percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = Dummy ( "dummy" ) )
331
335
clusteredranges = [Ranges .get_clustered_range_from_percs (percrange )[0 ] for percrange in percranges ]
332
336
333
337
ranges = treeranges_to_tuples (clusteredranges )
@@ -349,7 +353,7 @@ def test_clustered_ranges_with_two_files(self):
349
353
filenames = ["backend/2clusters.root" , "backend/4clusters.root" ]
350
354
npartitions = 2
351
355
352
- percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = None )
356
+ percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = Dummy ( "dummy" ) )
353
357
clusteredranges = [Ranges .get_clustered_range_from_percs (percrange )[0 ] for percrange in percranges ]
354
358
355
359
ranges = treeranges_to_tuples (clusteredranges )
@@ -366,7 +370,7 @@ def test_three_files_one_partition(self):
366
370
filenames = [f"distrdf_unittests_file_{ i } .root" for i in range (nfiles )]
367
371
npartitions = 1
368
372
369
- percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = None )
373
+ percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = Dummy ( "dummy" ) )
370
374
clusteredranges = [Ranges .get_clustered_range_from_percs (percrange )[0 ] for percrange in percranges ]
371
375
372
376
ranges = treeranges_to_tuples (clusteredranges )
@@ -382,7 +386,7 @@ def test_three_files_one_partition_per_file(self):
382
386
filenames = [f"distrdf_unittests_file_{ i } .root" for i in range (nfiles )]
383
387
npartitions = nfiles
384
388
385
- percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = None )
389
+ percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = Dummy ( "dummy" ) )
386
390
clusteredranges = [Ranges .get_clustered_range_from_percs (percrange )[0 ] for percrange in percranges ]
387
391
388
392
ranges = treeranges_to_tuples (clusteredranges )
@@ -398,7 +402,7 @@ def test_three_files_two_partitions_per_file(self):
398
402
treenames = [f"tree_{ i } " for i in range (nfiles )]
399
403
filenames = [f"distrdf_unittests_file_{ i } .root" for i in range (nfiles )]
400
404
npartitions = nfiles * 2
401
- percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = None )
405
+ percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = Dummy ( "dummy" ) )
402
406
clusteredranges = [Ranges .get_clustered_range_from_percs (percrange )[0 ] for percrange in percranges ]
403
407
404
408
ranges = treeranges_to_tuples (clusteredranges )
@@ -425,7 +429,7 @@ def test_three_files_partitions_equal_clusters(self):
425
429
filenames = [f"distrdf_unittests_file_{ i } .root" for i in range (nfiles )]
426
430
npartitions = nfiles * 10 # trees have 10 clusters
427
431
428
- percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = None )
432
+ percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = Dummy ( "dummy" ) )
429
433
clusteredranges = [Ranges .get_clustered_range_from_percs (percrange )[0 ] for percrange in percranges ]
430
434
431
435
ranges = treeranges_to_tuples (clusteredranges )
@@ -473,7 +477,7 @@ def test_three_files_partitions_greater_than_clusters(self):
473
477
filenames = [f"distrdf_unittests_file_{ i } .root" for i in range (nfiles )]
474
478
npartitions = 42
475
479
476
- percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = None )
480
+ percranges = Ranges .get_percentage_ranges (treenames , filenames , npartitions , friendinfo = None , exec_id = Dummy ( "dummy" ) )
477
481
clusteredranges = [Ranges .get_clustered_range_from_percs (percrange )[0 ] for percrange in percranges ]
478
482
479
483
# We return one task per partition
0 commit comments