Skip to content
This repository was archived by the owner on Jan 12, 2026. It is now read-only.

Commit 9c8652b

Browse files
authored
Improve examples (#180)
1 parent 1ee4a18 commit 9c8652b

File tree

3 files changed: 6 additions and 9 deletions.

3 files changed: 6 additions and 9 deletions.

xgboost_ray/examples/higgs.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -53,7 +53,7 @@ def main():
5353
config,
5454
dtrain,
5555
evals_result=evals_result,
56-
ray_params=RayParams(max_actor_restarts=1),
56+
ray_params=RayParams(max_actor_restarts=1, num_actors=1),
5757
num_boost_round=100,
5858
evals=[(dtrain, "train")])
5959
taken = time.time() - start

xgboost_ray/examples/higgs_parquet.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -5,8 +5,8 @@
55
import pyarrow as pa
66
import pyarrow.parquet as pq
77

8-
from .higgs import download_higgs
9-
from xgboost_ray import train, RayDMatrix
8+
from higgs import download_higgs
9+
from xgboost_ray import train, RayDMatrix, RayParams
1010

1111
FILENAME_CSV = "HIGGS.csv.gz"
1212
FILENAME_PARQUET = "HIGGS.parquet"
@@ -81,7 +81,7 @@ def main():
8181
config,
8282
dtrain,
8383
evals_result=evals_result,
84-
max_actor_restarts=1,
84+
ray_params=RayParams(max_actor_restarts=1, num_actors=1),
8585
num_boost_round=100,
8686
evals=[(dtrain, "train")])
8787
taken = time.time() - start

xgboost_ray/examples/simple_ray_dataset.py

Lines changed: 2 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -25,15 +25,12 @@ def main(cpus_per_actor, num_actors):
2525
# and current Ray master API
2626
if hasattr(ray.data, "from_pandas_refs"):
2727
# Generate Ray dataset from 4 partitions
28-
ray_ds = ray.data.from_pandas(np.split(data, 4))
28+
ray_ds = ray.data.from_pandas(data).repartition(num_actors)
2929
else:
3030
# Split into 4 partitions
31-
partitions = [ray.put(part) for part in np.split(data, 4)]
31+
partitions = [ray.put(part) for part in np.split(data, num_actors)]
3232
ray_ds = ray.data.from_pandas(partitions)
3333

34-
# Generate Ray dataset from 4 partitions
35-
ray_ds = ray.data.from_pandas(np.split(data, 4))
36-
3734
train_set = RayDMatrix(ray_ds, "label")
3835

3936
evals_result = {}

0 commit comments

Comments
 (0)