Skip to content

Commit 39edc60

Browse files
committed
update
1 parent 52761c7 commit 39edc60

File tree

1 file changed

+2
-2
lines changed
  • verl/experimental/reward_loop/reward_manager

1 file changed

+2
-2
lines changed

verl/experimental/reward_loop/reward_manager/remote.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -22,7 +22,7 @@
 from verl.utils.reward_score import default_compute_score
 
 
-@ray.remote
+@ray.remote(num_cpus=1)
 class RewardComputeWorker:
     """
     WARNING: This class cannot have async methods.
@@ -61,7 +61,7 @@ def __init__(self, config, tokenizer, compute_score=None, reward_router_address=
             RewardComputeWorker.options(
                 scheduling_strategy=ray.util.scheduling_strategies.NodeAffinitySchedulingStrategy(
                     node_id=ray.get_runtime_context().get_node_id(),
-                    soft=False,
+                    soft=True,
                 ),
             ).remote(self.compute_score)
             for _ in range(num_reward_workers)

0 commit comments

Comments
 (0)