Skip to content

Commit

Permalink
fix ci
Browse files (browse the repository at this point in the history)
  • Loading branch information
PeterSH6 committed Jan 16, 2025
1 parent 462c618 commit 1992e6d
Showing 1 changed file with 5 additions and 1 deletion.
6 changes: 5 additions & 1 deletion tests/e2e/arithmetic_sequence/rl/config/ray_trainer.yaml
Original file line number | Diff line number | Diff line change
Expand Up @@ -27,7 +27,8 @@ actor_rollout_ref:
clip_ratio: 0.2
entropy_coeff: 0.0
ppo_epochs: 1
- shuffle: True
+ shuffle: False
+ ulysses_sequence_parallel_size: 1 # sp size
optim:
lr: 1e-4
fsdp_config:
Expand All @@ -44,6 +45,7 @@ actor_rollout_ref:
# transformer_layer_cls_to_wrap: None
min_num_params: 0
micro_batch_size: 200
+ ulysses_sequence_parallel_size: ${actor_rollout_ref.actor.ulysses_sequence_parallel_size} # sp size
rollout:
name: hf
temperature: 1.0
Expand Down Expand Up @@ -89,6 +91,7 @@ critic:
ppo_mini_batch_size: ${actor_rollout_ref.actor.ppo_mini_batch_size}
ppo_micro_batch_size: 200
forward_micro_batch_size: ${critic.ppo_micro_batch_size}
+ ulysses_sequence_parallel_size: 1 # sp size
ppo_epochs: ${actor_rollout_ref.actor.ppo_epochs}
shuffle: ${actor_rollout_ref.actor.shuffle}
grad_clip: 1.0
Expand All @@ -112,6 +115,7 @@ reward_model:
min_num_params: 0
micro_batch_size: 8
max_length: null
+ ulysses_sequence_parallel_size: 1 # sp size

algorithm:
gamma: 1.0
Expand Down

0 comments on commit 1992e6d

Please sign in to comment.