File tree Expand file tree Collapse file tree 4 files changed +137
-82
lines changed
Expand file tree Collapse file tree 4 files changed +137
-82
lines changed Original file line number Diff line number Diff line change @@ -36,7 +36,7 @@ run_test() {
3636
3737# This test is intentionally not run with uv run --no-sync to verify that the frozen environment is working correctly.
3838run_test bash ./tests/functional/grpo_frozen_env.sh
39- run_test fast bash ./tests/functional/test_frozen_env.sh
39+ run_test bash ./tests/functional/test_frozen_env.sh
4040
4141run_test fast uv run --no-sync bash ./tests/functional/distillation.sh
4242run_test uv run --no-sync bash ./tests/functional/distillation_megatron.sh
@@ -58,7 +58,7 @@ run_test uv run --no-sync bash ./tests/functional/grpo_non_colocated.sh
5858run_test uv run --no-sync bash ./tests/functional/grpo_rm_env.sh
5959run_test uv run --no-sync bash ./tests/functional/grpo_sglang.sh
6060run_test uv run --no-sync bash ./tests/functional/prorlv2.sh
61- run_test fast uv run --no-sync bash ./tests/functional/rm.sh
61+ run_test uv run --no-sync bash ./tests/functional/rm.sh
6262run_test fast uv run --no-sync bash ./tests/functional/sft.sh
6363run_test uv run --no-sync bash ./tests/functional/sft_automodel_lora.sh
6464run_test uv run --no-sync bash ./tests/functional/sft_avlm.sh
Original file line number Diff line number Diff line change @@ -26,16 +26,16 @@ uv run coverage run -a --data-file=$PROJECT_ROOT/tests/.coverage --source=$PROJE
2626 policy.model_name=Qwen/Qwen3-0.6B \
2727 teacher.model_name=Qwen/Qwen3-0.6B \
2828 cluster.gpus_per_node=2 \
29- policy.train_global_batch_size=16 \
29+ policy.train_global_batch_size=8 \
3030 policy.dtensor_cfg.tensor_parallel_size=1 \
3131 policy.dtensor_cfg.context_parallel_size=2 \
32- policy.max_total_sequence_length=2048 \
32+ policy.max_total_sequence_length=256 \
3333 teacher.dtensor_cfg.tensor_parallel_size=2 \
3434 teacher.dtensor_cfg.context_parallel_size=1 \
3535 distillation.max_num_steps=3 \
3636 distillation.num_prompts_per_step=16 \
37- distillation.max_val_samples=16 \
38- distillation.val_batch_size=8 \
37+ distillation.max_val_samples=2 \
38+ distillation.val_batch_size=4 \
3939 distillation.val_period=3 \
4040 data.train.dataset_name=OpenMathInstruct-2 \
4141 ++data.train.split_validation_size=0.05 \
Original file line number Diff line number Diff line change @@ -27,7 +27,7 @@ uv run coverage run -a --data-file=$PROJECT_ROOT/tests/.coverage --source=$PROJE
2727 policy.train_global_batch_size=4 \
2828 policy.train_micro_batch_size=1 \
2929 cluster.gpus_per_node=2 \
30- grpo.max_num_steps=20 \
30+ grpo.max_num_steps=5 \
3131 grpo.async_grpo.enabled=true \
3232 grpo.async_grpo.max_trajectory_age_steps=1 \
3333 policy.generation.vllm_cfg.async_engine=true \
You can’t perform that action at this time.
0 commit comments