|
| 1 | +# pytest -s tests/integration_tests/test_policy_update.py::TestWeightSync::test_sanity_check --config tests/integration_tests/fixtures/qwen3_30b_a3b.yaml |
| 2 | + |
| 3 | +# Topology: trainer tp = 1 on 4 procs (data_parallel_shard_degree = -1); generator tp = 4 on 4 procs |
| 4 | + |
| 5 | +# Global configuration |
| 6 | +group_size: 8 |
| 7 | +batch_size: 2 |
| 8 | +max_req_tokens: 256 |
| 9 | +max_res_tokens: 256 |
| 10 | +model: "Qwen/Qwen3-30B-A3B" |
| 11 | +off_by_n: 1 # Off by one by default |
| 12 | +compile: false # When true: enables torch.compile for the trainer and CUDA graphs for vLLM (enforce_eager is set to the negation of this flag) |
| 13 | + |
| 14 | + |
| 15 | +# Generator configuration |
| 16 | +generator: |
| 17 | + engine_args: |
| 18 | + model: ${model} |
| 19 | + tensor_parallel_size: 4 |
| 20 | + pipeline_parallel_size: 1 |
| 21 | + enforce_eager: ${not:${compile}} |
| 22 | + sampling_params: |
| 23 | + n: ${group_size} |
| 24 | + max_tokens: ${max_res_tokens} |
| 25 | + temperature: 1.0 |
| 26 | + top_p: 1.0 |
| 27 | + |
| 28 | +# Trainer configuration |
| 29 | +trainer: |
| 30 | + model: |
| 31 | + name: qwen3 |
| 32 | + flavor: 30B-A3B |
| 33 | + hf_assets_path: hf://${model} |
| 34 | + optimizer: |
| 35 | + name: AdamW |
| 36 | + lr: 1e-5 |
| 37 | + eps: 1e-8 |
| 38 | + lr_scheduler: |
| 39 | + warmup_steps: 1 |
| 40 | + training: |
| 41 | + local_batch_size: ${batch_size} |
| 42 | + seq_len: ${sum:${max_req_tokens},${max_res_tokens}} # must be >= max_req_tokens + max_res_tokens; set to exactly their sum here |
| 43 | + max_norm: 1.0 |
| 44 | + steps: 1000000 |
| 45 | + dtype: bfloat16 |
| 46 | + gc_freq: 1 |
| 47 | + compile: |
| 48 | + enable: ${compile} |
| 49 | + parallelism: |
| 50 | + data_parallel_replicate_degree: 1 |
| 51 | + data_parallel_shard_degree: -1 |
| 52 | + tensor_parallel_degree: 1 |
| 53 | + pipeline_parallel_degree: 1 |
| 54 | + context_parallel_degree: 1 |
| 55 | + expert_parallel_degree: 1 |
| 56 | + expert_tensor_parallel_degree: 1 |
| 57 | + disable_loss_parallel: true |
| 58 | + checkpoint: |
| 59 | + enable: true |
| 60 | + initial_load_path: hf://${model} |
| 61 | + initial_load_in_hf: true |
| 62 | + last_save_in_hf: true |
| 63 | + interval: 500 |
| 64 | + async_mode: "disabled" |
| 65 | + activation_checkpoint: |
| 66 | + mode: selective |
| 67 | + selective_ac_option: op |
| 68 | + |
| 69 | +# All resource allocations |
| 70 | +services: |
| 71 | + generator: |
| 72 | + procs: ${generator.engine_args.tensor_parallel_size} |
| 73 | + num_replicas: 1 |
| 74 | + with_gpus: true |
| 75 | + |
| 76 | +actors: |
| 77 | + trainer: |
| 78 | + procs: 4 |
| 79 | + num_replicas: 1 |
| 80 | + with_gpus: true |
0 commit comments