# Run configuration: trainer resources, input/output data, model selection,
# rollout (sampling and engine) settings, actor strategy, and ray_init options.
#
# NOTE(review): the nesting below is reconstructed from the section headers
# (keys that carry no value) and the order of the keys that follow them.
# Confirm it against the schema of the program that loads this file.

trainer:
  nnodes: 1
  n_gpus_per_node: 1

data:
  path: ./data/parquet/test.parquet
  prompt_key: prompt
  n_samples: 1
  output_path: ./checkpoints/grammar_generation.parquet
  batch_size: 1

model:
  path: deepseek-ai/DeepSeek-R1-Distill-Qwen-7B
  external_lib: null
  load_param: false
  load_param_path: null

rollout:
  name: vllm
  mode: sync
  # NOTE(review): temperature is 0.0 while do_sample is true further down;
  # confirm which of the two the selected rollout backend honours.
  temperature: 0.0
  top_k: -1
  top_p: 1.0
  max_loras: 1
  prompt_length: 1800
  response_length: 512

  dtype: bfloat16
  gpu_memory_utilization: 0.9
  ignore_eos: false
  enforce_eager: true
  free_cache_engine: true
  load_format: dummy_dtensor
  tensor_model_parallel_size: 1
  max_num_batched_tokens: 8192
  # NOTE(review): max_model_len equals prompt_length (1800), while
  # prompt_length + response_length is 2312. Confirm that the intended
  # context window leaves room for the response.
  max_model_len: 1800
  max_num_seqs: 1024
  log_prob_micro_batch_size: null
  log_prob_micro_batch_size_per_gpu: 1

  use_fire_sampling: false

  do_sample: true
  disable_log_stats: false
  enable_chunked_prefill: true
  n: 1

actor:
  strategy: fsdp
  ulysses_sequence_parallel_size: 1
  fsdp_config:
    fsdp_size: -1

ray_init:
  num_cpus: null