{ "model_style": "enc", "task": "multiarith", "trajectory_path": "data/discriminator_data/sampled_trajectories/multiarith-clean/llama-7b/trajectories.jsonl", "validation_split_percentage": 5, "max_len": 512, "n_examples": null, "dev_is_train": false, "invalid_prefix_prob": 0.0, "max_alignment_cost": 2.0, "step_aligner_model": "roscoe", "step_delimiter": null, "break_after_extra_step": false, "use_correct_samples": false }