{ "ONLINE PARAMETERS": "-------------------", "online_shared_parameters": { "replay_buffer_capacity": 1000000, "batch_size": 32, "update_horizon": 1, "gamma": 0.99, "learning_rate": 6.25e-05, "horizon": 27000, "n_epochs": 40, "n_training_steps_per_epoch": 250000, "n_initial_samples": 20000, "epsilon_end": 0.01, "epsilon_duration": 250000.0, "target_update_frequency": 8000, "update_to_data": 4.0, "features": [ 32, 64, 64, "Feature Size" ], "architecture_type": "cnn" }, "eaudedqn": { "n_networks": 5, "max_noise": 3.0, "max_speed": 0.01, "reset_optimizer": true }, "polyprunedqn": { "sparcity_start_step": 2000000, "sparcity_end_step": 8000000, "sparcity_update_freq": 4000, "final_sparsity": 0.95 }, "dqn": {}, "OFFLINE PARAMETERS": "-------------------", "offline_shared_parameters": { "features": [ 32, 64, 64, "Feature Size" ], "replay_buffer_capacity": 50000, "batch_size": 32, "update_horizon": 1, "gamma": 0.99, "learning_rate": 5e-05, "architecture_type": "cnn", "target_update_frequency": 2000, "n_buffers_to_load": 5, "n_epochs": 50, "n_fitting_steps": 62500 }, "eaudecql": { "n_networks": 5, "max_noise": 3.0, "max_speed": 0.01, "reset_optimizer": true, "alpha_cql": 0.1 }, "polyprunecql": { "sparcity_start_step": 625000, "sparcity_end_step": 2500000, "sparcity_update_freq": 1000, "final_sparsity": 0.95, "alpha_cql": 0.1 }, "cql": { "alpha_cql": 0.1 } }