Atari_EauDeQN / config.json
TheoVincent's picture
unique config.json
9bd27a8
{
"ONLINE PARAMETERS": "-------------------",
"online_shared_parameters": {
"replay_buffer_capacity": 1000000,
"batch_size": 32,
"update_horizon": 1,
"gamma": 0.99,
"learning_rate": 6.25e-05,
"horizon": 27000,
"n_epochs": 40,
"n_training_steps_per_epoch": 250000,
"n_initial_samples": 20000,
"epsilon_end": 0.01,
"epsilon_duration": 250000.0,
"target_update_frequency": 8000,
"update_to_data": 4.0,
"features": [
32,
64,
64,
"Feature Size"
],
"architecture_type": "cnn"
},
"eaudedqn": {
"n_networks": 5,
"max_noise": 3.0,
"max_speed": 0.01,
"reset_optimizer": true
},
"polyprunedqn": {
"sparcity_start_step": 2000000,
"sparcity_end_step": 8000000,
"sparcity_update_freq": 4000,
"final_sparsity": 0.95
},
"dqn": {},
"OFFLINE PARAMETERS": "-------------------",
"offline_shared_parameters": {
"features": [
32,
64,
64,
"Feature Size"
],
"replay_buffer_capacity": 50000,
"batch_size": 32,
"update_horizon": 1,
"gamma": 0.99,
"learning_rate": 5e-05,
"architecture_type": "cnn",
"target_update_frequency": 2000,
"n_buffers_to_load": 5,
"n_epochs": 50,
"n_fitting_steps": 62500
},
"eaudecql": {
"n_networks": 5,
"max_noise": 3.0,
"max_speed": 0.01,
"reset_optimizer": true,
"alpha_cql": 0.1
},
"polyprunecql": {
"sparcity_start_step": 625000,
"sparcity_end_step": 2500000,
"sparcity_update_freq": 1000,
"final_sparsity": 0.95,
"alpha_cql": 0.1
},
"cql": {
"alpha_cql": 0.1
}
}