# Repository: joyrl/joyrl-benchmarks
# File: ClassControl/Pendulum-v1/Test_single_Pendulum-v1_DDPG_20230527-120739/config.yaml
# Last commit: 56029d5 "update DDPG Pendulum-v1" by johnjim0816 (about 1 year ago)
# Size: 1.04 kB

	general_cfg:
	algo_name: DDPG
	collect_traj: false
	device: cuda
	env_name: gym
	load_checkpoint: true
	load_model_step: best
	load_path: Train_ray_Pendulum-v1_DDPG_20230527-001715
	max_episode: 10
	max_step: 200
	mode: test
	model_save_fre: 2000
	mp_backend: single
	n_learners: 1
	n_workers: 4
	online_eval: true
	online_eval_episode: 20
	seed: 10
	share_buffer: true
	algo_cfg:
	action_type: dpg
	actor_layers:
	- activation: relu
	layer_size:
	- 256
	layer_type: linear
	- activation: relu
	layer_size:
	- 256
	layer_type: linear
	actor_lr: 0.0001
	batch_size: 128
	buffer_size: 8000
	buffer_type: REPLAY_QUE
	critic_layers:
	- activation: relu
	layer_size:
	- 256
	layer_type: linear
	- activation: relu
	layer_size:
	- 256
	layer_type: linear
	critic_lr: 0.001
	gamma: 0.99
	policy_loss_weight: 0.002
	tau: 0.001
	value_max: .inf
	value_min: -.inf
	env_cfg:
	id: Pendulum-v1
	ignore_params:
	- wrapper
	- ignore_params
	render_mode: rgb_array
	wrapper: null