cboettig
/

rl-ecology

Reinforcement Learning

stable-baselines3

deep-reinforcement-learning

Model card Files Files and versions Community

rl-ecology / rllib /ppo-asm.yaml

cboettig's picture

tidy up

5c6be26 about 1 year ago

history blame contribute delete

1 kB

	asm:
	env: ecorl.envs.asm.AsmEnv
	run: PPO
	stop:
	time_total_s: 24000
	config:
	lambda: 0.95
	kl_coeff: 0.5
	clip_param: 0.2
	vf_clip_param: 400.0
	entropy_coeff: 0.0001
	rollout_fragment_length: auto
	num_sgd_iter: 10
	num_envs_per_worker: 24
	min_time_s_per_iteration: 360
	lr: 0.0003

	# Run with Learner- and RLModule API (new stack).
	_enable_learner_api: true
	_enable_rl_module_api: true
	# Use N Learner worker on the GPU
	num_learner_workers: 2
	num_gpus_per_learner_worker: 1
	num_gpus: 0 # No GPU needed for driver.
	# Since we are using learner workers, the driver process does not need
	# a CPU in particular.
	num_cpus_for_local_worker: 1
	# Need to unset this b/c we are using the RLModule API, which
	# provides exploration control via the RLModule's `forward_exploration` method.
	exploration_config: {}