-
Notifications
You must be signed in to change notification settings - Fork 21
/
Copy pathpickplace_sac_youbot.gin
39 lines (33 loc) · 1.25 KB
/
pickplace_sac_youbot.gin
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
# Train and play the pick-and-place task with the `youbot_noplugin` agent.
#
# Train:
#   DISPLAY=null python -m alf.bin.train --root_dir=~/tmp/pickplace --gin_file=pickplace_sac_youbot.gin
# Play:
#   python -m alf.bin.play --root_dir=~/tmp/pickplace --gin_file=pickplace_sac_youbot.gin
include 'common_nonimage_sac.gin'
import social_bot
# ---------------------------------------------------------------------------
# Environment configuration
# ---------------------------------------------------------------------------

# Environment factory: which env to build, how it is loaded, and how many
# copies run in parallel.
create_environment.env_load_fn = @suite_socialbot.load
create_environment.env_name = "SocialBot-PlayGround-v0"
create_environment.num_parallel_environments = 12

# Loader options. The FrameStack gym wrapper is kept below but disabled.
# NOTE(review): max_episode_steps (152) is slightly larger than
# PlayGround.max_steps (150) -- presumably so the PlayGround's own step limit
# ends the episode first; confirm before changing either value.
suite_socialbot.load.max_episode_steps = 152
# suite_socialbot.load.gym_env_wrappers=(@FrameStack,)

# PlayGround settings: agent model, action wrapper, task list, step limit and
# step time.
PlayGround.agent_type = 'youbot_noplugin'
PlayGround.action_wrapper = @YoubotActionWrapper
PlayGround.tasks = [@PickAndPlace]
PlayGround.max_steps = 150
PlayGround.step_time = 0.05

# Task settings: reward shaping is turned on for the pick-and-place task.
PickAndPlace.reward_shaping = True
# ---------------------------------------------------------------------------
# Algorithm configuration
# ---------------------------------------------------------------------------

# gamma for the one-step TD loss (presumably the discount factor -- confirm
# against OneStepTDLoss).
OneStepTDLoss.gamma = 0.98

# Adam learning rates, bound separately under the `actor`, `critic` and
# `alpha` gin scopes. All three currently use the same value.
actor/Adam.learning_rate = 1e-3
critic/Adam.learning_rate = 1e-3
alpha/Adam.learning_rate = 1e-3
# ---------------------------------------------------------------------------
# Training configuration
# ---------------------------------------------------------------------------

# Data collection.
TrainerConfig.initial_collect_steps = 2000
TrainerConfig.unroll_length = 1

# Update settings: mini-batch shape and updates per train step.
TrainerConfig.mini_batch_size = 512
TrainerConfig.mini_batch_length = 2
TrainerConfig.num_updates_per_train_step = 1

# Periodic jobs: summaries use an interval of 200; evaluation and
# checkpointing share an interval of 2000.
TrainerConfig.summary_interval = 200
TrainerConfig.eval_interval = 2000
TrainerConfig.checkpoint_interval = 2000

# Replay buffer maximum length.
TFUniformReplayBuffer.max_length = 100000