diff --git a/config.yaml b/config.yaml index 4f6d2d1..32d66cb 100644 --- a/config.yaml +++ b/config.yaml @@ -110,7 +110,7 @@ train: max_grad_norm: 0.5 target_kl: ~ vf_clip_coef: 0.1 - vf_coef: 0.5 + vf_coef: 0.495 batch_rows: 128 bptt_horizon: 16 @@ -315,29 +315,29 @@ rewards: baseline.ObjectRewardRequiredEventsMapIds: reward: a_press: 0.0 # 0.00001 - badges: 3.0 + badges: .6 bag_menu: 0.0 - caught_pokemon: 2.5 + caught_pokemon: 1.0 cut_coords: 0.75 cut_tiles: 0.0 - event: .75 + event: 1.5 exploration: 0.019 explore_hidden_objs: 0.00009999 explore_signs: 0.015 explore_warps: 0.01006 - hm_count: 7.5 - level: 1.05 - moves_obtained: 4.0 - pokecenter_heal: 0.47 + hm_count: 9.75 + level: 1.016 + moves_obtained: 6.0 + pokecenter_heal: 0.42 pokemon_menu: 0.0 - required_event: 7.0 - required_item: 3.0 + required_event: 3.12 + required_item: 3.6 seen_action_bag_menu: 0.0 - seen_pokemon: 2.5 + seen_pokemon: 1.3 start_menu: 0.0 stats_menu: 0.0 use_surf: 0.4 - useful_item: 0.825 + useful_item: 1.06