diff --git a/config.yaml b/config.yaml index cfbbf44..7e05ad4 100644 --- a/config.yaml +++ b/config.yaml @@ -22,7 +22,7 @@ debug: env_batch_size: 4 env_pool: True zero_copy: False - batch_size: 128 + batch_size: 4 minibatch_size: 4 batch_rows: 4 bptt_horizon: 2 @@ -150,7 +150,6 @@ wrappers: jitter: 0 stream_only: - - episode_stats.EpisodeStatsWrapper: {} - stream_wrapper.StreamWrapper: user: thatguy - exploration.OnResetExplorationWrapper: @@ -170,6 +169,7 @@ wrappers: - exploration.OnResetExplorationWrapper: full_reset_frequency: 25 jitter: 0 + - episode_stats.EpisodeStatsWrapper: {} rewards: baseline.BaselineRewardEnv: diff --git a/pokemonred_puffer/eval.py b/pokemonred_puffer/eval.py index f1fc2c0..3397cc1 100644 --- a/pokemonred_puffer/eval.py +++ b/pokemonred_puffer/eval.py @@ -15,7 +15,7 @@ def make_pokemon_red_overlay(counts: np.ndarray): # The clip scaling needs to be re-calibrated since my # overlay is from the global map with fading scaled = np.ascontiguousarray(np.sum(counts, axis=0).astype(np.float32)) - scaled = scaled / np.max(counts) + scaled = scaled / np.max(scaled) nonzero = np.ascontiguousarray(np.where(scaled > 0, 1, 0).astype(np.float32)) # scaled = np.clip(counts, 0, 1000) / 1000.0