Skip to content

Commit

Permalink
More tuning to the sweep config
Browse files Browse the repository at this point in the history
  • Loading branch information
thatguy11325 committed Oct 13, 2024
1 parent f106574 commit e66c181
Show file tree
Hide file tree
Showing 3 changed files with 5 additions and 3 deletions.
2 changes: 1 addition & 1 deletion config.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -93,7 +93,7 @@ train:
compile: True
compile_mode: "reduce-overhead"
float32_matmul_precision: "high"
- total_timesteps: 500_000_000 # 100_000_000_000 for full games
+ total_timesteps: 1_000_000_000 # 100_000_000_000 for full games
batch_size: 65536
minibatch_size: 2048
learning_rate: 2.0e-4
Expand Down
2 changes: 2 additions & 0 deletions pokemonred_puffer/environment.py
Original file line number Diff line number Diff line change
Expand Up @@ -1435,6 +1435,8 @@ def agent_stats(self, action):
"in_battle": self.read_m("wIsInBattle") > 0,
"event": self.progress_reward["event"],
"max_steps": self.get_max_steps(),
+ # redundant but this is so we don't interfere with the swarm logic
+ "required_count": len(self.required_events) + len(self.required_items),
}
| {
"exploration": {
Expand Down
4 changes: 2 additions & 2 deletions pokemonred_puffer/sweep.py
Original file line number Diff line number Diff line change
Expand Up @@ -140,13 +140,13 @@ def launch_sweep(
finished.add(run["name"])
summary_metrics = json.loads(run["summaryMetrics"])
if (
- "environment/stats/event" in summary_metrics
+ "environment/stats/required_count" in summary_metrics
and "performance/uptime" in summary_metrics
):
obs_in = ObservationInParam(
input=json.loads(run["config"])["x"]["value"],
# TODO: try out other stats like required count
- output=summary_metrics["environment/stats/event"],
+ output=summary_metrics["environment/stats/required_count"],
cost=summary_metrics["performance/uptime"],
)
carbs.observe(obs_in)
Expand Down

0 comments on commit e66c181

Please sign in to comment.