-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathexample_experiment.py
45 lines (34 loc) · 1011 Bytes
/
example_experiment.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
from gym_torcs import TorcsEnv
from sample_agent import Agent
import numpy as np
vision = False
episode_count = 10
max_steps = 500
reward = 0
done = False
step = 0
# Generate a Torcs environment
env = TorcsEnv(vision=vision, throttle=False)
agent = Agent(1) # steering only
print("TORCS Experiment Start.")
for i in range(episode_count):
print("Episode : " + str(i))
if np.mod(i, 3) == 0:
# Sometimes you need to relaunch TORCS because of the memory leak error
ob = env.reset(relaunch=True)
else:
ob = env.reset()
total_reward = 0.
for j in range(max_steps):
action = agent.act(ob, reward, done, vision)
ob, reward, done, _ = env.step(action)
#print(ob)
total_reward += reward
step += 1
if done:
break
print("TOTAL REWARD @ " + str(i) +" -th Episode : " + str(total_reward))
print("Total Step: " + str(step))
print("")
env.end() # This is for shutting down TORCS
print("Finish.")