-
Notifications
You must be signed in to change notification settings - Fork 46
/
manualControl.py
67 lines (56 loc) · 2.1 KB
/
manualControl.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
"""
Manually control the agent to provide expert trajectories.
The main aim is to get the feature expectaitons respective to the expert trajectories manually given by the user
Use the arrow keys to move the agent around
Left arrow key: turn Left
right arrow key: turn right
up arrow key: dont turn, move forward
down arrow key: exit
Also, always exit using down arrow key rather than Ctrl+C or your terminal will be tken over by curses
"""
from flat_game import carmunk
import numpy as np
from nn import neural_net
import curses # for keypress
NUM_STATES = 8
GAMMA = 0.9 # the discount factor for RL algorithm
def play(screen):
car_distance = 0
weights = [1, 1, 1, 1, 1, 1, 1, 1]# just some random weights, does not matter in calculation of the feature expectations
game_state = carmunk.GameState(weights)
_, state, __ = game_state.frame_step((2))
featureExpectations = np.zeros(len(weights))
Prev = np.zeros(len(weights))
while True:
car_distance += 1
event = screen.getch()
if event == curses.KEY_LEFT:
action = 1
elif event == curses.KEY_RIGHT:
action = 0
elif event == curses.KEY_DOWN:
break
else:
action = 2
# Take action.
#start recording feature expectations only after 100 frames
immediateReward , state, readings = game_state.frame_step(action)
if car_distance > 100:
featureExpectations += (GAMMA**(car_distance-101))*np.array(readings)
# Tell us something.
changePercentage = (np.linalg.norm(featureExpectations - Prev)*100.0)/np.linalg.norm(featureExpectations)
print (car_distance)
print ("percentage change in Feature expectation ::", changePercentage)
Prev = np.array(featureExpectations)
if car_distance % 2000 == 0:
break
return featureExpectations
if __name__ == "__main__":
screen = curses.initscr()
curses.noecho()
curses.curs_set(0)
screen.keypad(1)
screen.addstr("Play the game")
result = play(screen)
curses.endwin()
print (result)