ml_capstone/plotting.py at master · drscott173/ml_capstone · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
#
# Some plotting routines to show off the learning agent for the "driverless car" using Tensorflow
#
# @scottpenberthy
# November 1, 2016
#

import tensorflow as tf
import numpy as np
from learning import *
import matplotlib
import matplotlib.mlab as mlab
import matplotlib.cm as cm
import matplotlib.pyplot as plt
import matplotlib.animation as animation
from scipy.signal import convolve2d

class Plotter:

    # We put some plotting routines here that
    # we used to document performance of our
    # final model.
    #
    # These fight with PyGame for control of the
    # matplot environment. As a result, you should
    # load these separately, as follows:
    #
    # from plotting import *
    #
    # p.contour_plot()
    # p.angle_v_sensor_plot()
    # p.theta_anim()
    # p.sensor_anim()

    # Checkpoint restored into the learner's session when a Plotter is built.
    CHECKPOINT_PATH = "models/narrow-deep-pipe.ckpt"
    # (rows, cols) of the box filter applied to Q surfaces when
    # self.smoothing is true.
    SMOOTHING_WINDOW = (6, 40)
    # Spacing of the sample grid on both axes; 0.01 over [0, 1) gives 100x100.
    GRID_STEP = 0.01

    def __init__(self, name='q_value', track=False):
        """Create the learner, restore its weights and reset plot state.

        ``name`` and ``track`` are accepted for compatibility with existing
        callers but are not used by this class.
        """
        # NOTE(review): the meaning of Learner's positional True is defined
        # in the learning module, not here -- confirm before changing it.
        self.ai = Learner(True)
        self.saver = tf.train.Saver()
        self.saver.restore(self.ai.s, self.CHECKPOINT_PATH)
        self.theta = 0          # car heading used by the animations (radians)
        self.im = None          # image artist updated by the animations
        self.fig = None         # figure owning that artist
        self.sensor = 0         # shared sensor level used by sensor_anim
        self.smoothing = True   # box-filter the Q surface before plotting
        self._q_max_op = None   # max-Q op, built lazily (see _max_q_surface)
        matplotlib.rcParams['xtick.direction'] = 'out'
        matplotlib.rcParams['ytick.direction'] = 'out'

    def moving_average_2d(self, data, window):
        """Moving average on two-dimensional data.

        ``window`` holds the (un-normalised) weights; a normalised copy is
        used so the caller's array is never modified and integer windows are
        accepted.  ``data`` may be any array-like.

        The output has the same dimensions as ``data`` (mode='same') and
        symmetrical boundary conditions are assumed (boundary='symm').
        """
        weights = np.asarray(window)
        # True division allocates a new float array instead of writing into
        # the caller's window.
        weights = weights / weights.sum()
        # ndarray subclasses (e.g. masked arrays) are passed through as-is.
        if not isinstance(data, np.ndarray):
            data = np.asarray(data)
        return convolve2d(data, weights, mode='same', boundary='symm')

    def _unit_grid(self):
        # Mesh of sample coordinates over [0, 1) x [0, 1) shared by both
        # contour helpers.
        axis = np.arange(0, 1, self.GRID_STEP)
        a, b = np.meshgrid(axis, axis)
        return a, b

    def _max_q_surface(self, states, shape):
        # Push one state per row through the network, take the maximum Q
        # value of each row and fold the result back into `shape`.
        qt = self.ai.q_train
        # Build the reduction op once: creating it on every call would add a
        # new node to the TensorFlow graph for each animation frame.  The op
        # is tied to the q_train that was current on first use.
        # To plot the chosen action instead of its value, swap the op for
        # tf.argmax(qt.q_value, dimension=1).
        if getattr(self, '_q_max_op', None) is None:
            self._q_max_op = tf.reduce_max(qt.q_value, reduction_indices=[1])
        feed = {qt.x: states, qt.q_max: qt.q_max_val}
        q = self.ai.s.run(self._q_max_op, feed_dict=feed)
        # Rows of `states` are in row-major grid order, so a plain reshape
        # restores the grid layout.
        surface = np.asarray(q).reshape(shape)
        if self.smoothing:
            surface = self.moving_average_2d(
                surface, np.ones(self.SMOOTHING_WINDOW))
        return surface

    def _draw_q_image(self, z):
        # Draw a Q surface on the current figure with a horizontal colorbar
        # and return the image artist.
        im = plt.imshow(z, interpolation='bilinear', origin='lower',
                        cmap=cm.inferno)
        plt.colorbar(im, orientation='horizontal', shrink=0.8)
        return im

    def location_contours(self, sensors=[0.2,0.2,0.2,0.0]):
        """Maximum Q value at every (x, y) grid location.

        ``sensors`` is ``[s1, s2, s3, theta]``: three fixed sensor readings
        and the car angle.  (The default list is only read, never mutated.)

        Returns ``(a, b, c)`` where ``a`` and ``b`` are the x/y mesh grids
        and ``c`` is the (optionally smoothed) max-Q surface of the same
        shape.
        """
        a, b = self._unit_grid()
        s1, s2, s3, theta = sensors
        xs, ys = a.ravel(), b.ravel()
        # One row per grid point, in the column order the network is fed:
        # s1, s2, s3, x, y, theta.
        states = np.column_stack([
            np.full_like(xs, s1),
            np.full_like(xs, s2),
            np.full_like(xs, s3),
            xs,
            ys,
            np.full_like(xs, theta),
        ])
        return a, b, self._max_q_surface(states, a.shape)

    def angle_v_sensor_contours(self, x0=0.5, y0=0.5):
        """Maximum Q value over car angle and sensor level at a fixed spot.

        The grid's x axis is scaled to an angle in [0, 2*pi); its y axis is
        used as the level of all three sensors in unison.  The position is
        held at ``(x0, y0)``.

        Returns ``(a, b, c)`` where ``a`` and ``b`` are the unscaled mesh
        grids and ``c`` is the (optionally smoothed) max-Q surface.
        """
        a, b = self._unit_grid()
        angle, level = a.ravel(), b.ravel()
        # Same column order as location_contours: s1, s2, s3, x, y, theta.
        states = np.column_stack([
            level,
            level,
            level,
            np.full_like(level, x0),
            np.full_like(level, y0),
            2*np.pi*angle,
        ])
        return a, b, self._max_q_surface(states, a.shape)

    def contour_plot(self, sensors=[0.2,0.2,0.2,0.0], title="Contour Plot of Q(s,a)"):
        """Show how Q varies over the play area.

        Sensor readings and car rotation are fixed by ``sensors``
        (``[s1, s2, s3, theta]``); the heading in degrees is appended to
        ``title``.  Blocks in ``plt.show()``.
        """
        _, _, z = self.location_contours(sensors)
        plt.figure(facecolor='white')
        plt.hot()
        self._draw_q_image(z)
        plt.title(title+": theta="+str(int(sensors[3]*180.0/np.pi)))
        plt.xlabel('x%')
        plt.ylabel('y%')
        plt.show()

    def angle_v_sensor_plot(self, x0=0.5, y0=0.5, title="Contour Plot of Q(s,a)"):
        """Show how Q varies with car rotation and sensor strength.

        The position is fixed at ``(x0, y0)``.  Blocks in ``plt.show()``.
        """
        _, _, z = self.angle_v_sensor_contours(x0, y0)
        plt.figure(facecolor='white')
        plt.hot()
        plt.xlabel('Orientation')
        plt.ylabel('Signal strength')
        self._draw_q_image(z)
        plt.title(title)
        plt.show()

    def update_theta(self, *args):
        """Animation callback: advance the heading and redraw.

        Companion to theta_anim / theta_gif.  The heading is stepped by
        pi/20 and wrapped into [0, 2*pi) *before* the network is evaluated,
        so the surface shown always matches the heading in the title.
        Returns the updated image artist.
        """
        self.theta = (self.theta + np.pi/20.0) % (np.pi*2.0)
        _, _, z = self.location_contours([0.2, 0.2, 0.2, self.theta])
        self.im.set_data(z)
        self.fig.suptitle("Countour Q plot - Heading "+str(int(self.theta*180.0/np.pi)))
        return self.im

    def theta_anim(self):
        """Animate the location contour plot while the heading rotates.

        Starts at heading 0 and steps via update_theta every 50 ms.  Blocks
        in ``plt.show()``.
        """
        self.theta = 0
        _, _, z = self.location_contours([0.2, 0.2, 0.2, self.theta])
        self.fig = plt.figure()
        self.im = self._draw_q_image(z)
        plt.title('Contour Plot - Q')
        # Keep a reference so the animation is not garbage collected while
        # the window is open.
        ani = animation.FuncAnimation(self.fig, self.update_theta, interval=50, blit=False)
        plt.show()

    def theta_gif(self):
        """Save an animated gif of the contour plot to figures/theta.gif.

        Renders 20 frames of update_theta (pi/20 per frame, i.e. the heading
        sweeps from 0 to pi) using the 'imagemagick' writer.
        """
        self.theta = 0
        _, _, z = self.location_contours([0.2, 0.2, 0.2, self.theta])
        self.fig = plt.figure()
        self.im = self._draw_q_image(z)
        plt.xlabel('X %')
        plt.ylabel('Y %')
        ani = animation.FuncAnimation(self.fig, self.update_theta, frames=np.arange(0,20), interval=200, blit=False)
        ani.save('figures/theta.gif', dpi=80, writer='imagemagick')

    def update_sensor(self, *args):
        """Animation callback: raise the shared sensor level and redraw.

        Companion to sensor_anim.  The level is stepped by 0.02 and reset to
        0 once it exceeds 1; the heading stays at ``self.theta``.  Returns
        the updated image artist.
        """
        self.sensor += 0.02
        if self.sensor > 1:
            self.sensor = 0.0
        level = self.sensor
        _, _, z = self.location_contours([level, level, level, self.theta])
        self.im.set_data(z)
        self.fig.suptitle("Countour Q plot - Sensor "+str(self.sensor))
        return self.im

    def sensor_anim(self, theta=0):
        """Animate the location contour plot while the sensor level rises.

        The heading is held fixed at ``theta``; all three sensors start at 0
        and are stepped by update_sensor every 50 ms.  Blocks in
        ``plt.show()``.
        """
        self.theta = theta
        self.sensor = 0.0
        _, _, z = self.location_contours([0,0,0, self.theta])
        self.fig = plt.figure()
        self.im = self._draw_q_image(z)
        # Keep a reference so the animation is not garbage collected while
        # the window is open.
        ani = animation.FuncAnimation(self.fig, self.update_sensor, interval=50, blit=False)
        plt.show()


# Module-level instance referred to by the usage notes in the Plotter
# comments (p.contour_plot(), p.theta_anim(), ...).  Constructing it runs
# Plotter.__init__ as soon as this module is imported.
p = Plotter()