bball_cannon/bball.py at master · StevenCHowell/bball_cannon · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
import itertools
import numpy as np
from bokeh import plotting
from bokeh.resources import INLINE
from bokeh.palettes import Dark2_8 as palette

colors = itertools.cycle(palette)
# plotting.output_notebook(resources=INLINE)
# plotting.output_html(resources=INLINE)

class Shot():
    def __init__(self):
        # constants
        self.ball_radius = 9.5 / 12 / 2  # ft
        self.height_basket = 10  # ft
        self.g = -32.174  # ft/s^2
        self.path = []

    def setup(self, params=None):
        # randomly select cannon parameters: distance, height, speed
        if params is None:
            min_params = [5.0, 0.0, 34.3]
            max_params = [25.0, 10.0, 68.6]
            dist, height, speed = np.random.uniform(min_params, max_params)
        else:
            dist, height, speed = params
        self.dist = dist  # ft, distance to hoop
        self.height = height  # ft, height of the cannon
        self.speed = speed  # ft/s

        self.delta_h = self.height_basket - self.height
        self.rim = dist + self.ball_radius * np.array([-1, 1])  # m

        self.angle = 0

        return np.array([dist, height, speed])

    def shoot_reward(self, angle):
        shoot_delta_x(angle)
        if self.rim[0] < self.x_shot < self.rim[1]:
            # Big reward for success.  Not sure how big to make this.
            reward = 500.0
        else:
            # Penalty for missing equal to distance under/over shot.
            reward = -abs(self.delta_x)

        return reward

    def shoot_delta_x(self, angle):
        self.angle = np.deg2rad(angle)
        self.delta_x = self.dist
        if 0 < angle or angle < 90:
            cos = np.cos(self.angle)
            sin = np.sin(self.angle)

            # calculate the determinant
            D = (self.speed * sin) ** 2 + 2 * self.g * self.delta_h
            if D > 0:  # ball passes through correct height twice
                # negative root is the downward part of arc
                self.t_m = (-self.speed * sin - np.sqrt(D)) / self.g
                self.x_shot = self.speed * cos * self.t_m
                self.delta_x = self.x_shot - self.dist  # +/-: over/under-shot
            else:
                # ball not shot high enough
                self.t_m = 1.3  # s
        return self.delta_x

    def calc_path(self):
        if self.angle:
            cos = np.cos(self.angle)
            sin = np.sin(self.angle)
            t_final = self.t_m * 1.1
            t = np.linspace(0, t_final, 100)
            x = self.speed * cos * t
            y = self.height + self.speed * sin * t + self.g * t**2 / 2
            self.path.append(np.c_[x, y][y>=0])
        else:
            print('Error: no attempts made!')

    def show_path(self):
        if self.path:
            p = plotting.figure(
                width=800, height=400,
                x_axis_label='(ft)', y_axis_label='(ft)',
                x_range=(-1, self.dist*1.3), y_range=(-0.5, 20),
            )

            # plot the hoop
            p.line(np.array([1, 1.015, 1.015]) * self.rim[1],
                   [self.height_basket, self.height_basket, 0], color='gray')
            p.circle(self.rim, self.height_basket,
                     radius=0.02, color='orange')
            p.line(self.rim, self.height_basket, color='orange')

            # plot the attempts
            for i, (path, color) in enumerate(zip(self.path, colors)):
                name = f'Attempt {i+1}'
                p.line(path[:, 0], path[:, 1], color=color,
                       legend_label=name, muted_alpha=0.2)
                t = np.linspace(0, 1, 100)

            # plot the last cannon
            p.line(0, [0, self.height], color='black')
            p.line(
                [-np.cos(self.angle)/2, 0],
                [self.height - np.sin(self.angle)/2, self.height],
                line_width=5, color=color,
            )

            p.legend.location = 'top_right'
            p.legend.click_policy = 'mute'
            p.toolbar.autohide = True
            plotting.show(p)
        else:
            print('Error: no attempts made!')


class AgentPoly():
    def __init__(self, shot):
        self.shot = shot

    def learn(self, max_iters, *, angle_0=89, step_size=10):
        p_or_m = np.sign(45 - angle_0)
        angles = [angle_0, angle_0 + (p_or_m * step_size)]
        delta_x = []

        # fire first two shots
        for angle in angles:
            delta_x.append(self.shot.shoot_delta_x(angle))

        # first first order polynomial
        coef = np.polyfit(angles, delta_x, 1)
        guess = -coef[1] / coef[0]

        # fire estimated best guess as third shot
        angles.append(guess)
        delta_x.append(self.shot.shoot_delta_x(guess))

        success_angle = np.nan
        for i in range(max_iters-3):
            if np.abs(delta_x[-1]) < self.shot.ball_radius:
                success_angle = angles[-1]
                break
            else:
                # fit second order polynomial
                coef = np.polyfit(angles, delta_x, 2)
                guess = np.roots(coef).max()

                # fire estimated best guess
                angles.append(guess)
                delta_x.append(self.shot.shoot_delta_x(guess))

        self.results = np.c_[angles, delta_x]
        return success_angle