optimization/optimization.py at main · sachag678/optimization · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
#!/usr/bin/env python
import numpy as np
import matplotlib.pyplot as plt
from matplotlib.animation import FuncAnimation

def rosenbrock(x, y, a = 1, b = 100):
    return (a - x)**2 + b * (y - x**2)**2

def parabaloid(x, y):
    return (10*x**2 + y**2)/2

def himmelblau(x, y):
    return (x**2 + y - 11)**2 + (x + y**2 - 7)**2

params = {
    "Rosenbrock": {
        "x_min":-2,
        "x_max":2,
        "y_min":-1,
        "y_max":3,
        "init_x": -1.2,
        "init_y": 1
    },
    "Paraboloid": {
        "x_min":-4,
        "x_max":4,
        "y_min":-4,
        "y_max":4,
        "init_x": 3,
        "init_y": 3
    },
    "Himmelblau": {
        "x_min":-5,
        "x_max":5,
        "y_min":-5,
        "y_max":5,
        "init_x": 0,
        "init_y": 0
    }
}

def plot2d(f, xs, ys, func_name, animate=False):
    func_params = params[func_name]
    x = np.linspace(func_params['x_min'], func_params['x_max'], 10000)
    y = np.linspace(func_params['y_min'], func_params['y_max'], 10000)
    xv, yv = np.meshgrid(x, y)
    z = np.log10(f(xv, yv))

    fig, ax = plt.subplots()
    ax.imshow(z, aspect='equal', origin='lower', extent = (func_params['x_min'], func_params['x_max'], func_params['y_min'], func_params['y_max'],))
    ax.contour(xv, yv, z, colors = 'white', levels = 7, linewidths=0.5)

    if animate:
        def animate(i):
            ax.plot(xs[:i], ys[:i], 'rx--', linewidth=0.05)

        ani = FuncAnimation(fig, animate, frames=len(xs) - 1, interval=(10000 // len(xs)), repeat=False)
    else:
        ax.plot(xs, ys, 'rx--', linewidth=0.1)

    plt.show()

def plot3d(f, xs, ys, animate=False):
    x = np.linspace(-2, 2, 10000)
    y = np.linspace(-1, 3, 10000)
    xv, yv = np.meshgrid(x, y)
    z = np.log10(f(xv, yv))
    zs = np.log10(f(np.array(xs), np.array(ys)))

    fig = plt.figure()
    ax = fig.add_subplot(projection='3d')
    ax.plot_surface(xv, yv, z, cmap=plt.cm.magma)
    if animate:
        def animate(i):
            ax.plot(xs[:i], ys[:i], zs[:i], 'ro--')

        ani = FuncAnimation(fig, animate, frames=len(xs) - 1, interval=(10000 // len(xs)), repeat=False)
    else:
        ax.plot(xs, ys, zs, 'ro--')
    plt.show()

def dellfy(x, y):
    return 200 * (y - x**2)

def dellfx(x, y):
    return 400 * x**3 - 400 * x * y + 2 * x - 2

def delf(x, y):
    return np.array([dellfx(x, y), dellfy(x, y)])

def hessian(x, y):
    return np.array([[1200 * x**2 - 400 * y + 2, -400 * x], [-400 * x, 200]])

def approx_hessian(f, x, y, h = 0.000001, k = 0.000001):
    fxy = (f(x + h, y + k) - f(x + h, y - k) - f(x - h, y + k) + f(x - h, y - k)) / (4 * h * k)
    fxx = (f(x + h, y) - 2 * f(x, y) + f(x - h, y)) / h**2
    fyy = (f(x, y + k) - 2 * f(x, y) + f(x, y - k)) / k**2
    return np.array([[fxx , fxy], [fxy, fyy]])

def approx_deriv_x(f, x, y, h = 0.000001):
    return (f(x + h, y) - f(x - h, y)) / (2 * h)

def approx_deriv_y(f, x, y, h = 0.000001):
    return (f(x, y + h) - f(x, y - h)) / (2 * h)

def backtracking_line_search(f, df, px, py, x, y, alpha = 1, c = 0.01, rho= 0.75):
    while f(x + alpha * px, y + alpha * py) > f(x, y) + alpha * c * (df[0] * px + df[1] * py):
        alpha *= rho
    return alpha

def fixed_step_size(alpha):
    return alpha

# uses del f
def steepest_descent(f, x0=1.2, y0=1.2, c=0.01, rho=0.75):
    xs = [x0]
    ys = [y0]
    x = x0
    y = y0
    count = 0
    while True:
        px = -approx_deriv_x(f, x, y)
        py = -approx_deriv_y(f, x, y)
        step_size = backtracking_line_search(f, np.array([-px, -py]), px, py, x, y, c=c, rho=rho)
        #print('alpha: {}, p: ({}, {})'.format(step_size, px, py))
        old_x = x
        old_y = y
        x += step_size * px
        y += step_size * py
        xs.append(x)
        ys.append(y)
        #print('x: {}, y: {}'.format(x, y))
        if ((old_x - x)**2 + (old_y - y)**2)**0.5 < 0.0001:
            break
        count += 1
    #print('steepest_descent: ', x, y, count)
    return xs, ys


# uses Hessian
def newtons_method(f, x0=1.2, y0=1.2, beta=0.001, multiple_identity=False, flip_negative_eigs=False, c=0.01, rho=0.75):
    xs = [x0]
    ys = [y0]
    x = x0
    y = y0
    count = 0
    while True:
        df = np.array([approx_deriv_x(f, x, y), approx_deriv_y(f, x, y)])
        H = approx_hessian(f, x, y)
        eigs = np.linalg.eigvals(H)
        if multiple_identity:
            if min(eigs) > 0:
                tau = 0
            else:
                tau = - min(eigs) + beta
            Hbar = H + np.eye(2) * tau # modifies using multiples of identity
        elif flip_negative_eigs:
            mod_mat = (H>0).astype(int)
            mod_mat[mod_mat==0] = -1
            Hbar = H * mod_mat
        else:
            Hbar = H
        p = -np.linalg.inv(Hbar) @ df
        px = p[0]
        py = p[1]
        step_size = backtracking_line_search(f, df, px, py, x, y, c=c, rho=rho)
        #print('alpha: {}, p: ({}, {})'.format(step_size, px, py))
        old_x = x
        old_y = y
        x += step_size * px
        y += step_size * py
        xs.append(x)
        ys.append(y)
        #print('x: {}, y: {}'.format(x, y))
        #if ((old_x - x)**2 + (old_y - y)**2)**0.5 < 0.0001:
        if np.linalg.norm(df, 2) < 0.00001 or ((old_x - x)**2 + (old_y - y)**2)**0.5 < 0.0001:
            break
        count += 1
    #print('newtons method: ',  x, y, count)
    return xs, ys

# uses Bk
def bfgs():
    pass

# used to approximate the function f (this is a quadratic function)
def m(f, p, B, x, y):
    return f(x, y) + np.array([[approx_deriv_x(f, x, y), approx_deriv_y(f, x, y)]]) @ p + 0.5 * p.T @ B @ p

# uses standard cauchy point without modifications
def cauchy_point(f, x0, y0, max_delta, delta, nu):
    x = x0
    y = y0
    xs = [x0]
    ys = [y0]
    deltas = [delta]
    g = np.zeros((2, 1))
    while True:
        g = np.array([[approx_deriv_x(f, x, y)], [approx_deriv_y(f, x, y)]])
        norm_g = np.linalg.norm(g, 2)
        H = approx_hessian(f, x, y)
        curvature = g.T @ H @ g
        if curvature <= 0:
            tau = 1
        else:
            tau = min(1, norm_g**3/(delta * curvature))
        p = -tau * delta * g / norm_g
        rho = (f(x, y) - f(x + p[0], y + p[1])) / (m(f, np.zeros((2, 1)), H, x, y) - m(f, p, H, x, y))
        p_norm = np.linalg.norm(p)
        if rho < 0.25:
            delta = 0.25 * delta
        else:
            if rho > 0.75 and p_norm == delta:
                delta = min(2 * delta, max_delta)
            else:
                delta = delta
        if rho > nu:
            x += p[0][0]
            y += p[1][0]
            xs.append(x)
            ys.append(y)
            deltas.append(delta)

        if p_norm < 0.00001:
            break
    return xs, ys, deltas

def dog_leg():
    pass

if __name__ == '__main__':
    #xs, ys = steepest_descent(rosenbrock, x0=-1.2, y0=1)
    xs, ys = cauchy_point(parabaloid, x0=3, y0=3)
    plot2d(parabaloid, xs, ys, 'Paraboloid')
    #xs, ys = newtons_method(rosenbrock, x0=-1.2, y0=1)
    #plot3d(rosenbrock, xs, ys, animate=True)