Author = 'Yubo Cai'
Email = 'yubo.cai@polytechnique.edu'
import sympy as sp
import numpy as np
from sympy import symbols, Eq, solve
import matplotlib.pyplot as plt
import scipy as sc
from scipy.optimize import minimize
from scipy.optimize import minimize_scalar
from scipy.optimize import linprog
Question 1
In a research article you see the following figure. The author says that the downward pointing spikes correspond to solutions $\left\{x_i\right\}$ of some problem of interest and that they are found using the Golden Search method.
A list of the solutions $\left\{x_i\right\}$ is given and the author claims they are precise up to 12 significant digits. Knowing that the computations were made using a machine precision which can give 16 significant digits, do you believe this claim? Justify your answer.
Answer to Question 1 |
No, I do not believe this claim: 12 significant digits are not attainable here. By Remark 1.2 (textbook, page 17), when a zero-order method such as the Golden Search is used to bracket the minimum, the achievable precision is only of order $\sqrt{\varepsilon}$, where $\varepsilon$ is the machine precision. The argument is as follows:
We take the second-order Taylor expansion around the minimum: $$ f(x) \approx f\left(x^*\right)+\frac{1}{2} f^{\prime \prime}\left(x^*\right)\left(x-x^*\right)^2. $$ Suppose that $\varepsilon$ is the machine precision (typically around $10^{-16}$). If $x_2<\varepsilon x_1$ then $x_2$ is seen as zero when compared to $x_1$; in particular $x_1+x_2$ will numerically be equal to $x_1$.
Coming back to our Taylor expansion, if $\frac{1}{2}\left|f^{\prime \prime}\left(x^*\right)\right|\left(x-x^*\right)^2<\varepsilon\left|f\left(x^*\right)\right|$, where $\varepsilon$ is the machine epsilon, then numerically we do not see any difference between $f(x)$ and $f\left(x^*\right)$. In conclusion, the algorithm cannot tell the difference between $f(x)$ and $f\left(x^*\right)$ whenever $$ \left|x-x^*\right| \leq \sqrt{\varepsilon}\left|x^*\right| \sqrt{\frac{2\left|f\left(x^*\right)\right|}{\left(x^*\right)^2\left|f^{\prime \prime}\left(x^*\right)\right|}}. $$ This implies that the precision of zero-order methods is only of order $\sqrt{\varepsilon}$.
Therefore, the theoretical precision in this case is $\sqrt{\varepsilon} \approx 10^{-8}$, which is not enough to claim that the solutions are accurate to 12 significant digits.
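To make this concrete, here is a minimal illustrative sketch (a toy quadratic of my own choosing, not the function from the article): near the minimizer, points closer than roughly $\sqrt{\varepsilon} \approx 10^{-8}$ to $x^*$ produce function values that are bitwise identical to $f(x^*)$, so no method based only on function-value comparisons can certify 12 significant digits.
import numpy as np

# Toy example: f(x) = 1 + (x - 1)^2 with minimizer x* = 1 and f(x*) = 1.
f = lambda x: 1.0 + (x - 1.0) ** 2
x_star = 1.0

eps = np.finfo(float).eps  # machine precision, about 2.2e-16
print('sqrt(eps) =', np.sqrt(eps))
for delta in [1e-6, 1e-7, 1e-8, 1e-9, 1e-12]:
    same = f(x_star + delta) == f(x_star)
    print(f'delta = {delta:.0e}: f(x* + delta) == f(x*) ? {same}')
# For offsets around or below sqrt(eps) ~ 1.5e-8 the two values coincide in double
# precision, which is exactly the sqrt(epsilon) limitation discussed above.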
Question 2
Suppose $f: \mathbb{R} \rightarrow \mathbb{R}$ is a strictly convex, unimodal function with global minimum $x^*$. Does Newton's algorithm $$ x_{i+1}=x_i-f^{\prime}\left(x_i\right) / f^{\prime \prime}\left(x_i\right) $$ converge to $x^*$ regardless of the initialization? What about the Gradient Descent (GD) algorithm with Wolfe line-search? (no proofs, just references or examples/counter-examples)
x = sp.Symbol('x')
f_x = sp.sqrt(1 + x**2)
# Calculate the first and second derivatives of f(x)
f_prime = f_x.diff(x)
f_double_prime = f_prime.diff(x)
display(sp.simplify(f_prime))
display(sp.simplify(f_double_prime))
# Compute the expression x_{i+1} = x_i - f'(x_i) / f''(x_i)
x_next = x - f_prime / f_double_prime
display(sp.simplify(x_next))
Answer to Question 2 |
For Newton's algorithm, whether the method converges depends on the initialization. Here is a typical counter-example showing that it does not converge for every starting point.
Consider the function $f(x)=\sqrt{1+x^{2}}$, whose minimizer is $x^* = 0$. By Newton's method we have $$ \begin{aligned} x_{i+1}&=x_i-f^{\prime}\left(x_i\right) / f^{\prime \prime}\left(x_i\right) \\ &= -x_{i}^{3}. \\ \end{aligned} $$ Therefore, if $\left|x_0\right| \geq 1$ the Newton algorithm does not converge (e.g. $x_{0}=2$, $x_{1}=-8$, and $x_{i+1}=-x_{i}^3$ keeps growing in magnitude), while for $\left|x_0\right| < 1$ it converges to $0$.
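A quick numerical check of this counter-example (added here as an illustration, using the closed form $x_{i+1}=-x_i^3$ derived above):
import numpy as np

# Newton iteration for f(x) = sqrt(1 + x^2); the update simplifies to x_{i+1} = -x_i^3.
def newton_step(x):
    f_prime = x / np.sqrt(1 + x**2)           # f'(x)
    f_double_prime = (1 + x**2) ** (-1.5)     # f''(x)
    return x - f_prime / f_double_prime       # equals -x**3

for x0 in [0.5, 2.0]:
    x = x0
    for _ in range(5):
        x = newton_step(x)
    print(f'x0 = {x0}: after 5 Newton steps, x = {x:.3e}')
# |x0| < 1 converges quickly to 0, while |x0| >= 1 blows up.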
For the Gradient Descent (GD) algorithm with Wolfe line-search, the method converges for every initialization. We use the reference from the textbook, page 27. Denote $q(t)=f(x+td)$, where $d$ is a descent direction; then $$ q^{\prime}(0)=f^{\prime}(x) d<0 $$ by the definition of a descent direction. Applying Proposition 1.15 (Wolfe line-search, textbook page 29): since $f$ is strictly convex and unimodal, $q$ is bounded below and $q^{\prime}(0)=f^{\prime}(x) d<0$, so the line search with the Wolfe rule finishes in a finite number of steps, and the resulting descent iterates converge to $x^*$.
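A small sketch supporting this claim (an illustration using scipy.optimize.line_search, which enforces the Wolfe conditions; the stopping tolerance and iteration cap are arbitrary choices): gradient descent with a Wolfe line search converges for $f(x)=\sqrt{1+x^2}$ even from $x_0=2$, where the pure Newton iteration above diverges.
import numpy as np
from scipy.optimize import line_search

f = lambda x: np.sqrt(1.0 + x[0] ** 2)                        # objective (1D, stored as an array)
grad = lambda x: np.array([x[0] / np.sqrt(1.0 + x[0] ** 2)])  # its gradient

x = np.array([2.0])
for it in range(50):
    g = grad(x)
    if abs(g[0]) < 1e-10:
        break
    d = -g                                   # steepest-descent direction
    alpha = line_search(f, grad, x, d)[0]    # step length satisfying the Wolfe conditions
    if alpha is None:                        # line search failed (does not happen here)
        break
    x = x + alpha * d
print(f'GD with Wolfe line search: x = {x[0]:.3e} after {it} iterations')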
Question 3
a) What is the main drawback when using the Gradient Descent algorithm in higher dimensions? Give an example of a strictly convex function for which GD will take a long time to converge.
b) Suppose you have a function $f: \mathbb{R}^2 \rightarrow \mathbb{R}$ which is smooth with a unique global minimum $x^*$ and that the gradient evaluated at the point $x_0$ is $\nabla f\left(x_0\right)=\left(10^6, 10^{-6}\right)$. Is this function ill-conditioned? Do you expect the Gradient Descent algorithm to work well for this function?
c) Consider the quadratic function $f(x)=x^T A x-b^T x$ for a $2 \times 2$ matrix $A$ with eigenvalues $\lambda_1=$ $0.01, \lambda_2=10^6$. What is the condition number of the matrix $A$ ? Will the GD algorithm converge towards the unique minimum of $f$ regardless of the initialization? What about the speed of convergence?
Answer to Question 3 |
a) The main drawback of the Gradient Descent algorithm in higher dimensions is that the convergence can be very slow: the speed depends strongly on the choice of the step $t$ and on the conditioning of the problem. (For non-convex functions, GD may also get stuck in local minima rather than the global one.)
In the strongly convex case the rate of convergence is linear, and the speed is dictated by the condition number of $f$: when this condition number is large, GD may converge very slowly. For example, consider the ill-conditioned quadratic problem $$ f(x)=x^T A x, \quad A=\left(\begin{array}{cc} 0.1 & 0 \\ 0 & 2000 \end{array}\right), \quad x_0=(-0.5,1.5), \quad Q=20000, $$ where $Q$ is the condition number of $A$. With a fixed-step algorithm it takes on the order of $10^4$ iterations just to get close to the optimal solution, as the short sketch below illustrates.
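A minimal sketch of this example (the fixed step below is an arbitrary choice, taken just under the stability threshold $1/\lambda_{\max}$):
import numpy as np

# Fixed-step gradient descent on f(x) = x^T A x with A = diag(0.1, 2000).
A = np.diag([0.1, 2000.0])
grad = lambda x: 2.0 * A @ x            # gradient of x^T A x

x = np.array([-0.5, 1.5])
t = 4.9e-4                              # fixed step; stability requires t < 1/lambda_max = 5e-4
for _ in range(10000):
    x = x - t * grad(x)
print('distance to the minimizer (the origin) after 10000 iterations:', np.linalg.norm(x))
# The steep direction (lambda = 2000) forces a tiny step, so the flat direction
# (lambda = 0.1) only contracts by a factor of about 1 - 2*t*0.1 per iteration.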
b) Here $f: \mathbb{R}^2 \rightarrow \mathbb{R}$, and by the definition of the Jacobian matrix, $$ J_f(x_0) = \nabla f\left(x_0\right)=\left(10^6, 10^{-6}\right). $$ Using the standard definition of the relative condition number of a differentiable function, $$ \operatorname{cond}(f, x_0)=\frac{\|x_0\|\,\|J_f(x_0)\|}{\|f(x_0)\|} = \frac{\|x_0\|\,\|\nabla f\left(x_0\right)\|}{\|f(x_0)\|}. $$ Since $\nabla f\left(x_0\right)=\left(10^6, 10^{-6}\right)$, the norm $\|\nabla f(x_0)\|$ is of order $10^6$, so this condition number is typically huge; moreover the two gradient components differ by twelve orders of magnitude, meaning the function varies on completely different scales in the two coordinate directions. The function is therefore ill-conditioned, and Gradient Descent is not expected to work well: any step small enough for the steep direction makes almost no progress in the flat one.
c) Recall Definition 2.8 (condition number of a matrix $A$, textbook page 47): $$ \boxed{\text{Let $A$ be a symmetric positive-definite matrix. If $0<\lambda_{\min }<\lambda_{\max }$ are its smallest and largest eigenvalues, the number $Q=\lambda_{\max } / \lambda_{\min }$ is called the condition number of $A$.}} $$ Since $f$ is a quadratic function with a unique minimum, $A$ is symmetric positive-definite, and its condition number is $$ Q=\lambda_{\max } / \lambda_{\min } = \frac{10^6}{0.01} = 10^8. $$ Because $f$ is strongly convex, GD with a suitably chosen step size (or a line search) does converge to the unique minimum from any initialization; however, with a fixed step that is too large it can diverge, so in practice the behavior depends on the step-size choice, and in all cases the speed is governed by the very large condition number.
We then compute the convergence ratio of $f$: the Steepest Descent algorithm applied to a strongly convex quadratic form $f$ with condition number $Q$ converges linearly with convergence ratio at most $$ 1-\frac{4 Q}{(1+Q)^2}=\left(\frac{Q-1}{Q+1}\right)^2. $$ With $Q=10^8$ this ratio is extremely close to 1, so the convergence is very slow. One can instead use preconditioning techniques or more advanced optimization algorithms, such as Conjugate Gradient, Newton's method, or quasi-Newton methods like BFGS or L-BFGS, which often have better convergence properties for ill-conditioned problems.
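A quick computation of this ratio for $Q=10^8$ (illustration only) shows how many steepest-descent iterations would be needed just to gain one decimal digit of accuracy:
import numpy as np

Q = 1e8
ratio = ((Q - 1) / (Q + 1)) ** 2                   # contraction factor per iteration
iters_per_digit = np.log(10) / (-np.log(ratio))    # iterations to gain one decimal digit
print(f'convergence ratio = {ratio:.10f}')
print(f'iterations needed per decimal digit of accuracy ~ {iters_per_digit:.2e}')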
Question 4
You have to optimize a function $f: \mathbb{R}^{100000} \rightarrow \mathbb{R}$. The function is explicit and you are able to compute the Hessian matrix. You observe that the Hessian matrix is full. Can you use Newton's method in order to efficiently minimize the function $f$ ? What if the Hessian matrix is tridiagonal? Justify your answers.
Answer to Question 4 |
From the definition of the Hessian matrix we have $$ H(f)=\left[\begin{array}{cccc} \frac{\partial^2 f}{\partial x_1^2} & \frac{\partial^2 f}{\partial x_1 \partial x_2} & \cdots & \frac{\partial^2 f}{\partial x_1 \partial x_n} \\ \frac{\partial^2 f}{\partial x_2 \partial x_1} & \frac{\partial^2 f}{\partial x_2^2} & \cdots & \frac{\partial^2 f}{\partial x_2 \partial x_n} \\ \vdots & \vdots & \ddots & \vdots \\ \frac{\partial^2 f}{\partial x_n \partial x_1} & \frac{\partial^2 f}{\partial x_n \partial x_2} & \cdots & \frac{\partial^2 f}{\partial x_n^2} \end{array}\right] $$ so here the Hessian is a $100000 \times 100000$ matrix. A full (dense) matrix of this size has $10^{10}$ entries, i.e. roughly 80 GB in double precision, which already exceeds the RAM of a typical computer. Moreover, each Newton step requires solving a dense linear system with this matrix, costing $O(n^3)$ operations, which is prohibitively slow at this dimension. Therefore, when the Hessian matrix is full we cannot use Newton's method to efficiently minimize the function $f$.
If the Hessian matrix is tridiagonal, recall the general Newton iteration: given a starting point $x_0$, run the recurrence $$ x_{i+1}=x_i-\left[D^2 f\left(x_i\right)\right]^{-1} \nabla f\left(x_i\right) \text {. } $$ The main cost is computing $\left[D^2 f\left(x_i\right)\right]^{-1} \nabla f\left(x_i\right)=(H(f))^{-1}\nabla f\left(x_i\right)$, which we never do by explicitly inverting $H(f)$; instead we solve the linear system $$ H(f)\,d = \nabla f\left(x_i\right) \Rightarrow Ax=b. $$ Since the Hessian matrix is symmetric and tridiagonal, we can use the Cholesky decomposition from MAA208 - Numerical Linear Algebra in its banded form: the Cholesky factor is bidiagonal, so the factorization and the two triangular solves only cost $O(n)$ operations and $O(n)$ memory. The detailed algorithm can be found in this link. In this case each Newton step is cheap, so Newton's method can be used efficiently, in sharp contrast with the full-Hessian case.
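A minimal sketch of such a Newton step (the tridiagonal matrix below is a toy SPD Hessian and the vector a stand-in gradient, chosen only for illustration), using scipy's banded Cholesky solver so that the system is solved in $O(n)$ time and memory:
import numpy as np
from scipy.linalg import solveh_banded

n = 100_000
diag = np.full(n, 4.0)                  # main diagonal of the (SPD) tridiagonal Hessian
off = np.full(n - 1, -1.0)              # sub/super-diagonal
g = np.random.default_rng(0).standard_normal(n)   # stand-in for the gradient

# upper-band storage expected by solveh_banded: row 0 = super-diagonal, row 1 = diagonal
ab = np.zeros((2, n))
ab[0, 1:] = off
ab[1, :] = diag

d = solveh_banded(ab, g)                # Newton direction: solves H d = g in O(n)
# sanity check: H d should reproduce the right-hand side
Hd = diag * d + np.r_[0.0, off * d[:-1]] + np.r_[off * d[1:], 0.0]
print('max residual of H d - g:', np.abs(Hd - g).max())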
Question 5
a) You use the Conjugate Gradient (CG) algorithm to solve the system $A x=b$ where $A$ is a $10^6 \times 10^6$ positive definite tridiagonal matrix (only the main diagonal and its neighbors are non-zero). What is the complexity of the CG algorithm in this case?
b) Suppose, moreover, that $A$ has exactly 100 distinct eigenvalues. According to the theoretical results shown in the course, what is the required number of iterations for $\mathrm{CG}$ to converge?
Answer to Question 5 |
Given a symmetric, positive-definite matrix $A$, solving the system $A x=b$ is equivalent to minimizing the quadratic function $$ f: x \mapsto \frac{1}{2} x^T A x-b \cdot x, $$ since the gradient of this quadratic function is $\nabla f(x)=A x-b$. Recall the Conjugate Gradient (CG) characterization for solving $A x=b$: let $A$ be a symmetric positive-definite matrix and $d_1, \ldots, d_n$ a (complete) system of $n$ non-zero $A$-orthogonal vectors; then the solution $x^*$ to the system $A x=b$ is given by the formula $$ x^*=\sum_{j=1}^n \frac{b^T d_j}{d_j^T A d_j} d_j. $$ Since $A$ is a $10^6 \times 10^6$ positive-definite tridiagonal matrix, each CG iteration costs $O(n)$ operations (the dominant cost is one matrix-vector product, and a tridiagonal matrix has only $O(n)$ non-zero entries), and CG terminates after at most $n$ iterations, so the overall complexity is $O(n^{2})$ in the worst case.
If $A$ has exactly 100 distinct eigenvalues, then by the theoretical result seen in the course CG converges (in exact arithmetic) in at most 100 iterations: the error after $k$ iterations is governed by a degree-$k$ polynomial in $A$, and a polynomial vanishing at the 100 distinct eigenvalues annihilates the error completely. A small illustration is given below.
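The following sketch illustrates this result on a toy problem (much smaller sizes and a matrix of my own construction, not the matrix of the question): a diagonal SPD matrix with only 5 distinct eigenvalues, for which CG should need about 5 iterations.
import numpy as np
from scipy.sparse import diags
from scipy.sparse.linalg import cg

rng = np.random.default_rng(0)
eigenvalues = rng.choice([1.0, 2.0, 5.0, 10.0, 50.0], size=2000)   # only 5 distinct eigenvalues
A = diags(eigenvalues)                  # diagonal SPD matrix (a simple sparse test case)
b = rng.standard_normal(2000)

iteration_count = []
x, info = cg(A, b, callback=lambda xk: iteration_count.append(1))
print('CG iterations:', len(iteration_count), ' converged (info == 0):', info == 0)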
Question 6
Consider the problem $$ \min _{g_i(x, y, z)=1} f(x, y, z) $$ with $f(x, y, z)=x^2+y^2+z^2, g_1(x, y, z)=2 x+3 y-z, g_2(x, y, z)=5 x-y+z$. Does this problem have a solution? Is it possible to write the optimality conditions given by the Lagrange multipliers?
Answer to Question 6 |
Here we have the two constraints $g_1(x, y, z)=2 x+3 y-z$ and $g_2(x, y, z)=5 x-y+z$, whose gradients are $$ \nabla g_1(x, y, z) = \left(\frac{\partial g_{1}}{\partial x}, \frac{\partial g_{1}}{\partial y}, \frac{\partial g_{1}}{\partial z}\right) = \left(2, 3, -1\right), \qquad \nabla g_2(x, y, z) = \left(\frac{\partial g_{2}}{\partial x}, \frac{\partial g_{2}}{\partial y}, \frac{\partial g_{2}}{\partial z}\right) = \left(5, -1, 1\right). $$ The feasible set $\{g_1 = 1,\ g_2 = 1\}$ is non-empty and closed (the intersection of two non-parallel planes, i.e. a line), and $f(x,y,z)=x^2+y^2+z^2$ is continuous and coercive, so the problem has a solution. Moreover, since the gradients of the constraints are linearly independent, the constraints are qualified and the Lagrange multiplier method applies. Assume Lagrange multipliers $\lambda_1$ and $\lambda_2$; the Lagrangian is $$ \begin{aligned} L(x, y, z, \lambda_1, \lambda_2) &= f(x, y, z) + \lambda_1 (g_1(x, y, z)-1) + \lambda_2 (g_2(x, y, z)-1) \\ &= x^2+y^2+z^2 + \lambda_1 (2 x+3 y-z-1) + \lambda_2 (5 x-y+z-1). \end{aligned} $$ The optimality conditions are $$ \begin{cases} \nabla f(\mathbf{x})+\lambda_1 \nabla g_1(\mathbf{x})+\lambda_2 \nabla g_2(\mathbf{x}) =\mathbf{0}, \\ g_1(\mathbf{x}) =1 \\ g_2(\mathbf{x}) =1 . \end{cases} \Rightarrow \begin{cases} (2x, 2y, 2z) + \lambda_1 (2, 3, -1) + \lambda_2 (5, -1, 1) = (0, 0, 0) \\ 2x+3y-z = 1 \\ 5x-y+z = 1 \end{cases} $$ i.e. the linear system $$ \begin{cases} 2x + 2\lambda_1 + 5\lambda_2 = 0 \\ 2y + 3\lambda_1 - \lambda_2 = 0 \\ 2z - \lambda_1 + \lambda_2 = 0 \\ 2x+3y-z = 1 \\ 5x-y+z = 1 \end{cases} $$ Solving it gives $\lambda_1 = -\frac{7}{57}$, $\lambda_2 = -\frac{8}{171}$, and the optimal point $(x, y, z) = (\frac{41}{171}, \frac{55}{342}, -\frac{13}{342})$. So it is indeed possible to write (and solve) the optimality conditions given by the Lagrange multipliers.
x, y, z, lambda_1, lambda_2 = symbols('x y z lambda_1 lambda_2')
eq1 = Eq(2*x + 2*lambda_1 + 5*lambda_2, 0)
eq2 = Eq(2*y + 3*lambda_1 - lambda_2, 0)
eq3 = Eq(2*z - lambda_1 + lambda_2, 0)
eq4 = Eq(2*x + 3*y - z, 1)
eq5 = Eq(5*x - y + z, 1)
solutions = solve((eq1, eq2, eq3, eq4, eq5), (x, y, z, lambda_1, lambda_2))
print('lambda_1 =', solutions[lambda_1], ', lambda_2 =', solutions[lambda_2], 'Optimal point:', (solutions[x], solutions[y], solutions[z]))
lambda_1 = -7/57 , lambda_2 = -8/171 Optimal point: (41/171, 55/342, -13/342)
Question 7
Consider the problem $$ \min _{g_i(x) \leq 0} x^2+y^2, $$ with $g_1(x)=x+y-1$ and $g_2(x)=y-x-1$. What is the optimal solution to this problem? Can the optimality conditions be written at the optimum? What is the corresponding optimality condition for this problem?
Answer to Question 7 |
Since the objective function is $x^2+y^2$, the optimal solution is $(x, y) = (0, 0)$, which satisfies both constraints strictly: $g_{1}(0,0) = -1 < 0$ and $g_{2}(0,0) = -1 < 0$. The optimality (KKT) conditions can therefore be written at the optimum. The Lagrangian is $$ L(x, y, \lambda_1, \lambda_2) = x^2+y^2 + \lambda_1 (x+y-1) + \lambda_2 (y-x-1), $$ and the optimality conditions read $$ \begin{cases} \nabla f(\mathbf{x})+\lambda_1 \nabla g_1(\mathbf{x})+\lambda_2 \nabla g_2(\mathbf{x}) =\mathbf{0}, \\ \lambda_1 \geq 0,\ \lambda_2 \geq 0,\quad g_1(\mathbf{x}) \leq 0,\ g_2(\mathbf{x}) \leq 0, \\ \lambda_1 g_1(\mathbf{x}) = 0,\quad \lambda_2 g_2(\mathbf{x}) = 0 . \end{cases} $$ At $(0,0)$ both constraints are inactive, so complementary slackness forces $\lambda_1 = \lambda_2 = 0$, and the first condition reduces to $\nabla f(0,0) = (0,0)$, which indeed holds. Hence the optimality condition for this problem is simply $\nabla f(x^*) = 0$ with zero multipliers: the constraints play no role at the optimum.
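A quick numerical cross-check (added as an illustration, using SLSQP; note that scipy's 'ineq' constraints are of the form $g(x) \geq 0$, so we pass $-g_i$):
import numpy as np
from scipy.optimize import minimize

objective = lambda v: v[0] ** 2 + v[1] ** 2
constraints = [
    {'type': 'ineq', 'fun': lambda v: 1 - v[0] - v[1]},   # g1(x, y) = x + y - 1 <= 0
    {'type': 'ineq', 'fun': lambda v: 1 + v[0] - v[1]},   # g2(x, y) = y - x - 1 <= 0
]
res = minimize(objective, x0=[1.5, -0.5], method='SLSQP', constraints=constraints)
print('minimizer:', res.x)
print('g1 =', res.x[0] + res.x[1] - 1, ', g2 =', res.x[1] - res.x[0] - 1, '(both inactive)')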
def f(x, y):
return x**2 + y**2
plt.figure(figsize=(6, 6))
x = np.linspace(-2, 2, 400)
y = np.linspace(-2, 2, 400)
x, y = np.meshgrid(x, y)
z = f(x, y)
plt.contour(x, y, z, levels=20)
x_boundary = np.linspace(-2, 2, 400)
y_boundary1 = 1 - x_boundary
y_boundary2 = x_boundary + 1
# plot the constraint boundaries
plt.plot(x_boundary, y_boundary1, label='x + y - 1 = 0')
plt.plot(x_boundary, y_boundary2, label='y - x - 1 = 0')
plt.fill_between(x_boundary, np.minimum(y_boundary1, y_boundary2), -2, where=(x_boundary >= -2) & (x_boundary <= 2), color='gray', alpha=0.5)
plt.xlim(-2, 2)
plt.ylim(-2, 2)
plt.xlabel('x')
plt.ylabel('y')
plt.legend()
plt.show()
Question 8
Let $f: \mathbb{R}^N \rightarrow \mathbb{R}$ be a function you want to minimize. Indicate which optimization algorithm presented in the course you would use to search for the minimum and justify your choice.
(i) $N=1000$, you know the gradient and the Hessian of $f$. You observe that the Hessian matrix is full.
(ii) $N=10^6$, you know the gradient, the function is ill-conditioned.
(iii) $N=3$, you only have access to function values.
(iv) $N=1000$, the function $f$ is represented as a sum of squares of $C^1$ functions.
(v) You minimize a $C^1$ function (gradients are available) with some linear constraints on the variables.
(vi) You minimize a convex $C^1$ function (gradients are available) with some non-linear convex equality constraints on the variables.
Answer to Question 8 |
(i) L-BFGS algorithm. Here $N=1000$ is fairly large and the Hessian is full, so applying Newton's method requires a substantial amount of computation and storage. The L-BFGS algorithm approximates the inverse Hessian using only a limited amount of memory, which is suitable for large $N$.
(ii) Conjugate Gradient method. Here the dimension of the problem is very large and the function is ill-conditioned. The Conjugate Gradient method is a good choice: it is an iterative algorithm that only produces an approximation of the solution using gradient information, which is often good enough for very large $N$.
(iii) Nelder-Mead method. Since we only have access to function values, we need a gradient-free (zero-order) method, and for $N=3$ the Nelder-Mead simplex method works well.
(iv) Gauss-Newton method. Since $f$ is a sum of squares of $C^1$ functions (a non-linear least-squares problem), we can compute the Jacobian of the residuals and use it to approximate the Hessian, so the Gauss-Newton method is the natural choice.
(v) Projected GD. Since all the constraints are linear, the projection is cheap to compute; for linear equality constraints $Ax=b$ it is given explicitly by $$ P_K(y)=x^*=y+A^T\left(A A^T\right)^{-1}(b-A y). $$ Therefore the Gradient Descent algorithm with projection can be implemented efficiently (see the short sketch after this list).
(vi) Lagrange multipliers. Since we minimize a convex $C^1$ function with non-linear convex equality constraints, we can write the Lagrangian optimality conditions and solve them, whereas projected GD performs badly on non-linear constraints (the projection is no longer explicit).
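To illustrate the projection formula in item (v), here is a minimal sketch with toy data (the matrix A, the vector b and the point y below are arbitrary, chosen only for the illustration):
import numpy as np

rng = np.random.default_rng(0)
A = rng.standard_normal((3, 6))     # 3 linear equality constraints in R^6
b = rng.standard_normal(3)
y = rng.standard_normal(6)

# projection of y onto the affine set {x : A x = b}
proj = y + A.T @ np.linalg.solve(A @ A.T, b - A @ y)
print('constraint residual after projection:', np.linalg.norm(A @ proj - b))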
The objective is to find the global minimum of the function $$ f(x, y)=e^{\sin (50 x)}+\sin \left(60 e^y\right)+\sin (70 \sin x)+\sin (\sin (80 y))-\sin (10(x+y))+\frac{x^2+y^2}{4}, $$ where $e^X$ denotes the usual exponential function $\exp (X)$.
from mpl_toolkits.mplot3d import Axes3D
def f(x, y):
return np.exp(np.sin(50 * x)) + np.sin(60 * np.exp(y)) + np.sin(70 * np.sin(x)) + np.sin(np.sin(80 * y)) - np.sin(10 * (x + y)) + (x**2 + y**2) / 4
Question 1
Prove that the function $f$ admits global minimizers on $\mathbb{R}^2$.
We apply Proposition 2.1. The function $f$ is continuous on $\mathbb{R}^2$, and the oscillating part is bounded: $$ \left|g(x,y)\right|=\left|e^{\sin (50 x)}+\sin \left(60 e^y\right)+\sin (70 \sin x)+\sin (\sin (80 y))-\sin (10(x+y)) \right| \leq e + 4. $$ Therefore $$ f(x,y) \geq \frac{x^2+y^2}{4} - (e+4) \longrightarrow +\infty \quad \text{as } \|(x,y)\| \rightarrow \infty, $$ so $f$ is coercive and continuous, and hence admits global minimizers on $\mathbb{R}^2$.
Question 2
Prove that the global minimizer lies in the region $[-4, 4]^{2}$
print('The value of 1/e is ', 1 / np.exp(1))
print('The value of f(-0.5, 0) is', f(-0.5, 0))
The value of 1/e is  0.36787944117144233
The value of f(-0.5, 0) is -0.8999682589251161
We prove this by contradiction. Suppose the global minimizer $(x^{*},y^{*})$ lies outside the region $[-4, 4]^{2}$; then it suffices to exhibit a point inside $[-4, 4]^{2}$ with a smaller value of $f$. The oscillating part satisfies $$ g(x,y)=e^{\sin (50 x)}+\sin \left(60 e^y\right)+\sin (70 \sin x)+\sin (\sin (80 y))-\sin (10(x+y)) \geq -4 + \frac{1}{e}. $$ Moreover, if $(x,y)$ lies outside the region $[-4, 4]^{2}$ then $x^{2}+y^{2} > 16$, so $$ \frac{x^{2}+y^{2}}{4} \geq 4, $$ and therefore $$ f(x,y) \geq -4 + \frac{1}{e} + 4 = \frac{1}{e} \quad \text{when } (x,y) \notin [-4, 4]^{2}. $$ Since $f(-0.5,0)=-0.899968 < \frac{1}{e}$ (computed above), this contradicts the assumption that the minimizer lies outside $[-4,4]^{2}$, which finishes the proof. *Q.E.D.*
Question 3
Make a plot of the function values in the region indicated above and conjecture a more precise location of the global minimum.
x = np.linspace(-4, 4, 200)
y = np.linspace(-4, 4, 200)
X, Y = np.meshgrid(x, y)
Z = f(X, Y)
# plot the 2D and 3D figures
plt.figure(figsize=(8, 6))
plt.contour(X, Y, Z, levels=20)
plt.colorbar()
plt.xlim(-4, 4)
plt.ylim(-4, 4)
plt.xlabel('x')
plt.ylabel('y')
plt.title('Contour plot of f(x, y)')
plt.show()
fig = plt.figure(figsize=(12, 8))
ax = fig.add_subplot(111, projection='3d')
ax.plot_surface(X, Y, Z, cmap='viridis')
ax.set_xlabel('X-axis')
ax.set_ylabel('Y-axis')
ax.set_zlabel('Z-axis')
ax.set_title('3D plot of f(x, y)')
plt.show()
Question 4
What terms in the expression of the objective function generate the oscillatory behavior? Justify your answer.
The terms of the objective function that generate the oscillatory behavior are the following:
$e^{\sin(50x)}$: the sine inside the exponent oscillates between $-1$ and $1$ as $x$ varies, so this term oscillates rapidly between $e^{-1}$ and $e^{1}$ (frequency 50).
$\sin(60e^y)$: oscillates between $-1$ and $1$, and faster and faster as $y$ grows, since its argument $60e^y$ increases exponentially.
$\sin(70\sin x)$: oscillates between $-1$ and $1$ (frequency 70 in its inner argument).
$\sin(\sin(80y))$: oscillates between $-\sin(1)$ and $\sin(1)$ (frequency 80).
$-\sin(10(x+y))$: oscillates between $-1$ and $1$ (frequency 10 along the diagonal direction).
# plot the graph sin(60e^y)
def f_plot(x):
return np.sin(60 * np.exp(x))
x = np.linspace(-4, 1, 5000)  # dense sampling: the argument 60*exp(x) oscillates faster and faster
y = f_plot(x)
plt.figure(figsize=(8, 6))
plt.plot(x, y)
plt.xlabel('x')
plt.ylabel('y')
plt.title(r'Plot of $\sin(60e^x)$')
plt.show()
Question 5
Having restricted the search region to $[-4,4]^2$, define an $N \times N$ uniform grid on this region and evaluate the function $f$ at each of these nodes. In each case find and print the minimal value attained by $f$ on the current grid. See how the results change for $N = 2^{k} + 1,\ 4 \leq k \leq 10$. (Use vectorization, not loops, to accelerate the computations.)
list_min_posi = []
def evaluate_function_on_grid(N):
x = np.linspace(-4, 4, N)
y = np.linspace(-4, 4, N)
X, Y = np.meshgrid(x, y)
Z = f(X, Y)
return Z
def find_min_values():
    for k in range(4, 11):
        N = 2 ** k + 1
        Z = evaluate_function_on_grid(N)
        min_value = np.min(Z)
        # np.where returns (row, column) indices; rows correspond to y, columns to x
        row_index, col_index = np.where(Z == min_value)
        x_min = col_index[0] / (N - 1) * 8 - 4
        y_min = row_index[0] / (N - 1) * 8 - 4
        list_min_posi.append((x_min, y_min))
        print(f"For k={k}, N = {N}, the minimum value of f(x, y) is {min_value} at the point ({x_min}, {y_min})")
find_min_values()
For k=4, N = 17, the minimum value of f(x, y) is -1.7612874733047068 at the point (-0.5, -0.5)
For k=5, N = 33, the minimum value of f(x, y) is -1.8463465039832796 at the point (1.25, -0.5)
For k=6, N = 65, the minimum value of f(x, y) is -1.8463465039832796 at the point (1.25, -0.5)
For k=7, N = 129, the minimum value of f(x, y) is -2.449624019189007 at the point (0.0625, -0.5)
For k=8, N = 257, the minimum value of f(x, y) is -2.943575583284294 at the point (0.34375, -0.09375)
For k=9, N = 513, the minimum value of f(x, y) is -3.163951672593782 at the point (-0.390625, -0.09375)
For k=10, N = 1025, the minimum value of f(x, y) is -3.303518906855208 at the point (-0.0234375, 0.2109375)
Question 6
For each $4 \leq k \leq 10$, pick the point $x_0$ of the previously found grids which gives the lowest value for the function $f$. Then choose a gradient-based algorithm and run it starting from the point $x_0$, observing what is the corresponding minimal value.
Here we use the Gradient Descent method with variable step size to find the minimum value of $f(x,y)$ (for the two finest grids we use scipy's L-BFGS-B instead, as in the code below).
def gradientVariableStep(f,df,x_init,step=0.001,tol=1e-06,maxiter=20000):
maxstep = 10
x=x_init.copy()
xtab=[]
ftab=[]
xtab.append(x)
pval = f(x)
ftab.append(pval)
it=0
g=df(x)
    while (it == 0) or (step > tol and it < maxiter and np.linalg.norm(xtab[-1] - xtab[-2]) > tol):
actx= x-step*g
val = f(actx)
if(val<pval):
#accept iteration
x = actx
pval = val
step = min(1.1*step,maxstep)
xtab.append(x)
ftab.append(val)
g = df(x)
it=it+1
else:
step = 0.8*step
# boolean to indicate the convergence
if(it==maxiter):
conv = False
else:
conv = True
return xtab, ftab, conv
def f_np(x):
return np.exp(np.sin(50 * x[0])) + np.sin(60 * np.exp(x[1])) + np.sin(70 * np.sin(x[0])) + np.sin(np.sin(80 * x[1])) - np.sin(10 * (x[0] + x[1])) + (x[0]**2 + x[1]**2) / 4
def Gradf_np(x):
    return np.array([50*np.exp(np.sin(50*x[0]))*np.cos(50*x[0])+70*np.cos(70*np.sin(x[0]))*np.cos(x[0])-10*np.cos(10*(x[0]+x[1]))+x[0]/2, 60*np.exp(x[1])*np.cos(60*np.exp(x[1]))+80*np.cos(np.sin(80*x[1]))*np.cos(80*x[1])-10*np.cos(10*(x[0]+x[1]))+x[1]/2])
minimal_values = []
minimizer = []
for i in range(len(list_min_posi)):
x_init = np.array(list_min_posi[i])
if i < len(list_min_posi) - 2:
xtab, ftab, conv = gradientVariableStep(f_np, Gradf_np, x_init, step=0.001, tol=1e-06, maxiter=200)
print(f'For initial point {x_init}, the algorithm converges in {len(xtab)} iterations')
print('Is the algorithm converges? ', conv)
print(f'The minimum value of f(x, y) is {ftab[-1]} at the point ({xtab[-1][0]}, {xtab[-1][1]})')
print('-' * 50)
minimal_values.append(ftab[-1])
minimizer.append(xtab[-1])
else:
res = minimize(f_np, x_init, method='L-BFGS-B', tol=1e-06)
print(f'For initial point {x_init}, the algorithm converges in {res.nit} iterations')
print('Is the algorithm converges? ', res.success)
print(f'The minimum value of f(x, y) is {res.fun} at the point ({res.x[0]}, {res.x[1]})')
print('-' * 50)
minimal_values.append(res.fun)
minimizer.append(res.x)
For initial point [-0.5 -0.5], the algorithm converges in 4 iterations
Is the algorithm converges?  True
The minimum value of f(x, y) is -1.8340181272776597 at the point (-0.5109105553704272, -0.49506955611011516)
--------------------------------------------------
For initial point [ 1.25 -0.5 ], the algorithm converges in 2 iterations
Is the algorithm converges?  True
The minimum value of f(x, y) is -1.878771216558539 at the point (1.2352881097083996, -0.4943874516804751)
--------------------------------------------------
For initial point [ 1.25 -0.5 ], the algorithm converges in 2 iterations
Is the algorithm converges?  True
The minimum value of f(x, y) is -1.878771216558539 at the point (1.2352881097083996, -0.4943874516804751)
--------------------------------------------------
For initial point [ 0.0625 -0.5 ], the algorithm converges in 8 iterations
Is the algorithm converges?  True
The minimum value of f(x, y) is -2.839623976975017 at the point (0.07331443185636564, -0.49676114392025295)
--------------------------------------------------
For initial point [ 0.34375 -0.09375], the algorithm converges in 2 iterations
Is the algorithm converges?  True
The minimum value of f(x, y) is -2.946970693908365 at the point (0.3407463345919834, -0.09436988349901183)
--------------------------------------------------
For initial point [-0.390625 -0.09375 ], the algorithm converges in 3 iterations
Is the algorithm converges?  True
The minimum value of f(x, y) is -3.2081391294819426 at the point (-0.39452567638237185, -0.09320021707807923)
--------------------------------------------------
For initial point [-0.0234375  0.2109375], the algorithm converges in 3 iterations
Is the algorithm converges?  True
The minimum value of f(x, y) is -3.3068686474609335 at the point (-0.024403099159344636, 0.21061247893447854)
--------------------------------------------------
Question 7
Observe how the minimal value found numerically and the point where the minimum is attained change with respect to $k \in \left\{4, ..., 10\right\}$. What can you conclude?
# plot the graph of minimal values
plt.figure(figsize=(8, 6))
plt.plot(np.arange(4, 11), minimal_values, 'o-', color='red')
plt.xlabel('k')
plt.ylabel('minimal values')
plt.title('The graph of minimal values')
plt.show()
# plot the trajectory of minimizer and the points corresponding to the minimal values and order
plt.figure(figsize=(8, 6))
for i in range(len(list_min_posi)):
if i == 0:
plt.plot(minimizer[i][0], minimizer[i][1], 'o-', color='red', label='Trajectory')
else:
plt.plot(minimizer[i][0], minimizer[i][1], 'o-', color='red')
plt.text(minimizer[i][0]-0.05, minimizer[i][1]+0.01, f'{i+1}', fontsize=15)
if i > 0:
plt.annotate('', xy=minimizer[i], xytext=minimizer[i-1], arrowprops=dict(facecolor='black', shrink=0.02, width=1, headwidth=5))
plt.xlabel('x')
plt.ylabel('y')
plt.title('The trajectory of minimizer and the points corresponding to the minimal values and order')
plt.legend()
plt.show()
We can see that as $k$ increases, the minimal value found numerically decreases and the point where the minimum is attained moves around. From the trajectory of the minimizers we can guess that the minimizer of the function lies around $(0, 0.2)$.
Question 8
In view of the previous observation what could be the global minimum of the function $f$ on $\mathbb{R}^2$ ? What arguments can you give to support your claim?
From the previous observations we can conclude that the global minimum of the function $f$ on $\mathbb{R}^2$ is approximately $f_{\min} \simeq -3.3069$, attained near $(-0.024,\ 0.211)$. Two arguments support this claim: first, by Question 2 the global minimizer must lie in $[-4,4]^2$, so a grid search on that square cannot miss the basin of the global minimum once the grid is fine enough to resolve the oscillations; second, the value found stabilizes as $k$ increases, and a local descent started from the best grid point keeps converging to the same point and value. A refinement with tight tolerances is shown below.
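As an extra supporting check (the solver and tolerances below are an arbitrary choice), we polish the best point found above with a tight-tolerance local method; f_np is the function defined earlier and the starting point is taken from the previous results.
import numpy as np
from scipy.optimize import minimize

best = minimize(f_np, np.array([-0.024, 0.211]), method='Nelder-Mead',
                options={'xatol': 1e-12, 'fatol': 1e-12})
print('refined minimum value:', best.fun)
print('attained at:', best.x)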
Consider the function $J:[0, \infty)^2 \rightarrow \mathbb{R}$ defined by $$ J(x, y)=\cosh (4 x+y) $$ Recall that the hyperbolic cosine function is defined by $\cosh (x)=(\exp (x)+\exp (-x)) / 2$. Consider the following sets $$ \begin{gathered} K_1=\left\{(x, y) \in[0, \infty)^2: x y \geq 1\right\} \\ K_2=\left\{(x, y) \in[0, \infty)^2: y \leq 1+x, y \geq 2-x\right\} . \end{gathered} $$
Question 10
Prove that the sets $K_1$ and $K_2$ are convex. Are the sets $K_1$ and $K_2$ closed? Is the function $J$ convex? Finally, prove that $J$ admits minimizers on $K_1$. What can you say about existence of minimizers on $K_2$ ?
# plot the graph of cosh(x)
x = np.linspace(-2, 2, 100)
y = np.cosh(x)
plt.figure(figsize=(8, 6))
plt.plot(x, y, color='red')
plt.xlabel('x')
plt.ylabel('y')
plt.title('The graph of cosh(x)')
plt.show()
1. Convexity
We recall the definition of a convex set: a set $C$ is convex if the line segment between any two points of $C$ lies in $C$, i.e. $\forall x_1, x_2 \in C, \forall \theta \in[0,1]$, $$ \theta x_1+(1-\theta) x_2 \in C. $$ We first prove that $K_1$ is convex. Suppose $(x_1,y_1),(x_2,y_2)\in K_1$, so $x_1y_1\geq 1$ and $x_2y_2\geq 1$, with all coordinates non-negative. For any $\lambda \in [0,1]$ set $$ \begin{aligned} x_\lambda &= \lambda x_1 + (1-\lambda)x_2, \\ y_\lambda &= \lambda y_1 + (1-\lambda)y_2. \\ \end{aligned} $$ Then $$ x_\lambda y_\lambda = \lambda^{2} x_{1}y_{1} + (1-\lambda)^{2} x_{2}y_{2} + \lambda(1-\lambda)(x_1y_2 + x_2y_1). $$ By the AM-GM inequality, $x_1y_2 + x_2y_1 \geq 2\sqrt{x_1y_1\,x_2y_2}$, so $$ x_\lambda y_\lambda \geq \lambda^{2} x_{1}y_{1} + (1-\lambda)^{2} x_{2}y_{2} + 2\lambda(1-\lambda)\sqrt{x_1y_1}\sqrt{x_2y_2} = \left(\lambda\sqrt{x_1y_1} + (1-\lambda)\sqrt{x_2y_2}\right)^{2} \geq \left(\lambda + (1-\lambda)\right)^{2} = 1. $$ Therefore $(x_\lambda, y_\lambda) \in K_1$ for any $\lambda \in [0,1]$, which shows that $K_1$ is convex.
We then prove that $K_2$ is convex: Suppose $(x_1,y_1),(x_2,y_2)\in K_2$. Then we have $2-x_{1} \leq y_{1} \leq 1+x_{1}$ and $2-x_{2} \leq y_{2} \leq 1+x_{2}$. For any $\lambda \in [0,1]$, we have $$ \begin{aligned} x_\lambda &= \lambda x_1 + (1-\lambda)x_2 \\ y_\lambda &= \lambda y_1 + (1-\lambda)y_2 \\ \end{aligned} $$ Then we have $$ \begin{aligned} y_\lambda &\leq \lambda(1+x_1) + (1-\lambda)(1+x_2) \\ &= 1 + x_\lambda \end{aligned} $$ and $$ \begin{aligned} y_\lambda &\geq \lambda(2-x_1) + (1-\lambda)(2-x_2) \\ &= 2 - x_\lambda \end{aligned} $$ Therefore, $(x_\lambda, y_\lambda) \in K_2$ for any $\lambda \in [0,1]$, which implies that $K_2$ is convex.
2. Closed
Here we apply the definition of closed sets from MAA202 - Topology and Multivariable calculus.
We first prove that $K_1$ is closed. Indeed, let $\left(z_n\right)_{n \in \mathbb{N}} \in K_{1}^{\mathbb{N}}$ be a sequence converging to $z_{\infty}=\left(x_{\infty}, y_{\infty}\right)$ in $\mathbb{R}^2$. We want to show that $z_{\infty} \in K_{1}$. Since $z_n \in K_{1}$ for all $n \in \mathbb{N}$, we can write $z_n=\left(x_n, y_n\right)$ with $$ \forall n \in \mathbb{N}, x_n \cdot y_n \geq 1 . $$ By the previous convergence, we have $$ x_n \underset{n \rightarrow+\infty}{\longrightarrow} x_{\infty} \text { and } y_n \underset{n \rightarrow+\infty}{\longrightarrow} y_{\infty}, $$ therefore we can pass to the limit in the previous inequality to get $$ x_{\infty} \cdot y_{\infty} \geq 1, $$ which means that $z_{\infty} \in K_{1}$.
We then prove that $K_2$ is closed. With the same method one shows that the sets $\{(x,y) \in \mathbb{R}^2: y \leq 1+x\}$ and $\{(x,y) \in \mathbb{R}^2: y \geq 2-x\}$ are closed (as is $[0,\infty)^2$). Therefore their intersection $K_2$ is also closed, being a finite intersection of closed sets (a proposition from MAA202 - Topology).
3. Convexity of $J$
$J$ is convex: to show this, we need to prove that for any $(x_1,y_1),(x_2,y_2) \in [0,\infty)^2$ and any $\lambda \in [0,1]$, we have $$ J(\lambda(x_1,y_1) + (1-\lambda)(x_2,y_2)) \leq \lambda J(x_1,y_1) + (1-\lambda)J(x_2,y_2). $$ We have $$ \begin{aligned} \cosh\bigl(4(\lambda x_1 + (1-\lambda)x_2) + \lambda y_1 + (1-\lambda)y_2\bigr) =& \frac{1}{2} \left(\exp\left(4(\lambda x_1 + (1-\lambda)x_2) + \lambda y_1 + (1-\lambda)y_2\right) + \exp\left(-4(\lambda x_1 + (1-\lambda)x_2) - \lambda y_1 - (1-\lambda)y_2\right)\right) \\ \leq& \frac{1}{2} \left(\lambda \exp\left(4x_1 + y_1\right) + (1-\lambda) \exp\left(4x_2 + y_2\right) + \lambda \exp\left(-4x_1 - y_1\right) + (1-\lambda) \exp\left(-4x_2 - y_2\right)\right) \\ =& \lambda \cosh(4x_1+y_1) + (1-\lambda) \cosh(4x_2+y_2) \\ =& \lambda J(x_1,y_1) + (1-\lambda)J(x_2,y_2), \end{aligned} $$ where we used the convexity of the exponential function. (Equivalently, $J$ is convex because it is the composition of the convex function $\cosh$ with the affine map $(x,y) \mapsto 4x+y$.)
4. Existence of a solution
$J$ admits minimizers on $K_1$: the set $K_1$ is closed (proved above) and $J$ is continuous; moreover, on $[0,\infty)^2$ we have $4x+y \to +\infty$ as $\|(x,y)\| \to \infty$, so $J(x,y)=\cosh(4x+y) \to +\infty$, i.e. $J$ is coercive on $K_1$. A continuous coercive function on a non-empty closed set attains its minimum, so $J$ admits a minimizer on $K_1$. To locate it, we apply the Lagrange multiplier method on the boundary $xy = 1$: with the constraint $g(x,y) = xy - 1$, the stationarity conditions are $$ \begin{aligned} \nabla J(x,y) &= \lambda \nabla g(x,y), \\ g(x,y) &= 0, \end{aligned} $$ where $\lambda$ is the Lagrange multiplier, and $$ \begin{aligned} \nabla J(x,y) &= (4\sinh(4x+y), \sinh(4x+y)), \\ \nabla g(x,y) &= (y,x). \end{aligned} $$ Therefore the stationary points solve $$ \begin{aligned} 4\sinh(4x+y) &= \lambda y, \\ \sinh(4x+y) &= \lambda x, \\ xy &= 1. \end{aligned} $$ Dividing the first two equations gives $y=4x$, and then $xy=4x^{2}=1$, so $x = \frac{1}{2}$ and $y = 2$. The stationary point, and hence the minimizer, is $(x,y) = (\frac{1}{2}, 2)$.
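A numerical cross-check of this stationary point (an illustrative sketch; the choice of SLSQP and of the starting point is arbitrary), minimizing $J$ under the constraint $xy \geq 1$ with bounds $x, y \geq 0$:
import numpy as np
from scipy.optimize import minimize

J_obj = lambda v: np.cosh(4 * v[0] + v[1])
constraint = {'type': 'ineq', 'fun': lambda v: v[0] * v[1] - 1}   # xy - 1 >= 0
res = minimize(J_obj, x0=[1.0, 1.0], method='SLSQP',
               bounds=[(0, None), (0, None)], constraints=[constraint])
print('minimizer:', res.x, ' value:', res.fun)
print('cosh(4) =', np.cosh(4.0))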
From the plots below we can see that $J$ also attains a minimal value on $K_2$: indeed $K_2$ is closed and $J$ is coercive on it as well, so the same existence argument applies.
Question 11
Use Python to plot the behavior of the function $J$ on the sets $K_1$ and $K_2$ (separately). For unbounded sets just choose a bounding region of the type $[0, M]^2$. Conjecture the location of the minimizers and give a more precise answer regarding the existence of minimizers of $J$ on $K_2$.
def J(x):
return np.cosh(4 * x[0] + x[1])
def constraint(x):
return 1 - x[0] * x[1]
def constraint2(x):
return x[0] + x[1] - 2
def constraint3(x):
return x[0] - x[1] + 1
plt.figure(figsize=(8, 6))
xmin=0
xmax=3
ymin=0
ymax=3
aX0=np.linspace(xmin,xmax,100)
aX1=np.linspace(ymin,ymax,100)
X, Y = np.meshgrid(aX0, aX1)
K2 = (Y <= X + 1) & (Y >= 2 - X)
Z=np.array([[J(np.array([x0,x1])) for x0 in aX0] for x1 in aX1])
ZG=np.array([[constraint(np.array([x0,x1])) for x0 in aX0] for x1 in aX1])
plt.contour(aX0,aX1,ZG,levels=0,colors='r',linewidths=2)
plt.contour(aX0,aX1,Z,12)
plt.axis('scaled')
plt.colorbar()
plt.xlabel('$x_0$')
plt.ylabel('$x_1$')
plt.title(r'Plot of $\cosh(4x+y)$ with constrain $K_{1}$')
plt.contour(X, Y, X * Y, levels=[1], colors="red", linewidths=2)
plt.contourf(X, Y, X * Y, levels=[1, 1e2], colors="red", alpha=0.1)
plt.text(0.5, 2.1, "$K_1$", fontsize=20, color="red")
plt.scatter(0.5, 2, c="black", marker="o", s=60, label="Conjectured Optimal Point")
plt.legend()
plt.show()
X, Y = np.meshgrid(aX0, aX1)
plt.figure(figsize=(8, 6))
ZG2=np.array([[constraint2(np.array([x0,x1])) for x0 in aX0] for x1 in aX1])
ZG3=np.array([[constraint3(np.array([x0,x1])) for x0 in aX0] for x1 in aX1])
plt.contourf(X, Y, K2, levels=[1e-10, 1], colors="green", alpha=0.1)
plt.text(0.7, 1.4, "$K_2$", fontsize=20, color="green")
plt.contour(aX0,aX1,ZG2,levels=0,colors='r',linewidths=2)
plt.contour(aX0,aX1,ZG3,levels=0,colors='r',linewidths=2)
plt.contour(aX0,aX1,Z,12)
plt.axis('scaled')
plt.colorbar()
plt.xlabel('$x_0$')
plt.ylabel('$x_1$')
plt.title(r'Plot of $\cosh(4x+y)$ with constrain $K_{2}$')
plt.show()
From the plot above we can see that the contour lines of $J$ are straight lines of slope $-4$: writing $\cosh(4x+y)=\cosh(m)$ with $m=4x+y$, a level set of $J$ is the line $4x+y=m$. Moreover, $\cosh$ is increasing on $[0, \infty)$ and $4x+y \geq 0$ on $[0,\infty)^2$, so minimizing $J$ amounts to finding the smallest $m$ for which the line $4x+y=m$ still touches the constraint set.
To find the minimizer we therefore look for the contact point between such a contour line and the set $K_1$. Writing the contour line as $y=-4x+c$ for a constant $c$, the contact point with the boundary curve $y=1/x$ is where the tangent has slope $-4$: $$ y' = \left(\frac{1}{x}\right)'=-\frac{1}{x^{2}}=-4 \;\Rightarrow\; x=\frac{1}{2},\quad y = 2. $$ By the same reasoning, for $K_2$ the smallest value of $4x+y$ is attained at the corner of the feasible region, i.e. at the intersection of the lines $y=1+x$ and $y=2-x$, namely the point $(0.5, 1.5)$.
Question 12
Compute the projection operator on the set $K_1$ : given $X$ in $\mathbb{R}^2$ find the closest point to $X$ which is in $K_1$. Approximate the solution of the problem $$ \min _{x \in K_1} J(x) $$ using the Projected Gradient algorithm.
We denote the point $X=(x_{0},y_{0})$. Then we have two cases:
If $X \in K_{1}$, then the closest point to $X$ is $X$ itself.
If $X \notin K_{1}$ (with $x_{0}, y_{0} \geq 0$), then the closest point is the foot of the normal dropped from $X$ onto the boundary curve $y=\frac{1}{x}$. Write this point as $Y=(m,\frac{1}{m})$; the tangent line at $Y$ is $y-\frac{1}{m}=-\frac{1}{m^{2}}(x-m)$, and the segment $XY$ must be orthogonal to it, i.e. its slope $\frac{\frac{1}{m}-y_{0}}{m-x_{0}}$ must equal $m^{2}$. This gives $$ \frac{\frac{1}{m}-y_{0}}{m-x_{0}} = m^{2} \;\Longleftrightarrow\; 2m^{4}-2x_{0}m^{3}+2y_{0}m-2=0, $$ a quartic equation in $m$ whose relevant (positive) root gives the projection. We could solve this equation by hand, but here we simply use the scipy and sympy packages for the computation.
def closest_distance(x1, y1):
x = sp.symbols('x')
equation = Eq(2 * x **4 - 2 * x1 * x **3 + 2 * y1 * x - 2, 0)
roots = sp.solve(equation)
    # the positive real root gives the projection point (m, 1/m) on the curve xy = 1
for root in roots:
if root.evalf() > 0:
return np.array([float(root.evalf()), float(1 / root.evalf())])
def distance(x1, y1):
return np.sqrt((x1 - result[0]) ** 2 + (y1 - result[1]) ** 2)
x1, y1 = 0.5, 1.0
result = closest_distance(x1, y1)
print(f'The closest point on the curve xy=1 to ({x1}, {y1}) is ({result[0]}, {result[1]}); the distance is {distance(x1, y1)}')
The closest point on the curve xy=1 to (0.5, 1.0) is (0.8216181575795043, 1.2171103946217674); the distance is 0.3880401560891017
# plot the graph
plt.figure(figsize=(8, 6))
Z=np.array([[J(np.array([x0,x1])) for x0 in aX0] for x1 in aX1])
ZG=np.array([[constraint(np.array([x0,x1])) for x0 in aX0] for x1 in aX1])
plt.contour(aX0,aX1,ZG,levels=0,colors='r',linewidths=2)
plt.contour(aX0,aX1,Z,12)
plt.axis('scaled')
plt.colorbar()
plt.xlabel('$x_0$')
plt.ylabel('$x_1$')
plt.title(r'Plot of $\cosh(4x+y)$ with constrain $K_{1}$')
plt.contour(X, Y, X * Y, levels=[1], colors="red", linewidths=2)
plt.contourf(X, Y, X * Y, levels=[1, 1e2], colors="red", alpha=0.1)
plt.text(0.5, 2.1, "$K_1$", fontsize=20, color="red")
plt.scatter(0.5, 2, c="black", marker="o", s=60, label="Conjectured Optimal Point")
# plot the point x1, y1 and result[0], result[1] and the connecting line
plt.scatter(x1, y1, c="black", marker="o", s=30, label="Initial Point")
plt.scatter(result[0], result[1], c="black", marker="o", s=30, label="Closest Point")
plt.plot([x1, result[0]], [y1, result[1]], c="black", linestyle="-", linewidth=1, label="Connecting Line")
plt.legend()
plt.show()
We have the Projected Gradient algorithm as follows:
GD with projection
Consider $K$ a closed and convex set in $\mathbb{R}^n$ and let $x_0 \in K$ be an initial point. The solution of the problem $$ \min _{x \in K} f(x) $$ may be approximated using the iterative algorithm $$ x_{i+1}=P_K\left(x_i-t \nabla f\left(x_i\right)\right) $$ for some $t>0$ small enough.
Then we have the Gradient of $J$ as follows: $$ \nabla J(x, y)=\left[\begin{array}{c} \frac{\partial J}{\partial x} \\ \frac{\partial J}{\partial y} \end{array}\right]=\left[\begin{array}{c} 4 \sinh (4 x+y) \\ \sinh (4 x+y) \end{array}\right] $$
def J(x):
return np.cosh(4 * x[0] + x[1])
def GradJ(x):
return np.array([4 * np.sinh(4 * x[0] + x[1]), np.sinh(4 * x[0] + x[1])])
def projG(x):
if x[0] * x[1] < 1:
return closest_distance(x[0], x[1])
else:
return np.array([x[0], x[1]])
def projection_gradient_algorithm(f, df, x_init, step=1e-03, tol=1e-06, max_iter=2000):
x = x_init.copy()
xtab = []
ftab = []
xtab.append(projG(x))
pval = f(x)
ftab.append(pval)
it = 0
g = df(x)
while (it == 0) or (
step > tol and it < max_iter and np.linalg.norm(xtab[-1] - xtab[-2]) > tol
):
x = projG(x - step * df(x))
xtab.append(x)
fval = f(x)
ftab.append(fval)
it = it + 1
if it == max_iter:
conv = False
else:
conv = True
return xtab, ftab, conv
x0 = np.array([1.0, 0.5])
xtab, ftab, conv = projection_gradient_algorithm(J, GradJ, x0, max_iter=1000)
print('Has the algorithm converged ? : ',conv)
plt.figure()
plt.plot(ftab)
plt.xlabel('iteration: $it$')
plt.ylabel('$J(it)$')
plt.show()
Has the algorithm converged ? : True
plt.figure(figsize=(8, 6))
aX0=np.linspace(xmin,xmax,100)
aX1=np.linspace(ymin,ymax,100)
Z=np.array([[J(np.array([x0,x1])) for x0 in aX0] for x1 in aX1])
ZG=np.array([[constraint(np.array([x0,x1])) for x0 in aX0] for x1 in aX1])
plt.contour(aX0,aX1,ZG,levels=0,colors='b',linewidths=2)
plt.contour(aX0,aX1,Z,25)
lx0=[X[0] for X in xtab]
lx1=[X[1] for X in xtab]
plt.plot(x0[0],x0[1],'-xr')
plt.plot(lx0,lx1,"-ro")
plt.title('Number of iterations. = '+str(np.shape(lx0)[0]))
plt.axis('scaled')
plt.colorbar()
plt.show()
print("The final position is : ", xtab[-1])
print("The value of the function at this point is : ", ftab[-1])
The final position is :  [0.50000921 1.99996316]
The value of the function at this point is :  27.30823285453461
Question 13
Show that the minimizer $\left(x_0, y_0\right)$ also minimizes the function $J_2(x, y)=4 x+y$ on $K_1$ and on $K_2$. Deduce that $$ \min _{x \in K_2} J(x) $$ is equivalent to a linear programming problem and solve it using a linear programming software (like scipy. optimize.linprog, see the examples on Moodle).
As shown in Question 11, the contour lines of $J$ are the lines $4x+y=m$ and $\cosh$ is increasing on $[0, \infty)$; since $4x+y \geq 0$ on $K_1$ and $K_2$, minimizing $J(x,y)=\cosh(4x+y)$ over either set is equivalent to minimizing $J_2(x,y)=4x+y$ over the same set, so the minimizer $(x_0,y_0)$ of $J$ also minimizes $J_2$. For the constraint set $K_{1}$ the constraint $xy \geq 1$ is not linear, so the problem is not a linear program (below we simply solve it with a general non-linear solver). For the constraint set $K_{2}$ all constraints are linear and the objective $J_2$ is linear, so $\min_{x \in K_2} J(x)$ is equivalent to a linear programming problem.
def f_1(x):
return 4 * x[0] + x[1]
def constraint1(x):
return x[0] * x[1] - 1
result = minimize(f_1, np.array([4, 3]), constraints={'fun': constraint1, 'type': 'ineq'})
print("Optimal Point:", result.x, "\tValue:", result.fun)
print('The value of function is ', np.cosh(result.fun))
Optimal Point: [0.49977422 2.00090346] 	Value: 4.0000003459285
The value of function is  27.308242276378245
Then we use linear programming for the constraint set $K_{2}$. The constraints $$ \begin{cases} y \leq x + 1\\ y \geq 2 - x \end{cases} \Rightarrow \begin{cases} -x + y \leq 1\\ -x -y \leq -2 \end{cases} $$ give the matrix form $$ \begin{bmatrix} -1 & 1\\ -1 & -1 \end{bmatrix} \begin{bmatrix} x\\ y \end{bmatrix} \leq \begin{bmatrix} 1\\ -2 \end{bmatrix}. $$
c = [4, 1] # here is 4x + y
A = [[-1, 1], [-1, -1]]
b = [1, -2]
res = linprog(c, A_ub=A, b_ub=b, bounds=(0, None))
print("Optimal Point:", res.x, "\tValue:", res.fun)
print('The value of function is ', np.cosh(res.fun))
print('-' * 50)
print(res)
Optimal Point: [0.5 1.5] 	Value: 3.5
The value of function is  16.572824671057315
--------------------------------------------------
        message: Optimization terminated successfully. (HiGHS Status 7: Optimal)
        success: True
         status: 0
            fun: 3.5
              x: [ 5.000e-01  1.500e+00]
            nit: 2
          lower:  residual: [ 5.000e-01  1.500e+00]
                 marginals: [ 0.000e+00  0.000e+00]
          upper:  residual: [       inf        inf]
                 marginals: [ 0.000e+00  0.000e+00]
          eqlin:  residual: []
                 marginals: []
        ineqlin:  residual: [ 0.000e+00  0.000e+00]
                 marginals: [-1.500e+00 -2.500e+00]
 mip_node_count: 0
 mip_dual_bound: 0.0
        mip_gap: 0.0
Question 14
Are there points for which $\nabla J(x, y)=0$. If no such points exist then what can we conclude regarding the minimum of $J$ on $K_1$ ? Give an exact formula for the minimum of $J$ on $K_1$ based on the previous facts.
# plot the graph of sinh(x)
x = np.linspace(-2, 2, 100)
y = np.sinh(x)
plt.figure(figsize=(8, 6))
plt.plot(x, y, color='red')
plt.xlabel('x')
plt.ylabel('y')
plt.title('The graph of sinh(x)')
plt.show()
We have $$ \nabla J(x, y)=\left[\begin{array}{c} \frac{\partial J}{\partial x} \\ \frac{\partial J}{\partial y} \end{array}\right]=\left[\begin{array}{c} 4 \sinh (4 x+y) \\ \sinh (4 x+y) \end{array}\right]. $$ Therefore $\nabla J(x,y)=0$ requires $\sinh(4x+y)=0$, i.e. $4x+y=0$, i.e. $y=-4x$. Since $(x,y)\in [0,+\infty)^{2}$, the only such point is $(0,0)$, and $(0,0) \notin K_1$ because $0 \cdot 0 < 1$. Hence $\nabla J$ never vanishes on $K_1$, so the minimum of $J$ on $K_1$ cannot be attained at an interior critical point and must lie on the boundary $\{xy=1\}$. By the computation in Question 11 the minimizer is $(\frac{1}{2},2)$, so the exact minimum of $J$ on $K_1$ is $$ \min_{K_1} J = J\left(\tfrac{1}{2},2\right)=\cosh(4). $$
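As a closing check (using the value printed by the projected gradient run above), the exact minimum $\cosh(4)$ agrees with the numerical result up to about $10^{-8}$:
import numpy as np

pg_value = 27.30823285453461            # J at the final iterate of the projected gradient run
print('cosh(4)            =', np.cosh(4.0))
print('projected gradient =', pg_value)
print('difference         =', abs(np.cosh(4.0) - pg_value))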