Exercise 02 - Gradient descent methods¶
We re-use the quadratic function from the last exercise, $f: \mathbb{R}^2 \rightarrow \mathbb{R}$, defined as
$$ f(\mathbf{x}) = (\mathbf{x} - \tilde{\mathbf{x}}) \cdot \mathbf{Q} \cdot (\mathbf{x} - \tilde{\mathbf{x}}) $$ with $$ \mathbf{Q} = \begin{pmatrix} 2 & 1 \\ 1 & 1 \end{pmatrix} \quad \text{and} \quad \tilde{\mathbf{x}} = \begin{pmatrix} -1\\ 1 \end{pmatrix} $$ to test the implemented gradient descent methods. The solution to the problem $$ \min_{\mathbf{x}} f(\mathbf{x}) $$ is $\mathbf{x}^*=\tilde{\mathbf{x}}$.
import numpy as np
import torch
from utils import plot_contours
torch.set_default_dtype(torch.double)
# Define domain
x0 = torch.linspace(-5, 5, steps=100)
x1 = torch.linspace(-5, 5, steps=100)
x = torch.stack(torch.meshgrid(x0, x1, indexing="xy"), dim=2)
# Define constants
xt = torch.tensor([-1.0, 1.0])
Q = torch.tensor([[2.0, 1.0], [1, 1.0]])
# Define function
def f(x):
dx = x - xt
return torch.einsum("...i,ij,...j", dx, Q, dx)
# Plot function as contour lines
plot_contours(x, f(x), opti=[-1, 1])
Task 1 - Simple steepest descent¶
We have a predefined function named simple_decent(x_init, func, eta=0.1, max_iter=100) that takes an initial point $\mathbf{x}_0 \in \mathbb{R}^d$ named x_init, a function func, a step size eta, and an iteration limit max_iter.
a) Implement simple steepest descent in that function. The function should return a list of all steps $\mathbf{x}_k \in \mathbb{R}^d$ taken during the optimization, i.e. [[x1_0, x2_0, ..., xd_0], [x1_1, x2_1, ..., xd_1], ...]
def simple_decent(x_init, func, eta=0.1, max_iter=100):
# Copy initial x to new differentiable tensor x
x = x_init.clone().requires_grad_()
points = []
# --> Implement your solution here
return points
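If you want to compare against a working baseline, the following hypothetical sketch (the function name and details are illustrative, not the official solution) shows one way to write such a loop using torch.autograd.grad and a fixed step size:
def simple_descent_sketch(x_init, func, eta=0.1, max_iter=100):
    # Hypothetical sketch: fixed-step steepest descent.
    x = x_init.clone().requires_grad_()
    points = [x.detach().tolist()]
    for _ in range(max_iter):
        grad = torch.autograd.grad(func(x), x)[0]  # gradient of func at x
        with torch.no_grad():
            x -= eta * grad  # move against the gradient with a fixed step size
        points.append(x.detach().tolist())
    return points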
b) Test the function with the following code for $$ \mathbf{x}_0 = \begin{pmatrix} 4\\ -1 \end{pmatrix} $$ and play around with the optional parameters.
x_init = torch.tensor([4.0, -1.0])
path = simple_decent(x_init, f)
plot_contours(x, f(x), opti=[-1, 1], paths={"Simple steepest decent": path})
print(f"Final values are x_1={path[-1][0]:.3f}, x_2={path[-1][1]:.3f}")
Task 2 - Steepest descent method with incomplete line search¶
We have a predefined function named incomplete_line_search(x_init, func, eta_0=5.0, c=0.5, rho=0.8, max_iter=10) that takes an initial point $\mathbf{x}_0 \in \mathbb{R}^d$ named x_init, a function func, an initial step size eta_0, an Armijo constant c, a backtracking reduction factor rho, and an iteration limit max_iter.
a) Implement steepest descent with an incomplete line search based on the backtracking algorithm in that function. The function should return a list of all steps $\mathbf{x}_k \in \mathbb{R}^d$ taken during the optimization, i.e. [[x1_0, x2_0, ..., xd_0], [x1_1, x2_1, ..., xd_1], ...]
def incomplete_line_search(x_init, func, eta_0=5.0, c=0.5, rho=0.8, max_iter=10):
# Copy initial x to new differentiable tensor x
x = x_init.clone().requires_grad_()
points = []
# --> Implement your solution here
return points
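The step-size subproblem itself can be isolated in a small helper. The following hypothetical sketch (names are illustrative, not part of the template) shrinks the step until the Armijo condition $f(\mathbf{x} + \eta \mathbf{d}) \leq f(\mathbf{x}) + c\, \eta\, \nabla f(\mathbf{x})^\top \mathbf{d}$ holds along the steepest-descent direction $\mathbf{d} = -\nabla f(\mathbf{x})$:
def backtracking_step(func, x, grad, eta_0=5.0, c=0.5, rho=0.8):
    # Hypothetical helper: backtracking search for an Armijo-acceptable step size.
    d = -grad  # steepest-descent direction
    eta = eta_0
    fx = func(x).item()
    slope = torch.dot(grad, d).item()  # directional derivative, here -||grad||^2
    while func(x + eta * d).item() > fx + c * eta * slope:
        eta *= rho  # reduce the step size until the Armijo condition holds
    return eta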
b) Test the function with the following code for $$ \mathbf{x}_0 = \begin{pmatrix} 4\\ -1 \end{pmatrix} $$ and play around with the optional arguments.
x_init = torch.tensor([4.0, -1.0])
path = incomplete_line_search(x_init, f)
plot_contours(x, f(x), opti=[-1, 1], paths={"Incomplete line search": path})
print(f"Final values are x_1={path[-1][0]:.3f}, x_2={path[-1][1]:.3f}")
Task 3 - Steepest descent method with complete line search¶
We have a predefined function named complete_line_search(x_init, func, max_iter=10) that takes an initial point $\mathbf{x}_0 \in \mathbb{R}^d$ named x_init, a function func, and an iteration limit max_iter.
a) Implement steepest descent with a complete line search, re-using the previous incomplete_line_search to solve the subproblem of finding the optimal step size $\eta^*_k$. The function should return a list of all steps $\mathbf{x}_k \in \mathbb{R}^d$ taken during the optimization, i.e. [[x1_0, x2_0, ..., xd_0], [x1_1, x2_1, ..., xd_1], ...]
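For this quadratic test problem, the exact minimizer along the steepest-descent direction $\mathbf{d}_k = -\nabla f(\mathbf{x}_k)$ is available in closed form and can serve as a sanity check for your line search (the factor 2 appears because $f$ is defined without a prefactor of $\tfrac{1}{2}$): $$ \eta^*_k = \frac{\nabla f(\mathbf{x}_k)^\top \nabla f(\mathbf{x}_k)}{2\, \nabla f(\mathbf{x}_k)^\top \mathbf{Q}\, \nabla f(\mathbf{x}_k)} $$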
def complete_line_search(x_init, func, max_iter=10):
# Copy initial x to new differentiable tensor x
x = x_init.clone().requires_grad_()
points = []
# --> Implement your solution here
return points
b) Test the function with the following code for $$ \mathbf{x}_0 = \begin{pmatrix} 4\\ -1 \end{pmatrix} $$ and discuss why an incomplete line search is usually chosen over a complete line search.
x_init = torch.tensor([4.0, -1.0])
path = complete_line_search(x_init, f)
plot_contours(x, f(x), opti=[-1, 1], paths={"Complete line search": path})
print(f"Final values are x_1={path[-1][0]:.3f}, x_2={path[-1][1]:.3f}")
Task 4 - Conjugate gradients¶
We have a predefined function named cg(x_init, func, max_iter=5) that takes an initial point $\mathbf{x}_0 \in \mathbb{R}^d$ named x_init, a function func, and an iteration limit max_iter.
a) Implement the conjugate gradient method in that function, re-using the previous incomplete_line_search to solve the subproblem of finding the optimal step size $\eta^*_k$. The function should return a list of all steps $\mathbf{x}_k \in \mathbb{R}^d$ taken during the optimization, i.e. [[x1_0, x2_0, ..., xd_0], [x1_1, x2_1, ..., xd_1], ...]
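As a reminder, one common variant of the nonlinear conjugate gradient method (Fletcher-Reeves) uses the updates $$ \mathbf{d}_0 = -\nabla f(\mathbf{x}_0), \qquad \mathbf{x}_{k+1} = \mathbf{x}_k + \eta_k \mathbf{d}_k, \qquad \beta_k = \frac{\lVert \nabla f(\mathbf{x}_{k+1}) \rVert^2}{\lVert \nabla f(\mathbf{x}_k) \rVert^2}, \qquad \mathbf{d}_{k+1} = -\nabla f(\mathbf{x}_{k+1}) + \beta_k \mathbf{d}_k, $$ where $\eta_k$ comes from the line search.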
def cg(x_init, func, max_iter=5):
# Copy initial x to new differentiable tensor x
x = x_init.clone().requires_grad_()
points = []
# --> Implement your solution here
return points
b) Test the function with the following code for $$ \mathbf{x}_0 = \begin{pmatrix} 4\\ -1 \end{pmatrix} $$ and discuss its benefits and drawbacks.
x_init = torch.tensor([4.0, -1.0])
path = cg(x_init, f)
plot_contours(x, f(x), opti=[-1, 1], paths={"Conjugated gradients": path})
print(f"Final values are x_1={path[-1][0]:.3f}, x_2={path[-1][1]:.3f}")
Task 5 - BFGS¶
We have a predefined function named bfgs(x_init, func, max_iter=5) that takes an initial point $\mathbf{x}_0 \in \mathbb{R}^d$ named x_init, a function func, and an iteration limit max_iter.
a) Implement the BFGS method in that function, re-using the previous incomplete_line_search to solve the subproblem of finding the optimal step size $\eta^*_k$. The function should return a list of all steps $\mathbf{x}_k \in \mathbb{R}^d$ taken during the optimization, i.e. [[x1_0, x2_0, ..., xd_0], [x1_1, x2_1, ..., xd_1], ...]
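As a reminder, one common form of the BFGS method maintains an approximation $\mathbf{H}_k$ of the inverse Hessian (starting e.g. from $\mathbf{H}_0 = \mathbf{I}$), takes steps along $\mathbf{d}_k = -\mathbf{H}_k \nabla f(\mathbf{x}_k)$, and updates with $\mathbf{s}_k = \mathbf{x}_{k+1} - \mathbf{x}_k$, $\mathbf{y}_k = \nabla f(\mathbf{x}_{k+1}) - \nabla f(\mathbf{x}_k)$, and $\rho_k = 1 / (\mathbf{y}_k^\top \mathbf{s}_k)$: $$ \mathbf{H}_{k+1} = (\mathbf{I} - \rho_k \mathbf{s}_k \mathbf{y}_k^\top)\, \mathbf{H}_k\, (\mathbf{I} - \rho_k \mathbf{y}_k \mathbf{s}_k^\top) + \rho_k \mathbf{s}_k \mathbf{s}_k^\top $$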
def bfgs(x_init, func, max_iter=5):
# Copy initial x to new differentiable tensor x
x = x_init.clone().requires_grad_()
points = []
# --> Implement your solution here
return points
b) Test the function with the following code for $$ \mathbf{x}_0 = \begin{pmatrix} 4\\ -1 \end{pmatrix} $$ and discuss its benefits and drawbacks.
x_init = torch.tensor([4.0, -1.0])
path = bfgs(x_init, f)
plot_contours(x, f(x), opti=[-1, 1], paths={"BFGS": path})
print(f"Final values are x_1={path[-1][0]:.3f}, x_2={path[-1][1]:.3f}")
Task 6 - Comparison¶
The following code plots all optimization paths on the given quadratic problem.
x_init = torch.tensor([4.0, -1.0])
path_simple = simple_decent(x_init, f)
path_ils = incomplete_line_search(x_init, f)
path_cls = complete_line_search(x_init, f)
path_cg = cg(x_init, f)
path_bfgs = bfgs(x_init, f)
plot_contours(
x,
f(x),
opti=[-1, 1],
paths={
"Simple": path_simple,
"ILS": path_ils,
"CLS": path_cls,
"CG": path_cg,
"BFGS": path_bfgs,
},
)
The quadratic problem is a rather easy optimization problem. Compare the algorithms on harder optimization test functions (himmelblau_function and rosenbrock_function) and for different start points.
def himmelblau_function(x):
return (x[..., 0] ** 2 + x[..., 1] - 11) ** 2 + (
x[..., 0] + x[..., 1] ** 2 - 7
) ** 2
# --> Implement your solution here
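As a starting point, a hypothetical comparison on the Himmelblau function could look as follows (start point, marked optimum, and parameters are illustrative; $(3, 2)$ is one of the four minima, and the fixed step size of the simple method is reduced here because the gradients are much steeper than on the quadratic, so the methods may also end up in a different minimum):
x_init = torch.tensor([4.0, 4.0])
plot_contours(
    x,
    himmelblau_function(x),
    opti=[3, 2],
    paths={
        "Simple": simple_decent(x_init, himmelblau_function, eta=0.01),
        "BFGS": bfgs(x_init, himmelblau_function),
    },
)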
# Define a smaller domain for the Rosenbrock function
x0 = torch.linspace(-1.5, 1.5, steps=100)
x1 = torch.linspace(-1.5, 1.5, steps=100)
x = torch.stack(torch.meshgrid(x0, x1, indexing="xy"), dim=2)
def rosenbrock_function(x):
return 100 * (x[..., 1] - x[..., 0] ** 2) ** 2 + (1 - x[..., 0]) ** 2
# --> Implement your solution here
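Analogously, a hypothetical comparison on the Rosenbrock function (minimum at $(1, 1)$) could look as follows; the start point and iteration limits are illustrative, and the narrow curved valley typically requires noticeably more iterations than the quadratic problem:
x_init = torch.tensor([-1.0, -1.0])
plot_contours(
    x,
    rosenbrock_function(x),
    opti=[1, 1],
    paths={
        "ILS": incomplete_line_search(x_init, rosenbrock_function, max_iter=50),
        "BFGS": bfgs(x_init, rosenbrock_function, max_iter=50),
    },
)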