import numpy as np
import matplotlib.pyplot as plt

# Illustration: a raw point r and the nearest point on the line z1 + z2 = 2.
r = np.array([3.4, 0.2])
# Feasible point (z1 + z2 = 2) that lies closest to r
z_star = np.array([2.6, -0.6])

# Sample the feasible line so it can be drawn as a curve
x = np.linspace(-0.5, 4.0, 200)
y = 2 - x

plt.plot(x, y, label=r"feasible set: $z_1 + z_2 = 2$")
plt.scatter(r[0], r[1], marker="x", s=50, linewidths=3, label=r"raw point $r$")
plt.scatter(z_star[0], z_star[1], s=50, label=r"closest feasible point $z^\star$")

# Arrow from r to z_star; the head counts towards the arrow length, so the
# tip lands exactly on z_star.
plt.arrow(
    *r,
    *(z_star - r),
    length_includes_head=True,
    head_width=0.04,
    alpha=0.5
)

# Coordinate captions, nudged away from the markers by hand
plt.text(3.60, 0.25, r"$r=(3.4,0.2)$")
plt.text(2.80, -0.55, r"$z^\star=(2.6,-0.6)$")

plt.xlabel(r"$z_1$")
plt.ylabel(r"$z_2$")
plt.grid(True, alpha=0.3)
plt.axis("equal")
plt.legend();

import numpy as np

# Seed NumPy's global generator so the dataset is identical on every run
np.random.seed(42)

n, c_true = 40, 2.0

# Noise-free points lying exactly on the *hidden* line z1 + z2 = c_true
z1 = np.linspace(-0.2, 2.2, num=n)
z2 = c_true - z1
y_clean = np.column_stack((z1, z2))

# Targets: the clean points plus Gaussian noise of scale 0.15.
# This draw has to stay ahead of the one below so the random stream is
# consumed in the same order.
y = 0.15 * np.random.randn(n, 2) + y_clean

# Raw points: the targets shifted by a constant offset (0.65, -0.25) and
# perturbed by additional Gaussian noise of scale 0.5
r = (y + np.array([0.65, -0.25])) + 0.5 * np.random.randn(n, 2)

# Draw the constraint line together with both point clouds
x = np.linspace(-0.6, 3.2, 200)
line = c_true - x

plt.plot(x, line, label=r"true constraint: $z_1 + z_2 = 2$")
# Each cloud is an (n, 2) array; transposing splits it into its two columns
plt.scatter(*y.T, s=45, label="target data")
plt.scatter(*r.T, marker="x", s=55, label="noisy data points")

plt.title("Synthetic dataset")
plt.xlabel(r"$z_1$")
plt.ylabel(r"$z_2$")
plt.grid(True, alpha=0.3)
plt.axis("equal")
plt.legend();

# Problem data: raw point r and right-hand side c of the constraint z1 + z2 = c
c = 2.0
r = np.array([3.4, 0.2])

# Rectangular grid of candidate points z = (z1, z2)
z1 = np.linspace(-0.5, 4.2, num=300)
z2 = np.linspace(-1.0, 3.2, num=300)
Z1, Z2 = np.meshgrid(z1, z2)

# Signed constraint violation and squared distance to r at every grid point
violation = Z1 + Z2 - c
distance = np.square(Z1 - r[0]) + np.square(Z2 - r[1])

# Exact constrained solution; used only as a visual reference
z_exact = np.array([2.6, -0.6])

# A few rho values for the geometry plot ...
rhos_for_plot = np.array([0, 0.05, 0.15, 0.5, 1.5, 5, 20])

# ... and a dense logarithmic sweep (1e-3 to 1e2) for the curve plot
rhos_for_curve = np.logspace(-3, 2, num=100)


def solve_by_grid_search(rho):
    """Minimise the penalised objective over the precomputed grid.

    The objective ``distance + rho * violation**2`` is evaluated at every
    grid point and the point with the smallest value is selected.

    Reads the module-level arrays ``Z1``, ``Z2``, ``distance`` and
    ``violation``.

    Parameters
    ----------
    rho : penalty strength multiplying the squared constraint violation.

    Returns
    -------
    tuple ``(z, d, v, p)``
        ``z`` is the selected grid point as a length-2 array, ``d`` the
        value of ``distance`` there, ``v`` the signed value of
        ``violation`` there, and ``p = rho * v**2`` the penalty term.
    """
    penalised = distance + rho * violation**2

    # argmin works on the flattened array; convert back to a (row, col) index
    best = np.unravel_index(np.argmin(penalised), penalised.shape)

    d = distance[best]
    v = violation[best]
    z = np.array([Z1[best], Z2[best]])

    return z, d, v, rho * v**2


# Grid minimisers for the handful of rho values shown in the geometry plot
solutions = np.array([
    z for z, *_ in map(solve_by_grid_search, rhos_for_plot)
])

# (distance, signed violation, penalty) for every rho in the dense sweep
curve_data = np.array([
    (d, v, p) for _, d, v, p in map(solve_by_grid_search, rhos_for_curve)
])

# Split the columns; the violation is kept as a magnitude
distance_terms, penalty_terms = curve_data[:, 0], curve_data[:, 2]
violations = np.abs(curve_data[:, 1])


# Level curves of the original (squared-distance) objective
contours = plt.contour(Z1, Z2, distance, levels=20, linewidths=0.9)
plt.clabel(contours, inline=True, fontsize=8)

# The feasible set: the line z1 + z2 = c
line_x = np.linspace(-0.5, 4.2, 300)
plt.plot(line_x, c - line_x, linewidth=3, alpha=0.6, label=r"constraint: $z_1+z_2=2$")

# Raw point and the exact constrained solution
plt.scatter(*r, s=130, marker="x", linewidths=3, label=r"raw point $r$")
plt.scatter(*z_exact, s=120, marker="*", label=r"exact constrained solution")

# Penalty solutions: a dashed path through them plus one marker per rho
plt.plot(*solutions.T, "--", linewidth=1.5, label=r"grid-search penalty solutions")
plt.scatter(*solutions.T, s=30)

# Tag every penalty solution with the rho that produced it
for rho, (z_x, z_y) in zip(rhos_for_plot, solutions):
    plt.text(z_x + 0.20, z_y + 0.04, fr"$\rho={rho:g}$", fontsize=8)

plt.grid(True, alpha=0.3)
plt.axis("equal")
plt.xlabel(r"$z_1$")
plt.ylabel(r"$z_2$")
plt.legend(loc="lower left");

# Diagnostics of the grid-search solution as functions of rho, drawn on
# log-log axes. One entry per curve: (values, line width, legend label).
penalty_curves = [
    (violations, 2.5, r"$|z_1+z_2-c|$"),
    (distance_terms, 2.2, r"distance term"),
    (penalty_terms, 2.2, r"penalty term"),
]

for series, line_width, legend_label in penalty_curves:
    plt.loglog(
        rhos_for_curve,
        series,
        linewidth=line_width,
        label=legend_label
    )

# Add final-value labels: each curve's value at the largest rho, printed
# just to the right of the curve's end point.
# The loop variable is intentionally not called `y`, because that name holds
# plot data elsewhere in this file and would be overwritten here.
for series, line_width, legend_label in penalty_curves:
    plt.annotate(
        f"{series[-1]:.2f}",
        xy=(rhos_for_curve[-1], series[-1]),
        xytext=(6, 0),
        textcoords="offset points",
        va="center",
        fontsize=10,
    )

plt.xlabel(r"penalty strength $\rho$")
plt.ylabel("value")
plt.title(r"How the penalty strength $\rho$ affects the solution")
plt.grid(True, alpha=0.3, which="both")
plt.legend();

# Original example: raw point r and the constraint z1 + z2 = c
r = np.array([3.4, 0.2])
c = 2.0

# Constraint: z1 + z2 = c
x = np.linspace(-1.0, 4.0, 200)
y = c - x

# For each multiplier value, z*(lambda) = r - (lambda / 2) * (1, 1).
# Broadcasting the column of lambdas against the direction vector yields one
# row per lambda, giving an array of shape (len(lambdas), 2).
direction = np.array([1.0, 1.0])
lambdas = np.linspace(-1.0, 3.0, 9)
solutions = r - (lambdas[:, None] / 2) * direction

# Exact lambda that makes z*(lambda) feasible:
# z1 + z2 = c
# r1 + r2 - lambda = c
# lambda = r1 + r2 - c
lambda_star = r.sum() - c
z_star = r - (lambda_star / 2) * direction

plt.plot(x, y, label=r"constraint: $z_1 + z_2 = c$")
# The label is formatted from r, like the z_star label below, so the legend
# cannot drift out of sync with the data.
plt.scatter(r[0], r[1], s=100, label=rf"$r=({r[0]:.1f},{r[1]:.1f})$")
plt.scatter(solutions[:, 0], solutions[:, 1], s=30, label=r"$z^\star(\lambda)$")
plt.plot(
    solutions[:, 0],
    solutions[:, 1],
    linestyle="--",
    label=r"path as $\lambda$ changes"
)
plt.scatter(
    z_star[0],
    z_star[1],
    s=130,
    marker="*",
    label=rf"exact projection $z^\star=({z_star[0]:.1f},{z_star[1]:.1f})$"
)

# Tag every point on the path with its multiplier value
for lam, z in zip(lambdas, solutions):
    plt.text(z[0] + 0.04, z[1] + 0.04, rf"$\lambda={lam:.1f}$", fontsize=8)

plt.axis("equal")
plt.xlabel(r"$z_1$")
plt.ylabel(r"$z_2$")
plt.title(r"Changing $\lambda$ moves the unconstrained minimizer")
plt.legend()
plt.grid(True);

A simple motivating problem

Getting rid of the constraint with penalties

From penalties to exact constraints

The Lagrangian

What the Lagrange multiplier is doing

The Karush-Kuhn-Tucker (KKT) conditions

KKT conditions: are these sufficient?

Extending to multiple equality constraints

From the special case to general quadratic programs

What about inequalities?

Summary and next steps