humancompatible
diff --git a/‎benchmark/demo_balls.py‎
Lines changed: 265 additions & 0 deletions b/‎benchmark/demo_balls.py‎
Lines changed: 265 additions & 0 deletions
@@ -0,0 +1,265 @@
+from matplotlib.patches import Circle
+import torch
+from humancompatible.train.optim.PBM import PBM
+import numpy as np
+import matplotlib.pyplot as plt
+from mpl_toolkits.axes_grid1 import make_axes_locatable
+
+torch.manual_seed(1)
+np.random.seed(1)
+
+def plot_balls_trajectory(trajectories, names):
+    """
+    trajectory: array-like of shape (N, 2), where each row is [x, y]
+    """
+
+    fig, ax = plt.subplots(figsize=(24, 16))
+
+    # Feasible regions: unit balls
+    ball_centers = [(-2, 0), (2, 0)]
+    radius = np.sqrt(0.99)
+    labels = [r"$\mathbb{E}[g_1(x,y,\xi)] \leq 0 $", r"$\mathbb{E}[g_2(x,y,\xi)] \leq 0$"]
+
+    # Heatmap for x^2 + y^2
+    x = np.linspace(-4, 4, 100)
+    y = np.linspace(-2.5, 2.5, 100)
+    X, Y = np.meshgrid(x, y)
+    Z = X**2 + Y**2
+
+
+    for center, label in zip(ball_centers, labels):
+        ball = Circle(
+            center,
+            radius=radius,
+            facecolor="lightgray",
+            edgecolor="black",
+            linewidth=1.5,
+            alpha=0.6,
+            zorder=1,
+        )
+        ax.add_patch(ball)
+        # Label inside the ball
+        ax.text(
+            center[0], center[1],
+            label,
+            fontsize=18,
+            fontweight='bold',
+            color='black',
+            ha='center',
+            va='center',
+            zorder=5
+        )
+
+    for i, traj in enumerate(trajectories):
+        traj = np.asarray(traj)
+
+        # Trajectory
+        ax.plot(
+            traj[:, 0],
+            traj[:, 1],
+            linewidth=2.0,
+            zorder=3,
+            alpha=1.0
+        )
+
+        # Emphasize x_0 and x_n
+        x0 = traj[0]
+        xn = traj[-1]
+
+        ax.scatter(
+            x0[0], x0[1],
+            s=80,
+            marker="o",
+            facecolor="white",
+            edgecolor="black",
+            linewidth=2,
+            zorder=4,
+        )
+        ax.scatter(
+            xn[0], xn[1],
+            s=60,
+            marker="s",
+            facecolor="black",
+            edgecolor="black",
+            zorder=4,
+        )
+        x_n = [
+            r"$x_{\rho=0}^n$",
+            r"$x_{\rho=1}^n$",
+            r"$x_{\rho=2.5}^n$",
+            r"$x_{SPBM}^n$",
+        ]
+        # Labels for x_0 and x_n
+        ax.annotate(
+            r"$x^0$",
+            xy=(x0[0], x0[1]),
+            xytext=(6, 8),
+            textcoords="offset points",
+            fontsize=22,
+            zorder=5,
+        )
+        ax.annotate(
+            x_n[i],
+            xy=(xn[0], xn[1]),
+            # xytext=(8 if i==1 or i == 3 else -36, -12),
+            xytext=(8 if i==1 or i == 3 else -45, -15),
+            textcoords="offset points",
+            fontsize=22,
+            zorder=5,
+        )
+
+    # Formatting
+    ax.set_aspect("equal", adjustable="box")
+    ax.set_xlabel(r"$x$", fontsize=12)
+    ax.set_ylabel(r"$y$", fontsize=12)
+    ax.grid(True, linestyle=":", linewidth=0.8, alpha=0.7)
+    ax.set_xlim(-3.2, 3.2)
+    ax.set_ylim(-1.8, 1.8)
+
+
+    contour = ax.contourf(X, Y, Z, levels=100, cmap='viridis', alpha=0.5, zorder=0)
+    divider = make_axes_locatable(ax)
+    cax = divider.append_axes("right", size="3%", pad=0.08)
+
+    cbar = fig.colorbar(contour, cax=cax)
+    cbar.set_label(r"$x^2 + y^2$", fontsize=14)
+
+    fig.savefig(
+        "./demo_balls_pbm.pdf",
+        bbox_inches="tight",
+        pad_inches=0.05
+    )
+
+
+
+def balls(x, sample):
+    g1 = ((x[0] - 2 + sample)**2 + x[1]**2 - 1)
+    g2 = ((x[0] + 2 + sample)**2 + x[1]**2 - 1)
+    # g1 = ((x[0] - 2)**2 + x[1]**2 - 1) + sample
+    # g2 = ((x[0] + 2)**2 + x[1]**2 - 1) + sample
+    if g1 <= g2:
+        return g1
+    else:
+        return g2
+
+def parabola(x):
+    return x[0]**2 + x[1]**2
+
+
+samples = [
+    # torch.tensor([0]),
+    # torch.tensor([0])
+    torch.tensor([-0.1]),
+    torch.tensor([0.1])
+]
+
+
+################## SGD ######################### 
+
+def run_sgd(rho: float):
+
+    xy = torch.nn.Parameter(data=torch.ones(2, requires_grad=True))
+    with torch.no_grad():
+        xy[0] = 0
+        xy[1] = 1
+
+    sgd = torch.optim.SGD([xy], lr=0.05, dampening=0.1)
+
+    scheduler = torch.optim.lr_scheduler.LambdaLR(
+        sgd,
+        lr_lambda=lambda step: 0.99 ** step
+    )
+
+    param_log_sgd = []
+    con_log_sgd = []
+
+    for i in range(200):
+        param_log_sgd.append(
+            xy.detach().numpy().copy()
+        )
+
+        r = np.random.uniform()
+        minibatch = samples[0 if r > 0.5 else 1]
+            
+        c = balls(xy, minibatch)
+
+        obj = parabola(xy) + rho * torch.square(torch.norm(c, p=2))
+
+        obj.backward()
+        sgd.step()
+        scheduler.step()
+        sgd.zero_grad()
+        for gr in sgd.param_groups:
+            gr['lr'] *= 0.97
+
+        con_log_sgd.append(c.detach().numpy().copy().item())
+    
+    return param_log_sgd, con_log_sgd
+
+
+sgd_param_logs, sgd_con_logs = [], []
+
+rhos = [0.1,1,2]
+
+for rho in rhos:
+    param_log_sgd, con_log_sgd = run_sgd(rho)
+    sgd_param_logs.append(param_log_sgd)
+    sgd_con_logs.append(con_log_sgd)
+
+
+################## PBM ######################### 
+
+xy = torch.nn.Parameter(data=torch.ones(2, requires_grad=True))
+with torch.no_grad():
+    xy[0] = 0
+    xy[1] = 1
+
+pbm = PBM([xy], m=1, lr=0.01, dual_bounds=(1e-3, 1e3), penalty_update_m='CONST', epoch_len=2, mu=0, opt_method="Adam")
+
+iters = 200
+
+param_log = []
+con_log = []
+dual_log = []
+c_grad_log = []
+
+for i in range(iters):
+    param_log.append(
+        xy.detach().numpy().copy()
+    )
+    # print(xy)
+    
+    r = np.random.uniform()
+    minibatch = samples[
+        0 if r > 0.5 else 1
+        ]
+    
+    c = balls(xy, minibatch)
+    
+    pbm.dual_step(0, c)
+    dual_log.append(pbm._dual_vars.detach().numpy().copy().item())
+
+    obj = parabola(xy)
+
+    pbm.step(obj)
+    for gr in pbm.param_groups:
+        gr['lr'] *= 0.99
+
+    con_log.append(c.detach().numpy().copy().item())
+
+
+# print(param_log)
+# print(con_log)
+
+trajectories = sgd_param_logs
+trajectories.append(param_log)
+
+plot_balls_trajectory(
+    trajectories,
+    [r"$\rho= $" + str(rho) for rho in rhos] + ['spbm']
+)
+
+# print(param_log)
+# print(np.array(dual_log))
+# print(np.array(con_log))
+# print(np.array(con_log))