# Source: OpenClaw-Medical-Skills/skills/bayesian-optimizer/bayesian_optimization.py (main branch) · opencare-skillhub/OpenClaw-Medical-Skills · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
# COPYRIGHT NOTICE
# This file is part of the "Universal Biomedical Skills" project.
# Copyright (c) 2026 MD BABU MIA, PhD <md.babu.mia@mssm.edu>
# All Rights Reserved.
#
# This code is proprietary and confidential.
# Unauthorized copying of this file, via any medium is strictly prohibited.
#
# Provenance: Authenticated by MD BABU MIA

import numpy as np
from typing import List, Tuple, Callable, Optional
from dataclasses import dataclass

@dataclass
class OptimizationResult:
    """
    Plain record describing the outcome of an optimization run.

    Nothing in the visible code instantiates this class; the field notes
    below are taken from the field names and annotations only.
    """

    # Parameter vector associated with the best value (presumably the argmax).
    best_params: np.ndarray

    # Objective value associated with ``best_params``.
    best_value: float

    # Sequence of (parameters, value) pairs.
    all_history: List[Tuple[np.ndarray, float]]

class BayesianOptimizer:
    """
    A lightweight implementation of Bayesian Optimization using Gaussian Processes (GP).
    Crucial for 'Self-Driving Labs' to select the next experiment that maximizes information gain
    (Upper Confidence Bound - UCB).

    The GP uses a zero-mean prior and an RBF kernel with fixed hyperparameters
    (``sigma_f``, ``length_scale``, ``noise``); no hyperparameter fitting is performed.
    """

    def __init__(self, bounds: List[Tuple[float, float]], kappa: float = 2.5):
        """
        :param bounds: List of (min, max) for each dimension.
        :param kappa: Exploration-exploitation balance (higher = more exploration).
        :raises ValueError: If ``bounds`` is not a non-empty list of (min, max)
            pairs, or if any min exceeds its max.
        """
        bounds_arr = np.array(bounds, dtype=float)
        # Fail fast on malformed bounds instead of crashing later during sampling.
        if bounds_arr.ndim != 2 or bounds_arr.shape[1] != 2:
            raise ValueError("bounds must be a non-empty list of (min, max) pairs")
        if np.any(bounds_arr[:, 0] > bounds_arr[:, 1]):
            raise ValueError("each bound must satisfy min <= max")

        self.bounds = bounds_arr
        self.dim = bounds_arr.shape[0]
        self.kappa = kappa
        self.X_sample: List[np.ndarray] = []
        self.Y_sample: List[float] = []

        # Hyperparameters for the RBF Kernel
        self.sigma_f = 1.0
        self.length_scale = 1.0
        self.noise = 1e-5

    def _kernel(self, X1: np.ndarray, X2: np.ndarray) -> np.ndarray:
        """
        Radial Basis Function (RBF) / Squared Exponential Kernel.
        Computes covariance between points.

        :param X1: Array of shape (n1, d).
        :param X2: Array of shape (n2, d).
        :return: Covariance matrix of shape (n1, n2).
        """
        sqdist = np.sum(X1**2, 1).reshape(-1, 1) + np.sum(X2**2, 1) - 2 * np.dot(X1, X2.T)
        # The expanded form |a|^2 + |b|^2 - 2ab can round to a tiny negative
        # number for (near-)identical points; a squared distance is never negative.
        sqdist = np.maximum(sqdist, 0.0)
        return self.sigma_f**2 * np.exp(-0.5 / self.length_scale**2 * sqdist)

    def fit(self, X: List[np.ndarray], Y: List[float]):
        """
        Update the internal Gaussian Process with new data.

        The observations replace (rather than extend) any previously stored data.

        :param X: Observed inputs, one entry per observation. For a
            one-dimensional search space a flat list of scalars is also accepted.
        :param Y: Observed objective values, one per entry of ``X``.
        :raises ValueError: If ``X`` is a flat non-empty sequence for a
            multi-dimensional search space, or if ``X`` and ``Y`` differ in length.
        """
        X_arr = np.atleast_1d(np.asarray(X, dtype=float))
        Y_arr = np.asarray(Y, dtype=float).reshape(-1, 1)

        if X_arr.ndim == 1:
            if X_arr.size == 0:
                # No observations: keep a well-formed (0, dim) array.
                X_arr = X_arr.reshape(0, self.dim)
            elif self.dim == 1:
                # Scalars of a 1-D problem: promote to a column so the kernel,
                # which sums over axis 1, receives a 2-D array.
                X_arr = X_arr.reshape(-1, 1)
            else:
                raise ValueError("X must have shape (n_samples, n_dims)")

        if X_arr.shape[0] != Y_arr.shape[0]:
            raise ValueError(
                f"X and Y must have the same number of observations "
                f"(got {X_arr.shape[0]} and {Y_arr.shape[0]})"
            )

        self.X_sample = X_arr
        self.Y_sample = Y_arr

    def predict(self, X: np.ndarray) -> Tuple[np.ndarray, np.ndarray]:
        """
        Predicts mean and variance for a new set of points X using the GP.

        :param X: Query points, array of shape (n, d).
        :return: Tuple ``(mu, var)``, each of shape (n, 1). ``var`` is the
            posterior *variance* (not the standard deviation) and is clipped
            at zero.
        """
        n_query = len(X)
        if len(self.X_sample) == 0:
            # No data yet: return the prior (zero mean, kernel amplitude as variance).
            return np.zeros((n_query, 1)), np.full((n_query, 1), self.sigma_f**2)

        K = self._kernel(self.X_sample, self.X_sample) + self.noise * np.eye(len(self.X_sample))
        K_s = self._kernel(self.X_sample, X)

        # Solve K @ [alpha | V] = [Y | K_s] in one call instead of forming an
        # explicit inverse, which is slower and numerically less stable.
        solved = np.linalg.solve(K, np.hstack([self.Y_sample, K_s]))
        alpha = solved[:, :1]
        K_inv_K_s = solved[:, 1:]

        # Mean prediction
        mu = K_s.T.dot(alpha)

        # Variance prediction: only the diagonal of the posterior covariance is
        # needed, so compute it directly rather than building the (n, n) matrix.
        # The prior diagonal is sigma_f^2 plus the same 1e-8 jitter used before.
        prior_var = self.sigma_f**2 + 1e-8
        var = prior_var - np.sum(K_s * K_inv_K_s, axis=0)
        # Rounding can leave tiny negative values near observed points.
        var = np.maximum(var, 0.0)
        return mu, var.reshape(-1, 1)

    def acquisition_function(self, X: np.ndarray) -> np.ndarray:
        """
        Upper Confidence Bound (UCB).
        Selects points with high mean (exploitation) or high variance (exploration).

        :param X: Candidate points, array of shape (n, d).
        :return: UCB score per candidate, array of shape (n, 1).
        """
        mu, var = self.predict(X)
        # Guard the square root: a negative variance would produce NaN scores,
        # and np.argmax would then pick the NaN candidate.
        return mu + self.kappa * np.sqrt(np.maximum(var, 0.0))

    def propose_next_location(
        self,
        num_candidates: int = 100,
        rng: Optional["np.random.Generator"] = None,
    ) -> np.ndarray:
        """
        Randomly samples the search space and returns the point with the highest Acquisition Score.
        In production, use L-BFGS-B to maximize the acquisition function properly.

        :param num_candidates: Number of uniformly sampled candidate points (>= 1).
        :param rng: Optional NumPy random generator for reproducible proposals.
            When omitted, the global ``np.random`` state is used.
        :return: The best candidate, array of shape (dim,).
        :raises ValueError: If ``num_candidates`` is less than 1.
        """
        if num_candidates < 1:
            raise ValueError("num_candidates must be at least 1")

        sampler = np.random if rng is None else rng
        # Uniform random sampling within bounds
        candidates = sampler.uniform(
            self.bounds[:, 0], self.bounds[:, 1], size=(num_candidates, self.dim)
        )
        scores = self.acquisition_function(candidates)
        best_idx = int(np.argmax(scores))
        return candidates[best_idx]

if __name__ == "__main__":
    # Command-line entry point. Two modes:
    #   --demo            run a built-in 1-D synthetic optimization loop
    #   --bounds [...]    propose the next experiment from optional --history
    import argparse
    import json
    import sys

    parser = argparse.ArgumentParser(description="Bayesian Optimization Agent")
    parser.add_argument("--history", help="List of [X, Y] pairs or JSON history. Format: '[[[x1], y1], [[x2], y2]]'")
    # Not marked required at the argparse level so that --demo can run on its
    # own; the requirement is enforced below for the normal CLI path.
    parser.add_argument("--bounds", help="List of (min, max) tuples. Format: '[[min1, max1], ...]' (required unless --demo is given)")
    parser.add_argument("--demo", action="store_true", help="Run the internal synthetic demo")
    parser.add_argument("--output", help="Path to save output JSON")

    args = parser.parse_args()

    if args.demo:
        # Define a "Black Box" function (e.g., experimental yield)
        # Goal: Maximize this function
        def synthetic_experiment(params):
            # Simple 1D function: f(x) = -(x-2)^2 + 10. Max is at x=2, value=10.
            x = params[0]
            return -(x - 2.0)**2 + 10.0

        # Initialize Optimizer for 1D space between [-5, 5]
        opt = BayesianOptimizer(bounds=[(-5.0, 5.0)])

        print("--- Starting Self-Driving Lab Simulation ---")

        # Initial random observations
        X_init = [np.array([0.0]), np.array([4.0])]
        Y_init = [synthetic_experiment(x) for x in X_init]
        opt.fit(X_init, Y_init)

        # Run 5 optimization steps
        for step in range(5):
            next_param = opt.propose_next_location()
            actual_value = synthetic_experiment(next_param)

            print(f"Step {step+1}: Suggested Param {next_param}, Result {actual_value:.4f}")

            # Add to known data
            X_init.append(next_param)
            Y_init.append(actual_value)
            opt.fit(X_init, Y_init)

        best_y = max(Y_init)
        print(f"Optimization Complete. Best Value Found: {best_y:.4f}")

    else:
        if args.bounds is None:
            # Same exit path (status 2 + usage) argparse uses for a missing required option.
            parser.error("the following arguments are required: --bounds")

        # Step 1: parse the JSON arguments. Only parsing failures are reported
        # as argument errors.
        try:
            bounds = json.loads(args.bounds)

            X_hist = []
            Y_hist = []
            if args.history:
                # History format expected: [ [[x1_1, x1_2], y1], [[x2_1, x2_2], y2] ]
                for x, y in json.loads(args.history):
                    # atleast_1d lets a bare scalar x (1-D problems) form a
                    # proper (n, 1) sample matrix when the entries are stacked.
                    X_hist.append(np.atleast_1d(np.asarray(x, dtype=float)))
                    Y_hist.append(float(y))
        except (ValueError, TypeError) as e:
            # json.JSONDecodeError is a ValueError; malformed [x, y] entries
            # raise ValueError/TypeError on unpacking or float conversion.
            print(f"Error parsing arguments: {e}", file=sys.stderr)
            sys.exit(1)

        # Step 2: build the optimizer and propose the next experiment.
        try:
            opt = BayesianOptimizer(bounds=bounds)
            if X_hist:
                opt.fit(X_hist, Y_hist)
            next_param = opt.propose_next_location()
        except Exception as e:  # top-level CLI boundary: report and exit non-zero
            print(f"Error computing next parameters: {e}", file=sys.stderr)
            sys.exit(1)

        result = {
            "next_parameters": next_param.tolist(),
            "status": "ready"
        }

        print(json.dumps(result, indent=2))

        # Step 3: optionally persist the same JSON to disk.
        if args.output:
            try:
                with open(args.output, 'w', encoding="utf-8") as f:
                    json.dump(result, f, indent=2)
            except OSError as e:
                print(f"Error writing output file: {e}", file=sys.stderr)
                sys.exit(1)
# Module-level author/provenance marker string; none of the code visible in this file reads it.
__AUTHOR_SIGNATURE__ = "9a7f3c2e-MD-BABU-MIA-2026-MSSM-SECURE"