"""
Stress testing tool for evaluating database configurations under workload.
Supports OLAP (dwg), OLTP (sysbench, tpcc), and surrogate model evaluation.
"""
import copy
import os
import time
import logging
from typing import Dict, Any, Optional
import json
import numpy as np
from tuning_utils.multi_thread import multi_thread
from tuning_utils.surrogate import Surrogate
from knob_config import parse_knob_config
from benchbase_runner import BenchBaseRunner


class stress_testing_tool:
    """
    Execute workloads under specific knob configurations and measure performance.

    Supports:
    - OLAP workloads via multi-threaded query execution (DWG)
    - OLTP benchmarks via BenchBase (e.g., sysbench, TPC-C)
    - Surrogate-model-based fast evaluation
    """

    def __init__(self, config: Dict[str, Any], db, logger: logging.Logger, records_log: str):
        """Initialize the stress testing tool from a parsed config dict."""
        self.args = config
        self.benchmark_config = config['benchmark_config']
        self.db = db
        self.sur_config = config.get('surrogate_config', {})
        self.logger = logger
        self.records_log = records_log
        self.iteration_count = 0
        # Ensure output directories exist (guard against a bare filename,
        # whose dirname is the empty string)
        records_dir = os.path.dirname(self.records_log)
        if records_dir:
            os.makedirs(records_dir, exist_ok=True)
        perf_record_dir = self.benchmark_config.get('performance_record_path', 'logs/performance_record')
        os.makedirs(perf_record_dir, exist_ok=True)
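
    # Illustrative shape of the expected `config` dict (the values below are
    # made up; only the keys this class actually reads are shown):
    #
    #   {
    #       "benchmark_config": {
    #           "tool": "dwg",           # one of: 'dwg', 'benchbase', 'surrogate'
    #           "workload_path": "workloads/demo",
    #           "log_path": "logs/performance/workload_execution.log",
    #           "performance_record_path": "logs/performance_record",
    #           "thread": 4
    #       },
    #       "surrogate_config": {}
    #   }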

    def test_config(self, config: Dict[str, Any], iteration: Optional[int] = None) -> float:
        """Test a knob configuration and return the measured performance metric."""
        self.iteration_count += 1
        if iteration is None:
            iteration = self.iteration_count
        workload_name = os.path.basename(self.benchmark_config.get('workload_path', 'unknown'))
        self.logger.info(f"[Iteration {iteration}] [Workload: {workload_name}] Testing configuration")

        temp_config = copy.deepcopy(config)
        cur_state = []
        tool = self.benchmark_config.get('tool', 'dwg')

        # Apply knobs and fetch internal metrics (skipped for surrogate runs,
        # which never touch the live database)
        if tool != 'surrogate':
            self.logger.info(f"[Iteration {iteration}] Applying knobs to database")
            applied = self.db.change_knob(config)
            if not applied:
                self.logger.warning(f"[Iteration {iteration}] Some knobs failed to apply")
            self.logger.info(f"[Iteration {iteration}] Fetching internal metrics")
            cur_state = self.db.fetch_inner_metrics()

        if tool == 'dwg':
            self.logger.info(f"[Iteration {iteration}] Running DWG OLAP workload")
            y = self._test_by_dwg(
                self.benchmark_config['workload_path'],
                self.benchmark_config.get('log_path', 'logs/performance/workload_execution.log'),
                iteration
            )['throughput_qps']
            y = y[0] if isinstance(y, (list, tuple)) else y
        elif tool == 'benchbase':
            self.logger.info(f"[Iteration {iteration}] Running BenchBase benchmark")
            y = self.test_by_benchbase(
                self.benchmark_config['workload_path'],
                self.benchmark_config.get('log_path', 'logs/performance/benchbase_execution.log')
            )
        elif tool == 'surrogate':
            self.logger.info(f"[Iteration {iteration}] Running surrogate model")
            y = self._test_by_surrogate(cur_state, self.benchmark_config['workload_path'],
                                        self.sur_config, config, iteration)
        else:
            self.logger.error(f"[Iteration {iteration}] Unknown tool: {tool}")
            return 0.0
self.logger.info(f"[Iteration {iteration}] Performance: {y:.4f}")
# Record to training log
temp_config['tps'] = y
temp_config['iteration'] = iteration
temp_config['workload'] = workload_name
with open(self.records_log, 'a') as f:
f.write(json.dumps(temp_config) + '\n')
# Record to offline sample
if tool != 'surrogate':
offline_path = 'logs/offline_sample/offline_sample.jsonl'
os.makedirs(os.path.dirname(offline_path), exist_ok=True)
with open(offline_path, 'a') as f:
temp_config['y'] = [-y, 1/(-y)] if y != 0 else [0, 0]
temp_config['inner_metrics'] = cur_state
temp_config['workload'] = self.benchmark_config['workload_path']
f.write(json.dumps(temp_config) + '\n')
# Record to per-workload performance file
perf_dir = self.benchmark_config.get('performance_record_path', 'logs/performance_record')
perf_file = os.path.join(perf_dir, f"{workload_name}.txt")
with open(perf_file, 'a') as w:
w.write(f"[Iteration {iteration}] Performance: {y:.4f}\n")
return y
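
    # Each successful call appends one JSON line to `records_log`; with
    # hypothetical knob names and values, a line looks like:
    #
    #   {"shared_buffers": 4096, "work_mem": 65536, "tps": 1234.5678,
    #    "iteration": 3, "workload": "demo"}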

    def test_by_benchbase(self, workload_path, log_file):
        """Test database performance using BenchBase."""
        benchbase_runner = BenchBaseRunner(self.args, self.logger)
        return benchbase_runner.run_benchmark(workload_path, log_file)

    def _test_by_dwg(self, workload_path: str, log_file: str, iteration: int) -> Dict[str, Any]:
        """Execute an OLAP workload via multi-threaded DWG.

        Returns the result dict produced by multi_thread.run(); callers read
        its 'throughput_qps' entry.
        """
        log_dir = os.path.dirname(log_file)
        if log_dir:
            os.makedirs(log_dir, exist_ok=True)
        thread_count = int(self.benchmark_config.get('thread', 1))
        mh = multi_thread(self.db, workload_path, thread_count, log_file)
        mh.data_pre()
        self.logger.info(f"[Iteration {iteration}] Running with {thread_count} thread(s)")
        result = mh.run()
        self.logger.info(f"[Iteration {iteration}] DWG complete, result: {result}")
        return result

    def _test_by_surrogate(self, inner_metrics: Any, workload_path: str,
                           sur_config: Dict[str, Any], knobs: Dict[str, Any],
                           iteration: int) -> float:
        """Predict performance using the surrogate model instead of a live run."""
        self.logger.info(f"[Iteration {iteration}] Loading surrogate model")
        sg = Surrogate(sur_config, workload_path)

        # 1. Min-max normalize the knob values into [0, 1] using the ranges
        #    from the knob config; see the worked example below
        knob_detail = parse_knob_config.get_knobs('knob_config/knob_config.json')
        normalized_knobs = {}
        for key, detail in knob_detail.items():
            val = knobs.get(key, detail.get('default', 0))
            if detail['max'] - detail['min'] != 0:
                normalized_knobs[key] = (val - detail['min']) / (detail['max'] - detail['min'])
            else:
                normalized_knobs[key] = 0.0
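
        # Worked example of the scaling above (illustrative numbers): a knob
        # with min=64, max=8192 and current value 4096 normalizes to
        # (4096 - 64) / (8192 - 64) ≈ 0.496; a knob with max == min maps to 0.0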
        # 2. Prepare internal metrics as a dictionary
        #    Database.fetch_inner_metrics() normally returns a dict already
        if isinstance(inner_metrics, dict):
            inner_metrics_dict = inner_metrics
        else:
            # Fallback for positional list input; see the illustration below
            metric_keys = [
                'xact_commit', 'xact_rollback', 'blks_read', 'blks_hit',
                'tup_returned', 'tup_fetched', 'tup_inserted', 'conflicts',
                'tup_updated', 'tup_deleted', 'disk_read_count', 'disk_write_count',
                'disk_read_bytes', 'disk_write_bytes'
            ]
            inner_metrics_dict = {}
            for i, key in enumerate(metric_keys):
                inner_metrics_dict[key] = inner_metrics[i] if i < len(inner_metrics) else 0.0
        # Ensure temp_bytes is present (default to 0 if missing)
        inner_metrics_dict.setdefault('temp_bytes', 0.0)
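
        # Illustration of the list fallback (made-up values): inner_metrics =
        # [120, 3, 4500] yields {'xact_commit': 120, 'xact_rollback': 3,
        # 'blks_read': 4500, 'blks_hit': 0.0, ...}, with every key beyond the
        # list length defaulting to 0.0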
self.logger.info(f"[Iteration {iteration}] Running surrogate prediction")
prediction = sg.run(inner_metrics_dict, normalized_knobs)
self.logger.info(f"[Iteration {iteration}] Surrogate prediction: {prediction:.4f}")
return prediction
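

# ---------------------------------------------------------------------------
# Minimal usage sketch. The database wiring and all config values below are
# hypothetical placeholders, not part of this module's API.
# ---------------------------------------------------------------------------
if __name__ == "__main__":
    logging.basicConfig(level=logging.INFO)
    demo_logger = logging.getLogger("stress_testing_demo")

    # Hypothetical config; only the keys this module reads are shown
    demo_config = {
        'benchmark_config': {
            'tool': 'dwg',
            'workload_path': 'workloads/demo',
            'log_path': 'logs/performance/workload_execution.log',
            'performance_record_path': 'logs/performance_record',
            'thread': 2,
        },
        'surrogate_config': {},
    }

    # A real database handle exposing change_knob() and fetch_inner_metrics()
    # would be constructed here; None is only a stand-in for this sketch
    demo_db = None

    tester = stress_testing_tool(demo_config, demo_db, demo_logger, 'logs/records.jsonl')
    # With a real db handle, a tuning loop would then call e.g.:
    # tps = tester.test_config({'shared_buffers': 4096}, iteration=1)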