aws-crt-s3-benchmarks/runners/s3-benchrunner-c/BenchmarkRunner.cpp at main · c-hagem/aws-crt-s3-benchmarks · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
#include "BenchmarkRunner.h"

#include <algorithm>
#include <chrono>
#include <climits>
#include <cmath>
#include <cstdio>
#include <cstdlib>
#include <ctime>
#include <exception>
#include <filesystem>
#include <fstream>
#include <iomanip>
#include <iostream>
#include <numeric>
#include <random>
#include <sstream>
#include <string>

#include <aws/common/system_resource_util.h>

#include <argh.h>
#include <nlohmann/json.hpp>

using namespace std;
using namespace std::chrono;
using json = nlohmann::json;

struct TaskConfig;
class Benchmark;

// Report a fatal error on stderr, then terminate the process immediately with exit code 255.
[[noreturn]] void fail(std::string_view msg)
{
    constexpr int kFailureExitCode = 255;

    // Flush explicitly: _Exit() terminates without flushing stream buffers
    std::cerr << "FAIL - " << msg << '\n' << std::flush;
    _Exit(kFailureExitCode);
}

// Terminate with exit code 123 to signal that this benchmark is being skipped rather than
// failing (e.g. the workload has a version# this runner doesn't support yet).
[[noreturn]] void skip(std::string_view msg)
{
    constexpr int kSkipExitCode = 123;

    // Flush explicitly: _Exit() terminates without flushing stream buffers
    std::cerr << "Skipping benchmark - " << msg << '\n' << std::flush;
    _Exit(kSkipExitCode);
}

// Convert a size in kibibytes (1 KiB = 1024 bytes) to bytes.
uint64_t bytesFromKiB(uint64_t kibibytes)
{
    constexpr uint64_t kBytesPerKiB = uint64_t{1} << 10;
    return kBytesPerKiB * kibibytes;
}

// Convert a size in mebibytes (1 MiB = 1024 * 1024 bytes) to bytes.
uint64_t bytesFromMiB(uint64_t mebibytes)
{
    constexpr uint64_t kBytesPerMiB = uint64_t{1} << 20;
    return kBytesPerMiB * mebibytes;
}

// Convert a size in gibibytes (1 GiB = 1024 * 1024 * 1024 bytes) to bytes.
uint64_t bytesFromGiB(uint64_t gibibytes)
{
    constexpr uint64_t kBytesPerGiB = uint64_t{1} << 30;
    return kBytesPerGiB * gibibytes;
}

// Express a byte count in kibibytes (1 KiB = 1024 bytes), keeping the fractional part.
double bytesToKiB(uint64_t bytes)
{
    constexpr double kBytesPerKiB = 1024.0;
    return static_cast<double>(bytes) / kBytesPerKiB;
}

// Express a byte count in mebibytes (1 MiB = 1024 * 1024 bytes), keeping the fractional part.
double bytesToMiB(uint64_t bytes)
{
    constexpr double kBytesPerMiB = 1024.0 * 1024.0;
    return static_cast<double>(bytes) / kBytesPerMiB;
}

// Express a byte count in gibibytes (1 GiB = 1024 * 1024 * 1024 bytes), keeping the fractional part.
double bytesToGiB(uint64_t bytes)
{
    constexpr double kBytesPerGiB = 1024.0 * 1024.0 * 1024.0;
    return static_cast<double>(bytes) / kBytesPerGiB;
}

// Express a byte count in kilobits (8 bits per byte, 1 kilobit = 1,000 bits).
double bytesToKilobit(uint64_t bytes)
{
    const double bits = static_cast<double>(bytes) * 8.0;
    return bits / 1'000.0;
}

// Express a byte count in megabits (8 bits per byte, 1 megabit = 1,000,000 bits).
double bytesToMegabit(uint64_t bytes)
{
    const double bits = static_cast<double>(bytes) * 8.0;
    return bits / 1'000'000.0;
}

// Express a byte count in gigabits (8 bits per byte, 1 gigabit = 1,000,000,000 bits).
double bytesToGigabit(uint64_t bytes)
{
    const double bits = static_cast<double>(bytes) * 8.0;
    return bits / 1'000'000'000.0;
}

// Builds the benchmark configuration from a workload JSON file plus the settings
// that were passed in by the caller.
//
// - Calls fail() if the file can't be opened or isn't valid JSON.
// - Calls skip() if the workload's "version" is anything other than 2.
// - `networkInterfaceNames` is a comma-separated list; empty entries are ignored.
BenchmarkConfig::BenchmarkConfig(
    std::string_view jsonFilepath,
    std::string_view bucket,
    std::string_view region,
    double targetThroughputGbps,
    std::string_view networkInterfaceNames,
    std::string_view telemetryFileBasePath)
    : bucket(bucket), region(region), targetThroughputGbps(targetThroughputGbps),
      telemetryFileBasePath(telemetryFileBasePath)
{
    const std::string workloadPath(jsonFilepath);

    std::ifstream workloadFile(workloadPath);
    if (!workloadFile)
        fail("Couldn't open file: " + workloadPath);

    // Parse without exceptions; a malformed document comes back as a "discarded" value.
    // The object is intentionally non-const: operator[] on a missing key then yields null.
    auto workload = json::parse(workloadFile, /*cb*/ nullptr, /*exceptions*/ false);
    if (workload.is_discarded())
        fail("Couldn't parse JSON: " + workloadPath);

    const int version = workload["version"];
    if (version != 2)
        skip("workload version not supported");

    maxRepeatCount = workload["maxRepeatCount"];
    maxRepeatSecs = workload["maxRepeatSecs"];

    // "checksum" is optional, leave the member at its default when it is absent/null
    if (!workload["checksum"].is_null())
        checksum = workload["checksum"];

    filesOnDisk = workload["filesOnDisk"];

    for (auto &&taskJson : workload["tasks"])
    {
        auto &newTask = tasks.emplace_back();
        newTask.action = taskJson["action"];
        newTask.key = taskJson["key"];
        newTask.size = taskJson["size"];
    }

    // Split the comma-separated interface list, dropping empty entries
    std::string_view unparsed = networkInterfaceNames;
    while (!unparsed.empty())
    {
        const size_t comma = unparsed.find(',');
        const std::string_view name = unparsed.substr(0, comma);
        if (!name.empty())
        {
            this->networkInterfaceNames.push_back(std::string(name));
        }

        if (comma == std::string_view::npos)
            break;
        unparsed.remove_prefix(comma + 1);
    }
}

uint64_t BenchmarkConfig::bytesPerRun() const
{
    uint64_t bytes = 0;
    for (auto &&task : tasks)
        bytes += task.size;
    return bytes;
}

// Stores the config and prepares the data used for in-memory uploads.
// Does not run the benchmark yet.
//
// When the workload doesn't use files on disk, `randomDataForUpload` is filled with
// pseudo-random bytes. Every upload shares this one buffer, so it is sized to fit
// the largest "upload" task (and stays empty if there are no uploads).
BenchmarkRunner::BenchmarkRunner(const BenchmarkConfig &config) : config(config)
{
    // Uploads will read from files on disk, no in-memory data needed
    if (config.filesOnDisk)
        return;

    size_t largestUpload = 0;
    for (const auto &task : config.tasks)
    {
        if (task.action == "upload")
            largestUpload = std::max(largestUpload, static_cast<size_t>(task.size));
    }

    // Generating randomness is slower than copying memory, so only ONE block is
    // actually randomized, and the rest of the buffer is filled with copies of it.
    // The block length (approx 30MiB, digits of pi) is chosen so that the copies
    // won't fall on a part boundary, since we don't want any parts to be identical.
    const size_t blockSize = std::min(static_cast<size_t>(31415926), largestUpload);
    std::vector<uint8_t> block(blockSize);
    independent_bits_engine<default_random_engine, CHAR_BIT, unsigned char> byteGenerator;
    std::generate(block.begin(), block.end(), byteGenerator);

    // Tile the random block across the whole buffer; the final copy may be partial
    randomDataForUpload.resize(largestUpload);
    for (size_t offset = 0; offset < largestUpload;)
    {
        const size_t chunkSize = std::min(blockSize, largestUpload - offset);
        std::copy_n(block.begin(), chunkSize, randomDataForUpload.begin() + offset);
        offset += chunkSize;
    }
}

// Destructor is defaulted here, in the .cpp file, rather than in the class declaration.
BenchmarkRunner::~BenchmarkRunner() = default;

// If telemetry is enabled, output stats for each run to ./telemetry/<workload_name>/<current_date_time>/stats.txt
// This stays NULL until benchmarkRunnerMain() opens the file; while it is NULL,
// StatsPrintf() only prints to stdout.
FILE *statsFile = NULL;

// printf-style output that always goes to stdout and, when the stats file is open,
// is duplicated into it. The stats file is flushed after every call.
template <typename... FormatArgs> void StatsPrintf(const char *fmt, FormatArgs... args)
{
    printf(fmt, args...);

    // No stats file, stdout is the only destination
    if (!statsFile)
        return;

    fprintf(statsFile, fmt, args...);
    fflush(statsFile);
}

// Print all kinds of stats about these values (median, mean, min, max, etc)
//
// label:  name of the measurement, printed as part of the output line
// values: the samples to summarize. Taken by value because they get sorted in place.
//
// Variance is the population variance (each squared deviation is divided by N),
// and StdDev is its square root.
// If there are no values at all, a short notice is printed instead of the stats,
// since min/max/mean/median are undefined for an empty set.
void printValueStats(const char *label, vector<double> values)
{
    if (values.empty())
    {
        StatsPrintf("Overall %s: no values recorded\n", label);
        return;
    }

    std::sort(values.begin(), values.end());
    const size_t count = values.size();
    const double n = static_cast<double>(count);
    const double lowest = values.front();
    const double highest = values.back();
    const double mean = std::accumulate(values.begin(), values.end(), 0.0) / n;

    // Odd count: use the middle value. Even count: use avg of the two middle values.
    const size_t middle = count / 2;
    const double median = (count % 2 == 1) ? values[middle] : (values[middle - 1] + values[middle]) / 2;

    const double variance = std::accumulate(
        values.begin(),
        values.end(),
        0.0,
        [mean, n](double accumulator, const double &val) { return accumulator + ((val - mean) * (val - mean) / n); });

    const double stdDev = std::sqrt(variance);

    StatsPrintf(
        "Overall %s Median:%f Mean:%f Min:%f Max:%f Variance:%f StdDev:%f\n",
        label,
        median,
        mean,
        lowest,
        highest,
        variance,
        stdDev);
}

void printAllStats(uint64_t bytesPerRun, const vector<double> &durations)
{
    vector<double> throughputsGbps;
    for (double duration : durations)
        throughputsGbps.push_back(bytesToGigabit(bytesPerRun) / duration);

    printValueStats("Throughput (Gb/s)", throughputsGbps);

    printValueStats("Duration (Secs)", durations);

    struct aws_memory_usage_stats mu;
    aws_init_memory_usage_for_current_process(&mu);

    StatsPrintf("Peak RSS:%f MiB\n", (double)mu.maxrss / 1024.0);
}

/**
 * Derives the name of a workload from the path to its file.
 * The name is the last component of the path, cut off at its first dot,
 * so "path/to/my-workload.run.json" becomes "my-workload".
 * A filename without any dot is returned unchanged.
 */
std::string workload_name(std::string_view path)
{
    const std::string leaf = std::filesystem::path(path).filename().string();

    // When no dot is found, find() gives npos and substr() keeps the whole string
    return leaf.substr(0, leaf.find('.'));
}

// Command line arguments, as parsed by benchmarkRunnerMain()
struct Args
{
    // Required positional arguments
    string s3ClientId; // S3_CLIENT: passed to the runner factory to pick the runner
    string workload;   // WORKLOAD: path to the workload's JSON file
    string bucket;     // BUCKET
    string region;     // REGION
    // TARGET_THROUGHPUT: given an explicit default so it is never indeterminate
    double targetThroughputGbps = 0.0;

    // Optional arguments
    string networkInterfaceNames = ""; // --nic: comma-separated interface names
    bool telemetry = false;            // --telemetry
};

int benchmarkRunnerMain(int argc, char *argv[], const CreateRunnerFromNameFn &createRunnerFromName)
{
    // START Argument Parsing
    argh::parser cmdl;
    // pre-register optional named arguments to support --param_name param_value syntax
    cmdl.add_params({"--nic"});
    cmdl.parse(argc, argv);

    if (cmdl[{"-h", "--help"}] || cmdl.pos_args().size() < 6)
    {
        fail(
            std::string("usage: ") + argv[0] +
            " S3_CLIENT WORKLOAD BUCKET REGION TARGET_THROUGHPUT [--nic name1,name2] [--telemetry]");
    }

    struct Args parsedArgs;

    // Parse required positional parameters
    parsedArgs.s3ClientId = cmdl[1];
    parsedArgs.workload = cmdl[2];
    parsedArgs.bucket = cmdl[3];
    parsedArgs.region = cmdl[4];
    parsedArgs.targetThroughputGbps = stod(cmdl[5]);

    // Parse optional named arguments
    cmdl("nic") >> parsedArgs.networkInterfaceNames;

    if (cmdl["telemetry"])
    {
        parsedArgs.telemetry = true;
    }

    // END argument parsing

    string telemetryFileBasePath = "";
    if (parsedArgs.telemetry)
    {
        auto now = chrono::system_clock::to_time_t(chrono::system_clock::now());
        stringstream ss;
        ss << "telemetry/";
        ss << workload_name(parsedArgs.workload) << "/";
        ss << put_time(localtime(&now), "%Y-%m-%d_%H-%M-%S");

        telemetryFileBasePath = ss.str();
        // Create the directory
        error_code ec;
        filesystem::create_directories(telemetryFileBasePath, ec);
        if (ec)
        {
            fail(string("Unable to create directory for telemetry files: ") + ec.message());
        }
        statsFile = fopen((telemetryFileBasePath + "/stats.txt").c_str(), "w");
    }

    auto config = BenchmarkConfig(
        parsedArgs.workload,
        parsedArgs.bucket,
        parsedArgs.region,
        parsedArgs.targetThroughputGbps,
        parsedArgs.networkInterfaceNames,
        telemetryFileBasePath);
    unique_ptr<BenchmarkRunner> benchmark = createRunnerFromName(parsedArgs.s3ClientId, config);
    uint64_t bytesPerRun = config.bytesPerRun();

    // Repeat benchmark until we exceed maxRepeatCount or maxRepeatSecs
    std::vector<double> durations;
    auto appStart = high_resolution_clock::now();
    for (int runNumber = 1; runNumber <= config.maxRepeatCount; ++runNumber)
    {
        auto runStart = high_resolution_clock::now();

        benchmark->run(runNumber);

        duration<double> runDurationSecs = high_resolution_clock::now() - runStart;
        double runSecs = runDurationSecs.count();
        durations.push_back(runSecs);
        fflush(stderr);
        StatsPrintf("Run:%d Secs:%f Gb/s:%f\n", runNumber, runSecs, bytesToGigabit(bytesPerRun) / runSecs);
        fflush(stdout);

        // break out if we've exceeded maxRepeatSecs
        duration<double> appDurationSecs = high_resolution_clock::now() - appStart;
        if (appDurationSecs >= 1s * config.maxRepeatSecs)
            break;
    }

    printAllStats(bytesPerRun, durations);

    if (statsFile != NULL)
    {
        fclose(statsFile);
    }

    return 0;
}