diff options
Diffstat (limited to 'test/perf-ingest.cpp')
-rw-r--r-- | test/perf-ingest.cpp | 115 |
1 files changed, 115 insertions, 0 deletions
diff --git a/test/perf-ingest.cpp b/test/perf-ingest.cpp new file mode 100644 index 0000000..6de3dae --- /dev/null +++ b/test/perf-ingest.cpp @@ -0,0 +1,115 @@ +#include <benchmark/benchmark.h> +#include <filesystem> + +#include "test-util.hpp" +#include <c++11Helpers.h> +#include <fstream> +#include <random> + +#include <ingestor.hpp> + +namespace { + const std::filesystem::path TMP_LOG = std::format("/tmp/webstat-perf-{}.log", getpid()); + + const struct LogFile { + SPECIAL_MEMBERS_DELETE(LogFile); + + LogFile() + { + std::random_device randDevice; + std::mt19937 generator(randDevice()); + + struct Strings { + std::vector<std::string> vhosts; + std::vector<std::string> ips; + std::vector<std::string> paths; + std::vector<std::string> qss; + std::vector<std::string> refs; + std::vector<std::string> uas; + }; + + Strings strings; + + auto genIp = [&generator]() { + static std::uniform_int_distribution<unsigned short> octetDistrib { + 0, std::numeric_limits<uint8_t>::max()}; + return std::format("{}.{}.{}.{}", octetDistrib(generator), octetDistrib(generator), + octetDistrib(generator), octetDistrib(generator) + + ); + }; + auto getStrGen = [&generator](size_t minLen, size_t maxLen) { + return [minLen, maxLen, &generator]() { + std::uniform_int_distribution<char> charDistrib {'a', 'z'}; + std::uniform_int_distribution<size_t> lenDistrib {minLen, maxLen}; + std::string out; + std::generate_n(std::back_inserter(out), lenDistrib(generator), [&generator, &charDistrib]() { + return charDistrib(generator); + }); + return out; + }; + }; + + for (auto & [out, count, stringGenerator] : std::initializer_list< + std::tuple<std::vector<std::string> &, size_t, std::function<std::string()>>> { + {strings.vhosts, 4, getStrGen(6, 20)}, + {strings.ips, 4, genIp}, + {strings.paths, 100, getStrGen(1, 50)}, + {strings.qss, 100, getStrGen(1, 50)}, + {strings.refs, 50, getStrGen(10, 50)}, + {strings.uas, 10, getStrGen(50, 70)}, + }) { + std::generate_n(std::back_inserter(out), count, stringGenerator); + } + strings.qss.emplace_back(""); + strings.refs.emplace_back("-"); + strings.uas.emplace_back("-"); + + constexpr size_t MISC_MIN = 1000; + constexpr size_t MISC_MAX = 10000; + constexpr uint64_t TICK_START = 1755710158296508; + std::uniform_int_distribution<size_t> tickDistrib {MISC_MIN, MISC_MAX}; + std::uniform_int_distribution<size_t> sizeDistrib {MISC_MIN, MISC_MAX}; + std::uniform_int_distribution<size_t> durationDistrib {MISC_MIN, MISC_MAX}; + uint64_t tick = TICK_START; + auto randomString = [&generator](auto & stringSet) { + std::uniform_int_distribution<size_t> choiceDistrib {0, stringSet.size() - 1}; + return stringSet[choiceDistrib(generator)]; + }; + + std::ofstream logfile {TMP_LOG}; + constexpr size_t LOG_LINES = 10000; + for (size_t line = 0; line < LOG_LINES; ++line) { + std::println(logfile, R"LOG({} {} {} GET "/{}" "?{}" HTTP/1.1 200 {} {} "{}" "{}")LOG", + randomString(strings.vhosts), randomString(strings.ips), tick += tickDistrib(generator), + randomString(strings.paths), randomString(strings.qss), sizeDistrib(generator), + durationDistrib(generator), randomString(strings.refs), randomString(strings.uas)); + } + } + + ~LogFile() + { + std::filesystem::remove(TMP_LOG); + } + } LOG_FILE; + + void + setup(const benchmark::State &) + { + static const WebStat::MockDB mockdb; + } + + void + doIngestFile(benchmark::State & state) + { + WebStat::Ingestor ingestor {"perf-hostname", DB::MockDatabase::openConnectionTo("webstat")}; + for (auto loop : state) { + WebStat::FilePtr logFile {fopen(TMP_LOG.c_str(), "r")}; + ingestor.ingestLog(logFile.get()); + } + } +} + +BENCHMARK(doIngestFile)->Setup(setup); + +BENCHMARK_MAIN(); |