Fixing daggyr issues when reporting on tasks with very large outputs
(>10kb). Squashed commit of the following: commit b87fa418b4aca78928186a8fa992bef701e044a4 Author: Ian Roddis <tech@kinesin.ca> Date: Mon Feb 14 12:55:34 2022 -0400 removing memory leak commit 5e284ab92dbea991262a08c0cd50d6fc2f912e3b Author: Ian Roddis <tech@kinesin.ca> Date: Mon Feb 14 11:58:57 2022 -0400 Speeding up serialization, fixing payload sizing issue on daggyr commit e5e358820da4c2587741abdc3b6b103e5a4d4dd3 Author: Ian Roddis <tech@kinesin.ca> Date: Sun Feb 13 22:24:04 2022 -0400 changing newlines to std::endl for flush goodness commit 705ec86b75be947e64f4124ec8017cba2c8465e6 Author: Ian Roddis <tech@kinesin.ca> Date: Sun Feb 13 22:16:56 2022 -0400 adding more logging commit aa3db9c23e55da7a0523dc57e268b605ce8faac3 Author: Ian Roddis <tech@kinesin.ca> Date: Sun Feb 13 22:13:56 2022 -0400 Adding threadid commit 3b1a0f1333b2d43bc5ecad0746435504babbaa61 Author: Ian Roddis <tech@kinesin.ca> Date: Sun Feb 13 22:13:24 2022 -0400 Adding some debugging commit 804507e65251858fa597b7c27bcece8d8dfd589d Author: Ian Roddis <tech@kinesin.ca> Date: Sun Feb 13 21:52:53 2022 -0400 Removing curl global cleanup
This commit is contained in:
@@ -34,7 +34,6 @@ namespace daggy {
|
||||
void set(const T val)
|
||||
{
|
||||
if (val_) {
|
||||
std::cout << "Future already has a value!" << std::endl;
|
||||
throw std::runtime_error("Future already has a value");
|
||||
}
|
||||
val_.emplace(val);
|
||||
|
||||
@@ -50,6 +50,7 @@ namespace daggy {
|
||||
Ok = 200,
|
||||
Not_Found = 404,
|
||||
Not_Acceptable = 406,
|
||||
Not_Ready = 428,
|
||||
Server_Error = 500
|
||||
};
|
||||
|
||||
|
||||
@@ -23,6 +23,7 @@ namespace daggy {
|
||||
std::string dumpJSON(const rj::Value &doc)
|
||||
{
|
||||
rj::StringBuffer buffer;
|
||||
buffer.Clear();
|
||||
rj::Writer<rj::StringBuffer> writer(buffer);
|
||||
doc.Accept(writer);
|
||||
return buffer.GetString();
|
||||
@@ -281,8 +282,68 @@ namespace daggy {
|
||||
return os;
|
||||
}
|
||||
|
||||
// From https://stackoverflow.com/questions/7724448/simple-json-string-escape-for-c
|
||||
enum State {ESCAPED, UNESCAPED};
|
||||
std::string escapeJSON(const std::string& input)
|
||||
{
|
||||
std::string output;
|
||||
output.reserve(input.length());
|
||||
|
||||
for (std::string::size_type i = 0; i < input.length(); ++i)
|
||||
{
|
||||
switch (input[i]) {
|
||||
case '"':
|
||||
output += "\\\"";
|
||||
break;
|
||||
case '/':
|
||||
output += "\\/";
|
||||
break;
|
||||
case '\b':
|
||||
output += "\\b";
|
||||
break;
|
||||
case '\f':
|
||||
output += "\\f";
|
||||
break;
|
||||
case '\n':
|
||||
output += "\\n";
|
||||
break;
|
||||
case '\r':
|
||||
output += "\\r";
|
||||
break;
|
||||
case '\t':
|
||||
output += "\\t";
|
||||
break;
|
||||
case '\\':
|
||||
output += "\\\\";
|
||||
break;
|
||||
default:
|
||||
output += input[i];
|
||||
break;
|
||||
}
|
||||
|
||||
}
|
||||
|
||||
return output;
|
||||
}
|
||||
|
||||
std::string attemptRecordToJSON(const AttemptRecord &record)
|
||||
{
|
||||
std::stringstream ss;
|
||||
|
||||
ss << "{"
|
||||
<< R"("startTime": ")" << timePointToString(record.startTime) << "\","
|
||||
<< R"("stopTime": ")" << timePointToString(record.stopTime) << "\","
|
||||
<< R"("rc": )" << record.rc << ","
|
||||
<< R"("outputLog": ")" << escapeJSON(record.outputLog) << "\","
|
||||
<< R"("errorLog": ")" << escapeJSON(record.errorLog) << "\","
|
||||
<< R"("executorLog": ")" << escapeJSON(record.executorLog) << '"'
|
||||
<< "}";
|
||||
|
||||
return ss.str();
|
||||
}
|
||||
|
||||
/*
|
||||
std::string attemptRecordToJSON(const AttemptRecord &record) {
|
||||
rj::Document doc;
|
||||
doc.SetObject();
|
||||
auto &alloc = doc.GetAllocator();
|
||||
@@ -314,9 +375,9 @@ namespace daggy {
|
||||
rj::Value().SetString(record.executorLog.c_str(),
|
||||
record.executorLog.size(), alloc),
|
||||
alloc);
|
||||
|
||||
return dumpJSON(doc);
|
||||
}
|
||||
*/
|
||||
|
||||
AttemptRecord attemptRecordFromJSON(const std::string &json)
|
||||
{
|
||||
|
||||
@@ -225,16 +225,17 @@ namespace daggy {
|
||||
CURLcode res;
|
||||
struct curl_slist *headers = NULL;
|
||||
|
||||
curl_global_init(CURL_GLOBAL_ALL);
|
||||
|
||||
curl = curl_easy_init();
|
||||
if (curl) {
|
||||
std::stringstream buffer;
|
||||
char errbuf[CURL_ERROR_SIZE];
|
||||
|
||||
curl_easy_setopt(curl, CURLOPT_URL, url.c_str());
|
||||
curl_easy_setopt(curl, CURLOPT_WRITEFUNCTION, curlWriter);
|
||||
curl_easy_setopt(curl, CURLOPT_WRITEDATA, &buffer);
|
||||
curl_easy_setopt(curl, CURLOPT_TIMEOUT, 8);
|
||||
curl_easy_setopt(curl, CURLOPT_ERRORBUFFER, &errbuf);
|
||||
curl_easy_setopt(curl, CURLOPT_TIMEOUT, 8L);
|
||||
curl_easy_setopt(curl, CURLOPT_NOSIGNAL, 1L);
|
||||
|
||||
if (trace) {
|
||||
curl_easy_setopt(curl, CURLOPT_DEBUGFUNCTION, http_trace);
|
||||
@@ -253,19 +254,19 @@ namespace daggy {
|
||||
res = curl_easy_perform(curl);
|
||||
|
||||
if (res != CURLE_OK) {
|
||||
|
||||
curl_easy_cleanup(curl);
|
||||
response.code = HTTPCode::Server_Error;
|
||||
response.body = std::string{"CURL Failed: "} + curl_easy_strerror(res);
|
||||
return response;
|
||||
}
|
||||
curl_easy_cleanup(curl);
|
||||
|
||||
curl_easy_getinfo(curl, CURLINFO_RESPONSE_CODE, &response.code);
|
||||
curl_easy_cleanup(curl);
|
||||
response.body = buffer.str();
|
||||
} else {
|
||||
throw std::runtime_error("Unable to init cURL object");
|
||||
}
|
||||
|
||||
curl_global_cleanup();
|
||||
|
||||
return response;
|
||||
}
|
||||
|
||||
|
||||
@@ -16,6 +16,7 @@ add_executable(${PROJECT_NAME} main.cpp
|
||||
int_basic.cpp
|
||||
# Performance checks
|
||||
perf_dag.cpp
|
||||
perf_serialization.cpp
|
||||
)
|
||||
target_link_libraries(${PROJECT_NAME} libdaggy stdc++fs Catch2::Catch2)
|
||||
|
||||
|
||||
@@ -49,7 +49,7 @@ const size_t MAX_CHILDREN = 10;
|
||||
|
||||
static auto DAG = createDAG(N_NODES, MAX_CHILDREN);
|
||||
|
||||
TEST_CASE("massive DAGs", "[dag_performance]")
|
||||
TEST_CASE("massive DAGs", "[dag_performance][perf]")
|
||||
{
|
||||
BENCHMARK_ADVANCED("dag.reset")(Catch::Benchmark::Chronometer meter)
|
||||
{
|
||||
|
||||
50
libdaggy/tests/perf_serialization.cpp
Normal file
50
libdaggy/tests/perf_serialization.cpp
Normal file
@@ -0,0 +1,50 @@
|
||||
#ifdef CATCH_CONFIG_ENABLE_BENCHMARKING
|
||||
|
||||
#include <catch2/catch.hpp>
|
||||
#include <iostream>
|
||||
#include <random>
|
||||
|
||||
#include <daggy/Serialization.hpp>
|
||||
|
||||
std::string random_string(std::size_t length)
|
||||
{
|
||||
const std::string CHARACTERS = "0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz;\"'\n\t{}[]()";
|
||||
|
||||
std::random_device random_device;
|
||||
std::mt19937 generator(random_device());
|
||||
std::uniform_int_distribution<> distribution(0, CHARACTERS.size() - 1);
|
||||
|
||||
std::string random_string;
|
||||
|
||||
for (std::size_t i = 0; i < length; ++i)
|
||||
{
|
||||
random_string += CHARACTERS[distribution(generator)];
|
||||
}
|
||||
|
||||
return random_string;
|
||||
}
|
||||
|
||||
using namespace daggy;
|
||||
|
||||
TEST_CASE("attempt output", "[serialize_attempt_performance][perf]")
|
||||
{
|
||||
size_t LOGSIZE = 512000;
|
||||
// Need lots of data
|
||||
AttemptRecord attempt{
|
||||
.startTime = Clock::now(),
|
||||
.stopTime = Clock::now(),
|
||||
.rc = 0,
|
||||
.executorLog = random_string(LOGSIZE),
|
||||
.outputLog = random_string(LOGSIZE),
|
||||
.errorLog = random_string(LOGSIZE)
|
||||
};
|
||||
|
||||
|
||||
BENCHMARK_ADVANCED("rj_dump")(Catch::Benchmark::Chronometer meter)
|
||||
{
|
||||
meter.measure([&] { return attemptRecordToJSON(attempt); });
|
||||
};
|
||||
|
||||
}
|
||||
|
||||
#endif
|
||||
@@ -102,3 +102,45 @@ TEST_CASE("task_serialization", "[serialize_tasks]")
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
TEST_CASE("attempt_serialization", "[serialize_attempt]")
|
||||
{
|
||||
SECTION("Serialize Simple Attempt")
|
||||
{
|
||||
using namespace daggy;
|
||||
|
||||
AttemptRecord attempt{
|
||||
.startTime = Clock::now(),
|
||||
.stopTime = Clock::now(),
|
||||
.rc = 0,
|
||||
.executorLog = "",
|
||||
.outputLog = "",
|
||||
.errorLog = "",
|
||||
};
|
||||
|
||||
auto json = attemptRecordToJSON(attempt);
|
||||
|
||||
rj::Document doc;
|
||||
REQUIRE_NOTHROW(checkRJParse(doc.Parse(json.c_str()), "Parsing AttemptRecord"));
|
||||
}
|
||||
|
||||
SECTION("Serialize Attempt with complicated logs")
|
||||
{
|
||||
using namespace daggy;
|
||||
|
||||
AttemptRecord attempt{
|
||||
.startTime = Clock::now(),
|
||||
.stopTime = Clock::now(),
|
||||
.rc = 0,
|
||||
.executorLog = "",
|
||||
.outputLog = "This is a testament to\nmore complicated, \"potentially quoted\"\nproblem\tspaces\n",
|
||||
.errorLog = "",
|
||||
};
|
||||
|
||||
auto json = attemptRecordToJSON(attempt);
|
||||
|
||||
rj::Document doc;
|
||||
REQUIRE_NOTHROW(checkRJParse(doc.Parse(json.c_str()), "Parsing AttemptRecord"));
|
||||
}
|
||||
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user