Changing up variable interpolation in preparation of supporting interpolation for environments

This commit is contained in:
Ian Roddis
2021-11-12 16:08:57 -04:00
parent ac3928c7f6
commit c0315b4f0b
3 changed files with 121 additions and 34 deletions

View File

@@ -18,6 +18,12 @@ namespace daggy {
std::string globalSub(std::string string, const std::string &pattern,
const std::string &replacement);
std::unordered_set<std::string> matchingParameters(
const std::vector<std::string> &input, const ConfigValues &values);
std::vector<std::unordered_map<std::string, std::string>>
generateCartesianValues(const ConfigValues &values);
std::vector<Command> interpolateValues(const std::vector<std::string> &raw,
const ConfigValues &values);

View File

@@ -17,48 +17,77 @@ namespace daggy {
return string;
}
std::vector<std::unordered_map<std::string, std::string>>
generateCartesianValues(const ConfigValues &values)
{
using ResultType =
std::vector<std::unordered_map<std::string, std::string>>;
ResultType result{{}};
for (const auto &[k, v] : values) {
if (std::holds_alternative<std::string>(v)) {
for (auto &valset : result) {
valset.emplace(k, std::get<std::string>(v));
}
}
else {
ResultType new_result;
for (const auto &val : std::get<std::vector<std::string>>(v)) {
for (auto valset : result) {
valset.emplace(k, val);
new_result.emplace_back(valset);
}
}
result.swap(new_result);
}
}
return result;
}
std::unordered_set<std::string> matchingParameters(
const std::vector<std::string> &input, const ConfigValues &values)
{
std::unordered_set<std::string> matchParams;
for (const auto &[k, v] : values) {
std::string pattern = "{{" + k + "}}";
bool anyMatched =
std::any_of(input.begin(), input.end(), [&](const auto &part) {
return part.find(pattern) != std::string::npos;
});
if (anyMatched)
matchParams.insert(k);
}
return matchParams;
}
std::vector<std::vector<std::string>> interpolateValues(
const std::vector<std::string> &raw, const ConfigValues &values)
{
std::vector<std::vector<std::string>> cooked{{}};
std::vector<std::vector<std::string>> cooked;
for (const auto &part : raw) {
std::vector<std::string> expandedPart{part};
auto matchParams = matchingParameters(raw, values);
if (matchParams.empty()) {
cooked.emplace_back(raw);
return cooked;
}
// Find all values of parameters, and expand them
for (const auto &[paramRaw, paramValue] : values) {
std::string param = "{{" + paramRaw + "}}";
auto pos = part.find(param);
if (pos == std::string::npos)
continue;
std::vector<std::string> newExpandedPart;
ConfigValues paramSubset;
for (const auto &[k, v] : values) {
if (matchParams.count(k) == 0)
continue;
paramSubset.emplace(k, v);
}
if (std::holds_alternative<std::string>(paramValue)) {
for (auto &cmd : expandedPart) {
newExpandedPart.push_back(
globalSub(cmd, param, std::get<std::string>(paramValue)));
}
}
else {
for (const auto &val :
std::get<std::vector<std::string>>(paramValue)) {
for (const auto &cmd : expandedPart) {
newExpandedPart.push_back(globalSub(cmd, param, val));
}
}
}
const auto valueSets = generateCartesianValues(paramSubset);
expandedPart.swap(newExpandedPart);
}
std::vector<std::vector<std::string>> newCommands;
for (const auto &newPart : expandedPart) {
for (auto cmd : cooked) {
cmd.push_back(newPart);
newCommands.emplace_back(cmd);
for (const auto &valueSet : valueSets) {
std::vector<std::string> item(raw);
for (auto &part : item) {
for (const auto &[k, v] : valueSet) {
part = globalSub(part, "{{" + k + "}}", v);
}
}
cooked.swap(newCommands);
cooked.emplace_back(item);
}
return cooked;
}

View File

@@ -8,6 +8,7 @@
#include "daggy/Serialization.hpp"
#include "daggy/Utilities.hpp"
#include "daggy/executors/task/NoopTaskExecutor.hpp"
TEST_CASE("string_utilities", "[utilities_string]")
{
@@ -16,7 +17,24 @@ TEST_CASE("string_utilities", "[utilities_string]")
REQUIRE(res == "/this/is/hello/test/hello");
}
TEST_CASE("string_expansion", "[utilities_parameter_expansion]")
TEST_CASE("generate_cart_values", "[cartesian_values]")
{
std::string testParams{
R"({"DATE": ["2021-05-06", "2021-05-07" ], "SOURCE": "name", "TYPE": ["a", "b", "c"]})"};
auto params = daggy::configFromJSON(testParams);
auto result = daggy::generateCartesianValues(params);
REQUIRE(result.size() == 6);
for (const auto& valset : result) {
REQUIRE(valset.size() == 3);
REQUIRE(valset.count("DATE") == 1);
REQUIRE(valset.count("SOURCE") == 1);
REQUIRE(valset.count("TYPE") == 1);
}
}
TEST_CASE("string_expansion", "[utilities][parameter_expansion]")
{
SECTION("Basic expansion")
{
@@ -30,6 +48,17 @@ TEST_CASE("string_expansion", "[utilities_parameter_expansion]")
REQUIRE(allCommands.size() == 6);
}
SECTION("No expansion")
{
std::string testParams{
R"({"DATE": ["2021-05-06", "2021-05-07" ], "SOURCE": "name", "TYPE": ["a", "b", "c"]})"};
auto params = daggy::configFromJSON(testParams);
std::vector<std::string> cmd{"/usr/bin/echo"};
auto allCommands = daggy::interpolateValues(cmd, params);
REQUIRE(allCommands.size() == 1);
}
SECTION("Skip over unused parameters")
{
std::string testParams{
@@ -54,3 +83,26 @@ TEST_CASE("string_expansion", "[utilities_parameter_expansion]")
REQUIRE(result.size() == 4);
}
}
TEST_CASE("expand_taskset", "[utilities][expand_taskset]")
{
daggy::executors::task::NoopTaskExecutor ex;
daggy::DAGSpec dagSpec;
std::string testParams{R"({"DATE": ["2021-05-06", "2021-05-07" ]})"};
dagSpec.taskConfig.variables = daggy::configFromJSON(testParams);
std::stringstream jsonTasks;
jsonTasks
<< R"({ "A": { "job": {"command": [ "/usr/bin/cat", "/etc/passwd"]} )"
<< R"(, "children": ["C"], "isGenerator": true},)"
<< R"("C": { "job": {"command": [ "/usr/bin/echo", "hello!"]} } })";
dagSpec.tasks = daggy::tasksFromJSON(jsonTasks.str());
REQUIRE(dagSpec.tasks.size() == 2);
REQUIRE(dagSpec.tasks["A"].children == std::unordered_set<std::string>{"C"});
dagSpec.tasks =
daggy::expandTaskSet(dagSpec.tasks, ex, dagSpec.taskConfig.variables);
REQUIRE(dagSpec.tasks.size() == 2);
REQUIRE(dagSpec.tasks["A_0"].children ==
std::unordered_set<std::string>{"C"});
}