2020-12-21 04:16:59 +00:00
|
|
|
#include <folly/Format.h>
|
2020-12-19 07:02:53 +00:00
|
|
|
#include <folly/String.h>
|
|
|
|
|
|
|
|
#include <fstream>
|
|
|
|
#include <functional>
|
|
|
|
#include <iostream>
|
|
|
|
#include <map>
|
|
|
|
#include <memory>
|
|
|
|
#include <numeric>
|
|
|
|
#include <optional>
|
2020-12-21 04:16:59 +00:00
|
|
|
#include <regex>
|
2020-12-19 07:02:53 +00:00
|
|
|
#include <string>
|
|
|
|
#include <vector>
|
|
|
|
|
2020-12-21 22:37:50 +00:00
|
|
|
constexpr auto RULE_DELIM = ":";
|
2020-12-19 07:02:53 +00:00
|
|
|
constexpr auto ALTERNATING_DELIM = " | ";
|
2020-12-21 23:05:26 +00:00
|
|
|
constexpr int NUM_RULE_11_CYCLES = 8;
|
|
|
|
|
2020-12-19 07:02:53 +00:00
|
|
|
class GrammarEntry;
|
|
|
|
using MultiGrammarEntry = std::vector<GrammarEntry>;
|
|
|
|
using AlternatableMultiGrammarEntry = std::vector<MultiGrammarEntry>;
|
|
|
|
|
2020-12-21 23:05:26 +00:00
|
|
|
/**
|
|
|
|
* An entry in the grammar. This can either be a layer of indirection to another entry (a lookup) or a grammar rule
|
|
|
|
* itself.
|
|
|
|
*/
|
2020-12-19 07:02:53 +00:00
|
|
|
class GrammarEntry {
|
|
|
|
public:
|
|
|
|
GrammarEntry(int index) : index(index), isThisALookup(true) {
|
|
|
|
}
|
|
|
|
|
|
|
|
GrammarEntry(char value) : value(value), isThisALookup(false) {
|
|
|
|
}
|
|
|
|
|
2020-12-21 23:05:26 +00:00
|
|
|
/**
|
|
|
|
* Checks whether or not this grammar rule is an indirection to another
|
|
|
|
*
|
|
|
|
* @return bool Whether or not thisg rammar ule is an indirection to another.
|
|
|
|
*/
|
2020-12-19 07:02:53 +00:00
|
|
|
bool isLookup() const {
|
|
|
|
return this->isThisALookup;
|
|
|
|
}
|
|
|
|
|
2020-12-21 23:05:26 +00:00
|
|
|
/**
|
|
|
|
* @return int The index of the rule that this looks up
|
|
|
|
*/
|
2020-12-19 07:02:53 +00:00
|
|
|
int getIndex() const {
|
2020-12-21 23:05:26 +00:00
|
|
|
if (!this->isLookup()) {
|
2020-12-19 07:02:53 +00:00
|
|
|
throw "Cannot get the index of a non-lookup";
|
|
|
|
}
|
|
|
|
|
|
|
|
return this->index;
|
|
|
|
}
|
|
|
|
|
2020-12-21 23:05:26 +00:00
|
|
|
/**
|
|
|
|
* Checks the value of this grammar rule, if it is not a lookup.
|
|
|
|
*
|
|
|
|
* @return The character that this grammar rule represents.
|
|
|
|
*/
|
2020-12-19 07:02:53 +00:00
|
|
|
char getValue() const {
|
|
|
|
if (isThisALookup) {
|
|
|
|
throw "Cannot get the value of a lookup";
|
|
|
|
}
|
|
|
|
|
|
|
|
return this->value;
|
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
|
|
|
int index;
|
|
|
|
char value;
|
|
|
|
bool isThisALookup;
|
|
|
|
};
|
|
|
|
|
|
|
|
std::vector<std::string> readInput(const std::string &filename) {
|
|
|
|
std::vector<std::string> input;
|
|
|
|
std::string line;
|
|
|
|
std::ifstream file(filename);
|
|
|
|
while (std::getline(file, line)) {
|
|
|
|
input.push_back(line);
|
|
|
|
}
|
|
|
|
|
|
|
|
return input;
|
|
|
|
}
|
|
|
|
|
2020-12-21 23:05:26 +00:00
|
|
|
/**
|
|
|
|
* Split the input into grammar and test strings
|
|
|
|
*
|
|
|
|
* @param input The puzzle input.
|
|
|
|
*
|
|
|
|
* @return std::pair<std::vector<std::string>, std::vector<std::string>> A pair of the puzzle grammar and the puzzle
|
|
|
|
* test strings
|
|
|
|
*/
|
2020-12-19 07:02:53 +00:00
|
|
|
std::pair<std::vector<std::string>, std::vector<std::string>> splitInput(const std::vector<std::string> &input) {
|
|
|
|
auto emptyLine = std::find(input.cbegin(), input.cend(), "");
|
|
|
|
auto beforeEmptyLine = std::vector<std::string>(input.cbegin(), emptyLine);
|
|
|
|
auto afterEmptyLine = std::vector<std::string>(emptyLine + 1, input.cend());
|
|
|
|
return std::pair<std::vector<std::string>, std::vector<std::string>>(
|
|
|
|
std::move(beforeEmptyLine), std::move(afterEmptyLine));
|
|
|
|
}
|
|
|
|
|
2020-12-21 23:05:26 +00:00
|
|
|
/**
|
|
|
|
* Convert a single pattern to a grammar entry
|
|
|
|
*
|
|
|
|
* @param rawPattern The pattern from the entry to parse.
|
|
|
|
*
|
|
|
|
* @return MultiGrammarEntry The grammar entry to parse, which is a vector of single entries, each element
|
|
|
|
* representating an alternation.
|
|
|
|
*/
|
2020-12-19 07:02:53 +00:00
|
|
|
MultiGrammarEntry parseSinglePattern(const std::string &rawPattern) {
|
|
|
|
std::vector<std::string> rawPatternComponents;
|
|
|
|
folly::split(" ", rawPattern, rawPatternComponents);
|
|
|
|
MultiGrammarEntry patternComponents;
|
|
|
|
std::transform(
|
|
|
|
rawPatternComponents.cbegin(),
|
|
|
|
rawPatternComponents.cend(),
|
|
|
|
std::back_inserter(patternComponents),
|
|
|
|
[](const std::string &rawComponent) {
|
|
|
|
if (rawComponent.at(0) == '"' && rawComponent.at(rawComponent.size() - 1) == '"') {
|
|
|
|
std::string component = rawComponent.substr(1, rawComponent.size() - 2);
|
|
|
|
if (component.size() != 1) {
|
|
|
|
throw std::invalid_argument("Base rule must be 1 char");
|
|
|
|
}
|
|
|
|
|
|
|
|
return GrammarEntry(component.at(0));
|
|
|
|
} else {
|
|
|
|
return GrammarEntry(std::stoi(rawComponent));
|
|
|
|
}
|
|
|
|
});
|
|
|
|
|
|
|
|
return patternComponents;
|
|
|
|
}
|
|
|
|
|
2020-12-21 23:05:26 +00:00
|
|
|
/**
|
|
|
|
* Parse the grammar part of the puzzle into a map of grammar entries.
|
|
|
|
*
|
|
|
|
* @param patterns The pattern from the entry to parse.
|
|
|
|
*
|
|
|
|
* @return std::unordered_multimap<int, MultiGrammarEntry> A map of grammar rule indices to grammar entries. Each
|
|
|
|
* element of the grammar entry vectors are alternations.
|
|
|
|
*/
|
2020-12-21 04:16:59 +00:00
|
|
|
std::unordered_multimap<int, MultiGrammarEntry> parseGrammar(const std::vector<std::string> &patterns) {
|
|
|
|
std::unordered_multimap<int, MultiGrammarEntry> grammar;
|
|
|
|
for (const std::string &patternLine : patterns) {
|
2020-12-21 22:37:50 +00:00
|
|
|
auto colonIndex = patternLine.find(RULE_DELIM);
|
2020-12-21 04:16:59 +00:00
|
|
|
std::string rawIndex = patternLine.substr(0, colonIndex);
|
|
|
|
int patternIndex = std::stoi(rawIndex);
|
|
|
|
std::vector<std::string> rawAlternations;
|
|
|
|
// An extra +1 on the colon index to get rid of the space after the colon
|
|
|
|
folly::split(ALTERNATING_DELIM, patternLine.substr(colonIndex + 2), rawAlternations);
|
|
|
|
|
|
|
|
std::transform(
|
|
|
|
rawAlternations.cbegin(),
|
|
|
|
rawAlternations.cend(),
|
|
|
|
std::inserter(grammar, grammar.end()),
|
|
|
|
[patternIndex](const std::string &pattern) {
|
|
|
|
return std::make_pair(patternIndex, parseSinglePattern(pattern));
|
|
|
|
});
|
|
|
|
}
|
2020-12-19 07:02:53 +00:00
|
|
|
|
|
|
|
return grammar;
|
|
|
|
}
|
|
|
|
|
2020-12-21 23:05:26 +00:00
|
|
|
/**
|
|
|
|
* Convert a grammar to a regular expression
|
|
|
|
*
|
|
|
|
* @param grammar The grammar for the puzzle
|
|
|
|
* @param rule The grammar rule to start the search at
|
|
|
|
*
|
|
|
|
* @return A regular expression for the puzzle input.
|
|
|
|
*/
|
|
|
|
std::string convertToRegularExpression(const std::unordered_multimap<int, MultiGrammarEntry> &grammar, int rule = 0) {
|
2020-12-21 04:16:59 +00:00
|
|
|
std::vector<std::string> expressions;
|
|
|
|
auto ruleIterators = grammar.equal_range(rule);
|
2020-12-21 22:37:50 +00:00
|
|
|
std::vector<std::pair<int, MultiGrammarEntry>> entries(ruleIterators.first, ruleIterators.second);
|
2020-12-21 04:16:59 +00:00
|
|
|
std::transform(
|
2020-12-21 22:37:50 +00:00
|
|
|
entries.cbegin(),
|
|
|
|
entries.cend(),
|
2020-12-21 04:16:59 +00:00
|
|
|
std::back_inserter(expressions),
|
2020-12-21 22:37:50 +00:00
|
|
|
[&grammar, rule](const std::pair<int, MultiGrammarEntry> &entry) {
|
2020-12-21 04:16:59 +00:00
|
|
|
MultiGrammarEntry alternative = entry.second;
|
2020-12-21 22:37:50 +00:00
|
|
|
std::string prefix;
|
2020-12-21 04:16:59 +00:00
|
|
|
std::string expression;
|
2020-12-21 22:37:50 +00:00
|
|
|
std::string suffixPrefix;
|
|
|
|
std::string suffix;
|
|
|
|
bool isNonRegularCycle = false;
|
2020-12-21 04:16:59 +00:00
|
|
|
for (const GrammarEntry &grammarEntry : alternative) {
|
2020-12-21 22:37:50 +00:00
|
|
|
if (!grammarEntry.isLookup()) {
|
2020-12-21 04:16:59 +00:00
|
|
|
expression += grammarEntry.getValue();
|
2020-12-21 22:37:50 +00:00
|
|
|
} else if (
|
|
|
|
grammarEntry.getIndex() == rule && alternative.back().isLookup() &&
|
|
|
|
rule == alternative.back().getIndex()) {
|
|
|
|
expression = folly::format("(?:{})+?", expression).str();
|
|
|
|
} else if (grammarEntry.getIndex() == rule) {
|
|
|
|
isNonRegularCycle = true;
|
|
|
|
// This grossness will be resolved when using a format string. We want to be able to replace this
|
|
|
|
// with a number later.
|
2020-12-21 23:05:26 +00:00
|
|
|
suffixPrefix = folly::format("(?:{}){{{{{{}}}}}}(?:", expression).str();
|
2020-12-21 22:37:50 +00:00
|
|
|
expression.clear();
|
2020-12-21 23:05:26 +00:00
|
|
|
suffix = "){{{}}}";
|
2020-12-21 22:37:50 +00:00
|
|
|
} else {
|
|
|
|
expression += convertToRegularExpression(grammar, grammarEntry.getIndex());
|
2020-12-21 04:16:59 +00:00
|
|
|
}
|
2020-12-19 07:02:53 +00:00
|
|
|
}
|
|
|
|
|
2020-12-21 22:37:50 +00:00
|
|
|
if (!isNonRegularCycle) {
|
|
|
|
return expression;
|
|
|
|
} else {
|
|
|
|
std::vector<std::string> fullSuffixElements;
|
2020-12-21 23:05:26 +00:00
|
|
|
// This is awful, but basically, checking for 31 11 42 is not posisble with a regular language, so we
|
|
|
|
// must check the possibilities of 1 of each, 2 of each, ... the value of NUM_RULE_11_CYCLES was picked
|
|
|
|
// arbitrarily because it works with my input.
|
|
|
|
for (int i = 1; i < NUM_RULE_11_CYCLES; i++) {
|
2020-12-21 22:37:50 +00:00
|
|
|
fullSuffixElements.push_back(
|
|
|
|
folly::format(suffixPrefix, i).str() + expression + folly::format(suffix, i).str());
|
|
|
|
}
|
|
|
|
|
2020-12-21 23:05:26 +00:00
|
|
|
return "(" + folly::join("|", fullSuffixElements) + ")";
|
2020-12-21 22:37:50 +00:00
|
|
|
}
|
2020-12-21 04:16:59 +00:00
|
|
|
});
|
2020-12-19 07:02:53 +00:00
|
|
|
|
2020-12-21 04:16:59 +00:00
|
|
|
if (expressions.size() == 1) {
|
|
|
|
return expressions.at(0);
|
|
|
|
} else {
|
2020-12-21 23:05:26 +00:00
|
|
|
// Create an alternation of all of the entries
|
2020-12-21 22:37:50 +00:00
|
|
|
return folly::format("(?:{})", folly::join("|", expressions)).str();
|
2020-12-19 07:02:53 +00:00
|
|
|
}
|
2020-12-21 04:16:59 +00:00
|
|
|
}
|
2020-12-19 07:02:53 +00:00
|
|
|
|
2020-12-21 23:05:26 +00:00
|
|
|
/**
|
|
|
|
* Get the number of times the grammar matches the test strings
|
|
|
|
*
|
|
|
|
* @param grammar The grammar to check against
|
|
|
|
* @param testStrings The strings to test if they match
|
|
|
|
*
|
|
|
|
* @returns int The number of test strings that match the grammar
|
|
|
|
*/
|
|
|
|
int getNumberOfMatches(
|
|
|
|
const std::unordered_multimap<int, MultiGrammarEntry> &grammar, const std::vector<std::string> &testStrings) {
|
|
|
|
std::regex inputRegex(convertToRegularExpression(grammar));
|
2020-12-21 22:37:50 +00:00
|
|
|
return std::count_if(testStrings.cbegin(), testStrings.cend(), [&inputRegex](const std::string &testString) {
|
|
|
|
std::smatch matches;
|
2020-12-21 23:05:26 +00:00
|
|
|
return std::regex_match(testString, matches, inputRegex);
|
2020-12-21 22:37:50 +00:00
|
|
|
});
|
2020-12-19 07:02:53 +00:00
|
|
|
}
|
|
|
|
|
2020-12-21 23:05:26 +00:00
|
|
|
int part1(const std::vector<std::string> &patterns, const std::vector<std::string> &testStrings) {
|
|
|
|
std::unordered_multimap<int, MultiGrammarEntry> grammar = parseGrammar(patterns);
|
|
|
|
return getNumberOfMatches(grammar, testStrings);
|
|
|
|
}
|
|
|
|
|
2020-12-21 22:37:50 +00:00
|
|
|
int part2(const std::vector<std::string> &patterns, const std::vector<std::string> &testStrings) {
|
2020-12-21 04:16:59 +00:00
|
|
|
std::unordered_multimap<int, MultiGrammarEntry> grammar = parseGrammar(patterns);
|
2020-12-21 22:37:50 +00:00
|
|
|
grammar.erase(8);
|
|
|
|
grammar.erase(11);
|
|
|
|
grammar.emplace(8, MultiGrammarEntry{GrammarEntry(42)});
|
|
|
|
grammar.emplace(8, MultiGrammarEntry{GrammarEntry(42), GrammarEntry(8)});
|
|
|
|
grammar.emplace(11, MultiGrammarEntry{GrammarEntry(42), GrammarEntry(31)});
|
|
|
|
grammar.emplace(11, MultiGrammarEntry{GrammarEntry(42), GrammarEntry(11), GrammarEntry(31)});
|
2020-12-21 23:05:26 +00:00
|
|
|
return getNumberOfMatches(grammar, testStrings);
|
2020-12-19 07:02:53 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
int main(int argc, char *argv[]) {
|
|
|
|
if (argc != 2) {
|
|
|
|
std::cerr << argv[0] << " <input_file>" << std::endl;
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
auto input = readInput(argv[1]);
|
|
|
|
auto parsedInput = splitInput(input);
|
|
|
|
|
2020-12-21 23:05:26 +00:00
|
|
|
std::cout << part1(parsedInput.first, parsedInput.second) << std::endl;
|
2020-12-21 22:37:50 +00:00
|
|
|
std::cout << part2(parsedInput.first, parsedInput.second) << std::endl;
|
2020-12-19 07:02:53 +00:00
|
|
|
}
|