taskwarrior/src/CLI2.cpp

1891 lines
61 KiB
C++

////////////////////////////////////////////////////////////////////////////////
//
// Copyright 2006 - 2021, Tomas Babej, Paul Beckingham, Federico Hernandez.
//
// Permission is hereby granted, free of charge, to any person obtaining a copy
// of this software and associated documentation files (the "Software"), to deal
// in the Software without restriction, including without limitation the rights
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
// copies of the Software, and to permit persons to whom the Software is
// furnished to do so, subject to the following conditions:
//
// The above copyright notice and this permission notice shall be included
// in all copies or substantial portions of the Software.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
// OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
// THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
// SOFTWARE.
//
// https://www.opensource.org/licenses/mit-license.php
//
////////////////////////////////////////////////////////////////////////////////
#include <cmake.h>
// cmake.h include header must come first
#include <CLI2.h>
#include <CmdCustom.h>
#include <CmdTimesheet.h>
#include <Color.h>
#include <Context.h>
#include <Lexer.h>
#include <format.h>
#include <shared.h>
#include <stdlib.h>
#include <utf8.h>
#include <algorithm>
#include <sstream>
// Overridden by rc.abbreviation.minimum.
int CLI2::minimumMatchLength = 3;
// Alias expansion limit. Any more indicates some kind of error.
static int safetyValveDefault = 10;
////////////////////////////////////////////////////////////////////////////////
A2::A2(const std::string& raw, Lexer::Type lextype) {
_lextype = lextype;
attribute("raw", raw);
}
////////////////////////////////////////////////////////////////////////////////
A2::A2(const A2& other) = default;
////////////////////////////////////////////////////////////////////////////////
A2& A2::operator=(const A2& other) = default;
////////////////////////////////////////////////////////////////////////////////
bool A2::hasTag(const std::string& tag) const {
return std::find(_tags.begin(), _tags.end(), tag) != _tags.end();
}
////////////////////////////////////////////////////////////////////////////////
void A2::tag(const std::string& tag) {
if (!hasTag(tag)) _tags.push_back(tag);
}
////////////////////////////////////////////////////////////////////////////////
void A2::unTag(const std::string& tag) {
for (auto i = _tags.begin(); i != _tags.end(); ++i)
if (*i == tag) {
_tags.erase(i);
break;
}
}
////////////////////////////////////////////////////////////////////////////////
// Accessor for attributes.
void A2::attribute(const std::string& name, const std::string& value) {
_attributes[name] = value;
if (name == "raw") decompose();
}
////////////////////////////////////////////////////////////////////////////////
// Accessor for attributes.
const std::string A2::attribute(const std::string& name) const {
// Prevent autovivification.
auto i = _attributes.find(name);
if (i != _attributes.end()) return i->second;
return "";
}
////////////////////////////////////////////////////////////////////////////////
const std::string A2::getToken() const {
auto i = _attributes.find("canonical");
if (i == _attributes.end()) i = _attributes.find("raw");
return i->second;
}
////////////////////////////////////////////////////////////////////////////////
void A2::decompose() {
if (_lextype == Lexer::Type::tag) {
std::string raw = _attributes["raw"];
attribute("name", raw.substr(1));
attribute("sign", raw.substr(0, 1));
}
else if (_lextype == Lexer::Type::substitution) {
// if (Directory (raw).exists ())
// return;
std::string from;
std::string to;
std::string flags;
if (Lexer::decomposeSubstitution(_attributes["raw"], from, to, flags)) {
attribute("from", from);
attribute("to", to);
attribute("flags", flags);
}
}
else if (_lextype == Lexer::Type::pair) {
std::string name;
std::string mod;
std::string sep;
std::string value;
if (Lexer::decomposePair(_attributes["raw"], name, mod, sep, value)) {
attribute("name", name);
attribute("modifier", mod);
attribute("separator", sep);
attribute("value", value);
if (name == "rc") {
if (mod != "")
tag("CONFIG");
else
tag("RC");
}
}
}
else if (_lextype == Lexer::Type::pattern) {
// if (Directory (raw).exists ())
// return;
std::string pattern;
std::string flags;
if (Lexer::decomposePattern(_attributes["raw"], pattern, flags)) {
attribute("pattern", pattern);
attribute("flags", flags);
}
}
}
////////////////////////////////////////////////////////////////////////////////
const std::string A2::dump() const {
auto output = Lexer::typeToString(_lextype);
// Dump attributes.
std::string atts;
for (const auto& a : _attributes) atts += a.first + "='\033[33m" + a.second + "\033[0m' ";
// Dump tags.
std::string tags;
for (const auto& tag : _tags) {
if (tag == "BINARY")
tags += "\033[1;37;44m" + tag + "\033[0m ";
else if (tag == "CMD")
tags += "\033[1;37;46m" + tag + "\033[0m ";
else if (tag == "FILTER")
tags += "\033[1;37;42m" + tag + "\033[0m ";
else if (tag == "MODIFICATION")
tags += "\033[1;37;43m" + tag + "\033[0m ";
else if (tag == "MISCELLANEOUS")
tags += "\033[1;37;45m" + tag + "\033[0m ";
else if (tag == "RC")
tags += "\033[1;37;41m" + tag + "\033[0m ";
else if (tag == "CONFIG")
tags += "\033[1;37;101m" + tag + "\033[0m ";
else if (tag == "?")
tags += "\033[38;5;255;48;5;232m" + tag + "\033[0m ";
else
tags += "\033[32m" + tag + "\033[0m ";
}
return output + ' ' + atts + tags;
}
////////////////////////////////////////////////////////////////////////////////
static const char* getValue(int argc, const char** argv, std::string arg) {
const auto is_arg = [&](std::string s) {
return s.size() > arg.size() + 1 && (s[arg.size()] == ':' || s[arg.size()] == '=') &&
s.compare(0, arg.size(), arg) == 0;
};
// find last argument before --
auto last = std::make_reverse_iterator(argv);
auto first = std::make_reverse_iterator(std::find(argv, argv + argc, std::string("--")));
auto it = std::find_if(first, last, is_arg);
if (it == last) return nullptr;
// return the string after : or =
return *it + arg.size() + 1;
}
////////////////////////////////////////////////////////////////////////////////
// Static method.
bool CLI2::getOverride(int argc, const char** argv, File& rc) {
const char* value = getValue(argc, argv, "rc");
if (value == nullptr) return false;
rc = File(value);
return true;
}
////////////////////////////////////////////////////////////////////////////////
// Look for CONFIG data.location and initialize a Path object.
// Static method.
bool CLI2::getDataLocation(int argc, const char** argv, Path& data) {
const char* value = getValue(argc, argv, "rc.data.location");
if (value == nullptr) {
std::string location = Context::getContext().config.get("data.location");
if (location != "") data = location;
return false;
}
data = Directory(value);
return true;
}
////////////////////////////////////////////////////////////////////////////////
// Static method.
void CLI2::applyOverrides(int argc, const char** argv) {
auto& context = Context::getContext();
auto last = std::find(argv, argv + argc, std::string("--"));
auto is_override = [](const std::string& s) { return s.compare(0, 3, "rc.") == 0; };
auto get_sep = [&](const std::string& s) {
if (is_override(s)) return s.find_first_of(":=", 3);
return std::string::npos;
};
auto override_settings = [&](std::string raw) {
auto sep = get_sep(raw);
if (sep == std::string::npos) return;
std::string name = raw.substr(3, sep - 3);
std::string value = raw.substr(sep + 1);
context.config.set(name, value);
};
auto display_overrides = [&](std::string raw) {
if (is_override(raw)) context.footnote(format("Configuration override {1}", raw));
};
std::for_each(argv, last, override_settings);
if (context.verbose("override")) std::for_each(argv, last, display_overrides);
}
////////////////////////////////////////////////////////////////////////////////
void CLI2::alias(const std::string& name, const std::string& value) { _aliases[name] = value; }
////////////////////////////////////////////////////////////////////////////////
void CLI2::entity(const std::string& category, const std::string& name) {
// Walk the list of entities for category.
auto c = _entities.equal_range(category);
for (auto e = c.first; e != c.second; ++e)
if (e->second == name) return;
// The category/name pair was not found, therefore add it.
_entities.emplace(category, name);
}
////////////////////////////////////////////////////////////////////////////////
// Capture a single argument.
void CLI2::add(const std::string& argument) {
A2 arg(Lexer::trim(argument), Lexer::Type::word);
arg.tag("ORIGINAL");
_original_args.push_back(arg);
// Adding a new argument invalidates prior analysis.
_args.clear();
}
////////////////////////////////////////////////////////////////////////////////
// Capture a set of arguments, inserted immediately after <offset> arguments
// after the binary..
void CLI2::add(const std::vector<std::string>& arguments, int offset /* = 0 */) {
std::vector<A2> replacement{_original_args.begin(), _original_args.begin() + offset + 1};
for (const auto& arg : arguments) replacement.emplace_back(arg, Lexer::Type::word);
for (unsigned int i = 1 + offset; i < _original_args.size(); ++i)
replacement.push_back(_original_args[i]);
_original_args = replacement;
// Adding a new argument invalidates prior analysis.
_args.clear();
}
////////////////////////////////////////////////////////////////////////////////
// Arg0 is the first argument, which is the name and potentially a relative or
// absolute path to the invoked binary.
//
// The binary name is 'task', but if the binary is reported as 'cal' or
// 'calendar' then it was invoked via symbolic link, in which case capture the
// first argument as 'calendar'.
void CLI2::handleArg0() {
// Capture arg0 separately, because it is the command that was run, and could
// need special handling.
auto raw = _original_args[0].attribute("raw");
A2 a(raw, Lexer::Type::word);
a.tag("BINARY");
std::string basename = "task";
auto slash = raw.rfind('/');
if (slash != std::string::npos) basename = raw.substr(slash + 1);
a.attribute("basename", basename);
if (basename == "cal" || basename == "calendar") {
_args.push_back(a);
A2 cal("calendar", Lexer::Type::word);
_args.push_back(cal);
} else {
_args.push_back(a);
}
}
////////////////////////////////////////////////////////////////////////////////
// All arguments must be individually and wholly recognized by the Lexer. Any
// argument not recognized is considered a Lexer::Type::word.
//
// As a side effect, tags all arguments after a terminator ('--') with
// TERMINATED.
void CLI2::lexArguments() {
// Note: Starts iterating at index 1, because ::handleArg0 has already
// processed it.
bool terminated = false;
for (unsigned int i = 1; i < _original_args.size(); ++i) {
bool quoted = Lexer::wasQuoted(_original_args[i].attribute("raw"));
// Process single-token arguments.
std::string lexeme;
Lexer::Type type;
Lexer lex(_original_args[i].attribute("raw"));
if (lex.token(lexeme, type) &&
(lex.isEOS() || // Token goes to EOS
(quoted && type == Lexer::Type::pair))) // Quoted pairs automatically go to EOS
{
if (!terminated && type == Lexer::Type::separator)
terminated = true;
else if (terminated)
type = Lexer::Type::word;
A2 a(_original_args[i].attribute("raw"), type);
if (terminated) a.tag("TERMINATED");
if (quoted) a.tag("QUOTED");
if (_original_args[i].hasTag("ORIGINAL")) a.tag("ORIGINAL");
_args.push_back(a);
}
// Process multiple-token arguments.
else {
const std::string quote = "'";
// Escape unescaped single quotes
std::string escaped = "";
// For performance reasons. The escaped string is as long as the original.
escaped.reserve(_original_args[i].attribute("raw").size());
std::string::size_type cursor = 0;
bool nextEscaped = false;
while (int num = utf8_next_char(_original_args[i].attribute("raw"), cursor)) {
std::string character = utf8_character(num);
if (!nextEscaped && (character == "\\"))
nextEscaped = true;
else {
if (character == quote && !nextEscaped) escaped += "\\";
nextEscaped = false;
}
escaped += character;
}
cursor = 0;
std::string word;
if (Lexer::readWord(quote + escaped + quote, quote, cursor, word)) {
Lexer::dequote(word);
A2 unknown(word, Lexer::Type::word);
if (lex.wasQuoted(_original_args[i].attribute("raw"))) unknown.tag("QUOTED");
if (_original_args[i].hasTag("ORIGINAL")) unknown.tag("ORIGINAL");
_args.push_back(unknown);
}
// This branch may have no use-case.
else {
A2 unknown(_original_args[i].attribute("raw"), Lexer::Type::word);
unknown.tag("UNKNOWN");
if (lex.wasQuoted(_original_args[i].attribute("raw"))) unknown.tag("QUOTED");
if (_original_args[i].hasTag("ORIGINAL")) unknown.tag("ORIGINAL");
_args.push_back(unknown);
}
}
}
if (Context::getContext().config.getInteger("debug.parser") >= 2)
Context::getContext().debug(dump("CLI2::analyze lexArguments"));
}
////////////////////////////////////////////////////////////////////////////////
// [1] Scan all args for the 'add' and 'log' commands, and demote any
// Lexer::Type::Tag args with sign '-' to Lexer::Type::word.
// [2] Convert any pseudo args name:value into config settings, and erase.
void CLI2::demotion() {
bool changes = false;
std::vector<A2> replacement;
std::string canonical;
for (auto& a : _args) {
if (a._lextype == Lexer::Type::tag && a.attribute("sign") == "-") {
std::string command = getCommand();
if (command == "add" || command == "log") {
a._lextype = Lexer::Type::word;
changes = true;
}
}
else if (a._lextype == Lexer::Type::pair &&
canonicalize(canonical, "pseudo", a.attribute("name"))) {
Context::getContext().config.set(canonical, a.attribute("value"));
changes = true;
// Equivalent to erasing 'a'.
continue;
}
replacement.push_back(a);
}
if (changes && Context::getContext().config.getInteger("debug.parser") >= 2)
Context::getContext().debug(dump("CLI2::analyze demotion"));
}
////////////////////////////////////////////////////////////////////////////////
// Intended to be called after ::add() to perform the final analysis.
void CLI2::analyze() {
if (Context::getContext().config.getInteger("debug.parser") >= 2)
Context::getContext().debug(dump("CLI2::analyze"));
// Process _original_args.
_args.clear();
handleArg0();
lexArguments();
// Process _args.
aliasExpansion();
if (!findCommand()) {
defaultCommand();
if (!findCommand()) throw std::string("You must specify a command or a task to modify.");
}
demotion();
canonicalizeNames();
// Determine arg types: FILTER, MODIFICATION, MISCELLANEOUS.
categorizeArgs();
parenthesizeOriginalFilter();
// Cache frequently looked up items
_command = getCommand();
}
////////////////////////////////////////////////////////////////////////////////
// Process raw filter string.
// Insert filter arguments (wrapped in parentheses) immediatelly after the binary.
void CLI2::addFilter(const std::string& arg) {
if (arg.length()) {
std::vector<std::string> filter;
filter.push_back("(");
std::string lexeme;
Lexer::Type type;
Lexer lex(arg);
while (lex.token(lexeme, type)) filter.push_back(lexeme);
filter.push_back(")");
add(filter);
analyze();
}
}
////////////////////////////////////////////////////////////////////////////////
// Process raw modification string.
// Insert modification arguments immediatelly after the command (i.e. 'add')
void CLI2::addModifications(const std::string& arg) {
if (arg.length()) {
std::vector<std::string> mods;
std::string lexeme;
Lexer::Type type;
Lexer lex(arg);
while (lex.token(lexeme, type)) mods.push_back(lexeme);
// Determine at which argument index does the task modification command
// reside
unsigned int cmdIndex = 0;
for (; cmdIndex < _args.size(); ++cmdIndex) {
// Command found, stop iterating.
if (_args[cmdIndex].hasTag("CMD")) break;
}
// Insert modifications after the command.
add(mods, cmdIndex);
analyze();
}
}
////////////////////////////////////////////////////////////////////////////////
// There are situations where a context filter is applied. This method
// determines whether one applies, and if so, applies it. Disqualifiers include:
// - filter contains ID or UUID
void CLI2::addContext(bool readable, bool writeable) {
// Recursion block.
if (_context_added) return;
// Detect if any context is set, and bail out if not
std::string contextString;
if (readable)
// Empty string is treated as "currently selected context"
contextString = Context::getContext().getTaskContext("read", "");
else if (writeable)
contextString = Context::getContext().getTaskContext("write", "");
else
return;
// If context is empty, bail out too
if (contextString.empty()) return;
// For readable contexts: Detect if UUID or ID is set, and bail out
if (readable)
for (auto& a : _args) {
if (a._lextype == Lexer::Type::uuid || a._lextype == Lexer::Type::number ||
a._lextype == Lexer::Type::set) {
Context::getContext().debug(
format("UUID/ID argument found '{1}', not applying context.", a.attribute("raw")));
return;
}
}
// Apply the context. Readable (filtering) takes precedence. Also set the
// block now, since addFilter calls analyze(), which calls addContext().
_context_added = true;
if (readable)
addFilter(contextString);
else if (writeable)
addModifications(contextString);
// Inform the user about the application of context
if (Context::getContext().verbose("context"))
Context::getContext().footnote(format("Context '{1}' set. Use 'task context none' to remove.",
Context::getContext().config.get("context")));
}
////////////////////////////////////////////////////////////////////////////////
// Parse the command line, identifiying filter components, expanding syntactic
// sugar as necessary.
void CLI2::prepareFilter() {
// Clear and re-populate.
_id_ranges.clear();
_uuid_list.clear();
_context_added = false;
// Remove all the syntactic sugar for FILTERs.
lexFilterArgs();
findIDs();
findUUIDs();
insertIDExpr();
desugarFilterPlainArgs();
findStrayModifications();
desugarFilterTags();
desugarFilterAttributes();
desugarFilterPatterns();
insertJunctions(); // Deliberately after all desugar calls.
if (Context::getContext().verbose("filter")) {
std::string combined;
for (const auto& a : _args) {
if (a.hasTag("FILTER")) {
if (combined != "") combined += ' ';
combined += a.attribute("raw");
}
}
if (combined.size()) Context::getContext().footnote(std::string("Filter: ") + combined);
}
}
////////////////////////////////////////////////////////////////////////////////
// Return all the MISCELLANEOUS args as strings.
const std::vector<std::string> CLI2::getWords() {
std::vector<std::string> words;
for (const auto& a : _args)
if (a.hasTag("MISCELLANEOUS")) words.push_back(a.attribute("raw"));
if (Context::getContext().config.getInteger("debug.parser") >= 2) {
Color colorOrigArgs("gray10 on gray4");
std::string message = " ";
for (const auto& word : words) message += colorOrigArgs.colorize(word) + ' ';
Context::getContext().debug("CLI2::getWords" + message);
}
return words;
}
////////////////////////////////////////////////////////////////////////////////
// Return all the MISCELLANEOUS args.
const std::vector<A2> CLI2::getMiscellaneous() {
std::vector<A2> misc;
for (const auto& a : _args)
if (a.hasTag("MISCELLANEOUS")) misc.push_back(a);
return misc;
}
////////////////////////////////////////////////////////////////////////////////
// Search for 'value' in _entities category, return canonicalized value.
bool CLI2::canonicalize(std::string& canonicalized, const std::string& category,
const std::string& value) {
// Utilize a cache mapping of (category, value) -> canonicalized value.
// This cache does not need to be invalidated, because entities are defined
// only once per initialization of the Context object.
int cache_key = 31 * std::hash<std::string>{}(category) + std::hash<std::string>{}(value);
auto cache_result = _canonical_cache.find(cache_key);
if (cache_result != _canonical_cache.end()) {
canonicalized = cache_result->second;
return true;
}
// Extract a list of entities for category.
std::vector<std::string> options;
auto c = _entities.equal_range(category);
for (auto e = c.first; e != c.second; ++e) {
// Shortcut: if an exact match is found, success.
if (value == e->second) {
canonicalized = value;
_canonical_cache[cache_key] = value;
return true;
}
options.push_back(e->second);
}
// Match against the options, throw away results.
std::vector<std::string> matches;
if (autoComplete(value, options, matches, minimumMatchLength) == 1) {
canonicalized = matches[0];
_canonical_cache[cache_key] = matches[0];
return true;
}
return false;
}
////////////////////////////////////////////////////////////////////////////////
std::string CLI2::getBinary() const {
if (_args.size()) return _args[0].attribute("raw");
return "";
}
////////////////////////////////////////////////////////////////////////////////
std::string CLI2::getCommand(bool canonical) const {
// Shortcut if analysis has been finalized
if (_command != "") return _command;
for (const auto& a : _args)
if (a.hasTag("CMD")) return a.attribute(canonical ? "canonical" : "raw");
return "";
}
////////////////////////////////////////////////////////////////////////////////
const std::string CLI2::dump(const std::string& title) const {
std::stringstream out;
out << "\033[1m" << title << "\033[0m\n"
<< " _original_args\n ";
Color colorArgs("gray10 on gray4");
Color colorFilter("black on rgb311");
for (auto i = _original_args.begin(); i != _original_args.end(); ++i) {
if (i != _original_args.begin()) out << ' ';
if (i->hasTag("ORIGINAL"))
out << colorArgs.colorize(i->attribute("raw"));
else
out << colorFilter.colorize(i->attribute("raw"));
}
out << '\n';
if (_args.size()) {
out << " _args\n";
for (const auto& a : _args) out << " " << a.dump() << '\n';
}
if (_id_ranges.size()) {
out << " _id_ranges\n ";
for (const auto& range : _id_ranges) {
if (range.first != range.second)
out << colorArgs.colorize(range.first + "-" + range.second) << ' ';
else
out << colorArgs.colorize(range.first) << ' ';
}
out << '\n';
}
if (_uuid_list.size()) {
out << " _uuid_list\n ";
for (const auto& uuid : _uuid_list) out << colorArgs.colorize(uuid) << ' ';
out << '\n';
}
return out.str();
}
////////////////////////////////////////////////////////////////////////////////
// If any aliases are found in un-TERMINATED arguments, replace the alias with
// a set of Lexed tokens from the configuration.
void CLI2::aliasExpansion() {
bool changes = false;
bool action;
int counter = 0;
do {
action = false;
std::vector<A2> reconstructed;
std::string raw;
for (const auto& i : _args) {
raw = i.attribute("raw");
if (i.hasTag("TERMINATED")) {
reconstructed.push_back(i);
} else if (_aliases.find(raw) != _aliases.end()) {
std::string lexeme;
Lexer::Type type;
Lexer lex(_aliases[raw]);
while (lex.token(lexeme, type)) reconstructed.emplace_back(lexeme, type);
action = true;
changes = true;
} else {
reconstructed.push_back(i);
}
}
_args = reconstructed;
std::vector<A2> reconstructedOriginals;
bool terminated = false;
for (const auto& i : _original_args) {
if (i.attribute("raw") == "--") terminated = true;
if (terminated) {
reconstructedOriginals.push_back(i);
} else if (_aliases.find(i.attribute("raw")) != _aliases.end()) {
std::string lexeme;
Lexer::Type type;
Lexer lex(_aliases[i.attribute("raw")]);
while (lex.token(lexeme, type)) reconstructedOriginals.emplace_back(lexeme, type);
action = true;
changes = true;
} else {
reconstructedOriginals.push_back(i);
}
}
_original_args = reconstructedOriginals;
} while (action && counter++ < safetyValveDefault);
if (counter >= safetyValveDefault)
Context::getContext().debug(format("Nested alias limit of {1} reached.", safetyValveDefault));
if (changes && Context::getContext().config.getInteger("debug.parser") >= 2)
Context::getContext().debug(dump("CLI2::analyze aliasExpansion"));
}
////////////////////////////////////////////////////////////////////////////////
// Scan all arguments and canonicalize names that need it.
void CLI2::canonicalizeNames() {
bool changes = false;
for (auto& a : _args) {
if (a._lextype == Lexer::Type::pair) {
std::string raw = a.attribute("raw");
if (raw.substr(0, 3) != "rc:" && raw.substr(0, 3) != "rc.") {
std::string name = a.attribute("name");
std::string canonical;
if (canonicalize(canonical, "pseudo", name) || canonicalize(canonical, "attribute", name)) {
a.attribute("canonical", canonical);
} else {
a._lextype = Lexer::Type::word;
}
changes = true;
}
}
}
if (changes && Context::getContext().config.getInteger("debug.parser") >= 2)
Context::getContext().debug(dump("CLI2::analyze canonicalizeNames"));
}
////////////////////////////////////////////////////////////////////////////////
// Categorize FILTER, MODIFICATION and MISCELLANEOUS args, based on CMD DNA.
void CLI2::categorizeArgs() {
// Context is only applied for commands that request it.
std::string command = getCommand();
Command* cmd = Context::getContext().commands[command];
// Determine if the command uses Context. CmdCustom and CmdTimesheet need to
// be handled separately, as they override the parent Command::use_context
// method, and this is a pointer to Command class.
//
// All Command classes overriding uses_context () getter need to be specified
// here.
bool uses_context;
if (dynamic_cast<CmdCustom*>(cmd))
uses_context = (dynamic_cast<CmdCustom*>(cmd))->uses_context();
else if (dynamic_cast<CmdTimesheet*>(cmd))
uses_context = (dynamic_cast<CmdTimesheet*>(cmd))->uses_context();
else if (cmd)
uses_context = cmd->uses_context();
// Apply the context, if applicable
if (cmd && uses_context) addContext(cmd->accepts_filter(), cmd->accepts_modifications());
bool changes = false;
bool afterCommand = false;
for (auto& a : _args) {
if (a._lextype == Lexer::Type::separator) continue;
// Record that the command has been found, it affects behavior.
if (a.hasTag("CMD")) {
afterCommand = true;
}
// Skip admin args.
else if (a.hasTag("BINARY") || a.hasTag("RC") || a.hasTag("CONFIG")) {
// NOP.
}
// All combinations, with all 8 cases handled below.:
//
// -- -- -- Error: found an arg, but none expected
// -- -- Mi task [Mi] <cmd> [Mi]
// -- Mo -- task [Mo] <cmd> [Mo]
// -- Mo Mi Internally inconsistent
// Fi -- -- task [Fi] <cmd> [Fi]
// Fi -- Mi task [Fi] <cmd> [Mi]
// Fi Mo -- task [Fi] <cmd> [Mo]
// Fi Mo Mi Internally inconsistent
//
else if (cmd && !cmd->accepts_filter() && !cmd->accepts_modifications() &&
!cmd->accepts_miscellaneous()) {
// No commands were expected --> error.
throw format("The '{1}' command does not allow '{2}'.", command, a.attribute("raw"));
} else if (cmd && !cmd->accepts_filter() && !cmd->accepts_modifications() &&
cmd->accepts_miscellaneous()) {
a.tag("MISCELLANEOUS");
changes = true;
} else if (cmd && !cmd->accepts_filter() && cmd->accepts_modifications() &&
!cmd->accepts_miscellaneous()) {
a.tag("MODIFICATION");
changes = true;
} else if (cmd && !cmd->accepts_filter() && cmd->accepts_modifications() &&
cmd->accepts_miscellaneous()) {
// Error: internally inconsistent.
throw std::string("Unknown error. Please report.");
} else if (cmd && cmd->accepts_filter() && !cmd->accepts_modifications() &&
!cmd->accepts_miscellaneous()) {
a.tag("FILTER");
changes = true;
} else if (cmd && cmd->accepts_filter() && !cmd->accepts_modifications() &&
cmd->accepts_miscellaneous()) {
if (!afterCommand)
a.tag("FILTER");
else
a.tag("MISCELLANEOUS");
changes = true;
} else if (cmd && cmd->accepts_filter() && cmd->accepts_modifications() &&
!cmd->accepts_miscellaneous()) {
if (!afterCommand)
a.tag("FILTER");
else
a.tag("MODIFICATION");
changes = true;
} else if (cmd && cmd->accepts_filter() && cmd->accepts_modifications() &&
cmd->accepts_miscellaneous()) {
// Error: internally inconsistent.
throw std::string("Unknown error. Please report.");
}
}
if (changes && Context::getContext().config.getInteger("debug.parser") >= 2)
Context::getContext().debug(dump("CLI2::analyze categorizeArgs"));
}
////////////////////////////////////////////////////////////////////////////////
// The following command:
//
// task +home or +work list
//
// Is reasonable, and does not work unless the filter is parenthesized. Ignoring
// context, the 'list' report has a filter, which is inserted at the beginning
// like this:
//
// task ( status:pending ) +home or +work list
//
// Parenthesizing the user-provided (original) filter yields this:
//
// task ( status:pending ) ( +home or +work ) list
//
// And when the conjunction is added:
//
// task ( status:pending ) and ( +home or +work ) list
//
// the query is correct.
void CLI2::parenthesizeOriginalFilter() {
// Locate the first and last ORIGINAL FILTER args.
unsigned int firstOriginalFilter = 0;
unsigned int lastOriginalFilter = 0;
for (unsigned int i = 1; i < _args.size(); ++i) {
if (_args[i].hasTag("FILTER") && _args[i].hasTag("ORIGINAL")) {
if (firstOriginalFilter == 0) firstOriginalFilter = i;
lastOriginalFilter = i;
}
}
// If found, parenthesize the arg list accordingly.
if (firstOriginalFilter && lastOriginalFilter) {
std::vector<A2> reconstructed;
for (unsigned int i = 0; i < _args.size(); ++i) {
if (i == firstOriginalFilter) {
A2 openParen("(", Lexer::Type::op);
openParen.tag("ORIGINAL");
openParen.tag("FILTER");
reconstructed.push_back(openParen);
}
reconstructed.push_back(_args[i]);
if (i == lastOriginalFilter) {
A2 closeParen(")", Lexer::Type::op);
closeParen.tag("ORIGINAL");
closeParen.tag("FILTER");
reconstructed.push_back(closeParen);
}
}
_args = reconstructed;
if (Context::getContext().config.getInteger("debug.parser") >= 2)
Context::getContext().debug(dump("CLI2::analyze parenthesizeOriginalFilter"));
}
}
////////////////////////////////////////////////////////////////////////////////
// Scan all arguments and if any are an exact match for a command name, then
// tag as CMD. If an argument is an exact match for an attribute, despite being
// an inexact match for a command, then it is not a command.
bool CLI2::findCommand() {
for (auto& a : _args) {
std::string raw = a.attribute("raw");
std::string canonical;
// If the arg canonicalized to a 'cmd', but is also not an exact match
// for an 'attribute', proceed. Example:
// task project=foo list
// ^cmd ^cmd
// ^attribute
if (exactMatch("cmd", raw))
canonical = raw;
else if (exactMatch("attribute", raw))
continue;
else if (!canonicalize(canonical, "cmd", raw))
continue;
a.attribute("canonical", canonical);
a.tag("CMD");
// Apply command DNA as tags.
Command* command = Context::getContext().commands[canonical];
if (command->read_only()) a.tag("READONLY");
if (command->displays_id()) a.tag("SHOWSID");
if (command->needs_gc()) a.tag("RUNSGC");
if (command->uses_context()) a.tag("USESCONTEXT");
if (command->accepts_filter()) a.tag("ALLOWSFILTER");
if (command->accepts_modifications()) a.tag("ALLOWSMODIFICATIONS");
if (command->accepts_miscellaneous()) a.tag("ALLOWSMISC");
if (Context::getContext().config.getInteger("debug.parser") >= 2)
Context::getContext().debug(dump("CLI2::analyze findCommand"));
// Stop and indicate command found.
return true;
}
// Indicate command not found.
return false;
}
////////////////////////////////////////////////////////////////////////////////
// Search for exact 'value' in _entities category.
bool CLI2::exactMatch(const std::string& category, const std::string& value) const {
// Extract a list of entities for category.
auto c = _entities.equal_range(category);
for (auto e = c.first; e != c.second; ++e)
if (value == e->second) return true;
return false;
}
////////////////////////////////////////////////////////////////////////////////
// +tag --> tags _hastag_ tag
// -tag --> tags _notag_ tag
void CLI2::desugarFilterTags() {
bool changes = false;
std::vector<A2> reconstructed;
for (const auto& a : _args) {
if (a._lextype == Lexer::Type::tag && a.hasTag("FILTER")) {
changes = true;
A2 left("tags", Lexer::Type::dom);
left.tag("FILTER");
reconstructed.push_back(left);
std::string raw = a.attribute("raw");
A2 op(raw[0] == '+' ? "_hastag_" : "_notag_", Lexer::Type::op);
op.tag("FILTER");
reconstructed.push_back(op);
A2 right("" + raw.substr(1) + "", Lexer::Type::string);
right.tag("FILTER");
reconstructed.push_back(right);
} else
reconstructed.push_back(a);
}
if (changes) {
_args = reconstructed;
if (Context::getContext().config.getInteger("debug.parser") >= 2)
Context::getContext().debug(dump("CLI2::prepareFilter desugarFilterTags"));
}
}
////////////////////////////////////////////////////////////////////////////////
void CLI2::findStrayModifications() {
bool changes = false;
auto command = getCommand();
if (command == "add" || command == "log") {
for (auto& a : _args) {
if (a.hasTag("FILTER")) {
a.unTag("FILTER");
a.tag("MODIFICATION");
changes = true;
}
}
}
if (changes)
if (Context::getContext().config.getInteger("debug.parser") >= 2)
Context::getContext().debug(dump("CLI2::prepareFilter findStrayModifications"));
}
////////////////////////////////////////////////////////////////////////////////
// <name>[.<mod>]:['"][<value>]['"] --> name <op> value
void CLI2::desugarFilterAttributes() {
bool changes = false;
std::vector<A2> reconstructed;
for (auto& a : _args) {
if (a._lextype == Lexer::Type::pair && a.hasTag("FILTER")) {
std::string raw = a.attribute("raw");
std::string name = a.attribute("name");
std::string mod = a.attribute("modifier");
std::string sep = a.attribute("separator");
std::string value = a.attribute("value");
// An unquoted string, while equivalent to an empty string, doesn't cause
// an operand shortage in eval.
if (value == "") value = "''";
// Some values are expressions, which need to be lexed. The best way to
// determine whether an expression is either a single value, or needs to
// be lexed, is to lex it and count the tokens. For example:
// now+1d
// This should be lexed and surrounded by parentheses:
// (
// now
// +
// 1d
// )
// Use this sequence in place of a single value.
std::vector<A2> values = lexExpression(value);
if (Context::getContext().config.getInteger("debug.parser") >= 2) {
Context::getContext().debug("CLI2::lexExpression " + name + ':' + value);
for (auto& v : values) Context::getContext().debug(" " + v.dump());
Context::getContext().debug(" ");
}
bool found = false;
std::string canonical;
if (canonicalize(canonical, "attribute", name)) {
// Certain attribute types do not suport math.
// string --> no
// numeric --> yes
// date --> yes
// duration --> yes
bool evalSupported = true;
Column* col = Context::getContext().columns[canonical];
if (col && col->type() == "string") evalSupported = false;
A2 lhs(name, Lexer::Type::dom);
lhs.tag("FILTER");
lhs.attribute("canonical", canonical);
lhs.attribute("modifier", mod);
A2 op("", Lexer::Type::op);
op.tag("FILTER");
// Attribute types that do not support evaluation should be interpreted
// as strings (currently this means that string attributes are not evaluated)
A2 rhs("", evalSupported ? values[0]._lextype : Lexer::Type::string);
rhs.tag("FILTER");
// Special case for '<name>:<value>'.
if (mod == "") {
op.attribute("raw", "=");
rhs.attribute("raw", value);
} else if (mod == "before" || mod == "under" || mod == "below") {
op.attribute("raw", "<");
rhs.attribute("raw", value);
} else if (mod == "after" || mod == "over" || mod == "above") {
op.attribute("raw", ">");
rhs.attribute("raw", value);
} else if (mod == "by") {
op.attribute("raw", "<=");
rhs.attribute("raw", value);
} else if (mod == "none") {
op.attribute("raw", "==");
rhs.attribute("raw", "''");
} else if (mod == "any") {
op.attribute("raw", "!==");
rhs.attribute("raw", "''");
} else if (mod == "is" || mod == "equals") {
op.attribute("raw", "==");
rhs.attribute("raw", value);
} else if (mod == "not") {
op.attribute("raw", "!=");
rhs.attribute("raw", value);
} else if (mod == "isnt") {
op.attribute("raw", "!==");
rhs.attribute("raw", value);
} else if (mod == "has" || mod == "contains") {
op.attribute("raw", "~");
rhs.attribute("raw", value);
} else if (mod == "hasnt") {
op.attribute("raw", "!~");
rhs.attribute("raw", value);
} else if (mod == "startswith" || mod == "left") {
op.attribute("raw", "~");
rhs.attribute("raw", "^" + value);
} else if (mod == "endswith" || mod == "right") {
op.attribute("raw", "~");
rhs.attribute("raw", value + "$");
} else if (mod == "word") {
op.attribute("raw", "~");
#if defined(DARWIN)
rhs.attribute("raw", value);
#elif defined(SOLARIS)
rhs.attribute("raw", "\\<" + value + "\\>");
#else
rhs.attribute("raw", "\\b" + value + "\\b");
#endif
} else if (mod == "noword") {
op.attribute("raw", "!~");
#if defined(DARWIN)
rhs.attribute("raw", value);
#elif defined(SOLARIS)
rhs.attribute("raw", "\\<" + value + "\\>");
#else
rhs.attribute("raw", "\\b" + value + "\\b");
#endif
} else
throw format("Error: unrecognized attribute modifier '{1}'.", mod);
reconstructed.push_back(lhs);
reconstructed.push_back(op);
// Do not modify this construct without full understanding.
// Getting this wrong breaks a whole lot of filtering tests.
if (evalSupported) {
for (auto& v : values) reconstructed.push_back(v);
} else if (Lexer::isDOM(rhs.attribute("raw"))) {
rhs._lextype = Lexer::Type::dom;
reconstructed.push_back(rhs);
} else {
reconstructed.push_back(rhs);
}
found = true;
}
// If the name does not canonicalize to either an attribute or a UDA
// then it is not a recognized Lexer::Type::pair, so downgrade it to
// Lexer::Type::word.
else {
a._lextype = Lexer::Type::word;
}
if (found)
changes = true;
else
reconstructed.push_back(a);
}
// Not a FILTER pair.
else
reconstructed.push_back(a);
}
if (changes) {
_args = reconstructed;
if (Context::getContext().config.getInteger("debug.parser") >= 2)
Context::getContext().debug(dump("CLI2::prepareFilter desugarFilterAttributes"));
}
}
////////////////////////////////////////////////////////////////////////////////
// /pattern/ --> description ~ 'pattern'
void CLI2::desugarFilterPatterns() {
bool changes = false;
std::vector<A2> reconstructed;
for (const auto& a : _args) {
if (a._lextype == Lexer::Type::pattern && a.hasTag("FILTER")) {
changes = true;
A2 lhs("description", Lexer::Type::dom);
lhs.tag("FILTER");
reconstructed.push_back(lhs);
A2 op("~", Lexer::Type::op);
op.tag("FILTER");
reconstructed.push_back(op);
A2 rhs(a.attribute("pattern"), Lexer::Type::string);
rhs.attribute("flags", a.attribute("flags"));
rhs.tag("FILTER");
reconstructed.push_back(rhs);
} else
reconstructed.push_back(a);
}
if (changes) {
_args = reconstructed;
if (Context::getContext().config.getInteger("debug.parser") >= 2)
Context::getContext().debug(dump("CLI2::prepareFilter desugarFilterPatterns"));
}
}
////////////////////////////////////////////////////////////////////////////////
// An ID sequence can be:
//
// a single ID: 1
// a list of IDs: 1,3,5
// a list of IDs: 1 3 5
// a range: 5-10
// or a combination: 1,3,5-10 12
//
void CLI2::findIDs() {
bool changes = false;
if (Context::getContext().config.getBoolean("sugar")) {
bool previousFilterArgWasAnOperator = false;
int filterCount = 0;
for (const auto& a : _args) {
if (a.hasTag("FILTER")) {
++filterCount;
if (a._lextype == Lexer::Type::number) {
// Skip any number that was preceded by an operator.
if (!previousFilterArgWasAnOperator) {
changes = true;
std::string number = a.attribute("raw");
_id_ranges.emplace_back(number, number);
}
} else if (a._lextype == Lexer::Type::set) {
// Split the ID list into elements.
auto elements = split(a.attribute("raw"), ',');
for (auto& element : elements) {
changes = true;
auto hyphen = element.find('-');
if (hyphen != std::string::npos)
_id_ranges.emplace_back(element.substr(0, hyphen), element.substr(hyphen + 1));
else
_id_ranges.emplace_back(element, element);
}
}
std::string raw = a.attribute("raw");
previousFilterArgWasAnOperator =
(a._lextype == Lexer::Type::op && raw != "(" && raw != ")") ? true : false;
}
}
// If no IDs were found, and no filter was specified, look for number/set
// listed as a MODIFICATION.
std::string command = getCommand();
if (!_id_ranges.size() && filterCount == 0 && command != "add" && command != "log") {
for (auto& a : _args) {
if (a.hasTag("MODIFICATION")) {
std::string raw = a.attribute("raw");
// For a number to be an ID, it must not contain any sign or floating
// point elements.
if (a._lextype == Lexer::Type::number && raw.find('.') == std::string::npos &&
raw.find('e') == std::string::npos && raw.find('-') == std::string::npos) {
changes = true;
a.unTag("MODIFICATION");
a.tag("FILTER");
_id_ranges.emplace_back(raw, raw);
} else if (a._lextype == Lexer::Type::set) {
a.unTag("MODIFICATION");
a.tag("FILTER");
// Split the ID list into elements.
auto elements = split(raw, ',');
for (const auto& element : elements) {
changes = true;
auto hyphen = element.find('-');
if (hyphen != std::string::npos)
_id_ranges.emplace_back(element.substr(0, hyphen), element.substr(hyphen + 1));
else
_id_ranges.emplace_back(element, element);
}
}
}
}
}
}
// Sugar-free.
else {
std::vector<A2> reconstructed;
for (const auto& a : _args) {
if (a.hasTag("FILTER") && a._lextype == Lexer::Type::number) {
changes = true;
A2 pair("id:" + a.attribute("raw"), Lexer::Type::pair);
pair.tag("FILTER");
pair.decompose();
reconstructed.push_back(pair);
} else
reconstructed.push_back(a);
}
if (changes) _args = reconstructed;
}
if (changes)
if (Context::getContext().config.getInteger("debug.parser") >= 2)
Context::getContext().debug(dump("CLI2::prepareFilter findIDs"));
}
////////////////////////////////////////////////////////////////////////////////
void CLI2::findUUIDs() {
bool changes = false;
if (Context::getContext().config.getBoolean("sugar")) {
for (const auto& a : _args) {
if (a._lextype == Lexer::Type::uuid && a.hasTag("FILTER")) {
changes = true;
_uuid_list.push_back(a.attribute("raw"));
}
}
if (!_uuid_list.size()) {
for (auto& a : _args) {
if (a._lextype == Lexer::Type::uuid && a.hasTag("MODIFICATION")) {
changes = true;
a.unTag("MODIFICATION");
a.tag("FILTER");
_uuid_list.push_back(a.attribute("raw"));
}
}
}
}
// Sugar-free.
else {
std::vector<A2> reconstructed;
for (const auto& a : _args) {
if (a.hasTag("FILTER") && a._lextype == Lexer::Type::uuid) {
changes = true;
A2 pair("uuid:" + a.attribute("raw"), Lexer::Type::pair);
pair.tag("FILTER");
pair.decompose();
reconstructed.push_back(pair);
} else
reconstructed.push_back(a);
}
if (changes) _args = reconstructed;
}
if (changes)
if (Context::getContext().config.getInteger("debug.parser") >= 2)
Context::getContext().debug(dump("CLI2::prepareFilter findUUIDs"));
}
////////////////////////////////////////////////////////////////////////////////
void CLI2::insertIDExpr() {
// Skip completely if no ID/UUID was found. This is because below, '(' and ')'
// are inserted regardless of list size.
if (!_id_ranges.size() && !_uuid_list.size()) return;
// Find the *first* occurence of lexer type set/number/uuid, and replace it
// with a synthesized expression. All other occurences are eaten.
bool changes = false;
bool foundID = false;
std::vector<A2> reconstructed;
for (const auto& a : _args) {
if ((a._lextype == Lexer::Type::set || a._lextype == Lexer::Type::number ||
a._lextype == Lexer::Type::uuid) &&
a.hasTag("FILTER")) {
if (!foundID) {
foundID = true;
changes = true;
// Construct a single sequence that represents all _id_ranges and
// _uuid_list in one clause. This is essentially converting this:
//
// 1,2-3 uuid,uuid uuid 4
//
// into:
//
// (
// ( id == 1 )
// or ( ( id >= 2 ) and ( id <= 3 ) )
// or ( id == 4 )
// or ( uuid = $UUID )
// or ( uuid = $UUID )
// )
// Building block operators.
A2 openParen("(", Lexer::Type::op);
openParen.tag("FILTER");
A2 closeParen(")", Lexer::Type::op);
closeParen.tag("FILTER");
A2 opOr("or", Lexer::Type::op);
opOr.tag("FILTER");
A2 opAnd("and", Lexer::Type::op);
opAnd.tag("FILTER");
A2 opSimilar("=", Lexer::Type::op);
opSimilar.tag("FILTER");
A2 opEqual("==", Lexer::Type::op);
opEqual.tag("FILTER");
A2 opGTE(">=", Lexer::Type::op);
opGTE.tag("FILTER");
A2 opLTE("<=", Lexer::Type::op);
opLTE.tag("FILTER");
// Building block attributes.
A2 argID("id", Lexer::Type::dom);
argID.tag("FILTER");
A2 argUUID("uuid", Lexer::Type::dom);
argUUID.tag("FILTER");
reconstructed.push_back(openParen);
// Add all ID ranges.
for (auto r = _id_ranges.begin(); r != _id_ranges.end(); ++r) {
if (r != _id_ranges.begin()) reconstructed.push_back(opOr);
if (r->first == r->second) {
reconstructed.push_back(openParen);
reconstructed.push_back(argID);
reconstructed.push_back(opEqual);
A2 value(r->first, Lexer::Type::number);
value.tag("FILTER");
reconstructed.push_back(value);
reconstructed.push_back(closeParen);
} else {
bool ascending = true;
int low = strtol(r->first.c_str(), nullptr, 10);
int high = strtol(r->second.c_str(), nullptr, 10);
if (low <= high)
ascending = true;
else
ascending = false;
reconstructed.push_back(openParen);
reconstructed.push_back(argID);
reconstructed.push_back(opGTE);
A2 startValue((ascending ? r->first : r->second), Lexer::Type::number);
startValue.tag("FILTER");
reconstructed.push_back(startValue);
reconstructed.push_back(opAnd);
reconstructed.push_back(argID);
reconstructed.push_back(opLTE);
A2 endValue((ascending ? r->second : r->first), Lexer::Type::number);
endValue.tag("FILTER");
reconstructed.push_back(endValue);
reconstructed.push_back(closeParen);
}
}
// Combine the ID and UUID sections with 'or'.
if (_id_ranges.size() && _uuid_list.size()) reconstructed.push_back(opOr);
// Add all UUID list items.
for (auto u = _uuid_list.begin(); u != _uuid_list.end(); ++u) {
if (u != _uuid_list.begin()) reconstructed.push_back(opOr);
reconstructed.push_back(openParen);
reconstructed.push_back(argUUID);
reconstructed.push_back(opSimilar);
A2 value(*u, Lexer::Type::string);
value.tag("FILTER");
reconstructed.push_back(value);
reconstructed.push_back(closeParen);
}
reconstructed.push_back(closeParen);
}
// No 'else' because all set/number/uuid args but the first are removed.
} else
reconstructed.push_back(a);
}
if (changes) {
_args = reconstructed;
if (Context::getContext().config.getInteger("debug.parser") >= 2)
Context::getContext().debug(dump("CLI2::prepareFilter insertIDExpr"));
}
}
////////////////////////////////////////////////////////////////////////////////
// FILTER Lexer::Type::word args will become part of an expression, and so they
// need to be Lexed.
void CLI2::lexFilterArgs() {
bool changes = false;
std::vector<A2> reconstructed;
for (const auto& a : _args) {
if (a._lextype == Lexer::Type::word && a.hasTag("FILTER")) {
changes = true;
std::string lexeme;
Lexer::Type type;
Lexer lex(a.attribute("raw"));
while (lex.token(lexeme, type)) {
A2 extra(lexeme, type);
extra.tag("FILTER");
reconstructed.push_back(extra);
}
} else
reconstructed.push_back(a);
}
if (changes) {
_args = reconstructed;
if (Context::getContext().config.getInteger("debug.parser") >= 2)
Context::getContext().debug(dump("CLI2::prepareFilter lexFilterArgs"));
}
}
////////////////////////////////////////////////////////////////////////////////
// FILTER, Lexer::Type::word args are treated as search terms.
//
// Algorithm:
// Given:
// - task ... argX candidate argY
// Where:
// - neither argX nor argY are an operator, except (, ), and, or, xor
// - candidate is one of: Lexer::Type::word
// Lexer::Type::identifier
// Lexer::Type::date
//
void CLI2::desugarFilterPlainArgs() {
// First walk the arg list looking for plain words that are not part of an
// existing expression.
auto prevprev = &_args[0];
auto prev = &_args[0];
for (auto& a : _args) {
auto raw = a.attribute("raw");
auto praw = prev->attribute("raw");
auto ppraw = prevprev->attribute("raw");
if ((prevprev->_lextype != Lexer::Type::op || // argX
ppraw == "(" || ppraw == ")" || ppraw == "and" || ppraw == "or" || ppraw == "xor") &&
(prev->_lextype == Lexer::Type::identifier || // candidate
prev->_lextype == Lexer::Type::date || // candidate
prev->_lextype == Lexer::Type::word) && // candidate
prev->hasTag("FILTER") && // candidate
(a._lextype != Lexer::Type::op || // argY
raw == "(" || raw == ")" || raw == "and" || raw == "or" || raw == "xor")) {
prev->tag("PLAIN");
}
prevprev = prev;
prev = &a;
}
// Cover the case where the *last* argument is a plain arg.
auto& penultimate = _args[_args.size() - 2];
auto praw = penultimate.attribute("raw");
auto& last = _args[_args.size() - 1];
if ((penultimate._lextype != Lexer::Type::op || // argX
praw == "(" || praw == ")" || praw == "and" || praw == "or" || praw == "xor") &&
(last._lextype == Lexer::Type::identifier || // candidate
last._lextype == Lexer::Type::word) && // candidate
last.hasTag("FILTER")) // candidate
{
last.tag("PLAIN");
}
// Walk the list again, upgrading PLAIN args.
bool changes = false;
std::vector<A2> reconstructed;
for (const auto& a : _args) {
if (a.hasTag("PLAIN")) {
changes = true;
A2 lhs("description", Lexer::Type::dom);
lhs.attribute("canonical", "description");
lhs.tag("FILTER");
lhs.tag("PLAIN");
reconstructed.push_back(lhs);
A2 op("~", Lexer::Type::op);
op.tag("FILTER");
op.tag("PLAIN");
reconstructed.push_back(op);
std::string word = a.attribute("raw");
Lexer::dequote(word);
A2 rhs(word, Lexer::Type::string);
rhs.tag("FILTER");
rhs.tag("PLAIN");
reconstructed.push_back(rhs);
} else
reconstructed.push_back(a);
}
if (changes) {
_args = reconstructed;
if (Context::getContext().config.getInteger("debug.parser") >= 2)
Context::getContext().debug(dump("CLI2::prepareFilter desugarFilterPlainArgs"));
}
}
////////////////////////////////////////////////////////////////////////////////
// Detects if the bracket at iterator it is a start or end of an empty paren expression
// Examples:
// ( status = pending ) ( )
// ^
// it -----| => true
//
// ( status = pending ) ( project = Home )
// ^
// it -----| => false
bool CLI2::isEmptyParenExpression(std::vector<A2>::iterator it, bool forward /* = true */) const {
int open = 0;
int closed = 0;
for (auto a = it; a != (forward ? _args.end() : _args.begin()); (forward ? ++a : --a)) {
if (a->attribute("raw") == "(")
open++;
else if (a->attribute("raw") == ")")
closed++;
else
// Encountering a non-paren token means there is something between parenthees
return false;
// Getting balanced parentheses means we have an empty paren expression
if (open == closed && open != 0) return true;
}
// Should not end here.
return false;
}
////////////////////////////////////////////////////////////////////////////////
// Two consecutive FILTER, non-OP arguments that are not "(" or ")" need an
// "and" operator inserted between them.
//
// ) <non-op> --> ) and <non-op>
// <non-op> ( --> <non-op> <and> (
// ) ( --> ) and (
// <non-op> <non-op> --> <non-op> and <non-op>
//
void CLI2::insertJunctions() {
bool changes = false;
std::vector<A2> reconstructed;
auto prev = _args.begin();
for (auto a = _args.begin(); a != _args.end(); ++a) {
if (a->hasTag("FILTER")) {
// The prev iterator should be the first FILTER arg.
if (prev == _args.begin()) prev = a;
// Insert AND between terms.
else if (a != prev) {
if ((prev->_lextype != Lexer::Type::op && a->attribute("raw") == "(" &&
!isEmptyParenExpression(a, true)) ||
(prev->attribute("raw") == ")" && a->_lextype != Lexer::Type::op &&
!isEmptyParenExpression(prev, false)) ||
(prev->attribute("raw") == ")" && a->attribute("raw") == "(" &&
!isEmptyParenExpression(a, true) && !isEmptyParenExpression(prev, false)) ||
(prev->_lextype != Lexer::Type::op && a->_lextype != Lexer::Type::op)) {
A2 opOr("and", Lexer::Type::op);
opOr.tag("FILTER");
reconstructed.push_back(opOr);
changes = true;
}
}
// Previous FILTER arg.
prev = a;
}
reconstructed.push_back(*a);
}
if (changes) {
_args = reconstructed;
if (Context::getContext().config.getInteger("debug.parser") >= 2)
Context::getContext().debug(dump("CLI2::prepareFilter insertJunctions"));
}
}
////////////////////////////////////////////////////////////////////////////////
// Look for situations that require defaults:
//
// 1. If no command was found, and no ID/UUID, and if rc.default.command is
// configured, inject the lexed tokens from rc.default.command.
//
// 2. If no command was found, but an ID/UUID was found, then assume a command
// of 'information'.
//
void CLI2::defaultCommand() {
// Scan the top-level branches for evidence of ID, UUID, overrides and other
// arguments.
bool changes = false;
bool found_command = false;
bool found_sequence = false;
for (const auto& a : _args) {
std::string raw = a.attribute("raw");
if (a.hasTag("CMD")) found_command = true;
if (a._lextype == Lexer::Type::uuid || a._lextype == Lexer::Type::number) found_sequence = true;
}
// If no command was specified, then a command will be inserted.
if (!found_command) {
// Default command.
if (!found_sequence) {
// Apply overrides, if any.
std::string defaultCommand = Context::getContext().config.get("default.command");
if (defaultCommand != "") {
// Modify _args, _original_args to be:
// <args0> [<def0> ...] <args1> [...]
std::vector<A2> reconstructedOriginals{_original_args[0]};
std::vector<A2> reconstructed{_args[0]};
std::string lexeme;
Lexer::Type type;
Lexer lex(defaultCommand);
while (lex.token(lexeme, type)) {
reconstructedOriginals.emplace_back(lexeme, type);
A2 cmd(lexeme, type);
cmd.tag("DEFAULT");
reconstructed.push_back(cmd);
}
for (unsigned int i = 1; i < _original_args.size(); ++i)
reconstructedOriginals.push_back(_original_args[i]);
for (unsigned int i = 1; i < _args.size(); ++i) reconstructed.push_back(_args[i]);
_original_args = reconstructedOriginals;
_args = reconstructed;
changes = true;
}
} else {
A2 info("information", Lexer::Type::word);
info.tag("ASSUMED");
_args.push_back(info);
changes = true;
}
}
if (changes && Context::getContext().config.getInteger("debug.parser") >= 2)
Context::getContext().debug(dump("CLI2::analyze defaultCommand"));
}
////////////////////////////////////////////////////////////////////////////////
// Some values are expressions, which need to be lexed. The best way to
// determine whether an expression is either a single value, or needs to be
// lexed, is to lex it and count the tokens. For example:
// now+1d
// This should be lexed and surrounded by parentheses:
// (
// now
// +
// 1d
// )
std::vector<A2> CLI2::lexExpression(const std::string& expression) {
std::vector<A2> lexed;
std::string lexeme;
Lexer::Type type;
Lexer lex(expression);
while (lex.token(lexeme, type)) {
A2 token(lexeme, type);
token.tag("FILTER");
lexed.push_back(token);
}
// If there were multiple tokens, parenthesize, because this expression will
// be used as a value.
if (lexed.size() > 1) {
A2 openParen("(", Lexer::Type::op);
openParen.tag("FILTER");
A2 closeParen(")", Lexer::Type::op);
closeParen.tag("FILTER");
lexed.insert(lexed.begin(), openParen);
lexed.push_back(closeParen);
}
return lexed;
}
////////////////////////////////////////////////////////////////////////////////
// vim: ts=2:sw=2