taskwarrior/src/CLI2.cpp
2020-12-05 16:18:37 -05:00

2113 lines
60 KiB
C++

////////////////////////////////////////////////////////////////////////////////
//
// Copyright 2006 - 2020, Paul Beckingham, Federico Hernandez.
//
// Permission is hereby granted, free of charge, to any person obtaining a copy
// of this software and associated documentation files (the "Software"), to deal
// in the Software without restriction, including without limitation the rights
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
// copies of the Software, and to permit persons to whom the Software is
// furnished to do so, subject to the following conditions:
//
// The above copyright notice and this permission notice shall be included
// in all copies or substantial portions of the Software.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
// OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
// THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
// SOFTWARE.
//
// https://www.opensource.org/licenses/mit-license.php
//
////////////////////////////////////////////////////////////////////////////////
#include <cmake.h>
#include <CLI2.h>
#include <sstream>
#include <algorithm>
#include <cstdlib>
#include <Context.h>
#include <Lexer.h>
#include <Color.h>
#include <shared.h>
#include <format.h>
// Overridden by rc.abbreviation.minimum.
int CLI2::minimumMatchLength = 3;
// Alias expansion limit. Any more indicates some kind of error.
static int safetyValveDefault = 10;
////////////////////////////////////////////////////////////////////////////////
A2::A2 (const std::string& raw, Lexer::Type lextype)
{
_lextype = lextype;
attribute ("raw", raw);
}
////////////////////////////////////////////////////////////////////////////////
A2::A2 (const A2& other) = default;
////////////////////////////////////////////////////////////////////////////////
A2& A2::operator= (const A2& other) = default;
////////////////////////////////////////////////////////////////////////////////
bool A2::hasTag (const std::string& tag) const
{
return std::find (_tags.begin (), _tags.end (), tag) != _tags.end ();
}
////////////////////////////////////////////////////////////////////////////////
void A2::tag (const std::string& tag)
{
if (! hasTag (tag))
_tags.push_back (tag);
}
////////////////////////////////////////////////////////////////////////////////
void A2::unTag (const std::string& tag)
{
for (auto i = _tags.begin (); i != _tags.end (); ++i)
if (*i == tag)
{
_tags.erase (i);
break;
}
}
////////////////////////////////////////////////////////////////////////////////
// Accessor for attributes.
void A2::attribute (const std::string& name, const std::string& value)
{
_attributes[name] = value;
if (name == "raw")
decompose ();
}
////////////////////////////////////////////////////////////////////////////////
// Accessor for attributes.
const std::string A2::attribute (const std::string& name) const
{
// Prevent autovivification.
auto i = _attributes.find (name);
if (i != _attributes.end ())
return i->second;
return "";
}
////////////////////////////////////////////////////////////////////////////////
const std::string A2::getToken () const
{
auto i = _attributes.find ("canonical");
if (i == _attributes.end ())
i = _attributes.find ("raw");
return i->second;
}
////////////////////////////////////////////////////////////////////////////////
void A2::decompose ()
{
if (_lextype == Lexer::Type::tag)
{
std::string raw = _attributes["raw"];
attribute ("name", raw.substr (1));
attribute ("sign", raw.substr (0, 1));
}
else if (_lextype == Lexer::Type::substitution)
{
//if (Directory (raw).exists ())
// return;
std::string from;
std::string to;
std::string flags;
if (Lexer::decomposeSubstitution (_attributes["raw"], from, to, flags))
{
attribute ("from", from);
attribute ("to", to);
attribute ("flags", flags);
}
}
else if (_lextype == Lexer::Type::pair)
{
std::string name;
std::string mod;
std::string sep;
std::string value;
if (Lexer::decomposePair (_attributes["raw"], name, mod, sep, value))
{
attribute ("name", name);
attribute ("modifier", mod);
attribute ("separator", sep);
attribute ("value", value);
if (name == "rc")
{
if (!mod.empty())
tag ("CONFIG");
else
tag ("RC");
}
}
}
else if (_lextype == Lexer::Type::pattern)
{
//if (Directory (raw).exists ())
// return;
std::string pattern;
std::string flags;
if (Lexer::decomposePattern (_attributes["raw"], pattern, flags))
{
attribute ("pattern", pattern);
attribute ("flags", flags);
}
}
}
////////////////////////////////////////////////////////////////////////////////
const std::string A2::dump () const
{
auto output = Lexer::typeToString (_lextype);
// Dump attributes.
std::string atts;
for (const auto& a : _attributes)
atts += a.first + "='\033[33m" + a.second + "\033[0m' ";
// Dump tags.
std::string tags;
for (const auto& tag : _tags)
{
if (tag == "BINARY") tags += "\033[1;37;44m" + tag + "\033[0m ";
else if (tag == "CMD") tags += "\033[1;37;46m" + tag + "\033[0m ";
else if (tag == "FILTER") tags += "\033[1;37;42m" + tag + "\033[0m ";
else if (tag == "MODIFICATION") tags += "\033[1;37;43m" + tag + "\033[0m ";
else if (tag == "MISCELLANEOUS") tags += "\033[1;37;45m" + tag + "\033[0m ";
else if (tag == "RC") tags += "\033[1;37;41m" + tag + "\033[0m ";
else if (tag == "CONFIG") tags += "\033[1;37;101m" + tag + "\033[0m ";
else if (tag == "?") tags += "\033[38;5;255;48;5;232m" + tag + "\033[0m ";
else tags += "\033[32m" + tag + "\033[0m ";
}
return output + ' ' + atts + tags;
}
////////////////////////////////////////////////////////////////////////////////
static
const char* getValue (int argc, const char** argv, std::string arg)
{
const auto is_arg = [&] (std::string s)
{
return s.size () > arg.size () + 1
&& (s[arg.size ()] == ':' || s[arg.size ()] == '=')
&& s.compare (0, arg.size (), arg) == 0;
};
// find last argument before --
auto last = std::make_reverse_iterator (argv);
auto first = std::make_reverse_iterator (
std::find (argv, argv + argc, std::string ("--")));
auto it = std::find_if (first, last, is_arg);
if (it == last)
return nullptr;
// return the string after : or =
return *it + arg.size () + 1;
}
////////////////////////////////////////////////////////////////////////////////
// Static method.
bool CLI2::getOverride (int argc, const char** argv, std::string& home, File& rc)
{
const char* value = getValue (argc, argv, "rc");
if (value == nullptr)
return false;
rc = File (value);
if (rc._data.rfind ('/') != std::string::npos)
home = rc.parent ();
else
home = ".";
return true;
}
////////////////////////////////////////////////////////////////////////////////
// Look for CONFIG data.location and initialize a Path object.
// Static method.
bool CLI2::getDataLocation (int argc, const char** argv, Path& data)
{
const char* value = getValue (argc, argv, "rc.data.location");
if (value == nullptr)
{
std::string location = Context::getContext ().config.get ("data.location");
if (!location.empty())
data = location;
return false;
}
data = Directory (value);
return true;
}
////////////////////////////////////////////////////////////////////////////////
// Static method.
void CLI2::applyOverrides (int argc, const char** argv)
{
auto& context = Context::getContext ();
auto last = std::find (argv, argv + argc, std::string ("--"));
auto is_override = [] (const std::string& s)
{
return s.compare (0, 3, "rc.") == 0;
};
auto get_sep = [&] (const std::string& s)
{
if (is_override (s))
return s.find_first_of (":=", 3);
return std::string::npos;
};
auto override_settings = [&] (const std::string& raw)
{
auto sep = get_sep (raw);
if (sep == std::string::npos)
return;
std::string name = raw.substr (3, sep - 3);
std::string value = raw.substr (sep + 1);
context.config.set (name, value);
};
auto display_overrides = [&] (const std::string& raw)
{
if (is_override (raw))
context.footnote (format ("Configuration override {1}", raw));
};
std::for_each (argv, last, override_settings);
if (context.verbose ("override"))
std::for_each (argv, last, display_overrides);
}
////////////////////////////////////////////////////////////////////////////////
void CLI2::alias (const std::string& name, const std::string& value)
{
_aliases[name] = value;
}
////////////////////////////////////////////////////////////////////////////////
void CLI2::entity (const std::string& category, const std::string& name)
{
// Walk the list of entities for category.
auto c = _entities.equal_range (category);
for (auto e = c.first; e != c.second; ++e)
if (e->second == name)
return;
// The category/name pair was not found, therefore add it.
_entities.insert (std::pair <std::string, std::string> (category, name));
}
////////////////////////////////////////////////////////////////////////////////
// Capture a single argument.
void CLI2::add (const std::string& argument)
{
A2 arg (Lexer::trim (argument), Lexer::Type::word);
arg.tag ("ORIGINAL");
_original_args.push_back (arg);
// Adding a new argument invalidates prior analysis.
_args.clear ();
}
////////////////////////////////////////////////////////////////////////////////
// Capture a set of arguments, inserted immediately after the binary.
void CLI2::add (const std::vector <std::string>& arguments)
{
std::vector <A2> replacement {_original_args[0]};
for (const auto& arg : arguments)
replacement.emplace_back(arg, Lexer::Type::word);
for (unsigned int i = 1; i < _original_args.size (); ++i)
replacement.push_back (_original_args[i]);
_original_args = replacement;
// Adding a new argument invalidates prior analysis.
_args.clear ();
}
////////////////////////////////////////////////////////////////////////////////
// Arg0 is the first argument, which is the name and potentially a relative or
// absolute path to the invoked binary.
//
// The binary name is 'task', but if the binary is reported as 'cal' or
// 'calendar' then it was invoked via symbolic link, in which case capture the
// first argument as 'calendar'.
void CLI2::handleArg0 ()
{
// Capture arg0 separately, because it is the command that was run, and could
// need special handling.
auto raw = _original_args[0].attribute ("raw");
A2 a (raw, Lexer::Type::word);
a.tag ("BINARY");
std::string basename = "task";
auto slash = raw.rfind ('/');
if (slash != std::string::npos)
basename = raw.substr (slash + 1);
a.attribute ("basename", basename);
if (basename == "cal" ||
basename == "calendar")
{
_args.push_back (a);
A2 cal ("calendar", Lexer::Type::word);
_args.push_back (cal);
}
else
{
_args.push_back (a);
}
}
////////////////////////////////////////////////////////////////////////////////
// All arguments must be individually and wholly recognized by the Lexer. Any
// argument not recognized is considered a Lexer::Type::word.
//
// As a side effect, tags all arguments after a terminator ('--') with
// TERMINATED.
void CLI2::lexArguments ()
{
// Note: Starts iterating at index 1, because ::handleArg0 has already
// processed it.
bool terminated = false;
for (unsigned int i = 1; i < _original_args.size (); ++i)
{
bool quoted = Lexer::wasQuoted (_original_args[i].attribute ("raw"));
// Process single-token arguments.
std::string lexeme;
Lexer::Type type;
Lexer lex (_original_args[i].attribute ("raw"));
if (lex.token (lexeme, type) &&
(lex.isEOS () || // Token goes to EOS
(quoted && type == Lexer::Type::pair))) // Quoted pairs automatically go to EOS
{
if (! terminated && type == Lexer::Type::separator)
terminated = true;
else if (terminated)
type = Lexer::Type::word;
A2 a (_original_args[i].attribute ("raw"), type);
if (terminated)
a.tag ("TERMINATED");
if (quoted)
a.tag ("QUOTED");
if (_original_args[i].hasTag ("ORIGINAL"))
a.tag ("ORIGINAL");
_args.push_back (a);
}
// Process muktiple-token arguments.
else
{
std::string quote = "'";
std::string escaped = _original_args[i].attribute ("raw");
escaped = str_replace (escaped, quote, "\\'");
std::string::size_type cursor = 0;
std::string word;
if (Lexer::readWord (quote + escaped + quote, quote, cursor, word))
{
Lexer::dequote (word);
A2 unknown (word, Lexer::Type::word);
if (Lexer::wasQuoted (_original_args[i].attribute ("raw")))
unknown.tag ("QUOTED");
if (_original_args[i].hasTag ("ORIGINAL"))
unknown.tag ("ORIGINAL");
_args.push_back (unknown);
}
// This branch may have no use-case.
else
{
A2 unknown (_original_args[i].attribute ("raw"), Lexer::Type::word);
unknown.tag ("UNKNOWN");
if (Lexer::wasQuoted (_original_args[i].attribute ("raw")))
unknown.tag ("QUOTED");
if (_original_args[i].hasTag ("ORIGINAL"))
unknown.tag ("ORIGINAL");
_args.push_back (unknown);
}
}
}
if (Context::getContext ().config.getInteger ("debug.parser") >= 2)
Context::getContext ().debug (dump ("CLI2::analyze lexArguments"));
}
////////////////////////////////////////////////////////////////////////////////
// [1] Scan all args for the 'add' and 'log' commands, and demote any
// Lexer::Type::Tag args with sign '-' to Lexer::Type::word.
// [2] Convert any pseudo args name:value into config settings, and erase.
void CLI2::demotion ()
{
bool changes = false;
std::vector <A2> replacement;
std::string canonical;
for (auto& a : _args)
{
if (a._lextype == Lexer::Type::tag &&
a.attribute ("sign") == "-")
{
std::string command = getCommand ();
if (command == "add" ||
command == "log")
{
a._lextype = Lexer::Type::word;
changes = true;
}
}
else if (a._lextype == Lexer::Type::pair &&
canonicalize (canonical, "pseudo", a.attribute ("name")))
{
Context::getContext ().config.set (canonical, a.attribute ("value"));
changes = true;
// Equivalent to erasing 'a'.
continue;
}
replacement.push_back (a);
}
if (changes &&
Context::getContext ().config.getInteger ("debug.parser") >= 2)
Context::getContext ().debug (dump ("CLI2::analyze demotion"));
}
////////////////////////////////////////////////////////////////////////////////
// Intended to be called after ::add() to perform the final analysis.
void CLI2::analyze ()
{
if (Context::getContext ().config.getInteger ("debug.parser") >= 2)
Context::getContext ().debug (dump ("CLI2::analyze"));
// Process _original_args.
_args.clear ();
handleArg0 ();
lexArguments ();
// Process _args.
aliasExpansion ();
if (! findCommand ())
{
defaultCommand ();
if (! findCommand ())
throw std::string ("You must specify a command or a task to modify.");
}
demotion ();
canonicalizeNames ();
// Determine arg types: FILTER, MODIFICATION, MISCELLANEOUS.
categorizeArgs ();
parenthesizeOriginalFilter ();
}
////////////////////////////////////////////////////////////////////////////////
// Process raw string.
void CLI2::addFilter (const std::string& arg)
{
if (arg.length ())
{
std::vector <std::string> filter;
filter.emplace_back("(");
std::string lexeme;
Lexer::Type type;
Lexer lex (arg);
while (lex.token (lexeme, type))
filter.push_back (lexeme);
filter.emplace_back(")");
add (filter);
analyze ();
}
}
////////////////////////////////////////////////////////////////////////////////
// There are situations where a context filter is applied. This method
// determines whether one applies, and if so, applies it. Disqualifiers include:
// - filter contains ID or UUID
void CLI2::addContextFilter ()
{
// Recursion block.
if (_context_filter_added)
return;
// Detect if any context is set, and bail out if not
std::string contextName = Context::getContext ().config.get ("context");
if (contextName.empty())
{
Context::getContext ().debug ("No context.");
return;
}
// Detect if UUID or ID is set, and bail out
for (auto& a : _args)
{
if (a._lextype == Lexer::Type::uuid ||
a._lextype == Lexer::Type::number ||
a._lextype == Lexer::Type::set)
{
Context::getContext ().debug (format ("UUID/ID argument found '{1}', not applying context.", a.attribute ("raw")));
return;
}
}
// Apply context
Context::getContext ().debug ("Applying context: " + contextName);
std::string contextFilter = Context::getContext ().config.get ("context." + contextName);
if (contextFilter.empty())
Context::getContext ().debug ("Context '" + contextName + "' not defined.");
else
{
_context_filter_added = true;
addFilter (contextFilter);
if (Context::getContext ().verbose ("context"))
Context::getContext ().footnote (format ("Context '{1}' set. Use 'task context none' to remove.", contextName));
}
}
////////////////////////////////////////////////////////////////////////////////
// Parse the command line, identifiying filter components, expanding syntactic
// sugar as necessary.
void CLI2::prepareFilter ()
{
// Clear and re-populate.
_id_ranges.clear ();
_uuid_list.clear ();
_context_filter_added = false;
// Remove all the syntactic sugar for FILTERs.
lexFilterArgs ();
findIDs ();
findUUIDs ();
insertIDExpr ();
desugarFilterPlainArgs ();
findStrayModifications ();
desugarFilterTags ();
desugarFilterAttributes ();
desugarFilterPatterns ();
insertJunctions (); // Deliberately after all desugar calls.
if (Context::getContext ().verbose ("filter"))
{
std::string combined;
for (const auto& a : _args)
{
if (a.hasTag ("FILTER"))
{
if (!combined.empty())
combined += ' ';
combined += a.attribute ("raw");
}
}
if (!combined.empty())
Context::getContext ().footnote (std::string ("Filter: ") + combined);
}
}
////////////////////////////////////////////////////////////////////////////////
// Return all the MISCELLANEOUS args.
const std::vector <std::string> CLI2::getWords ()
{
std::vector <std::string> words;
for (const auto& a : _args)
if (a.hasTag ("MISCELLANEOUS"))
words.push_back (a.attribute ("raw"));
if (Context::getContext ().config.getInteger ("debug.parser") >= 2)
{
Color colorOrigArgs ("gray10 on gray4");
std::string message = " ";
for (const auto& word : words)
message += colorOrigArgs.colorize (word) + ' ';
Context::getContext ().debug ("CLI2::getWords" + message);
}
return words;
}
////////////////////////////////////////////////////////////////////////////////
// Search for 'value' in _entities category, return canonicalized value.
bool CLI2::canonicalize (
std::string& canonicalized,
const std::string& category,
const std::string& value) const
{
// Extract a list of entities for category.
std::vector <std::string> options;
auto c = _entities.equal_range (category);
for (auto e = c.first; e != c.second; ++e)
{
// Shortcut: if an exact match is found, success.
if (value == e->second)
{
canonicalized = value;
return true;
}
options.push_back (e->second);
}
// Match against the options, throw away results.
std::vector <std::string> matches;
if (autoComplete (value, options, matches, minimumMatchLength) == 1)
{
canonicalized = matches[0];
return true;
}
return false;
}
////////////////////////////////////////////////////////////////////////////////
std::string CLI2::getBinary () const
{
if (!_args.empty())
return _args[0].attribute ("raw");
return "";
}
////////////////////////////////////////////////////////////////////////////////
std::string CLI2::getCommand (bool canonical) const
{
for (const auto& a : _args)
if (a.hasTag ("CMD"))
return a.attribute (canonical ? "canonical" : "raw");
return "";
}
////////////////////////////////////////////////////////////////////////////////
const std::string CLI2::dump (const std::string& title) const
{
std::stringstream out;
out << "\033[1m" << title << "\033[0m\n"
<< " _original_args\n ";
Color colorArgs ("gray10 on gray4");
Color colorFilter ("black on rgb311");
for (auto i = _original_args.begin (); i != _original_args.end (); ++i)
{
if (i != _original_args.begin ())
out << ' ';
if (i->hasTag ("ORIGINAL"))
out << colorArgs.colorize (i->attribute ("raw"));
else
out << colorFilter.colorize (i->attribute ("raw"));
}
out << '\n';
if (!_args.empty())
{
out << " _args\n";
for (const auto& a : _args)
out << " " << a.dump () << '\n';
}
if (!_id_ranges.empty())
{
out << " _id_ranges\n ";
for (const auto& range : _id_ranges)
{
if (range.first != range.second)
out << colorArgs.colorize (range.first + "-" + range.second) << ' ';
else
out << colorArgs.colorize (range.first) << ' ';
}
out << '\n';
}
if (!_uuid_list.empty())
{
out << " _uuid_list\n ";
for (const auto& uuid : _uuid_list)
out << colorArgs.colorize (uuid) << ' ';
out << '\n';
}
return out.str ();
}
////////////////////////////////////////////////////////////////////////////////
// If any aliases are found in un-TERMINATED arguments, replace the alias with
// a set of Lexed tokens from the configuration.
void CLI2::aliasExpansion ()
{
bool changes = false;
bool action;
int counter = 0;
do
{
action = false;
std::vector <A2> reconstructed;
std::string raw;
for (const auto& i : _args)
{
raw = i.attribute ("raw");
if (i.hasTag ("TERMINATED"))
{
reconstructed.push_back (i);
}
else if (_aliases.find (raw) != _aliases.end ())
{
std::string lexeme;
Lexer::Type type;
Lexer lex (_aliases[raw]);
while (lex.token (lexeme, type))
reconstructed.emplace_back(lexeme, type);
action = true;
changes = true;
}
else
{
reconstructed.push_back (i);
}
}
_args = reconstructed;
std::vector <A2> reconstructedOriginals;
bool terminated = false;
for (const auto& i : _original_args)
{
if (i.attribute ("raw") == "--")
terminated = true;
if (terminated)
{
reconstructedOriginals.push_back (i);
}
else if (_aliases.find (i.attribute ("raw")) != _aliases.end ())
{
std::string lexeme;
Lexer::Type type;
Lexer lex (_aliases[i.attribute ("raw")]);
while (lex.token (lexeme, type))
reconstructedOriginals.emplace_back(lexeme, type);
action = true;
changes = true;
}
else
{
reconstructedOriginals.push_back (i);
}
}
_original_args = reconstructedOriginals;
}
while (action && counter++ < safetyValveDefault);
if (counter >= safetyValveDefault)
Context::getContext ().debug (format ("Nested alias limit of {1} reached.", safetyValveDefault));
if (changes &&
Context::getContext ().config.getInteger ("debug.parser") >= 2)
Context::getContext ().debug (dump ("CLI2::analyze aliasExpansion"));
}
////////////////////////////////////////////////////////////////////////////////
// Scan all arguments and canonicalize names that need it.
void CLI2::canonicalizeNames ()
{
bool changes = false;
for (auto& a : _args)
{
if (a._lextype == Lexer::Type::pair)
{
std::string raw = a.attribute ("raw");
if (raw.substr (0, 3) != "rc:" &&
raw.substr (0, 3) != "rc.")
{
std::string name = a.attribute ("name");
std::string canonical;
if (canonicalize (canonical, "pseudo", name) ||
canonicalize (canonical, "attribute", name))
{
a.attribute ("canonical", canonical);
}
else
{
a._lextype = Lexer::Type::word;
}
changes = true;
}
}
}
if (changes &&
Context::getContext ().config.getInteger ("debug.parser") >= 2)
Context::getContext ().debug (dump ("CLI2::analyze canonicalizeNames"));
}
////////////////////////////////////////////////////////////////////////////////
// Categorize FILTER, MODIFICATION and MISCELLANEOUS args, based on CMD DNA.
void CLI2::categorizeArgs ()
{
// Context is only applied for commands that request it.
std::string command = getCommand ();
Command* cmd = Context::getContext ().commands[command];
if (cmd && cmd->uses_context ())
addContextFilter ();
bool changes = false;
bool afterCommand = false;
for (auto& a : _args)
{
if (a._lextype == Lexer::Type::separator)
continue;
// Record that the command has been found, it affects behavior.
if (a.hasTag ("CMD"))
{
afterCommand = true;
}
// Skip admin args.
else if (a.hasTag ("BINARY") ||
a.hasTag ("RC") ||
a.hasTag ("CONFIG"))
{
// NOP.
}
// All combinations, with all 8 cases handled below.:
//
// -- -- -- Error: found an arg, but none expected
// -- -- Mi task [Mi] <cmd> [Mi]
// -- Mo -- task [Mo] <cmd> [Mo]
// -- Mo Mi Internally inconsistent
// Fi -- -- task [Fi] <cmd> [Fi]
// Fi -- Mi task [Fi] <cmd> [Mi]
// Fi Mo -- task [Fi] <cmd> [Mo]
// Fi Mo Mi Internally inconsistent
//
else if (cmd &&
! cmd->accepts_filter () &&
! cmd->accepts_modifications () &&
! cmd->accepts_miscellaneous ())
{
// No commands were expected --> error.
throw format ("The '{1}' command does not allow '{2}'.", command, a.attribute ("raw"));
}
else if (cmd &&
! cmd->accepts_filter () &&
! cmd->accepts_modifications () &&
cmd->accepts_miscellaneous ())
{
a.tag ("MISCELLANEOUS");
changes = true;
}
else if (cmd &&
! cmd->accepts_filter () &&
cmd->accepts_modifications () &&
! cmd->accepts_miscellaneous ())
{
a.tag ("MODIFICATION");
changes = true;
}
else if (cmd &&
! cmd->accepts_filter () &&
cmd->accepts_modifications () &&
cmd->accepts_miscellaneous ())
{
// Error: internally inconsistent.
throw std::string ("Unknown error. Please report.");
}
else if (cmd &&
cmd->accepts_filter () &&
! cmd->accepts_modifications () &&
! cmd->accepts_miscellaneous ())
{
a.tag ("FILTER");
changes = true;
}
else if (cmd &&
cmd->accepts_filter () &&
! cmd->accepts_modifications () &&
cmd->accepts_miscellaneous ())
{
if (!afterCommand)
a.tag ("FILTER");
else
a.tag ("MISCELLANEOUS");
changes = true;
}
else if (cmd &&
cmd->accepts_filter () &&
cmd->accepts_modifications () &&
! cmd->accepts_miscellaneous ())
{
if (!afterCommand)
a.tag ("FILTER");
else
a.tag ("MODIFICATION");
changes = true;
}
else if (cmd &&
cmd->accepts_filter () &&
cmd->accepts_modifications () &&
cmd->accepts_miscellaneous ())
{
// Error: internally inconsistent.
throw std::string ("Unknown error. Please report.");
}
}
if (changes &&
Context::getContext ().config.getInteger ("debug.parser") >= 2)
Context::getContext ().debug (dump ("CLI2::analyze categorizeArgs"));
}
////////////////////////////////////////////////////////////////////////////////
// The following command:
//
// task +home or +work list
//
// Is reasonable, and does not work unless the filter is parenthesized. Ignoring
// context, the 'list' report has a filter, which is inserted at the beginning
// like this:
//
// task ( status:pending ) +home or +work list
//
// Parenthesizing the user-provided (original) filter yields this:
//
// task ( status:pending ) ( +home or +work ) list
//
// And when the conjunction is added:
//
// task ( status:pending ) and ( +home or +work ) list
//
// the query is correct.
void CLI2::parenthesizeOriginalFilter ()
{
// Locate the first and last ORIGINAL FILTER args.
unsigned int firstOriginalFilter = 0;
unsigned int lastOriginalFilter = 0;
for (unsigned int i = 1; i < _args.size (); ++i)
{
if (_args[i].hasTag ("FILTER") &&
_args[i].hasTag ("ORIGINAL"))
{
if (firstOriginalFilter == 0)
firstOriginalFilter = i;
lastOriginalFilter = i;
}
}
// If found, parenthesize the arg list accordingly.
if (firstOriginalFilter &&
lastOriginalFilter)
{
std::vector <A2> reconstructed;
for (unsigned int i = 0; i < _args.size (); ++i)
{
if (i == firstOriginalFilter)
{
A2 openParen ("(", Lexer::Type::op);
openParen.tag ("ORIGINAL");
openParen.tag ("FILTER");
reconstructed.push_back (openParen);
}
reconstructed.push_back (_args[i]);
if (i == lastOriginalFilter)
{
A2 closeParen (")", Lexer::Type::op);
closeParen.tag ("ORIGINAL");
closeParen.tag ("FILTER");
reconstructed.push_back (closeParen);
}
}
_args = reconstructed;
if (Context::getContext ().config.getInteger ("debug.parser") >= 2)
Context::getContext ().debug (dump ("CLI2::analyze parenthesizeOriginalFilter"));
}
}
////////////////////////////////////////////////////////////////////////////////
// Scan all arguments and if any are an exact match for a command name, then
// tag as CMD. If an argument is an exact match for an attribute, despite being
// an inexact match for a command, then it is not a command.
bool CLI2::findCommand ()
{
for (auto& a : _args)
{
std::string raw = a.attribute ("raw");
std::string canonical;
// If the arg canonicalized to a 'cmd', but is also not an exact match
// for an 'attribute', proceed. Example:
// task project=foo list
// ^cmd ^cmd
// ^attribute
if (exactMatch ("cmd", raw))
canonical = raw;
else if (exactMatch ("attribute", raw))
continue;
else if (! canonicalize (canonical, "cmd", raw))
continue;
a.attribute ("canonical", canonical);
a.tag ("CMD");
// Apply command DNA as tags.
Command* command = Context::getContext ().commands[canonical];
if (command->read_only ()) a.tag ("READONLY");
if (command->displays_id ()) a.tag ("SHOWSID");
if (command->needs_gc ()) a.tag ("RUNSGC");
if (command->uses_context ()) a.tag ("USESCONTEXT");
if (command->accepts_filter ()) a.tag ("ALLOWSFILTER");
if (command->accepts_modifications ()) a.tag ("ALLOWSMODIFICATIONS");
if (command->accepts_miscellaneous ()) a.tag ("ALLOWSMISC");
if (Context::getContext ().config.getInteger ("debug.parser") >= 2)
Context::getContext ().debug (dump ("CLI2::analyze findCommand"));
// Stop and indicate command found.
return true;
}
// Indicate command not found.
return false;
}
////////////////////////////////////////////////////////////////////////////////
// Search for exact 'value' in _entities category.
bool CLI2::exactMatch (
const std::string& category,
const std::string& value) const
{
// Extract a list of entities for category.
auto c = _entities.equal_range (category);
for (auto e = c.first; e != c.second; ++e)
if (value == e->second)
return true;
return false;
}
////////////////////////////////////////////////////////////////////////////////
// +tag --> tags _hastag_ tag
// -tag --> tags _notag_ tag
void CLI2::desugarFilterTags ()
{
bool changes = false;
std::vector <A2> reconstructed;
for (const auto& a : _args)
{
if (a._lextype == Lexer::Type::tag &&
a.hasTag ("FILTER"))
{
changes = true;
A2 left ("tags", Lexer::Type::dom);
left.tag ("FILTER");
reconstructed.push_back (left);
std::string raw = a.attribute ("raw");
A2 op (raw[0] == '+' ? "_hastag_" : "_notag_", Lexer::Type::op);
op.tag ("FILTER");
reconstructed.push_back (op);
A2 right ("" + raw.substr (1) + "", Lexer::Type::string);
right.tag ("FILTER");
reconstructed.push_back (right);
}
else
reconstructed.push_back (a);
}
if (changes)
{
_args = reconstructed;
if (Context::getContext ().config.getInteger ("debug.parser") >= 2)
Context::getContext ().debug (dump ("CLI2::prepareFilter desugarFilterTags"));
}
}
////////////////////////////////////////////////////////////////////////////////
void CLI2::findStrayModifications ()
{
bool changes = false;
auto command = getCommand ();
if (command == "add" ||
command == "log")
{
for (auto& a : _args)
{
if (a.hasTag ("FILTER"))
{
a.unTag ("FILTER");
a.tag ("MODIFICATION");
changes = true;
}
}
}
if (changes)
if (Context::getContext ().config.getInteger ("debug.parser") >= 2)
Context::getContext ().debug (dump ("CLI2::prepareFilter findStrayModifications"));
}
////////////////////////////////////////////////////////////////////////////////
// <name>[.<mod>]:['"][<value>]['"] --> name <op> value
void CLI2::desugarFilterAttributes ()
{
bool changes = false;
std::vector <A2> reconstructed;
for (auto& a : _args)
{
if (a._lextype == Lexer::Type::pair &&
a.hasTag ("FILTER"))
{
std::string raw = a.attribute ("raw");
std::string name = a.attribute ("name");
std::string mod = a.attribute ("modifier");
std::string sep = a.attribute ("separator");
std::string value = a.attribute ("value");
// An unquoted string, while equivalent to an empty string, doesn't cause
// an operand shortage in eval.
if (value.empty())
value = "''";
// Some values are expressions, which need to be lexed. The best way to
// determine whether an expression is either a single value, or needs to
// be lexed, is to lex it and count the tokens. For example:
// now+1d
// This should be lexed and surrounded by parentheses:
// (
// now
// +
// 1d
// )
// Use this sequence in place of a single value.
std::vector <A2> values = lexExpression (value);
if (Context::getContext ().config.getInteger ("debug.parser") >= 2)
{
Context::getContext ().debug ("CLI2::lexExpression " + name + ':' + value);
for (auto& v : values)
Context::getContext ().debug (" " + v.dump ());
Context::getContext ().debug (" ");
}
bool found = false;
std::string canonical;
if (canonicalize (canonical, "attribute", name))
{
// Certain attribute types do not suport math.
// string --> no
// numeric --> yes
// date --> yes
// duration --> yes
bool evalSupported = true;
Column* col = Context::getContext ().columns[canonical];
if (col && col->type () == "string")
evalSupported = false;
A2 lhs (name, Lexer::Type::dom);
lhs.tag ("FILTER");
lhs.attribute ("canonical", canonical);
lhs.attribute ("modifier", mod);
A2 op ("", Lexer::Type::op);
op.tag ("FILTER");
A2 rhs ("", values[0]._lextype);
rhs.tag ("FILTER");
// Special case for '<name>:<value>'.
if (mod.empty())
{
op.attribute ("raw", "=");
rhs.attribute ("raw", value);
}
else if (mod == "before" || mod == "under" || mod == "below")
{
op.attribute ("raw", "<");
rhs.attribute ("raw", value);
}
else if (mod == "after" || mod == "over" || mod == "above")
{
op.attribute ("raw", ">");
rhs.attribute ("raw", value);
}
else if (mod == "none")
{
op.attribute ("raw", "==");
rhs.attribute ("raw", "''");
}
else if (mod == "any")
{
op.attribute ("raw", "!==");
rhs.attribute ("raw", "''");
}
else if (mod == "is" || mod == "equals")
{
op.attribute ("raw", "==");
rhs.attribute ("raw", value);
}
else if (mod == "not")
{
op.attribute ("raw", "!=");
rhs.attribute ("raw", value);
}
else if (mod == "isnt")
{
op.attribute ("raw", "!==");
rhs.attribute ("raw", value);
}
else if (mod == "has" || mod == "contains")
{
op.attribute ("raw", "~");
rhs.attribute ("raw", value);
}
else if (mod == "hasnt")
{
op.attribute ("raw", "!~");
rhs.attribute ("raw", value);
}
else if (mod == "startswith" || mod == "left")
{
op.attribute ("raw", "~");
rhs.attribute ("raw", "^" + value);
}
else if (mod == "endswith" || mod == "right")
{
op.attribute ("raw", "~");
rhs.attribute ("raw", value + "$");
}
else if (mod == "word")
{
op.attribute ("raw", "~");
#if defined (DARWIN)
rhs.attribute ("raw", value);
#elif defined (SOLARIS)
rhs.attribute ("raw", "\\<" + value + "\\>");
#else
rhs.attribute ("raw", "\\b" + value + "\\b");
#endif
}
else if (mod == "noword")
{
op.attribute ("raw", "!~");
#if defined (DARWIN)
rhs.attribute ("raw", value);
#elif defined (SOLARIS)
rhs.attribute ("raw", "\\<" + value + "\\>");
#else
rhs.attribute ("raw", "\\b" + value + "\\b");
#endif
}
else
throw format ("Error: unrecognized attribute modifier '{1}'.", mod);
reconstructed.push_back (lhs);
reconstructed.push_back (op);
// Do not modify this construct without full understanding.
// Getting this wrong breaks a whole lot of filtering tests.
if (values.size () > 1 || evalSupported)
{
for (auto& v : values)
reconstructed.push_back (v);
}
else if (Lexer::isDOM (rhs.attribute ("raw")))
{
rhs._lextype = Lexer::Type::dom;
reconstructed.push_back (rhs);
}
else
{
reconstructed.push_back (rhs);
}
found = true;
}
// If the name does not canonicalize to either an attribute or a UDA
// then it is not a recognized Lexer::Type::pair, so downgrade it to
// Lexer::Type::word.
else
{
a._lextype = Lexer::Type::word;
}
if (found)
changes = true;
else
reconstructed.push_back (a);
}
// Not a FILTER pair.
else
reconstructed.push_back (a);
}
if (changes)
{
_args = reconstructed;
if (Context::getContext ().config.getInteger ("debug.parser") >= 2)
Context::getContext ().debug (dump ("CLI2::prepareFilter desugarFilterAttributes"));
}
}
////////////////////////////////////////////////////////////////////////////////
// /pattern/ --> description ~ 'pattern'
void CLI2::desugarFilterPatterns ()
{
bool changes = false;
std::vector <A2> reconstructed;
for (const auto& a : _args)
{
if (a._lextype == Lexer::Type::pattern &&
a.hasTag ("FILTER"))
{
changes = true;
A2 lhs ("description", Lexer::Type::dom);
lhs.tag ("FILTER");
reconstructed.push_back (lhs);
A2 op ("~", Lexer::Type::op);
op.tag ("FILTER");
reconstructed.push_back (op);
A2 rhs (a.attribute ("pattern"), Lexer::Type::string);
rhs.attribute ("flags", a.attribute ("flags"));
rhs.tag ("FILTER");
reconstructed.push_back (rhs);
}
else
reconstructed.push_back (a);
}
if (changes)
{
_args = reconstructed;
if (Context::getContext ().config.getInteger ("debug.parser") >= 2)
Context::getContext ().debug (dump ("CLI2::prepareFilter desugarFilterPatterns"));
}
}
////////////////////////////////////////////////////////////////////////////////
// An ID sequence can be:
//
// a single ID: 1
// a list of IDs: 1,3,5
// a list of IDs: 1 3 5
// a range: 5-10
// or a combination: 1,3,5-10 12
//
void CLI2::findIDs ()
{
bool changes = false;
if (Context::getContext ().config.getBoolean ("sugar"))
{
bool previousFilterArgWasAnOperator = false;
int filterCount = 0;
for (const auto& a : _args)
{
if (a.hasTag ("FILTER"))
{
++filterCount;
if (a._lextype == Lexer::Type::number)
{
// Skip any number that was preceded by an operator.
if (! previousFilterArgWasAnOperator)
{
changes = true;
std::string number = a.attribute ("raw");
_id_ranges.emplace_back(number, number);
}
}
else if (a._lextype == Lexer::Type::set)
{
// Split the ID list into elements.
auto elements = split (a.attribute ("raw"), ',');
for (auto& element : elements)
{
changes = true;
auto hyphen = element.find ('-');
if (hyphen != std::string::npos)
_id_ranges.emplace_back(element.substr (0, hyphen), element.substr (hyphen + 1));
else
_id_ranges.emplace_back(element, element);
}
}
std::string raw = a.attribute ("raw");
previousFilterArgWasAnOperator = (a._lextype == Lexer::Type::op &&
raw != "(" &&
raw != ")")
? true
: false;
}
}
// If no IDs were found, and no filter was specified, look for number/set
// listed as a MODIFICATION.
std::string command = getCommand ();
if (_id_ranges.empty() &&
filterCount == 0 &&
command != "add" &&
command != "log")
{
for (auto& a : _args)
{
if (a.hasTag ("MODIFICATION"))
{
std::string raw = a.attribute ("raw");
// For a number to be an ID, it must not contain any sign or floating
// point elements.
if (a._lextype == Lexer::Type::number &&
raw.find ('.') == std::string::npos &&
raw.find ('e') == std::string::npos &&
raw.find ('-') == std::string::npos)
{
changes = true;
a.unTag ("MODIFICATION");
a.tag ("FILTER");
_id_ranges.emplace_back(raw, raw);
}
else if (a._lextype == Lexer::Type::set)
{
a.unTag ("MODIFICATION");
a.tag ("FILTER");
// Split the ID list into elements.
auto elements = split (raw, ',');
for (const auto& element : elements)
{
changes = true;
auto hyphen = element.find ('-');
if (hyphen != std::string::npos)
_id_ranges.emplace_back(element.substr (0, hyphen), element.substr (hyphen + 1));
else
_id_ranges.emplace_back(element, element);
}
}
}
}
}
}
// Sugar-free.
else
{
std::vector <A2> reconstructed;
for (const auto& a : _args)
{
if (a.hasTag ("FILTER") &&
a._lextype == Lexer::Type::number)
{
changes = true;
A2 pair ("id:" + a.attribute ("raw"), Lexer::Type::pair);
pair.tag ("FILTER");
pair.decompose ();
reconstructed.push_back (pair);
}
else
reconstructed.push_back (a);
}
if (changes)
_args = reconstructed;
}
if (changes)
if (Context::getContext ().config.getInteger ("debug.parser") >= 2)
Context::getContext ().debug (dump ("CLI2::prepareFilter findIDs"));
}
////////////////////////////////////////////////////////////////////////////////
void CLI2::findUUIDs ()
{
bool changes = false;
if (Context::getContext ().config.getBoolean ("sugar"))
{
for (const auto& a : _args)
{
if (a._lextype == Lexer::Type::uuid &&
a.hasTag ("FILTER"))
{
changes = true;
_uuid_list.push_back (a.attribute ("raw"));
}
}
if (_uuid_list.empty())
{
for (auto& a : _args)
{
if (a._lextype == Lexer::Type::uuid &&
a.hasTag ("MODIFICATION"))
{
changes = true;
a.unTag ("MODIFICATION");
a.tag ("FILTER");
_uuid_list.push_back (a.attribute ("raw"));
}
}
}
}
// Sugar-free.
else
{
std::vector <A2> reconstructed;
for (const auto& a : _args)
{
if (a.hasTag ("FILTER") &&
a._lextype == Lexer::Type::uuid)
{
changes = true;
A2 pair ("uuid:" + a.attribute ("raw"), Lexer::Type::pair);
pair.tag ("FILTER");
pair.decompose ();
reconstructed.push_back (pair);
}
else
reconstructed.push_back (a);
}
if (changes)
_args = reconstructed;
}
if (changes)
if (Context::getContext ().config.getInteger ("debug.parser") >= 2)
Context::getContext ().debug (dump ("CLI2::prepareFilter findUUIDs"));
}
////////////////////////////////////////////////////////////////////////////////
void CLI2::insertIDExpr ()
{
// Skip completely if no ID/UUID was found. This is because below, '(' and ')'
// are inserted regardless of list size.
if (_id_ranges.empty() &&
_uuid_list.empty())
return;
// Find the *first* occurence of lexer type set/number/uuid, and replace it
// with a synthesized expression. All other occurences are eaten.
bool changes = false;
bool foundID = false;
std::vector <A2> reconstructed;
for (const auto& a : _args)
{
if ((a._lextype == Lexer::Type::set ||
a._lextype == Lexer::Type::number ||
a._lextype == Lexer::Type::uuid) &&
a.hasTag ("FILTER"))
{
if (! foundID)
{
foundID = true;
changes = true;
// Construct a single sequence that represents all _id_ranges and
// _uuid_list in one clause. This is essentially converting this:
//
// 1,2-3 uuid,uuid uuid 4
//
// into:
//
// (
// ( id == 1 )
// or ( ( id >= 2 ) and ( id <= 3 ) )
// or ( id == 4 )
// or ( uuid = $UUID )
// or ( uuid = $UUID )
// )
// Building block operators.
A2 openParen ("(", Lexer::Type::op); openParen.tag ("FILTER");
A2 closeParen (")", Lexer::Type::op); closeParen.tag ("FILTER");
A2 opOr ("or", Lexer::Type::op); opOr.tag ("FILTER");
A2 opAnd ("and", Lexer::Type::op); opAnd.tag ("FILTER");
A2 opSimilar ("=", Lexer::Type::op); opSimilar.tag ("FILTER");
A2 opEqual ("==", Lexer::Type::op); opEqual.tag ("FILTER");
A2 opGTE (">=", Lexer::Type::op); opGTE.tag ("FILTER");
A2 opLTE ("<=", Lexer::Type::op); opLTE.tag ("FILTER");
// Building block attributes.
A2 argID ("id", Lexer::Type::dom);
argID.tag ("FILTER");
A2 argUUID ("uuid", Lexer::Type::dom);
argUUID.tag ("FILTER");
reconstructed.push_back (openParen);
// Add all ID ranges.
for (auto r = _id_ranges.begin (); r != _id_ranges.end (); ++r)
{
if (r != _id_ranges.begin ())
reconstructed.push_back (opOr);
if (r->first == r->second)
{
reconstructed.push_back (openParen);
reconstructed.push_back (argID);
reconstructed.push_back (opEqual);
A2 value (r->first, Lexer::Type::number);
value.tag ("FILTER");
reconstructed.push_back (value);
reconstructed.push_back (closeParen);
}
else
{
bool ascending = true;
int low = strtol (r->first.c_str (), nullptr, 10);
int high = strtol (r->second.c_str (), nullptr, 10);
if (low <= high)
ascending = true;
else
ascending = false;
reconstructed.push_back (openParen);
reconstructed.push_back (argID);
reconstructed.push_back (opGTE);
A2 startValue ((ascending ? r->first : r->second), Lexer::Type::number);
startValue.tag ("FILTER");
reconstructed.push_back (startValue);
reconstructed.push_back (opAnd);
reconstructed.push_back (argID);
reconstructed.push_back (opLTE);
A2 endValue ((ascending ? r->second : r->first), Lexer::Type::number);
endValue.tag ("FILTER");
reconstructed.push_back (endValue);
reconstructed.push_back (closeParen);
}
}
// Combine the ID and UUID sections with 'or'.
if (!_id_ranges.empty() &&
!_uuid_list.empty())
reconstructed.push_back (opOr);
// Add all UUID list items.
for (auto u = _uuid_list.begin (); u != _uuid_list.end (); ++u)
{
if (u != _uuid_list.begin ())
reconstructed.push_back (opOr);
reconstructed.push_back (openParen);
reconstructed.push_back (argUUID);
reconstructed.push_back (opSimilar);
A2 value (*u, Lexer::Type::string);
value.tag ("FILTER");
reconstructed.push_back (value);
reconstructed.push_back (closeParen);
}
reconstructed.push_back (closeParen);
}
// No 'else' because all set/number/uuid args but the first are removed.
}
else
reconstructed.push_back (a);
}
if (changes)
{
_args = reconstructed;
if (Context::getContext ().config.getInteger ("debug.parser") >= 2)
Context::getContext ().debug (dump ("CLI2::prepareFilter insertIDExpr"));
}
}
////////////////////////////////////////////////////////////////////////////////
// FILTER Lexer::Type::word args will become part of an expression, and so they
// need to be Lexed.
void CLI2::lexFilterArgs ()
{
bool changes = false;
std::vector <A2> reconstructed;
for (const auto& a : _args)
{
if (a._lextype == Lexer::Type::word &&
a.hasTag ("FILTER"))
{
changes = true;
std::string lexeme;
Lexer::Type type;
Lexer lex (a.attribute ("raw"));
while (lex.token (lexeme, type))
{
A2 extra (lexeme, type);
extra.tag ("FILTER");
reconstructed.push_back (extra);
}
}
else
reconstructed.push_back (a);
}
if (changes)
{
_args = reconstructed;
if (Context::getContext ().config.getInteger ("debug.parser") >= 2)
Context::getContext ().debug (dump ("CLI2::prepareFilter lexFilterArgs"));
}
}
////////////////////////////////////////////////////////////////////////////////
// FILTER, Lexer::Type::word args are treated as search terms.
//
// Algorithm:
// Given:
// - task ... argX candidate argY
// Where:
// - neither argX nor argY are an operator, except (, ), and, or, xor
// - candidate is Lexer::Type::word
//
void CLI2::desugarFilterPlainArgs ()
{
// First walk the arg list looking for plain words that are not part of an
// existing expression.
auto prevprev = &_args[0];
auto prev = &_args[0];
for (auto& a : _args)
{
auto raw = a.attribute ("raw");
auto praw = prev->attribute ("raw");
auto ppraw = prevprev->attribute ("raw");
if ((prevprev->_lextype != Lexer::Type::op || // argX
ppraw == "(" ||
ppraw == ")" ||
ppraw == "and" ||
ppraw == "or" ||
ppraw == "xor") &&
(prev->_lextype == Lexer::Type::identifier || // candidate
prev->_lextype == Lexer::Type::word) && // candidate
prev->hasTag ("FILTER") && // candidate
(a._lextype != Lexer::Type::op || // argY
raw == "(" ||
raw == ")" ||
raw == "and" ||
raw == "or" ||
raw == "xor"))
{
prev->tag ("PLAIN");
}
prevprev = prev;
prev = &a;
}
// Cover the case where the *last* argument is a plain arg.
auto& penultimate = _args[_args.size () - 2];
auto praw = penultimate.attribute ("raw");
auto& last = _args[_args.size () - 1];
if ((penultimate._lextype != Lexer::Type::op || // argX
praw == "(" ||
praw == ")" ||
praw == "and" ||
praw == "or" ||
praw == "xor") &&
(last._lextype == Lexer::Type::identifier || // candidate
last._lextype == Lexer::Type::word) && // candidate
last.hasTag ("FILTER")) // candidate
{
last.tag ("PLAIN");
}
// Walk the list again, upgrading PLAIN args.
bool changes = false;
std::vector <A2> reconstructed;
for (const auto& a : _args)
{
if (a.hasTag ("PLAIN"))
{
changes = true;
A2 lhs ("description", Lexer::Type::dom);
lhs.attribute ("canonical", "description");
lhs.tag ("FILTER");
lhs.tag ("PLAIN");
reconstructed.push_back (lhs);
A2 op ("~", Lexer::Type::op);
op.tag ("FILTER");
op.tag ("PLAIN");
reconstructed.push_back (op);
std::string word = a.attribute ("raw");
Lexer::dequote (word);
A2 rhs (word, Lexer::Type::string);
rhs.tag ("FILTER");
rhs.tag ("PLAIN");
reconstructed.push_back (rhs);
}
else
reconstructed.push_back (a);
}
if (changes)
{
_args = reconstructed;
if (Context::getContext ().config.getInteger ("debug.parser") >= 2)
Context::getContext ().debug (dump ("CLI2::prepareFilter desugarFilterPlainArgs"));
}
}
////////////////////////////////////////////////////////////////////////////////
// Two consecutive FILTER, non-OP arguments that are not "(" or ")" need an
// "and" operator inserted between them.
//
// ) <non-op> --> ) and <non-op>
// <non-op> ( --> <non-op> <and> (
// ) ( --> ) and (
// <non-op> <non-op> --> <non-op> and <non-op>
//
void CLI2::insertJunctions ()
{
bool changes = false;
std::vector <A2> reconstructed;
auto prev = _args.begin ();
for (auto a = _args.begin (); a != _args.end (); ++a)
{
if (a->hasTag ("FILTER"))
{
// The prev iterator should be the first FILTER arg.
if (prev == _args.begin ())
prev = a;
// Insert AND between terms.
else if (a != prev)
{
if ((prev->_lextype != Lexer::Type::op && a->attribute ("raw") == "(") ||
(prev->_lextype != Lexer::Type::op && a->_lextype != Lexer::Type::op) ||
(prev->attribute ("raw") == ")" && a->_lextype != Lexer::Type::op) ||
(prev->attribute ("raw") == ")" && a->attribute ("raw") == "("))
{
A2 opOr ("and", Lexer::Type::op);
opOr.tag ("FILTER");
reconstructed.push_back (opOr);
changes = true;
}
}
// Previous FILTER arg.
prev = a;
}
reconstructed.push_back (*a);
}
if (changes)
{
_args = reconstructed;
if (Context::getContext ().config.getInteger ("debug.parser") >= 2)
Context::getContext ().debug (dump ("CLI2::prepareFilter insertJunctions"));
}
}
////////////////////////////////////////////////////////////////////////////////
// Look for situations that require defaults:
//
// 1. If no command was found, and no ID/UUID, and if rc.default.command is
// configured, inject the lexed tokens from rc.default.command.
//
// 2. If no command was found, but an ID/UUID was found, then assume a command
// of 'information'.
//
void CLI2::defaultCommand ()
{
// Scan the top-level branches for evidence of ID, UUID, overrides and other
// arguments.
bool changes = false;
bool found_command = false;
bool found_sequence = false;
for (const auto& a : _args)
{
std::string raw = a.attribute ("raw");
if (a.hasTag ("CMD"))
found_command = true;
if (a._lextype == Lexer::Type::uuid ||
a._lextype == Lexer::Type::number)
found_sequence = true;
}
// If no command was specified, then a command will be inserted.
if (! found_command)
{
// Default command.
if (! found_sequence)
{
// Apply overrides, if any.
std::string defaultCommand = Context::getContext ().config.get ("default.command");
if (!defaultCommand.empty())
{
// Modify _args, _original_args to be:
// <args0> [<def0> ...] <args1> [...]
std::vector <A2> reconstructedOriginals {_original_args[0]};
std::vector <A2> reconstructed {_args[0]};
std::string lexeme;
Lexer::Type type;
Lexer lex (defaultCommand);
while (lex.token (lexeme, type))
{
reconstructedOriginals.emplace_back(lexeme, type);
A2 cmd (lexeme, type);
cmd.tag ("DEFAULT");
reconstructed.push_back (cmd);
}
for (unsigned int i = 1; i < _original_args.size (); ++i)
reconstructedOriginals.push_back (_original_args[i]);
for (unsigned int i = 1; i < _args.size (); ++i)
reconstructed.push_back (_args[i]);
_original_args = reconstructedOriginals;
_args = reconstructed;
changes = true;
}
}
else
{
A2 info ("information", Lexer::Type::word);
info.tag ("ASSUMED");
_args.push_back (info);
changes = true;
}
}
if (changes &&
Context::getContext ().config.getInteger ("debug.parser") >= 2)
Context::getContext ().debug (dump ("CLI2::analyze defaultCommand"));
}
////////////////////////////////////////////////////////////////////////////////
// Some values are expressions, which need to be lexed. The best way to
// determine whether an expression is either a single value, or needs to be
// lexed, is to lex it and count the tokens. For example:
// now+1d
// This should be lexed and surrounded by parentheses:
// (
// now
// +
// 1d
// )
std::vector <A2> CLI2::lexExpression (const std::string& expression)
{
std::vector <A2> lexed;
std::string lexeme;
Lexer::Type type;
Lexer lex (expression);
while (lex.token (lexeme, type))
{
A2 token (lexeme, type);
token.tag ("FILTER");
lexed.push_back (token);
}
// If there were multiple tokens, parenthesize, because this expression will
// be used as a value.
if (lexed.size () > 1)
{
A2 openParen ("(", Lexer::Type::op);
openParen.tag ("FILTER");
A2 closeParen (")", Lexer::Type::op);
closeParen.tag ("FILTER");
lexed.insert (lexed.begin (), openParen);
lexed.push_back (closeParen);
}
return lexed;
}
////////////////////////////////////////////////////////////////////////////////
// vim: ts=2:sw=2