// PluralKit/PluralKit.Bot/CommandSystem/Parameters.cs (178 lines, 6.5 KiB, C#)

namespace PluralKit.Bot;
2019-10-05 05:41:00 +00:00
/// <summary>
/// Splits a raw command string into space-separated words, with support for quoted
/// multi-word arguments and dash-prefixed flags.
/// </summary>
/// <remarks>
/// A word is a "flag" when it starts with <c>-</c> and was not quoted. Flags are skipped by
/// <see cref="Pop"/> and <see cref="Peek"/> and are collected separately by <see cref="Flags"/>.
/// </remarks>
public class Parameters
{
    // Dictionary of (left, right) quote pairs
    // Each char in the string is an individual quote, multi-char strings imply "one of the following chars"
    private static readonly Dictionary<string, string> _quotePairs = new()
    {
        // Basic
        { "'", "'" }, // ASCII single quotes
        { "\"", "\"" }, // ASCII double quotes

        // "Smart quotes"
        // Specifically ignore the left/right status of the quotes and match any combination of them
        // Left string also includes "low" quotes to allow for the low-high style used in some locales
        { "\u201C\u201D\u201F\u201E", "\u201C\u201D\u201F" }, // double quotes
        { "\u2018\u2019\u201B\u201A", "\u2018\u2019\u201B" }, // single quotes

        // Chevrons (normal and "fullwidth" variants)
        { "\u00AB\u300A", "\u00BB\u300B" }, // double chevrons, pointing away (<<text>>)
        // Closing char here must be U+00AB («); U+00AA is the unrelated "ª" ordinal indicator
        { "\u00BB\u300B", "\u00AB\u300A" }, // double chevrons, pointing together (>>text<<)
        { "\u2039\u3008", "\u203A\u3009" }, // single chevrons, pointing away (<text>)
        { "\u203A\u3009", "\u2039\u3008" }, // single chevrons, pointing together (>text<)

        // Other
        { "\u300C\u300E", "\u300D\u300F" } // corner brackets (Japanese/Chinese)
    };

    private ISet<string> _flags; // Only parsed when requested first time
    private int _ptr; // Index into FullCommand where the next Pop/Peek/Remainder starts reading

    /// <summary>
    /// The command text being parsed. This is the constructor argument with a space inserted
    /// before every newline, so it is not necessarily identical to what the caller passed in.
    /// </summary>
    public string FullCommand { get; }

    /// <summary>Location of a single word inside <see cref="FullCommand"/>.</summary>
    private readonly struct WordPosition
    {
        // Start of the word (for quoted words: first char after the opening quote)
        internal readonly int startPos;

        // End of the word, exclusive (for quoted words: index of the closing quote)
        internal readonly int endPos;

        // How much to advance word pointer afterwards to point at the start of the *next* word
        internal readonly int advanceAfterWord;

        // Whether the word was wrapped in a recognised quote pair
        internal readonly bool wasQuoted;

        public WordPosition(int startPos, int endPos, int advanceAfterWord, bool wasQuoted)
        {
            this.startPos = startPos;
            this.endPos = endPos;
            this.advanceAfterWord = advanceAfterWord;
            this.wasQuoted = wasQuoted;
        }
    }

    /// <summary>Creates a parser positioned at the start of <paramref name="cmd"/>.</summary>
    /// <param name="cmd">The raw command text.</param>
    public Parameters(string cmd)
    {
        // This is a SUPER dirty hack to avoid having to match both spaces and newlines in the word detection below
        // Instead, we just add a space before every newline (which then gets stripped out later).
        FullCommand = cmd.Replace("\n", " \n");
        _ptr = 0;
    }

    /// <summary>
    /// Returns the next non-flag word and advances the read position past it.
    /// </summary>
    /// <returns>The trimmed word (without surrounding quotes), or <c>""</c> if none remain.</returns>
    public string Pop() => NextArgument(ref _ptr);

    /// <summary>
    /// Returns the next non-flag word without moving the read position.
    /// </summary>
    /// <returns>The trimmed word (without surrounding quotes), or <c>""</c> if none remain.</returns>
    public string Peek()
    {
        // Work on a copy of the pointer so the real one stays where it is
        var ptr = _ptr;
        return NextArgument(ref ptr);
    }

    /// <summary>
    /// Returns the set of flag names found anywhere in the command, regardless of the current
    /// read position. Names are lower-cased and have their leading dashes removed.
    /// The set is computed on first call and cached.
    /// </summary>
    public ISet<string> Flags()
    {
        if (_flags == null) ParseFlags();
        return _flags;
    }

    /// <summary>
    /// Returns everything from the current read position to the end of the command, trimmed.
    /// </summary>
    /// <param name="skipFlags">
    /// When <c>true</c>, any flags directly at the read position are skipped first (this moves
    /// the read position). Flags appearing later in the text are left in the result.
    /// </param>
    public string Remainder(bool skipFlags = true)
    {
        if (skipFlags)
        {
            // Skip all *leading* flags when taking the remainder
            while (NextWordPosition(_ptr) is { } wp && IsFlag(wp))
                _ptr = wp.endPos + wp.advanceAfterWord;
        }

        // _ptr can sit one past the end after a quoted final word, hence the clamp
        return FullCommand.Substring(Math.Min(_ptr, FullCommand.Length)).Trim();
    }

    // Scans the whole command (from index 0) and fills _flags with every flag name found.
    private void ParseFlags()
    {
        _flags = new HashSet<string>();

        var ptr = 0;
        while (NextWordPosition(ptr) is { } wp)
        {
            ptr = wp.endPos + wp.advanceAfterWord;

            // Only unquoted words starting with a dash count as flags
            if (!IsFlag(wp)) continue;

            // Find the *end* of the flag start (technically allowing arbitrary amounts of dashes)
            var flagNameStart = wp.startPos;
            while (flagNameStart < wp.endPos && FullCommand[flagNameStart] == '-')
                flagNameStart++;

            // Then add the word to the flag set (a word of only dashes has no name and is dropped)
            var word = FullCommand.Substring(flagNameStart, wp.endPos - flagNameStart).Trim();
            if (word.Length > 0)
                _flags.Add(word.ToLowerInvariant());
        }
    }

    // Shared implementation of Pop/Peek: reads words starting at ptr, skipping flags,
    // and leaves ptr just past the last word it consumed.
    private string NextArgument(ref int ptr)
    {
        while (NextWordPosition(ptr) is { } pos)
        {
            ptr = pos.endPos + pos.advanceAfterWord;
            if (IsFlag(pos)) continue;
            return FullCommand.Substring(pos.startPos, pos.endPos - pos.startPos).Trim();
        }

        return "";
    }

    // A flag is an unquoted word whose first character is a dash.
    private bool IsFlag(WordPosition word) => !word.wasQuoted && FullCommand[word.startPos] == '-';

    // Finds the word starting at or after the given index, or null if only spaces (or nothing) remain.
    private WordPosition? NextWordPosition(int position)
    {
        // Skip leading spaces before actual content
        while (position < FullCommand.Length && FullCommand[position] == ' ') position++;

        // Is this the end of the string?
        if (FullCommand.Length <= position) return null;

        // Is this a quoted word?
        if (TryCheckQuote(FullCommand[position], out var endQuotes))
        {
            // We found an opening quote - find the first instance of one of the corresponding end quotes
            var endQuotePosition = -1;
            for (var i = position + 1; i < FullCommand.Length; i++)
            {
                if (!endQuotes.Contains(FullCommand[i])) continue;
                endQuotePosition = i;
                break;
            }

            // Only treat this as a quoted word if a closing quote exists AND it is followed by
            // EOL or a space. Otherwise we fall through to the unquoted word handler below.
            // (Without the "exists" check, -1 + 1 would index FullCommand[0] and could yield
            // a word with a negative end position.)
            if (endQuotePosition != -1 &&
                (endQuotePosition + 1 == FullCommand.Length || FullCommand[endQuotePosition + 1] == ' '))
                return new WordPosition(position + 1, endQuotePosition, 2, true);
        }

        // Not a quoted word, just find the next space and return if it's the end of the command
        var wordEnd = FullCommand.IndexOf(' ', position + 1);
        return wordEnd == -1
            ? new WordPosition(position, FullCommand.Length, 0, false)
            : new WordPosition(position, wordEnd, 1, false);
    }

    // Looks up which closing quote characters pair with the given opening quote character.
    // Returns false (and a null out value) if the character is not a known opening quote.
    private bool TryCheckQuote(char potentialLeftQuote, out string correspondingRightQuotes)
    {
        foreach (var (left, right) in _quotePairs)
        {
            if (!left.Contains(potentialLeftQuote)) continue;
            correspondingRightQuotes = right;
            return true;
        }

        correspondingRightQuotes = null;
        return false;
    }
}