mpd/src/util/Tokenizer.cxx

177 lines
4.0 KiB
C++
Raw Normal View History

/*
2017-01-17 11:54:55 +01:00
* Copyright (C) 2009-2014 Max Kellermann <max.kellermann@gmail.com>
*
2014-02-19 10:41:48 +01:00
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
*
2014-02-19 10:41:48 +01:00
* - Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
*
2014-02-19 10:41:48 +01:00
* - Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the
* distribution.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
* ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
* FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
* FOUNDATION OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
* (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
* SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
* STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
* OF THE POSSIBILITY OF SUCH DAMAGE.
*/
2013-04-08 23:51:39 +02:00
#include "Tokenizer.hxx"
#include "CharUtil.hxx"
#include "StringStrip.hxx"
#include <stdexcept>
/**
 * May this character start a "word" token?  The decision is delegated
 * to IsAlphaASCII().
 */
static inline bool
valid_word_first_char(char ch)
{
	const bool is_letter = IsAlphaASCII(ch);
	return is_letter;
}
/**
 * May this character appear inside a "word" token (after the first
 * character)?  Accepted are the underscore and everything that
 * IsAlphaNumericASCII() accepts.
 */
static inline bool
valid_word_char(char ch)
{
	if (ch == '_')
		return true;

	return IsAlphaNumericASCII(ch);
}
char *
Tokenizer::NextWord()
{
2013-04-08 23:51:39 +02:00
char *const word = input;
if (*input == 0)
2013-04-08 23:51:39 +02:00
return nullptr;
/* check the first character */
if (!valid_word_first_char(*input))
throw std::runtime_error("Letter expected");
/* now iterate over the other characters until we find a
whitespace or end-of-string */
while (*++input != 0) {
2014-08-07 15:05:27 +02:00
if (IsWhitespaceFast(*input)) {
/* a whitespace: the word ends here */
*input = 0;
/* skip all following spaces, too */
input = StripLeft(input + 1);
break;
}
if (!valid_word_char(*input))
throw std::runtime_error("Invalid word character");
}
/* end of string: the string is already null-terminated
here */
return word;
}
/**
 * May this character appear in an unquoted parameter?  Rejected are
 * all byte values up to and including 0x20 (which covers the null
 * byte and the space) and both quote characters.
 */
static inline bool
valid_unquoted_char(char ch)
{
	/* compare the unsigned byte value so bytes >= 0x80 are not
	   mistaken for negative numbers where char is signed */
	const auto code = static_cast<unsigned char>(ch);
	if (code <= 0x20)
		return false;

	return ch != '"' && ch != '\'';
}
char *
Tokenizer::NextUnquoted()
{
2013-04-08 23:51:39 +02:00
char *const word = input;
if (*input == 0)
2013-04-08 23:51:39 +02:00
return nullptr;
/* check the first character */
if (!valid_unquoted_char(*input))
throw std::runtime_error("Invalid unquoted character");
/* now iterate over the other characters until we find a
whitespace or end-of-string */
while (*++input != 0) {
2014-08-07 15:05:27 +02:00
if (IsWhitespaceFast(*input)) {
/* a whitespace: the word ends here */
*input = 0;
/* skip all following spaces, too */
input = StripLeft(input + 1);
break;
}
if (!valid_unquoted_char(*input))
throw std::runtime_error("Invalid unquoted character");
}
/* end of string: the string is already null-terminated
here */
return word;
}
/**
 * Extract the next double-quoted string from the input buffer.
 *
 * The string is unescaped in place: a backslash makes the following
 * character literal, and the result is written over the buffer
 * starting at the position of the opening quote.  On success, the
 * read position is moved to whatever StripLeft() returns for the text
 * after the closing quote.
 *
 * Throws std::runtime_error if the opening quote is missing, if the
 * input ends before the closing quote, or if the closing quote is
 * followed by something other than whitespace or end of line.  When
 * one of the latter two errors is thrown, part of the buffer may
 * already have been overwritten by the unescaped copy.
 *
 * @return a pointer to the null-terminated, unescaped string inside
 * the input buffer, or nullptr if the input is already at its end
 */
char *
Tokenizer::NextString()
{
	if (*input == 0)
		/* end of line */
		return nullptr;

	/* check for the opening " */
	if (*input != '"')
		throw std::runtime_error("'\"' expected");

	/* the result overwrites the buffer from the opening quote on;
	   "dest" never overtakes "input" because at least the quote
	   itself has been skipped */
	char *const word = input;
	char *dest = input;

	++input;

	/* copy all characters */
	while (*input != '"') {
		if (*input == '\\')
			/* the backslash escapes the following
			   character */
			++input;

		/* checked after the backslash handling so that a
		   trailing backslash is caught as well */
		if (*input == 0)
			throw std::runtime_error("Missing closing '\"'");

		/* copy one character */
		*dest++ = *input++;
	}

	/* the following character must be a whitespace (or end of
	   line); the end-of-line case is tested explicitly instead of
	   depending on how IsWhitespaceFast() classifies the null
	   byte */
	++input;
	if (*input != 0 && !IsWhitespaceFast(*input))
		throw std::runtime_error("Space expected after closing '\"'");

	/* finish the string and return it */
	*dest = 0;
	input = StripLeft(input);
	return word;
}
char *
Tokenizer::NextParam()
{
2013-04-08 23:51:39 +02:00
if (*input == '"')
return NextString();
else
return NextUnquoted();
}