192 lines
3.9 KiB
C++
192 lines
3.9 KiB
C++
/*
|
|
* Copyright (C) 2003-2013 The Music Player Daemon Project
|
|
* http://www.musicpd.org
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
* GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License along
|
|
* with this program; if not, write to the Free Software Foundation, Inc.,
|
|
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
|
|
*/
|
|
|
|
#include "config.h"
|
|
#include "Tokenizer.hxx"
|
|
#include "CharUtil.hxx"
|
|
#include "StringUtil.hxx"
|
|
#include "Error.hxx"
|
|
#include "Domain.hxx"
|
|
|
|
#include <glib.h>
|
|
|
|
/* the error domain passed to Error::Set() by every tokenizer method
   in this file */
static constexpr Domain tokenizer_domain("tokenizer");
|
|
|
|
static inline bool
|
|
valid_word_first_char(char ch)
|
|
{
|
|
return IsAlphaASCII(ch);
|
|
}
|
|
|
|
static inline bool
|
|
valid_word_char(char ch)
|
|
{
|
|
return IsAlphaNumericASCII(ch) || ch == '_';
|
|
}
|
|
|
|
char *
|
|
Tokenizer::NextWord(Error &error)
|
|
{
|
|
char *const word = input;
|
|
|
|
if (*input == 0)
|
|
return nullptr;
|
|
|
|
/* check the first character */
|
|
|
|
if (!valid_word_first_char(*input)) {
|
|
error.Set(tokenizer_domain, "Letter expected");
|
|
return nullptr;
|
|
}
|
|
|
|
/* now iterate over the other characters until we find a
|
|
whitespace or end-of-string */
|
|
|
|
while (*++input != 0) {
|
|
if (IsWhitespaceOrNull(*input)) {
|
|
/* a whitespace: the word ends here */
|
|
*input = 0;
|
|
/* skip all following spaces, too */
|
|
input = strchug_fast(input + 1);
|
|
break;
|
|
}
|
|
|
|
if (!valid_word_char(*input)) {
|
|
error.Set(tokenizer_domain, "Invalid word character");
|
|
return nullptr;
|
|
}
|
|
}
|
|
|
|
/* end of string: the string is already null-terminated
|
|
here */
|
|
|
|
return word;
|
|
}
|
|
|
|
/**
 * May this character appear in an unquoted parameter?
 *
 * Every byte whose unsigned value is above 0x20 is accepted (which
 * rejects the null byte, the ASCII control characters and the
 * space), with the exception of the double and the single quote.
 *
 * @param ch the character to be checked
 * @return true if the character is allowed
 */
static inline bool
valid_unquoted_char(char ch)
{
	/* compare the unsigned value, so bytes >= 0x80 do not look
	   like negative numbers where plain "char" is signed */
	const unsigned char byte = static_cast<unsigned char>(ch);

	return byte > 0x20 && ch != '"' && ch != '\'';
}
|
|
|
|
char *
|
|
Tokenizer::NextUnquoted(Error &error)
|
|
{
|
|
char *const word = input;
|
|
|
|
if (*input == 0)
|
|
return nullptr;
|
|
|
|
/* check the first character */
|
|
|
|
if (!valid_unquoted_char(*input)) {
|
|
error.Set(tokenizer_domain, "Invalid unquoted character");
|
|
return nullptr;
|
|
}
|
|
|
|
/* now iterate over the other characters until we find a
|
|
whitespace or end-of-string */
|
|
|
|
while (*++input != 0) {
|
|
if (IsWhitespaceOrNull(*input)) {
|
|
/* a whitespace: the word ends here */
|
|
*input = 0;
|
|
/* skip all following spaces, too */
|
|
input = strchug_fast(input + 1);
|
|
break;
|
|
}
|
|
|
|
if (!valid_unquoted_char(*input)) {
|
|
error.Set(tokenizer_domain,
|
|
"Invalid unquoted character");
|
|
return nullptr;
|
|
}
|
|
}
|
|
|
|
/* end of string: the string is already null-terminated
|
|
here */
|
|
|
|
return word;
|
|
}
|
|
|
|
char *
|
|
Tokenizer::NextString(Error &error)
|
|
{
|
|
char *const word = input, *dest = input;
|
|
|
|
if (*input == 0)
|
|
/* end of line */
|
|
return nullptr;
|
|
|
|
/* check for the opening " */
|
|
|
|
if (*input != '"') {
|
|
error.Set(tokenizer_domain, "'\"' expected");
|
|
return nullptr;
|
|
}
|
|
|
|
++input;
|
|
|
|
/* copy all characters */
|
|
|
|
while (*input != '"') {
|
|
if (*input == '\\')
|
|
/* the backslash escapes the following
|
|
character */
|
|
++input;
|
|
|
|
if (*input == 0) {
|
|
/* return input-1 so the caller can see the
|
|
difference between "end of line" and
|
|
"error" */
|
|
--input;
|
|
error.Set(tokenizer_domain, "Missing closing '\"'");
|
|
return nullptr;
|
|
}
|
|
|
|
/* copy one character */
|
|
*dest++ = *input++;
|
|
}
|
|
|
|
/* the following character must be a whitespace (or end of
|
|
line) */
|
|
|
|
++input;
|
|
if (!IsWhitespaceOrNull(*input)) {
|
|
error.Set(tokenizer_domain,
|
|
"Space expected after closing '\"'");
|
|
return nullptr;
|
|
}
|
|
|
|
/* finish the string and return it */
|
|
|
|
*dest = 0;
|
|
input = strchug_fast(input);
|
|
return word;
|
|
}
|
|
|
|
char *
|
|
Tokenizer::NextParam(Error &error)
|
|
{
|
|
if (*input == '"')
|
|
return NextString(error);
|
|
else
|
|
return NextUnquoted(error);
|
|
}
|