2019-08-09 15:54:13 +02:00
|
|
|
/*
|
|
|
|
* Copyright 2008-2019 Max Kellermann <max.kellermann@gmail.com>
|
|
|
|
*
|
|
|
|
* Redistribution and use in source and binary forms, with or without
|
|
|
|
* modification, are permitted provided that the following conditions
|
|
|
|
* are met:
|
|
|
|
*
|
|
|
|
* - Redistributions of source code must retain the above copyright
|
|
|
|
* notice, this list of conditions and the following disclaimer.
|
|
|
|
*
|
|
|
|
* - Redistributions in binary form must reproduce the above copyright
|
|
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
|
|
* documentation and/or other materials provided with the
|
|
|
|
* distribution.
|
|
|
|
*
|
|
|
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
|
|
* ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
|
|
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
|
|
|
|
* FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
|
|
|
|
* FOUNDATION OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
|
|
|
|
* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
|
|
|
|
* (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
|
|
|
|
* SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
|
|
|
|
* HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
|
|
|
|
* STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
|
|
|
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED
|
|
|
|
* OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include "UriExtract.hxx"
#include "CharUtil.hxx"
#include "StringView.hxx"

#include <cstring>
#include <string_view>

#include <string.h>
|
|
|
|
|
|
|
|
static constexpr bool
|
|
|
|
IsValidSchemeStart(char ch)
|
|
|
|
{
|
|
|
|
return IsLowerAlphaASCII(ch);
|
|
|
|
}
|
|
|
|
|
|
|
|
static constexpr bool
|
|
|
|
IsValidSchemeChar(char ch)
|
|
|
|
{
|
|
|
|
return IsLowerAlphaASCII(ch) || IsDigitASCII(ch) ||
|
|
|
|
ch == '+' || ch == '.' || ch == '-';
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
 * Check whether the given string is a syntactically valid URI
 * scheme: it must be non-empty, begin with a character accepted by
 * IsValidSchemeStart() and continue only with characters accepted
 * by IsValidSchemeChar().
 */
gcc_pure
static bool
IsValidScheme(std::string_view p) noexcept
{
	if (p.empty())
		return false;

	if (!IsValidSchemeStart(p.front()))
		return false;

	/* all remaining characters must be valid scheme characters */
	for (const char ch : p.substr(1))
		if (!IsValidSchemeChar(ch))
			return false;

	return true;
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Return the URI part after the scheme specification (and after the
|
|
|
|
* double slash).
|
|
|
|
*/
|
|
|
|
gcc_pure
|
2020-03-13 18:15:21 +01:00
|
|
|
static std::string_view
|
|
|
|
uri_after_scheme(std::string_view uri) noexcept
|
2019-08-09 15:54:13 +02:00
|
|
|
{
|
2020-03-13 18:15:21 +01:00
|
|
|
if (uri.length() > 2 &&
|
|
|
|
uri[0] == '/' && uri[1] == '/' && uri[2] != '/')
|
|
|
|
return uri.substr(2);
|
|
|
|
|
|
|
|
auto colon = uri.find(':');
|
|
|
|
if (colon == std::string_view::npos ||
|
|
|
|
!IsValidScheme(uri.substr(0, colon)))
|
|
|
|
return {};
|
|
|
|
|
|
|
|
uri = uri.substr(colon + 1);
|
|
|
|
if (uri[0] != '/' || uri[1] != '/')
|
|
|
|
return {};
|
|
|
|
|
|
|
|
return uri.substr(2);
|
2019-08-09 15:54:13 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
bool
|
|
|
|
uri_has_scheme(const char *uri) noexcept
|
|
|
|
{
|
2020-03-13 18:11:29 +01:00
|
|
|
return !uri_get_scheme(uri).empty();
|
2019-08-09 15:54:13 +02:00
|
|
|
}
|
|
|
|
|
2020-03-13 18:11:29 +01:00
|
|
|
/**
 * Return the part of the URI preceding the first occurrence of
 * "://".
 *
 * @return the text before "://" (not validated in any way), or a
 * default-constructed (empty) view if the URI does not contain
 * "://"
 */
std::string_view
uri_get_scheme(std::string_view uri) noexcept
{
	const auto separator = uri.find("://");

	return separator != std::string_view::npos
		? uri.substr(0, separator)
		: std::string_view{};
}
|
|
|
|
|
2019-09-07 23:57:33 +02:00
|
|
|
bool
|
|
|
|
uri_is_relative_path(const char *uri) noexcept
|
|
|
|
{
|
|
|
|
return !uri_has_scheme(uri) && *uri != '/';
|
|
|
|
}
|
|
|
|
|
2020-03-13 18:15:21 +01:00
|
|
|
std::string_view
|
|
|
|
uri_get_path(std::string_view uri) noexcept
|
2019-08-09 15:54:13 +02:00
|
|
|
{
|
2020-03-13 18:15:21 +01:00
|
|
|
auto ap = uri_after_scheme(uri);
|
|
|
|
if (ap.data() != nullptr) {
|
|
|
|
auto slash = ap.find('/');
|
|
|
|
if (slash == std::string_view::npos)
|
|
|
|
return {};
|
|
|
|
return ap.substr(slash);
|
|
|
|
}
|
2019-08-09 15:54:13 +02:00
|
|
|
|
|
|
|
return uri;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
 * Return the file name suffix of the given URI, i.e. the text after
 * the last dot.  Suffixes should be ASCII-only characters.
 *
 * The returned pointer refers into the given string and therefore
 * includes everything up to its end.
 *
 * @return the suffix (without the dot), or nullptr if there is no
 * dot, if the last dot is the first character or directly follows a
 * slash/backslash, or if a slash/backslash appears after the last dot
 */
const char *
uri_get_suffix(const char *uri) noexcept
{
	const char *const dot = std::strrchr(uri, '.');
	if (dot == nullptr)
		return nullptr;

	/* a dot at the very beginning does not start a suffix */
	if (dot == uri)
		return nullptr;

	/* neither does a dot at the beginning of a path segment */
	const char before = dot[-1];
	if (before == '/' || before == '\\')
		return nullptr;

	const char *const result = dot + 1;

	/* the last dot was inside a directory name, not the file name */
	return strpbrk(result, "/\\") == nullptr
		? result
		: nullptr;
}
|
|
|
|
|
|
|
|
const char *
|
|
|
|
uri_get_suffix(const char *uri, UriSuffixBuffer &buffer) noexcept
|
|
|
|
{
|
|
|
|
const char *suffix = uri_get_suffix(uri);
|
|
|
|
if (suffix == nullptr)
|
|
|
|
return nullptr;
|
|
|
|
|
2020-05-01 04:25:55 +02:00
|
|
|
const char *q = std::strchr(suffix, '?');
|
2019-08-09 15:54:13 +02:00
|
|
|
if (q != nullptr && size_t(q - suffix) < sizeof(buffer.data)) {
|
|
|
|
memcpy(buffer.data, suffix, q - suffix);
|
|
|
|
buffer.data[q - suffix] = 0;
|
|
|
|
suffix = buffer.data;
|
|
|
|
}
|
|
|
|
|
|
|
|
return suffix;
|
|
|
|
}
|
2019-08-09 16:14:17 +02:00
|
|
|
|
|
|
|
/**
 * Return the fragment of the given URI, i.e. the text following the
 * first '#'.
 *
 * @return a pointer (into the given string) to the character after
 * the first '#', or nullptr if the string contains no '#'
 */
const char *
uri_get_fragment(const char *uri) noexcept
{
	const char *const hash = std::strchr(uri, '#');

	return hash != nullptr
		? hash + 1
		: nullptr;
}
|