// SPDX-License-Identifier: BSD-2-Clause // author: Max Kellermann #include "UriExtract.hxx" #include "CharUtil.hxx" #include "StringSplit.hxx" #include static constexpr bool IsValidSchemeStart(char ch) { return IsLowerAlphaASCII(ch); } static constexpr bool IsValidSchemeChar(char ch) { return IsLowerAlphaASCII(ch) || IsDigitASCII(ch) || ch == '+' || ch == '.' || ch == '-'; } [[gnu::pure]] static bool IsValidScheme(std::string_view p) noexcept { if (p.empty() || !IsValidSchemeStart(p.front())) return false; for (size_t i = 1; i < p.size(); ++i) if (!IsValidSchemeChar(p[i])) return false; return true; } /** * Return the URI part after the scheme specification (and after the * double slash). */ [[gnu::pure]] static std::string_view uri_after_scheme(std::string_view uri) noexcept { if (uri.length() > 2 && uri[0] == '/' && uri[1] == '/' && uri[2] != '/') return uri.substr(2); auto colon = uri.find(':'); if (colon == std::string_view::npos || !IsValidScheme(uri.substr(0, colon))) return {}; uri = uri.substr(colon + 1); if (uri[0] != '/' || uri[1] != '/') return {}; return uri.substr(2); } bool uri_has_scheme(std::string_view uri) noexcept { return !uri_get_scheme(uri).empty(); } std::string_view uri_get_scheme(std::string_view uri) noexcept { auto end = uri.find("://"); if (end == std::string_view::npos) return {}; return uri.substr(0, end); } bool uri_is_relative_path(const char *uri) noexcept { return !uri_has_scheme(uri) && *uri != '/'; } std::string_view uri_get_path_query_fragment(std::string_view uri) noexcept { auto ap = uri_after_scheme(uri); if (ap.data() != nullptr) { auto slash = ap.find('/'); if (slash == std::string_view::npos) return {}; return ap.substr(slash); } return uri; } [[gnu::pure]] static std::string_view UriWithoutQueryString(std::string_view uri) noexcept { return Split(uri, '?').first; } std::string_view uri_get_path(std::string_view uri) noexcept { auto path = uri_get_path_query_fragment(uri); if (path.data() == nullptr || path.data() == uri.data()) /* preserve query and fragment if this URI doesn't have a scheme; the question mark may be part of the file name, after all */ return path; auto end = path.find('?'); if (end == std::string_view::npos) end = path.find('#'); return path.substr(0, end); } /* suffixes should be ascii only characters */ std::string_view uri_get_suffix(std::string_view _uri) noexcept { const auto uri = UriWithoutQueryString(_uri); const auto dot = uri.rfind('.'); if (dot == uri.npos || dot == 0 || uri[dot - 1] == '/' || uri[dot - 1] == '\\') return {}; auto suffix = uri.substr(dot + 1); if (suffix.find('/') != suffix.npos || suffix.find('\\') != suffix.npos) /* this was not the last path segment */ return {}; return suffix; } const char * uri_get_fragment(const char *uri) noexcept { const char *fragment = std::strchr(uri, '#'); if (fragment == nullptr) return nullptr; return fragment + 1; }