/*
 * Copyright 2003-2016 The Music Player Daemon Project
 * http://www.musicpd.org
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
 */

#include "config.h"
#include "Collate.hxx"
#include "util/AllocatedString.hxx"

#ifdef HAVE_ICU
#include "Util.hxx"
#include "util/AllocatedArray.hxx"
#include "util/ConstBuffer.hxx"
#include "util/RuntimeError.hxx"

#include <unicode/ucol.h>
#include <unicode/ustring.h>
#else
#include <algorithm>
#include <ctype.h>
#endif

#ifdef WIN32
#include "Win32.hxx"
#include "util/AllocatedString.hxx"
#include <windows.h>
#endif

#include <memory>
#include <stdexcept>

#include <assert.h>
#include <string.h>

#ifdef HAVE_ICU
/**
 * The process-wide ICU collator; opened by IcuCollateInit() and
 * closed by IcuCollateFinish().  It is nullptr while no collator is
 * open.
 */
static UCollator *collator;
#endif

#ifdef HAVE_ICU

/**
 * Open the global ICU collator (locale name "").  Must not be called
 * while a collator is already open.
 *
 * Throws std::runtime_error (via FormatRuntimeError) if ucol_open()
 * fails.
 */
void
IcuCollateInit()
{
	assert(collator == nullptr);

	UErrorCode code = U_ZERO_ERROR;
	collator = ucol_open("", &code);
	if (collator == nullptr)
		throw FormatRuntimeError("ucol_open() failed: %s",
					 u_errorName(code));
}

/**
 * Close the global ICU collator which was opened by
 * IcuCollateInit().
 */
void
IcuCollateFinish()
{
	assert(collator != nullptr);

	ucol_close(collator);

	/* don't keep a dangling pointer around: this keeps the
	   assertions in this file meaningful and allows calling
	   IcuCollateInit() again */
	collator = nullptr;
}

#endif

/**
 * Compare two UTF-8 strings for sorting.
 *
 * Depending on the build configuration, this uses the ICU collator,
 * the Windows API function CompareStringEx() or plain strcoll().
 *
 * @param a the first string (must not be nullptr)
 * @param b the second string (must not be nullptr)
 * @return a negative value if a sorts before b, a positive value if
 * a sorts after b, and 0 if they are considered equal
 */
gcc_pure
int
IcuCollate(const char *a, const char *b)
{
#if !CLANG_CHECK_VERSION(3,6)
	/* disabled on clang due to -Wtautological-pointer-compare */
	assert(a != nullptr);
	assert(b != nullptr);
#endif

#ifdef HAVE_ICU
	assert(collator != nullptr);

#if U_ICU_VERSION_MAJOR_NUM >= 50
	/* the error code is not evaluated; only the comparison
	   result is passed on to the caller */
	UErrorCode code = U_ZERO_ERROR;
	return (int)ucol_strcollUTF8(collator, a, -1, b, -1, &code);
#else
	/* fall back to ucol_strcoll() */

	try {
		const auto au = UCharFromUTF8(a);
		const auto bu = UCharFromUTF8(b);

		return ucol_strcoll(collator, au.begin(), au.size(),
				    bu.begin(), bu.size());
	} catch (const std::runtime_error &) {
		/* fall back to plain strcasecmp() */
		return strcasecmp(a, b);
	}
#endif

#elif defined(WIN32)
	AllocatedString<wchar_t> wa = nullptr, wb = nullptr;

	try {
		wa = MultiByteToWideChar(CP_UTF8, a);
	} catch (const std::runtime_error &) {
		/* "a" could not be converted: it sorts before "b" if
		   "b" can be converted; if neither can, they are
		   reported as equal */
		try {
			wb = MultiByteToWideChar(CP_UTF8, b);
			return -1;
		} catch (const std::runtime_error &) {
			return 0;
		}
	}

	try {
		wb = MultiByteToWideChar(CP_UTF8, b);
	} catch (const std::runtime_error &) {
		/* only "b" could not be converted: "a" sorts after it */
		return 1;
	}

	auto result = CompareStringEx(LOCALE_NAME_INVARIANT,
				      LINGUISTIC_IGNORECASE,
				      wa.c_str(), -1,
				      wb.c_str(), -1,
				      nullptr, nullptr, 0);
	if (result != 0)
		/* "To maintain the C runtime convention of
		   comparing strings, the value 2 can be subtracted
		   from a nonzero return value." */
		result -= 2;

	return result;
#else
	return strcoll(a, b);
#endif
}

/**
 * Transform a UTF-8 string into a form suitable for comparing
 * strings while ignoring case (ICU: u_strFoldCase(); Windows:
 * LCMapStringEx(); otherwise: strxfrm()).
 *
 * If the transformation fails, a plain copy of the input string is
 * returned instead.
 *
 * @param src the source string (must not be nullptr)
 * @return a newly allocated string
 */
AllocatedString<>
IcuCaseFold(const char *src)
try {
#ifdef HAVE_ICU
	assert(collator != nullptr);
#if !CLANG_CHECK_VERSION(3,6)
	/* disabled on clang due to -Wtautological-pointer-compare */
	assert(src != nullptr);
#endif

	const auto u = UCharFromUTF8(src);
	if (u.IsNull())
		return AllocatedString<>::Duplicate(src);

	AllocatedArray<UChar> folded(u.size() * 2u);

	UErrorCode error_code = U_ZERO_ERROR;
	size_t folded_length = u_strFoldCase(folded.begin(), folded.size(),
					     u.begin(), u.size(),
					     U_FOLD_CASE_DEFAULT,
					     &error_code);

	/* use U_FAILURE() instead of comparing with U_ZERO_ERROR:
	   ICU warnings (e.g. U_STRING_NOT_TERMINATED_WARNING when
	   the result fills the buffer exactly) still leave a valid
	   result in the buffer; real errors such as
	   U_BUFFER_OVERFLOW_ERROR fall back to the unmodified
	   string */
	if (folded_length == 0 || U_FAILURE(error_code))
		return AllocatedString<>::Duplicate(src);

	folded.SetSize(folded_length);
	return UCharToUTF8({folded.begin(), folded.size()});

#elif defined(WIN32)
	const auto u = MultiByteToWideChar(CP_UTF8, src);

	/* first call: determine the required buffer size */
	const int size = LCMapStringEx(LOCALE_NAME_INVARIANT,
				       LCMAP_SORTKEY|LINGUISTIC_IGNORECASE,
				       u.c_str(), -1, nullptr, 0,
				       nullptr, nullptr, 0);
	if (size <= 0)
		return AllocatedString<>::Duplicate(src);

	/* second call: perform the actual mapping */
	std::unique_ptr<wchar_t[]> buffer(new wchar_t[size]);
	if (LCMapStringEx(LOCALE_NAME_INVARIANT,
			  LCMAP_SORTKEY|LINGUISTIC_IGNORECASE,
			  u.c_str(), -1, buffer.get(), size,
			  nullptr, nullptr, 0) <= 0)
		return AllocatedString<>::Duplicate(src);

	return WideCharToMultiByte(CP_UTF8, buffer.get());

#else
	/* first attempt: guess that the result is not longer than
	   the input */
	size_t size = strlen(src) + 1;
	std::unique_ptr<char[]> buffer(new char[size]);
	size_t nbytes = strxfrm(buffer.get(), src, size);
	if (nbytes >= size) {
		/* buffer too small - reallocate and try again */
		buffer.reset();
		size = nbytes + 1;
		buffer.reset(new char[size]);
		nbytes = strxfrm(buffer.get(), src, size);
	}

	assert(nbytes < size);
	assert(buffer[nbytes] == 0);

	/* hand ownership of the buffer over to the returned string */
	return AllocatedString<>::Donate(buffer.release());
#endif
} catch (const std::runtime_error &) {
	/* a conversion helper has failed: return the input unmodified */
	return AllocatedString<>::Duplicate(src);
}