2014-02-23 19:27:08 +01:00
|
|
|
/*
|
2016-02-26 17:54:05 +01:00
|
|
|
* Copyright 2003-2016 The Music Player Daemon Project
|
2014-02-23 19:27:08 +01:00
|
|
|
* http://www.musicpd.org
|
|
|
|
*
|
|
|
|
* This program is free software; you can redistribute it and/or modify
|
|
|
|
* it under the terms of the GNU General Public License as published by
|
|
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
|
|
* (at your option) any later version.
|
|
|
|
*
|
|
|
|
* This program is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
* GNU General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU General Public License along
|
|
|
|
* with this program; if not, write to the Free Software Foundation, Inc.,
|
|
|
|
* 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include "config.h"
|
|
|
|
#include "Collate.hxx"
|
2015-06-25 22:43:55 +02:00
|
|
|
#include "util/AllocatedString.hxx"
|
2014-02-23 19:27:08 +01:00
|
|
|
|
|
|
|
#ifdef HAVE_ICU
|
2014-11-30 10:53:05 +01:00
|
|
|
#include "Util.hxx"
|
2014-02-23 19:27:08 +01:00
|
|
|
#include "Error.hxx"
|
2016-04-12 21:32:02 +02:00
|
|
|
#include "util/AllocatedArray.hxx"
|
2014-05-12 14:35:25 +02:00
|
|
|
#include "util/ConstBuffer.hxx"
|
2014-02-23 19:27:08 +01:00
|
|
|
#include "util/Error.hxx"
|
|
|
|
|
|
|
|
#include <unicode/ucol.h>
|
|
|
|
#include <unicode/ustring.h>
|
|
|
|
#else
|
|
|
|
#include <algorithm>
|
|
|
|
#include <ctype.h>
|
|
|
|
#endif
|
|
|
|
|
2015-06-23 11:37:25 +02:00
|
|
|
#ifdef WIN32
|
|
|
|
#include "Win32.hxx"
|
|
|
|
#include "util/AllocatedString.hxx"
|
|
|
|
#include <windows.h>
|
|
|
|
#endif
|
|
|
|
|
2016-04-12 21:53:55 +02:00
|
|
|
#include <memory>
|
2016-04-13 11:51:01 +02:00
|
|
|
#include <stdexcept>
|
2016-04-12 21:53:55 +02:00
|
|
|
|
2014-02-23 19:27:08 +01:00
|
|
|
#include <assert.h>
|
|
|
|
#include <string.h>
|
|
|
|
|
|
|
|
#ifdef HAVE_ICU
|
|
|
|
/**
 * The process-wide ICU collator used by this file.  It is nullptr
 * until IcuCollateInit() has opened it with ucol_open();
 * IcuCollateFinish() passes it to ucol_close().
 */
static UCollator *collator;
|
|
|
|
#endif
|
|
|
|
|
2014-06-10 22:38:00 +02:00
|
|
|
#ifdef HAVE_ICU
|
|
|
|
|
2014-02-23 19:27:08 +01:00
|
|
|
bool
|
|
|
|
IcuCollateInit(Error &error)
|
|
|
|
{
|
|
|
|
assert(collator == nullptr);
|
|
|
|
assert(!error.IsDefined());
|
|
|
|
|
2014-02-24 21:04:23 +01:00
|
|
|
UErrorCode code = U_ZERO_ERROR;
|
2014-02-23 19:27:08 +01:00
|
|
|
collator = ucol_open("", &code);
|
|
|
|
if (collator == nullptr) {
|
|
|
|
error.Format(icu_domain, int(code),
|
|
|
|
"ucol_open() failed: %s", u_errorName(code));
|
|
|
|
return false;
|
|
|
|
}
|
|
|
|
|
|
|
|
return true;
|
|
|
|
}
|
|
|
|
|
|
|
|
void
|
|
|
|
IcuCollateFinish()
|
|
|
|
{
|
|
|
|
assert(collator != nullptr);
|
|
|
|
|
|
|
|
ucol_close(collator);
|
|
|
|
}
|
|
|
|
|
|
|
|
#endif
|
|
|
|
|
|
|
|
/**
 * Compare two strings for sorting.
 *
 * Depending on the build configuration, the comparison is done by
 * the ICU collator, by the Windows CompareStringEx() function
 * (ignoring case) or by strcoll().
 *
 * @param a the first string; must not be nullptr
 * @param b the second string; must not be nullptr
 * @return a strcmp()-style result: negative, zero or positive
 */
gcc_pure
int
IcuCollate(const char *a, const char *b)
{
#if !CLANG_CHECK_VERSION(3,6)
	/* disabled on clang due to -Wtautological-pointer-compare */
	assert(a != nullptr);
	assert(b != nullptr);
#endif

#ifdef HAVE_ICU
	assert(collator != nullptr);

#if U_ICU_VERSION_MAJOR_NUM >= 50
	/* this ICU version can compare UTF-8 strings directly; the
	   status code is not evaluated */
	UErrorCode status = U_ZERO_ERROR;
	const auto order = ucol_strcollUTF8(collator, a, -1, b, -1,
					    &status);
	return static_cast<int>(order);
#else
	/* fall back to ucol_strcoll() */

	const auto a_utf16 = UCharFromUTF8(a);
	const auto b_utf16 = UCharFromUTF8(b);

	if (a_utf16.IsNull() || b_utf16.IsNull())
		/* at least one conversion failed: compare the raw
		   strings instead */
		return strcasecmp(a, b);

	return static_cast<int>(ucol_strcoll(collator,
					     a_utf16.begin(), a_utf16.size(),
					     b_utf16.begin(), b_utf16.size()));
#endif

#elif defined(WIN32)
	AllocatedString<wchar_t> wide_a = nullptr, wide_b = nullptr;
	bool a_converted = true, b_converted = true;

	try {
		wide_a = MultiByteToWideChar(CP_UTF8, a);
	} catch (const std::runtime_error &) {
		a_converted = false;
	}

	try {
		wide_b = MultiByteToWideChar(CP_UTF8, b);
	} catch (const std::runtime_error &) {
		b_converted = false;
	}

	/* a string which cannot be converted sorts before one which
	   can; two unconvertible strings are considered equal */
	if (!a_converted)
		return b_converted ? -1 : 0;

	if (!b_converted)
		return 1;

	const auto comparison = CompareStringEx(LOCALE_NAME_INVARIANT,
						LINGUISTIC_IGNORECASE,
						wide_a.c_str(), -1,
						wide_b.c_str(), -1,
						nullptr, nullptr, 0);

	/* "To maintain the C runtime convention of comparing
	   strings, the value 2 can be subtracted from a
	   nonzero return value." */
	return comparison != 0
		? comparison - 2
		: comparison;
#else
	return strcoll(a, b);
#endif
}
|
|
|
|
|
2015-06-25 22:43:55 +02:00
|
|
|
/**
 * Transform a string so that the result can be used for
 * case-insensitive comparison.
 *
 * Depending on the build configuration, this uses ICU's
 * u_strFoldCase(), the Windows LCMapStringEx() function or
 * strxfrm().
 *
 * This function never reports an error: if a conversion or the
 * transformation fails (including any std::runtime_error thrown
 * inside the body), a plain copy of the input is returned instead.
 *
 * @param src the string to be transformed; must not be nullptr
 * @return the transformed string, or a copy of "src" on failure
 */
AllocatedString<>
IcuCaseFold(const char *src)
try {
#ifdef HAVE_ICU
	assert(collator != nullptr);
#if !CLANG_CHECK_VERSION(3,6)
	/* disabled on clang due to -Wtautological-pointer-compare */
	assert(src != nullptr);
#endif

	const auto u = UCharFromUTF8(src);
	if (u.IsNull())
		return AllocatedString<>::Duplicate(src);

	/* start with a guess; if that turns out to be too small, ICU
	   reports the required length and we retry exactly once */
	size_t capacity = u.size() * 2u;

	for (unsigned attempt = 0; attempt < 2; ++attempt) {
		AllocatedArray<UChar> folded(capacity);

		UErrorCode error_code = U_ZERO_ERROR;
		const int32_t folded_length =
			u_strFoldCase(folded.begin(), folded.size(),
				      u.begin(), u.size(),
				      U_FOLD_CASE_DEFAULT,
				      &error_code);

		if (error_code == U_BUFFER_OVERFLOW_ERROR &&
		    folded_length > 0) {
			/* buffer too small (case folding may expand
			   the string by more than factor 2) -
			   reallocate and try again */
			capacity = static_cast<size_t>(folded_length);
			continue;
		}

		/* use U_FAILURE() so that mere warnings such as
		   U_STRING_NOT_TERMINATED_WARNING (result fills the
		   buffer exactly) are not mistaken for errors; no
		   terminator is needed because the length is passed
		   explicitly below */
		if (folded_length <= 0 || U_FAILURE(error_code))
			return AllocatedString<>::Duplicate(src);

		folded.SetSize(folded_length);
		return UCharToUTF8({folded.begin(), folded.size()});
	}

	/* the retry overflowed as well; give up */
	return AllocatedString<>::Duplicate(src);

#elif defined(WIN32)
	const auto u = MultiByteToWideChar(CP_UTF8, src);

	/* first call: determine the required buffer size */
	const int size = LCMapStringEx(LOCALE_NAME_INVARIANT,
				       LCMAP_SORTKEY|LINGUISTIC_IGNORECASE,
				       u.c_str(), -1, nullptr, 0,
				       nullptr, nullptr, 0);
	if (size <= 0)
		return AllocatedString<>::Duplicate(src);

	/* second call: do the actual mapping */
	/* NOTE(review): with LCMAP_SORTKEY, LCMapStringEx() is
	   documented to produce an opaque byte array rather than a
	   wide string - confirm that feeding it to
	   WideCharToMultiByte() is intended */
	std::unique_ptr<wchar_t[]> buffer(new wchar_t[size]);
	if (LCMapStringEx(LOCALE_NAME_INVARIANT,
			  LCMAP_SORTKEY|LINGUISTIC_IGNORECASE,
			  u.c_str(), -1, buffer.get(), size,
			  nullptr, nullptr, 0) <= 0)
		return AllocatedString<>::Duplicate(src);

	return WideCharToMultiByte(CP_UTF8, buffer.get());

#else
	/* first guess: the result is not longer than the input */
	size_t size = strlen(src) + 1;
	std::unique_ptr<char[]> buffer(new char[size]);
	size_t nbytes = strxfrm(buffer.get(), src, size);
	if (nbytes >= size) {
		/* buffer too small - reallocate and try again */
		buffer.reset();
		size = nbytes + 1;
		buffer.reset(new char[size]);
		nbytes = strxfrm(buffer.get(), src, size);
	}

	assert(nbytes < size);
	assert(buffer[nbytes] == 0);

	/* hand ownership of the buffer over to the returned string */
	return AllocatedString<>::Donate(buffer.release());
#endif
} catch (const std::runtime_error &) {
	return AllocatedString<>::Duplicate(src);
}
|