Converter.cxx 3.88 KB
Newer Older
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21
/*
 * Copyright (C) 2003-2014 The Music Player Daemon Project
 * http://www.musicpd.org
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
 */

#include "config.h"
#include "Converter.hxx"
#include "Error.hxx"
#include "util/Error.hxx"
#include "util/Macros.hxx"
#include "util/WritableBuffer.hxx"
#include "util/ConstBuffer.hxx"

#include <errno.h>
#include <string.h>

30 31 32 33 34
#ifdef HAVE_ICU
#include "Util.hxx"
#include <unicode/ucnv.h>
#elif defined(HAVE_GLIB)
#include "util/Domain.hxx"
35 36 37
/** error domain passed to Error::Format() when g_iconv_open() fails */
static constexpr Domain g_iconv_domain("g_iconv");
#endif

38 39 40 41 42 43 44 45 46
#ifdef HAVE_ICU

/**
 * Release the ICU converter handle by passing it to ucnv_close().
 */
IcuConverter::~IcuConverter()
{
	ucnv_close(converter);
}

#endif

47 48 49 50 51
#ifdef HAVE_ICU_CONVERTER

/**
 * Construct a converter for the given character set.
 *
 * With ICU, one UConverter is opened for the charset.  With the
 * GLib fallback, two iconv descriptors are opened, one for each
 * direction (charset -> "utf-8" and "utf-8" -> charset).
 *
 * @param charset name of the character set to convert from/to
 * @param error receives a description if the charset could not be
 * opened
 * @return a new IcuConverter allocated with "new", or nullptr on
 * failure (in which case #error has been set)
 */
IcuConverter *
IcuConverter::Create(const char *charset, Error &error)
{
#ifdef HAVE_ICU
	UErrorCode status = U_ZERO_ERROR;
	UConverter *const handle = ucnv_open(charset, &status);
	if (handle != nullptr)
		return new IcuConverter(handle);

	error.Format(icu_domain, int(status),
		     "Failed to initialize charset '%s': %s",
		     charset, u_errorName(status));
	return nullptr;
#elif defined(HAVE_GLIB)
	const GIConv invalid = (GIConv)-1;

	GIConv to_cd = g_iconv_open("utf-8", charset);
	GIConv from_cd = g_iconv_open(charset, "utf-8");
	if (to_cd != invalid && from_cd != invalid)
		return new IcuConverter(to_cd, from_cd);

	/* at least one direction failed; close whichever descriptor
	   was opened successfully before reporting the error */
	if (to_cd != invalid)
		g_iconv_close(to_cd);
	if (from_cd != invalid)
		g_iconv_close(from_cd);

	error.Format(g_iconv_domain,
		     "Failed to initialize charset '%s'", charset);
	return nullptr;
#endif
}

80 81 82
#ifdef HAVE_ICU
#elif defined(HAVE_GLIB)

83 84 85
/**
 * Run a null-terminated string through a GLib iconv descriptor.
 *
 * The output is collected chunk by chunk, so the converted text is
 * not limited to the size of the intermediate stack buffer.
 *
 * @param conv an open conversion descriptor
 * @param src the null-terminated input string
 * @return the converted string; an empty string if the conversion
 * failed or did not consume all of the input
 */
static std::string
DoConvert(GIConv conv, const char *src)
{
	/* g_iconv() wants a non-const pointer, but does not modify
	   the input */
	char *in = const_cast<char *>(src);
	size_t in_left = strlen(src);

	/* return the descriptor to its initial state, so leftovers
	   from a previous (possibly failed) conversion cannot leak
	   into this one */
	g_iconv(conv, nullptr, nullptr, nullptr, nullptr);

	std::string result;
	char buffer[4096];

	while (true) {
		char *out = buffer;
		size_t out_left = sizeof(buffer);

		const size_t n = g_iconv(conv, &in, &in_left,
					 &out, &out_left);
		const bool failed = n == static_cast<size_t>(-1);
		/* save errno before anything else can clobber it */
		const int e = failed ? errno : 0;

		const size_t produced = sizeof(buffer) - out_left;
		result.append(buffer, produced);

		if (!failed)
			break;

		/* E2BIG only means the chunk buffer is full: keep
		   going, as long as progress is being made; every
		   other error is fatal */
		if (e != E2BIG || produced == 0)
			return std::string();
	}

	if (in_left > 0)
		return std::string();

	return result;
}

101 102
#endif

103 104 105
/**
 * Convert a string from this converter's character set to UTF-8.
 *
 * @param s the null-terminated input string
 * @return the converted string; an empty string if the conversion
 * failed
 */
std::string
IcuConverter::ToUTF8(const char *s) const
{
#ifdef HAVE_ICU
	const ScopeLock protect(mutex);

	ucnv_resetToUnicode(converter);

	// TODO: dynamic buffer?
	UChar unicode[4096];
	UChar *dest = unicode;
	UChar *const dest_limit = unicode + ARRAY_SIZE(unicode);

	const char *src = s;
	const char *const src_limit = src + strlen(src);

	UErrorCode status = U_ZERO_ERROR;
	ucnv_toUnicode(converter, &dest, dest_limit,
		       &src, src_limit,
		       nullptr, true, &status);
	if (status != U_ZERO_ERROR)
		return std::string();

	/* number of UChar units written by ucnv_toUnicode() */
	const size_t n_units = dest - unicode;

	const auto utf8 = UCharToUTF8({unicode, n_units});
	if (utf8.IsNull())
		return std::string();

	/* copy into the return value, then free the array returned
	   by UCharToUTF8() */
	std::string result(utf8.data, utf8.size);
	delete[] utf8.data;
	return result;
#elif defined(HAVE_GLIB)
	return DoConvert(to_utf8, s);
#endif
}

/**
 * Convert a UTF-8 string to this converter's character set.
 *
 * @param s the null-terminated UTF-8 input string
 * @return the converted string; an empty string if the conversion
 * failed
 */
std::string
IcuConverter::FromUTF8(const char *s) const
{
#ifdef HAVE_ICU
	const ScopeLock protect(mutex);

	const auto unicode = UCharFromUTF8(s);
	if (unicode.IsNull())
		return std::string();

	ucnv_resetFromUnicode(converter);

	// TODO: dynamic buffer?
	char encoded[4096];
	char *dest = encoded;
	const char *const dest_limit = encoded + ARRAY_SIZE(encoded);

	const UChar *src = unicode.data;

	UErrorCode status = U_ZERO_ERROR;
	ucnv_fromUnicode(converter, &dest, dest_limit,
			 &src, unicode.end(),
			 nullptr, true, &status);

	/* the intermediate UChar array is no longer needed, whether
	   or not the conversion succeeded */
	delete[] unicode.data;

	if (status != U_ZERO_ERROR)
		return std::string();

	return std::string(encoded, dest);
#elif defined(HAVE_GLIB)
	return DoConvert(from_utf8, s);
#endif
}

#endif