/*
 * Copyright (C) 2003-2014 The Music Player Daemon Project
 * http://www.musicpd.org
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License along
 * with this program; if not, write to the Free Software Foundation, Inc.,
 * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
 */

#include "config.h"
#include "Charset.hxx"
#include "Domain.hxx"
#include "Limits.hxx"
#include "system/FatalError.hxx"
#include "Log.hxx"
26
#include "Traits.hxx"
27

28
#ifdef HAVE_GLIB
29
#include <glib.h>
30
#endif
31

32 33
#include <algorithm>

34 35 36 37 38 39 40 41 42 43 44 45 46
#include <assert.h>
#include <string.h>

/**
 * Maximal number of bytes required to represent a path name in UTF-8
 * (including the nul-terminator).
 * This value is a rough estimate of the upper bound.
 * It is based on the path name limit in bytes (MPD_PATH_MAX)
 * and the assumption that some weird encoding could represent some
 * 4-byte UTF-8 sequences with a single byte.
 */
static constexpr size_t MPD_PATH_MAX_UTF8 = (MPD_PATH_MAX - 1) * 4 + 1;

47
#ifdef HAVE_GLIB
48 49 50 51 52 53 54
/**
 * The filesystem character set assigned by SetFSCharset().  While it
 * is empty, GetFSCharset() reports "UTF-8" and the path conversion
 * functions in this file copy their input without charset conversion.
 */
static std::string fs_charset;

/**
 * Check whether GLib is able to convert from UTF-8 to the given
 * character set.
 *
 * @param charset the name of the character set to probe
 * @return true if a test conversion to #charset succeeded
 */
gcc_pure
static bool
IsSupportedCharset(const char *charset)
{
	/* convert a space to check if the charset is valid */
	char *test = g_convert(" ", 1, charset, "UTF-8",
			       nullptr, nullptr, nullptr);
	const bool supported = test != nullptr;

	/* g_free() accepts a null pointer, so one exit path covers
	   both the success and the failure case */
	g_free(test);
	return supported;
}

void
SetFSCharset(const char *charset)
{
66
	assert(charset != nullptr);
67 68 69 70 71 72 73 74 75 76

	if (!IsSupportedCharset(charset))
		FormatFatalError("invalid filesystem charset: %s", charset);

	fs_charset = charset;

	FormatDebug(path_domain,
		    "SetFSCharset: fs charset is: %s", fs_charset.c_str());
}

77 78
#endif

79
/**
 * Obtain the name of the file system character set.
 *
 * @return the charset stored by SetFSCharset(), or "UTF-8" if none
 * has been stored or the build has no GLib support
 */
const char *
GetFSCharset()
{
#ifdef HAVE_GLIB
	if (!fs_charset.empty())
		return fs_charset.c_str();
#endif

	/* nothing configured (or no conversion support at all) */
	return "UTF-8";
}

89 90 91 92 93 94 95 96 97 98 99 100 101
/**
 * On WIN32, rewrite every file system path separator in #s to the
 * UTF-8 path separator.  On all other builds the string is left
 * untouched.
 */
static inline void FixSeparators(std::string &s)
{
#ifdef WIN32
	// Take local copies of the separators: handing the constexpr
	// members to a function expecting references makes GCC emit
	// link errors.
	const auto fs_separator = PathTraitsFS::SEPARATOR;
	const auto utf8_separator = PathTraitsUTF8::SEPARATOR;

	for (auto &ch : s)
		if (ch == fs_separator)
			ch = utf8_separator;
#else
	// nothing to translate here; silence the unused-parameter warning
	(void)s;
#endif
}

102 103 104
/**
 * Convert a path from the file system character set to UTF-8.
 *
 * If no file system charset is configured (or the build has no GLib
 * support), the input is copied without charset conversion.  In all
 * successful cases FixSeparators() is applied to the result.
 *
 * @param path_fs the nul-terminated path in the file system
 * character set; must not be nullptr
 * @return the converted path, or an empty string if the converter
 * could not be opened, the conversion failed, or not all of the
 * input was consumed
 */
std::string
PathToUTF8(const char *path_fs)
{
	assert(path_fs != nullptr);

#ifdef HAVE_GLIB
	if (!fs_charset.empty()) {
		GIConv conv = g_iconv_open("utf-8", fs_charset.c_str());
		if (conv == reinterpret_cast<GIConv>(-1))
			return std::string();

		// g_iconv() does not need nul-terminator,
		// std::string could be created without it too.
		char buffer[MPD_PATH_MAX_UTF8 - 1];
		char *in = const_cast<char *>(path_fs);
		char *out = buffer;
		size_t in_left = strlen(path_fs);
		size_t out_left = sizeof(buffer);

		const size_t ret = g_iconv(conv, &in, &in_left,
					   &out, &out_left);

		// the converter is no longer needed, whatever the outcome
		g_iconv_close(conv);

		if (ret == static_cast<size_t>(-1) || in_left > 0)
			return std::string();

		// only the bytes actually written belong to the result
		std::string converted(buffer, sizeof(buffer) - out_left);
		FixSeparators(converted);
		return converted;
	}
#endif

	// no conversion configured or available: plain copy
	std::string result(path_fs);
	FixSeparators(result);
	return result;
}

141 142
#ifdef HAVE_GLIB

143 144 145
char *
PathFromUTF8(const char *path_utf8)
{
146 147
	assert(path_utf8 != nullptr);

148 149 150
	if (fs_charset.empty())
		return g_strdup(path_utf8);

151 152 153 154
	return g_convert(path_utf8, -1,
			 fs_charset.c_str(), "utf-8",
			 nullptr, nullptr, nullptr);
}
155 156

#endif