File: iconv.cpp

package info (click to toggle)
residualvm 0.3.1%2Bdfsg-2
  • links: PTS, VCS
  • area: contrib
  • in suites: bullseye
  • size: 31,292 kB
  • sloc: cpp: 227,029; sh: 7,256; xml: 1,731; perl: 1,067; java: 861; asm: 738; python: 691; ansic: 272; makefile: 139; objc: 81; sed: 22; php: 1
file content (106 lines) | stat: -rw-r--r-- 3,574 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
/* ScummVM - Graphic Adventure Engine
 *
 * ScummVM is the legal property of its developers, whose names
 * are too numerous to list here. Please refer to the COPYRIGHT
 * file distributed with this source distribution.
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version 2
 * of the License, or (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301, USA.
 *
 */

#include <iconv.h>

#include "common/iconv.h"
#include "common/str.h"
#include "common/textconsole.h"
#include "common/ustr.h"

namespace Common {

static const char **getIconvCodesForEncoding(Encoding encoding) {
	static const char *encodingCP932Codes[]  = { "cp932",  nullptr };
	static const char *encodingCP1250Codes[] = { "cp1250", nullptr };
	static const char *encodingCP1251Codes[] = { "cp1251", nullptr };
	static const char *encodingCP1252Codes[] = { "cp1252", nullptr };
	static const char *encodingCP1255Codes[] = { "cp1255", nullptr };

	// libiconv and glibc-iconv don't use the same name for that encoding, we have to try both
	static const char *encodingMacCentralEuropeCodes[] = { "maccentraleurope", "mac-centraleurope", nullptr };

	switch (encoding) {
		case kEncodingCP932:  return encodingCP932Codes;
		case kEncodingCP1250: return encodingCP1250Codes;
		case kEncodingCP1251: return encodingCP1251Codes;
		case kEncodingCP1252: return encodingCP1252Codes;
		case kEncodingCP1255: return encodingCP1255Codes;
		case kEncodingMacCentralEurope: return encodingMacCentralEuropeCodes;
	}

	error("Failed look up iconv codes for encoding '%d'", encoding);
}

U32String convertToU32String(Encoding fromEncoding, const String &string) {
	const char **fromCodes = getIconvCodesForEncoding(fromEncoding);

	// Apparently UTF-32 isn't native endian. Also, UCS−4−INTERNAL fails
	// for me.
	static const char *toCode =
#ifdef SCUMM_BIG_ENDIAN
		"UTF-32BE";
#else
		"UTF-32LE";
#endif

	iconv_t handle;
	do {
		handle = iconv_open(toCode, *fromCodes);

		if (handle == (iconv_t)-1) {
			fromCodes++;
		}
	} while (handle == ((iconv_t)-1) && *fromCodes);

	if (handle == ((iconv_t)-1))
		error("Failed to initialize UTF-32 conversion from %d", fromEncoding);

	size_t inSize = string.size();
	size_t outSize = inSize * 4; // Approximation
	size_t originalOutSize = outSize;

	char *buffer = new char[outSize];
	char *dst = buffer;

#ifdef ICONV_USES_CONST
	const char *src = string.c_str();
#else
	char *src = const_cast<char *>(string.c_str());
#endif

	if (iconv(handle, &src, &inSize, &dst, &outSize) == ((size_t)-1))
		error("Failed to convert %s to UTF-32 string", *fromCodes);

	// The conversion descriptor may still contain some state. Write it to the output buffer.
	if (iconv(handle, nullptr, nullptr, &dst, &outSize) == ((size_t)-1))
		error("Failed to convert the remaining state of %s to UTF-32 string", *fromCodes);

	U32String output((const U32String::value_type *)buffer, (originalOutSize - outSize) / 4);

	delete[] buffer;
	iconv_close(handle);

	return output;
}

} // End of namespace Common