File: charsets.config

package info (click to toggle)
kdelibs 4%3A2.2.2-13.woody.14
links: PTS
area: main
in suites: woody
size: 36,832 kB
ctags: 40,077
sloc: cpp: 313,284; ansic: 20,558; xml: 11,448; sh: 11,318; makefile: 2,426; perl: 2,084; yacc: 1,663; java: 1,538; lex: 629; python: 300
file content (222 lines) | stat: -rw-r--r-- 4,880 bytes
# KDE Config file
#
# This file defines where to find conversion maps for specific encodings.
# The directory below gives the dir where the posix charmaps are located.
#
[general]
i18ndir=/usr/share/i18n/charmaps

# defines some different names for codecs that are built into Qt.
[builtin]
iso-ir-111=koi8-r
koi8-ru=koi8-u
koi8r=koi8-r
koi8u=koi8-u
koi unified=koi8-r
us-ascii=iso 8859-1
usascii=iso 8859-1
x-utf-8=utf8
x-utf-7=utf7
ucs2=utf16
iso10646-1=ISO-10646-UCS-2
gbk-0=gbk
gb2312=gbk
gb2312.1980-0=gbk
euc-kr=euckr
x-euc-kr=euckr
euc-jp=eucjp
x-euc-jp=eucjp
jisx0201.1976-0=eucjp
jisx0208.1983-0=eucjp
jisx0208.1990-0=eucjp
jisx0208.1997-0=eucjp
jisx0212.1990-0=eucjp
jisx0213.2000-1=eucjp
jisx0213.2000-2=eucjp
shift_jis=sjis
shift-jis=sjis
x-sjis=sjis
iso-2022-jp=jis7
windows1250=cp 1250
windows1251=cp 1251
windows1252=cp 1252
windows1253=cp 1253
windows1254=cp 1254
windows1255=cp 1255
windows1256=cp 1256
windows1257=cp 1257
windows-1250=cp 1250
windows-1251=cp 1251
windows-1252=cp 1252
windows-1253=cp 1253
windows-1254=cp 1254
windows-1255=cp 1255
windows-1256=cp 1256
windows-1257=cp 1257
x-windows-1250=cp 1250
x-windows-1251=cp 1251
x-windows-1252=cp 1252
x-windows-1253=cp 1253
x-windows-1254=cp 1254
x-windows-1255=cp 1255
x-windows-1256=cp 1256
x-windows-1257=cp 1257
cp-1250=cp 1250
cp-1251=cp 1251
cp-1252=cp 1252
cp-1253=cp 1253
cp-1254=cp 1254
cp-1255=cp 1255
cp-1256=cp 1256
cp-1257=cp 1257
x-cp-1250=cp 1250
x-cp-1251=cp 1251
x-cp-1252=cp 1252
x-cp-1253=cp 1253
x-cp-1254=cp 1254
x-cp-1255=cp 1255
x-cp-1256=cp 1256
x-cp-1257=cp 1257
tis620=iso 8859-11
tis-620=iso 8859-11
windows-874=iso 8859-11
windows874=iso 8859-11
x-windows-874=iso 8859-11
cp874=iso 8859-11
cp-874=iso 8859-11
x-cp-874=iso 8859-11
ksc5601.1987-0=euckr
ks_c_5601-1987=euckr
iso-8859-1=iso 8859-1
iso-8859-2=iso 8859-2
iso-8859-3=iso 8859-3
iso-8859-4=iso 8859-4
iso-8859-5=iso 8859-5
iso-8859-6=iso 8859-6
iso-8859-7=iso 8859-7
iso-8859-8=iso 8859-8
iso-8859-9=iso 8859-9
iso-8859-10=iso 8859-10
iso-8859-11=iso 8859-11
iso-8859-12=iso 8859-12
iso-8859-13=iso 8859-13
iso-8859-14=iso 8859-14
iso-8859-15=iso 8859-15
tscii=tscii
paratype-154=pt 154
pt-154=pt 154

# some different names for the encodings defined in the charmaps files.
# even though the charmap file names are all uppercase, the names are all lowercase here.
[aliases]
cp852=ibm852

# some last resort hints in case the charmap file couldn't be found. This gives at least a partial conversion
# and helps making things readable.
#the name used as input here is already converted to the more canonical name as defined in the [aliases] group.
[conversionHints]
cp1250=iso-8859-2
koi8-r=iso-8859-5
koi8-u=koi8-r

# this list gives the charsets that can be used to display a file given in a certain encoding.
# the list should be in order of preference
# left side is the name returned by the codec used, right side the name of the charset as
# used in kcharsets.cpp
# 'unicode' will always be chosen as last resort, so it only needs to be added to the list,
# if it should get a higher priority
[charsetsForEncoding]
koi8-r=koi8-r,cp 1251,koi8-u,iso-8859-5
koi8-u=koi8-u,cp 1251,iso-8859-5,koi8-r
iso 8859-1=iso8859-1,iso8859-15
iso 8859-2=iso8859-2,unicode,iso8859-1
iso 8859-3=iso8859-3,unicode,iso8859-1
iso 8859-4=iso8859-4,unicode,iso8859-1
iso 8859-5=iso8859-5,koi8-u,koi8-r
iso 8859-6=unicode,iso8859-6
iso 8859-7=iso8859-7
iso 8859-8=iso8859-8,unicode
iso 8859-8-i=iso8859-8
iso 8859-9=iso8859-9,unicode,iso8859-1
iso 8859-11=iso8859-11
iso 8859-13=iso8859-13,unicode,iso8859-1
iso 8859-15=iso8859-15,unicode,iso8859-1
utf8=unicode,iso8859-1
utf16=unicode,iso8859-1
ISO-10646-UCS-2=unicode,iso8859-1
cp 1250=iso8859-2
cp 1251=cp 1251,koi8-u,koi8-r,iso8859-5
cp 1252=iso8859-1
cp 1253=iso8859-7
cp 1254=iso8859-9
cp 1255=iso8859-8
cp 1256=unicode,iso8859-6
cp 1257=iso8859-13
ibm852=unicode,iso-8859-2
tis620=iso8859-11,unicode
eucjp=eucjp,unicode,iso8859-1
sjis=eucjp,unicode,iso8859-1
jis7=eucjp,unicode,iso8859-1
big5=big5,unicode,iso8859-1
gbk=gb2312.1980-0,gbk-0,unicode,iso8859-1
gb2312=gb2312.1980-0,unicode,iso8859-1
euckr=euckr,unicode,iso8859-1
tscii=tscii
pt 154=pt 154,cp 1251,koi8-u,koi8-r,iso8859-5


[LanguageForEncoding]
# keep this in sync with the stuff in kcharsets.cpp
# 0 other
# 1 Arabic
# 2 Baltic
# 3 Central European
# 4 Chinese Simplified
# 5 Chinese Traditional
# 6 Cyrillic
# 7 Greek
# 8 Hebrew
# 9 Japanese
# 10 Korean
# 11 Thai
# 12 Turkish
# 13 Western European
# 14 Tamil
# 15 Unicode
iso 8859-1=13
iso 8859-15=13
cp 1252=13
iso 8859-2=3
iso 8859-3=3
iso 8859-4=2
iso 8859-13=2
cp 1250=3
cp 1254=12
cp 1257=2
ibm852=3
koi8-r=6
iso 8859-5=6
cp 1251=6
koi8-u=6
pt 154=6
big5=5
gbk=4
gb2312=4
euckr=10
sjis=9
jis7=9
eucjp=9
iso 8859-7=7
cp 1253=7
iso 8859-6=1
cp 1256=1
iso 8859-8=8
iso 8859-8-i=8
cp 1255=8
iso 8859-9=12
tis620=11
iso 8859-11=11
utf8=15
utf16=15
utf7=15
ucs2=15