.\" Copyright (c) 1996 Eric S. Raymond <esr@thyrsus.com>
.\" and Andries Brouwer <aeb@cwi.nl>
.\"
.\" This is free documentation; you can redistribute it and/or
.\" modify it under the terms of the GNU General Public License as
.\" published by the Free Software Foundation; either version 2 of
.\" the License, or (at your option) any later version.
.\"
.\" This is combined from many sources, including notes by aeb and
.\" research by esr. Portions derive from a writeup by Roman Czyborra.
.\"
.\" Last changed by David Starner <dstarner98@aasaa.ofe.org>.
.\"
.\" Japanese Version Copyright (c) 1996,1997,1998
.\" ISHIKAWA Mutsumi, all rights reserved.
.\" Translated Mon Jul 21 03:46:21 JST 1997
.\" by ISHIKAWA Mutsumi <ishikawa@linux.or.jp>
.\" Updated Fri Dec 3 JST 1999 by Kentaro Shirakata <argrath@ub32.org>
.\" Updated Fri Jan 4 JST 2002 by Kentaro Shirakata <argrath@ub32.org>
.\"
.\" WORD: ligature
.\"
.TH CHARSETS 7 2008-06-03 "Linux" "Linux Programmer's Manual"
.SH 名前
charsets \- プログラマの視点から見た文字セットと国際化
.SH 説明
Linux は国際化されたオペレーティングシステムである。
Linux ͡ʥ桼ƥƥ䡢 console ɥ饤Фʤɤ
ǥХɥ饤Фϡƥե٥åȤʤɤ
ޥʸå (multilingual character sets) ݡȤƤ롣
ˤϥƥե٥åʸꥷʸ
ʸӥʸإ֥饤ʸʤɤޤޤ졢
ȯ (diacritical marks)ȡ (ligatures) ʤɤ
ȤȤǤ롣
.LP
Υޥ˥奢ڡǤϡץޤλߤۤʤʸ絬
(character-set standards) ȡ Linux ˤɤŬ礵뤫Ȥ
ȤˤĤƽҤ٤롣ǤϡASCII, ISO 8859, KOI8-R, Unicode, ISO 2022,
ISO 4873 γƵʤˤĤƵ롣
Ǥϼºݤ˥ʸåȤȤƻȤƤʸåȤܤ
¾ΥƥǻȤƤ̵ΤΤϽŻ뤷ʤ
.LP
glibc 2.2.3 ǸбƤѤƤʸåȤ
ʥꥹȤϰʲ̤:
ISO-8859-{1,2,3,5,6,7,8,9,13,15}, CP1251, UTF-8, EUC-{KR,JP,TW},
KOI8-{R,U}, GB2312, GB18030, GBK, BIG5, BIG5-HKSCS, TIS-620 (Ʊ)
(롼ޥ˥ ISO-8859-16 ڤؤäƤ뤫⤷ʤ)
.SS ASCII
ASCII (American Standard Code For Information Interchange)
7ӥåʸθȤʤäΤǤꡢ
ȤȤƸ(American English) Τ˥ǥ줿
ߤϡECMA-6 ɸƤ롣
.LP
ɥĸ졢ե졢ڥʤɤ 7 ӥåȤб뤿ᡢ
ASCII Υɥ뵭¾̲ߵ֤
ѸʸΤΤ֤͡Ѽ郎¸ߤ롣
ƻȤ٤ǤϤʤ
glibc ASCII δʥѡåȤǤʤʸåȤΥ
бƤʤ
(ʸåȤ ISO-646 ȤΤ롣
ASCII ȶᤤطˤꡢʸ֤뤳ȤǧƤ)
.LP
Linux ƹ߷פ줿ϡɥΤ˽줿Τǡ
Ϥᤫ ASCII ݡȤƤ롣
.SS ISO 8859
ISO 8859 15 ȤΰϢ 8 ӥåʸǤ롣
(7 ӥå) US ASCII ޤߡ 128 159 ˤʸ֤졢
160 255 ˤ 96 Ĥθʸ֤Ƥ롣
.LP
ΤǡäȤפʤΤ ISO 8859-1 (Latin-1) Ǥ롣
Linux ɥ饤Фˤƥͥƥ֤˥ݡȤƤꡢ
.\"nakano ǤʤȻפޤ
X11R6 ˤƤƱͤ˥ݡȤƤ롣ˡ
HTML δʸǤ롣
.LP
ˤ롢¾ 8859 ʸΥݡȤ
.RB ( setfont (8))
Τ褦ʥ桼⡼ɡ桼ƥƥѤDzǽˤʤ롣
Τ褦ʥ桼ƥƥѤ뤳Ȥˤꡢɥ饤Фˤ
륭ܡɤ EGA եåơ֥γƤѹ"桼
(user mapping)"եȥơ֥Ѥ뤳ȤǤ롣
.LP
ʲϡ줾νδñǤ롣
.TP
8859-1 (Latin-1)
Latin-1 Х˥(Albanian)˥(Catalan)ǥޡ
(Danish)(Dutch)Ѹ(English)ե(Faroese)
եɸ(Finnish)ե(French)ɥĸ(German)
ꥷ(Galician)ɸ(Irish)ɸ(Icelandic)
ꥢ(Italian)Υ륦(Norwegian)ݥȥ(Portuguese)
ڥ(Spanish)ǥ(Swedish)ȤäۤȤɤ
衼åѸС롣
ɥĸ ij ե oe ιӸŤ
,,ɥĸ`` ϤʤϰϤȹͤƤ롣
.TP
8859-2 (Latin-2)
Latin-2 ϥ(Slavic)(Croatian)
(Czech)ɥĸ(German)ϥ(Hungarian)ݡɸ
(Polish)롼ޥ˥(Rumanian)(Slovak)
٥˥(Slovene)ȤäʸȤƥƥʸ
Ѥ롢ַϸ衼åѤθΤۤȤɤݡȤ롣
.TP
8859-3 (Latin-3)
Latin-3 ϥڥ(Esperanto)ꥷ(Galician)ޥ륿
(Maltese)ʤɤνδ֤ɤѤ롣
(ȥ륳(Turkish)Ϥ 8859-9 ǽ褦ˤʤäƤ)
.TP
8859-4 (Latin-4)
Latin-4 ϥȥ˥(Estonian)ȥӥ(Latvian)ȥ˥
(Lithuanian)ʸ롣Latin-4 ϡ
本質的には廃止されている(obsolete である)。
8859-10 (Latin-6) 8859-13 (Latin-7) ȤΤȡ
.TP
8859-5
.br
֥륬ꥢ(Bulgarian)٥롼(Byelorussian)ޥɥ˥
(Macedonian)(Russian)ӥ(Serbian)饤ʸ
(Ukrainian) ݡȤ륭ʸǤ롣 饤ʸǤ
downstroke Ĥ "ghe" Ȥʸ "heh" ɤߡ
ghe ˤ ghe upstroke ĤʤФʤʤ
ˤĤƤϡ
KOI8-R ˴ؤȤΤȡ
.TP
8859-6
.br
ӥ(Arabic)ݡȤ롣8859-6 Υեơ֥(glyph table)
ʸη֤ʬ䤷եȤǤ롣
ΤᡢŬڤʥǥץ쥤
initial, medial, final ե˷礷ʤФʤʤ
.TP
8859-7
奮ꥷ(Modern Greek)ݡȤ롣
.TP
8859-8
niqud() Τʤإ֥饤(Hebrew)ݡȤ롣
niqud ȴإ֥饤(Biblical Hebrew)ϤʸåȤ
оݳǤ롣
Linux ǤϡΤˤ UTF-8 ޤǥǤ롣
.TP
8859-9 (Latin-5)
ϡLatin-1 Ѽǡɸʸȥ륳(Turkish)ʸ
֤ΤǤ롣
.TP
8859-10 (Latin-6)
Latin-6 ̲(Nordic)ϰС뤿 Latin-4 ˤϴޤޤƤʤ
̥åȸ(Inuit)(ɸ(Greenlandic))
(Sami)(å(Lappish)) äƤ롣
RFC 1345 ˤϡʳΡۤʤä "latin6" ܤƤ롣
ȡ(Skolt Sami)Ǥϡ
ˤĤΥȵ椬ɬפȤ롣
.TP
8859-11
ϵ䤵줿ɸΤ¸ߤ롣
ɸ Linux ǥΤѤ TIS-620 ƱΤǤ롣
.TP
8859-12
ʸåȤ¸ߤʤ
٥ȥʥ줬ξȤ褦Ƥ
ISO 8859 Ƥ(Ǥʤ) 96 ʸ˼ޤʤä
Linux Ǥϥ٥ȥʥ UTF-8 ޤʸåȤǤ롣
.TP
8859-13 (Latin-7)
ХȳθݡȤ롣
äˡLatin-4 ¸ߤʤȥӥʸޤࡣ
.TP
8859-14 (Latin-8)
ϥȸʸåȤǤꡢ(Gaelic)ȥ륺(Welsh)
б롣
ʸåȤϸ奢ɸѤդʸޤࡣ
.TP
8859-15 (Latin-9)
ϥ桼 Latin-1 äƤʤեȥեɸʸ
ɲäƤ롣
.TP
8859-16 (Latin-10)
ʸåȤ 8859-2 б¿θб
˥롼ޥ˥ˤϤ괰б롣
.SS KOI8-R
KOI8-R ϥˤɤѤ롢ISO ǤʤʸǤ롣
Ⱦʬ US ASCII Ǥ롣Ⱦʬ ISO 8859-5 ʬɤ
ǥ줿ʸǤ롣
KOI8-U KOI8-R ˤʸåȤǤꡢ
饤ʸ(Ukrainian) ˤ褯б롣
Τɤ ISO-8859 Τ褦 ISO-2022 ߴǤϤʤ
.LP
Linux Ǥ KOI8-R Υ륵ݡȤϡ
桼⡼ɤΥ桼ƥƥǼ¸Ƥ롣
ϥܡɤγƤ EGA եåơ֥ѹ
ɥ饤ФΥեȥơ֥ "桼" Ԥ
.\" Thanks to Tomohiro KUBOTA for the following sections about
.\" national standards.
.SS JIS X 0208
JIS X 0208 ܸιɸʸåȤǤ롣
¾ˤ⤤ĤܸιɸʸåȤϤ
(JIS X 0201, JIS X 0212, JIS X 0213 ʤ)줬ǤפǤ롣
ʸ 94x94 2 Хȥޥȥå֤롣
ƥХȤ 0x21-0x7e ͤġ
JIS X 0208 ʸåȤǤꡢǥǤϤʤȤդ뤳ȡ
ϡ
JIS X 0208 ȤϥƥȥǡɽˤϻȤʤȤȤǤ롣
JIS X 0208 ϡ
EUC-JP, Shift_JIS, ISO-2022-JP Ȥäǥ
ʤȤѤ롣
EUC-JP Linux ˤƺǤפʥǥǤꡢ
US ASCII JIS X 0208 ޤǤ롣
EUC-JP ǤϡJIS X 0208 ʸ 2 ХȤɽ졢
ƥХȤ JIS X 0208 ɤ 0x80 äΤǤ롣
.SS KS X 1001
KS X 1001 ϴڹιɸʸåȤǤ롣
JIS X 0208 Ʊͤˡʸ 94x94 2 Хȥޥȥå֤롣
KS X 1001 JIS X 0208 Ʊͤˡ
EUC-KR, Johab, ISO-2022-KR ȤäǥʤȤѤ롣
EUC-KR Linux ˤƺǤפʥǥǤꡢ
US ASCII KS X 1001 ޤǤ롣
KS C 5601 KS X 1001 θŤ̾Ǥ롣
.SS GB 2312
GB 2312 ϡʸɽ뤿ιɸʸåȤǤ롣
JIS X 0208 Ʊͤˡʸ 94x94 2 Хȥޥȥå֤졢
EUC-CN Ѥ롣
EUC-CN Linux ˤƺǤפʥǥǤꡢ
US ASCII GB 2312 ޤǤ롣
EUC-CN はしばしば GB, GB 2312, CN-GB などと呼ばれる。
.SS Big5
Big5 ѤʸҤΤ˰Ū˻ȤʸåȤǤ롣
(Big5 ʸåȤȥǥξǤ롣)
US ASCII ξ̽Ǥ롣
ASCII ʸ 2 ХȤɽ롣
0xa1-0xfe ΥХȤ 2 Хʸ 1 ʸܤȤѤ롣
Big5 ȤγĥѤȹǹѤƤ롣
ISO 2022 ǤϤʤ
.SS TIS 620
TIS 620 ϥιɸʸåȤǡUS ASCII ξ̽Ǥ롣
ISO 8859 Ʊͤˡʸ 0xa1-0xfe ֤롣
TIS 620 Linux ǤΤ߰ŪѤƤʸåȤǤꡢ
ޤUTF-8 ϹʸäƤ롣
.SS UNICODE
Unicode (ISO10646) ϡʹ֤ѤƤθƤʸ
Τˤ魯ȤŪȤʤǤ롣
Unicode ι¤ϳʸΥɤ 20.1 ӥåȤͿƤ롣
ۤȤɤΥԥ塼 20.1 ӥåȤʤΤǡ
Unicode ǡȤ 32 ӥå˥ɤ졢
16 ӥå (UTF-16)(ʸɤˤ
2 Ĥ 16 ӥåɬפȤʤ)
8 ӥåȥХȤ (UTF-8)Ȥư롣
Unicode ˤĤƤξϡ<http://www.unicode.org> 롣
.LP
Linux は 8-bit Unicode Transformation Format (UTF-8) を用いて Unicode
魯 UTF-8 Unicode βĹɽǤ롣UTF-8 7 ӥåȤ
沽Τ 1 ХȤ 11 ӥåȤǤ 2 ХȤ
16 ӥåȤǤ 3 ХȤ
21 ӥåȤǤ 4 ХȤ
26 ӥåȤǤ 5 ХȤ
31 ӥåȤǤ 6 ХȤѤ롣
.LP
0,1,x ǤդΥӥåȤȤȡХ 0xxxxxxx Unicode Ǥ
00000000 0xxxxxxx Ȥ蘆롣ϡASCII 0xxxxxxx Ʊ
ܥΥɤǤ롣Τ褦ˡASCII ѹʤ UTF-8 ѴǤ
ASCII ΤߤȤϡɤˤƤե륵ˤƤ⡢
ѹ˴ؤƲⵤˤʤƤ褤
.LP
110xxxxx ȤХȤ 2 ХȥɤλϤޤǤ롢ơ110xxxxx
10yyyyyy 00000xxx xxyyyyyy Ȥ褦ȤΩƤ롣ޤ
1110xxxx 3 ХȥɤλϤޤǤꡢ1110xxxx 10yyyyyy 10zzzzzz
xxxxyyyy yyzzzzzz Ȥ褦ȤΩƤ(UTF-8 31 ӥå
ISO 10646 ɤѤȤϡι 6 ХȥɤޤȯŸ)
.LP
ISO-8859-1 ʸåȤȤۤȤɤΥ桼ˤȤäơ
λ¤ϡASCII ϰϳȤäʸ
ĤΥХȤ沽ȤȤ̣롣ΤȤ
(UTF-8 ȤȡISO-8859-1ѤƤ)ΥƥȥեΥ
1 2 ѡ礭ʤäƤޤȤˤʤ롣
䥮ꥷѤ桼ˤȤäƤϡ
ˤäƸΥƥȤ 2 ܤ礭ˤʤ뤳Ȥˤʤ롣
ʤʤ餳θϤۤȤɤ ASCII ϰϳǤ롣
16-bit ɤѤƤܸѤ桼ˤ
3 ХɬפȤʤ롣
Unicode ؤѴ˥르ꥺŪѴФ褤ʸåȤ
(ä ISO-8859-1)ŪˤѴơ֥뤬ɬפǤꡢ
16 ӥåȥɤξϤΥơ֥Ϥʤ礭ʤΤȤʤ롣
.LP
UTF-8 ϼƱŪǤ롣10xxxxxx ϽüǤꡢۤΥХȤϥɤ
ƬǤ롣UTF-8 ʸˤ ASCII ΥХȤϡˤʸȤ
ɽ뤳ȤܤƤۤäˡĤ礭ʥɤΥѡȤ
뤿ˡNUL (\(aq\\0\(aq)) \(aq/\(aq ɬפϤʤ
.LP
ASCII NUL \(aq/\(aq ѹʤᡢͥ UTF-8
ѤƤ뤳Ȥä˰ռʤƤɤ
ͥϥХȤ路Ƥ뤫դɬפʤ
.LP
Unicode ǡΥŵŪˤ Unicode Υ֥åȤ
դؤΥޥåפǤ"֥ե(subfont)"ơ֥Ѥ
Ԥ롣ͥǤϡUnicode ӥǥ RAM ˥ɤ줿
֥եȤȤƵҤ롣ϡUTF-8 ⡼ɤǤ 512 ΰۤʤäܥ
äʸѲǽǤ뤳Ȥ̣롣
ϡܸ졢졢ڹǤϽʬǤϤʤ¾ѤǤ
ʬǤ롣
.LP
ߤΤȤɥ饤ФϹʸʤ
äơ졢䤽¾ιʸɬפʸϤ
Ǥϰʤ
.SS "ISO 2022 と ISO 4873"
ISO 2022 ISO 4873 ɸǤϡ
VT100 ư˴ŤեȥȥǥҤ٤Ƥ롣
Υǥ Linux ͥ
.BR xterm (1)
ˤ(ʬŪ)ݡȤƤ롣ɸܤڹˤƤ褯
Ѥ롣
.LP
G0, G1, G2, G3 ȸƤФ 4 Ĥοʸ礬롣
ΤΤҤȤĤϡǾ̥ӥåȤ 0 Ǥ륳ɤΤθߤʸ
(ͤ G0)ޤҤȤĤϺǾ̥ӥåȤ 1 Ǥ륳ɤΤθߤ
ʸ(ͤ G1)Ǥ롣줾οʸ 94 96 ʸ
Ū 7-bitʸǤꡢ040-0177 (041-0176)
0240-0377 (0241-0376)ΥɤȤ
G0 Ͼ 94 ʸ 041-0176 ΥɤѤ롣
.LP
ʸڤؤϥեȥե \fB^N\fP (SO ޤ LS1),
\fB^O\fP (SI ޤ LS0), ESC n (LS2), ESC o (LS3), ESC N (SS2), ESC O (SS3),
ESC ~ (LS1R), ESC } (LS2R), ESC | (LS3R) ȤäƹԤ롣
ե LS\fIn\fP ϺǾ̥ӥåȤ 0 Ǥ륳ɤΤʸ
G\fIn\fP ꤹ롣
ե LS\fIn\fPR ϺǾ̥ӥåȤ 1 Ǥ륳ɤΤʸåȤ
G\fIn\fP ꤹ롣
ե SS\fIn\fP (Ǿ̥ӥåȤͤˤ餺)ʸΤ
ʸ G\fIn\fP (\fIn\fP=2 ޤ 3)ꤹ롣
.LP
94 ʸǤϡץ ESC ( xx (G0 ), ESC ) xx (G1
), ESC * xx (G2 ), ESC + xx (G3 ) ˤäơG\fIn\fP ʸ
Ѥ褦˻ؼ롣
xx "ISO 2375 International Register of Coded Character Sets"
ƤʸޤʸǤ롣
Ȥ ESC ( @ ISO 646 ʸ G0 ȤӡESC ( A
(ʥС()ˡݥ()) UK ʸ
롣ESC ( B (̲ߵΤ˥顼()) ASCII롣
ESC ( M եꥫ(African languages) ESC
( ! A 塼и(Cuban)ʸ롣ʤɤʤɡ
.LP
96-ʸǤϡץ ESC
\- xx (G1 用), ESC . xx (G2 用), ESC / xx (G3 用)を用いることで、
G\fIn\fP ʸѤ褦˻ؼ롣
㤨СESC - G ϥإ֥饤ե٥å(Hebrew alphabet)
G1 Ȥ롣
.LP
マルチバイト文字集合ではエスケープシーケンス ESC $ xx または ESC $ ( xx
(G0 用), ESC $ ) xx (G1 用), ESC $ * xx (G2 用), ESC $ + xx (G3 用)
Ѥ뤳Ȥǡ G\fIn\fP ʸѤ褦˻ؼ롣
㤨СESC $ ( C ڹ(Korean)ʸ G0 Ȥ롣
ESC $ B ˤäܸʸåȤϡǶΥСǤ
ESC & @ ESC $ B ˤä褦ˤʤä
.LP
ISO 4873 Ϥ¤줿ʸѤꤹ롢ε
ϡG0 ( ASCII)ꤵ롣äơG1, G2, G3 ϺǾ̥ӥåȤ
åȤ줿ɤȤƤΤ߸ƤӽФȤǤ롣
äˡ\fB^N\fP \fB^O\fP Ѥ줺ESC ( xx xx=B ȤƤΤ
Ѥ뤳ȤǤ
ESC ) xx, ESC * xx, ESC + xx Ϥ줾 ESC \- xx, ESC . xx, ESC / xx
ˤʤ롣
.SH 関連項目
.BR console (4),
.BR console_codes (4),
.BR console_ioctl (4),
.BR ascii (7),
.BR iso_8859-1 (7),
.BR unicode (7),
.BR utf-8 (7)