File: LatinCharReplacementTWTest.java

package info (click to toggle)
openjdk-11 11.0.4%2B11-1
  • links: PTS, VCS
  • area: main
  • in suites: sid
  • size: 757,028 kB
  • sloc: java: 5,016,041; xml: 1,191,974; cpp: 934,731; ansic: 555,697; sh: 24,299; objc: 12,703; python: 3,602; asm: 3,415; makefile: 2,772; awk: 351; sed: 172; perl: 114; jsp: 24; csh: 3
file content (80 lines) | stat: -rw-r--r-- 3,098 bytes parent folder | download | duplicates (17)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
/*
 * Copyright (c) 2008, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 */

/* @test
   @bug 4658679 4879644
   @summary Checks replacement logic within EUC-TW decoder
*/

/*
 * Regression test for bug 4658679: the EUC-TW decoder should perform
 * replacement when it encounters Latin characters outside the normal
 * US-ASCII range, for example isolated occurrences of French accented
 * characters embedded in otherwise valid input.
 */
import java.io.*;
/**
 * Checks that the x-EUC-TW decoder emits the replacement character (U+FFFD)
 * for bytes that are illegal within EUC-TW, while still decoding the valid
 * bytes around them.
 */
public class LatinCharReplacementTWTest {
    /** Bug identifier quoted in every failure message. */
    private static final String BUG_ID = "4658679";

    /** Name of the charset whose decoder is under test. */
    private static final String CHARSET_NAME = "x-EUC-TW";

    /**
     * Decodes a fixed byte sequence through an {@link InputStreamReader} and
     * compares the result with the expected characters.
     *
     * @param args ignored
     * @throws Exception if the decoded output differs from the expected output
     *         in length or content, or if decoding itself fails
     */
    public static void main(String[] args) throws Exception {
        // Two double-byte sequences surrounding single-byte text that
        // contains two stray 0xe9 bytes.
        byte[] input = {
            (byte) 0xa1, (byte) 0xf0,
            (byte) 'r',
            (byte) 'e',
            (byte) 's',
            (byte) 0xe9,  // illegal within EUC-TW
            (byte) 'r',
            (byte) 'v',
            (byte) 0xe9,  // illegal within EUC-TW
            (byte) 's',
            (byte) 0xa2, (byte) 0xf8
        };

        char[] expected = {
            (char) 0xa7,
            'r',
            'e',
            's',
            (char) 0xFFFD,  // replacement for accented lowercase e
            'r',
            'v',
            (char) 0xFFFD,  // replacement for accented lowercase e
            's',
            (char) 0xb0
        };

        char[] decoded = new char[128];
        int numChars;
        try (Reader reader = new InputStreamReader(
                new ByteArrayInputStream(input), CHARSET_NAME)) {
            numChars = readFully(reader, decoded);
        }

        if (numChars != expected.length) {
            throw new Exception("failure of test for bug " + BUG_ID
                    + ": decoded " + numChars + " chars, expected "
                    + expected.length);
        }

        for (int i = 0; i < numChars; i++) {
            if (decoded[i] != expected[i]) {
                throw new Exception("failure of test for bug " + BUG_ID
                        + ": at index " + i + " decoded 0x"
                        + Integer.toHexString(decoded[i]) + ", expected 0x"
                        + Integer.toHexString(expected[i]));
            }
        }
    }

    /**
     * Reads from {@code reader} until end of stream or until {@code buffer}
     * is full. A single {@code read} call is allowed to return fewer chars
     * than are available, so the call is repeated.
     *
     * @param reader source of characters
     * @param buffer destination, filled from index 0
     * @return the number of chars stored in {@code buffer}
     * @throws IOException if the underlying read fails
     */
    private static int readFully(Reader reader, char[] buffer) throws IOException {
        int total = 0;
        while (total < buffer.length) {
            int count = reader.read(buffer, total, buffer.length - total);
            if (count < 0) {
                break;  // end of stream
            }
            total += count;
        }
        return total;
    }
}