File: Utf16TransformationStrategyTest.java

package info (click to toggle)
libdsiutils-java 2.7.4%2Bdfsg-1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 4,012 kB
  • sloc: java: 34,189; xml: 531; makefile: 51; sh: 47
file content (111 lines) | stat: -rw-r--r-- 6,726 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
/*
 * DSI utilities
 *
 * Copyright (C) 2010-2023 Sebastiano Vigna
 *
 * This program and the accompanying materials are made available under the
 * terms of the GNU Lesser General Public License v2.1 or later,
 * which is available at
 * http://www.gnu.org/licenses/old-licenses/lgpl-2.1-standalone.html,
 * or the Apache Software License 2.0, which is available at
 * https://www.apache.org/licenses/LICENSE-2.0.
 *
 * This program is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY
 * or FITNESS FOR A PARTICULAR PURPOSE.
 *
 * SPDX-License-Identifier: LGPL-2.1-or-later OR Apache-2.0
 */

package it.unimi.dsi.bits;

import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertFalse;
import static org.junit.Assert.assertTrue;

import org.junit.Test;

import it.unimi.dsi.lang.MutableString;

/**
 * Checks the bit vectors produced by {@link TransformationStrategies#utf16()} and
 * {@link TransformationStrategies#prefixFreeUtf16()} on two-, three- and four-character inputs.
 *
 * <p>The same expectations are verified for {@link String} and {@link MutableString} inputs;
 * the assertions live in shared helpers that accept any {@link CharSequence}.
 */
public class Utf16TransformationStrategyTest {

	/** The characters U+0001, U+0002. */
	private static final char[] TWO_CHARS = { '\u0001', '\u0002' };

	/** The characters U+0001, U+0002, U+0003. */
	private static final char[] THREE_CHARS = { '\u0001', '\u0002', '\u0003' };

	/** The characters U+0001, U+0002, U+0003, U+0004. */
	private static final char[] FOUR_CHARS = { '\u0001', '\u0002', '\u0003', '\u0004' };

	/** Runs all expectations against {@link String} inputs. */
	@Test
	public void testCharacterSequence() {
		assertPrefixFreeEncoding(new String(TWO_CHARS), new String(THREE_CHARS), new String(FOUR_CHARS));
		assertPlainEncoding(new String(TWO_CHARS), new String(THREE_CHARS), new String(FOUR_CHARS));
	}

	/** Runs all expectations against {@link MutableString} inputs. */
	@Test
	public void testMutableString() {
		assertPrefixFreeEncoding(new MutableString(TWO_CHARS), new MutableString(THREE_CHARS), new MutableString(FOUR_CHARS));
		assertPlainEncoding(new MutableString(TWO_CHARS), new MutableString(THREE_CHARS), new MutableString(FOUR_CHARS));
	}

	/**
	 * Verifies the prefix-free UTF-16 bit vectors: each is expected to be 16 bits longer than
	 * the characters alone, and every extra bit inspected here is expected to be zero.
	 *
	 * @param two the two-character input.
	 * @param three the three-character input.
	 * @param four the four-character input.
	 */
	private static void assertPrefixFreeEncoding(final CharSequence two, final CharSequence three, final CharSequence four) {
		// Two characters: 32 character bits + 16 extra bits.
		assertEquals(48, prefixFreeLength(two));
		assertEquals(0x40008000L, prefixFreeBits(two, 0, 32));
		assertEquals(0x40008000L, prefixFreeBits(two, 0, 48));
		assertFalse(prefixFreeBit(two, 0));
		assertFalse(prefixFreeBit(two, 1));
		assertTrue(prefixFreeBit(two, 15));
		assertFalse(prefixFreeBit(two, 33));

		// Three characters: 48 character bits + 16 extra bits.
		assertEquals(64, prefixFreeLength(three));
		assertEquals(0xC00040008000L, prefixFreeBits(three, 0, 48));
		assertEquals(0xC00040008000L, prefixFreeBits(three, 0, 64));

		// Four characters: the vector no longer fits a single long, so it is read in windows.
		assertEquals(80, prefixFreeLength(four));
		assertEquals(0x2000C00040008000L, prefixFreeBits(four, 0, 64));
		assertEquals(0, prefixFreeBits(four, 64, 80));
		assertEquals(0x2000C0004000L, prefixFreeBits(four, 16, 80));
	}

	/**
	 * Verifies the plain UTF-16 bit vectors: 16 bits per character and nothing else.
	 *
	 * @param two the two-character input.
	 * @param three the three-character input.
	 * @param four the four-character input.
	 */
	private static void assertPlainEncoding(final CharSequence two, final CharSequence three, final CharSequence four) {
		assertEquals(32, plainLength(two));
		assertEquals(0x40008000L, plainBits(two, 0, 32));
		assertFalse(plainBit(two, 0));
		assertFalse(plainBit(two, 1));
		assertTrue(plainBit(two, 15));

		assertEquals(48, plainLength(three));
		assertEquals(0xC00040008000L, plainBits(three, 0, 48));

		assertEquals(64, plainLength(four));
		assertEquals(0x2000C00040008000L, plainBits(four, 0, 64));
		// Windows that neither start nor end on a character boundary.
		assertEquals(0x2000C000400080L, plainBits(four, 8, 62));
		assertEquals(0x000C000400080L, plainBits(four, 8, 61));
	}

	/** Returns the length of the prefix-free UTF-16 bit vector of {@code s}. */
	private static long prefixFreeLength(final CharSequence s) {
		return TransformationStrategies.prefixFreeUtf16().toBitVector(s).length();
	}

	/** Returns bits {@code from} (inclusive) to {@code to} (exclusive) of the prefix-free UTF-16 bit vector of {@code s}. */
	private static long prefixFreeBits(final CharSequence s, final int from, final int to) {
		return TransformationStrategies.prefixFreeUtf16().toBitVector(s).getLong(from, to);
	}

	/** Returns the bit of given index of the prefix-free UTF-16 bit vector of {@code s}. */
	private static boolean prefixFreeBit(final CharSequence s, final int index) {
		return TransformationStrategies.prefixFreeUtf16().toBitVector(s).getBoolean(index);
	}

	/** Returns the length of the plain UTF-16 bit vector of {@code s}. */
	private static long plainLength(final CharSequence s) {
		return TransformationStrategies.utf16().toBitVector(s).length();
	}

	/** Returns bits {@code from} (inclusive) to {@code to} (exclusive) of the plain UTF-16 bit vector of {@code s}. */
	private static long plainBits(final CharSequence s, final int from, final int to) {
		return TransformationStrategies.utf16().toBitVector(s).getLong(from, to);
	}

	/** Returns the bit of given index of the plain UTF-16 bit vector of {@code s}. */
	private static boolean plainBit(final CharSequence s, final int index) {
		return TransformationStrategies.utf16().toBitVector(s).getBoolean(index);
	}
}