File: utf8.c

package info (click to toggle)
vifm 0.14.3-1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 14,252 kB
  • sloc: ansic: 179,567; sh: 5,445; makefile: 723; perl: 347; python: 76; xml: 26
file content (117 lines) | stat: -rw-r--r-- 3,115 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
#include <stic.h>

#include <stddef.h> /* size_t */
#include <stdlib.h> /* free() */
#include <string.h> /* strlen() */
#include <wchar.h>

#include <test-utils.h>

#include "../../src/utils/str.h"
#include "../../src/utils/utf8.h"

SETUP_ONCE()
{
	try_enable_utf8_locale();
}

TEST(get_real_string_width_full)
{
	const char utf8_str[] = "师вгд";
	const size_t expected_len = strlen(utf8_str);
	const size_t calculated_len = utf8_strsnlen(utf8_str, 5);
	assert_int_equal(expected_len, calculated_len);
}

TEST(tabulation_is_counted_correctly)
{
	const char utf8_str[] = "ab\tcd";
	assert_int_equal(5, utf8_strsw_with_tabs(utf8_str, 1));
	assert_int_equal(6, utf8_strsw_with_tabs(utf8_str, 2));
	assert_int_equal(5, utf8_strsw_with_tabs(utf8_str, 3));
	assert_int_equal(10, utf8_strsw_with_tabs(utf8_str, 8));
}

TEST(get_real_string_width_in_the_middle_a, IF(utf8_locale))
{
#define ENDING "丝刀"
	const char utf8_str[] = "师螺" ENDING;
	const char utf8_end[] = ENDING;
#undef ENDING
	const size_t expected_len = strlen(utf8_str) - strlen(utf8_end);
	const size_t calculated_len = utf8_strsnlen(utf8_str, 5);
	assert_int_equal(expected_len, calculated_len);
}

TEST(get_real_string_width_in_the_middle_b, IF(utf8_locale))
{
#define ENDING "丝刀"
	const char utf8_str[] = "师从螺" ENDING;
	const char utf8_end[] = ENDING;
#undef ENDING
	const size_t expected_len = strlen(utf8_str) - strlen(utf8_end);
	const size_t calculated_len = utf8_strsnlen(utf8_str, 7);
	assert_int_equal(expected_len, calculated_len);
}

TEST(length_is_less_or_equal_to_string_length, IF(utf8_locale))
{
	const char *str = "01 R\366yksopp - You Know I Have To Go (\326z"
	                  "g\374r \326zkan 5 AM Edit).mp3";
	const size_t len = strlen(str);
	size_t i;

	for(i = 0; i < len; ++i)
	{
		assert_true(utf8_nstrsnlen(str, i) <= i);
	}
}

TEST(utf8_nstrsw_works, IF(utf8_locale))
{
	const char str[] = "师从abаб";

	/* Full chars. */
	assert_int_equal(0, utf8_nstrsw(str, strlen("")));
	assert_int_equal(2, utf8_nstrsw(str, strlen("师")));
	assert_int_equal(4, utf8_nstrsw(str, strlen("师从")));
	assert_int_equal(5, utf8_nstrsw(str, strlen("师从a")));
	assert_int_equal(6, utf8_nstrsw(str, strlen("师从ab")));
	assert_int_equal(7, utf8_nstrsw(str, strlen("师从abа")));
	assert_int_equal(8, utf8_nstrsw(str, strlen("师从abаб")));
	assert_int_equal(8, utf8_nstrsw(str, strlen("师从abаб   ")));

	/* Cut char in half. */
	int max = strlen("师");
	int i;
	for(i = 1; i < max; ++i)
	{
		assert_int_equal(2, utf8_nstrsw(str, i));
	}
}

#ifdef _WIN32

TEST(utf16_roundtrip, IF(utf8_locale))
{
	const wchar_t str[] = { 0x79d8, 0 };

	char *const utf8 = utf8_from_utf16(str);
	wchar_t *const utf16 = utf8_to_utf16(utf8);
	assert_true(wcscmp(str, utf16) == 0);
	free(utf16);
	free(utf8);
}

TEST(first_char, IF(utf8_locale))
{
	const wchar_t str[] = { 0x79d8, 0 };
	char *const utf8 = utf8_from_utf16(str);
	assert_int_equal(0x79d8, get_first_wchar(utf8));
	free(utf8);
}

#endif

/* vim: set tabstop=2 softtabstop=2 shiftwidth=2 noexpandtab cinoptions-=(0 : */
/* vim: set cinoptions+=t0 filetype=c : */