File: extra_word_break_test_data.rsv

package info (click to toggle)
rust-unic-segment 0.9.0-1
  • links: PTS, VCS
  • area: main
  • in suites: bookworm, forky, sid, trixie
  • size: 364 kB
  • sloc: makefile: 2
file content (50 lines) | stat: -rw-r--r-- 1,589 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
// Copyright 2012-2015 The Rust Project Developers.
// Copyright 2017 The UNIC Project Developers.
//
// See the COPYRIGHT file at the top-level directory of this distribution.
//
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
// option. This file may not be copied, modified, or distributed
// except according to those terms.

// TODO: Add more test cases, e.g. flag emoji interspersed with Extend characters and ZWJ.

// Each entry is `(input, expected_segments)`: the input string paired with the
// word segments it is expected to be split into, in order.
&[
    // Plain ASCII words separated by a single space.
    ("hello world", &["hello", " ", "world"]),

    // Long chain of flag emoji: an even number of regional indicator symbols
    // pairs up two by two.
    (
        "🇦🇫🇦🇽🇦🇱🇩🇿🇦🇸🇦🇩🇦🇴",
        &["🇦🇫", "🇦🇽", "🇦🇱", "🇩🇿", "🇦🇸", "🇦🇩", "🇦🇴"],
    ),

    // Long chain with an odd number of regional indicator symbols: the
    // trailing unpaired symbol forms its own segment.
    (
        "🇦🇫🇦🇽🇦🇱🇩🇿🇦🇸🇦🇩🇦",
        &["🇦🇫", "🇦🇽", "🇦🇱", "🇩🇿", "🇦🇸", "🇦🇩", "🇦"],
    ),

    // Chain interrupted by ASCII letters: pairing restarts after each letter,
    // so symbols left without a partner stand alone.
    (
        "🇦a🇫🇦🇽a🇦🇱🇩🇿🇦🇸🇦🇩🇦",
        &["🇦", "a", "🇫🇦", "🇽", "a", "🇦🇱", "🇩🇿", "🇦🇸", "🇦🇩", "🇦"],
    ),

    // Emoji joined by U+200D (zero width joiner) stay in a single segment.
    (
        "\u{1f468}\u{200d}\u{1f468}\u{200d}\u{1f466}",
        &["\u{1f468}\u{200d}\u{1f468}\u{200d}\u{1f466}"],
    ),

    // Two adjacent emoji split apart; the skin-tone modifier (U+1F3FC) stays
    // attached to the emoji it follows.
    (
        "😌👎🏼",
        &["😌", "👎🏼"],
    ),

    // Flags followed by ordinary text: the odd trailing regional indicator,
    // the space, and the word are each separate segments.
    (
        "🇨🇦🇨🇭🇿🇲🇿 hi",
        &["🇨🇦", "🇨🇭", "🇿🇲", "🇿", " ", "hi"],
    ),
]