File: TextNormalizerTest.php

package info (click to toggle)
php-league-commonmark 2.7.1-1
  • links: PTS, VCS
  • area: main
  • in suites: experimental
  • size: 8,264 kB
  • sloc: php: 20,396; xml: 1,988; ruby: 45; makefile: 21; javascript: 15
file content (70 lines) | stat: -rw-r--r-- 3,064 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
<?php

declare(strict_types=1);

/*
 * This file is part of the league/commonmark package.
 *
 * (c) Colin O'Dell <colinodell@gmail.com>
 *
 * For the full copyright and license information, please view the LICENSE
 * file that was distributed with this source code.
 */

namespace League\CommonMark\Tests\Unit\Normalizer;

use League\CommonMark\Normalizer\TextNormalizer;
use PHPUnit\Framework\Attributes\DataProvider;
use PHPUnit\Framework\TestCase;

/**
 * Unit tests for TextNormalizer::normalize().
 *
 * Every dataset pairs a raw input string with the exact string the normalizer
 * is expected to produce for it.
 */
final class TextNormalizerTest extends TestCase
{
    /**
     * Asserts that normalizing $input yields exactly $expectedOutput.
     *
     * assertSame() is used instead of assertEquals() so the comparison is
     * strict (same type, byte-identical content); assertEquals() may treat
     * numeric-looking strings as equal even when their bytes differ.
     */
    #[DataProvider('dataProviderForTestNormalize')]
    public function testNormalize(string $input, string $expectedOutput): void
    {
        $this->assertSame($expectedOutput, (new TextNormalizer())->normalize($input));
    }

    /**
     * Provides [input, expected normalized output] pairs.
     *
     * @return iterable<array{string, string}>
     */
    public static function dataProviderForTestNormalize(): iterable
    {
        // Basic ASCII: empty input, unchanged text, collapsed spaces, lowercasing.
        yield ['', ''];
        yield ['hello world', 'hello world'];
        yield ['hello-world', 'hello-world'];
        yield ['hello     world', 'hello world'];
        yield ['Hello World!', 'hello world!'];

        // Punctuation, symbols, and non-ASCII letters (including case folding).
        yield ['456*(&^3484389462342#$#$#$#$', '456*(&^3484389462342#$#$#$#$'];
        yield ['me&you', 'me&you'];
        yield ['special char ὐ here', 'special char ὐ here'];
        yield ['ПРИСТАНЯМ СТРЕМЯТСЯ', 'пристаням стремятся'];
        yield ['пристаням стремятся', 'пристаням стремятся'];
        yield ['emoji 😂 example', 'emoji 😂 example'];
        yield ['One ½ half', 'one ½ half'];
        yield ['Roman ↁ example', 'roman ↁ example'];
        yield ['Here\'s a DŽ digraph', 'here\'s a dž digraph'];
        yield ['Here\'s another dž digraph', 'here\'s another dž digraph'];
        yield ['Unicode x² superscript', 'unicode x² superscript'];
        yield ['Equal = sign', 'equal = sign'];
        // Tabs are written as explicit "\t" escapes so they stay visible and
        // cannot be silently converted to spaces by an editor or formatter.
        yield ["Tabs\tin\there", 'tabs in here'];
        yield ["Tabs-\t-in-\t-here-too", 'tabs- -in- -here-too'];
        yield ['We-love---dashes even with -lots- of    spaces', 'we-love---dashes even with -lots- of spaces'];
        yield ['LOUD NOISES', 'loud noises'];
        yield ['ťęŝŧ', 'ťęŝŧ'];
        yield ['ŤĘŜŦ', 'ťęŝŧ'];

        // Newlines: leading/trailing ones are dropped, inner runs become one space.
        yield ["\nWho\nput\n\n newlines  \nin here?!\n", 'who put newlines in here?!'];

        // Sinhala text, including a trailing space that is expected to be removed.
        yield ['අත්හදා බලන මාතෘකාව', 'අත්හදා බලන මාතෘකාව'];
        yield ['අත්හදා බලන මාතෘකාව -', 'අත්හදා බලන මාතෘකාව -'];
        yield ['අත්හදා බලන මාතෘකාව - ', 'අත්හදා බලන මාතෘකාව -'];
        yield ['අත්හදා බලන මාතෘකාව - අ', 'අත්හදා බලන මාතෘකාව - අ'];

        // CJK text is expected to pass through unchanged.
        yield ['测试标题', '测试标题'];
        yield ['测试 # 标题', '测试 # 标题'];
        yield ['测试 x² 标题', '测试 x² 标题'];
        yield ['試験タイトル', '試験タイトル'];
    }
}