File: SmartReplaceICU.cpp

package info (click to toggle)
chromium-browser 57.0.2987.98-1~deb8u1
  • links: PTS, VCS
  • area: main
  • in suites: jessie
  • size: 2,637,852 kB
  • ctags: 2,544,394
  • sloc: cpp: 12,815,961; ansic: 3,676,222; python: 1,147,112; asm: 526,608; java: 523,212; xml: 286,794; perl: 92,654; sh: 86,408; objc: 73,271; makefile: 27,698; cs: 18,487; yacc: 13,031; tcl: 12,957; pascal: 4,875; ml: 4,716; lex: 3,904; sql: 3,862; ruby: 1,982; lisp: 1,508; php: 1,368; exp: 404; awk: 325; csh: 117; jsp: 39; sed: 37
file content (113 lines) | stat: -rw-r--r-- 4,800 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
/*
 * Copyright (C) 2007 Apple Inc.  All rights reserved.
 * Copyright (C) 2008 Tony Chang <idealisms@gmail.com>
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 *
 * 1.  Redistributions of source code must retain the above copyright
 *     notice, this list of conditions and the following disclaimer.
 * 2.  Redistributions in binary form must reproduce the above copyright
 *     notice, this list of conditions and the following disclaimer in the
 *     documentation and/or other materials provided with the distribution.
 * 3.  Neither the name of Apple Computer, Inc. ("Apple") nor the names of
 *     its contributors may be used to endorse or promote products derived
 *     from this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY APPLE AND ITS CONTRIBUTORS "AS IS" AND ANY
 * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
 * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 * DISCLAIMED. IN NO EVENT SHALL APPLE OR ITS CONTRIBUTORS BE LIABLE FOR ANY
 * DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
 * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
 * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
 * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

#include "core/editing/commands/SmartReplace.h"

#if !OS(MACOSX)
#include "wtf/Assertions.h"
#include "wtf/text/WTFString.h"
#include <unicode/uset.h>

namespace blink {

// Adds each element of |string| (as yielded by string[i]) to |smartSet| via
// uset_add(). Elements are added one index at a time, so this is only suited
// to strings where every character occupies a single index.
static void addAllCodePoints(USet* smartSet, const String& string) {
  const size_t length = string.length();
  for (size_t index = 0; index != length; ++index) {
    uset_add(smartSet, string[index]);
  }
}

// Returns the ICU set of characters that are exempt from smart replace,
// building it on first use and caching it in a function-local static (one set
// for the "previous character" case, one for the "next character" case). The
// cached sets are never closed by this function.
//
// |isPreviousCharacter| selects which of the two sets is returned.
//
// This is mostly a port of the code in WebCore/editing/SmartReplaceCF.cpp
// except we use ICU in place of CoreFoundation's character classes.
static USet* getSmartSet(bool isPreviousCharacter) {
  static USet* preSmartSet = nullptr;
  static USet* postSmartSet = nullptr;
  USet* smartSet = isPreviousCharacter ? preSmartSet : postSmartSet;
  if (!smartSet) {
    // Whitespace and newline (kCFCharacterSetWhitespaceAndNewline)
    static const UChar* kWhitespaceAndNewLine = reinterpret_cast<const UChar*>(
        u"[[:WSpace:] [\\u000A\\u000B\\u000C\\u000D\\u0085]]");
    UErrorCode ec = U_ZERO_ERROR;
    smartSet = uset_openPattern(
        kWhitespaceAndNewLine,
        lengthOfNullTerminatedString(kWhitespaceAndNewLine), &ec);
    DCHECK(U_SUCCESS(ec)) << ec;

    // CJK ranges.
    // NOTE: uset_addRange() takes an *inclusive* [start, end] pair, unlike the
    // CoreFoundation (start, length) ranges this was ported from, so the end
    // points below are the last code point of each range rather than
    // start + length (which would pull in one unrelated code point per range).
    uset_addRange(smartSet, 0x1100, 0x11FF);  // Hangul Jamo
    uset_addRange(smartSet, 0x2E80, 0x2FDF);  // CJK & Kangxi Radicals
    // Ideograph Descriptions, CJK Symbols, Hiragana, Katakana, Bopomofo, Hangul
    // Compatibility Jamo, Kanbun, & Bopomofo Ext
    uset_addRange(smartSet, 0x2FF0, 0x31BF);
    // Enclosed CJK, CJK Ideographs (Uni Han & Ext A), & Yi
    uset_addRange(smartSet, 0x3200, 0xA4CF);
    uset_addRange(smartSet, 0xAC00, 0xD7AF);  // Hangul Syllables
    uset_addRange(smartSet, 0xF900, 0xFA5F);  // CJK Compatibility Ideographs
    uset_addRange(smartSet, 0xFE30, 0xFE4F);  // CJK Compatibility Forms
    uset_addRange(smartSet, 0xFF00, 0xFFEF);  // Half/Full Width Forms
    // CJK Ideograph Extension B (0xA6D7 code points starting at 0x20000)
    uset_addRange(smartSet, 0x20000, 0x2A6D6);
    // CJK Compatibility Ideographs Supplement
    uset_addRange(smartSet, 0x2F800, 0x2FA1D);

    if (isPreviousCharacter) {
      // Characters after which no extra space is inserted.
      addAllCodePoints(smartSet, "([\"\'#$/-`{");
      preSmartSet = smartSet;
    } else {
      // Characters before which no extra space is inserted.
      addAllCodePoints(smartSet, ")].,;:?\'!\"%*-/}");

      // Punctuation (kCFCharacterSetPunctuation)
      static const UChar* kPunctuationClass =
          reinterpret_cast<const UChar*>(u"[:P:]");
      // Separate status variable so the outer |ec| is not shadowed.
      UErrorCode punctuationEc = U_ZERO_ERROR;
      USet* icuPunct = uset_openPattern(
          kPunctuationClass, lengthOfNullTerminatedString(kPunctuationClass),
          &punctuationEc);
      DCHECK(U_SUCCESS(punctuationEc)) << punctuationEc;
      uset_addAll(smartSet, icuPunct);
      // The temporary punctuation set has been merged in; release it.
      uset_close(icuPunct);

      postSmartSet = smartSet;
    }
  }
  return smartSet;
}

// Reports whether code point |c| belongs to the smart-replace exemption set
// chosen by |isPreviousCharacter| (the set is obtained from getSmartSet()).
bool isCharacterSmartReplaceExempt(UChar32 c, bool isPreviousCharacter) {
  const USet* exemptSet = getSmartSet(isPreviousCharacter);
  return uset_contains(exemptSet, c);
}
}

#endif  // !OS(MACOSX)