File: utf16.h

package info (click to toggle)
chromium 139.0.7258.138-1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 6,120,676 kB
  • sloc: cpp: 35,100,869; ansic: 7,163,530; javascript: 4,103,002; python: 1,436,920; asm: 946,517; xml: 746,709; pascal: 187,653; perl: 88,691; sh: 88,436; objc: 79,953; sql: 51,488; cs: 44,583; fortran: 24,137; makefile: 22,147; tcl: 15,277; php: 13,980; yacc: 8,984; ruby: 7,485; awk: 3,720; lisp: 3,096; lex: 1,327; ada: 727; jsp: 228; sed: 36
file content (68 lines) | stat: -rw-r--r-- 2,476 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
// Copyright 2024 The Chromium Authors
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.

#ifndef THIRD_PARTY_BLINK_RENDERER_PLATFORM_WTF_TEXT_UTF16_H_
#define THIRD_PARTY_BLINK_RENDERER_PLATFORM_WTF_TEXT_UTF16_H_

#include <unicode/utf16.h>

#include "base/containers/span.h"
#include "third_party/blink/renderer/platform/wtf/text/wtf_uchar.h"

namespace WTF {

// U16_GET() for base::span.
//  - If text[offset] is a leading surrogate and text[offset + 1] is a
//    trailing surrogate, a code point computed from text[offset] and
//    text[offset + 1] is returned.
//  - If text[offset] is a trailing surrogate and text[offset - 1] is a
//    leading surrogate, a code point computed from text[offset - 1] and
//    text[offset] is returned.
//  - Otherwise, text[offset] is returned;
inline UChar32 CodePointAt(base::span<const UChar> text, size_t offset) {
  UChar32 code_point;
  U16_GET(text, 0, offset, text.size(), code_point);
  return code_point;
}

// U16_NEXT() for base::span.
// The return value is same as CodePointAt()'s. `offset` argument is updated
// to point the next of the read character.
template <typename T>
UChar32 CodePointAtAndNext(base::span<const UChar> text, T& offset) {
  UChar32 code_point;
  U16_NEXT(text, offset, text.size(), code_point);
  return code_point;
}
template <typename T>
UChar32 CodePointAtAndNext(base::span<const LChar> text, T& offset) {
  return text[offset++];
}

// This is U16_PREV() for base::span.
// Returns a code point ending with text[offset - 1].  That is to say,
//  - Returns a code point computed from text[offset - 2] and text[offset - 1]
//    if offset-1 is greater than start_offset and text[offset - 2] is a
//    leading surrogate and text[offset - 1] is a trailing surrogate.
//  - Otherwise, text[offset - 1] is returned.
//
// `offset` argument is updated to point the first code unit of the read
//  character.  `offset` won't be smaller than `start_offset`.
template <typename T>
UChar32 CodePointAtAndPrevious(base::span<const UChar> text,
                               T start_offset,
                               T& offset) {
  DCHECK_LT(start_offset, offset);
  UChar32 code_point;
  U16_PREV(text, start_offset, offset, code_point);
  return code_point;
}

}  // namespace WTF

using WTF::CodePointAt;
using WTF::CodePointAtAndNext;
using WTF::CodePointAtAndPrevious;

#endif  // THIRD_PARTY_BLINK_RENDERER_PLATFORM_WTF_TEXT_UTF16_H_