File: text_encoder.cc

package info (click to toggle)
chromium 138.0.7204.183-1
  • links: PTS, VCS
  • area: main
  • in suites: trixie
  • size: 6,071,908 kB
  • sloc: cpp: 34,937,088; ansic: 7,176,967; javascript: 4,110,704; python: 1,419,953; asm: 946,768; xml: 739,971; pascal: 187,324; sh: 89,623; perl: 88,663; objc: 79,944; sql: 50,304; cs: 41,786; fortran: 24,137; makefile: 21,806; php: 13,980; tcl: 13,166; yacc: 8,925; ruby: 7,485; awk: 3,720; lisp: 3,096; lex: 1,327; ada: 727; jsp: 228; sed: 36
file content (105 lines) | stat: -rw-r--r-- 4,622 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
/*
 * Copyright (C) 2013 Google Inc. All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are
 * met:
 *
 *     * Redistributions of source code must retain the above copyright
 * notice, this list of conditions and the following disclaimer.
 *     * Redistributions in binary form must reproduce the above
 * copyright notice, this list of conditions and the following disclaimer
 * in the documentation and/or other materials provided with the
 * distribution.
 *     * Neither the name of Google Inc. nor the names of its
 * contributors may be used to endorse or promote products derived from
 * this software without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 */

#include "third_party/blink/renderer/modules/encoding/text_encoder.h"

#include "base/feature_list.h"
#include "third_party/blink/renderer/bindings/modules/v8/v8_text_encoder_encode_into_result.h"
#include "third_party/blink/renderer/core/execution_context/execution_context.h"
#include "third_party/blink/renderer/modules/encoding/encoding.h"
#include "third_party/blink/renderer/platform/bindings/exception_state.h"
#include "third_party/blink/renderer/platform/wtf/text/character_visitor.h"
#include "third_party/blink/renderer/platform/wtf/text/text_encoding_registry.h"

namespace blink {

// Controls whether TextEncoder::encode() throws a DOMException when it fails
// to allocate the result buffer. Enabled by default. When the feature is
// disabled, encode() uses DOMUint8Array::Create() instead of the nullable
// DOMUint8Array::CreateOrNull() path.
BASE_FEATURE(kThrowExceptionWhenTextEncodeOOM,
             "ThrowExceptionWhenTextEncodeOOM",
             base::FEATURE_ENABLED_BY_DEFAULT);

// Factory for TextEncoder. The encoder is always constructed with the UTF-8
// encoding; neither |context| nor |exception_state| is consulted here.
TextEncoder* TextEncoder::Create(ExecutionContext* context,
                                 ExceptionState& exception_state) {
  const auto& utf8_encoding = UTF8Encoding();
  return MakeGarbageCollected<TextEncoder>(utf8_encoding);
}

// Stores |encoding| and creates the codec for it via NewTextCodec(). Only
// UTF-8 is expected here, which the DCHECK below asserts.
TextEncoder::TextEncoder(const WTF::TextEncoding& encoding)
    : encoding_(encoding), codec_(NewTextCodec(encoding)) {
  DCHECK_EQ(encoding_.GetName(), "UTF-8");
}

// Defaulted destructor, defined out of line in this translation unit.
TextEncoder::~TextEncoder() = default;

// Returns the lower-cased name of the encoding in use. Since the encoder only
// ever handles UTF-8, the result is expected to be "utf-8".
String TextEncoder::encoding() const {
  const auto& canonical_name = encoding_.GetName();
  String lowered = canonical_name.GetString().DeprecatedLower();
  DCHECK_EQ(lowered, "utf-8");
  return lowered;
}

// Encodes |input| with the codec and returns the resulting bytes wrapped in a
// DOMUint8Array.
//
// When kThrowExceptionWhenTextEncodeOOM is enabled, the array is allocated
// with DOMUint8Array::CreateOrNull(); if that yields null, an UnknownError
// DOMException is thrown on |exception_state| and the null array is returned.
// When the feature is disabled, DOMUint8Array::Create() is used instead.
NotShared<DOMUint8Array> TextEncoder::encode(const String& input,
                                             ExceptionState& exception_state) {
  // The UnencodableHandling value passed to the codec is never actually used:
  // UTF-8 is the only possible encoding, and it substitutes U+FFFD for
  // unencodable sequences (e.g. unpaired UTF-16 surrogates) instead of
  // falling back to an ASCII substitution.
  auto encode_chars = [this](auto chars) {
    return codec_->Encode(chars, WTF::kNoUnencodables);
  };
  std::string encoded = WTF::VisitCharacters(input, encode_chars);

  if (!base::FeatureList::IsEnabled(kThrowExceptionWhenTextEncodeOOM)) {
    return NotShared<DOMUint8Array>(
        DOMUint8Array::Create(base::as_byte_span(encoded)));
  }

  // Allocation may fail on this path; report the failure to script rather
  // than assuming a valid buffer.
  NotShared<DOMUint8Array> encoded_array(
      DOMUint8Array::CreateOrNull(base::as_byte_span(encoded)));
  if (encoded_array.IsNull()) {
    exception_state.ThrowDOMException(DOMExceptionCode::kUnknownError,
                                      "Failed to allocate buffer.");
  }
  return encoded_array;
}

// Encodes |source| directly into the bytes of |destination| and returns a
// TextEncoderEncodeIntoResult whose `read` is the number of code units
// consumed from |source| and whose `written` is the number of bytes stored
// into |destination|, as reported by the codec.
TextEncoderEncodeIntoResult* TextEncoder::encodeInto(
    const String& source,
    NotShared<DOMUint8Array>& destination) {
  TextEncoderEncodeIntoResult* js_result =
      TextEncoderEncodeIntoResult::Create();

  // Dispatches on the character width of |source| and writes into the
  // destination array's byte span.
  auto encode_into_destination = [this, &destination](auto chars) {
    return codec_->EncodeInto(chars, destination->ByteSpan());
  };
  TextCodec::EncodeIntoResult codec_result =
      WTF::VisitCharacters(source, encode_into_destination);

  js_result->setRead(codec_result.code_units_read);
  js_result->setWritten(codec_result.bytes_written);
  return js_result;
}

}  // namespace blink