File: inner_text_builder.h

package info (click to toggle)
chromium 138.0.7204.183-1
  • links: PTS, VCS
  • area: main
  • in suites: trixie
  • size: 6,071,908 kB
  • sloc: cpp: 34,937,088; ansic: 7,176,967; javascript: 4,110,704; python: 1,419,953; asm: 946,768; xml: 739,971; pascal: 187,324; sh: 89,623; perl: 88,663; objc: 79,944; sql: 50,304; cs: 41,786; fortran: 24,137; makefile: 21,806; php: 13,980; tcl: 13,166; yacc: 8,925; ruby: 7,485; awk: 3,720; lisp: 3,096; lex: 1,327; ada: 727; jsp: 228; sed: 36
file content (98 lines) | stat: -rw-r--r-- 3,725 bytes parent folder | download | duplicates (6)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
// Copyright 2023 The Chromium Authors
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.

#ifndef THIRD_PARTY_BLINK_RENDERER_MODULES_CONTENT_EXTRACTION_INNER_TEXT_BUILDER_H_
#define THIRD_PARTY_BLINK_RENDERER_MODULES_CONTENT_EXTRACTION_INNER_TEXT_BUILDER_H_

#include <optional>

#include "base/memory/stack_allocated.h"
#include "third_party/blink/public/common/tokens/tokens.h"
#include "third_party/blink/public/mojom/content_extraction/inner_text.mojom-blink.h"
#include "third_party/blink/renderer/core/dom/text_visitor.h"
#include "third_party/blink/renderer/modules/modules_export.h"
#include "third_party/blink/renderer/platform/heap/collection_support/heap_vector.h"
#include "third_party/blink/renderer/platform/heap/member.h"

namespace blink {

class HTMLElement;
class HTMLIFrameElement;
class LocalFrame;

// Builds mojom::blink::InnerTextFrame for a frame, and all suitable
// iframes. See the mojom for details on the format.
//
// An InnerTextBuilder is created per Frame. Internally it tracks all iframes
// and will build results for them as well.
//
// The builder stores `params_` and `child_iframes_` as references, so the
// objects they refer to must outlive the builder. The constructor is private;
// the static Build() is the only public entry point.
class MODULES_EXPORT InnerTextBuilder final : public TextVisitor {
  STACK_ALLOCATED();

 public:
  // Not copyable: the builder only holds references to caller-owned state.
  InnerTextBuilder(const InnerTextBuilder&) = delete;
  InnerTextBuilder& operator=(const InnerTextBuilder&) = delete;

  // Produces the InnerTextFrame for `frame`, configured by `params`.
  // NOTE(review): whether the returned pointer can be null (e.g. for a frame
  // without a body) is decided in the .cc file -- confirm there.
  static mojom::blink::InnerTextFramePtr Build(
      LocalFrame& frame,
      const mojom::blink::InnerTextParams& params);

 private:
  // A ChildIFrame is created for every HTMLIFrame in a particular frame. These
  // are created (and added to `child_iframes_`) as the inner-text is generated.
  struct ChildIFrame : public GarbageCollected<ChildIFrame> {
    // Garbage-collection tracing hook, defined out of line.
    // NOTE(review): presumably traces `iframe` -- confirm in the .cc file.
    void Trace(Visitor* visitor) const;
    // The location of the child frame in the resulting inner-text of the
    // parent frame. Defaults to 0 so that a freshly created ChildIFrame never
    // carries an indeterminate value, regardless of how it is constructed.
    unsigned offset = 0;
    // The iframe element this entry was created for.
    Member<const HTMLIFrameElement> iframe;
  };

  // Binds the builder to `params` and to the caller-owned `child_iframes`
  // collection; both are kept by reference (see `params_`, `child_iframes_`).
  InnerTextBuilder(const mojom::blink::InnerTextParams& params,
                   HeapVector<Member<ChildIFrame>>& child_iframes);

  // Builds the results for a frame, and recurses through all child frames.
  // The results are written into `frame`.
  void Build(HTMLElement& body, mojom::blink::InnerTextFrame& frame);

  // Adds text (or NodeLocation) to Segments `frame.segments`. `text_offset` is
  // the current offset into `text` and `next_child_offset` the offset into
  // `text` of the next child.
  // `text_offset` is taken by non-const reference, i.e. it is an in/out
  // argument. NOTE(review): presumably advanced past the consumed text --
  // confirm in the .cc file.
  void AddNextNonFrameSegments(const String& text,
                               unsigned next_child_offset,
                               unsigned& text_offset,
                               mojom::blink::InnerTextFrame& frame);

  // TextVisitor:
  // NOTE(review): presumably where ChildIFrame entries are recorded and
  // `matching_node_location_` is set -- confirm in the .cc file.
  void WillVisit(const Node& element, unsigned offset) override;

  // Parameters supplied by the caller of the static Build(); not owned.
  const mojom::blink::InnerTextParams& params_;

  // Set if `params` contained an `InnerTextDomNodeId` and the node was found.
  std::optional<unsigned> matching_node_location_;

  // Child iframes encountered. The vector is owned by whoever constructed the
  // builder and is only referenced here.
  HeapVector<Member<ChildIFrame>>& child_iframes_;
};

// An alternative implementation wrapping DocumentChunker passage extraction.
// This will be used only when one or more of the relevant optional parameters
// are specified on InnerTextParams.
//
// The static Build() has the same signature as InnerTextBuilder::Build().
// This class declares no data members and its constructor is private, so the
// static Build() is the only public entry point.
class MODULES_EXPORT InnerTextPassagesBuilder final {
  STACK_ALLOCATED();

 public:
  // Not copyable.
  InnerTextPassagesBuilder(const InnerTextPassagesBuilder&) = delete;
  InnerTextPassagesBuilder& operator=(const InnerTextPassagesBuilder&) = delete;

  // Produces the InnerTextFrame for `frame`, configured by `params`.
  // NOTE(review): which optional fields of `params` select this builder, and
  // whether the result can be null, is decided in the .cc file -- confirm
  // there.
  static mojom::blink::InnerTextFramePtr Build(
      LocalFrame& frame,
      const mojom::blink::InnerTextParams& params);

 private:
  // Private so that instances are only created from within the class.
  // NOTE(review): `params` is not stored in any member declared here; how it
  // is used is visible only in the .cc file.
  explicit InnerTextPassagesBuilder(
      const mojom::blink::InnerTextParams& params);
};

}  // namespace blink

#endif  // THIRD_PARTY_BLINK_RENDERER_MODULES_CONTENT_EXTRACTION_INNER_TEXT_BUILDER_H_