File: tokenized_string_char_iterator.h

package info (click to toggle)
chromium 138.0.7204.183-1
  • links: PTS, VCS
  • area: main
  • in suites: trixie
  • size: 6,071,908 kB
  • sloc: cpp: 34,937,088; ansic: 7,176,967; javascript: 4,110,704; python: 1,419,953; asm: 946,768; xml: 739,971; pascal: 187,324; sh: 89,623; perl: 88,663; objc: 79,944; sql: 50,304; cs: 41,786; fortran: 24,137; makefile: 21,806; php: 13,980; tcl: 13,166; yacc: 8,925; ruby: 7,485; awk: 3,720; lisp: 3,096; lex: 1,327; ada: 727; jsp: 228; sed: 36
file content (84 lines) | stat: -rw-r--r-- 2,487 bytes parent folder | download | duplicates (8)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
// Copyright 2019 The Chromium Authors
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.

#ifndef CHROMEOS_ASH_COMPONENTS_STRING_MATCHING_TOKENIZED_STRING_CHAR_ITERATOR_H_
#define CHROMEOS_ASH_COMPONENTS_STRING_MATCHING_TOKENIZED_STRING_CHAR_ITERATOR_H_

#include <stddef.h>
#include <stdint.h>

#include <memory>

#include "base/memory/raw_ref.h"
#include "chromeos/ash/components/string_matching/tokenized_string.h"

// Forward declaration only: this header refers to UTF16CharIterator solely
// through a std::unique_ptr member, so the complete type is not needed here.
namespace base::i18n {
class UTF16CharIterator;
}  // namespace base::i18n

namespace ash::string_matching {

// An UTF16 char iterator for a TokenizedString.
class TokenizedStringCharIterator {
 public:
  struct State {
    State();
    State(size_t token_index, int char_index);

    size_t token_index;
    int32_t char_index;
  };

  // Requires |tokenized| out-lives this iterator.
  explicit TokenizedStringCharIterator(const TokenizedString& tokenized);

  TokenizedStringCharIterator(const TokenizedStringCharIterator&) = delete;
  TokenizedStringCharIterator& operator=(const TokenizedStringCharIterator&) =
      delete;

  ~TokenizedStringCharIterator();

  // Advances to the next char. Returns false if there is no next char.
  bool NextChar();

  // Advances to the first char of the next token. Returns false if there is
  // no next token.
  bool NextToken();

  // Returns the current char if there is one. Otherwise, returns 0.
  int32_t Get() const;

  // Returns the array index in original text of the tokenized string that is
  // passed in constructor.
  int32_t GetArrayPos() const;

  // Returns the number of UTF16 code units for the current char.
  size_t GetCharSize() const;

  // Returns true if the current char is the first char of the current token.
  bool IsFirstCharOfToken() const;

  // Returns true if the current char is the second char of the current token.
  bool IsSecondCharOfToken() const;

  // Helpers to get and restore the iterator's state.
  State GetState() const;
  void SetState(const State& state);

  // Returns true if the iterator is at the end.
  bool end() const { return !current_token_iter_; }

 private:
  void CreateTokenCharIterator();

  const raw_ref<const TokenizedString::Tokens> tokens_;
  const raw_ref<const TokenizedString::Mappings> mappings_;

  size_t current_token_;
  std::unique_ptr<base::i18n::UTF16CharIterator> current_token_iter_;
};

}  // namespace ash::string_matching

#endif  // CHROMEOS_ASH_COMPONENTS_STRING_MATCHING_TOKENIZED_STRING_CHAR_ITERATOR_H_