File: CharacterClass.swift

package info (click to toggle)
swiftlang 6.0.3-2
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 2,519,992 kB
  • sloc: cpp: 9,107,863; ansic: 2,040,022; asm: 1,135,751; python: 296,500; objc: 82,456; f90: 60,502; lisp: 34,951; pascal: 19,946; sh: 18,133; perl: 7,482; ml: 4,937; javascript: 4,117; makefile: 3,840; awk: 3,535; xml: 914; fortran: 619; cs: 573; ruby: 573
file content (140 lines) | stat: -rw-r--r-- 3,857 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
//===----------------------------------------------------------------------===//
//
// This source file is part of the Swift.org open source project
//
// Copyright (c) 2021-2022 Apple Inc. and the Swift project authors
// Licensed under Apache License v2.0 with Runtime Library Exception
//
// See https://swift.org/LICENSE.txt for license information
//
//===----------------------------------------------------------------------===//

// MARK: - Element Consumer

/// An alternate formation of consumers: Don't bind collection type as we're just
/// consuming elements by classification or literal sequencing.
protocol ElementConsumer {
  associatedtype Element
  func consume<C: Collection>(
    _ c: C, in: Range<C.Index>
  ) -> C.Index? where C.Element == Element
}

protocol CharacterConsumer: ElementConsumer
where Element == Character { }

protocol ScalarConsumer: ElementConsumer
where Element == Unicode.Scalar { }

protocol UTF8Consumer: ElementConsumer
where Element == UInt8 { }

protocol UTF16Consumer: ElementConsumer
where Element == UInt16 { }

// struct ...LiteralSequence: ...Consumer { ... }

// MARK: - Element Classes

protocol ElementClass: ElementConsumer {
  func contains(_ e: Element) -> Bool
}
extension ElementClass {
  func consume<C: Collection>(
    _ c: C, in range: Range<C.Index>
  ) -> C.Index? where C.Element == Element {
    // FIXME: empty ranges, etc...
    let lower = range.lowerBound
    return contains(c[lower]) ? c.index(after: lower) : nil
  }
}

protocol ScalarClass: ElementClass, ScalarConsumer {}
protocol CharacterClass: ElementClass, CharacterConsumer {}

// MARK: Granularity adapters

/// Any higher-granularity consumer can be a lower-granularity
/// consumer by just consuming at its higher-granularity
struct _CharacterToScalar <
  Characters: CharacterConsumer
>: ScalarConsumer {
  var characters: Characters

  func consume<C: Collection>(
    _ c: C, in range: Range<C.Index>
  ) -> C.Index? where C.Element == Unicode.Scalar {
    let str = String(c)
    let r = c.convertByOffset(range, in: str)
    guard let idx = characters.consume(str, in: r) else {
      return nil
    }

    return str.convertByOffset(idx, in: c)
  }
}
// ...

/// Any lower-granularity consumer can be a higher
/// granularity consumer by checking if the result falls on a
/// boundary.
struct _ScalarToCharacter <
  Scalars: ScalarConsumer
>: CharacterConsumer {
  var scalars: Scalars

  func _consume(
    _ str: String, in range: Range<String.Index>
  ) -> String.Index? {
    guard let idx = scalars.consume(str.unicodeScalars, in: range),
          str.isOnGraphemeClusterBoundary(idx)
    else {
      return nil
    }
    return idx
  }

  func consume<C: Collection>(
    _ c: C, in range: Range<C.Index>
  ) -> C.Index? where C.Element == Character {
    let str = String(c)
    let r = c.convertByOffset(range, in: str)

    guard let idx = _consume(str, in: r) else {
      return nil
    }
    return str.convertByOffset(idx, in: c)
  }
}

/// Any lower-granularity class can be a higher-granularity
/// class if we choose a semantic-extension style
struct _FirstScalarCharacters<
  Scalars: ScalarClass
>: CharacterClass {
  var scalars: Scalars
  func contains(_ c: Character) -> Bool {
    scalars.contains(c.unicodeScalars.first!)
  }
}
struct _SingleScalarCharacters<
  Scalars: ScalarClass
>: CharacterClass {
  var scalars: Scalars
  func contains(_ c: Character) -> Bool {
    let scs = c.unicodeScalars
    return scs.count == 1 && scalars.contains(scs.first!)
  }
  // NOTE: This would be equivalent to _ScalarToCharacter
  // for any scalar consumer that consumes only one scalar
  // at a time.
}
struct _AllScalarCharacters<
  Scalars: ScalarClass
>: CharacterClass {
  var scalars: Scalars
  func contains(_ c: Character) -> Bool {
    c.unicodeScalars.allSatisfy(scalars.contains)
  }
}