File: HandWrittenParticipant.swift

package info (click to toggle)
swiftlang 6.0.3-2
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 2,519,992 kB
  • sloc: cpp: 9,107,863; ansic: 2,040,022; asm: 1,135,751; python: 296,500; objc: 82,456; f90: 60,502; lisp: 34,951; pascal: 19,946; sh: 18,133; perl: 7,482; ml: 4,937; javascript: 4,117; makefile: 3,840; awk: 3,535; xml: 914; fortran: 619; cs: 573; ruby: 573
file content (150 lines) | stat: -rw-r--r-- 4,186 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
//===----------------------------------------------------------------------===//
//
// This source file is part of the Swift.org open source project
//
// Copyright (c) 2021-2022 Apple Inc. and the Swift project authors
// Licensed under Apache License v2.0 with Runtime Library Exception
//
// See https://swift.org/LICENSE.txt for license information
//
//===----------------------------------------------------------------------===//

/// A `Participant` whose grapheme-break data comes from the hand-written
/// line parser defined in this file.
struct HandWrittenParticipant: Participant {
  /// The name reported for this participant.
  static var name: String {
    return "HandWritten"
  }

  /// Returns the function used to turn one line of input into an entry.
  ///
  /// The returned function forwards to `graphemeBreakPropertyData(forLine:)`.
  /// The signature is `throws`, but nothing in this implementation throws.
  static func graphemeBreakProperty() throws -> (String) -> GraphemeBreakEntry? {
    let parseLine: (String) -> GraphemeBreakEntry? = { line in
      graphemeBreakPropertyData(forLine: line)
    }
    return parseLine
  }
}

/// Tries to parse a Unicode scalar, written as hex digits, off the front of
/// `str`.
///
/// - Parameter str: The input to parse. On success the leading hex digits are
///   removed from it. On failure it is left exactly as it was passed in.
/// - Returns: The parsed scalar, or `nil` if `str` does not start with a hex
///   digit or `Unicode.Scalar(hex:)` (declared elsewhere in the project) does
///   not produce a value for the digits.
private func parseScalar(_ str: inout Substring) -> Unicode.Scalar? {
  // Work on a scratch copy and commit only on success, so a failed conversion
  // does not leave the caller's input with its digits already consumed.
  var remainder = str
  let digits = remainder.eat(while: { $0.isHexDigit })
  guard !digits.isEmpty else { return nil }

  let scalar: Unicode.Scalar? = Unicode.Scalar(hex: digits)
  if scalar != nil {
    str = remainder
  }
  return scalar
}

/// Switch for exercising the testing framework itself: when this is `true`,
/// `graphemeBreakPropertyData(forLine:)` deliberately returns `nil` for one
/// specific scalar. Always `false` as written.
private var forceFailure: Bool {
  return false
}

/// Parses one line of grapheme-break property data into an entry.
///
/// The line is read left to right as: a hex scalar, optionally followed by
/// `..` and a second hex scalar (the upper bound of a range), then any run of
/// non-letter characters, then a property name made of letters and `_`.
///
/// - Parameter line: The line of text to parse.
/// - Returns: An entry covering `lower ... upper` with the parsed property, or
///   `nil` when the line does not start with a hex scalar (for example a
///   comment or whitespace line), when `Unicode.GraphemeBreakProperty` does
///   not accept the name, or when `forceFailure` is on and the lower bound is
///   U+07FD.
///
/// Stops with `fatalError("Parse error")` if a `.` follows the first scalar
/// but is not part of `..` followed by a second scalar.
private func graphemeBreakPropertyData(
  forLine line: String
) -> GraphemeBreakEntry? {
  var rest = line[...]

  // No leading scalar: comment or whitespace line, nothing to report.
  guard let first = parseScalar(&rest) else { return nil }

  // A single scalar is treated as a one-element range unless `..` follows.
  var last = first
  if rest.peek(".") {
    guard !rest.eat(exactly: "..").isEmpty, let bound = parseScalar(&rest) else {
      fatalError("Parse error")
    }
    last = bound
  }

  // Skip separators up to the property name, then read the name itself.
  rest.eat(while: { !$0.isLetter })
  let propertyName = rest.eat(while: { $0.isLetter || $0 == "_" })
  guard let property = Unicode.GraphemeBreakProperty(propertyName) else {
    return nil
  }

  // Deliberate miss used to check that the testing framework notices it.
  if forceFailure, first == Unicode.Scalar(0x07FD) {
    return nil
  }

  return GraphemeBreakEntry(first ... last, property)
}


//
// MARK: Eat Convenience Overloads
//

extension Collection where SubSequence == Self {
  // TODO: should the return values be optional, to signal whether anything
  // was actually consumed?

  /// Removes the first element, if any, and returns it.
  ///
  /// - Returns: The removed element, or `nil` if the collection was empty.
  // TODO: is this overload worth having?
  @discardableResult
  internal mutating func eat() -> Element? {
    let head = eat(count: 1)
    return head.first
  }

  /// Removes up to `n` elements from the front and returns them.
  ///
  /// If fewer than `n` elements remain, everything is removed.
  ///
  /// - Parameter n: The number of elements to remove; defaults to 0.
  /// - Returns: The removed prefix.
  @discardableResult
  internal mutating func eat(count n: Int = 0) -> SubSequence {
    guard let cut = index(startIndex, offsetBy: n, limitedBy: endIndex) else {
      // Fewer than `n` elements remain: take all of them.
      return eat(upTo: endIndex)
    }
    return eat(upTo: cut)
  }

  /// Removes the first element only if it satisfies `predicate`.
  ///
  /// - Parameter predicate: The test applied to the first element.
  /// - Returns: The removed element, or `nil` if the collection was empty or
  ///   its first element did not satisfy `predicate`.
  @discardableResult
  internal mutating func eat(one predicate: (Element) -> Bool) -> Element? {
    if let head = first, predicate(head) {
      return eat()
    }
    return nil
  }
}

extension Collection where SubSequence == Self, Element: Equatable {
  /// Removes the first element only if it equals `e`.
  ///
  /// - Returns: The removed element, or `nil` if nothing was removed.
  @discardableResult
  internal mutating func eat(one e: Element) -> Element? {
    let matches: (Element) -> Bool = { $0 == e }
    return eat(one: matches)
  }

  /// Removes the leading run of elements equal to `e`.
  ///
  /// - Returns: The removed run, which is empty if the first element is not
  ///   `e`.
  @discardableResult
  internal mutating func eat(many e: Element) -> SubSequence {
    let matches: (Element) -> Bool = { $0 == e }
    return eat(while: matches)
  }

  /// Reports whether the first element equals `e`, without removing anything.
  ///
  /// - Returns: `false` for an empty collection.
  internal func peek(_ e: Element) -> Bool {
    guard let head = first else { return false }
    return head == e
  }

  /// Removes the prefix matching `s` element for element, but only if all of
  /// `s` matches.
  ///
  /// - Parameter s: The sequence of elements expected at the front.
  /// - Returns: The removed prefix on a full match. On a mismatch, or if the
  ///   collection ends before `s` does, nothing is removed and the result is
  ///   empty.
  @discardableResult
  internal mutating func eat<S: Sequence>(exactly s: S) -> SubSequence where S.Element == Element {
    var cursor = startIndex
    var expected = s.makeIterator()
    while let want = expected.next() {
      guard cursor < endIndex, want == self[cursor] else {
        // Partial matches consume nothing.
        return eat(upTo: startIndex)
      }
      cursor = index(after: cursor)
    }
    return eat(upTo: cursor)
  }
}

extension Collection where SubSequence == Self, Element: Hashable {
  /// Removes the first element only if it is a member of `s`.
  ///
  /// - Returns: The removed element, or `nil` if nothing was removed.
  @discardableResult
  internal mutating func eat(oneIn s: Set<Element>) -> Element? {
    let isMember: (Element) -> Bool = { candidate in s.contains(candidate) }
    return eat(one: isMember)
  }

  /// Removes the leading run of elements that are members of `s`.
  ///
  /// - Returns: The removed run, which is empty if the first element is not
  ///   in `s`.
  @discardableResult
  internal mutating func eat(whileIn s: Set<Element>) -> SubSequence {
    let isMember: (Element) -> Bool = { candidate in s.contains(candidate) }
    return eat(while: isMember)
  }
}

extension Collection where SubSequence == Self {
  /// Removes everything before `idx` and returns it.
  ///
  /// - Parameter idx: The position of the first element to keep.
  /// - Returns: The removed prefix, `self[..<idx]`. Afterwards `self` is the
  ///   old `self[idx...]`.
  @discardableResult
  internal mutating func eat(upTo idx: Index) -> SubSequence {
    let consumed = self[..<idx]
    self = self[idx...]
    return consumed
  }

  /// Removes the leading run of elements that satisfy `predicate`.
  ///
  /// - Parameter predicate: The test applied to successive elements from the
  ///   front, stopping at the first one that fails it.
  /// - Returns: The removed run, which is empty if the first element fails
  ///   `predicate` or the collection is empty.
  @discardableResult
  internal mutating func eat(
    while predicate: (Element) -> Bool
  ) -> SubSequence {
    // Walk forward to the first element that fails the predicate.
    var stop = startIndex
    while stop != endIndex, predicate(self[stop]) {
      formIndex(after: &stop)
    }
    return eat(upTo: stop)
  }

}