1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247
|
//===----------------------------------------------------------------------===//
//
// This source file is part of the Swift.org open source project
//
// Copyright (c) 2021-2022 Apple Inc. and the Swift project authors
// Licensed under Apache License v2.0 with Runtime Library Exception
//
// See https://swift.org/LICENSE.txt for license information
//
//===----------------------------------------------------------------------===//
@_implementationOnly import _RegexParser
extension AST {
var dslTree: DSLTree {
return DSLTree(root.dslTreeNode)
}
}
extension AST.Node {
/// Converts an AST node to a `convertedRegexLiteral` node.
var dslTreeNode: DSLTree.Node {
func wrap(_ node: DSLTree.Node) -> DSLTree.Node {
switch node {
case .convertedRegexLiteral:
// FIXME: DSL can have one item concats
// assertionFailure("Double wrapping?")
return node
default:
break
}
// TODO: Should we do this for the
// single-concatenation child too, or should?
// we wrap _that_?
return .convertedRegexLiteral(node, .init(ast: self))
}
// Convert the top-level node without wrapping
func convert() throws -> DSLTree.Node {
switch self {
case let .alternation(v):
let children = v.children.map(\.dslTreeNode)
return .orderedChoice(children)
case let .concatenation(v):
return .concatenation(v.children.map(\.dslTreeNode))
case let .group(v):
let child = v.child.dslTreeNode
switch v.kind.value {
case .capture:
return .capture(child)
case .namedCapture(let name):
return .capture(name: name.value, child)
case .balancedCapture:
throw Unsupported("TODO: balanced captures")
default:
return .nonCapturingGroup(.init(ast: v.kind.value), child)
}
case let .conditional(v):
let trueBranch = v.trueBranch.dslTreeNode
let falseBranch = v.falseBranch.dslTreeNode
return .conditional(
.init(ast: v.condition.kind), trueBranch, falseBranch)
case let .quantification(v):
let child = v.child.dslTreeNode
return .quantification(
.init(ast: v.amount.value), .syntax(.init(ast: v.kind.value)), child)
case let .quote(v):
return .quotedLiteral(v.literal)
case let .trivia(v):
return .trivia(v.contents)
case .interpolation:
throw Unsupported("TODO: interpolation")
case let .atom(v):
switch v.kind {
case .scalarSequence(let seq):
// The DSL doesn't have an equivalent node for scalar sequences. Splat
// them into a concatenation of scalars.
return .concatenation(seq.scalarValues.map { .atom(.scalar($0)) })
default:
return .atom(v.dslTreeAtom)
}
case let .customCharacterClass(ccc):
return .customCharacterClass(ccc.dslTreeClass)
case .empty(_):
return .empty
case let .absentFunction(abs):
// TODO: What should this map to?
return .absentFunction(.init(ast: abs))
#if RESILIENT_LIBRARIES
@unknown default:
fatalError()
#endif
}
}
// FIXME: make total function again
let converted = try! convert()
return wrap(converted)
}
}
extension AST.CustomCharacterClass {
var dslTreeClass: DSLTree.CustomCharacterClass {
// TODO: Not quite 1-1
func convert(
_ member: Member
) -> DSLTree.CustomCharacterClass.Member {
switch member {
case let .custom(ccc):
return .custom(ccc.dslTreeClass)
case let .range(r):
return .range(
r.lhs.dslTreeAtom, r.rhs.dslTreeAtom)
case let .atom(a):
return .atom(a.dslTreeAtom)
case let .quote(q):
return .quotedLiteral(q.literal)
case let .setOperation(lhs, op, rhs):
let lhs = DSLTree.CustomCharacterClass(
members: lhs.map(convert),
isInverted: false)
let rhs = DSLTree.CustomCharacterClass(
members: rhs.map(convert),
isInverted: false)
switch op.value {
case .subtraction:
return .subtraction(lhs, rhs)
case .intersection:
return .intersection(lhs, rhs)
case .symmetricDifference:
return .symmetricDifference(lhs, rhs)
#if RESILIENT_LIBRARIES
@unknown default:
fatalError()
#endif
}
case let .trivia(t):
return .trivia(t.contents)
#if RESILIENT_LIBRARIES
@unknown default:
fatalError()
#endif
}
}
return .init(
members: members.map(convert),
isInverted: self.isInverted)
}
}
extension AST.Atom.EscapedBuiltin {
var dslAssertionKind: DSLTree.Atom.Assertion? {
switch self {
case .wordBoundary: return .wordBoundary
case .notWordBoundary: return .notWordBoundary
case .startOfSubject: return .startOfSubject
case .endOfSubject: return .endOfSubject
case .textSegment: return .textSegment
case .notTextSegment: return .notTextSegment
case .endOfSubjectBeforeNewline: return .endOfSubjectBeforeNewline
case .firstMatchingPositionInSubject: return .firstMatchingPositionInSubject
case .resetStartOfMatch: return .resetStartOfMatch
default: return nil
}
}
var dslCharacterClass: DSLTree.Atom.CharacterClass? {
switch self {
case .decimalDigit: return .digit
case .notDecimalDigit: return .notDigit
case .horizontalWhitespace: return .horizontalWhitespace
case .notHorizontalWhitespace: return .notHorizontalWhitespace
case .newlineSequence: return .newlineSequence
case .notNewline: return .notNewline
case .whitespace: return .whitespace
case .notWhitespace: return .notWhitespace
case .verticalTab: return .verticalWhitespace
case .notVerticalTab: return .notVerticalWhitespace
case .wordCharacter: return .word
case .notWordCharacter: return .notWord
case .graphemeCluster: return .anyGrapheme
default: return nil
}
}
}
extension AST.Atom {
var dslAssertionKind: DSLTree.Atom.Assertion? {
switch kind {
case .caretAnchor: return .caretAnchor
case .dollarAnchor: return .dollarAnchor
case .escaped(let b): return b.dslAssertionKind
default: return nil
}
}
var dslCharacterClass: DSLTree.Atom.CharacterClass? {
switch kind {
case .escaped(let b): return b.dslCharacterClass
default: return nil
}
}
}
extension AST.Atom {
var dslTreeAtom: DSLTree.Atom {
if let kind = dslAssertionKind {
return .assertion(kind)
}
if let cc = dslCharacterClass {
return .characterClass(cc)
}
switch self.kind {
case let .char(c): return .char(c)
case let .scalar(s): return .scalar(s.value)
case .dot: return .dot
case let .backreference(r): return .backreference(.init(ast: r))
case let .changeMatchingOptions(seq): return .changeMatchingOptions(.init(ast: seq))
case .escaped(let c):
guard let val = c.scalarValue else {
fatalError("Got a .escaped that was not an assertion, character class, or scalar value \(self)")
}
return .scalar(val)
default: return .unconverted(.init(ast: self))
}
}
}
|