File: EmailRegex.swift

package info (click to toggle)
swiftlang 6.1.3-4
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 2,791,644 kB
  • sloc: cpp: 9,901,738; ansic: 2,201,433; asm: 1,091,827; python: 308,252; objc: 82,166; f90: 80,126; lisp: 38,358; pascal: 25,559; sh: 20,429; ml: 5,058; perl: 4,745; makefile: 4,484; awk: 3,535; javascript: 3,018; xml: 918; fortran: 664; cs: 573; ruby: 396
file content (49 lines) | stat: -rw-r--r-- 1,776 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
import _StringProcessing
import Foundation

extension BenchmarkRunner {
  /// Registers the email-matching benchmarks on this runner.
  ///
  /// Two patterns are exercised: one modelled on the RFC grammar and one that
  /// adds lookahead-based validation. Each is run against `Inputs.validEmails`
  /// and against `Inputs.graphemeBreakData` (the "NoMatches" variants); the
  /// lookahead pattern is additionally run over `Inputs.validEmailsList`.
  mutating func addEmail() {
    // Both patterns come from https://www.regular-expressions.info/email.html
    // Inputs.validEmails is generated by Utils/generateEmails.py

    // Relatively simple pattern for email addresses, based on the official RFC grammar.
    // Notably: the character classes contain ‘, a non-ASCII character, so many
    // optimizations are skipped.
    // NOTE(review): the `A-z` ranges also cover the ASCII punctuation that sits
    // between `Z` and `a`; presumably intentional — the literal is part of the
    // measured workload and must not be altered casually.
    let rfcPattern = #"[A-z0-9!#$%&'*+\/=?^_‘{|}~-]+(?:\.[A-z0-9!#$%&'*+\/=?^_‘{|}~-]+)*@(?:[A-z0-9](?:[A-z0-9-]*[A-z0-9])?\.)+[A-z0-9](?:[A-z0-9-]*[A-z0-9])?"#

    // More involved pattern: validates lengths and rejects consecutive hyphens
    // by means of lookaheads.
    let lookaheadPattern = #"(?=[A-z0-9][A-z0-9@._%+-]{5,253})[A-z0-9._%+-]{1,64}@(?:(?=[A-z0-9-]{1,63}\.)[A-z0-9]+(?:-[A-z0-9]+)*\.){1,8}[A-z]{2,63}"#

    // Single-input benchmarks, listed in the order they are registered.
    let singleInputBenchmarks = [
      CrossBenchmark(
        baseName: "EmailRFC",
        regex: rfcPattern,
        input: Inputs.validEmails
      ),
      CrossBenchmark(
        baseName: "EmailRFCNoMatches",
        regex: rfcPattern,
        input: Inputs.graphemeBreakData
      ),
      CrossBenchmark(
        baseName: "EmailLookahead",
        regex: lookaheadPattern,
        input: Inputs.validEmails
      ),
      CrossBenchmark(
        baseName: "EmailLookaheadNoMatches",
        regex: lookaheadPattern,
        input: Inputs.graphemeBreakData
      ),
    ]

    // The lookahead pattern applied to a list of inputs rather than one input.
    let listBenchmark = CrossInputListBenchmark(
      baseName: "EmailLookaheadList",
      regex: lookaheadPattern,
      inputs: Inputs.validEmailsList
    )

    // Register everything; the list benchmark goes last, as before.
    for benchmark in singleInputBenchmarks {
      benchmark.register(&self)
    }
    listBenchmark.register(&self)
  }
}