File: EmailRegex.swift

package info (click to toggle)
swiftlang 6.0.3-2
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 2,519,992 kB
  • sloc: cpp: 9,107,863; ansic: 2,040,022; asm: 1,135,751; python: 296,500; objc: 82,456; f90: 60,502; lisp: 34,951; pascal: 19,946; sh: 18,133; perl: 7,482; ml: 4,937; javascript: 4,117; makefile: 3,840; awk: 3,535; xml: 914; fortran: 619; cs: 573; ruby: 573
file content (49 lines) | stat: -rw-r--r-- 1,776 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
import _StringProcessing
import Foundation

extension BenchmarkRunner {
  /// Registers the email-address regex benchmarks with this runner.
  ///
  /// Two patterns are benchmarked, each against an input expected to match
  /// (`Inputs.validEmails`) and against `Inputs.graphemeBreakData`, which backs
  /// the "NoMatches" variants. The lookahead pattern is additionally run over
  /// `Inputs.validEmailsList`.
  ///
  /// The patterns come from https://www.regular-expressions.info/email.html and
  /// `Inputs.validEmails` is generated by `Utils/generateEmails.py`.
  mutating func addEmail() {
    // Fairly simple pattern based on the official RFC grammar.
    // Its character classes contain ‘, a non-ASCII character, so many
    // optimizations are skipped for this regex.
    // NOTE(review): the `A-z` range also spans the ASCII punctuation that sits
    // between `Z` and `a`; the pattern is reproduced unchanged here.
    let rfcPattern = #"[A-z0-9!#$%&'*+\/=?^_‘{|}~-]+(?:\.[A-z0-9!#$%&'*+\/=?^_‘{|}~-]+)*@(?:[A-z0-9](?:[A-z0-9-]*[A-z0-9])?\.)+[A-z0-9](?:[A-z0-9-]*[A-z0-9])?"#

    // More involved pattern: lookaheads validate overall length and reject
    // consecutive hyphens.
    let lookaheadPattern = #"(?=[A-z0-9][A-z0-9@._%+-]{5,253})[A-z0-9._%+-]{1,64}@(?:(?=[A-z0-9-]{1,63}\.)[A-z0-9]+(?:-[A-z0-9]+)*\.){1,8}[A-z]{2,63}"#

    // Single-input benchmarks, listed in the order they are registered.
    let singleInputBenchmarks = [
      CrossBenchmark(
        baseName: "EmailRFC",
        regex: rfcPattern,
        input: Inputs.validEmails
      ),
      CrossBenchmark(
        baseName: "EmailRFCNoMatches",
        regex: rfcPattern,
        input: Inputs.graphemeBreakData
      ),
      CrossBenchmark(
        baseName: "EmailLookahead",
        regex: lookaheadPattern,
        input: Inputs.validEmails
      ),
      CrossBenchmark(
        baseName: "EmailLookaheadNoMatches",
        regex: lookaheadPattern,
        input: Inputs.graphemeBreakData
      ),
    ]

    // Same lookahead pattern, driven by a list of inputs instead of one input.
    let listBenchmark = CrossInputListBenchmark(
      baseName: "EmailLookaheadList",
      regex: lookaheadPattern,
      inputs: Inputs.validEmailsList
    )

    // Every benchmark is built before any is registered; the list benchmark
    // is registered last.
    for benchmark in singleInputBenchmarks {
      benchmark.register(&self)
    }
    listBenchmark.register(&self)
  }
}