File: Mph.swift

package info (click to toggle)
swiftlang 6.0.3-2
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 2,519,992 kB
  • sloc: cpp: 9,107,863; ansic: 2,040,022; asm: 1,135,751; python: 296,500; objc: 82,456; f90: 60,502; lisp: 34,951; pascal: 19,946; sh: 18,133; perl: 7,482; ml: 4,937; javascript: 4,117; makefile: 3,840; awk: 3,535; xml: 914; fortran: 619; cs: 573; ruby: 573
file content (105 lines) | stat: -rw-r--r-- 2,545 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
//===----------------------------------------------------------------------===//
//
// This source file is part of the Swift.org open source project
//
// Copyright (c) 2021 Apple Inc. and the Swift project authors
// Licensed under Apache License v2.0 with Runtime Library Exception
//
// See https://swift.org/LICENSE.txt for license information
// See https://swift.org/CONTRIBUTORS.txt for the list of Swift project authors
//
//===----------------------------------------------------------------------===//

/// A minimal perfect hash function over a fixed set of `UInt64` keys.
///
/// The table is built in levels. Level `i` owns one bit array and hashes keys
/// with seed `i`. A key that is the only one landing on a slot at some level
/// keeps that slot (its bit stays set); keys that share a slot are cleared from
/// that level and retried at the next one. A key's final index is the number of
/// set bits that precede its own bit, counted across all levels in order.
public struct Mph {
  /// One bit array per level. A set bit marks a slot claimed by exactly one key
  /// at that level.
  public var bitArrays: [BitArray] = []

  /// Rank samples, one array per level. Entry `k` of level `i` is the number of
  /// set bits in all earlier levels plus the first `8 * k` words of level `i`.
  public var ranks: [[UInt16]] = []
  
  /// Builds the hash function for `keys`.
  ///
  /// - Parameters:
  ///   - gamma: Multiplier applied to the number of keys still unplaced to pick
  ///     each level's bit-array size (never smaller than 64 bits).
  ///   - keys: The keys to index. Duplicate values are ignored after their
  ///     first occurrence.
  /// - Precondition: `keys` contains at most `UInt16.max` distinct values.
  init(gamma: Double, keys: [UInt64]) {
    // Equal keys hash to the same slot at every level, so they would collide
    // with each other forever and the loop below would never finish. Keep only
    // the first occurrence of each key.
    var seen = Set<UInt64>()
    var redoKeys: [UInt64] = []
    redoKeys.reserveCapacity(keys.count)
    
    for key in keys where seen.insert(key).inserted {
      redoKeys.append(key)
    }
    
    // Every placed key contributes exactly one set bit, and ranks are stored
    // as `UInt16`. Fail up front with a clear message instead of trapping on
    // arithmetic overflow after the whole table has been built.
    precondition(
      redoKeys.count <= Int(UInt16.max),
      "Mph supports at most \(UInt16.max) distinct keys"
    )
    
    var level: UInt64 = 0
    
    repeat {
      let size = Swift.max(64, Int(gamma * Double(redoKeys.count)))
      var bits = BitArray(size: size)
      var collide: Set<Int> = []
      
      // Hash every pending key once; both passes below reuse the slot.
      var slots: [Int] = []
      slots.reserveCapacity(redoKeys.count)
      
      for key in redoKeys {
        slots.append(Int(hash(key, UInt64(size), seed: level)))
      }
      
      // Pass 1: claim slots. `insert` presumably reports `false` when the bit
      // was already set (declared outside this file — confirm); such a slot is
      // recorded as a collision.
      for slot in slots {
        if !collide.contains(slot), !bits.insert(slot) {
          collide.insert(slot)
        }
      }
      
      // Pass 2: release every collided slot and queue its keys for the next
      // level, which uses a different seed.
      var tmpRedo: [UInt64] = []
      
      for (key, slot) in zip(redoKeys, slots) where collide.contains(slot) {
        bits[slot] = false
        tmpRedo.append(key)
      }
      
      bitArrays.append(bits)
      redoKeys = tmpRedo
      level += 1
    } while !redoKeys.isEmpty
    
    computeRanks()
  }
  
  /// Recomputes `ranks` from the current `bitArrays`.
  ///
  /// A running count of set bits is carried across levels and sampled once
  /// every 8 words (512 bits), so a lookup needs to scan at most 7 whole words
  /// plus part of one more.
  mutating func computeRanks() {
    // Start from scratch so that calling this more than once does not leave
    // stale samples behind.
    ranks.removeAll()
    
    var pop: UInt16 = 0
    
    for bitArray in bitArrays {
      var rank: [UInt16] = []
      
      for (wordIndex, word) in bitArray.words.enumerated() {
        if wordIndex % 8 == 0 {
          rank.append(pop)
        }
        
        pop += UInt16(word.nonzeroBitCount)
      }
      
      ranks.append(rank)
    }
  }
  
  /// Returns the index assigned to `key`.
  ///
  /// The structure stores no keys, so a key that was not part of the
  /// construction set can still land on a set bit and receive the index of
  /// some other key.
  ///
  /// - Parameter key: The key to look up.
  /// - Returns: The number of set bits preceding the key's bit across all
  ///   levels, or `-1` if the key's slot is unset at every level.
  public func index(for key: UInt64) -> Int {
    for (level, bits) in bitArrays.enumerated() {
      let idx = Int(hash(key, UInt64(bits.size), seed: UInt64(level)))
      
      guard bits[idx] else {
        continue
      }
      
      let wordIndex = idx / 64
      let bitOffset = idx % 64
      
      // Nearest sample at or below the slot (one sample per 512 bits).
      var rank = ranks[level][idx / 512]
      
      // Whole words between the sampled position and the slot's word.
      for j in (wordIndex & ~7) ..< wordIndex {
        rank += UInt16(bits.words[j].nonzeroBitCount)
      }
      
      // Bits below the slot inside its own word: shifting left drops the
      // slot's bit and everything above it. Skipped at offset 0, where there
      // is nothing to count and the shift amount would be the full width.
      if bitOffset > 0 {
        rank += UInt16((bits.words[wordIndex] << (64 - bitOffset)).nonzeroBitCount)
      }
      
      return Int(rank)
    }
    
    return -1
  }
}


/// Builds an `Mph` for `keys`, passing `gamma: 1` to the initializer.
///
/// - Parameter keys: The keys to build the hash function for.
/// - Returns: The `Mph` constructed from `keys`.
public func mph(for keys: [UInt64]) -> Mph {
  let table = Mph(gamma: 1, keys: keys)
  return table
}