File: MultinomialSampler.hpp

package info (click to toggle)
salmon 1.10.3%2Bds1-3
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 35,148 kB
  • sloc: cpp: 200,707; ansic: 171,082; sh: 859; python: 792; makefile: 238
file content (67 lines) | stat: -rw-r--r-- 1,615 bytes parent folder | download | duplicates (5)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
#ifndef _MULTINOMIAL_SAMPLER_HPP_
#define _MULTINOMIAL_SAMPLER_HPP_

#include <algorithm>
#include <random>
#include <vector>

class MultinomialSampler {
public:
  MultinomialSampler(std::random_device& rd) : gen_(rd()), u01_(0.0, 1.0) {}

  void operator()(std::vector<uint64_t>::iterator sampleBegin, uint32_t n,
                  uint32_t k, std::vector<double>::iterator probsBegin,
                  bool clearCounts = true) {
    uint32_t i, j;
    double u, sum;
    std::vector<double> z(k + 1, 0.0);

    if (clearCounts) {
      for (i = 0; i < k; i++) {
        *(sampleBegin + i) = 0;
      }
    }

    z[0] = 0;
    for (i = 1; i <= k; i++) {
      sum = 0;
      for (j = 0; j < i; j++)
        sum += *(probsBegin + j);
      z[i] = sum;
    }

    // If k is small (<= 100), linear search is usually faster
    if (k <= 100) {
      for (j = 0; j < n; j++) {
        u = u01_(gen_);

        for (i = 0; i < k; i++) {
          if ((z[i] < u) && (u <= z[i + 1])) {
            (*(sampleBegin + i))++;
            break;
          }
        }
      }
    } else { // k is large enough to warrant binary search
      for (j = 0; j < n; j++) {
        u = u01_(gen_);

        // Find the offset of the element to increment
        auto it = std::lower_bound(z.begin(), z.end() - 1, u);
        size_t offset = static_cast<size_t>(std::distance(z.begin(), it));

        if (*it > u and offset > 0) {
          offset -= 1;
        }

        (*(sampleBegin + offset))++;
      }
    }
  }

private:
  std::mt19937 gen_;
  std::uniform_real_distribution<> u01_;
};

#endif //_MULTINOMIAL_SAMPLER_HPP_