File: FastxParserThreadUtils.hpp

package info (click to toggle)
rapmap 0.15.0%2Bdfsg-4
  • links: PTS, VCS
  • area: main
  • in suites: trixie
  • size: 6,356 kB
  • sloc: cpp: 48,826; ansic: 4,471; sh: 215; python: 82; makefile: 19
file content (68 lines) | stat: -rw-r--r-- 2,215 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
#ifndef FASTX_PARSER_THREAD_UTILS_HPP
#define FASTX_PARSER_THREAD_UTILS_HPP

#include <cassert>
#include <thread>
#include <chrono>
#include <random>
#include <pthread.h>
#if defined(__SSE2__)
#include <xmmintrin.h> // _mm_pause
#endif

// Most of this code is taken directly from https://github.com/geidav/spinlocks-bench/blob/master/os.hpp.
// However, things may be renamed, modified, or randomly mangled over time.
#define ALWAYS_INLINE   inline __attribute__((__always_inline__))

namespace fastx_parser {
  namespace thread_utils {

    static const constexpr size_t MIN_BACKOFF_ITERS = 32;
    static const size_t MAX_BACKOFF_ITERS = 1024;

    ALWAYS_INLINE static void cpuRelax() {
    #if defined(__SSE2__)  // AMD and Intel
      _mm_pause();
    #elif defined(__i386__) || defined(__x86_64__)
      asm volatile("pause");
    #elif defined(__aarch64__)
      asm volatile("wfe");
    #elif defined(__armel__) || defined(__ARMEL__)
      asm volatile ("nop" ::: "memory");
    #elif defined(__arm__) || defined(__aarch64__)
      __asm__ __volatile__ ("yield" ::: "memory");
    #elif defined(__ia64__)  // IA64
      __asm__ __volatile__ ("hint @pause");
    #elif defined(__powerpc__) || defined(__ppc__) || defined(__PPC__)
       __asm__ __volatile__ ("or 27,27,27" ::: "memory");
    #else  // everything else.
       asm volatile ("nop" ::: "memory");
    #endif
    }

    ALWAYS_INLINE void yieldSleep() {
      using namespace std::chrono;
      std::chrono::microseconds ytime(500);
      std::this_thread::sleep_for(ytime);
    }

    ALWAYS_INLINE void backoffExp(size_t &curMaxIters) {
      thread_local std::uniform_int_distribution<size_t> dist;
      thread_local std::minstd_rand gen(std::random_device{}());
      const size_t spinIters = dist(gen, decltype(dist)::param_type{0, curMaxIters});
      curMaxIters = std::min(2*curMaxIters, MAX_BACKOFF_ITERS);
      for (size_t i=0; i<spinIters; i++) { cpuRelax(); }
    }

    ALWAYS_INLINE void backoffOrYield(size_t& curMaxDelay) {
      if (curMaxDelay >= MAX_BACKOFF_ITERS) {
        yieldSleep();
        curMaxDelay = MIN_BACKOFF_ITERS;
      }
      backoffExp(curMaxDelay);
    }

  }
}

#endif // FASTX_PARSER_THREAD_UTILS_HPP