File: lzcnt64.c

package info (click to toggle)
valgrind 1%3A3.12.0~svn20160714-1
  • links: PTS, VCS
  • area: main
  • in suites: stretch
  • size: 120,428 kB
  • ctags: 70,855
  • sloc: ansic: 674,645; exp: 26,134; xml: 21,574; asm: 7,570; cpp: 7,567; makefile: 7,380; sh: 6,188; perl: 5,855; haskell: 195
file content (93 lines) | stat: -rw-r--r-- 2,405 bytes parent folder | download | duplicates (9)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93

#include <stdio.h>

typedef  unsigned long long int  ULong;
typedef  unsigned int            UInt;

__attribute__((noinline))
void do_lzcnt64 ( /*OUT*/UInt* flags, /*OUT*/ULong* res, ULong arg )
{
  ULong block[3] = { arg, 0ULL, 0ULL };
  __asm__ __volatile__(
    "movabsq $0x5555555555555555, %%r11" "\n\t"
    "lzcntq 0(%0), %%r11"     "\n\t"
    "movq %%r11, 8(%0)"       "\n\t"
    "pushfq"                  "\n\t"
    "popq %%r11"              "\n\t"
    "movq %%r11, 16(%0)"      "\n"
    : : "r"(&block[0]) : "r11","cc","memory"
  );
  *res = block[1];
  *flags = block[2] & 0x8d5;
}

__attribute__((noinline))
void do_lzcnt32 ( /*OUT*/UInt* flags, /*OUT*/ULong* res, ULong arg )
{
  ULong block[3] = { arg, 0ULL, 0ULL };
  __asm__ __volatile__(
    "movabsq $0x5555555555555555, %%r11" "\n\t"
    "lzcntl 0(%0), %%r11d"    "\n\t"
    "movq %%r11, 8(%0)"       "\n\t"
    "pushfq"                  "\n\t"
    "popq %%r11"              "\n\t"
    "movq %%r11, 16(%0)"      "\n"
    : : "r"(&block[0]) : "r11","cc","memory"
  );
  *res = block[1];
  *flags = block[2] & 0x8d5;
}

__attribute__((noinline))
void do_lzcnt16 ( /*OUT*/UInt* flags, /*OUT*/ULong* res, ULong arg )
{
  ULong block[3] = { arg, 0ULL, 0ULL };
  __asm__ __volatile__(
    "movabsq $0x5555555555555555, %%r11" "\n\t"
    "lzcntw 0(%0), %%r11w"    "\n\t"
    "movq %%r11, 8(%0)"       "\n\t"
    "pushfq"                  "\n\t"
    "popq %%r11"              "\n\t"
    "movq %%r11, 16(%0)"      "\n"
    : : "r"(&block[0]) : "r11","cc","memory"
  );
  *res = block[1];
  *flags = block[2] & 0x8d5;
}

int main ( void )
{
   ULong w;

   w = 0xFEDC192837475675ULL;
   while (1) {
      ULong res;
      UInt  flags;
      do_lzcnt64(&flags, &res, w);
      printf("lzcntq %016llx -> %016llx %04x\n", w, res, flags);
      if (w == 0) break;
      w = ((w >> 2) | (w >> 1)) + (w / 17ULL);
   }

   w = 0xFEDC192837475675ULL;
   while (1) {
      ULong res;
      UInt  flags;
      do_lzcnt32(&flags, &res, w);
      printf("lzcntl %016llx -> %016llx %04x\n", w, res, flags);
      if (w == 0) break;
      w = ((w >> 2) | (w >> 1)) + (w / 17ULL);
   }

   w = 0xFEDC192837475675ULL;
   while (1) {
      ULong res;
      UInt  flags;
      do_lzcnt16(&flags, &res, w);
      printf("lzcntw %016llx -> %016llx %04x\n", w, res, flags);
      if (w == 0) break;
      w = ((w >> 2) | (w >> 1)) + (w / 17ULL);
   }

   return 0;
}