File: bmi2-pext64-1a.c

package info (click to toggle)
gcc-arm-none-eabi 15%3A12.2.rel1-1
  • links: PTS, VCS
  • area: main
  • in suites: bookworm
  • size: 959,712 kB
  • sloc: cpp: 3,275,382; ansic: 2,061,766; ada: 840,956; f90: 208,513; makefile: 76,132; asm: 73,433; xml: 50,448; exp: 34,146; sh: 32,436; objc: 15,637; fortran: 14,012; python: 11,991; pascal: 6,787; awk: 4,779; perl: 3,054; yacc: 338; ml: 285; lex: 201; haskell: 122
file content (36 lines) | stat: -rw-r--r-- 1,375 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
/* { dg-do compile } */
/* { dg-skip-if "" { powerpc*-*-darwin* } } */
/* { dg-options "-O3 -mdejagnu-cpu=power7" } */
/* { dg-require-effective-target lp64 } */
/* { dg-require-effective-target powerpc_vsx_ok } */

#define NO_WARN_X86_INTRINSICS 1
#include <x86intrin.h>

unsigned long long
test__pexp_cmask_u64 (unsigned long long a[4])
{
  /* The _pext implementation is nominally a popcount of the mask
     followed by a loop that uses count-leading-zeros to locate the
     next mask bit to process.

     When the mask is a compile-time constant, the popcount should
     fold away and constant propagation should eliminate the
     mask-generation loop, leaving one constant bpermd permute control
     word.

     This function exists so the test can verify that the compiler
     replaces the popcount and loop with a constant bperm control and
     emits a bpermd for each extraction.  */
  const unsigned long mask = 0x00000000100000a4UL;

  /* The mask has four set bits, so every extraction fits in the low
     byte; shifting the accumulator by 8 before each merge keeps the
     four results in separate bytes.  */
  unsigned long packed = _pext_u64 (a[0], mask);

  packed <<= 8;
  packed |= _pext_u64 (a[1], mask);

  packed <<= 8;
  packed |= _pext_u64 (a[2], mask);

  packed <<= 8;
  packed |= _pext_u64 (a[3], mask);

  return packed;
}
/* The resulting assembly should contain exactly four bpermd instructions
   and no popcntd or cntlzd instructions.  */

/* { dg-final { scan-assembler-times "bpermd" 4 } } */
/* { dg-final { scan-assembler-not "popcntd" } } */
/* { dg-final { scan-assembler-not "cntlzd" } } */