File: p8vector-vectorize-4.c

package info (click to toggle)
gcc-arm-none-eabi 15:12.2.rel1-1
  • links: PTS, VCS
  • area: main
  • in suites: bookworm
  • size: 959,712 kB
  • sloc: cpp: 3,275,382; ansic: 2,061,766; ada: 840,956; f90: 208,513; makefile: 76,132; asm: 73,433; xml: 50,448; exp: 34,146; sh: 32,436; objc: 15,637; fortran: 14,012; python: 11,991; pascal: 6,787; awk: 4,779; perl: 3,054; yacc: 338; ml: 285; lex: 201; haskell: 122
file content (69 lines) | stat: -rw-r--r-- 2,073 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
/* { dg-do compile { target { powerpc*-*-* } } } */
/* { dg-skip-if "" { powerpc*-*-darwin* } } */
/* { dg-require-effective-target powerpc_p8vector_ok } */
/* { dg-options "-mdejagnu-cpu=power8 -O2 -ftree-vectorize -fvect-cost-model=dynamic -fno-unroll-loops -fno-unroll-all-loops" } */

/* Element count of every test array, unless SIZE was already defined
   (for example on the compiler command line).  */
#if !defined (SIZE)
# define SIZE 1024
#endif

/* Byte alignment requested for every test array, unless ALIGN was
   already defined.  */
#if !defined (ALIGN)
# define ALIGN 32
#endif

#define ALIGN_ATTR __attribute__ ((__aligned__ (ALIGN)))

/* Emit `void PREFIX_NAME (void)', a function that walks the whole
   PREFIX_b array and stores OP (PREFIX_b[k]) into PREFIX_a[k].  The
   loop is kept as a plain counted loop over [0, SIZE).  */
#define DO_LOOP(PREFIX, NAME, OP)					\
void									\
PREFIX ## _ ## NAME (void)						\
{									\
  for (unsigned long idx = 0; idx < SIZE; idx++)			\
    {									\
      PREFIX ## _a[idx] = OP (PREFIX ## _b[idx]);			\
    }									\
}

/* For element type TYPE, emit two file-scope arrays PREFIX_a and
   PREFIX_b of SIZE elements (aligned per ALIGN_ATTR), followed by the
   functions PREFIX_clz and PREFIX_popcnt, which apply CLZ and POPCNT
   respectively to each element of PREFIX_b and store into PREFIX_a.  */
#define DO_BUILTIN(PREFIX, TYPE, CLZ, POPCNT)				\
TYPE PREFIX ## _a[SIZE] ALIGN_ATTR;					\
TYPE PREFIX ## _b[SIZE] ALIGN_ATTR;					\
									\
DO_LOOP (PREFIX, clz, CLZ)						\
									\
DO_LOOP (PREFIX, popcnt, POPCNT)

/* The DO_* selectors choose which element types are instantiated.
   When none of them has been defined, fall back to the int variants.  */
#if defined (DO_LONG_LONG) || defined (DO_LONG) || defined (DO_INT) \
    || defined (DO_SHORT) || defined (DO_CHAR)
/* A selector was supplied; keep it as is.  */
#else
# define DO_INT 1
#endif

/* At the moment, only int is auto vectorized.  */
#if DO_LONG_LONG
DO_BUILTIN (sll, long long,          __builtin_clzll, __builtin_popcountll)
DO_BUILTIN (ull, unsigned long long, __builtin_clzll, __builtin_popcountll)
#endif

/* The long variants are only built when _ARCH_PPC64 is defined.  */
#if DO_LONG && defined (_ARCH_PPC64)
DO_BUILTIN (sl,  long,               __builtin_clzl,  __builtin_popcountl)
DO_BUILTIN (ul,  unsigned long,      __builtin_clzl,  __builtin_popcountl)
#endif

#if DO_INT
DO_BUILTIN (si,  int,                __builtin_clz,   __builtin_popcount)
DO_BUILTIN (ui,  unsigned int,       __builtin_clz,   __builtin_popcount)
#endif

#if DO_SHORT
DO_BUILTIN (ss,  short,              __builtin_clz,   __builtin_popcount)
DO_BUILTIN (us,  unsigned short,     __builtin_clz,   __builtin_popcount)
#endif

#if DO_CHAR
DO_BUILTIN (sc,  signed char,        __builtin_clz,   __builtin_popcount)
DO_BUILTIN (uc,  unsigned char,      __builtin_clz,   __builtin_popcount)
#endif

/* { dg-final { scan-assembler-times "vclzw"     2 } } */
/* { dg-final { scan-assembler-times "vpopcntw"  2 } } */