File: sse2-pinsrw.c

package info (click to toggle)
gcc-arm-none-eabi 15%3A12.2.rel1-1
  • links: PTS, VCS
  • area: main
  • in suites: bookworm
  • size: 959,712 kB
  • sloc: cpp: 3,275,382; ansic: 2,061,766; ada: 840,956; f90: 208,513; makefile: 76,132; asm: 73,433; xml: 50,448; exp: 34,146; sh: 32,436; objc: 15,637; fortran: 14,012; python: 11,991; pascal: 6,787; awk: 4,779; perl: 3,054; yacc: 338; ml: 285; lex: 201; haskell: 122
file content (86 lines) | stat: -rw-r--r-- 1,831 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
/* { dg-do run } */
/* { dg-options "-O3 -mpower8-vector -Wno-psabi" } */
/* { dg-require-effective-target p8vector_hw } */

/* CHECK_H names the support header to include; it defaults to
   "sse2-check.h" unless it was already defined before this point.  */
#ifndef CHECK_H
#define CHECK_H "sse2-check.h"
#endif

#include CHECK_H

/* TEST is the name given to the test function defined below; it defaults
   to sse2_test_pinsrw_1 unless it was already defined before this point.  */
#ifndef TEST
#define TEST sse2_test_pinsrw_1
#endif

#include <emmintrin.h>
#include <string.h>

/* Selector values passed as the third argument of _mm_insert_epi16.
   The test's reference computation uses the same value as an index into
   the eight-element unsigned short view of the vector.  */
#define msk0 0x00
#define msk1 0x01
#define msk2 0x02
#define msk3 0x03
#define msk4 0x04
#define msk5 0x05
#define msk6 0x06
#define msk7 0x07

/* Run-time check of _mm_insert_epi16: insert a halfword into a known
   128-bit pattern and compare the outcome with a reference produced by
   storing the same halfword through the union's unsigned short view.
   Calls abort () on the first mismatch.  */
static void
TEST (void)
{
  union
    {
      __m128i x;
      unsigned int i[4];
      unsigned short s[8];
    } src, got[8], want;
  unsigned short ins[4] = { 3, 4, 5, 6 };
  int masks[8] = { msk0, msk1, msk2, msk3, msk4, msk5, msk6, msk7 };
  int k;

  /* Source pattern: all sixteen bytes are distinct.  */
  src.i[0] = 0x35251505;
  src.i[1] = 0x75655545;
  src.i[2] = 0xB5A59585;
  src.i[3] = 0xF5E5D5C5;

  /* Check pinsrw imm8, r32, xmm: one call per literal selector.  */
  got[0].x = _mm_insert_epi16 (src.x, ins[0], msk0);
  got[1].x = _mm_insert_epi16 (src.x, ins[0], msk1);
  got[2].x = _mm_insert_epi16 (src.x, ins[0], msk2);
  got[3].x = _mm_insert_epi16 (src.x, ins[0], msk3);
  got[4].x = _mm_insert_epi16 (src.x, ins[0], msk4);
  got[5].x = _mm_insert_epi16 (src.x, ins[0], msk5);
  got[6].x = _mm_insert_epi16 (src.x, ins[0], msk6);
  got[7].x = _mm_insert_epi16 (src.x, ins[0], msk7);

  /* Build the expected vector for each selector and compare bytewise.  */
  for (k = 0; k < 8; k++)
    {
      want.x = src.x;
      want.s[masks[k]] = ins[0];
      if (memcmp (&got[k], &want, sizeof (want)) != 0)
        abort ();
    }

  /* Check pinsrw imm8, m16, xmm: the inserted value alternates between
     ins[0] and ins[1], always with selector msk0.  */
  for (k = 0; k < 8; k++)
    {
      const int pick = k % 2;

      got[k].x = _mm_insert_epi16 (src.x, ins[pick], msk0);
      masks[k] = msk0;

      want.x = src.x;
      want.s[masks[k]] = ins[pick];
      if (memcmp (&got[k], &want, sizeof (want)) != 0)
        abort ();
    }
}