File: amx-transpose-intel.s

package info (click to toggle)
llvm-toolchain-21 1%3A21.1.6-3
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 2,245,028 kB
  • sloc: cpp: 7,619,726; ansic: 1,434,018; asm: 1,058,748; python: 252,740; f90: 94,671; objc: 70,685; lisp: 42,813; pascal: 18,401; sh: 8,601; ml: 5,111; perl: 4,720; makefile: 3,675; awk: 3,523; javascript: 2,409; xml: 892; fortran: 770
file content (153 lines) | stat: -rw-r--r-- 6,177 bytes parent folder | download | duplicates (5)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
// Test driver. lit executes the command below: llvm-mc assembles this file
// for the x86_64-unknown-unknown triple, parsing the input as Intel syntax
// (-x86-asm-syntax=intel), printing with -output-asm-variant=1 (the expected
// text below is Intel-syntax) and appending the encoded bytes of every
// instruction (--show-encoding). FileCheck then matches that output against
// the expected-output directives in this file, in the order they appear.
// RUN: llvm-mc -triple x86_64-unknown-unknown -x86-asm-syntax=intel -output-asm-variant=1 --show-encoding %s | FileCheck %s

// ---------------------------------------------------------------------------
// t2rpntlvwz0 / t2rpntlvwz0t1 / t2rpntlvwz1 / t2rpntlvwz1t1, memory operand,
// encodings that start with 0xc4 (three-byte VEX form).
//
// Each case is a triple: expected printed text, expected encoding bytes, and
// the input instruction. Every mnemonic is exercised with the same three
// addressing shapes:
//   * base + 8*index + 32-bit displacement, index = r14
//   * base + 4*index + small displacement,  base  = r8
//   * 2*index with no base and a negative displacement
//
// Patterns visible in the expected bytes:
//   * 4th byte is 0x6e for the plain forms and 0x6f for the "t1" forms.
//   * 3rd byte is 0x78 for the "z0" forms and 0x79 for the "z1" forms.
// ---------------------------------------------------------------------------
// CHECK: t2rpntlvwz0     tmm6, [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0xc4,0xa2,0x78,0x6e,0xb4,0xf5,0x00,0x00,0x00,0x10]
          t2rpntlvwz0 tmm6, [rbp + 8*r14 + 268435456]

// CHECK: t2rpntlvwz0     tmm2, [r8 + 4*rax + 291]
// CHECK: encoding: [0xc4,0xc2,0x78,0x6e,0x94,0x80,0x23,0x01,0x00,0x00]
          t2rpntlvwz0 tmm2, [r8 + 4*rax + 291]

// CHECK: t2rpntlvwz0     tmm2, [2*rbp - 32]
// CHECK: encoding: [0xc4,0xe2,0x78,0x6e,0x14,0x6d,0xe0,0xff,0xff,0xff]
          t2rpntlvwz0 tmm2, [2*rbp - 32]

// NOTE(review): the input below names tmm7 while the expected text names
// tmm6. The expected ModRM byte 0xb4 (0b10_110_100) carries reg=6, so the
// expected text and bytes agree with each other. Presumably the assembler
// canonicalizes an odd tile register to the even register of its pair for
// these instructions, and this case covers that - confirm against the X86
// asm parser before "fixing" the operand.
// CHECK: t2rpntlvwz0t1     tmm6, [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0xc4,0xa2,0x78,0x6f,0xb4,0xf5,0x00,0x00,0x00,0x10]
          t2rpntlvwz0t1 tmm7, [rbp + 8*r14 + 268435456]

// CHECK: t2rpntlvwz0t1     tmm2, [r8 + 4*rax + 291]
// CHECK: encoding: [0xc4,0xc2,0x78,0x6f,0x94,0x80,0x23,0x01,0x00,0x00]
          t2rpntlvwz0t1 tmm2, [r8 + 4*rax + 291]

// CHECK: t2rpntlvwz0t1     tmm2, [2*rbp - 32]
// CHECK: encoding: [0xc4,0xe2,0x78,0x6f,0x14,0x6d,0xe0,0xff,0xff,0xff]
          t2rpntlvwz0t1 tmm2, [2*rbp - 32]

// NOTE(review): same shape as the tmm7 case above - the input names tmm1,
// the expected text names tmm0, and the expected ModRM byte 0x84
// (0b10_000_100) carries reg=0. Presumably intentional odd-to-even pair
// canonicalization; confirm before changing.
// CHECK: t2rpntlvwz1     tmm0, [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0xc4,0xa2,0x79,0x6e,0x84,0xf5,0x00,0x00,0x00,0x10]
          t2rpntlvwz1 tmm1, [rbp + 8*r14 + 268435456]

// CHECK: t2rpntlvwz1     tmm2, [r8 + 4*rax + 291]
// CHECK: encoding: [0xc4,0xc2,0x79,0x6e,0x94,0x80,0x23,0x01,0x00,0x00]
          t2rpntlvwz1 tmm2, [r8 + 4*rax + 291]

// CHECK: t2rpntlvwz1     tmm2, [2*rbp - 32]
// CHECK: encoding: [0xc4,0xe2,0x79,0x6e,0x14,0x6d,0xe0,0xff,0xff,0xff]
          t2rpntlvwz1 tmm2, [2*rbp - 32]

// CHECK: t2rpntlvwz1t1     tmm6, [rbp + 8*r14 + 268435456]
// CHECK: encoding: [0xc4,0xa2,0x79,0x6f,0xb4,0xf5,0x00,0x00,0x00,0x10]
          t2rpntlvwz1t1 tmm6, [rbp + 8*r14 + 268435456]

// CHECK: t2rpntlvwz1t1     tmm2, [r8 + 4*rax + 291]
// CHECK: encoding: [0xc4,0xc2,0x79,0x6f,0x94,0x80,0x23,0x01,0x00,0x00]
          t2rpntlvwz1t1 tmm2, [r8 + 4*rax + 291]

// CHECK: t2rpntlvwz1t1     tmm2, [2*rbp - 32]
// CHECK: encoding: [0xc4,0xe2,0x79,0x6f,0x14,0x6d,0xe0,0xff,0xff,0xff]
          t2rpntlvwz1t1 tmm2, [2*rbp - 32]

// ---------------------------------------------------------------------------
// t2rpntlvwz0 / t2rpntlvwz0t1 / t2rpntlvwz1 / t2rpntlvwz1t1, memory operand,
// encodings that start with 0x62 (EVEX form).
//
// The same four mnemonics as the 0xc4-prefixed cases, but each is reached in
// one of three ways:
//   * r16 as the base register
//   * r17 as the index register
//   * an explicit {evex} pseudo-prefix on an operand that otherwise uses only
//     rbp (the expected text keeps the {evex} marker)
//
// Patterns visible in the expected bytes:
//   * 5th byte is 0x6e for the plain forms and 0x6f for the "t1" forms.
//   * 3rd byte is 0x7c or 0x78 for "z0" forms and 0x7d or 0x79 for "z1"
//     forms; the 0x78/0x79 values appear only in the r17-index cases.
// ---------------------------------------------------------------------------
// CHECK: t2rpntlvwz0     tmm4, [r16 + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xba,0x7c,0x08,0x6e,0xa4,0xf0,0x00,0x00,0x00,0x10]
          t2rpntlvwz0 tmm4, [r16 + 8*r14 + 268435456]

// CHECK: t2rpntlvwz0     tmm2, [r8 + 4*r17 + 291]
// CHECK: encoding: [0x62,0xd2,0x78,0x08,0x6e,0x94,0x88,0x23,0x01,0x00,0x00]
          t2rpntlvwz0 tmm2, [r8 + 4*r17 + 291]

// CHECK: {evex} t2rpntlvwz0     tmm2, [2*rbp - 32]
// CHECK: encoding: [0x62,0xf2,0x7c,0x08,0x6e,0x14,0x6d,0xe0,0xff,0xff,0xff]
          {evex} t2rpntlvwz0 tmm2, [2*rbp - 32]

// CHECK: t2rpntlvwz0t1     tmm4, [r16 + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xba,0x7c,0x08,0x6f,0xa4,0xf0,0x00,0x00,0x00,0x10]
          t2rpntlvwz0t1 tmm4, [r16 + 8*r14 + 268435456]

// CHECK: t2rpntlvwz0t1     tmm2, [r8 + 4*r17 + 291]
// CHECK: encoding: [0x62,0xd2,0x78,0x08,0x6f,0x94,0x88,0x23,0x01,0x00,0x00]
          t2rpntlvwz0t1 tmm2, [r8 + 4*r17 + 291]

// CHECK: {evex} t2rpntlvwz0t1     tmm2, [2*rbp - 32]
// CHECK: encoding: [0x62,0xf2,0x7c,0x08,0x6f,0x14,0x6d,0xe0,0xff,0xff,0xff]
          {evex} t2rpntlvwz0t1 tmm2, [2*rbp - 32]

// CHECK: t2rpntlvwz1     tmm4, [r16 + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xba,0x7d,0x08,0x6e,0xa4,0xf0,0x00,0x00,0x00,0x10]
          t2rpntlvwz1 tmm4, [r16 + 8*r14 + 268435456]

// CHECK: t2rpntlvwz1     tmm2, [r8 + 4*r17 + 291]
// CHECK: encoding: [0x62,0xd2,0x79,0x08,0x6e,0x94,0x88,0x23,0x01,0x00,0x00]
          t2rpntlvwz1 tmm2, [r8 + 4*r17 + 291]

// CHECK: {evex} t2rpntlvwz1     tmm2, [2*rbp - 32]
// CHECK: encoding: [0x62,0xf2,0x7d,0x08,0x6e,0x14,0x6d,0xe0,0xff,0xff,0xff]
          {evex} t2rpntlvwz1 tmm2, [2*rbp - 32]

// CHECK: t2rpntlvwz1t1     tmm4, [r16 + 8*r14 + 268435456]
// CHECK: encoding: [0x62,0xba,0x7d,0x08,0x6f,0xa4,0xf0,0x00,0x00,0x00,0x10]
          t2rpntlvwz1t1 tmm4, [r16 + 8*r14 + 268435456]

// CHECK: t2rpntlvwz1t1     tmm2, [r8 + 4*r17 + 291]
// CHECK: encoding: [0x62,0xd2,0x79,0x08,0x6f,0x94,0x88,0x23,0x01,0x00,0x00]
          t2rpntlvwz1t1 tmm2, [r8 + 4*r17 + 291]

// CHECK: {evex} t2rpntlvwz1t1     tmm2, [2*rbp - 32]
// CHECK: encoding: [0x62,0xf2,0x7d,0x08,0x6f,0x14,0x6d,0xe0,0xff,0xff,0xff]
          {evex} t2rpntlvwz1t1 tmm2, [2*rbp - 32]

// ---------------------------------------------------------------------------
// ttransposed, two tile-register operands.
//
// Both cases share the prefix bytes 0xc4,0xe2,0x7a and the byte 0x5f; only
// the final byte changes with the operands (0xe9 for tmm5,tmm1 and 0xda for
// tmm3,tmm2), i.e. both registers are carried in that last byte.
// ---------------------------------------------------------------------------
// CHECK: ttransposed     tmm5, tmm1
// CHECK: encoding: [0xc4,0xe2,0x7a,0x5f,0xe9]
          ttransposed tmm5, tmm1

// CHECK: ttransposed     tmm3, tmm2
// CHECK: encoding: [0xc4,0xe2,0x7a,0x5f,0xda]
          ttransposed tmm3, tmm2

// ---------------------------------------------------------------------------
// ttdpbf16ps / ttdpfp16ps, three tile-register operands.
//
// Both mnemonics use the byte 0x6c in the 4th position and differ only in
// the 3rd byte: for the same last operand, ttdpbf16ps has 0x5a / 0x72 where
// ttdpfp16ps has 0x5b / 0x73. The 3rd byte also changes with the last
// operand (0x5a/0x5b for tmm4, 0x72/0x73 for tmm1), while the final byte
// tracks the first two operands.
// ---------------------------------------------------------------------------
// CHECK: ttdpbf16ps     tmm5, tmm0, tmm4
// CHECK: encoding: [0xc4,0xe2,0x5a,0x6c,0xe8]
          ttdpbf16ps tmm5, tmm0, tmm4

// CHECK: ttdpbf16ps     tmm3, tmm2, tmm1
// CHECK: encoding: [0xc4,0xe2,0x72,0x6c,0xda]
          ttdpbf16ps tmm3, tmm2, tmm1

// CHECK: ttdpfp16ps     tmm1, tmm0, tmm4
// CHECK: encoding: [0xc4,0xe2,0x5b,0x6c,0xc8]
          ttdpfp16ps tmm1, tmm0, tmm4

// CHECK: ttdpfp16ps     tmm3, tmm2, tmm1
// CHECK: encoding: [0xc4,0xe2,0x73,0x6c,0xda]
          ttdpfp16ps tmm3, tmm2, tmm1

// ---------------------------------------------------------------------------
// ttcmmimfp16ps / ttcmmrlfp16ps, three tile-register operands.
//
// Both mnemonics use the byte 0x6b in the 4th position and are told apart by
// the 3rd byte: for identical operands, ttcmmimfp16ps has 0x5b / 0x73 where
// ttcmmrlfp16ps has 0x5a / 0x72. Each mnemonic is checked with the same two
// operand sets (tmm6,tmm5,tmm4 and tmm3,tmm2,tmm1).
// ---------------------------------------------------------------------------
// CHECK: ttcmmimfp16ps tmm6, tmm5, tmm4
// CHECK: encoding: [0xc4,0xe2,0x5b,0x6b,0xf5]
          ttcmmimfp16ps tmm6, tmm5, tmm4

// CHECK: ttcmmimfp16ps tmm3, tmm2, tmm1
// CHECK: encoding: [0xc4,0xe2,0x73,0x6b,0xda]
          ttcmmimfp16ps tmm3, tmm2, tmm1

// CHECK: ttcmmrlfp16ps tmm6, tmm5, tmm4
// CHECK: encoding: [0xc4,0xe2,0x5a,0x6b,0xf5]
          ttcmmrlfp16ps tmm6, tmm5, tmm4

// CHECK: ttcmmrlfp16ps tmm3, tmm2, tmm1
// CHECK: encoding: [0xc4,0xe2,0x72,0x6b,0xda]
          ttcmmrlfp16ps tmm3, tmm2, tmm1

// ---------------------------------------------------------------------------
// tconjtcmmimfp16ps (three tile operands) / tconjtfp16 (two tile operands).
//
// Both mnemonics use the byte 0x6b in the 4th position. For the
// three-operand form the 3rd byte changes with the last operand (0x58 for
// tmm4, 0x70 for tmm1); for the two-operand form the 3rd byte is 0x79 in
// both cases and only the final byte changes with the operands.
// ---------------------------------------------------------------------------
// CHECK: tconjtcmmimfp16ps tmm6, tmm5, tmm4
// CHECK: encoding: [0xc4,0xe2,0x58,0x6b,0xf5]
          tconjtcmmimfp16ps tmm6, tmm5, tmm4

// CHECK: tconjtcmmimfp16ps tmm3, tmm2, tmm1
// CHECK: encoding: [0xc4,0xe2,0x70,0x6b,0xda]
          tconjtcmmimfp16ps tmm3, tmm2, tmm1

// CHECK: tconjtfp16 tmm6, tmm5
// CHECK: encoding: [0xc4,0xe2,0x79,0x6b,0xf5]
          tconjtfp16 tmm6, tmm5

// CHECK: tconjtfp16 tmm3, tmm2
// CHECK: encoding: [0xc4,0xe2,0x79,0x6b,0xda]
          tconjtfp16 tmm3, tmm2