File: matrix-multiply-int8.s

package info (click to toggle)
llvm-toolchain-13 1%3A13.0.1-11
  • links: PTS, VCS
  • area: main
  • in suites: bookworm
  • size: 1,418,840 kB
  • sloc: cpp: 5,290,826; ansic: 996,570; asm: 544,593; python: 188,212; objc: 72,027; lisp: 30,291; f90: 25,395; sh: 24,898; javascript: 9,780; pascal: 9,398; perl: 7,484; ml: 5,432; awk: 3,523; makefile: 2,913; xml: 953; cs: 573; fortran: 539
file content (129 lines) | stat: -rw-r--r-- 4,094 bytes parent folder | download | duplicates (5)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
// This test is driven by the four pipelines below, in order:
//   1. Assemble with +sve,+i8mm and -show-encoding; the printed output is
//      matched against the CHECK-ENCODING and CHECK-INST expectations.
//   2. Assemble with +sve only. `not` requires llvm-mc to fail, and its
//      diagnostics (stderr merged into stdout) are matched against the
//      CHECK-ERROR expectations.
//   3. Assemble to an object file and disassemble it with llvm-objdump given
//      +sve,+i8mm; matched against the CHECK-INST expectations.
//   4. Assemble to an object file the same way, but disassemble with
//      llvm-objdump given no --mattr; matched against the CHECK-UNKNOWN
//      expectations.
// RUN: llvm-mc -triple=aarch64 -show-encoding -mattr=+sve,+i8mm < %s \
// RUN:        | FileCheck %s --check-prefixes=CHECK-ENCODING,CHECK-INST
// RUN: not llvm-mc -triple=aarch64 -show-encoding -mattr=+sve < %s 2>&1 \
// RUN:        | FileCheck %s --check-prefix=CHECK-ERROR
// RUN: llvm-mc -triple=aarch64 -filetype=obj -mattr=+sve,+i8mm < %s \
// RUN:        | llvm-objdump -d --mattr=+sve,+i8mm - | FileCheck %s --check-prefix=CHECK-INST
// RUN: llvm-mc -triple=aarch64 -filetype=obj -mattr=+sve,+i8mm < %s \
// RUN:        | llvm-objdump -d - | FileCheck %s --check-prefix=CHECK-UNKNOWN


// --------------------------------------------------------------------------//
// SMMLA, UMMLA, USMMLA (SVE)
//
// All three mnemonics are given the same operands (z0.s, z1.b, z2.b); their
// expected encodings differ only in the third byte (0xc2, 0x02, 0x82).
// Each instruction is followed by four expectations: the printed instruction,
// the encoding bytes, the diagnostic expected when i8mm is not enabled, and
// the disassembly expected when llvm-objdump is run without --mattr.

ummla z0.s, z1.b, z2.b
// CHECK-INST: ummla z0.s, z1.b, z2.b
// CHECK-ENCODING: [0x20,0x98,0xc2,0x45]
// CHECK-ERROR: instruction requires: i8mm
// CHECK-UNKNOWN: 20 98 c2 45 <unknown>

smmla z0.s, z1.b, z2.b
// CHECK-INST: smmla z0.s, z1.b, z2.b
// CHECK-ENCODING: [0x20,0x98,0x02,0x45]
// CHECK-ERROR: instruction requires: i8mm
// CHECK-UNKNOWN: 20 98 02 45 <unknown>

usmmla z0.s, z1.b, z2.b
// CHECK-INST: usmmla z0.s, z1.b, z2.b
// CHECK-ENCODING: [0x20,0x98,0x82,0x45]
// CHECK-ERROR: instruction requires: i8mm
// CHECK-UNKNOWN: 20 98 82 45 <unknown>


// Test compatibility with MOVPRFX instruction.
//
// Each of UMMLA, SMMLA and USMMLA is repeated directly after
// `movprfx z0, z7`, whose destination register (z0) is also the destination
// of the instruction that follows it. The expected encodings are the same as
// for the un-prefixed forms earlier in this file.
// The movprfx entries have no error expectation; presumably movprfx needs
// only +sve, which the error run still enables -- TODO confirm.
// NOTE(review): the movprfx CHECK-INST patterns separate mnemonic and operands
// with a tab while the other patterns use a space. None of the FileCheck
// invocations in this file request strict whitespace matching.

movprfx z0, z7
// CHECK-INST: movprfx	z0, z7
// CHECK-ENCODING: [0xe0,0xbc,0x20,0x04]
// CHECK-UNKNOWN: e0 bc 20 04 <unknown>

ummla z0.s, z1.b, z2.b
// CHECK-INST: ummla z0.s, z1.b, z2.b
// CHECK-ENCODING: [0x20,0x98,0xc2,0x45]
// CHECK-ERROR: instruction requires: i8mm
// CHECK-UNKNOWN: 20 98 c2 45 <unknown>

movprfx z0, z7
// CHECK-INST: movprfx	z0, z7
// CHECK-ENCODING: [0xe0,0xbc,0x20,0x04]
// CHECK-UNKNOWN: e0 bc 20 04 <unknown>

smmla z0.s, z1.b, z2.b
// CHECK-INST: smmla z0.s, z1.b, z2.b
// CHECK-ENCODING: [0x20,0x98,0x02,0x45]
// CHECK-ERROR: instruction requires: i8mm
// CHECK-UNKNOWN: 20 98 02 45 <unknown>

movprfx z0, z7
// CHECK-INST: movprfx	z0, z7
// CHECK-ENCODING: [0xe0,0xbc,0x20,0x04]
// CHECK-UNKNOWN: e0 bc 20 04 <unknown>

usmmla z0.s, z1.b, z2.b
// CHECK-INST: usmmla z0.s, z1.b, z2.b
// CHECK-ENCODING: [0x20,0x98,0x82,0x45]
// CHECK-ERROR: instruction requires: i8mm
// CHECK-UNKNOWN: 20 98 82 45 <unknown>


// --------------------------------------------------------------------------//
// USDOT (SVE, vectors)
//
// The vector form (no element index on the last operand) is checked twice:
// once on its own, and once directly after a movprfx that writes the same
// destination register (z0). Both occurrences expect the same encoding.

usdot z0.s, z1.b, z2.b
// CHECK-INST: usdot z0.s, z1.b, z2.b
// CHECK-ENCODING: [0x20,0x78,0x82,0x44]
// CHECK-ERROR: instruction requires: i8mm
// CHECK-UNKNOWN: 20 78 82 44 <unknown>

// Test compatibility with MOVPRFX instruction.

movprfx z0, z7
// CHECK-INST: movprfx	z0, z7
// CHECK-ENCODING: [0xe0,0xbc,0x20,0x04]
// CHECK-UNKNOWN: e0 bc 20 04 <unknown>

usdot z0.s, z1.b, z2.b
// CHECK-INST: usdot z0.s, z1.b, z2.b
// CHECK-ENCODING: [0x20,0x78,0x82,0x44]
// CHECK-ERROR: instruction requires: i8mm
// CHECK-UNKNOWN: 20 78 82 44 <unknown>


// --------------------------------------------------------------------------//
// USDOT, SUDOT (SVE, indexed)
//
// Indexed forms: the last operand carries an element index (z2.b[N]).
// USDOT is checked with index 0. SUDOT is checked with index 3 here and with
// index 0 in the movprfx section below; the two SUDOT expectations differ
// only in the third encoding byte (0xba for [3], 0xa2 for [0]).

usdot z0.s, z1.b, z2.b[0]
// CHECK-INST: usdot z0.s, z1.b, z2.b[0]
// CHECK-ENCODING: [0x20,0x18,0xa2,0x44]
// CHECK-ERROR: instruction requires: i8mm
// CHECK-UNKNOWN: 20 18 a2 44 <unknown>

sudot z0.s, z1.b, z2.b[3]
// CHECK-INST: sudot z0.s, z1.b, z2.b[3]
// CHECK-ENCODING: [0x20,0x1c,0xba,0x44]
// CHECK-ERROR: instruction requires: i8mm
// CHECK-UNKNOWN: 20 1c ba 44 <unknown>

// Test compatibility with MOVPRFX instruction.
// Each indexed instruction directly follows a movprfx that writes the same
// destination register (z0).

movprfx z0, z7
// CHECK-INST: movprfx	z0, z7
// CHECK-ENCODING: [0xe0,0xbc,0x20,0x04]
// CHECK-UNKNOWN: e0 bc 20 04 <unknown>

usdot z0.s, z1.b, z2.b[0]
// CHECK-INST: usdot z0.s, z1.b, z2.b[0]
// CHECK-ENCODING: [0x20,0x18,0xa2,0x44]
// CHECK-ERROR: instruction requires: i8mm
// CHECK-UNKNOWN: 20 18 a2 44 <unknown>

movprfx z0, z7
// CHECK-INST: movprfx	z0, z7
// CHECK-ENCODING: [0xe0,0xbc,0x20,0x04]
// CHECK-UNKNOWN: e0 bc 20 04 <unknown>

sudot z0.s, z1.b, z2.b[0]
// CHECK-INST: sudot z0.s, z1.b, z2.b[0]
// CHECK-ENCODING: [0x20,0x1c,0xa2,0x44]
// CHECK-ERROR: instruction requires: i8mm
// CHECK-UNKNOWN: 20 1c a2 44 <unknown>