Skip to content

Commit 1cf3405

Browse files
committed
instcountci: Cache predicate register generation from pattern
1 parent 28c9ea4 commit 1cf3405

File tree

1 file changed

+4
-20
lines changed

1 file changed

+4
-20
lines changed

unittests/InstructionCountCI/X87ldst-SVE.json

Lines changed: 4 additions & 20 deletions
Original file line numberDiff line numberDiff line change
@@ -34,7 +34,7 @@
3434
},
3535
"2-store 80bit": {
3636
"x86InstructionCount": 2,
37-
"ExpectedInstructionCount": 25,
37+
"ExpectedInstructionCount": 24,
3838
"x86Insts": [
3939
"fstp tword [rax]",
4040
"fstp tword [rax+10]"
@@ -56,7 +56,6 @@
5656
"add x21, x4, #0xa (10)",
5757
"add x0, x28, x20, lsl #4",
5858
"ldr q2, [x0, #1040]",
59-
"ptrue p2.h, vl5",
6059
"st1h {z2.h}, p2, [x21]",
6160
"ldrb w21, [x28, #1298]",
6261
"lsl w22, w22, w20",
@@ -69,7 +68,7 @@
6968
},
7069
"8-store 80bit": {
7170
"x86InstructionCount": 8,
72-
"ExpectedInstructionCount": 97,
71+
"ExpectedInstructionCount": 90,
7372
"x86Insts": [
7473
"fstp tword [rax]",
7574
"fstp tword [rax+10]",
@@ -97,7 +96,6 @@
9796
"add x21, x4, #0xa (10)",
9897
"add x0, x28, x20, lsl #4",
9998
"ldr q2, [x0, #1040]",
100-
"ptrue p2.h, vl5",
10199
"st1h {z2.h}, p2, [x21]",
102100
"ldrb w21, [x28, #1298]",
103101
"lsl w23, w22, w20",
@@ -109,7 +107,6 @@
109107
"add x21, x4, #0x14 (20)",
110108
"add x0, x28, x20, lsl #4",
111109
"ldr q2, [x0, #1040]",
112-
"ptrue p2.h, vl5",
113110
"st1h {z2.h}, p2, [x21]",
114111
"ldrb w21, [x28, #1298]",
115112
"lsl w23, w22, w20",
@@ -121,7 +118,6 @@
121118
"add x21, x4, #0x1e (30)",
122119
"add x0, x28, x20, lsl #4",
123120
"ldr q2, [x0, #1040]",
124-
"ptrue p2.h, vl5",
125121
"st1h {z2.h}, p2, [x21]",
126122
"ldrb w21, [x28, #1298]",
127123
"lsl w23, w22, w20",
@@ -133,7 +129,6 @@
133129
"add x21, x4, #0x28 (40)",
134130
"add x0, x28, x20, lsl #4",
135131
"ldr q2, [x0, #1040]",
136-
"ptrue p2.h, vl5",
137132
"st1h {z2.h}, p2, [x21]",
138133
"ldrb w21, [x28, #1298]",
139134
"lsl w23, w22, w20",
@@ -145,7 +140,6 @@
145140
"add x21, x4, #0x32 (50)",
146141
"add x0, x28, x20, lsl #4",
147142
"ldr q2, [x0, #1040]",
148-
"ptrue p2.h, vl5",
149143
"st1h {z2.h}, p2, [x21]",
150144
"ldrb w21, [x28, #1298]",
151145
"lsl w23, w22, w20",
@@ -157,7 +151,6 @@
157151
"add x21, x4, #0x3c (60)",
158152
"add x0, x28, x20, lsl #4",
159153
"ldr q2, [x0, #1040]",
160-
"ptrue p2.h, vl5",
161154
"st1h {z2.h}, p2, [x21]",
162155
"ldrb w21, [x28, #1298]",
163156
"lsl w23, w22, w20",
@@ -169,7 +162,6 @@
169162
"add x21, x4, #0x46 (70)",
170163
"add x0, x28, x20, lsl #4",
171164
"ldr q2, [x0, #1040]",
172-
"ptrue p2.h, vl5",
173165
"st1h {z2.h}, p2, [x21]",
174166
"ldrb w21, [x28, #1298]",
175167
"lsl w22, w22, w20",
@@ -201,7 +193,7 @@
201193
},
202194
"2-load 80bit": {
203195
"x86InstructionCount": 2,
204-
"ExpectedInstructionCount": 22,
196+
"ExpectedInstructionCount": 21,
205197
"x86Insts": [
206198
"fld tword [rax]",
207199
"fld tword [rax+10]"
@@ -210,7 +202,6 @@
210202
"ptrue p2.h, vl5",
211203
"ld1h {z2.h}, p2/z, [x4]",
212204
"add x20, x4, #0xa (10)",
213-
"ptrue p2.h, vl5",
214205
"ld1h {z3.h}, p2/z, [x20]",
215206
"ldrb w20, [x28, #1019]",
216207
"sub w20, w20, #0x2 (2)",
@@ -233,7 +224,7 @@
233224
},
234225
"8-load 80bit": {
235226
"x86InstructionCount": 8,
236-
"ExpectedInstructionCount": 59,
227+
"ExpectedInstructionCount": 52,
237228
"x86Insts": [
238229
"fld tword [rax]",
239230
"fld tword [rax+10]",
@@ -248,25 +239,18 @@
248239
"ptrue p2.h, vl5",
249240
"ld1h {z2.h}, p2/z, [x4]",
250241
"add x20, x4, #0xa (10)",
251-
"ptrue p2.h, vl5",
252242
"ld1h {z3.h}, p2/z, [x20]",
253243
"add x20, x4, #0x14 (20)",
254-
"ptrue p2.h, vl5",
255244
"ld1h {z4.h}, p2/z, [x20]",
256245
"add x20, x4, #0x1e (30)",
257-
"ptrue p2.h, vl5",
258246
"ld1h {z5.h}, p2/z, [x20]",
259247
"add x20, x4, #0x28 (40)",
260-
"ptrue p2.h, vl5",
261248
"ld1h {z6.h}, p2/z, [x20]",
262249
"add x20, x4, #0x32 (50)",
263-
"ptrue p2.h, vl5",
264250
"ld1h {z7.h}, p2/z, [x20]",
265251
"add x20, x4, #0x3c (60)",
266-
"ptrue p2.h, vl5",
267252
"ld1h {z8.h}, p2/z, [x20]",
268253
"add x20, x4, #0x46 (70)",
269-
"ptrue p2.h, vl5",
270254
"ld1h {z9.h}, p2/z, [x20]",
271255
"ldrb w20, [x28, #1019]",
272256
"sub w20, w20, #0x8 (8)",

0 commit comments

Comments
 (0)