Skip to content

Commit

Permalink
instcount: Ensure predicate cache is reset when control flow leaves b…
Browse files Browse the repository at this point in the history
…lock
  • Loading branch information
pmatos committed Jan 27, 2025
1 parent 3dc7b8d commit ddd241f
Showing 1 changed file with 6 additions and 28 deletions.
34 changes: 6 additions & 28 deletions unittests/InstructionCountCI/X87ldst-SVE.json
Original file line number Diff line number Diff line change
Expand Up @@ -14,13 +14,12 @@
},
"Instructions": {
"fstp tword [rax]": {
"ExpectedInstructionCount": 13,
"ExpectedInstructionCount": 12,
"Comment": "Single 80-bit store.",
"ExpectedArm64ASM": [
"ldrb w20, [x28, #1019]",
"add x0, x28, x20, lsl #4",
"ldr q2, [x0, #1040]",
"ptrue p2.h, vl5",
"st1h {z2.h}, p2, [x4]",
"ldrb w21, [x28, #1298]",
"mov w22, #0x1",
Expand All @@ -34,7 +33,7 @@
},
"2-store 80bit": {
"x86InstructionCount": 2,
"ExpectedInstructionCount": 25,
"ExpectedInstructionCount": 23,
"x86Insts": [
"fstp tword [rax]",
"fstp tword [rax+10]"
Expand All @@ -43,7 +42,6 @@
"ldrb w20, [x28, #1019]",
"add x0, x28, x20, lsl #4",
"ldr q2, [x0, #1040]",
"ptrue p2.h, vl5",
"st1h {z2.h}, p2, [x4]",
"ldrb w21, [x28, #1298]",
"mov w22, #0x1",
Expand All @@ -55,7 +53,6 @@
"strb w20, [x28, #1019]",
"add x0, x28, x20, lsl #4",
"ldr q2, [x0, #1040]",
"ptrue p2.h, vl5",
"add x21, x4, #0xa (10)",
"st1h {z2.h}, p2, [x21]",
"ldrb w21, [x28, #1298]",
Expand All @@ -69,7 +66,7 @@
},
"8-store 80bit": {
"x86InstructionCount": 8,
"ExpectedInstructionCount": 97,
"ExpectedInstructionCount": 89,
"x86Insts": [
"fstp tword [rax]",
"fstp tword [rax+10]",
Expand All @@ -84,7 +81,6 @@
"ldrb w20, [x28, #1019]",
"add x0, x28, x20, lsl #4",
"ldr q2, [x0, #1040]",
"ptrue p2.h, vl5",
"st1h {z2.h}, p2, [x4]",
"ldrb w21, [x28, #1298]",
"mov w22, #0x1",
Expand All @@ -96,7 +92,6 @@
"strb w20, [x28, #1019]",
"add x0, x28, x20, lsl #4",
"ldr q2, [x0, #1040]",
"ptrue p2.h, vl5",
"add x21, x4, #0xa (10)",
"st1h {z2.h}, p2, [x21]",
"ldrb w21, [x28, #1298]",
Expand All @@ -108,7 +103,6 @@
"strb w20, [x28, #1019]",
"add x0, x28, x20, lsl #4",
"ldr q2, [x0, #1040]",
"ptrue p2.h, vl5",
"add x21, x4, #0x14 (20)",
"st1h {z2.h}, p2, [x21]",
"ldrb w21, [x28, #1298]",
Expand All @@ -120,7 +114,6 @@
"strb w20, [x28, #1019]",
"add x0, x28, x20, lsl #4",
"ldr q2, [x0, #1040]",
"ptrue p2.h, vl5",
"add x21, x4, #0x1e (30)",
"st1h {z2.h}, p2, [x21]",
"ldrb w21, [x28, #1298]",
Expand All @@ -132,7 +125,6 @@
"strb w20, [x28, #1019]",
"add x0, x28, x20, lsl #4",
"ldr q2, [x0, #1040]",
"ptrue p2.h, vl5",
"add x21, x4, #0x28 (40)",
"st1h {z2.h}, p2, [x21]",
"ldrb w21, [x28, #1298]",
Expand All @@ -144,7 +136,6 @@
"strb w20, [x28, #1019]",
"add x0, x28, x20, lsl #4",
"ldr q2, [x0, #1040]",
"ptrue p2.h, vl5",
"add x21, x4, #0x32 (50)",
"st1h {z2.h}, p2, [x21]",
"ldrb w21, [x28, #1298]",
Expand All @@ -156,7 +147,6 @@
"strb w20, [x28, #1019]",
"add x0, x28, x20, lsl #4",
"ldr q2, [x0, #1040]",
"ptrue p2.h, vl5",
"add x21, x4, #0x3c (60)",
"st1h {z2.h}, p2, [x21]",
"ldrb w21, [x28, #1298]",
Expand All @@ -168,7 +158,6 @@
"strb w20, [x28, #1019]",
"add x0, x28, x20, lsl #4",
"ldr q2, [x0, #1040]",
"ptrue p2.h, vl5",
"add x21, x4, #0x46 (70)",
"st1h {z2.h}, p2, [x21]",
"ldrb w21, [x28, #1298]",
Expand All @@ -181,10 +170,9 @@
]
},
"fld tword [rax]": {
"ExpectedInstructionCount": 13,
"ExpectedInstructionCount": 12,
"Comment": "Single 80-bit store.",
"ExpectedArm64ASM": [
"ptrue p2.h, vl5",
"ld1h {z2.h}, p2/z, [x4]",
"ldrb w20, [x28, #1019]",
"mov w21, #0x1",
Expand All @@ -201,16 +189,14 @@
},
"2-load 80bit": {
"x86InstructionCount": 2,
"ExpectedInstructionCount": 22,
"ExpectedInstructionCount": 20,
"x86Insts": [
"fld tword [rax]",
"fld tword [rax+10]"
],
"ExpectedArm64ASM": [
"ptrue p2.h, vl5",
"ld1h {z2.h}, p2/z, [x4]",
"add x20, x4, #0xa (10)",
"ptrue p2.h, vl5",
"ld1h {z3.h}, p2/z, [x20]",
"ldrb w20, [x28, #1019]",
"sub w20, w20, #0x2 (2)",
Expand All @@ -233,7 +219,7 @@
},
"8-load 80bit": {
"x86InstructionCount": 8,
"ExpectedInstructionCount": 59,
"ExpectedInstructionCount": 51,
"x86Insts": [
"fld tword [rax]",
"fld tword [rax+10]",
Expand All @@ -245,28 +231,20 @@
"fld tword [rax+70]"
],
"ExpectedArm64ASM": [
"ptrue p2.h, vl5",
"ld1h {z2.h}, p2/z, [x4]",
"add x20, x4, #0xa (10)",
"ptrue p2.h, vl5",
"ld1h {z3.h}, p2/z, [x20]",
"add x20, x4, #0x14 (20)",
"ptrue p2.h, vl5",
"ld1h {z4.h}, p2/z, [x20]",
"add x20, x4, #0x1e (30)",
"ptrue p2.h, vl5",
"ld1h {z5.h}, p2/z, [x20]",
"add x20, x4, #0x28 (40)",
"ptrue p2.h, vl5",
"ld1h {z6.h}, p2/z, [x20]",
"add x20, x4, #0x32 (50)",
"ptrue p2.h, vl5",
"ld1h {z7.h}, p2/z, [x20]",
"add x20, x4, #0x3c (60)",
"ptrue p2.h, vl5",
"ld1h {z8.h}, p2/z, [x20]",
"add x20, x4, #0x46 (70)",
"ptrue p2.h, vl5",
"ld1h {z9.h}, p2/z, [x20]",
"ldrb w20, [x28, #1019]",
"sub w20, w20, #0x8 (8)",
Expand Down

0 comments on commit ddd241f

Please sign in to comment.