Skip to content

Commit

Permalink
InstCountCI: Adds hot block that doesn't generate optimal code
Browse files Browse the repository at this point in the history
  • Loading branch information
Sonicadvance1 committed Dec 11, 2024
1 parent 800d447 commit fb838fd
Show file tree
Hide file tree
Showing 2 changed files with 111 additions and 0 deletions.
41 changes: 41 additions & 0 deletions unittests/InstructionCountCI/FEXOpt/MultiInst.json
Original file line number Diff line number Diff line change
Expand Up @@ -1309,6 +1309,47 @@
"ldr x6, [x8], #8",
"cfinv"
]
},
"Load variables from structs": {
"x86InstructionCount": 7,
"ExpectedInstructionCount": 21,
"Comment": [
"Saw this in 32-bit libvulkan_freedreno.so:tu_cs_begin_sub_stream_aligned",
"Loads a bunch of values from structs passed as arguments",
"Loads failed to use LRCPC2/ldapur with small immediate offset when possible"
],
"x86Insts": [
"mov edi, [ecx + 8]",
"mov edx, [ecx + 4]",
"mov ebx, [ecx]",
"mov esi, [ecx + 0xc]",
"imul edx, edi",
"mov eax, [ebx + 0xc]",
"sub eax, [ebx + 4]"
],
"ExpectedArm64ASM": [
"add x20, x7, #0x8 (8)",
"mov w20, w20",
"ldr w11, [x20]",
"add x20, x7, #0x4 (4)",
"mov w20, w20",
"ldr w5, [x20]",
"mov w20, w7",
"ldr w6, [x20]",
"add x20, x7, #0xc (12)",
"mov w20, w20",
"ldr w10, [x20]",
"mul w5, w5, w11",
"add x20, x6, #0xc (12)",
"mov w20, w20",
"ldr w4, [x20]",
"add x20, x6, #0x4 (4)",
"mov w20, w20",
"ldr w20, [x20]",
"eor w27, w4, w20",
"subs w26, w4, w20",
"mov x4, x26"
]
}
}
}
70 changes: 70 additions & 0 deletions unittests/InstructionCountCI/FEXOpt/MultiInst_TSO.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,70 @@
{
"Features": {
"Bitness": 64,
"EnabledHostFeatures": [
"TSO",
"LRCPC",
"LRCPC2",
"FLAGM",
"FLAGM2"
],
"DisabledHostFeatures": [
"SVE128",
"SVE256",
"RPRES",
"AFP"
]
},
"Comment": [
"These are instruction combinations that could be more optimal if FEX optimized for them"
],
"Instructions": {
"Load variables from structs": {
"x86InstructionCount": 7,
"ExpectedInstructionCount": 27,
"Comment": [
"Saw this in 32-bit libvulkan_freedreno.so:tu_cs_begin_sub_stream_aligned",
"Loads a bunch of values from structs passed as arguments",
"Loads failed to use LRCPC2/ldapur with small immediate offset when possible"
],
"x86Insts": [
"mov edi, [ecx + 8]",
"mov edx, [ecx + 4]",
"mov ebx, [ecx]",
"mov esi, [ecx + 0xc]",
"imul edx, edi",
"mov eax, [ebx + 0xc]",
"sub eax, [ebx + 4]"
],
"ExpectedArm64ASM": [
"add x20, x7, #0x8 (8)",
"mov w20, w20",
"ldapur w11, [x20]",
"nop",
"add x20, x7, #0x4 (4)",
"mov w20, w20",
"ldapur w5, [x20]",
"nop",
"mov w20, w7",
"ldapur w6, [x20]",
"nop",
"add x20, x7, #0xc (12)",
"mov w20, w20",
"ldapur w10, [x20]",
"nop",
"mul w5, w5, w11",
"add x20, x6, #0xc (12)",
"mov w20, w20",
"ldapur w4, [x20]",
"nop",
"add x20, x6, #0x4 (4)",
"mov w20, w20",
"ldapur w20, [x20]",
"nop",
"eor w27, w4, w20",
"subs w26, w4, w20",
"mov x4, x26"
]
}
}
}

0 comments on commit fb838fd

Please sign in to comment.