diff --git a/unittests/InstructionCountCI/FEXOpt/MultiInst.json b/unittests/InstructionCountCI/FEXOpt/MultiInst.json index 5c8d068139..6102c7e8be 100644 --- a/unittests/InstructionCountCI/FEXOpt/MultiInst.json +++ b/unittests/InstructionCountCI/FEXOpt/MultiInst.json @@ -1309,6 +1309,47 @@ "ldr x6, [x8], #8", "cfinv" ] + }, + "Load variables from structs": { + "x86InstructionCount": 7, + "ExpectedInstructionCount": 21, + "Comment": [ + "Saw this in 32-bit libvulkan_freedreno.so:tu_cs_begin_sub_stream_aligned", + "Loads a bunch of values from structs passed as arguments", + "Loads failed to use LRCPC2/ldapur with small immediate offset when possible" + ], + "x86Insts": [ + "mov edi, [ecx + 8]", + "mov edx, [ecx + 4]", + "mov ebx, [ecx]", + "mov esi, [ecx + 0xc]", + "imul edx, edi", + "mov eax, [ebx + 0xc]", + "sub eax, [ebx + 4]" + ], + "ExpectedArm64ASM": [ + "add x20, x7, #0x8 (8)", + "mov w20, w20", + "ldr w11, [x20]", + "add x20, x7, #0x4 (4)", + "mov w20, w20", + "ldr w5, [x20]", + "mov w20, w7", + "ldr w6, [x20]", + "add x20, x7, #0xc (12)", + "mov w20, w20", + "ldr w10, [x20]", + "mul w5, w5, w11", + "add x20, x6, #0xc (12)", + "mov w20, w20", + "ldr w4, [x20]", + "add x20, x6, #0x4 (4)", + "mov w20, w20", + "ldr w20, [x20]", + "eor w27, w4, w20", + "subs w26, w4, w20", + "mov x4, x26" + ] } } } diff --git a/unittests/InstructionCountCI/FEXOpt/MultiInst_TSO.json b/unittests/InstructionCountCI/FEXOpt/MultiInst_TSO.json new file mode 100644 index 0000000000..69bc00aa52 --- /dev/null +++ b/unittests/InstructionCountCI/FEXOpt/MultiInst_TSO.json @@ -0,0 +1,70 @@ +{ + "Features": { + "Bitness": 64, + "EnabledHostFeatures": [ + "TSO", + "LRCPC", + "LRCPC2", + "FLAGM", + "FLAGM2" + ], + "DisabledHostFeatures": [ + "SVE128", + "SVE256", + "RPRES", + "AFP" + ] + }, + "Comment": [ + "These are instruction combinations that could be more optimal if FEX optimized for them" + ], + "Instructions": { + "Load variables from structs": { + "x86InstructionCount": 7, + "ExpectedInstructionCount": 27, + "Comment": [ + "Saw this in 32-bit libvulkan_freedreno.so:tu_cs_begin_sub_stream_aligned", + "Loads a bunch of values from structs passed as arguments", + "Loads failed to use LRCPC2/ldapur with small immediate offset when possible" + ], + "x86Insts": [ + "mov edi, [ecx + 8]", + "mov edx, [ecx + 4]", + "mov ebx, [ecx]", + "mov esi, [ecx + 0xc]", + "imul edx, edi", + "mov eax, [ebx + 0xc]", + "sub eax, [ebx + 4]" + ], + "ExpectedArm64ASM": [ + "add x20, x7, #0x8 (8)", + "mov w20, w20", + "ldapur w11, [x20]", + "nop", + "add x20, x7, #0x4 (4)", + "mov w20, w20", + "ldapur w5, [x20]", + "nop", + "mov w20, w7", + "ldapur w6, [x20]", + "nop", + "add x20, x7, #0xc (12)", + "mov w20, w20", + "ldapur w10, [x20]", + "nop", + "mul w5, w5, w11", + "add x20, x6, #0xc (12)", + "mov w20, w20", + "ldapur w4, [x20]", + "nop", + "add x20, x6, #0x4 (4)", + "mov w20, w20", + "ldapur w20, [x20]", + "nop", + "eor w27, w4, w20", + "subs w26, w4, w20", + "mov x4, x26" + ] + } + } +}