Files
llvm-project/llvm/test/CodeGen/AArch64/machine-outliner-sort-per-priority.mir
Xuan Zhang 3b16630c26 [MachineOutliner] Sort by Benefit to Cost Ratio (#90264)
This PR depends on https://github.com/llvm/llvm-project/pull/90260

We changed the order in which functions are outlined in Machine
Outliner.

The formula for priority is found via a black-box Bayesian optimization
toolbox. Using this formula for sorting consistently reduces the
uncompressed size of large real-world mobile apps. We also ran a few
benchmarks using LLVM test suites, and showed that sorting by priority
consistently reduces the text segment size.

|run (CTMark/)   |baseline (1)|priority (2)|diff (1 -> 2)|
|----------------|------------|------------|-------------|
|lencod          |349624      |349264      |-0.1030%     |
|SPASS           |219672      |219480      |-0.0874%     |
|kc              |271956      |251200      |-7.6321%     |
|sqlite3         |223920      |223708      |-0.0947%     |
|7zip-benchmark  |405364      |402624      |-0.6759%     |
|bullet          |139820      |139500      |-0.2289%     |
|consumer-typeset|295684      |290196      |-1.8560%     |
|pairlocalalign  |72236       |72092       |-0.1993%     |
|tramp3d-v4      |189572      |189292      |-0.1477%     |

This is part of an enhanced version of machine outliner -- see
[RFC](https://discourse.llvm.org/t/rfc-enhanced-machine-outliner-part-1-fulllto-part-2-thinlto-nolto-to-come/78732).
2024-06-07 06:50:13 -07:00

207 lines
6.4 KiB
YAML

# The content of this test is modfied upon the output obtained from running
# `bin/llc -O2 -stop-before=machine-outliner <path_to_llvm_project>/llvm/test/CodeGen/AArch64/machine-outliner-sort-per-priority.ll -o -`
# RUN: llc -mtriple=aarch64 -run-pass=machine-outliner -verify-machineinstrs %s -o - | FileCheck %s
--- |
declare i32 @foo()
define void @f1() #0 { ret void }
define void @f2() #0 { ret void }
define void @f3() #0 { ret void }
define void @f4() #0 { ret void }
define void @f5() #0 { ret void }
define void @f6() #0 { ret void }
attributes #0 = { minsize }
...
---
# CHECK-LABEL: name: f1
# CHECK-LABEL: bb.0:
# CHECK-NEXT: liveins: $lr
# CHECK-NEXT: {{ $}}
# CHECK-NEXT: $x5 = ORRXrs $xzr, $lr, 0
# CHECK-NEXT: BL @OUTLINED_FUNCTION_1
# CHECK-NEXT: $lr = ORRXrs $xzr, $x5, 0
# CHECK-NEXT: $w5 = MOVZWi 11, 0
# CHECK-NEXT: TCRETURNdi @OUTLINED_FUNCTION_0
name: f1
tracksRegLiveness: true
frameInfo:
isCalleeSavedInfoValid: true
machineFunctionInfo:
hasRedZone: false
body: |
bb.0:
$w0 = MOVZWi 1, 0
$w1 = MOVZWi 2, 0
$w2 = MOVZWi 3, 0
$w3 = MOVZWi 4, 0
$w4 = MOVZWi 5, 0
$w5 = MOVZWi 11, 0
$w6 = MOVZWi 6, 0
$w7 = MOVZWi 7, 0
TCRETURNdi @foo, 0, csr_darwin_aarch64_aapcs, implicit $sp, implicit killed $w0, implicit killed $w1, implicit killed $w2, implicit killed $w3, implicit killed $w4, implicit killed $w5, implicit killed $w6, implicit killed $w7
...
---
# CHECK-LABEL: name: f2
# CHECK-LABEL: bb.0:
# CHECK-NEXT: liveins: $lr
# CHECK-NEXT: {{ $}}
# CHECK-NEXT: $x5 = ORRXrs $xzr, $lr, 0
# CHECK-NEXT: BL @OUTLINED_FUNCTION_1
# CHECK-NEXT: $lr = ORRXrs $xzr, $x5, 0
# CHECK-NEXT: $w5 = MOVZWi 12, 0
# CHECK-NEXT: TCRETURNdi @OUTLINED_FUNCTION_0
name: f2
tracksRegLiveness: true
frameInfo:
isCalleeSavedInfoValid: true
machineFunctionInfo:
hasRedZone: false
body: |
bb.0:
$w0 = MOVZWi 1, 0
$w1 = MOVZWi 2, 0
$w2 = MOVZWi 3, 0
$w3 = MOVZWi 4, 0
$w4 = MOVZWi 5, 0
$w5 = MOVZWi 12, 0
$w6 = MOVZWi 6, 0
$w7 = MOVZWi 7, 0
TCRETURNdi @foo, 0, csr_darwin_aarch64_aapcs, implicit $sp, implicit killed $w0, implicit killed $w1, implicit killed $w2, implicit killed $w3, implicit killed $w4, implicit killed $w5, implicit killed $w6, implicit killed $w7
...
---
# CHECK-LABEL: name: f3
# CHECK-LABEL: bb.0:
# CHECK-NEXT: liveins: $lr
# CHECK-NEXT: {{ $}}
# CHECK-NEXT: $x5 = ORRXrs $xzr, $lr, 0
# CHECK-NEXT: BL @OUTLINED_FUNCTION_1
# CHECK-NEXT: $lr = ORRXrs $xzr, $x5, 0
# CHECK-NEXT: $w5 = MOVZWi 13, 0
# CHECK-NEXT: TCRETURNdi @OUTLINED_FUNCTION_0
name: f3
tracksRegLiveness: true
frameInfo:
isCalleeSavedInfoValid: true
machineFunctionInfo:
hasRedZone: false
body: |
bb.0:
$w0 = MOVZWi 1, 0
$w1 = MOVZWi 2, 0
$w2 = MOVZWi 3, 0
$w3 = MOVZWi 4, 0
$w4 = MOVZWi 5, 0
$w5 = MOVZWi 13, 0
$w6 = MOVZWi 6, 0
$w7 = MOVZWi 7, 0
TCRETURNdi @foo, 0, csr_darwin_aarch64_aapcs, implicit $sp, implicit killed $w0, implicit killed $w1, implicit killed $w2, implicit killed $w3, implicit killed $w4, implicit killed $w5, implicit killed $w6, implicit killed $w7
...
---
# CHECK-LABEL: name: f4
# CHECK-LABEL: bb.0:
# CHECK-NEXT: liveins: $lr
# CHECK-NEXT: {{ $}}
# CHECK-NEXT: $x5 = ORRXrs $xzr, $lr, 0
# CHECK-NEXT: BL @OUTLINED_FUNCTION_1
# CHECK-NEXT: $lr = ORRXrs $xzr, $x5, 0
# CHECK-NEXT: $w5 = MOVZWi 14, 0
# CHECK-NEXT: TCRETURNdi @OUTLINED_FUNCTION_0
name: f4
tracksRegLiveness: true
frameInfo:
isCalleeSavedInfoValid: true
machineFunctionInfo:
hasRedZone: false
body: |
bb.0:
$w0 = MOVZWi 1, 0
$w1 = MOVZWi 2, 0
$w2 = MOVZWi 3, 0
$w3 = MOVZWi 4, 0
$w4 = MOVZWi 5, 0
$w5 = MOVZWi 14, 0
$w6 = MOVZWi 6, 0
$w7 = MOVZWi 7, 0
TCRETURNdi @foo, 0, csr_darwin_aarch64_aapcs, implicit $sp, implicit killed $w0, implicit killed $w1, implicit killed $w2, implicit killed $w3, implicit killed $w4, implicit killed $w5, implicit killed $w6, implicit killed $w7
...
---
# CHECK-LABEL: name: f5
# CHECK-LABEL: bb.0:
# CHECK-NEXT: liveins: $lr
# CHECK-NEXT: {{ $}}
# CHECK-NEXT: $x5 = ORRXrs $xzr, $lr, 0
# CHECK-NEXT: BL @OUTLINED_FUNCTION_1
# CHECK-NEXT: $lr = ORRXrs $xzr, $x5, 0
# CHECK-NOT: @OUTLINED_FUNCTION_0
name: f5
tracksRegLiveness: true
frameInfo:
isCalleeSavedInfoValid: true
machineFunctionInfo:
hasRedZone: false
body: |
bb.0:
$w0 = MOVZWi 1, 0
$w1 = MOVZWi 2, 0
$w2 = MOVZWi 3, 0
$w3 = MOVZWi 4, 0
$w4 = MOVZWi 5, 0
$w5 = MOVZWi 15, 0
$w6 = MOVZWi 8, 0
$w7 = MOVZWi 9, 0
TCRETURNdi @foo, 0, csr_darwin_aarch64_aapcs, implicit $sp, implicit killed $w0, implicit killed $w1, implicit killed $w2, implicit killed $w3, implicit killed $w4, implicit killed $w5, implicit killed $w6, implicit killed $w7
...
---
# CHECK-LABEL: name: f6
# CHECK-LABEL: bb.0:
# CHECK-NEXT: liveins: $lr
# CHECK-NEXT: {{ $}}
# CHECK-NEXT: $x5 = ORRXrs $xzr, $lr, 0
# CHECK-NEXT: BL @OUTLINED_FUNCTION_1
# CHECK-NEXT: $lr = ORRXrs $xzr, $x5, 0
# CHECK-NOT: @OUTLINED_FUNCTION_0
name: f6
tracksRegLiveness: true
frameInfo:
isCalleeSavedInfoValid: true
machineFunctionInfo:
hasRedZone: false
body: |
bb.0:
$w0 = MOVZWi 1, 0
$w1 = MOVZWi 2, 0
$w2 = MOVZWi 3, 0
$w3 = MOVZWi 4, 0
$w4 = MOVZWi 5, 0
$w5 = MOVZWi 16, 0
$w6 = MOVZWi 9, 0
$w7 = MOVZWi 8, 0
TCRETURNdi @foo, 0, csr_darwin_aarch64_aapcs, implicit $sp, implicit killed $w0, implicit killed $w1, implicit killed $w2, implicit killed $w3, implicit killed $w4, implicit killed $w5, implicit killed $w6, implicit killed $w7
...
# CHECK-LABEL: name: OUTLINED_FUNCTION_0
# CHECK-LABEL: bb.0:
# CHECK-NEXT: liveins: $x19, $x20, $x21, $x22, $x23, $x24, $x25, $x26, $x27, $x28, $lr, $d8, $d9, $d10, $d11, $d12, $d13, $d14, $d15, $w0, $w1, $w2, $w3, $w4, $w5
# CHECK-NEXT: {{ $}}
# CHECK-NEXT: $w6 = MOVZWi 6, 0
# CHECK-NEXT: $w7 = MOVZWi 7, 0
# CHECK-LABEL: name: OUTLINED_FUNCTION_1
# CHECK-LABEL: bb.0:
# CHECK-NEXT: liveins: $x19, $x20, $x21, $x22, $x23, $x24, $x25, $x26, $x27, $x28, $lr, $d8, $d9, $d10, $d11, $d12, $d13, $d14, $d15
# CHECK-NEXT: {{ $}}
# CHECK-NEXT: $w0 = MOVZWi 1, 0
# CHECK-NEXT: $w1 = MOVZWi 2, 0
# CHECK-NEXT: $w2 = MOVZWi 3, 0
# CHECK-NEXT: $w3 = MOVZWi 4, 0
# CHECK-NEXT: $w4 = MOVZWi 5, 0
# CHECK-NEXT: RET $lr