Skip to content

Commit cd55329

Browse files
committed
separate tests for O2 and O3
1 parent 435d1c6 commit cd55329

File tree

1 file changed

+137
-2
lines changed

1 file changed

+137
-2
lines changed

llvm/test/CodeGen/AMDGPU/llc-pipeline-npm.ll

Lines changed: 137 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,142 @@
1-
; RUN: llc -O3 -enable-new-pm -mtriple=amdgcn--amdhsa -disable-verify -print-pipeline-passes < %s 2>&1 \
1+
; RUN: llc -enable-new-pm -disable-verify -mtriple=amdgcn--amdhsa -print-pipeline-passes < %s 2>&1 \
2+
; RUN: | FileCheck -check-prefix=GCN-O2 %s
3+
4+
; RUN: llc -O3 -enable-new-pm -disable-verify -mtriple=amdgcn--amdhsa -print-pipeline-passes < %s 2>&1 \
2 5
; RUN: | FileCheck -check-prefix=GCN-O3 %s
3 6

4-
; REQUIRES: asserts
7+
; GCN-O2: require<MachineModuleAnalysis>
8+
; GCN-O2: require<profile-summary>
9+
; GCN-O2: require<collector-metadata>
10+
; GCN-O2: pre-isel-intrinsic-lowering
11+
; GCN-O2: function(expand-large-div-rem
12+
; GCN-O2: expand-fp)
13+
; GCN-O2: amdgpu-remove-incompatible-functions
14+
; GCN-O2: amdgpu-printf-runtime-binding
15+
; GCN-O2: amdgpu-lower-ctor-dtor
16+
; GCN-O2: function(amdgpu-image-intrinsic-opt)
17+
; GCN-O2: expand-variadics
18+
; GCN-O2: amdgpu-always-inline
19+
; GCN-O2: always-inline
20+
; GCN-O2: amdgpu-export-kernel-runtime-handles
21+
; GCN-O2: amdgpu-sw-lower-lds
22+
; GCN-O2: amdgpu-lower-module-lds
23+
; GCN-O2: function(infer-address-spaces
24+
; GCN-O2: amdgpu-atomic-optimizer
25+
; GCN-O2: atomic-expand
26+
; GCN-O2: amdgpu-promote-alloca
27+
; GCN-O2: separate-const-offset-from-gep<>
28+
; GCN-O2: slsr
29+
; GCN-O2: early-cse<>
30+
; GCN-O2: nary-reassociate
31+
; GCN-O2: early-cse<>
32+
; GCN-O2: amdgpu-codegenprepare
33+
; GCN-O2: loop-mssa(loop-reduce)
34+
; GCN-O2: mergeicmps
35+
; GCN-O2: expand-memcmp
36+
; GCN-O2: gc-lowering
37+
; GCN-O2: lower-constant-intrinsics
38+
; GCN-O2: UnreachableBlockElimPass
39+
; GCN-O2: consthoist
40+
; GCN-O2: ReplaceWithVeclib
41+
; GCN-O2: partially-inline-libcalls
42+
; GCN-O2: ee-instrument<post-inline>
43+
; GCN-O2: scalarize-masked-mem-intrin
44+
; GCN-O2: ExpandReductionsPass
45+
; GCN-O2: early-cse<>
46+
; GCN-O2: amdgpu-lower-kernel-arguments)
47+
; GCN-O2: amdgpu-lower-buffer-fat-pointers
48+
; GCN-O2: cgscc(function(codegenprepare
49+
; GCN-O2: load-store-vectorizer
50+
; GCN-O2: lower-switch
51+
; GCN-O2: lower-invoke
52+
; GCN-O2: UnreachableBlockElimPass
53+
; GCN-O2: flatten-cfg
54+
; GCN-O2: sink
55+
; GCN-O2: amdgpu-late-codegenprepare
56+
; GCN-O2: amdgpu-unify-divergent-exit-nodes
57+
; GCN-O2: fix-irreducible
58+
; GCN-O2: unify-loop-exits
59+
; GCN-O2: StructurizeCFGPass
60+
; GCN-O2: amdgpu-annotate-uniform
61+
; GCN-O2: si-annotate-control-flow
62+
; GCN-O2: amdgpu-rewrite-undef-for-phi
63+
; GCN-O2: lcssa))
64+
; GCN-O2: amdgpu-perf-hint
65+
; GCN-O2: cgscc(function(require<uniformity>
66+
; GCN-O2: callbr-prepare
67+
; GCN-O2: safe-stack
68+
; GCN-O2: stack-protector))
69+
; GCN-O2: cgscc(function(machine-function(amdgpu-isel
70+
; GCN-O2: si-fix-sgpr-copies
71+
; GCN-O2: si-i1-copies
72+
; GCN-O2: finalize-isel
73+
; GCN-O2: early-tailduplication
74+
; GCN-O2: opt-phis
75+
; GCN-O2: stack-coloring
76+
; GCN-O2: localstackalloc
77+
; GCN-O2: dead-mi-elimination
78+
; GCN-O2: early-machinelicm
79+
; GCN-O2: machine-cse
80+
; GCN-O2: machine-sink
81+
; GCN-O2: peephole-opt
82+
; GCN-O2: dead-mi-elimination
83+
; GCN-O2: si-fold-operands
84+
; GCN-O2: gcn-dpp-combine
85+
; GCN-O2: si-load-store-opt
86+
; GCN-O2: si-peephole-sdwa
87+
; GCN-O2: early-machinelicm
88+
; GCN-O2: machine-cse
89+
; GCN-O2: si-fold-operands
90+
; GCN-O2: dead-mi-elimination
91+
; GCN-O2: si-shrink-instructions
92+
; GCN-O2: detect-dead-lanes
93+
; GCN-O2: InitUndefPass
94+
; GCN-O2: ProcessImplicitDefsPass
95+
; GCN-O2: unreachable-mbb-elimination
96+
; GCN-O2: require<live-vars>
97+
; GCN-O2: require<machine-loops>
98+
; GCN-O2: phi-node-elimination
99+
; GCN-O2: two-address-instruction
100+
; GCN-O2: register-coalescer
101+
; GCN-O2: rename-independent-subregs
102+
; GCN-O2: machine-scheduler
103+
; GCN-O2: greedy<all>
104+
; GCN-O2: amdgpu-nsa-reassign
105+
; GCN-O2: VirtRegRewriterPass
106+
; GCN-O2: stack-slot-coloring
107+
; GCN-O2: machine-cp
108+
; GCN-O2: machinelicm
109+
; GCN-O2: si-fix-vgpr-copies
110+
; GCN-O2: si-optimize-exec-masking
111+
; GCN-O2: remove-redundant-debug-values
112+
; GCN-O2: fixup-statepoint-caller-saved
113+
; GCN-O2: PostRAMachineSinkingPass
114+
; GCN-O2: ShrinkWrapPass
115+
; GCN-O2: PrologEpilogInserterPass
116+
; GCN-O2: branch-folder
117+
; GCN-O2: tailduplication
118+
; GCN-O2: machine-latecleanup
119+
; GCN-O2: machine-cp
120+
; GCN-O2: post-ra-pseudos
121+
; GCN-O2: postmisched
122+
; GCN-O2: block-placement
123+
; GCN-O2: fentry-insert
124+
; GCN-O2: xray-instrumentation
125+
; GCN-O2: patchable-function
126+
; GCN-O2: gcn-create-vopd
127+
; GCN-O2: si-memory-legalizer
128+
; GCN-O2: si-insert-waitcnts
129+
; GCN-O2: si-late-branch-lowering
130+
; GCN-O2: si-pre-emit-peephole
131+
; GCN-O2: post-RA-hazard-rec
132+
; GCN-O2: AMDGPUWaitSGPRHazardsPass
133+
; GCN-O2: amdgpu-insert-delay-alu
134+
; GCN-O2: branch-relaxation
135+
; GCN-O2: remove-loads-into-fake-uses
136+
; GCN-O2: live-debug-values
137+
; GCN-O2: machine-sanmd
138+
; GCN-O2: stack-frame-layout)
139+
; GCN-O2: invalidate<machine-function-info>))
5 140

6 141
; GCN-O3: require<MachineModuleAnalysis>
7 142
; GCN-O3: require<profile-summary>

0 commit comments

Comments
 (0)