Skip to content

Commit e2a4289

Browse files
committed
condense test into one line
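The pipeline is printed on a single line, so splitting the expected passes across separate CHECK lines lets FileCheck skip over arbitrary extra text between consecutive matches; as a result, the test does not fail when extra passes are added to the pipeline. Checking the whole pipeline with a single CHECK line per configuration closes that gap.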
1 parent 61aa7b9 commit e2a4289

File tree

1 file changed

+11
-268
lines changed

1 file changed

+11
-268
lines changed

llvm/test/CodeGen/AMDGPU/llc-pipeline-npm.ll

Lines changed: 11 additions & 268 deletions
Original file line numberDiff line numberDiff line change
@@ -1,276 +1,19 @@
1-
; RUN: llc -enable-new-pm -disable-verify -mtriple=amdgcn--amdhsa -print-pipeline-passes < %s 2>&1 \
1+
; RUN: llc -enable-new-pm -mtriple=amdgcn--amdhsa -O0 -print-pipeline-passes < %s 2>&1 \
2+
; RUN: | FileCheck -check-prefix=GCN-O0 %s
3+
4+
; RUN: llc -enable-new-pm -mtriple=amdgcn--amdhsa -print-pipeline-passes < %s 2>&1 \
25
; RUN: | FileCheck -check-prefix=GCN-O2 %s
36

4-
; RUN: llc -O3 -enable-new-pm -disable-verify -mtriple=amdgcn--amdhsa -print-pipeline-passes < %s 2>&1 \
7+
; RUN: llc -O3 -enable-new-pm -mtriple=amdgcn--amdhsa -print-pipeline-passes < %s 2>&1 \
58
; RUN: | FileCheck -check-prefix=GCN-O3 %s
69

7-
; GCN-O2: require<MachineModuleAnalysis>
8-
; GCN-O2: require<profile-summary>
9-
; GCN-O2: require<collector-metadata>
10-
; GCN-O2: pre-isel-intrinsic-lowering
11-
; GCN-O2: function(expand-large-div-rem
12-
; GCN-O2: expand-fp)
13-
; GCN-O2: amdgpu-remove-incompatible-functions
14-
; GCN-O2: amdgpu-printf-runtime-binding
15-
; GCN-O2: amdgpu-lower-ctor-dtor
16-
; GCN-O2: function(amdgpu-image-intrinsic-opt)
17-
; GCN-O2: expand-variadics
18-
; GCN-O2: amdgpu-always-inline
19-
; GCN-O2: always-inline
20-
; GCN-O2: amdgpu-export-kernel-runtime-handles
21-
; GCN-O2: amdgpu-sw-lower-lds
22-
; GCN-O2: amdgpu-lower-module-lds
23-
; GCN-O2: function(infer-address-spaces
24-
; GCN-O2: amdgpu-atomic-optimizer
25-
; GCN-O2: atomic-expand
26-
; GCN-O2: amdgpu-promote-alloca
27-
; GCN-O2: separate-const-offset-from-gep<>
28-
; GCN-O2: slsr
29-
; GCN-O2: early-cse<>
30-
; GCN-O2: nary-reassociate
31-
; GCN-O2: early-cse<>
32-
; GCN-O2: amdgpu-codegenprepare
33-
; GCN-O2: loop-mssa(loop-reduce)
34-
; GCN-O2: mergeicmps
35-
; GCN-O2: expand-memcmp
36-
; GCN-O2: gc-lowering
37-
; GCN-O2: lower-constant-intrinsics
38-
; GCN-O2: UnreachableBlockElimPass
39-
; GCN-O2: consthoist
40-
; GCN-O2: ReplaceWithVeclib
41-
; GCN-O2: partially-inline-libcalls
42-
; GCN-O2: ee-instrument<post-inline>
43-
; GCN-O2: scalarize-masked-mem-intrin
44-
; GCN-O2: ExpandReductionsPass
45-
; GCN-O2: early-cse<>
46-
; GCN-O2: amdgpu-lower-kernel-arguments)
47-
; GCN-O2: amdgpu-lower-buffer-fat-pointers
48-
; GCN-O2: cgscc(function(codegenprepare
49-
; GCN-O2: load-store-vectorizer
50-
; GCN-O2: lower-switch
51-
; GCN-O2: lower-invoke
52-
; GCN-O2: UnreachableBlockElimPass
53-
; GCN-O2: flatten-cfg
54-
; GCN-O2: sink
55-
; GCN-O2: amdgpu-late-codegenprepare
56-
; GCN-O2: amdgpu-unify-divergent-exit-nodes
57-
; GCN-O2: fix-irreducible
58-
; GCN-O2: unify-loop-exits
59-
; GCN-O2: StructurizeCFGPass
60-
; GCN-O2: amdgpu-annotate-uniform
61-
; GCN-O2: si-annotate-control-flow
62-
; GCN-O2: amdgpu-rewrite-undef-for-phi
63-
; GCN-O2: lcssa))
64-
; GCN-O2: amdgpu-perf-hint
65-
; GCN-O2: cgscc(function(require<uniformity>
66-
; GCN-O2: callbr-prepare
67-
; GCN-O2: safe-stack
68-
; GCN-O2: stack-protector))
69-
; GCN-O2: cgscc(function(machine-function(amdgpu-isel
70-
; GCN-O2: si-fix-sgpr-copies
71-
; GCN-O2: si-i1-copies
72-
; GCN-O2: finalize-isel
73-
; GCN-O2: early-tailduplication
74-
; GCN-O2: opt-phis
75-
; GCN-O2: stack-coloring
76-
; GCN-O2: localstackalloc
77-
; GCN-O2: dead-mi-elimination
78-
; GCN-O2: early-machinelicm
79-
; GCN-O2: machine-cse
80-
; GCN-O2: machine-sink
81-
; GCN-O2: peephole-opt
82-
; GCN-O2: dead-mi-elimination
83-
; GCN-O2: si-fold-operands
84-
; GCN-O2: gcn-dpp-combine
85-
; GCN-O2: si-load-store-opt
86-
; GCN-O2: si-peephole-sdwa
87-
; GCN-O2: early-machinelicm
88-
; GCN-O2: machine-cse
89-
; GCN-O2: si-fold-operands
90-
; GCN-O2: dead-mi-elimination
91-
; GCN-O2: si-shrink-instructions
92-
; GCN-O2: detect-dead-lanes
93-
; GCN-O2: InitUndefPass
94-
; GCN-O2: ProcessImplicitDefsPass
95-
; GCN-O2: unreachable-mbb-elimination
96-
; GCN-O2: require<live-vars>
97-
; GCN-O2: require<machine-loops>
98-
; GCN-O2: phi-node-elimination
99-
; GCN-O2: two-address-instruction
100-
; GCN-O2: register-coalescer
101-
; GCN-O2: rename-independent-subregs
102-
; GCN-O2: machine-scheduler
103-
; GCN-O2: greedy<all>
104-
; GCN-O2: amdgpu-nsa-reassign
105-
; GCN-O2: VirtRegRewriterPass
106-
; GCN-O2: stack-slot-coloring
107-
; GCN-O2: machine-cp
108-
; GCN-O2: machinelicm
109-
; GCN-O2: si-fix-vgpr-copies
110-
; GCN-O2: si-optimize-exec-masking
111-
; GCN-O2: remove-redundant-debug-values
112-
; GCN-O2: fixup-statepoint-caller-saved
113-
; GCN-O2: PostRAMachineSinkingPass
114-
; GCN-O2: ShrinkWrapPass
115-
; GCN-O2: PrologEpilogInserterPass
116-
; GCN-O2: branch-folder
117-
; GCN-O2: tailduplication
118-
; GCN-O2: machine-latecleanup
119-
; GCN-O2: machine-cp
120-
; GCN-O2: post-ra-pseudos
121-
; GCN-O2: postmisched
122-
; GCN-O2: block-placement
123-
; GCN-O2: fentry-insert
124-
; GCN-O2: xray-instrumentation
125-
; GCN-O2: patchable-function
126-
; GCN-O2: gcn-create-vopd
127-
; GCN-O2: si-memory-legalizer
128-
; GCN-O2: si-insert-waitcnts
129-
; GCN-O2: si-late-branch-lowering
130-
; GCN-O2: si-pre-emit-peephole
131-
; GCN-O2: post-RA-hazard-rec
132-
; GCN-O2: AMDGPUWaitSGPRHazardsPass
133-
; GCN-O2: amdgpu-insert-delay-alu
134-
; GCN-O2: branch-relaxation
135-
; GCN-O2: remove-loads-into-fake-uses
136-
; GCN-O2: live-debug-values
137-
; GCN-O2: machine-sanmd
138-
; GCN-O2: stack-frame-layout)
139-
; GCN-O2: invalidate<machine-function-info>))
14010

141-
; GCN-O3: require<MachineModuleAnalysis>
142-
; GCN-O3: require<profile-summary>
143-
; GCN-O3: require<collector-metadata>
144-
; GCN-O3: pre-isel-intrinsic-lowering
145-
; GCN-O3: function(expand-large-div-rem
146-
; GCN-O3: expand-fp)
147-
; GCN-O3: amdgpu-remove-incompatible-functions
148-
; GCN-O3: amdgpu-printf-runtime-binding
149-
; GCN-O3: amdgpu-lower-ctor-dtor
150-
; GCN-O3: function(amdgpu-image-intrinsic-opt)
151-
; GCN-O3: expand-variadics
152-
; GCN-O3: amdgpu-always-inline
153-
; GCN-O3: always-inline
154-
; GCN-O3: amdgpu-export-kernel-runtime-handles
155-
; GCN-O3: amdgpu-sw-lower-lds
156-
; GCN-O3: amdgpu-lower-module-lds
157-
; GCN-O3: function(infer-address-spaces
158-
; GCN-O3: amdgpu-atomic-optimizer
159-
; GCN-O3: atomic-expand
160-
; GCN-O3: amdgpu-promote-alloca
161-
; GCN-O3: separate-const-offset-from-gep<>
162-
; GCN-O3: slsr
163-
; GCN-O3: gvn<>
164-
; GCN-O3: nary-reassociate
165-
; GCN-O3: early-cse<>
166-
; GCN-O3: amdgpu-codegenprepare
167-
; GCN-O3: loop-mssa(loop-reduce)
168-
; GCN-O3: mergeicmps
169-
; GCN-O3: expand-memcmp
170-
; GCN-O3: gc-lowering
171-
; GCN-O3: lower-constant-intrinsics
172-
; GCN-O3: UnreachableBlockElimPass
173-
; GCN-O3: consthoist
174-
; GCN-O3: ReplaceWithVeclib
175-
; GCN-O3: partially-inline-libcalls
176-
; GCN-O3: ee-instrument<post-inline>
177-
; GCN-O3: scalarize-masked-mem-intrin
178-
; GCN-O3: ExpandReductionsPass
179-
; GCN-O3: gvn<>
180-
; GCN-O3: amdgpu-lower-kernel-arguments)
181-
; GCN-O3: amdgpu-lower-buffer-fat-pointers
182-
; GCN-O3: cgscc(function(codegenprepare
183-
; GCN-O3: load-store-vectorizer
184-
; GCN-O3: lower-switch
185-
; GCN-O3: lower-invoke
186-
; GCN-O3: UnreachableBlockElimPass
187-
; GCN-O3: flatten-cfg
188-
; GCN-O3: sink
189-
; GCN-O3: amdgpu-late-codegenprepare
190-
; GCN-O3: amdgpu-unify-divergent-exit-nodes
191-
; GCN-O3: fix-irreducible
192-
; GCN-O3: unify-loop-exits
193-
; GCN-O3: StructurizeCFGPass
194-
; GCN-O3: amdgpu-annotate-uniform
195-
; GCN-O3: si-annotate-control-flow
196-
; GCN-O3: amdgpu-rewrite-undef-for-phi
197-
; GCN-O3: lcssa))
198-
; GCN-O3: amdgpu-perf-hint
199-
; GCN-O3: cgscc(function(require<uniformity>
200-
; GCN-O3: callbr-prepare
201-
; GCN-O3: safe-stack
202-
; GCN-O3: stack-protector))
203-
; GCN-O3: cgscc(function(machine-function(amdgpu-isel
204-
; GCN-O3: si-fix-sgpr-copies
205-
; GCN-O3: si-i1-copies
206-
; GCN-O3: finalize-isel
207-
; GCN-O3: early-tailduplication
208-
; GCN-O3: opt-phis
209-
; GCN-O3: stack-coloring
210-
; GCN-O3: localstackalloc
211-
; GCN-O3: dead-mi-elimination
212-
; GCN-O3: early-machinelicm
213-
; GCN-O3: machine-cse
214-
; GCN-O3: machine-sink
215-
; GCN-O3: peephole-opt
216-
; GCN-O3: dead-mi-elimination
217-
; GCN-O3: si-fold-operands
218-
; GCN-O3: gcn-dpp-combine
219-
; GCN-O3: si-load-store-opt
220-
; GCN-O3: si-peephole-sdwa
221-
; GCN-O3: early-machinelicm
222-
; GCN-O3: machine-cse
223-
; GCN-O3: si-fold-operands
224-
; GCN-O3: dead-mi-elimination
225-
; GCN-O3: si-shrink-instructions
226-
; GCN-O3: detect-dead-lanes
227-
; GCN-O3: InitUndefPass
228-
; GCN-O3: ProcessImplicitDefsPass
229-
; GCN-O3: unreachable-mbb-elimination
230-
; GCN-O3: require<live-vars>
231-
; GCN-O3: require<machine-loops>
232-
; GCN-O3: phi-node-elimination
233-
; GCN-O3: two-address-instruction
234-
; GCN-O3: register-coalescer
235-
; GCN-O3: rename-independent-subregs
236-
; GCN-O3: machine-scheduler
237-
; GCN-O3: greedy<all>
238-
; GCN-O3: amdgpu-nsa-reassign
239-
; GCN-O3: VirtRegRewriterPass
240-
; GCN-O3: stack-slot-coloring
241-
; GCN-O3: machine-cp
242-
; GCN-O3: machinelicm
243-
; GCN-O3: si-fix-vgpr-copies
244-
; GCN-O3: si-optimize-exec-masking
245-
; GCN-O3: remove-redundant-debug-values
246-
; GCN-O3: fixup-statepoint-caller-saved
247-
; GCN-O3: PostRAMachineSinkingPass
248-
; GCN-O3: ShrinkWrapPass
249-
; GCN-O3: PrologEpilogInserterPass
250-
; GCN-O3: branch-folder
251-
; GCN-O3: tailduplication
252-
; GCN-O3: machine-latecleanup
253-
; GCN-O3: machine-cp
254-
; GCN-O3: post-ra-pseudos
255-
; GCN-O3: postmisched
256-
; GCN-O3: block-placement
257-
; GCN-O3: fentry-insert
258-
; GCN-O3: xray-instrumentation
259-
; GCN-O3: patchable-function
260-
; GCN-O3: gcn-create-vopd
261-
; GCN-O3: si-memory-legalizer
262-
; GCN-O3: si-insert-waitcnts
263-
; GCN-O3: si-late-branch-lowering
264-
; GCN-O3: si-pre-emit-peephole
265-
; GCN-O3: post-RA-hazard-rec
266-
; GCN-O3: AMDGPUWaitSGPRHazardsPass
267-
; GCN-O3: amdgpu-insert-delay-alu
268-
; GCN-O3: branch-relaxation
269-
; GCN-O3: remove-loads-into-fake-uses
270-
; GCN-O3: live-debug-values
271-
; GCN-O3: machine-sanmd
272-
; GCN-O3: stack-frame-layout)
273-
; GCN-O3: invalidate<machine-function-info>))
11+
; GCN-O0: require<MachineModuleAnalysis>,require<profile-summary>,require<collector-metadata>,pre-isel-intrinsic-lowering,function(expand-large-div-rem,expand-fp),amdgpu-remove-incompatible-functions,amdgpu-printf-runtime-binding,amdgpu-lower-ctor-dtor,expand-variadics,amdgpu-always-inline,always-inline,amdgpu-export-kernel-runtime-handles,amdgpu-sw-lower-lds,amdgpu-lower-module-lds,function(atomic-expand,verify,gc-lowering,lower-constant-intrinsics,UnreachableBlockElimPass,ee-instrument<post-inline>,scalarize-masked-mem-intrin,ExpandReductionsPass,amdgpu-lower-kernel-arguments),amdgpu-lower-buffer-fat-pointers,cgscc(function(lower-switch,lower-invoke,UnreachableBlockElimPass,amdgpu-unify-divergent-exit-nodes,fix-irreducible,unify-loop-exits,StructurizeCFGPass,amdgpu-annotate-uniform,si-annotate-control-flow,amdgpu-rewrite-undef-for-phi,lcssa,require<uniformity>,callbr-prepare,safe-stack,stack-protector,verify)),cgscc(function(machine-function(amdgpu-isel,si-fix-sgpr-copies,si-i1-copies,finalize-isel,localstackalloc,phi-node-elimination,two-address-instruction,regallocfast,si-fix-vgpr-copies,remove-redundant-debug-values,fixup-statepoint-caller-saved,prolog-epilog,post-ra-pseudos,fentry-insert,xray-instrumentation,patchable-function,si-memory-legalizer,si-insert-waitcnts,si-late-branch-lowering,post-RA-hazard-rec,AMDGPUWaitSGPRHazardsPass,branch-relaxation,remove-loads-into-fake-uses,live-debug-values,machine-sanmd,stack-frame-layout,verify),invalidate<machine-function-info>))
12+
13+
14+
; GCN-O2: require<MachineModuleAnalysis>,require<profile-summary>,require<collector-metadata>,pre-isel-intrinsic-lowering,function(expand-large-div-rem,expand-fp),amdgpu-remove-incompatible-functions,amdgpu-printf-runtime-binding,amdgpu-lower-ctor-dtor,function(amdgpu-image-intrinsic-opt),expand-variadics,amdgpu-always-inline,always-inline,amdgpu-export-kernel-runtime-handles,amdgpu-sw-lower-lds,amdgpu-lower-module-lds,function(infer-address-spaces,amdgpu-atomic-optimizer,atomic-expand,amdgpu-promote-alloca,separate-const-offset-from-gep<>,slsr,early-cse<>,nary-reassociate,early-cse<>,amdgpu-codegenprepare,verify,loop-mssa(loop-reduce),mergeicmps,expand-memcmp,gc-lowering,lower-constant-intrinsics,UnreachableBlockElimPass,consthoist,ReplaceWithVeclib,partially-inline-libcalls,ee-instrument<post-inline>,scalarize-masked-mem-intrin,ExpandReductionsPass,early-cse<>,amdgpu-lower-kernel-arguments),amdgpu-lower-buffer-fat-pointers,cgscc(function(codegenprepare,load-store-vectorizer,lower-switch,lower-invoke,UnreachableBlockElimPass,flatten-cfg,sink,amdgpu-late-codegenprepare,amdgpu-unify-divergent-exit-nodes,fix-irreducible,unify-loop-exits,StructurizeCFGPass,amdgpu-annotate-uniform,si-annotate-control-flow,amdgpu-rewrite-undef-for-phi,lcssa)),amdgpu-perf-hint,cgscc(function(require<uniformity>,callbr-prepare,safe-stack,stack-protector,verify)),cgscc(function(machine-function(amdgpu-isel,si-fix-sgpr-copies,si-i1-copies,finalize-isel,early-tailduplication,opt-phis,stack-coloring,localstackalloc,dead-mi-elimination,early-machinelicm,machine-cse,machine-sink,peephole-opt,dead-mi-elimination,si-fold-operands,gcn-dpp-combine,si-load-store-opt,si-peephole-sdwa,early-machinelicm,machine-cse,si-fold-operands,dead-mi-elimination,si-shrink-instructions,detect-dead-lanes,InitUndefPass,ProcessImplicitDefsPass,unreachable-mbb-elimination,require<live-vars>,require<machine-loops>,phi-node-elimination,two-address-instruction,register-coalescer,rename-independent-subregs,machine-scheduler,amdgpu-pre-ra-long-branch-reg,greedy<sgpr>,virt-reg-rewriter<no-clear-vregs>,stack-slot-coloring,si-lower-sgpr-spills,si-pre-allocate-wwm-regs,greedy<wwm>,si-lower-wwm-copies,virt-reg-rewriter<no-clear-vregs>,amdgpu-reserve-wwm-regs,greedy<vgpr>,amdgpu-nsa-reassign,virt-reg-rewriter,machine-cp,machinelicm,si-fix-vgpr-copies,si-optimize-exec-masking,remove-redundant-debug-values,fixup-statepoint-caller-saved,PostRAMachineSinkingPass,shrink-wrap,prolog-epilog,branch-folder,tailduplication,machine-latecleanup,machine-cp,post-ra-pseudos,postmisched,block-placement,fentry-insert,xray-instrumentation,patchable-function,gcn-create-vopd,si-memory-legalizer,si-insert-waitcnts,si-late-branch-lowering,si-pre-emit-peephole,post-RA-hazard-rec,AMDGPUWaitSGPRHazardsPass,amdgpu-insert-delay-alu,branch-relaxation,remove-loads-into-fake-uses,live-debug-values,machine-sanmd,stack-frame-layout,verify),invalidate<machine-function-info>))
15+
16+
; GCN-O3: require<MachineModuleAnalysis>,require<profile-summary>,require<collector-metadata>,pre-isel-intrinsic-lowering,function(expand-large-div-rem,expand-fp),amdgpu-remove-incompatible-functions,amdgpu-printf-runtime-binding,amdgpu-lower-ctor-dtor,function(amdgpu-image-intrinsic-opt),expand-variadics,amdgpu-always-inline,always-inline,amdgpu-export-kernel-runtime-handles,amdgpu-sw-lower-lds,amdgpu-lower-module-lds,function(infer-address-spaces,amdgpu-atomic-optimizer,atomic-expand,amdgpu-promote-alloca,separate-const-offset-from-gep<>,slsr,gvn<>,nary-reassociate,early-cse<>,amdgpu-codegenprepare,verify,loop-mssa(loop-reduce),mergeicmps,expand-memcmp,gc-lowering,lower-constant-intrinsics,UnreachableBlockElimPass,consthoist,ReplaceWithVeclib,partially-inline-libcalls,ee-instrument<post-inline>,scalarize-masked-mem-intrin,ExpandReductionsPass,gvn<>,amdgpu-lower-kernel-arguments),amdgpu-lower-buffer-fat-pointers,cgscc(function(codegenprepare,load-store-vectorizer,lower-switch,lower-invoke,UnreachableBlockElimPass,flatten-cfg,sink,amdgpu-late-codegenprepare,amdgpu-unify-divergent-exit-nodes,fix-irreducible,unify-loop-exits,StructurizeCFGPass,amdgpu-annotate-uniform,si-annotate-control-flow,amdgpu-rewrite-undef-for-phi,lcssa)),amdgpu-perf-hint,cgscc(function(require<uniformity>,callbr-prepare,safe-stack,stack-protector,verify)),cgscc(function(machine-function(amdgpu-isel,si-fix-sgpr-copies,si-i1-copies,finalize-isel,early-tailduplication,opt-phis,stack-coloring,localstackalloc,dead-mi-elimination,early-machinelicm,machine-cse,machine-sink,peephole-opt,dead-mi-elimination,si-fold-operands,gcn-dpp-combine,si-load-store-opt,si-peephole-sdwa,early-machinelicm,machine-cse,si-fold-operands,dead-mi-elimination,si-shrink-instructions,detect-dead-lanes,InitUndefPass,ProcessImplicitDefsPass,unreachable-mbb-elimination,require<live-vars>,require<machine-loops>,phi-node-elimination,two-address-instruction,register-coalescer,rename-independent-subregs,machine-scheduler,amdgpu-pre-ra-long-branch-reg,greedy<sgpr>,virt-reg-rewriter<no-clear-vregs>,stack-slot-coloring,si-lower-sgpr-spills,si-pre-allocate-wwm-regs,greedy<wwm>,si-lower-wwm-copies,virt-reg-rewriter<no-clear-vregs>,amdgpu-reserve-wwm-regs,greedy<vgpr>,amdgpu-nsa-reassign,virt-reg-rewriter,machine-cp,machinelicm,si-fix-vgpr-copies,si-optimize-exec-masking,remove-redundant-debug-values,fixup-statepoint-caller-saved,PostRAMachineSinkingPass,shrink-wrap,prolog-epilog,branch-folder,tailduplication,machine-latecleanup,machine-cp,post-ra-pseudos,postmisched,block-placement,fentry-insert,xray-instrumentation,patchable-function,gcn-create-vopd,si-memory-legalizer,si-insert-waitcnts,si-late-branch-lowering,si-pre-emit-peephole,post-RA-hazard-rec,AMDGPUWaitSGPRHazardsPass,amdgpu-insert-delay-alu,branch-relaxation,remove-loads-into-fake-uses,live-debug-values,machine-sanmd,stack-frame-layout,verify),invalidate<machine-function-info>))
27417

27518

27619
define void @empty() {

0 commit comments

Comments
 (0)