@@ -18,50 +18,50 @@ target triple = "x86_64-unknown-linux-gnu"
18
18
define void @test () {
19
19
; SSE2-LABEL: 'test'
20
20
; SSE2: LV: Found an estimated cost of 1 for VF 1 For instruction: %valB = load i32, ptr %inB, align 4
21
- ; SSE2: LV: Found an estimated cost of 25 for VF 2 For instruction: %valB = load i32, ptr %inB, align 4
22
- ; SSE2: LV: Found an estimated cost of 51 for VF 4 For instruction: %valB = load i32, ptr %inB, align 4
23
- ; SSE2: LV: Found an estimated cost of 102 for VF 8 For instruction: %valB = load i32, ptr %inB, align 4
24
- ; SSE2: LV: Found an estimated cost of 204 for VF 16 For instruction: %valB = load i32, ptr %inB, align 4
21
+ ; SSE2: Cost of 25 for VF 2: {{.*}}ir< %valB> = load
22
+ ; SSE2: Cost of 51 for VF 4: {{.*}}ir< %valB> = load
23
+ ; SSE2: Cost of 102 for VF 8: {{.*}}ir< %valB> = load
24
+ ; SSE2: Cost of 204 for VF 16: {{.*}}ir< %valB> = load
25
25
;
26
26
; SSE42-LABEL: 'test'
27
27
; SSE42: LV: Found an estimated cost of 1 for VF 1 For instruction: %valB = load i32, ptr %inB, align 4
28
- ; SSE42: LV: Found an estimated cost of 24 for VF 2 For instruction: %valB = load i32, ptr %inB, align 4
29
- ; SSE42: LV: Found an estimated cost of 48 for VF 4 For instruction: %valB = load i32, ptr %inB, align 4
30
- ; SSE42: LV: Found an estimated cost of 96 for VF 8 For instruction: %valB = load i32, ptr %inB, align 4
31
- ; SSE42: LV: Found an estimated cost of 192 for VF 16 For instruction: %valB = load i32, ptr %inB, align 4
28
+ ; SSE42: Cost of 24 for VF 2: {{.*}}ir< %valB> = load
29
+ ; SSE42: Cost of 48 for VF 4: {{.*}}ir< %valB> = load
30
+ ; SSE42: Cost of 96 for VF 8: {{.*}}ir< %valB> = load
31
+ ; SSE42: Cost of 192 for VF 16: {{.*}}ir< %valB> = load
32
32
;
33
33
; AVX1-LABEL: 'test'
34
34
; AVX1: LV: Found an estimated cost of 1 for VF 1 For instruction: %valB = load i32, ptr %inB, align 4
35
- ; AVX1: LV: Found an estimated cost of 24 for VF 2 For instruction: %valB = load i32, ptr %inB, align 4
36
- ; AVX1: LV: Found an estimated cost of 48 for VF 4 For instruction: %valB = load i32, ptr %inB, align 4
37
- ; AVX1: LV: Found an estimated cost of 97 for VF 8 For instruction: %valB = load i32, ptr %inB, align 4
38
- ; AVX1: LV: Found an estimated cost of 194 for VF 16 For instruction: %valB = load i32, ptr %inB, align 4
39
- ; AVX1: LV: Found an estimated cost of 388 for VF 32 For instruction: %valB = load i32, ptr %inB, align 4
35
+ ; AVX1: Cost of 24 for VF 2: {{.*}}ir< %valB> = load
36
+ ; AVX1: Cost of 48 for VF 4: {{.*}}ir< %valB> = load
37
+ ; AVX1: Cost of 97 for VF 8: {{.*}}ir< %valB> = load
38
+ ; AVX1: Cost of 194 for VF 16: {{.*}}ir< %valB> = load
39
+ ; AVX1: Cost of 388 for VF 32: {{.*}}ir< %valB> = load
40
40
;
41
41
; AVX2-SLOWGATHER-LABEL: 'test'
42
42
; AVX2-SLOWGATHER: LV: Found an estimated cost of 1 for VF 1 For instruction: %valB = load i32, ptr %inB, align 4
43
- ; AVX2-SLOWGATHER: LV: Found an estimated cost of 4 for VF 2 For instruction: %valB = load i32, ptr %inB, align 4
44
- ; AVX2-SLOWGATHER: LV: Found an estimated cost of 8 for VF 4 For instruction: %valB = load i32, ptr %inB, align 4
45
- ; AVX2-SLOWGATHER: LV: Found an estimated cost of 17 for VF 8 For instruction: %valB = load i32, ptr %inB, align 4
46
- ; AVX2-SLOWGATHER: LV: Found an estimated cost of 34 for VF 16 For instruction: %valB = load i32, ptr %inB, align 4
47
- ; AVX2-SLOWGATHER: LV: Found an estimated cost of 68 for VF 32 For instruction: %valB = load i32, ptr %inB, align 4
43
+ ; AVX2-SLOWGATHER: Cost of 4 for VF 2: {{.*}}ir< %valB> = load
44
+ ; AVX2-SLOWGATHER: Cost of 8 for VF 4: {{.*}}ir< %valB> = load
45
+ ; AVX2-SLOWGATHER: Cost of 17 for VF 8: {{.*}}ir< %valB> = load
46
+ ; AVX2-SLOWGATHER: Cost of 34 for VF 16: {{.*}}ir< %valB> = load
47
+ ; AVX2-SLOWGATHER: Cost of 68 for VF 32: {{.*}}ir< %valB> = load
48
48
;
49
49
; AVX2-FASTGATHER-LABEL: 'test'
50
50
; AVX2-FASTGATHER: LV: Found an estimated cost of 1 for VF 1 For instruction: %valB = load i32, ptr %inB, align 4
51
- ; AVX2-FASTGATHER: LV: Found an estimated cost of 4 for VF 2 For instruction: %valB = load i32, ptr %inB, align 4
52
- ; AVX2-FASTGATHER: LV: Found an estimated cost of 6 for VF 4 For instruction: %valB = load i32, ptr %inB, align 4
53
- ; AVX2-FASTGATHER: LV: Found an estimated cost of 12 for VF 8 For instruction: %valB = load i32, ptr %inB, align 4
54
- ; AVX2-FASTGATHER: LV: Found an estimated cost of 24 for VF 16 For instruction: %valB = load i32, ptr %inB, align 4
55
- ; AVX2-FASTGATHER: LV: Found an estimated cost of 48 for VF 32 For instruction: %valB = load i32, ptr %inB, align 4
51
+ ; AVX2-FASTGATHER: Cost of 4 for VF 2: {{.*}}ir< %valB> = load
52
+ ; AVX2-FASTGATHER: Cost of 6 for VF 4: {{.*}}ir< %valB> = load
53
+ ; AVX2-FASTGATHER: Cost of 12 for VF 8: {{.*}}ir< %valB> = load
54
+ ; AVX2-FASTGATHER: Cost of 24 for VF 16: {{.*}}ir< %valB> = load
55
+ ; AVX2-FASTGATHER: Cost of 48 for VF 32: {{.*}}ir< %valB> = load
56
56
;
57
57
; AVX512-LABEL: 'test'
58
58
; AVX512: LV: Found an estimated cost of 1 for VF 1 For instruction: %valB = load i32, ptr %inB, align 4
59
- ; AVX512: LV: Found an estimated cost of 6 for VF 2 For instruction: %valB = load i32, ptr %inB, align 4
60
- ; AVX512: LV: Found an estimated cost of 13 for VF 4 For instruction: %valB = load i32, ptr %inB, align 4
61
- ; AVX512: LV: Found an estimated cost of 10 for VF 8 For instruction: %valB = load i32, ptr %inB, align 4
62
- ; AVX512: LV: Found an estimated cost of 18 for VF 16 For instruction: %valB = load i32, ptr %inB, align 4
63
- ; AVX512: LV: Found an estimated cost of 36 for VF 32 For instruction: %valB = load i32, ptr %inB, align 4
64
- ; AVX512: LV: Found an estimated cost of 72 for VF 64 For instruction: %valB = load i32, ptr %inB, align 4
59
+ ; AVX512: Cost of 6 for VF 2: {{.*}}ir< %valB> = load
60
+ ; AVX512: Cost of 13 for VF 4: {{.*}}ir< %valB> = load
61
+ ; AVX512: Cost of 10 for VF 8: {{.*}}ir< %valB> = load
62
+ ; AVX512: Cost of 18 for VF 16: {{.*}}ir< %valB> = load
63
+ ; AVX512: Cost of 36 for VF 32: {{.*}}ir< %valB> = load
64
+ ; AVX512: Cost of 72 for VF 64: {{.*}}ir< %valB> = load
65
65
;
66
66
entry:
67
67
br label %for.body
0 commit comments