Skip to content

Commit dd0e38e

Browse files
committed
[SLP]Add a test for missed insert_subvector pattern detection, NFC.
1 parent 8e8bff3 commit dd0e38e

File tree

1 file changed

+56
-0
lines changed

1 file changed

+56
-0
lines changed
Lines changed: 56 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,56 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 4
2+
; RUN: opt -S --passes=slp-vectorizer -mtriple=riscv64-unknown-linux -pass-remarks-output=%t -mattr=+v -slp-threshold=-10 < %s | FileCheck %s
3+
; RUN: FileCheck %s --check-prefix=YAML < %t
4+
5+
; YAML-LABEL: --- !Passed
6+
; YAML-NEXT: Pass: slp-vectorizer
7+
; YAML-NEXT: Name: StoresVectorized
8+
; YAML-NEXT: Function: test
9+
; YAML-NEXT: Args:
10+
; YAML-NEXT: - String: 'Stores SLP vectorized with cost '
11+
; YAML-NEXT: - Cost: '9'
12+
; YAML-NEXT: - String: ' and with tree size '
13+
; YAML-NEXT: - TreeSize: '7'
14+
15+
define void @test() {
16+
; CHECK-LABEL: define void @test(
17+
; CHECK-SAME: ) #[[ATTR0:[0-9]+]] {
18+
; CHECK-NEXT: entry:
19+
; CHECK-NEXT: [[TMP0:%.*]] = load float, ptr null, align 4
20+
; CHECK-NEXT: [[TMP1:%.*]] = load float, ptr null, align 4
21+
; CHECK-NEXT: [[TMP2:%.*]] = load float, ptr null, align 4
22+
; CHECK-NEXT: [[V9IDX:%.*]] = getelementptr i8, ptr null, i32 4
23+
; CHECK-NEXT: [[V14IDX:%.*]] = getelementptr i8, ptr null, i32 8
24+
; CHECK-NEXT: [[TMP3:%.*]] = insertelement <2 x float> <float poison, float 0.000000e+00>, float [[TMP1]], i32 0
25+
; CHECK-NEXT: [[TMP4:%.*]] = insertelement <2 x float> poison, float [[TMP0]], i32 0
26+
; CHECK-NEXT: [[TMP5:%.*]] = insertelement <2 x float> [[TMP4]], float [[TMP2]], i32 1
27+
; CHECK-NEXT: [[TMP6:%.*]] = fcmp ogt <2 x float> [[TMP3]], [[TMP5]]
28+
; CHECK-NEXT: [[TMP7:%.*]] = extractelement <2 x i1> [[TMP6]], i32 0
29+
; CHECK-NEXT: [[V0_0:%.*]] = select i1 [[TMP7]], float [[TMP0]], float 0.000000e+00
30+
; CHECK-NEXT: [[TMP8:%.*]] = select <2 x i1> [[TMP6]], <2 x float> [[TMP3]], <2 x float> zeroinitializer
31+
; CHECK-NEXT: [[TMP9:%.*]] = extractelement <2 x i1> [[TMP6]], i32 1
32+
; CHECK-NEXT: [[V9_0:%.*]] = select i1 [[TMP9]], float [[TMP2]], float 0.000000e+00
33+
; CHECK-NEXT: store float [[V0_0]], ptr null, align 4
34+
; CHECK-NEXT: store float [[V9_0]], ptr [[V9IDX]], align 4
35+
; CHECK-NEXT: store <2 x float> [[TMP8]], ptr [[V14IDX]], align 4
36+
; CHECK-NEXT: ret void
37+
;
38+
entry:
39+
%0 = load float, ptr null, align 4
40+
%1 = load float, ptr null, align 4
41+
%2 = load float, ptr null, align 4
42+
%cmp.i = fcmp ogt float %1, %0
43+
%v14.0 = select i1 %cmp.i, float %1, float 0.000000e+00
44+
%v0.0 = select i1 %cmp.i, float %0, float 0.000000e+00
45+
%cmp4.i = fcmp ogt float 0.000000e+00, %2
46+
%v19.0 = select i1 %cmp4.i, float 0.000000e+00, float 0.000000e+00
47+
%v9.0 = select i1 %cmp4.i, float %2, float 0.000000e+00
48+
store float %v0.0, ptr null, align 4
49+
%v9idx = getelementptr i8, ptr null, i32 4
50+
store float %v9.0, ptr %v9idx, align 4
51+
%v14idx = getelementptr i8, ptr null, i32 8
52+
store float %v14.0, ptr %v14idx, align 4
53+
%v19idx = getelementptr i8, ptr null, i32 12
54+
store float %v19.0, ptr %v19idx, align 4
55+
ret void
56+
}

0 commit comments

Comments
 (0)