Skip to content

Commit 4dda564

Browse files
committed
[RISCV][SLP] Add test coverage for 2^N-1 vector sizes
Mostly copied from the AArch64 coverage for same, but also added a couple tests for reductions which aren't currently supported.
1 parent 986576f commit 4dda564

File tree

2 files changed

+644
-0
lines changed

2 files changed

+644
-0
lines changed
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,130 @@
1+
; NOTE: Assertions have been autogenerated by utils/update_test_checks.py UTC_ARGS: --version 4
2+
; RUN: opt -passes=slp-vectorizer -slp-vectorize-non-power-of-2 -mtriple=riscv64 -mattr=+v -S %s | FileCheck --check-prefixes=NON-POW2 %s
3+
; RUN: opt -passes=slp-vectorizer -slp-vectorize-non-power-of-2=false -mtriple=riscv64 -mattr=+v -S %s | FileCheck --check-prefixes=POW2-ONLY %s
4+
5+
define void @v15_load_i8_mul_by_constant_store(ptr %src, ptr noalias %dst) {
6+
; NON-POW2-LABEL: define void @v15_load_i8_mul_by_constant_store(
7+
; NON-POW2-SAME: ptr [[SRC:%.*]], ptr noalias [[DST:%.*]]) #[[ATTR0:[0-9]+]] {
8+
; NON-POW2-NEXT: entry:
9+
; NON-POW2-NEXT: [[GEP_SRC_0:%.*]] = getelementptr inbounds i8, ptr [[SRC]], i8 0
10+
; NON-POW2-NEXT: [[TMP0:%.*]] = load <15 x i8>, ptr [[GEP_SRC_0]], align 4
11+
; NON-POW2-NEXT: [[TMP1:%.*]] = mul nsw <15 x i8> [[TMP0]], <i8 10, i8 10, i8 10, i8 10, i8 10, i8 10, i8 10, i8 10, i8 10, i8 10, i8 10, i8 10, i8 10, i8 10, i8 10>
12+
; NON-POW2-NEXT: store <15 x i8> [[TMP1]], ptr [[DST]], align 1
13+
; NON-POW2-NEXT: ret void
14+
;
15+
; POW2-ONLY-LABEL: define void @v15_load_i8_mul_by_constant_store(
16+
; POW2-ONLY-SAME: ptr [[SRC:%.*]], ptr noalias [[DST:%.*]]) #[[ATTR0:[0-9]+]] {
17+
; POW2-ONLY-NEXT: entry:
18+
; POW2-ONLY-NEXT: [[GEP_SRC_0:%.*]] = getelementptr inbounds i8, ptr [[SRC]], i8 0
19+
; POW2-ONLY-NEXT: [[TMP0:%.*]] = load <8 x i8>, ptr [[GEP_SRC_0]], align 4
20+
; POW2-ONLY-NEXT: [[TMP1:%.*]] = mul nsw <8 x i8> [[TMP0]], <i8 10, i8 10, i8 10, i8 10, i8 10, i8 10, i8 10, i8 10>
21+
; POW2-ONLY-NEXT: store <8 x i8> [[TMP1]], ptr [[DST]], align 1
22+
; POW2-ONLY-NEXT: [[GEP_SRC_8:%.*]] = getelementptr inbounds i8, ptr [[SRC]], i8 8
23+
; POW2-ONLY-NEXT: [[DST_8:%.*]] = getelementptr i8, ptr [[DST]], i8 8
24+
; POW2-ONLY-NEXT: [[TMP2:%.*]] = load <4 x i8>, ptr [[GEP_SRC_8]], align 4
25+
; POW2-ONLY-NEXT: [[TMP3:%.*]] = mul nsw <4 x i8> [[TMP2]], <i8 10, i8 10, i8 10, i8 10>
26+
; POW2-ONLY-NEXT: store <4 x i8> [[TMP3]], ptr [[DST_8]], align 1
27+
; POW2-ONLY-NEXT: [[GEP_SRC_12:%.*]] = getelementptr inbounds i8, ptr [[SRC]], i8 12
28+
; POW2-ONLY-NEXT: [[DST_12:%.*]] = getelementptr i8, ptr [[DST]], i8 12
29+
; POW2-ONLY-NEXT: [[TMP4:%.*]] = load <2 x i8>, ptr [[GEP_SRC_12]], align 4
30+
; POW2-ONLY-NEXT: [[TMP5:%.*]] = mul nsw <2 x i8> [[TMP4]], <i8 10, i8 10>
31+
; POW2-ONLY-NEXT: store <2 x i8> [[TMP5]], ptr [[DST_12]], align 1
32+
; POW2-ONLY-NEXT: [[GEP_SRC_14:%.*]] = getelementptr inbounds i8, ptr [[SRC]], i8 14
33+
; POW2-ONLY-NEXT: [[L_SRC_14:%.*]] = load i8, ptr [[GEP_SRC_14]], align 4
34+
; POW2-ONLY-NEXT: [[MUL_14:%.*]] = mul nsw i8 [[L_SRC_14]], 10
35+
; POW2-ONLY-NEXT: [[DST_14:%.*]] = getelementptr i8, ptr [[DST]], i8 14
36+
; POW2-ONLY-NEXT: store i8 [[MUL_14]], ptr [[DST_14]], align 1
37+
; POW2-ONLY-NEXT: ret void
38+
;
39+
entry:
40+
%gep.src.0 = getelementptr inbounds i8, ptr %src, i8 0
41+
%l.src.0 = load i8, ptr %gep.src.0, align 4
42+
%mul.0 = mul nsw i8 %l.src.0, 10
43+
store i8 %mul.0, ptr %dst
44+
45+
%gep.src.1 = getelementptr inbounds i8, ptr %src, i8 1
46+
%l.src.1 = load i8, ptr %gep.src.1, align 4
47+
%mul.1 = mul nsw i8 %l.src.1, 10
48+
%dst.1 = getelementptr i8, ptr %dst, i8 1
49+
store i8 %mul.1, ptr %dst.1
50+
51+
%gep.src.2 = getelementptr inbounds i8, ptr %src, i8 2
52+
%l.src.2 = load i8, ptr %gep.src.2, align 4
53+
%mul.2 = mul nsw i8 %l.src.2, 10
54+
%dst.2 = getelementptr i8, ptr %dst, i8 2
55+
store i8 %mul.2, ptr %dst.2
56+
57+
%gep.src.3 = getelementptr inbounds i8, ptr %src, i8 3
58+
%l.src.3 = load i8, ptr %gep.src.3, align 4
59+
%mul.3 = mul nsw i8 %l.src.3, 10
60+
%dst.3 = getelementptr i8, ptr %dst, i8 3
61+
store i8 %mul.3, ptr %dst.3
62+
63+
%gep.src.4 = getelementptr inbounds i8, ptr %src, i8 4
64+
%l.src.4 = load i8, ptr %gep.src.4, align 4
65+
%mul.4 = mul nsw i8 %l.src.4, 10
66+
%dst.4 = getelementptr i8, ptr %dst, i8 4
67+
store i8 %mul.4, ptr %dst.4
68+
69+
%gep.src.5 = getelementptr inbounds i8, ptr %src, i8 5
70+
%l.src.5 = load i8, ptr %gep.src.5, align 4
71+
%mul.5 = mul nsw i8 %l.src.5, 10
72+
%dst.5 = getelementptr i8, ptr %dst, i8 5
73+
store i8 %mul.5, ptr %dst.5
74+
75+
%gep.src.6 = getelementptr inbounds i8, ptr %src, i8 6
76+
%l.src.6 = load i8, ptr %gep.src.6, align 4
77+
%mul.6 = mul nsw i8 %l.src.6, 10
78+
%dst.6 = getelementptr i8, ptr %dst, i8 6
79+
store i8 %mul.6, ptr %dst.6
80+
81+
%gep.src.7 = getelementptr inbounds i8, ptr %src, i8 7
82+
%l.src.7 = load i8, ptr %gep.src.7, align 4
83+
%mul.7 = mul nsw i8 %l.src.7, 10
84+
%dst.7 = getelementptr i8, ptr %dst, i8 7
85+
store i8 %mul.7, ptr %dst.7
86+
87+
%gep.src.8 = getelementptr inbounds i8, ptr %src, i8 8
88+
%l.src.8 = load i8, ptr %gep.src.8, align 4
89+
%mul.8 = mul nsw i8 %l.src.8, 10
90+
%dst.8 = getelementptr i8, ptr %dst, i8 8
91+
store i8 %mul.8, ptr %dst.8
92+
93+
%gep.src.9 = getelementptr inbounds i8, ptr %src, i8 9
94+
%l.src.9 = load i8, ptr %gep.src.9, align 4
95+
%mul.9 = mul nsw i8 %l.src.9, 10
96+
%dst.9 = getelementptr i8, ptr %dst, i8 9
97+
store i8 %mul.9, ptr %dst.9
98+
99+
%gep.src.10 = getelementptr inbounds i8, ptr %src, i8 10
100+
%l.src.10 = load i8, ptr %gep.src.10, align 4
101+
%mul.10 = mul nsw i8 %l.src.10, 10
102+
%dst.10 = getelementptr i8, ptr %dst, i8 10
103+
store i8 %mul.10, ptr %dst.10
104+
105+
%gep.src.11 = getelementptr inbounds i8, ptr %src, i8 11
106+
%l.src.11 = load i8, ptr %gep.src.11, align 4
107+
%mul.11 = mul nsw i8 %l.src.11, 10
108+
%dst.11 = getelementptr i8, ptr %dst, i8 11
109+
store i8 %mul.11, ptr %dst.11
110+
111+
%gep.src.12 = getelementptr inbounds i8, ptr %src, i8 12
112+
%l.src.12 = load i8, ptr %gep.src.12, align 4
113+
%mul.12 = mul nsw i8 %l.src.12, 10
114+
%dst.12 = getelementptr i8, ptr %dst, i8 12
115+
store i8 %mul.12, ptr %dst.12
116+
117+
%gep.src.13 = getelementptr inbounds i8, ptr %src, i8 13
118+
%l.src.13 = load i8, ptr %gep.src.13, align 4
119+
%mul.13 = mul nsw i8 %l.src.13, 10
120+
%dst.13 = getelementptr i8, ptr %dst, i8 13
121+
store i8 %mul.13, ptr %dst.13
122+
123+
%gep.src.14 = getelementptr inbounds i8, ptr %src, i8 14
124+
%l.src.14 = load i8, ptr %gep.src.14, align 4
125+
%mul.14 = mul nsw i8 %l.src.14, 10
126+
%dst.14 = getelementptr i8, ptr %dst, i8 14
127+
store i8 %mul.14, ptr %dst.14
128+
129+
ret void
130+
}

0 commit comments

Comments
 (0)