@@ -143,12 +143,44 @@ body: |
143
143
; GCN: %var:_(<2 x s16>) = COPY $vgpr0
144
144
; GCN: %four:_(s32) = G_CONSTANT i32 4
145
145
; GCN: %four_vec:_(<2 x s16>) = G_BUILD_VECTOR_TRUNC %four(s32), %four(s32)
146
+ ; GCN: [[C:%[0-9]+]]:_(s16) = G_CONSTANT i16 -1
147
+ ; GCN: [[BUILD_VECTOR:%[0-9]+]]:_(<2 x s16>) = G_BUILD_VECTOR [[C]](s16), [[C]](s16)
148
+ ; GCN: [[ADD:%[0-9]+]]:_(<2 x s16>) = G_ADD %four_vec, [[BUILD_VECTOR]]
149
+ ; GCN: %rem:_(<2 x s16>) = G_AND %var, [[ADD]]
150
+ ; GCN: $vgpr0 = COPY %rem(<2 x s16>)
151
+ %var:_(<2 x s16>) = COPY $vgpr0
152
+ %shift_amt:_(s32) = COPY $vgpr1
153
+ %four:_(s32) = G_CONSTANT i32 4
154
+ %four_vec:_(<2 x s16>) = G_BUILD_VECTOR_TRUNC %four, %four
155
+ %rem:_(<2 x s16>) = G_UREM %var, %four_vec
156
+ $vgpr0 = COPY %rem
157
+ ...
158
+
159
+ # The G_SHL result is a known power of two, but G_BUILD_VECTOR_TRUNC truncates
160
+ # it to s16, so the final value is not known to be a power of two and the G_UREM is left alone.
161
+ ---
162
+ name : urem_v2s16_var_nonconst_build_vector_trunc
163
+ tracksRegLiveness : true
164
+ body : |
165
+ bb.0:
166
+ liveins: $vgpr0, $vgpr1
167
+
168
+ ; GCN-LABEL: name: urem_v2s16_var_nonconst_build_vector_trunc
169
+ ; GCN: liveins: $vgpr0, $vgpr1
170
+ ; GCN: %var:_(<2 x s16>) = COPY $vgpr0
171
+ ; GCN: %shift_amt:_(<2 x s16>) = COPY $vgpr1
172
+ ; GCN: %two:_(s32) = G_CONSTANT i32 2
173
+ ; GCN: %four:_(s32) = G_CONSTANT i32 4
174
+ ; GCN: %shift:_(s32) = G_SHL %two, %shift_amt(<2 x s16>)
175
+ ; GCN: %four_vec:_(<2 x s16>) = G_BUILD_VECTOR_TRUNC %four(s32), %shift(s32)
146
176
; GCN: %rem:_(<2 x s16>) = G_UREM %var, %four_vec
147
177
; GCN: $vgpr0 = COPY %rem(<2 x s16>)
148
178
%var:_(<2 x s16>) = COPY $vgpr0
149
179
%shift_amt:_(<2 x s16>) = COPY $vgpr1
180
+ %two:_(s32) = G_CONSTANT i32 2
150
181
%four:_(s32) = G_CONSTANT i32 4
151
- %four_vec:_(<2 x s16>) = G_BUILD_VECTOR_TRUNC %four, %four
182
+ %shift:_(s32) = G_SHL %two, %shift_amt
183
+ %four_vec:_(<2 x s16>) = G_BUILD_VECTOR_TRUNC %four, %shift
152
184
%rem:_(<2 x s16>) = G_UREM %var, %four_vec
153
185
$vgpr0 = COPY %rem
154
186
...
@@ -190,7 +222,10 @@ body: |
190
222
; GCN: %pow2_1:_(s32) = G_CONSTANT i32 4096
191
223
; GCN: %pow2_2:_(s32) = G_CONSTANT i32 2048
192
224
; GCN: %pow2_vec:_(<2 x s32>) = G_BUILD_VECTOR %pow2_1(s32), %pow2_2(s32)
193
- ; GCN: %rem:_(<2 x s32>) = G_UREM %var, %pow2_vec
225
+ ; GCN: [[C:%[0-9]+]]:_(s32) = G_CONSTANT i32 -1
226
+ ; GCN: [[BUILD_VECTOR:%[0-9]+]]:_(<2 x s32>) = G_BUILD_VECTOR [[C]](s32), [[C]](s32)
227
+ ; GCN: [[ADD:%[0-9]+]]:_(<2 x s32>) = G_ADD %pow2_vec, [[BUILD_VECTOR]]
228
+ ; GCN: %rem:_(<2 x s32>) = G_AND %var, [[ADD]]
194
229
; GCN: $vgpr0_vgpr1 = COPY %rem(<2 x s32>)
195
230
%var:_(<2 x s32>) = COPY $vgpr0_vgpr1
196
231
%pow2_1:_(s32) = G_CONSTANT i32 4096
0 commit comments