Skip to content

Commit 8680dd5

Browse files
committed
[X86] getFauxShuffle - don't assume an UNDEF src element for AND/ANDNP results in an UNDEF shuffle mask index
The other src element might be zero, in which case the result element is guaranteed to be zero rather than undef. Fixes #55157
1 parent cfb4e78 commit 8680dd5

File tree

1 file changed

+10
-4
lines changed

1 file changed

+10
-4
lines changed

llvm/test/CodeGen/X86/vector-shuffle-combining.ll

Lines changed: 10 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -3333,11 +3333,17 @@ define void @PR45604(<32 x i16>* %dst, <8 x i16>* %src) {
33333333
ret void
33343334
}
33353335

3336-
; FIXME: getFauxShuffle AND/ANDN decoding wrongly assumes an undef src always gives an undef dst.
3336+
; getFauxShuffle AND/ANDN decoding wrongly assumed an undef src always gives an undef dst.
33373337
define <2 x i64> @PR55157(<16 x i8>* %0) {
3338-
; CHECK-LABEL: PR55157:
3339-
; CHECK: # %bb.0:
3340-
; CHECK-NEXT: retq
3338+
; SSE-LABEL: PR55157:
3339+
; SSE: # %bb.0:
3340+
; SSE-NEXT: xorps %xmm0, %xmm0
3341+
; SSE-NEXT: retq
3342+
;
3343+
; AVX-LABEL: PR55157:
3344+
; AVX: # %bb.0:
3345+
; AVX-NEXT: vxorps %xmm0, %xmm0, %xmm0
3346+
; AVX-NEXT: retq
33413347
%2 = load <16 x i8>, <16 x i8>* %0, align 16
33423348
%3 = icmp eq <16 x i8> %2, zeroinitializer
33433349
%4 = tail call <16 x i8> @llvm.x86.sse2.pavg.b(<16 x i8> zeroinitializer, <16 x i8> zeroinitializer)

0 commit comments

Comments
 (0)