From de735247c8b638efa8ce5783ac8c7c2e0b7cf3eb Mon Sep 17 00:00:00 2001
From: Simon Pilgrim
Date: Mon, 6 Jan 2020 13:44:55 +0000
Subject: [PATCH] [X86] Add extra PR43971 test case mentioned in D70267

---
 llvm/test/CodeGen/X86/extractelement-load.ll | 45 ++++++++++++++++++++
 1 file changed, 45 insertions(+)

Reviewer notes (free text in the post-"---" area; not part of the commit
message and not part of the diff):

  * The single hunk adds one function, @PR43971_1, directly after the three
    context lines (store / ret void / closing brace) of the preceding
    function. Hunk accounting: 3 context + 45 added = 48 new-side lines.

  * @PR43971_1 takes a pointer to <8 x float>, loads the whole vector with
    align 32, extracts element 1, compares it with "fcmp oeq" against 0.0,
    and returns 1.0 when the compare is true, otherwise the extracted element.

  * Three FileCheck prefixes are covered: X32-SSE2, X64-SSSE3 and X64-AVX.
    The RUN lines that define these prefixes are outside this hunk.
    The expected X64-SSSE3 / X64-AVX output reads the lane with a
    (v)movshdup from memory; the expected X32-SSE2 output does a full movaps
    load followed by shufps, and returns the value through the x87 stack
    (movss to the stack slot, then flds).

  * NOTE(review): the CHECK lines look like the output of
    utils/update_llc_test_checks.py -- confirm against the test file header
    and regenerate with that script rather than editing them by hand.

  * NOTE(review): line breaks and indentation in this patch were
    reconstructed from a whitespace-collapsed copy; verify against the
    upstream commit (or apply with --ignore-whitespace) before relying on it.

diff --git a/llvm/test/CodeGen/X86/extractelement-load.ll b/llvm/test/CodeGen/X86/extractelement-load.ll
index 76c563e728e7..f499568ca691 100644
--- a/llvm/test/CodeGen/X86/extractelement-load.ll
+++ b/llvm/test/CodeGen/X86/extractelement-load.ll
@@ -220,3 +220,48 @@ entry:
   store float %cond, float* %a1, align 4
   ret void
 }
+
+define float @PR43971_1(<8 x float> *%a0) nounwind {
+; X32-SSE2-LABEL: PR43971_1:
+; X32-SSE2: # %bb.0: # %entry
+; X32-SSE2-NEXT: pushl %eax
+; X32-SSE2-NEXT: movl {{[0-9]+}}(%esp), %eax
+; X32-SSE2-NEXT: movaps (%eax), %xmm0
+; X32-SSE2-NEXT: shufps {{.*#+}} xmm0 = xmm0[1,1,2,3]
+; X32-SSE2-NEXT: xorps %xmm1, %xmm1
+; X32-SSE2-NEXT: cmpeqss %xmm0, %xmm1
+; X32-SSE2-NEXT: movss {{.*#+}} xmm2 = mem[0],zero,zero,zero
+; X32-SSE2-NEXT: andps %xmm1, %xmm2
+; X32-SSE2-NEXT: andnps %xmm0, %xmm1
+; X32-SSE2-NEXT: orps %xmm2, %xmm1
+; X32-SSE2-NEXT: movss %xmm1, (%esp)
+; X32-SSE2-NEXT: flds (%esp)
+; X32-SSE2-NEXT: popl %eax
+; X32-SSE2-NEXT: retl
+;
+; X64-SSSE3-LABEL: PR43971_1:
+; X64-SSSE3: # %bb.0: # %entry
+; X64-SSSE3-NEXT: movshdup {{.*#+}} xmm1 = mem[1,1,3,3]
+; X64-SSSE3-NEXT: xorps %xmm0, %xmm0
+; X64-SSSE3-NEXT: cmpeqss %xmm1, %xmm0
+; X64-SSSE3-NEXT: movss {{.*#+}} xmm2 = mem[0],zero,zero,zero
+; X64-SSSE3-NEXT: andps %xmm0, %xmm2
+; X64-SSSE3-NEXT: andnps %xmm1, %xmm0
+; X64-SSSE3-NEXT: orps %xmm2, %xmm0
+; X64-SSSE3-NEXT: retq
+;
+; X64-AVX-LABEL: PR43971_1:
+; X64-AVX: # %bb.0: # %entry
+; X64-AVX-NEXT: vmovshdup {{.*#+}} xmm0 = mem[1,1,3,3]
+; X64-AVX-NEXT: vxorps %xmm1, %xmm1, %xmm1
+; X64-AVX-NEXT: vcmpeqss %xmm1, %xmm0, %xmm1
+; X64-AVX-NEXT: vmovss {{.*#+}} xmm2 = mem[0],zero,zero,zero
+; X64-AVX-NEXT: vblendvps %xmm1, %xmm2, %xmm0, %xmm0
+; X64-AVX-NEXT: retq
+entry:
+  %0 = load <8 x float>, <8 x float>* %a0, align 32
+  %vecext = extractelement <8 x float> %0, i32 1
+  %cmp = fcmp oeq float %vecext, 0.000000e+00
+  %cond = select i1 %cmp, float 1.000000e+00, float %vecext
+  ret float %cond
+}