; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=x86_64-unknown-unknown -mattr=+avx512bw -mattr=+avx512dq -mattr=+avx512vl| FileCheck %s

; Each function below shuffles one or two i1 vectors into an i1 vector of a
; different width and pins the assembly llc is expected to emit for it.
;
; NOTE(review): every shufflevector in this copy of the file ends right after
; the mask type (for example "<8 x i32>") with no mask constant following it.
; The masks look like they were stripped by some text processing step; they
; must be restored from the upstream test before this file will parse.

; <2 x i1> %a shuffled with undef into <8 x i1>; expected output uses
; kshiftlb $2 on the mask register.
define <8 x i1> @test(<2 x i1> %a) {
; CHECK-LABEL: test:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vpsllq $63, %xmm0, %xmm0
; CHECK-NEXT:    vpmovq2m %xmm0, %k0
; CHECK-NEXT:    kshiftlb $2, %k0, %k0
; CHECK-NEXT:    vpmovm2w %k0, %xmm0
; CHECK-NEXT:    retq
  %res = shufflevector <2 x i1> %a, <2 x i1> undef, <8 x i32>
  ret <8 x i1> %res
}

; <2 x i1> %a shuffled with undef into <8 x i1>; expected output uses
; kshiftlb $4 on the mask register.
define <8 x i1> @test1(<2 x i1> %a) {
; CHECK-LABEL: test1:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vpsllq $63, %xmm0, %xmm0
; CHECK-NEXT:    vpmovq2m %xmm0, %k0
; CHECK-NEXT:    kshiftlb $4, %k0, %k0
; CHECK-NEXT:    vpmovm2w %k0, %xmm0
; CHECK-NEXT:    retq
  %res = shufflevector <2 x i1> %a, <2 x i1> undef, <8 x i32>
  ret <8 x i1> %res
}

; Same shape as test1, but the second shuffle operand is zeroinitializer
; instead of undef; the expected assembly is the same as for test1.
define <8 x i1> @test2(<2 x i1> %a) {
; CHECK-LABEL: test2:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vpsllq $63, %xmm0, %xmm0
; CHECK-NEXT:    vpmovq2m %xmm0, %k0
; CHECK-NEXT:    kshiftlb $4, %k0, %k0
; CHECK-NEXT:    vpmovm2w %k0, %xmm0
; CHECK-NEXT:    retq
  %res = shufflevector <2 x i1> %a, <2 x i1> zeroinitializer, <8 x i32>
  ret <8 x i1> %res
}

; <4 x i1> %a shuffled with zeroinitializer into <8 x i1>; the expected
; output contains no mask-register shift.
define <8 x i1> @test3(<4 x i1> %a) {
; CHECK-LABEL: test3:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vpslld $31, %xmm0, %xmm0
; CHECK-NEXT:    vpmovd2m %xmm0, %k0
; CHECK-NEXT:    vpmovm2w %k0, %xmm0
; CHECK-NEXT:    retq
  %res = shufflevector <4 x i1> %a, <4 x i1> zeroinitializer, <8 x i32>
  ret <8 x i1> %res
}

; Two <4 x i1> arguments shuffled into <8 x i1>; expected output shifts the
; mask derived from %b (xmm1) by 4 and ORs it with the mask derived from %a.
define <8 x i1> @test4(<4 x i1> %a, <4 x i1>%b) {
; CHECK-LABEL: test4:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vpslld $31, %xmm1, %xmm1
; CHECK-NEXT:    vpmovd2m %xmm1, %k0
; CHECK-NEXT:    vpslld $31, %xmm0, %xmm0
; CHECK-NEXT:    vpmovd2m %xmm0, %k1
; CHECK-NEXT:    kshiftlb $4, %k0, %k0
; CHECK-NEXT:    korb %k0, %k1, %k0
; CHECK-NEXT:    vpmovm2w %k0, %xmm0
; CHECK-NEXT:    retq
  %res = shufflevector <4 x i1> %a, <4 x i1> %b, <8 x i32>
  ret <8 x i1> %res
}

; Two <2 x i1> arguments shuffled into <4 x i1>; expected output shifts the
; mask derived from %b (xmm1) by 2 and ORs it with the mask derived from %a.
define <4 x i1> @test5(<2 x i1> %a, <2 x i1>%b) {
; CHECK-LABEL: test5:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vpsllq $63, %xmm1, %xmm1
; CHECK-NEXT:    vpmovq2m %xmm1, %k0
; CHECK-NEXT:    vpsllq $63, %xmm0, %xmm0
; CHECK-NEXT:    vpmovq2m %xmm0, %k1
; CHECK-NEXT:    kshiftlb $2, %k0, %k0
; CHECK-NEXT:    korw %k0, %k1, %k0
; CHECK-NEXT:    vpmovm2d %k0, %xmm0
; CHECK-NEXT:    retq
  %res = shufflevector <2 x i1> %a, <2 x i1> %b, <4 x i32>
  ret <4 x i1> %res
}

; Two <2 x i1> arguments shuffled into <16 x i1>; same mask-register sequence
; as test5, with the result expanded to bytes (vpmovm2b) in xmm0.
define <16 x i1> @test6(<2 x i1> %a, <2 x i1>%b) {
; CHECK-LABEL: test6:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vpsllq $63, %xmm1, %xmm1
; CHECK-NEXT:    vpmovq2m %xmm1, %k0
; CHECK-NEXT:    vpsllq $63, %xmm0, %xmm0
; CHECK-NEXT:    vpmovq2m %xmm0, %k1
; CHECK-NEXT:    kshiftlb $2, %k0, %k0
; CHECK-NEXT:    korw %k0, %k1, %k0
; CHECK-NEXT:    vpmovm2b %k0, %xmm0
; CHECK-NEXT:    retq
  %res = shufflevector <2 x i1> %a, <2 x i1> %b, <16 x i32>
  ret <16 x i1> %res
}

; Two <4 x i1> arguments shuffled into <32 x i1>; same mask-register sequence
; as test4, with the result expanded to bytes (vpmovm2b) in ymm0.
define <32 x i1> @test7(<4 x i1> %a, <4 x i1>%b) {
; CHECK-LABEL: test7:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vpslld $31, %xmm1, %xmm1
; CHECK-NEXT:    vpmovd2m %xmm1, %k0
; CHECK-NEXT:    vpslld $31, %xmm0, %xmm0
; CHECK-NEXT:    vpmovd2m %xmm0, %k1
; CHECK-NEXT:    kshiftlb $4, %k0, %k0
; CHECK-NEXT:    korb %k0, %k1, %k0
; CHECK-NEXT:    vpmovm2b %k0, %ymm0
; CHECK-NEXT:    retq
  %res = shufflevector <4 x i1> %a, <4 x i1> %b, <32 x i32>
  ret <32 x i1> %res
}

; Two <8 x i1> arguments shuffled into <64 x i1>; expected output combines the
; two masks with kunpckdq and expands the result to bytes in zmm0.
define <64 x i1> @test8(<8 x i1> %a, <8 x i1>%b) {
; CHECK-LABEL: test8:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vpsllw $15, %xmm1, %xmm1
; CHECK-NEXT:    vpmovw2m %xmm1, %k0
; CHECK-NEXT:    vpsllw $15, %xmm0, %xmm0
; CHECK-NEXT:    vpmovw2m %xmm0, %k1
; CHECK-NEXT:    kunpckdq %k1, %k0, %k0
; CHECK-NEXT:    vpmovm2b %k0, %zmm0
; CHECK-NEXT:    retq
  %res = shufflevector <8 x i1> %a, <8 x i1> %b, <64 x i32>
  ret <64 x i1> %res
}

; Narrowing shuffle: two <8 x i1> arguments down to <4 x i1>. The expected
; assembly only reads xmm0 and shifts the mask right by 4 (kshiftrb $4).
define <4 x i1> @test9(<8 x i1> %a, <8 x i1> %b) {
; CHECK-LABEL: test9:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vpsllw $15, %xmm0, %xmm0
; CHECK-NEXT:    vpmovw2m %xmm0, %k0
; CHECK-NEXT:    kshiftrb $4, %k0, %k0
; CHECK-NEXT:    vpmovm2d %k0, %xmm0
; CHECK-NEXT:    retq
  %res = shufflevector <8 x i1> %a, <8 x i1> %b, <4 x i32>
  ret <4 x i1> %res
}

; Narrowing shuffle: two <4 x i1> arguments down to <2 x i1>. The expected
; assembly only reads xmm0 and shifts the mask right by 2 (kshiftrb $2).
define <2 x i1> @test10(<4 x i1> %a, <4 x i1> %b) {
; CHECK-LABEL: test10:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vpslld $31, %xmm0, %xmm0
; CHECK-NEXT:    vpmovd2m %xmm0, %k0
; CHECK-NEXT:    kshiftrb $2, %k0, %k0
; CHECK-NEXT:    vpmovm2q %k0, %xmm0
; CHECK-NEXT:    retq
  %res = shufflevector <4 x i1> %a, <4 x i1> %b, <2 x i32>
  ret <2 x i1> %res
}

; <4 x i1> %a shuffled with undef into <8 x i1>; expected output uses
; kshiftlb $4. The %b parameter is declared but not used by the body.
define <8 x i1> @test11(<4 x i1> %a, <4 x i1>%b) {
; CHECK-LABEL: test11:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vpslld $31, %xmm0, %xmm0
; CHECK-NEXT:    vpmovd2m %xmm0, %k0
; CHECK-NEXT:    kshiftlb $4, %k0, %k0
; CHECK-NEXT:    vpmovm2w %k0, %xmm0
; CHECK-NEXT:    retq
  %res = shufflevector <4 x i1> %a, <4 x i1> undef, <8 x i32>
  ret <8 x i1> %res
}

; <2 x i1> %a shuffled with zeroinitializer into <16 x i1>; expected output
; uses the 16-bit mask shift kshiftlw $10.
define <16 x i1> @test12(<2 x i1> %a) {
; CHECK-LABEL: test12:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vpsllq $63, %xmm0, %xmm0
; CHECK-NEXT:    vpmovq2m %xmm0, %k0
; CHECK-NEXT:    kshiftlw $10, %k0, %k0
; CHECK-NEXT:    vpmovm2b %k0, %xmm0
; CHECK-NEXT:    retq
  %res = shufflevector <2 x i1> %a, <2 x i1> zeroinitializer, <16 x i32>
  ret <16 x i1> %res
}

; <2 x i1> %a shuffled with zeroinitializer into <32 x i1>; expected output
; uses the 32-bit mask shift kshiftld $10.
define <32 x i1> @test13(<2 x i1> %a) {
; CHECK-LABEL: test13:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vpsllq $63, %xmm0, %xmm0
; CHECK-NEXT:    vpmovq2m %xmm0, %k0
; CHECK-NEXT:    kshiftld $10, %k0, %k0
; CHECK-NEXT:    vpmovm2b %k0, %ymm0
; CHECK-NEXT:    retq
  %res = shufflevector <2 x i1> %a, <2 x i1> zeroinitializer, <32 x i32>
  ret <32 x i1> %res
}

; <2 x i1> %a shuffled with zeroinitializer into <64 x i1>; expected output
; uses the 64-bit mask shift kshiftlq $10.
define <64 x i1> @test14(<2 x i1> %a) {
; CHECK-LABEL: test14:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vpsllq $63, %xmm0, %xmm0
; CHECK-NEXT:    vpmovq2m %xmm0, %k0
; CHECK-NEXT:    kshiftlq $10, %k0, %k0
; CHECK-NEXT:    vpmovm2b %k0, %zmm0
; CHECK-NEXT:    retq
  %res = shufflevector <2 x i1> %a, <2 x i1> zeroinitializer, <64 x i32>
  ret <64 x i1> %res
}

; Make sure we can recognize this shuffle as an insertion into a zero vector.
; Compares %x against zero element-wise, shuffles the <2 x i1> compare result
; into an <8 x i1> vector and bitcasts that vector to i8. The expected
; assembly is a single vptestnmq into a mask register followed by a kmovd to
; eax, with no mask shift or OR.
;
; NOTE(review): in this copy of the file the shufflevector has lost both its
; second-operand constant (nothing follows "<2 x i1>" before the comma) and
; its shuffle-mask constant (nothing follows "<8 x i32>"). Restore both from
; the upstream test before running; the IR will not parse as written.
define i8 @test15(<2 x i64> %x) {
; CHECK-LABEL: test15:
; CHECK:       # %bb.0:
; CHECK-NEXT:    vptestnmq %xmm0, %xmm0, %k0
; CHECK-NEXT:    kmovd %k0, %eax
; CHECK-NEXT:    # kill: def $al killed $al killed $eax
; CHECK-NEXT:    retq
  %a = icmp eq <2 x i64> %x, zeroinitializer
  %b = shufflevector <2 x i1> %a, <2 x i1> , <8 x i32>
  %c = bitcast <8 x i1> %b to i8
  ret i8 %c
}