; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py ; RUN: llc < %s -mtriple=x86_64-apple-darwin -mattr=+avx512f | FileCheck %s --check-prefix=ALL --check-prefix=KNL ; RUN: llc < %s -mtriple=x86_64-apple-darwin -mattr=+avx512f,+avx512vl,+avx512bw,+avx512dq,+fast-variable-shuffle | FileCheck %s --check-prefixes=ALL,SKX attributes #0 = { nounwind } define <16 x i8> @trunc_16x32_to_16x8(<16 x i32> %i) #0 { ; ALL-LABEL: trunc_16x32_to_16x8: ; ALL: ## %bb.0: ; ALL-NEXT: vpmovdb %zmm0, %xmm0 ; ALL-NEXT: vzeroupper ; ALL-NEXT: retq %x = trunc <16 x i32> %i to <16 x i8> ret <16 x i8> %x } define <8 x i16> @trunc_8x64_to_8x16(<8 x i64> %i) #0 { ; ALL-LABEL: trunc_8x64_to_8x16: ; ALL: ## %bb.0: ; ALL-NEXT: vpmovqw %zmm0, %xmm0 ; ALL-NEXT: vzeroupper ; ALL-NEXT: retq %x = trunc <8 x i64> %i to <8 x i16> ret <8 x i16> %x } define <16 x i16> @trunc_v16i32_to_v16i16(<16 x i32> %x) #0 { ; ALL-LABEL: trunc_v16i32_to_v16i16: ; ALL: ## %bb.0: ; ALL-NEXT: vpmovdw %zmm0, %ymm0 ; ALL-NEXT: retq %1 = trunc <16 x i32> %x to <16 x i16> ret <16 x i16> %1 } define <8 x i8> @trunc_qb_512(<8 x i64> %i) #0 { ; ALL-LABEL: trunc_qb_512: ; ALL: ## %bb.0: ; ALL-NEXT: vpmovqb %zmm0, %xmm0 ; ALL-NEXT: vzeroupper ; ALL-NEXT: retq %x = trunc <8 x i64> %i to <8 x i8> ret <8 x i8> %x } define void @trunc_qb_512_mem(<8 x i64> %i, <8 x i8>* %res) #0 { ; ALL-LABEL: trunc_qb_512_mem: ; ALL: ## %bb.0: ; ALL-NEXT: vpmovqb %zmm0, (%rdi) ; ALL-NEXT: vzeroupper ; ALL-NEXT: retq %x = trunc <8 x i64> %i to <8 x i8> store <8 x i8> %x, <8 x i8>* %res ret void } define <4 x i8> @trunc_qb_256(<4 x i64> %i) #0 { ; KNL-LABEL: trunc_qb_256: ; KNL: ## %bb.0: ; KNL-NEXT: ## kill: def $ymm0 killed $ymm0 def $zmm0 ; KNL-NEXT: vpmovqb %zmm0, %xmm0 ; KNL-NEXT: vzeroupper ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_qb_256: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovqb %ymm0, %xmm0 ; SKX-NEXT: vzeroupper ; SKX-NEXT: retq %x = trunc <4 x i64> %i to <4 x i8> ret <4 x i8> %x } define void @trunc_qb_256_mem(<4 x i64> %i, <4 x i8>* %res) #0 { ; KNL-LABEL: trunc_qb_256_mem: ; KNL: ## %bb.0: ; KNL-NEXT: ## kill: def $ymm0 killed $ymm0 def $zmm0 ; KNL-NEXT: vpmovqb %zmm0, %xmm0 ; KNL-NEXT: vmovd %xmm0, (%rdi) ; KNL-NEXT: vzeroupper ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_qb_256_mem: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovqb %ymm0, (%rdi) ; SKX-NEXT: vzeroupper ; SKX-NEXT: retq %x = trunc <4 x i64> %i to <4 x i8> store <4 x i8> %x, <4 x i8>* %res ret void } define <2 x i8> @trunc_qb_128(<2 x i64> %i) #0 { ; KNL-LABEL: trunc_qb_128: ; KNL: ## %bb.0: ; KNL-NEXT: vpshufb {{.*#+}} xmm0 = xmm0[0,8,u,u,u,u,u,u,u,u,u,u,u,u,u,u] ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_qb_128: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovqb %xmm0, %xmm0 ; SKX-NEXT: retq %x = trunc <2 x i64> %i to <2 x i8> ret <2 x i8> %x } define void @trunc_qb_128_mem(<2 x i64> %i, <2 x i8>* %res) #0 { ; KNL-LABEL: trunc_qb_128_mem: ; KNL: ## %bb.0: ; KNL-NEXT: vpshufb {{.*#+}} xmm0 = xmm0[0,8,u,u,u,u,u,u,u,u,u,u,u,u,u,u] ; KNL-NEXT: vpextrw $0, %xmm0, (%rdi) ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_qb_128_mem: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovqb %xmm0, (%rdi) ; SKX-NEXT: retq %x = trunc <2 x i64> %i to <2 x i8> store <2 x i8> %x, <2 x i8>* %res ret void } define <8 x i16> @trunc_qw_512(<8 x i64> %i) #0 { ; ALL-LABEL: trunc_qw_512: ; ALL: ## %bb.0: ; ALL-NEXT: vpmovqw %zmm0, %xmm0 ; ALL-NEXT: vzeroupper ; ALL-NEXT: retq %x = trunc <8 x i64> %i to <8 x i16> ret <8 x i16> %x } define void @trunc_qw_512_mem(<8 x i64> %i, <8 x i16>* %res) #0 { ; ALL-LABEL: trunc_qw_512_mem: ; ALL: ## %bb.0: ; ALL-NEXT: vpmovqw %zmm0, (%rdi) ; ALL-NEXT: vzeroupper ; ALL-NEXT: retq %x = trunc <8 x i64> %i to <8 x i16> store <8 x i16> %x, <8 x i16>* %res ret void } define <4 x i16> @trunc_qw_256(<4 x i64> %i) #0 { ; KNL-LABEL: trunc_qw_256: ; KNL: ## %bb.0: ; KNL-NEXT: ## kill: def $ymm0 killed $ymm0 def $zmm0 ; KNL-NEXT: vpmovqw %zmm0, %xmm0 ; KNL-NEXT: vzeroupper ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_qw_256: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovqw %ymm0, %xmm0 ; SKX-NEXT: vzeroupper ; SKX-NEXT: retq %x = trunc <4 x i64> %i to <4 x i16> ret <4 x i16> %x } define void @trunc_qw_256_mem(<4 x i64> %i, <4 x i16>* %res) #0 { ; KNL-LABEL: trunc_qw_256_mem: ; KNL: ## %bb.0: ; KNL-NEXT: ## kill: def $ymm0 killed $ymm0 def $zmm0 ; KNL-NEXT: vpmovqw %zmm0, %xmm0 ; KNL-NEXT: vmovq %xmm0, (%rdi) ; KNL-NEXT: vzeroupper ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_qw_256_mem: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovqw %ymm0, (%rdi) ; SKX-NEXT: vzeroupper ; SKX-NEXT: retq %x = trunc <4 x i64> %i to <4 x i16> store <4 x i16> %x, <4 x i16>* %res ret void } define <2 x i16> @trunc_qw_128(<2 x i64> %i) #0 { ; KNL-LABEL: trunc_qw_128: ; KNL: ## %bb.0: ; KNL-NEXT: vpshufd {{.*#+}} xmm0 = xmm0[0,2,2,3] ; KNL-NEXT: vpshuflw {{.*#+}} xmm0 = xmm0[0,2,2,3,4,5,6,7] ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_qw_128: ; SKX: ## %bb.0: ; SKX-NEXT: vpshufb {{.*#+}} xmm0 = xmm0[0,1,8,9,8,9,10,11,8,9,10,11,12,13,14,15] ; SKX-NEXT: retq %x = trunc <2 x i64> %i to <2 x i16> ret <2 x i16> %x } define void @trunc_qw_128_mem(<2 x i64> %i, <2 x i16>* %res) #0 { ; KNL-LABEL: trunc_qw_128_mem: ; KNL: ## %bb.0: ; KNL-NEXT: vpshufd {{.*#+}} xmm0 = xmm0[0,2,2,3] ; KNL-NEXT: vpshuflw {{.*#+}} xmm0 = xmm0[0,2,2,3,4,5,6,7] ; KNL-NEXT: vmovd %xmm0, (%rdi) ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_qw_128_mem: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovqw %xmm0, (%rdi) ; SKX-NEXT: retq %x = trunc <2 x i64> %i to <2 x i16> store <2 x i16> %x, <2 x i16>* %res ret void } define <8 x i32> @trunc_qd_512(<8 x i64> %i) #0 { ; ALL-LABEL: trunc_qd_512: ; ALL: ## %bb.0: ; ALL-NEXT: vpmovqd %zmm0, %ymm0 ; ALL-NEXT: retq %x = trunc <8 x i64> %i to <8 x i32> ret <8 x i32> %x } define void @trunc_qd_512_mem(<8 x i64> %i, <8 x i32>* %res) #0 { ; ALL-LABEL: trunc_qd_512_mem: ; ALL: ## %bb.0: ; ALL-NEXT: vpmovqd %zmm0, (%rdi) ; ALL-NEXT: vzeroupper ; ALL-NEXT: retq %x = trunc <8 x i64> %i to <8 x i32> store <8 x i32> %x, <8 x i32>* %res ret void } define <4 x i32> @trunc_qd_256(<4 x i64> %i) #0 { ; KNL-LABEL: trunc_qd_256: ; KNL: ## %bb.0: ; KNL-NEXT: ## kill: def $ymm0 killed $ymm0 def $zmm0 ; KNL-NEXT: vpmovqd %zmm0, %ymm0 ; KNL-NEXT: ## kill: def $xmm0 killed $xmm0 killed $ymm0 ; KNL-NEXT: vzeroupper ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_qd_256: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovqd %ymm0, %xmm0 ; SKX-NEXT: vzeroupper ; SKX-NEXT: retq %x = trunc <4 x i64> %i to <4 x i32> ret <4 x i32> %x } define void @trunc_qd_256_mem(<4 x i64> %i, <4 x i32>* %res) #0 { ; KNL-LABEL: trunc_qd_256_mem: ; KNL: ## %bb.0: ; KNL-NEXT: ## kill: def $ymm0 killed $ymm0 def $zmm0 ; KNL-NEXT: vpmovqd %zmm0, %ymm0 ; KNL-NEXT: vmovdqa %xmm0, (%rdi) ; KNL-NEXT: vzeroupper ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_qd_256_mem: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovqd %ymm0, (%rdi) ; SKX-NEXT: vzeroupper ; SKX-NEXT: retq %x = trunc <4 x i64> %i to <4 x i32> store <4 x i32> %x, <4 x i32>* %res ret void } define <2 x i32> @trunc_qd_128(<2 x i64> %i) #0 { ; ALL-LABEL: trunc_qd_128: ; ALL: ## %bb.0: ; ALL-NEXT: vpermilps {{.*#+}} xmm0 = xmm0[0,2,2,3] ; ALL-NEXT: retq %x = trunc <2 x i64> %i to <2 x i32> ret <2 x i32> %x } define void @trunc_qd_128_mem(<2 x i64> %i, <2 x i32>* %res) #0 { ; KNL-LABEL: trunc_qd_128_mem: ; KNL: ## %bb.0: ; KNL-NEXT: vpermilps {{.*#+}} xmm0 = xmm0[0,2,2,3] ; KNL-NEXT: vmovlps %xmm0, (%rdi) ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_qd_128_mem: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovqd %xmm0, (%rdi) ; SKX-NEXT: retq %x = trunc <2 x i64> %i to <2 x i32> store <2 x i32> %x, <2 x i32>* %res ret void } define <16 x i8> @trunc_db_512(<16 x i32> %i) #0 { ; ALL-LABEL: trunc_db_512: ; ALL: ## %bb.0: ; ALL-NEXT: vpmovdb %zmm0, %xmm0 ; ALL-NEXT: vzeroupper ; ALL-NEXT: retq %x = trunc <16 x i32> %i to <16 x i8> ret <16 x i8> %x } define void @trunc_db_512_mem(<16 x i32> %i, <16 x i8>* %res) #0 { ; ALL-LABEL: trunc_db_512_mem: ; ALL: ## %bb.0: ; ALL-NEXT: vpmovdb %zmm0, (%rdi) ; ALL-NEXT: vzeroupper ; ALL-NEXT: retq %x = trunc <16 x i32> %i to <16 x i8> store <16 x i8> %x, <16 x i8>* %res ret void } define <8 x i8> @trunc_db_256(<8 x i32> %i) #0 { ; KNL-LABEL: trunc_db_256: ; KNL: ## %bb.0: ; KNL-NEXT: ## kill: def $ymm0 killed $ymm0 def $zmm0 ; KNL-NEXT: vpmovdb %zmm0, %xmm0 ; KNL-NEXT: vzeroupper ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_db_256: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovdb %ymm0, %xmm0 ; SKX-NEXT: vzeroupper ; SKX-NEXT: retq %x = trunc <8 x i32> %i to <8 x i8> ret <8 x i8> %x } define void @trunc_db_256_mem(<8 x i32> %i, <8 x i8>* %res) #0 { ; KNL-LABEL: trunc_db_256_mem: ; KNL: ## %bb.0: ; KNL-NEXT: ## kill: def $ymm0 killed $ymm0 def $zmm0 ; KNL-NEXT: vpmovdb %zmm0, %xmm0 ; KNL-NEXT: vmovq %xmm0, (%rdi) ; KNL-NEXT: vzeroupper ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_db_256_mem: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovdb %ymm0, (%rdi) ; SKX-NEXT: vzeroupper ; SKX-NEXT: retq %x = trunc <8 x i32> %i to <8 x i8> store <8 x i8> %x, <8 x i8>* %res ret void } define <4 x i8> @trunc_db_128(<4 x i32> %i) #0 { ; KNL-LABEL: trunc_db_128: ; KNL: ## %bb.0: ; KNL-NEXT: vpshufb {{.*#+}} xmm0 = xmm0[0,4,8,12,u,u,u,u,u,u,u,u,u,u,u,u] ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_db_128: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovdb %xmm0, %xmm0 ; SKX-NEXT: retq %x = trunc <4 x i32> %i to <4 x i8> ret <4 x i8> %x } define void @trunc_db_128_mem(<4 x i32> %i, <4 x i8>* %res) #0 { ; KNL-LABEL: trunc_db_128_mem: ; KNL: ## %bb.0: ; KNL-NEXT: vpshufb {{.*#+}} xmm0 = xmm0[0,4,8,12,u,u,u,u,u,u,u,u,u,u,u,u] ; KNL-NEXT: vmovd %xmm0, (%rdi) ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_db_128_mem: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovdb %xmm0, (%rdi) ; SKX-NEXT: retq %x = trunc <4 x i32> %i to <4 x i8> store <4 x i8> %x, <4 x i8>* %res ret void } define <16 x i16> @trunc_dw_512(<16 x i32> %i) #0 { ; ALL-LABEL: trunc_dw_512: ; ALL: ## %bb.0: ; ALL-NEXT: vpmovdw %zmm0, %ymm0 ; ALL-NEXT: retq %x = trunc <16 x i32> %i to <16 x i16> ret <16 x i16> %x } define void @trunc_dw_512_mem(<16 x i32> %i, <16 x i16>* %res) #0 { ; ALL-LABEL: trunc_dw_512_mem: ; ALL: ## %bb.0: ; ALL-NEXT: vpmovdw %zmm0, (%rdi) ; ALL-NEXT: vzeroupper ; ALL-NEXT: retq %x = trunc <16 x i32> %i to <16 x i16> store <16 x i16> %x, <16 x i16>* %res ret void } define <8 x i16> @trunc_dw_256(<8 x i32> %i) #0 { ; KNL-LABEL: trunc_dw_256: ; KNL: ## %bb.0: ; KNL-NEXT: ## kill: def $ymm0 killed $ymm0 def $zmm0 ; KNL-NEXT: vpmovdw %zmm0, %ymm0 ; KNL-NEXT: ## kill: def $xmm0 killed $xmm0 killed $ymm0 ; KNL-NEXT: vzeroupper ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_dw_256: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovdw %ymm0, %xmm0 ; SKX-NEXT: vzeroupper ; SKX-NEXT: retq %x = trunc <8 x i32> %i to <8 x i16> ret <8 x i16> %x } define void @trunc_dw_256_mem(<8 x i32> %i, <8 x i16>* %res) #0 { ; KNL-LABEL: trunc_dw_256_mem: ; KNL: ## %bb.0: ; KNL-NEXT: ## kill: def $ymm0 killed $ymm0 def $zmm0 ; KNL-NEXT: vpmovdw %zmm0, %ymm0 ; KNL-NEXT: vmovdqa %xmm0, (%rdi) ; KNL-NEXT: vzeroupper ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_dw_256_mem: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovdw %ymm0, (%rdi) ; SKX-NEXT: vzeroupper ; SKX-NEXT: retq %x = trunc <8 x i32> %i to <8 x i16> store <8 x i16> %x, <8 x i16>* %res ret void } define void @trunc_dw_128_mem(<4 x i32> %i, <4 x i16>* %res) #0 { ; KNL-LABEL: trunc_dw_128_mem: ; KNL: ## %bb.0: ; KNL-NEXT: vpshufb {{.*#+}} xmm0 = xmm0[0,1,4,5,8,9,12,13,u,u,u,u,u,u,u,u] ; KNL-NEXT: vmovq %xmm0, (%rdi) ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_dw_128_mem: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovdw %xmm0, (%rdi) ; SKX-NEXT: retq %x = trunc <4 x i32> %i to <4 x i16> store <4 x i16> %x, <4 x i16>* %res ret void } define <32 x i8> @trunc_wb_512(<32 x i16> %i) #0 { ; KNL-LABEL: trunc_wb_512: ; KNL: ## %bb.0: ; KNL-NEXT: vpmovzxwd {{.*#+}} zmm1 = ymm0[0],zero,ymm0[1],zero,ymm0[2],zero,ymm0[3],zero,ymm0[4],zero,ymm0[5],zero,ymm0[6],zero,ymm0[7],zero,ymm0[8],zero,ymm0[9],zero,ymm0[10],zero,ymm0[11],zero,ymm0[12],zero,ymm0[13],zero,ymm0[14],zero,ymm0[15],zero ; KNL-NEXT: vpmovdb %zmm1, %xmm1 ; KNL-NEXT: vextracti64x4 $1, %zmm0, %ymm0 ; KNL-NEXT: vpmovzxwd {{.*#+}} zmm0 = ymm0[0],zero,ymm0[1],zero,ymm0[2],zero,ymm0[3],zero,ymm0[4],zero,ymm0[5],zero,ymm0[6],zero,ymm0[7],zero,ymm0[8],zero,ymm0[9],zero,ymm0[10],zero,ymm0[11],zero,ymm0[12],zero,ymm0[13],zero,ymm0[14],zero,ymm0[15],zero ; KNL-NEXT: vpmovdb %zmm0, %xmm0 ; KNL-NEXT: vinserti128 $1, %xmm0, %ymm1, %ymm0 ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_wb_512: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovwb %zmm0, %ymm0 ; SKX-NEXT: retq %x = trunc <32 x i16> %i to <32 x i8> ret <32 x i8> %x } define void @trunc_wb_512_mem(<32 x i16> %i, <32 x i8>* %res) #0 { ; KNL-LABEL: trunc_wb_512_mem: ; KNL: ## %bb.0: ; KNL-NEXT: vextracti64x4 $1, %zmm0, %ymm1 ; KNL-NEXT: vpmovzxwd {{.*#+}} zmm1 = ymm1[0],zero,ymm1[1],zero,ymm1[2],zero,ymm1[3],zero,ymm1[4],zero,ymm1[5],zero,ymm1[6],zero,ymm1[7],zero,ymm1[8],zero,ymm1[9],zero,ymm1[10],zero,ymm1[11],zero,ymm1[12],zero,ymm1[13],zero,ymm1[14],zero,ymm1[15],zero ; KNL-NEXT: vpmovdb %zmm1, 16(%rdi) ; KNL-NEXT: vpmovzxwd {{.*#+}} zmm0 = ymm0[0],zero,ymm0[1],zero,ymm0[2],zero,ymm0[3],zero,ymm0[4],zero,ymm0[5],zero,ymm0[6],zero,ymm0[7],zero,ymm0[8],zero,ymm0[9],zero,ymm0[10],zero,ymm0[11],zero,ymm0[12],zero,ymm0[13],zero,ymm0[14],zero,ymm0[15],zero ; KNL-NEXT: vpmovdb %zmm0, (%rdi) ; KNL-NEXT: vzeroupper ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_wb_512_mem: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovwb %zmm0, (%rdi) ; SKX-NEXT: vzeroupper ; SKX-NEXT: retq %x = trunc <32 x i16> %i to <32 x i8> store <32 x i8> %x, <32 x i8>* %res ret void } define <16 x i8> @trunc_wb_256(<16 x i16> %i) #0 { ; KNL-LABEL: trunc_wb_256: ; KNL: ## %bb.0: ; KNL-NEXT: vpmovzxwd {{.*#+}} zmm0 = ymm0[0],zero,ymm0[1],zero,ymm0[2],zero,ymm0[3],zero,ymm0[4],zero,ymm0[5],zero,ymm0[6],zero,ymm0[7],zero,ymm0[8],zero,ymm0[9],zero,ymm0[10],zero,ymm0[11],zero,ymm0[12],zero,ymm0[13],zero,ymm0[14],zero,ymm0[15],zero ; KNL-NEXT: vpmovdb %zmm0, %xmm0 ; KNL-NEXT: vzeroupper ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_wb_256: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovwb %ymm0, %xmm0 ; SKX-NEXT: vzeroupper ; SKX-NEXT: retq %x = trunc <16 x i16> %i to <16 x i8> ret <16 x i8> %x } define void @trunc_wb_256_mem(<16 x i16> %i, <16 x i8>* %res) #0 { ; KNL-LABEL: trunc_wb_256_mem: ; KNL: ## %bb.0: ; KNL-NEXT: vpmovzxwd {{.*#+}} zmm0 = ymm0[0],zero,ymm0[1],zero,ymm0[2],zero,ymm0[3],zero,ymm0[4],zero,ymm0[5],zero,ymm0[6],zero,ymm0[7],zero,ymm0[8],zero,ymm0[9],zero,ymm0[10],zero,ymm0[11],zero,ymm0[12],zero,ymm0[13],zero,ymm0[14],zero,ymm0[15],zero ; KNL-NEXT: vpmovdb %zmm0, (%rdi) ; KNL-NEXT: vzeroupper ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_wb_256_mem: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovwb %ymm0, (%rdi) ; SKX-NEXT: vzeroupper ; SKX-NEXT: retq %x = trunc <16 x i16> %i to <16 x i8> store <16 x i8> %x, <16 x i8>* %res ret void } define <16 x i8> @trunc_wb_256_mem_and_ret(<16 x i16> %i, <16 x i8>* %res) #0 { ; KNL-LABEL: trunc_wb_256_mem_and_ret: ; KNL: ## %bb.0: ; KNL-NEXT: vpmovzxwd {{.*#+}} zmm0 = ymm0[0],zero,ymm0[1],zero,ymm0[2],zero,ymm0[3],zero,ymm0[4],zero,ymm0[5],zero,ymm0[6],zero,ymm0[7],zero,ymm0[8],zero,ymm0[9],zero,ymm0[10],zero,ymm0[11],zero,ymm0[12],zero,ymm0[13],zero,ymm0[14],zero,ymm0[15],zero ; KNL-NEXT: vpmovdb %zmm0, %xmm0 ; KNL-NEXT: vmovdqa %xmm0, (%rdi) ; KNL-NEXT: vzeroupper ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_wb_256_mem_and_ret: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovwb %ymm0, %xmm0 ; SKX-NEXT: vmovdqa %xmm0, (%rdi) ; SKX-NEXT: vzeroupper ; SKX-NEXT: retq %x = trunc <16 x i16> %i to <16 x i8> store <16 x i8> %x, <16 x i8>* %res ret <16 x i8> %x } define <8 x i8> @trunc_wb_128(<8 x i16> %i) #0 { ; KNL-LABEL: trunc_wb_128: ; KNL: ## %bb.0: ; KNL-NEXT: vpshufb {{.*#+}} xmm0 = xmm0[0,2,4,6,8,10,12,14,u,u,u,u,u,u,u,u] ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_wb_128: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovwb %xmm0, %xmm0 ; SKX-NEXT: retq %x = trunc <8 x i16> %i to <8 x i8> ret <8 x i8> %x } define void @trunc_wb_128_mem(<8 x i16> %i, <8 x i8>* %res) #0 { ; KNL-LABEL: trunc_wb_128_mem: ; KNL: ## %bb.0: ; KNL-NEXT: vpshufb {{.*#+}} xmm0 = xmm0[0,2,4,6,8,10,12,14,u,u,u,u,u,u,u,u] ; KNL-NEXT: vmovq %xmm0, (%rdi) ; KNL-NEXT: retq ; ; SKX-LABEL: trunc_wb_128_mem: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovwb %xmm0, (%rdi) ; SKX-NEXT: retq %x = trunc <8 x i16> %i to <8 x i8> store <8 x i8> %x, <8 x i8>* %res ret void } define void @usat_trunc_wb_256_mem(<16 x i16> %i, <16 x i8>* %res) { ; KNL-LABEL: usat_trunc_wb_256_mem: ; KNL: ## %bb.0: ; KNL-NEXT: vpminuw {{.*}}(%rip), %ymm0, %ymm0 ; KNL-NEXT: vpmovzxwd {{.*#+}} zmm0 = ymm0[0],zero,ymm0[1],zero,ymm0[2],zero,ymm0[3],zero,ymm0[4],zero,ymm0[5],zero,ymm0[6],zero,ymm0[7],zero,ymm0[8],zero,ymm0[9],zero,ymm0[10],zero,ymm0[11],zero,ymm0[12],zero,ymm0[13],zero,ymm0[14],zero,ymm0[15],zero ; KNL-NEXT: vpmovdb %zmm0, (%rdi) ; KNL-NEXT: vzeroupper ; KNL-NEXT: retq ; ; SKX-LABEL: usat_trunc_wb_256_mem: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovuswb %ymm0, (%rdi) ; SKX-NEXT: vzeroupper ; SKX-NEXT: retq %x3 = icmp ult <16 x i16> %i, %x5 = select <16 x i1> %x3, <16 x i16> %i, <16 x i16> %x6 = trunc <16 x i16> %x5 to <16 x i8> store <16 x i8> %x6, <16 x i8>* %res, align 1 ret void } define <16 x i8> @usat_trunc_wb_256(<16 x i16> %i) { ; KNL-LABEL: usat_trunc_wb_256: ; KNL: ## %bb.0: ; KNL-NEXT: vpminuw {{.*}}(%rip), %ymm0, %ymm0 ; KNL-NEXT: vpmovzxwd {{.*#+}} zmm0 = ymm0[0],zero,ymm0[1],zero,ymm0[2],zero,ymm0[3],zero,ymm0[4],zero,ymm0[5],zero,ymm0[6],zero,ymm0[7],zero,ymm0[8],zero,ymm0[9],zero,ymm0[10],zero,ymm0[11],zero,ymm0[12],zero,ymm0[13],zero,ymm0[14],zero,ymm0[15],zero ; KNL-NEXT: vpmovdb %zmm0, %xmm0 ; KNL-NEXT: vzeroupper ; KNL-NEXT: retq ; ; SKX-LABEL: usat_trunc_wb_256: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovuswb %ymm0, %xmm0 ; SKX-NEXT: vzeroupper ; SKX-NEXT: retq %x3 = icmp ult <16 x i16> %i, %x5 = select <16 x i1> %x3, <16 x i16> %i, <16 x i16> %x6 = trunc <16 x i16> %x5 to <16 x i8> ret <16 x i8> %x6 } define void @usat_trunc_wb_128_mem(<8 x i16> %i, <8 x i8>* %res) { ; KNL-LABEL: usat_trunc_wb_128_mem: ; KNL: ## %bb.0: ; KNL-NEXT: vpminuw {{.*}}(%rip), %xmm0, %xmm0 ; KNL-NEXT: vpackuswb %xmm0, %xmm0, %xmm0 ; KNL-NEXT: vmovq %xmm0, (%rdi) ; KNL-NEXT: retq ; ; SKX-LABEL: usat_trunc_wb_128_mem: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovuswb %xmm0, (%rdi) ; SKX-NEXT: retq %x3 = icmp ult <8 x i16> %i, %x5 = select <8 x i1> %x3, <8 x i16> %i, <8 x i16> %x6 = trunc <8 x i16> %x5 to <8 x i8> store <8 x i8> %x6, <8 x i8>* %res, align 1 ret void } define void @usat_trunc_db_512_mem(<16 x i32> %i, <16 x i8>* %res) { ; ALL-LABEL: usat_trunc_db_512_mem: ; ALL: ## %bb.0: ; ALL-NEXT: vpmovusdb %zmm0, (%rdi) ; ALL-NEXT: vzeroupper ; ALL-NEXT: retq %x3 = icmp ult <16 x i32> %i, %x5 = select <16 x i1> %x3, <16 x i32> %i, <16 x i32> %x6 = trunc <16 x i32> %x5 to <16 x i8> store <16 x i8> %x6, <16 x i8>* %res, align 1 ret void } define void @usat_trunc_qb_512_mem(<8 x i64> %i, <8 x i8>* %res) { ; ALL-LABEL: usat_trunc_qb_512_mem: ; ALL: ## %bb.0: ; ALL-NEXT: vpmovusqb %zmm0, (%rdi) ; ALL-NEXT: vzeroupper ; ALL-NEXT: retq %x3 = icmp ult <8 x i64> %i, %x5 = select <8 x i1> %x3, <8 x i64> %i, <8 x i64> %x6 = trunc <8 x i64> %x5 to <8 x i8> store <8 x i8> %x6, <8 x i8>* %res, align 1 ret void } define void @usat_trunc_qd_512_mem(<8 x i64> %i, <8 x i32>* %res) { ; ALL-LABEL: usat_trunc_qd_512_mem: ; ALL: ## %bb.0: ; ALL-NEXT: vpmovusqd %zmm0, (%rdi) ; ALL-NEXT: vzeroupper ; ALL-NEXT: retq %x3 = icmp ult <8 x i64> %i, %x5 = select <8 x i1> %x3, <8 x i64> %i, <8 x i64> %x6 = trunc <8 x i64> %x5 to <8 x i32> store <8 x i32> %x6, <8 x i32>* %res, align 1 ret void } define void @usat_trunc_qw_512_mem(<8 x i64> %i, <8 x i16>* %res) { ; ALL-LABEL: usat_trunc_qw_512_mem: ; ALL: ## %bb.0: ; ALL-NEXT: vpmovusqw %zmm0, (%rdi) ; ALL-NEXT: vzeroupper ; ALL-NEXT: retq %x3 = icmp ult <8 x i64> %i, %x5 = select <8 x i1> %x3, <8 x i64> %i, <8 x i64> %x6 = trunc <8 x i64> %x5 to <8 x i16> store <8 x i16> %x6, <8 x i16>* %res, align 1 ret void } define <32 x i8> @usat_trunc_db_1024(<32 x i32> %i) { ; ALL-LABEL: usat_trunc_db_1024: ; ALL: ## %bb.0: ; ALL-NEXT: vpmovusdb %zmm0, %xmm0 ; ALL-NEXT: vpmovusdb %zmm1, %xmm1 ; ALL-NEXT: vinserti128 $1, %xmm1, %ymm0, %ymm0 ; ALL-NEXT: retq %x3 = icmp ult <32 x i32> %i, %x5 = select <32 x i1> %x3, <32 x i32> %i, <32 x i32> %x6 = trunc <32 x i32> %x5 to <32 x i8> ret <32 x i8> %x6 } define void @usat_trunc_db_1024_mem(<32 x i32> %i, <32 x i8>* %p) { ; ALL-LABEL: usat_trunc_db_1024_mem: ; ALL: ## %bb.0: ; ALL-NEXT: vpmovusdb %zmm1, 16(%rdi) ; ALL-NEXT: vpmovusdb %zmm0, (%rdi) ; ALL-NEXT: vzeroupper ; ALL-NEXT: retq %x3 = icmp ult <32 x i32> %i, %x5 = select <32 x i1> %x3, <32 x i32> %i, <32 x i32> %x6 = trunc <32 x i32> %x5 to <32 x i8> store <32 x i8>%x6, <32 x i8>* %p, align 1 ret void } define <16 x i16> @usat_trunc_dw_512(<16 x i32> %i) { ; ALL-LABEL: usat_trunc_dw_512: ; ALL: ## %bb.0: ; ALL-NEXT: vpmovusdw %zmm0, %ymm0 ; ALL-NEXT: retq %x3 = icmp ult <16 x i32> %i, %x5 = select <16 x i1> %x3, <16 x i32> %i, <16 x i32> %x6 = trunc <16 x i32> %x5 to <16 x i16> ret <16 x i16> %x6 } define <8 x i8> @usat_trunc_wb_128(<8 x i16> %i) { ; KNL-LABEL: usat_trunc_wb_128: ; KNL: ## %bb.0: ; KNL-NEXT: vpminuw {{.*}}(%rip), %xmm0, %xmm0 ; KNL-NEXT: vpackuswb %xmm0, %xmm0, %xmm0 ; KNL-NEXT: retq ; ; SKX-LABEL: usat_trunc_wb_128: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovuswb %xmm0, %xmm0 ; SKX-NEXT: retq %x3 = icmp ult <8 x i16> %i, %x5 = select <8 x i1> %x3, <8 x i16> %i, <8 x i16> %x6 = trunc <8 x i16> %x5 to <8 x i8> ret <8 x i8>%x6 } define <16 x i16> @usat_trunc_qw_1024(<16 x i64> %i) { ; ALL-LABEL: usat_trunc_qw_1024: ; ALL: ## %bb.0: ; ALL-NEXT: vpmovusqw %zmm0, %xmm0 ; ALL-NEXT: vpmovusqw %zmm1, %xmm1 ; ALL-NEXT: vinserti128 $1, %xmm1, %ymm0, %ymm0 ; ALL-NEXT: retq %x3 = icmp ult <16 x i64> %i, %x5 = select <16 x i1> %x3, <16 x i64> %i, <16 x i64> %x6 = trunc <16 x i64> %x5 to <16 x i16> ret <16 x i16> %x6 } define <16 x i8> @usat_trunc_db_256(<8 x i32> %x) { ; KNL-LABEL: usat_trunc_db_256: ; KNL: ## %bb.0: ; KNL-NEXT: ## kill: def $ymm0 killed $ymm0 def $zmm0 ; KNL-NEXT: vpmovusdb %zmm0, %xmm0 ; KNL-NEXT: vzeroupper ; KNL-NEXT: retq ; ; SKX-LABEL: usat_trunc_db_256: ; SKX: ## %bb.0: ; SKX-NEXT: vpmovusdb %ymm0, %xmm0 ; SKX-NEXT: vzeroupper ; SKX-NEXT: retq %tmp1 = icmp ult <8 x i32> %x, %tmp2 = select <8 x i1> %tmp1, <8 x i32> %x, <8 x i32> %tmp3 = trunc <8 x i32> %tmp2 to <8 x i8> %tmp4 = shufflevector <8 x i8> %tmp3, <8 x i8> undef, <16 x i32> ret <16 x i8> %tmp4 } ; Tests for the following unsigned saturation pattern: ; %a = icmp sgt %x, C1 ; %b = select %a, %x, C2 ; %c = icmp slt %b, C2 ; %d = select %c, %b, C2 ; %res = trunc %d define void @smax_usat_trunc_wb_256_mem1(<16 x i16> %i, <16 x i8>* %res) { ; KNL-LABEL: smax_usat_trunc_wb_256_mem1: ; KNL: ## %bb.0: ; KNL-NEXT: vextracti128 $1, %ymm0, %xmm1 ; KNL-NEXT: vpackuswb %xmm1, %xmm0, %xmm0 ; KNL-NEXT: vmovdqu %xmm0, (%rdi) ; KNL-NEXT: vzeroupper ; KNL-NEXT: retq ; ; SKX-LABEL: smax_usat_trunc_wb_256_mem1: ; SKX: ## %bb.0: ; SKX-NEXT: vpxor %xmm1, %xmm1, %xmm1 ; SKX-NEXT: vpmaxsw %ymm1, %ymm0, %ymm0 ; SKX-NEXT: vpmovuswb %ymm0, (%rdi) ; SKX-NEXT: vzeroupper ; SKX-NEXT: retq %x1 = icmp sgt <16 x i16> %i, %x2 = select <16 x i1> %x1, <16 x i16> %i, <16 x i16> %x3 = icmp slt <16 x i16> %x2, %x5 = select <16 x i1> %x3, <16 x i16> %x2, <16 x i16> %x6 = trunc <16 x i16> %x5 to <16 x i8> store <16 x i8> %x6, <16 x i8>* %res, align 1 ret void } ; Test for smax(smin(x, C2), C1). define void @smax_usat_trunc_wb_256_mem2(<16 x i16> %i, <16 x i8>* %res) { ; KNL-LABEL: smax_usat_trunc_wb_256_mem2: ; KNL: ## %bb.0: ; KNL-NEXT: vextracti128 $1, %ymm0, %xmm1 ; KNL-NEXT: vpackuswb %xmm1, %xmm0, %xmm0 ; KNL-NEXT: vmovdqu %xmm0, (%rdi) ; KNL-NEXT: vzeroupper ; KNL-NEXT: retq ; ; SKX-LABEL: smax_usat_trunc_wb_256_mem2: ; SKX: ## %bb.0: ; SKX-NEXT: vpxor %xmm1, %xmm1, %xmm1 ; SKX-NEXT: vpmaxsw %ymm1, %ymm0, %ymm0 ; SKX-NEXT: vpmovuswb %ymm0, (%rdi) ; SKX-NEXT: vzeroupper ; SKX-NEXT: retq %x1 = icmp slt <16 x i16> %i, %x2 = select <16 x i1> %x1, <16 x i16> %i, <16 x i16> %x3 = icmp sgt <16 x i16> %x2, %x5 = select <16 x i1> %x3, <16 x i16> %x2, <16 x i16> %x6 = trunc <16 x i16> %x5 to <16 x i8> store <16 x i8> %x6, <16 x i8>* %res, align 1 ret void } define <16 x i8> @smax_usat_trunc_wb_256(<16 x i16> %i) { ; KNL-LABEL: smax_usat_trunc_wb_256: ; KNL: ## %bb.0: ; KNL-NEXT: vextracti128 $1, %ymm0, %xmm1 ; KNL-NEXT: vpackuswb %xmm1, %xmm0, %xmm0 ; KNL-NEXT: vzeroupper ; KNL-NEXT: retq ; ; SKX-LABEL: smax_usat_trunc_wb_256: ; SKX: ## %bb.0: ; SKX-NEXT: vpxor %xmm1, %xmm1, %xmm1 ; SKX-NEXT: vpmaxsw %ymm1, %ymm0, %ymm0 ; SKX-NEXT: vpmovuswb %ymm0, %xmm0 ; SKX-NEXT: vzeroupper ; SKX-NEXT: retq %x1 = icmp sgt <16 x i16> %i, %x2 = select <16 x i1> %x1, <16 x i16> %i, <16 x i16> %x3 = icmp slt <16 x i16> %x2, %x5 = select <16 x i1> %x3, <16 x i16> %x2, <16 x i16> %x6 = trunc <16 x i16> %x5 to <16 x i8> ret <16 x i8> %x6 } define void @smax_usat_trunc_wb_128_mem(<8 x i16> %i, <8 x i8>* %res) { ; KNL-LABEL: smax_usat_trunc_wb_128_mem: ; KNL: ## %bb.0: ; KNL-NEXT: vpackuswb %xmm0, %xmm0, %xmm0 ; KNL-NEXT: vmovq %xmm0, (%rdi) ; KNL-NEXT: retq ; ; SKX-LABEL: smax_usat_trunc_wb_128_mem: ; SKX: ## %bb.0: ; SKX-NEXT: vpxor %xmm1, %xmm1, %xmm1 ; SKX-NEXT: vpmaxsw %xmm1, %xmm0, %xmm0 ; SKX-NEXT: vpmovuswb %xmm0, (%rdi) ; SKX-NEXT: retq %x1 = icmp sgt <8 x i16> %i, %x2 = select <8 x i1> %x1, <8 x i16> %i, <8 x i16> %x3 = icmp slt <8 x i16> %x2, %x5 = select <8 x i1> %x3, <8 x i16> %x2, <8 x i16> %x6 = trunc <8 x i16> %x5 to <8 x i8> store <8 x i8> %x6, <8 x i8>* %res, align 1 ret void } define void @smax_usat_trunc_db_512_mem(<16 x i32> %i, <16 x i8>* %res) { ; ALL-LABEL: smax_usat_trunc_db_512_mem: ; ALL: ## %bb.0: ; ALL-NEXT: vpxor %xmm1, %xmm1, %xmm1 ; ALL-NEXT: vpmaxsd %zmm1, %zmm0, %zmm0 ; ALL-NEXT: vpmovusdb %zmm0, (%rdi) ; ALL-NEXT: vzeroupper ; ALL-NEXT: retq %x1 = icmp sgt <16 x i32> %i, %x2 = select <16 x i1> %x1, <16 x i32> %i, <16 x i32> %x3 = icmp slt <16 x i32> %x2, %x5 = select <16 x i1> %x3, <16 x i32> %x2, <16 x i32> %x6 = trunc <16 x i32> %x5 to <16 x i8> store <16 x i8> %x6, <16 x i8>* %res, align 1 ret void } define void @smax_usat_trunc_qb_512_mem(<8 x i64> %i, <8 x i8>* %res) { ; ALL-LABEL: smax_usat_trunc_qb_512_mem: ; ALL: ## %bb.0: ; ALL-NEXT: vpxor %xmm1, %xmm1, %xmm1 ; ALL-NEXT: vpmaxsq %zmm1, %zmm0, %zmm0 ; ALL-NEXT: vpmovusqb %zmm0, (%rdi) ; ALL-NEXT: vzeroupper ; ALL-NEXT: retq %x1 = icmp sgt <8 x i64> %i, %x2 = select <8 x i1> %x1, <8 x i64> %i, <8 x i64> %x3 = icmp slt <8 x i64> %x2, %x5 = select <8 x i1> %x3, <8 x i64> %x2, <8 x i64> %x6 = trunc <8 x i64> %x5 to <8 x i8> store <8 x i8> %x6, <8 x i8>* %res, align 1 ret void } define void @smax_usat_trunc_qd_512_mem(<8 x i64> %i, <8 x i32>* %res) { ; ALL-LABEL: smax_usat_trunc_qd_512_mem: ; ALL: ## %bb.0: ; ALL-NEXT: vpxor %xmm1, %xmm1, %xmm1 ; ALL-NEXT: vpmaxsq %zmm1, %zmm0, %zmm0 ; ALL-NEXT: vpmovusqd %zmm0, (%rdi) ; ALL-NEXT: vzeroupper ; ALL-NEXT: retq %x1 = icmp sgt <8 x i64> %i, %x2 = select <8 x i1> %x1, <8 x i64> %i, <8 x i64> %x3 = icmp slt <8 x i64> %x2, %x5 = select <8 x i1> %x3, <8 x i64> %x2, <8 x i64> %x6 = trunc <8 x i64> %x5 to <8 x i32> store <8 x i32> %x6, <8 x i32>* %res, align 1 ret void } define void @smax_usat_trunc_qw_512_mem(<8 x i64> %i, <8 x i16>* %res) { ; ALL-LABEL: smax_usat_trunc_qw_512_mem: ; ALL: ## %bb.0: ; ALL-NEXT: vpxor %xmm1, %xmm1, %xmm1 ; ALL-NEXT: vpmaxsq %zmm1, %zmm0, %zmm0 ; ALL-NEXT: vpmovusqw %zmm0, (%rdi) ; ALL-NEXT: vzeroupper ; ALL-NEXT: retq %x1 = icmp sgt <8 x i64> %i, %x2 = select <8 x i1> %x1, <8 x i64> %i, <8 x i64> %x3 = icmp slt <8 x i64> %x2, %x5 = select <8 x i1> %x3, <8 x i64> %x2, <8 x i64> %x6 = trunc <8 x i64> %x5 to <8 x i16> store <8 x i16> %x6, <8 x i16>* %res, align 1 ret void } define <32 x i8> @smax_usat_trunc_db_1024(<32 x i32> %i) { ; ALL-LABEL: smax_usat_trunc_db_1024: ; ALL: ## %bb.0: ; ALL-NEXT: vpxor %xmm2, %xmm2, %xmm2 ; ALL-NEXT: vpmaxsd %zmm2, %zmm1, %zmm1 ; ALL-NEXT: vpmaxsd %zmm2, %zmm0, %zmm0 ; ALL-NEXT: vpmovusdb %zmm0, %xmm0 ; ALL-NEXT: vpmovusdb %zmm1, %xmm1 ; ALL-NEXT: vinserti128 $1, %xmm1, %ymm0, %ymm0 ; ALL-NEXT: retq %x1 = icmp sgt <32 x i32> %i, %x2 = select <32 x i1> %x1, <32 x i32> %i, <32 x i32> %x3 = icmp slt <32 x i32> %x2, %x5 = select <32 x i1> %x3, <32 x i32> %x2, <32 x i32> %x6 = trunc <32 x i32> %x5 to <32 x i8> ret <32 x i8> %x6 } define void @smax_usat_trunc_db_1024_mem(<32 x i32> %i, <32 x i8>* %p) { ; ALL-LABEL: smax_usat_trunc_db_1024_mem: ; ALL: ## %bb.0: ; ALL-NEXT: vpxor %xmm2, %xmm2, %xmm2 ; ALL-NEXT: vpmaxsd %zmm2, %zmm0, %zmm0 ; ALL-NEXT: vpmaxsd %zmm2, %zmm1, %zmm1 ; ALL-NEXT: vpmovusdb %zmm1, 16(%rdi) ; ALL-NEXT: vpmovusdb %zmm0, (%rdi) ; ALL-NEXT: vzeroupper ; ALL-NEXT: retq %x1 = icmp sgt <32 x i32> %i, %x2 = select <32 x i1> %x1, <32 x i32> %i, <32 x i32> %x3 = icmp slt <32 x i32> %x2, %x5 = select <32 x i1> %x3, <32 x i32> %x2, <32 x i32> %x6 = trunc <32 x i32> %x5 to <32 x i8> store <32 x i8>%x6, <32 x i8>* %p, align 1 ret void } define <16 x i16> @smax_usat_trunc_dw_512(<16 x i32> %i) { ; ALL-LABEL: smax_usat_trunc_dw_512: ; ALL: ## %bb.0: ; ALL-NEXT: vpxor %xmm1, %xmm1, %xmm1 ; ALL-NEXT: vpmaxsd %zmm1, %zmm0, %zmm0 ; ALL-NEXT: vpmovusdw %zmm0, %ymm0 ; ALL-NEXT: retq %x1 = icmp sgt <16 x i32> %i, %x2 = select <16 x i1> %x1, <16 x i32> %i, <16 x i32> %x3 = icmp slt <16 x i32> %x2, %x5 = select <16 x i1> %x3, <16 x i32> %x2, <16 x i32> %x6 = trunc <16 x i32> %x5 to <16 x i16> ret <16 x i16> %x6 } define void @negative_test1_smax_usat_trunc_wb_256_mem(<16 x i16> %i, <16 x i8>* %res) { ; KNL-LABEL: negative_test1_smax_usat_trunc_wb_256_mem: ; KNL: ## %bb.0: ; KNL-NEXT: vpminsw {{.*}}(%rip), %ymm0, %ymm0 ; KNL-NEXT: vpmaxsw {{.*}}(%rip), %ymm0, %ymm0 ; KNL-NEXT: vpmovzxwd {{.*#+}} zmm0 = ymm0[0],zero,ymm0[1],zero,ymm0[2],zero,ymm0[3],zero,ymm0[4],zero,ymm0[5],zero,ymm0[6],zero,ymm0[7],zero,ymm0[8],zero,ymm0[9],zero,ymm0[10],zero,ymm0[11],zero,ymm0[12],zero,ymm0[13],zero,ymm0[14],zero,ymm0[15],zero ; KNL-NEXT: vpmovdb %zmm0, (%rdi) ; KNL-NEXT: vzeroupper ; KNL-NEXT: retq ; ; SKX-LABEL: negative_test1_smax_usat_trunc_wb_256_mem: ; SKX: ## %bb.0: ; SKX-NEXT: vpminsw {{.*}}(%rip), %ymm0, %ymm0 ; SKX-NEXT: vpmaxsw {{.*}}(%rip), %ymm0, %ymm0 ; SKX-NEXT: vpmovwb %ymm0, (%rdi) ; SKX-NEXT: vzeroupper ; SKX-NEXT: retq %x1 = icmp slt <16 x i16> %i, %x2 = select <16 x i1> %x1, <16 x i16> %i, <16 x i16> %x3 = icmp sgt <16 x i16> %x2, %x5 = select <16 x i1> %x3, <16 x i16> %x2, <16 x i16> %x6 = trunc <16 x i16> %x5 to <16 x i8> store <16 x i8> %x6, <16 x i8>* %res, align 1 ret void } define void @negative_test2_smax_usat_trunc_wb_256_mem(<16 x i16> %i, <16 x i8>* %res) { ; KNL-LABEL: negative_test2_smax_usat_trunc_wb_256_mem: ; KNL: ## %bb.0: ; KNL-NEXT: vpmaxsw {{.*}}(%rip), %ymm0, %ymm0 ; KNL-NEXT: vpminsw {{.*}}(%rip), %ymm0, %ymm0 ; KNL-NEXT: vpmovzxwd {{.*#+}} zmm0 = ymm0[0],zero,ymm0[1],zero,ymm0[2],zero,ymm0[3],zero,ymm0[4],zero,ymm0[5],zero,ymm0[6],zero,ymm0[7],zero,ymm0[8],zero,ymm0[9],zero,ymm0[10],zero,ymm0[11],zero,ymm0[12],zero,ymm0[13],zero,ymm0[14],zero,ymm0[15],zero ; KNL-NEXT: vpmovdb %zmm0, (%rdi) ; KNL-NEXT: vzeroupper ; KNL-NEXT: retq ; ; SKX-LABEL: negative_test2_smax_usat_trunc_wb_256_mem: ; SKX: ## %bb.0: ; SKX-NEXT: vpmaxsw {{.*}}(%rip), %ymm0, %ymm0 ; SKX-NEXT: vpminsw {{.*}}(%rip), %ymm0, %ymm0 ; SKX-NEXT: vpmovwb %ymm0, (%rdi) ; SKX-NEXT: vzeroupper ; SKX-NEXT: retq %x1 = icmp sgt <16 x i16> %i, %x2 = select <16 x i1> %x1, <16 x i16> %i, <16 x i16> %x3 = icmp slt <16 x i16> %x2, %x5 = select <16 x i1> %x3, <16 x i16> %x2, <16 x i16> %x6 = trunc <16 x i16> %x5 to <16 x i8> store <16 x i8> %x6, <16 x i8>* %res, align 1 ret void } define void @ssat_trunc_db_1024_mem(<32 x i32> %i, <32 x i8>* %p) { ; ALL-LABEL: ssat_trunc_db_1024_mem: ; ALL: ## %bb.0: ; ALL-NEXT: vpmovsdb %zmm1, 16(%rdi) ; ALL-NEXT: vpmovsdb %zmm0, (%rdi) ; ALL-NEXT: vzeroupper ; ALL-NEXT: retq %x1 = icmp sgt <32 x i32> %i, %x2 = select <32 x i1> %x1, <32 x i32> %i, <32 x i32> %x3 = icmp slt <32 x i32> %x2, %x5 = select <32 x i1> %x3, <32 x i32> %x2, <32 x i32> %x6 = trunc <32 x i32> %x5 to <32 x i8> store <32 x i8>%x6, <32 x i8>* %p, align 1 ret void }