; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py ; RUN: llc -mtriple=thumbv8.1m.main -mattr=+mve -verify-machineinstrs -o - %s | FileCheck %s define arm_aapcs_vfpcc <8 x i16> @test_vbicq_n_u16_sh0(<8 x i16> %a) { ; CHECK-LABEL: test_vbicq_n_u16_sh0: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vbic.i16 q0, #0x64 ; CHECK-NEXT: bx lr entry: %0 = and <8 x i16> %a, ret <8 x i16> %0 } define arm_aapcs_vfpcc <8 x i16> @test_vbicq_n_u16_sh8(<8 x i16> %a) { ; CHECK-LABEL: test_vbicq_n_u16_sh8: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vbic.i16 q0, #0x6400 ; CHECK-NEXT: bx lr entry: %0 = and <8 x i16> %a, ret <8 x i16> %0 } define arm_aapcs_vfpcc <4 x i32> @test_vbicq_n_u32_sh0(<4 x i32> %a) { ; CHECK-LABEL: test_vbicq_n_u32_sh0: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vbic.i32 q0, #0x64 ; CHECK-NEXT: bx lr entry: %0 = and <4 x i32> %a, ret <4 x i32> %0 } define arm_aapcs_vfpcc <4 x i32> @test_vbicq_n_u32_sh8(<4 x i32> %a) { ; CHECK-LABEL: test_vbicq_n_u32_sh8: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vbic.i32 q0, #0x6400 ; CHECK-NEXT: bx lr entry: %0 = and <4 x i32> %a, ret <4 x i32> %0 } define arm_aapcs_vfpcc <4 x i32> @test_vbicq_n_u32_sh16(<4 x i32> %a) { ; CHECK-LABEL: test_vbicq_n_u32_sh16: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vbic.i32 q0, #0x640000 ; CHECK-NEXT: bx lr entry: %0 = and <4 x i32> %a, ret <4 x i32> %0 } define arm_aapcs_vfpcc <4 x i32> @test_vbicq_n_u32_sh24(<4 x i32> %a) { ; CHECK-LABEL: test_vbicq_n_u32_sh24: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vbic.i32 q0, #0x64000000 ; CHECK-NEXT: bx lr entry: %0 = and <4 x i32> %a, ret <4 x i32> %0 } ; The immediate in this case is legal for a VMVN but not for a VBIC, ; so in this case we expect to see the constant being prepared in ; another register. define arm_aapcs_vfpcc <4 x i32> @test_vbicq_n_u32_illegal(<4 x i32> %a) { ; CHECK-LABEL: test_vbicq_n_u32_illegal: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vmvn.i32 q1, #0x54ff ; CHECK-NEXT: vand q0, q0, q1 ; CHECK-NEXT: bx lr entry: %0 = and <4 x i32> %a, ret <4 x i32> %0 } define arm_aapcs_vfpcc <8 x i16> @test_vorrq_n_u16_sh0(<8 x i16> %a) { ; CHECK-LABEL: test_vorrq_n_u16_sh0: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vorr.i16 q0, #0x64 ; CHECK-NEXT: bx lr entry: %0 = or <8 x i16> %a, ret <8 x i16> %0 } define arm_aapcs_vfpcc <8 x i16> @test_vorrq_n_u16_sh8(<8 x i16> %a) { ; CHECK-LABEL: test_vorrq_n_u16_sh8: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vorr.i16 q0, #0x6400 ; CHECK-NEXT: bx lr entry: %0 = or <8 x i16> %a, ret <8 x i16> %0 } define arm_aapcs_vfpcc <4 x i32> @test_vorrq_n_u32_sh0(<4 x i32> %a) { ; CHECK-LABEL: test_vorrq_n_u32_sh0: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vorr.i32 q0, #0x64 ; CHECK-NEXT: bx lr entry: %0 = or <4 x i32> %a, ret <4 x i32> %0 } define arm_aapcs_vfpcc <4 x i32> @test_vorrq_n_u32_sh8(<4 x i32> %a) { ; CHECK-LABEL: test_vorrq_n_u32_sh8: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vorr.i32 q0, #0x6400 ; CHECK-NEXT: bx lr entry: %0 = or <4 x i32> %a, ret <4 x i32> %0 } define arm_aapcs_vfpcc <4 x i32> @test_vorrq_n_u32_sh16(<4 x i32> %a) { ; CHECK-LABEL: test_vorrq_n_u32_sh16: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vorr.i32 q0, #0x640000 ; CHECK-NEXT: bx lr entry: %0 = or <4 x i32> %a, ret <4 x i32> %0 } define arm_aapcs_vfpcc <4 x i32> @test_vorrq_n_u32_sh24(<4 x i32> %a) { ; CHECK-LABEL: test_vorrq_n_u32_sh24: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vorr.i32 q0, #0x64000000 ; CHECK-NEXT: bx lr entry: %0 = or <4 x i32> %a, ret <4 x i32> %0 } define arm_aapcs_vfpcc <8 x i16> @test_vbicq_m_n_u16_sh0(<8 x i16> %a, i16 zeroext %p) { ; CHECK-LABEL: test_vbicq_m_n_u16_sh0: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vmsr p0, r0 ; CHECK-NEXT: vpst ; CHECK-NEXT: vbict.i16 q0, #0x64 ; CHECK-NEXT: bx lr entry: %0 = zext i16 %p to i32 %1 = tail call <8 x i1> @llvm.arm.mve.pred.i2v.v8i1(i32 %0) %2 = and <8 x i16> %a, %3 = select <8 x i1> %1, <8 x i16> %2, <8 x i16> %a ret <8 x i16> %3 } define arm_aapcs_vfpcc <8 x i16> @test_vbicq_m_n_u16_sh8(<8 x i16> %a, i16 zeroext %p) { ; CHECK-LABEL: test_vbicq_m_n_u16_sh8: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vmsr p0, r0 ; CHECK-NEXT: vpst ; CHECK-NEXT: vbict.i16 q0, #0x6400 ; CHECK-NEXT: bx lr entry: %0 = zext i16 %p to i32 %1 = tail call <8 x i1> @llvm.arm.mve.pred.i2v.v8i1(i32 %0) %2 = and <8 x i16> %a, %3 = select <8 x i1> %1, <8 x i16> %2, <8 x i16> %a ret <8 x i16> %3 } define arm_aapcs_vfpcc <4 x i32> @test_vbicq_m_n_u32_sh0(<4 x i32> %a, i16 zeroext %p) { ; CHECK-LABEL: test_vbicq_m_n_u32_sh0: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vmsr p0, r0 ; CHECK-NEXT: vpst ; CHECK-NEXT: vbict.i32 q0, #0x64 ; CHECK-NEXT: bx lr entry: %0 = zext i16 %p to i32 %1 = tail call <4 x i1> @llvm.arm.mve.pred.i2v.v4i1(i32 %0) %2 = and <4 x i32> %a, %3 = select <4 x i1> %1, <4 x i32> %2, <4 x i32> %a ret <4 x i32> %3 } define arm_aapcs_vfpcc <4 x i32> @test_vbicq_m_n_u32_sh8(<4 x i32> %a, i16 zeroext %p) { ; CHECK-LABEL: test_vbicq_m_n_u32_sh8: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vmsr p0, r0 ; CHECK-NEXT: vpst ; CHECK-NEXT: vbict.i32 q0, #0x6400 ; CHECK-NEXT: bx lr entry: %0 = zext i16 %p to i32 %1 = tail call <4 x i1> @llvm.arm.mve.pred.i2v.v4i1(i32 %0) %2 = and <4 x i32> %a, %3 = select <4 x i1> %1, <4 x i32> %2, <4 x i32> %a ret <4 x i32> %3 } define arm_aapcs_vfpcc <4 x i32> @test_vbicq_m_n_u32_sh16(<4 x i32> %a, i16 zeroext %p) { ; CHECK-LABEL: test_vbicq_m_n_u32_sh16: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vmsr p0, r0 ; CHECK-NEXT: vpst ; CHECK-NEXT: vbict.i32 q0, #0x640000 ; CHECK-NEXT: bx lr entry: %0 = zext i16 %p to i32 %1 = tail call <4 x i1> @llvm.arm.mve.pred.i2v.v4i1(i32 %0) %2 = and <4 x i32> %a, %3 = select <4 x i1> %1, <4 x i32> %2, <4 x i32> %a ret <4 x i32> %3 } define arm_aapcs_vfpcc <4 x i32> @test_vbicq_m_n_u32_sh24(<4 x i32> %a, i16 zeroext %p) { ; CHECK-LABEL: test_vbicq_m_n_u32_sh24: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vmsr p0, r0 ; CHECK-NEXT: vpst ; CHECK-NEXT: vbict.i32 q0, #0x64000000 ; CHECK-NEXT: bx lr entry: %0 = zext i16 %p to i32 %1 = tail call <4 x i1> @llvm.arm.mve.pred.i2v.v4i1(i32 %0) %2 = and <4 x i32> %a, %3 = select <4 x i1> %1, <4 x i32> %2, <4 x i32> %a ret <4 x i32> %3 } define arm_aapcs_vfpcc <8 x i16> @test_vorrq_m_n_u16_sh0(<8 x i16> %a, i16 zeroext %p) { ; CHECK-LABEL: test_vorrq_m_n_u16_sh0: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vmsr p0, r0 ; CHECK-NEXT: vpst ; CHECK-NEXT: vorrt.i16 q0, #0x64 ; CHECK-NEXT: bx lr entry: %0 = zext i16 %p to i32 %1 = tail call <8 x i1> @llvm.arm.mve.pred.i2v.v8i1(i32 %0) %2 = or <8 x i16> %a, %3 = select <8 x i1> %1, <8 x i16> %2, <8 x i16> %a ret <8 x i16> %3 } define arm_aapcs_vfpcc <8 x i16> @test_vorrq_m_n_u16_sh8(<8 x i16> %a, i16 zeroext %p) { ; CHECK-LABEL: test_vorrq_m_n_u16_sh8: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vmsr p0, r0 ; CHECK-NEXT: vpst ; CHECK-NEXT: vorrt.i16 q0, #0x6400 ; CHECK-NEXT: bx lr entry: %0 = zext i16 %p to i32 %1 = tail call <8 x i1> @llvm.arm.mve.pred.i2v.v8i1(i32 %0) %2 = or <8 x i16> %a, %3 = select <8 x i1> %1, <8 x i16> %2, <8 x i16> %a ret <8 x i16> %3 } define arm_aapcs_vfpcc <4 x i32> @test_vorrq_m_n_u32_sh0(<4 x i32> %a, i16 zeroext %p) { ; CHECK-LABEL: test_vorrq_m_n_u32_sh0: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vmsr p0, r0 ; CHECK-NEXT: vpst ; CHECK-NEXT: vorrt.i32 q0, #0x64 ; CHECK-NEXT: bx lr entry: %0 = zext i16 %p to i32 %1 = tail call <4 x i1> @llvm.arm.mve.pred.i2v.v4i1(i32 %0) %2 = or <4 x i32> %a, %3 = select <4 x i1> %1, <4 x i32> %2, <4 x i32> %a ret <4 x i32> %3 } define arm_aapcs_vfpcc <4 x i32> @test_vorrq_m_n_u32_sh8(<4 x i32> %a, i16 zeroext %p) { ; CHECK-LABEL: test_vorrq_m_n_u32_sh8: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vmsr p0, r0 ; CHECK-NEXT: vpst ; CHECK-NEXT: vorrt.i32 q0, #0x6400 ; CHECK-NEXT: bx lr entry: %0 = zext i16 %p to i32 %1 = tail call <4 x i1> @llvm.arm.mve.pred.i2v.v4i1(i32 %0) %2 = or <4 x i32> %a, %3 = select <4 x i1> %1, <4 x i32> %2, <4 x i32> %a ret <4 x i32> %3 } define arm_aapcs_vfpcc <4 x i32> @test_vorrq_m_n_u32_sh16(<4 x i32> %a, i16 zeroext %p) { ; CHECK-LABEL: test_vorrq_m_n_u32_sh16: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vmsr p0, r0 ; CHECK-NEXT: vpst ; CHECK-NEXT: vorrt.i32 q0, #0x640000 ; CHECK-NEXT: bx lr entry: %0 = zext i16 %p to i32 %1 = tail call <4 x i1> @llvm.arm.mve.pred.i2v.v4i1(i32 %0) %2 = or <4 x i32> %a, %3 = select <4 x i1> %1, <4 x i32> %2, <4 x i32> %a ret <4 x i32> %3 } define arm_aapcs_vfpcc <4 x i32> @test_vorrq_m_n_u32_sh24(<4 x i32> %a, i16 zeroext %p) { ; CHECK-LABEL: test_vorrq_m_n_u32_sh24: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vmsr p0, r0 ; CHECK-NEXT: vpst ; CHECK-NEXT: vorrt.i32 q0, #0x64000000 ; CHECK-NEXT: bx lr entry: %0 = zext i16 %p to i32 %1 = tail call <4 x i1> @llvm.arm.mve.pred.i2v.v4i1(i32 %0) %2 = or <4 x i32> %a, %3 = select <4 x i1> %1, <4 x i32> %2, <4 x i32> %a ret <4 x i32> %3 } define arm_aapcs_vfpcc <8 x i16> @test_vmvnq_n_u16() { ; CHECK-LABEL: test_vmvnq_n_u16: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vmvn.i16 q0, #0xaa00 ; CHECK-NEXT: bx lr entry: ret <8 x i16> } define arm_aapcs_vfpcc <4 x i32> @test_vmvnq_n_u32() { ; CHECK-LABEL: test_vmvnq_n_u32: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vmvn.i32 q0, #0xaa00 ; CHECK-NEXT: bx lr entry: ret <4 x i32> } define arm_aapcs_vfpcc <8 x i16> @test_vmvnq_m_n_u16(<8 x i16> %inactive, i16 zeroext %p) { ; CHECK-LABEL: test_vmvnq_m_n_u16: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vmsr p0, r0 ; CHECK-NEXT: vpst ; CHECK-NEXT: vmvnt.i16 q0, #0xaa00 ; CHECK-NEXT: bx lr entry: %0 = zext i16 %p to i32 %1 = tail call <8 x i1> @llvm.arm.mve.pred.i2v.v8i1(i32 %0) %2 = select <8 x i1> %1, <8 x i16> , <8 x i16> %inactive ret <8 x i16> %2 } define arm_aapcs_vfpcc <4 x i32> @test_vmvnq_m_n_u32(<4 x i32> %inactive, i16 zeroext %p) { ; CHECK-LABEL: test_vmvnq_m_n_u32: ; CHECK: @ %bb.0: @ %entry ; CHECK-NEXT: vmsr p0, r0 ; CHECK-NEXT: vpst ; CHECK-NEXT: vmvnt.i32 q0, #0xaa00 ; CHECK-NEXT: bx lr entry: %0 = zext i16 %p to i32 %1 = tail call <4 x i1> @llvm.arm.mve.pred.i2v.v4i1(i32 %0) %2 = select <4 x i1> %1, <4 x i32> , <4 x i32> %inactive ret <4 x i32> %2 } declare <8 x i1> @llvm.arm.mve.pred.i2v.v8i1(i32) declare <4 x i1> @llvm.arm.mve.pred.i2v.v4i1(i32)