132 lines
3.7 KiB
LLVM
132 lines
3.7 KiB
LLVM
|
; RUN: llc < %s -mtriple=ve -mattr=+vpu | FileCheck %s
|
||
|
|
||
|
; <256 x i32>
|
||
|
|
||
|
; Function Attrs: nounwind
|
||
|
define fastcc <256 x i32> @add_vv_v256i32(<256 x i32> %x, <256 x i32> %y) {
|
||
|
; CHECK-LABEL: add_vv_v256i32:
|
||
|
; CHECK: # %bb.0:
|
||
|
; CHECK-NEXT: lea %s0, 256
|
||
|
; CHECK-NEXT: lvl %s0
|
||
|
; CHECK-NEXT: vadds.w.sx %v0, %v0, %v1
|
||
|
; CHECK-NEXT: b.l.t (, %s10)
|
||
|
%z = add <256 x i32> %x, %y
|
||
|
ret <256 x i32> %z
|
||
|
}
|
||
|
|
||
|
; Function Attrs: nounwind
|
||
|
define fastcc <256 x i32> @add_sv_v256i32(i32 %x, <256 x i32> %y) {
|
||
|
; CHECK-LABEL: add_sv_v256i32:
|
||
|
; CHECK: # %bb.0:
|
||
|
; CHECK-NEXT: and %s0, %s0, (32)0
|
||
|
; CHECK-NEXT: lea %s1, 256
|
||
|
; CHECK-NEXT: lvl %s1
|
||
|
; CHECK-NEXT: vadds.w.sx %v0, %s0, %v0
|
||
|
; CHECK-NEXT: b.l.t (, %s10)
|
||
|
%xins = insertelement <256 x i32> undef, i32 %x, i32 0
|
||
|
%vx = shufflevector <256 x i32> %xins, <256 x i32> undef, <256 x i32> zeroinitializer
|
||
|
%z = add <256 x i32> %vx, %y
|
||
|
ret <256 x i32> %z
|
||
|
}
|
||
|
|
||
|
; Function Attrs: nounwind
|
||
|
define fastcc <256 x i32> @add_vs_v256i32(<256 x i32> %x, i32 %y) {
|
||
|
; CHECK-LABEL: add_vs_v256i32:
|
||
|
; CHECK: # %bb.0:
|
||
|
; CHECK-NEXT: and %s0, %s0, (32)0
|
||
|
; CHECK-NEXT: lea %s1, 256
|
||
|
; CHECK-NEXT: lvl %s1
|
||
|
; CHECK-NEXT: vadds.w.sx %v0, %s0, %v0
|
||
|
; CHECK-NEXT: b.l.t (, %s10)
|
||
|
%yins = insertelement <256 x i32> undef, i32 %y, i32 0
|
||
|
%vy = shufflevector <256 x i32> %yins, <256 x i32> undef, <256 x i32> zeroinitializer
|
||
|
%z = add <256 x i32> %x, %vy
|
||
|
ret <256 x i32> %z
|
||
|
}
|
||
|
|
||
|
|
||
|
|
||
|
; <256 x i64>
|
||
|
|
||
|
; Function Attrs: nounwind
|
||
|
define fastcc <256 x i64> @add_vv_v256i64(<256 x i64> %x, <256 x i64> %y) {
|
||
|
; CHECK-LABEL: add_vv_v256i64:
|
||
|
; CHECK: # %bb.0:
|
||
|
; CHECK-NEXT: lea %s0, 256
|
||
|
; CHECK-NEXT: lvl %s0
|
||
|
; CHECK-NEXT: vadds.l %v0, %v0, %v1
|
||
|
; CHECK-NEXT: b.l.t (, %s10)
|
||
|
%z = add <256 x i64> %x, %y
|
||
|
ret <256 x i64> %z
|
||
|
}
|
||
|
|
||
|
; Function Attrs: nounwind
|
||
|
define fastcc <256 x i64> @add_sv_v256i64(i64 %x, <256 x i64> %y) {
|
||
|
; CHECK-LABEL: add_sv_v256i64:
|
||
|
; CHECK: # %bb.0:
|
||
|
; CHECK-NEXT: lea %s1, 256
|
||
|
; CHECK-NEXT: lvl %s1
|
||
|
; CHECK-NEXT: vadds.l %v0, %s0, %v0
|
||
|
; CHECK-NEXT: b.l.t (, %s10)
|
||
|
%xins = insertelement <256 x i64> undef, i64 %x, i32 0
|
||
|
%vx = shufflevector <256 x i64> %xins, <256 x i64> undef, <256 x i32> zeroinitializer
|
||
|
%z = add <256 x i64> %vx, %y
|
||
|
ret <256 x i64> %z
|
||
|
}
|
||
|
|
||
|
; Function Attrs: nounwind
|
||
|
define fastcc <256 x i64> @add_vs_v256i64(<256 x i64> %x, i64 %y) {
|
||
|
; CHECK-LABEL: add_vs_v256i64:
|
||
|
; CHECK: # %bb.0:
|
||
|
; CHECK-NEXT: lea %s1, 256
|
||
|
; CHECK-NEXT: lvl %s1
|
||
|
; CHECK-NEXT: vadds.l %v0, %s0, %v0
|
||
|
; CHECK-NEXT: b.l.t (, %s10)
|
||
|
%yins = insertelement <256 x i64> undef, i64 %y, i32 0
|
||
|
%vy = shufflevector <256 x i64> %yins, <256 x i64> undef, <256 x i32> zeroinitializer
|
||
|
%z = add <256 x i64> %x, %vy
|
||
|
ret <256 x i64> %z
|
||
|
}
|
||
|
|
||
|
; <128 x i64>
|
||
|
; We expect this to be widened.
|
||
|
|
||
|
; Function Attrs: nounwind
|
||
|
define fastcc <128 x i64> @add_vv_v128i64(<128 x i64> %x, <128 x i64> %y) {
|
||
|
; CHECK-LABEL: add_vv_v128i64:
|
||
|
; CHECK: # %bb.0:
|
||
|
; CHECK-NEXT: lea %s0, 256
|
||
|
; CHECK-NEXT: lvl %s0
|
||
|
; CHECK-NEXT: vadds.l %v0, %v0, %v1
|
||
|
; CHECK-NEXT: b.l.t (, %s10)
|
||
|
%z = add <128 x i64> %x, %y
|
||
|
ret <128 x i64> %z
|
||
|
}
|
||
|
|
||
|
; <256 x i16>
|
||
|
; We expect promotion.
|
||
|
|
||
|
; Function Attrs: nounwind
|
||
|
define fastcc <256 x i16> @add_vv_v256i16(<256 x i16> %x, <256 x i16> %y) {
|
||
|
; CHECK-LABEL: add_vv_v256i16:
|
||
|
; CHECK: # %bb.0:
|
||
|
; CHECK-NEXT: lea %s0, 256
|
||
|
; CHECK-NEXT: lvl %s0
|
||
|
; CHECK-NEXT: vadds.w.sx %v0, %v0, %v1
|
||
|
; CHECK-NEXT: b.l.t (, %s10)
|
||
|
%z = add <256 x i16> %x, %y
|
||
|
ret <256 x i16> %z
|
||
|
}
|
||
|
|
||
|
; <128 x i16>
|
||
|
; We expect this to be scalarized (for now).
|
||
|
|
||
|
; Function Attrs: nounwind
|
||
|
define fastcc <128 x i16> @add_vv_v128i16(<128 x i16> %x, <128 x i16> %y) {
|
||
|
; CHECK-LABEL: add_vv_v128i16:
|
||
|
; CHECK-NOT: vadd
|
||
|
%z = add <128 x i16> %x, %y
|
||
|
ret <128 x i16> %z
|
||
|
}
|
||
|
|