34 lines
1.1 KiB
LLVM
34 lines
1.1 KiB
LLVM
|
; RUN: llc < %s -mtriple=thumbv7-apple-ios -mcpu=cortex-a8 | FileCheck %s
|
||
|
|
||
|
; ARM has a peephole optimization which looks for a def / use pair. The def
|
||
|
; produces a 32-bit immediate which is consumed by the use. It tries to
|
||
|
; fold the immediate by breaking it into two parts and fold them into the
|
||
|
; immmediate fields of two uses. e.g
|
||
|
; movw r2, #40885
|
||
|
; movt r3, #46540
|
||
|
; add r0, r0, r3
|
||
|
; =>
|
||
|
; add.w r0, r0, #3019898880
|
||
|
; add.w r0, r0, #30146560
|
||
|
;
|
||
|
; However, this transformation is incorrect if the user produces a flag. e.g.
|
||
|
; movw r2, #40885
|
||
|
; movt r3, #46540
|
||
|
; adds r0, r0, r3
|
||
|
; =>
|
||
|
; add.w r0, r0, #3019898880
|
||
|
; adds.w r0, r0, #30146560
|
||
|
; Note the adds.w may not set the carry flag even if the original sequence
|
||
|
; would.
|
||
|
;
|
||
|
; rdar://11116189
|
||
|
define i64 @t(i64 %aInput) nounwind {
|
||
|
; CHECK-LABEL: t:
|
||
|
; CHECK: movs [[REG:(r[0-9]+)]], #0
|
||
|
; CHECK: movt [[REG]], #46540
|
||
|
; CHECK: adds r{{[0-9]+}}, r{{[0-9]+}}, [[REG]]
|
||
|
%1 = mul i64 %aInput, 1000000
|
||
|
%2 = add i64 %1, -7952618389194932224
|
||
|
ret i64 %2
|
||
|
}
|