llvm.org GIT mirror llvm / 2edda52 test / CodeGen / ARM / sdiv-pow2-arm-size.ll
2edda52

Tree @2edda52 (Download .tar.gz)

sdiv-pow2-arm-size.ll @2edda52raw · history · blame

; RUN: llc -mtriple=armv7a -mattr=+hwdiv-arm %s -o - | FileCheck %s --check-prefixes=CHECK,DIV
; RUN: llc -mtriple=armv7a -mattr=-hwdiv-arm %s -o - | FileCheck %s --check-prefixes=CHECK,NODIV

; Check SREM
define dso_local i32 @test_rem(i32 %F) local_unnamed_addr #0 {
; CHECK-LABEL: test_rem 
; CHECK:       asr   r1, r0, #31
; CHECK-NEXT:  add   r1, r0, r1, lsr #30
; CHECK-NEXT:  bic   r1, r1, #3
; CHECK-NEXT:  sub   r0, r0, r1

entry:
  %div = srem i32 %F, 4
  ret i32 %div
}

; Try an i16 sdiv, with a small immediate.
define dso_local signext i16 @f0(i16 signext %F) local_unnamed_addr #0 {
; CHECK-LABEL: f0

; DIV:         mov     r1, #2
; DIV-NEXT:    sdiv    r0, r0, r1
; DIV-NEXT:    sxth    r0, r0
; DIV-NEXT:    bx      lr

; NODIV:       uxth r1, r0
; NODIV-NEXT:  add  r0, r0, r1, lsr #15
; NODIV-NEXT:  sxth r0, r0
; NODIV-NEXT:  asr  r0, r0, #1
; NODIV-NEXT:  bx   lr

entry:
  %0 = sdiv i16 %F, 2
  ret i16 %0
}

; Try an i32 sdiv, with a small immediate.
define dso_local i32 @f1(i32 %F) local_unnamed_addr #0 {
; CHECK-LABEL: f1

; DIV:       mov     r1, #4
; DIV-NEXT:  sdiv    r0, r0, r1
; DIV-NEXT:  bx      lr

; NODIV:       asr  r1, r0, #31
; NODIV-NEXT:  add  r0, r0, r1, lsr #30
; NODIV-NEXT:  asr  r0, r0, #2
; NODIV-NEXT:  bx	  lr

entry:
  %div = sdiv i32 %F, 4
  ret i32 %div
}

; Try a large power of 2 immediate, which should also be materialised with 1
; move immediate instruction.
define dso_local i32 @f2(i32 %F) local_unnamed_addr #0 {
; CHECK-LABEL:  f2
; DIV:        mov r1, #131072
; DIV-NEXT:   sdiv  r0, r0, r1
; DIV-NEXT:   bx  lr
entry:
  %div = sdiv i32 %F, 131072
  ret i32 %div
}

; MinSize not set, so should expand to the faster but longer sequence.
define dso_local i32 @f3(i32 %F) {
; CHECK-LABEL: f3
; CHECK:       asr r1, r0, #31
; CHECK-NEXT:  add r0, r0, r1, lsr #30
; CHECK-NEXT:  asr r0, r0, #2
; CHECK-NEXT:  bx  lr
entry:
  %div = sdiv i32 %F, 4
  ret i32 %div
}

attributes #0 = { minsize norecurse nounwind optsize readnone }