1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
| ; REQUIRES: asserts
; RUN: llc < %s -mtriple=armv8r-eabi -mcpu=cortex-r52 -verify-misched -debug-only=machine-scheduler -o - 2>&1 > /dev/null | FileCheck %s --check-prefix=CHECK --check-prefix=R52_SCHED
; RUN: llc < %s -mtriple=armv8r-eabi -mcpu=generic -enable-misched -verify-misched -debug-only=machine-scheduler -o - 2>&1 > /dev/null | FileCheck %s --check-prefix=CHECK --check-prefix=GENERIC
;
; Check the latency for instructions for both generic and cortex-r52.
; Cortex-r52 machine model will cause the div to be sceduled before eor
; as div takes more cycles to compute than eor.
;
; CHECK: ********** MI Scheduling **********
; CHECK: foo:%bb.0 entry
; CHECK: EORrr
; GENERIC: Latency : 1
; R52_SCHED: Latency : 3
; CHECK: MLA
; GENERIC: Latency : 2
; R52_SCHED: Latency : 4
; CHECK: SDIV
; GENERIC: Latency : 0
; R52_SCHED: Latency : 8
; CHECK: ** Final schedule for %bb.0 ***
; GENERIC: EORrr
; GENERIC: SDIV
; R52_SCHED: SDIV
; R52_SCHED: EORrr
; CHECK: ********** INTERVALS **********
target datalayout = "e-m:e-p:32:32-i64:64-v128:64:128-a:0:32-n32-S64"
target triple = "armv8r-arm-none-eabi"
; Function Attrs: norecurse nounwind readnone
define hidden i32 @foo(i32 %a, i32 %b, i32 %c) local_unnamed_addr #0 {
entry:
%xor = xor i32 %c, %b
%mul = mul nsw i32 %xor, %c
%add = add nsw i32 %mul, %a
%div = sdiv i32 %a, %b
%sub = sub i32 %add, %div
ret i32 %sub
}
|