|
| 1 | +# RUN: llc --verify-machineinstrs -mtriple=aarch64 -o - %s -run-pass pipeliner -aarch64-enable-pipeliner -debug-only=pipeliner 2>&1 | FileCheck %s |
| 2 | + |
| 3 | +# An acceptable loop by pipeliner: TBB == ExitBB, FBB == LoopBB, Branch with NZCV flags |
| 4 | +# CHECK: Schedule Found? 1 |
| 5 | + |
| 6 | +--- | |
| 7 | + define dso_local void @func(ptr noalias nocapture noundef writeonly %a, ptr nocapture noundef readonly %b, i32 noundef %n) local_unnamed_addr #0 { |
| 8 | + entry: |
| 9 | + %cmp6 = icmp sgt i32 %n, 0 |
| 10 | + br i1 %cmp6, label %for.body.preheader, label %for.cond.cleanup |
| 11 | + |
| 12 | + for.body.preheader: ; preds = %entry |
| 13 | + %wide.trip.count = zext nneg i32 %n to i64 |
| 14 | + br label %for.body |
| 15 | + |
| 16 | + for.cond.cleanup: ; preds = %for.body, %entry |
| 17 | + ret void |
| 18 | + |
| 19 | + for.body: ; preds = %for.body.preheader, %for.body |
| 20 | + %lsr.iv11 = phi i64 [ %wide.trip.count, %for.body.preheader ], [ %lsr.iv.next, %for.body ] |
| 21 | + %lsr.iv9 = phi ptr [ %b, %for.body.preheader ], [ %scevgep10, %for.body ] |
| 22 | + %lsr.iv = phi ptr [ %a, %for.body.preheader ], [ %scevgep, %for.body ] |
| 23 | + %0 = load float, ptr %lsr.iv9, align 4 |
| 24 | + %add = fadd float %0, 1.000000e+00 |
| 25 | + store float %add, ptr %lsr.iv, align 4 |
| 26 | + %scevgep = getelementptr i8, ptr %lsr.iv, i64 4 |
| 27 | + %scevgep10 = getelementptr i8, ptr %lsr.iv9, i64 4 |
| 28 | + %lsr.iv.next = add nsw i64 %lsr.iv11, -1 |
| 29 | + %exitcond.not = icmp eq i64 %lsr.iv.next, 0 |
| 30 | + br i1 %exitcond.not, label %for.cond.cleanup, label %for.body |
| 31 | + } |
| 32 | + |
| 33 | +... |
| 34 | +--- |
| 35 | +name: func |
| 36 | +tracksRegLiveness: true |
| 37 | +liveins: |
| 38 | + - { reg: '$x0', virtual-reg: '%7' } |
| 39 | + - { reg: '$x1', virtual-reg: '%8' } |
| 40 | + - { reg: '$w2', virtual-reg: '%9' } |
| 41 | +body: | |
| 42 | + bb.0.entry: |
| 43 | + successors: %bb.1(0x50000000), %bb.2(0x30000000) |
| 44 | + liveins: $x0, $x1, $w2 |
| 45 | +
|
| 46 | + %9:gpr32common = COPY $w2 |
| 47 | + %8:gpr64 = COPY $x1 |
| 48 | + %7:gpr64 = COPY $x0 |
| 49 | + dead $wzr = SUBSWri %9, 1, 0, implicit-def $nzcv |
| 50 | + Bcc 11, %bb.2, implicit $nzcv |
| 51 | + B %bb.1 |
| 52 | +
|
| 53 | + bb.1.for.body.preheader: |
| 54 | + %11:gpr32 = ORRWrs $wzr, %9, 0 |
| 55 | + %0:gpr64all = SUBREG_TO_REG 0, killed %11, %subreg.sub_32 |
| 56 | + %14:fpr32 = FMOVSi 112 |
| 57 | + B %bb.3 |
| 58 | +
|
| 59 | + bb.2.for.cond.cleanup: |
| 60 | + RET_ReallyLR |
| 61 | +
|
| 62 | + bb.3.for.body: |
| 63 | + successors: %bb.2(0x04000000), %bb.3(0x7c000000) |
| 64 | +
|
| 65 | + %1:gpr64sp = PHI %0, %bb.1, %6, %bb.3 |
| 66 | + %2:gpr64sp = PHI %8, %bb.1, %5, %bb.3 |
| 67 | + %3:gpr64sp = PHI %7, %bb.1, %4, %bb.3 |
| 68 | + early-clobber %12:gpr64sp, %13:fpr32 = LDRSpost %2, 4 :: (load (s32) from %ir.lsr.iv9) |
| 69 | + %15:fpr32 = nofpexcept FADDSrr killed %13, %14, implicit $fpcr |
| 70 | + early-clobber %16:gpr64sp = STRSpost killed %15, %3, 4 :: (store (s32) into %ir.lsr.iv) |
| 71 | + %4:gpr64all = COPY %16 |
| 72 | + %5:gpr64all = COPY %12 |
| 73 | + %17:gpr64 = nsw SUBSXri %1, 1, 0, implicit-def $nzcv |
| 74 | + %6:gpr64all = COPY %17 |
| 75 | + Bcc 0, %bb.2, implicit $nzcv |
| 76 | + B %bb.3 |
| 77 | +
|
| 78 | +... |
0 commit comments