; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py ; RUN: llc -disable-lsr -ppc-asm-full-reg-names -verify-machineinstrs \ ; RUN: -ppc-formprep-update-nonconst-inc -mtriple=powerpc64le-unknown-linux-gnu \ ; RUN: -mcpu=pwr9 < %s | FileCheck %s ; long long foo(char *p, int n, int count) { ; int j = 0; ; long long sum = 0; ; for (int i = 0; i < n; i++) { ; sum += *(unsigned long long *)(p + j + 5); ; sum += *(unsigned long long *)(p + j + 9); ; j += count; ; } ; return sum; ; } define i64 @foo(i8* %p, i32 signext %n, i32 signext %count) { ; CHECK-LABEL: foo: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: cmpwi r4, 1 ; CHECK-NEXT: blt cr0, .LBB0_4 ; CHECK-NEXT: # %bb.1: # %for.body.preheader ; CHECK-NEXT: addi r6, r3, 5 ; CHECK-NEXT: addi r3, r4, -1 ; CHECK-NEXT: extsw r5, r5 ; CHECK-NEXT: clrldi r3, r3, 32 ; CHECK-NEXT: addi r3, r3, 1 ; CHECK-NEXT: mtctr r3 ; CHECK-NEXT: li r3, 0 ; CHECK-NEXT: .p2align 5 ; CHECK-NEXT: .LBB0_2: # %for.body ; CHECK-NEXT: # ; CHECK-NEXT: ld r4, 0(r6) ; CHECK-NEXT: add r3, r4, r3 ; CHECK-NEXT: ld r4, 4(r6) ; CHECK-NEXT: add r6, r6, r5 ; CHECK-NEXT: add r3, r3, r4 ; CHECK-NEXT: bdnz .LBB0_2 ; CHECK-NEXT: # %bb.3: # %for.cond.cleanup ; CHECK-NEXT: blr ; CHECK-NEXT: .LBB0_4: ; CHECK-NEXT: li r3, 0 ; CHECK-NEXT: blr entry: %cmp16 = icmp sgt i32 %n, 0 br i1 %cmp16, label %for.body.preheader, label %for.cond.cleanup for.body.preheader: ; preds = %entry %0 = sext i32 %count to i64 br label %for.body for.cond.cleanup: ; preds = %for.body, %entry %sum.0.lcssa = phi i64 [ 0, %entry ], [ %add5, %for.body ] ret i64 %sum.0.lcssa for.body: ; preds = %for.body.preheader, %for.body %indvars.iv = phi i64 [ 0, %for.body.preheader ], [ %indvars.iv.next, %for.body ] %i.019 = phi i32 [ 0, %for.body.preheader ], [ %inc, %for.body ] %sum.018 = phi i64 [ 0, %for.body.preheader ], [ %add5, %for.body ] %add.ptr = getelementptr inbounds i8, i8* %p, i64 %indvars.iv %add.ptr1 = getelementptr inbounds i8, i8* %add.ptr, i64 5 %1 = bitcast i8* %add.ptr1 to i64* %2 = load i64, i64* %1, align 8 %add = add i64 %2, %sum.018 %add.ptr4 = getelementptr inbounds i8, i8* %add.ptr, i64 9 %3 = bitcast i8* %add.ptr4 to i64* %4 = load i64, i64* %3, align 8 %add5 = add i64 %add, %4 %indvars.iv.next = add nsw i64 %indvars.iv, %0 %inc = add nuw nsw i32 %i.019, 1 %exitcond.not = icmp eq i32 %inc, %n br i1 %exitcond.not, label %for.cond.cleanup, label %for.body } ; char foo1(char *p, int n, int count) { ; int j = 0; ; char sum = 0; ; for (int i = 0; i < n; i++) { ; sum += *(p + j + 1000); ; j += count; ; } ; return sum; ; } define zeroext i8 @foo1(i8* %p, i32 signext %n, i32 signext %count) { ; CHECK-LABEL: foo1: ; CHECK: # %bb.0: # %entry ; CHECK-NEXT: cmpwi r4, 1 ; CHECK-NEXT: blt cr0, .LBB1_4 ; CHECK-NEXT: # %bb.1: # %for.body.preheader ; CHECK-NEXT: extsw r5, r5 ; CHECK-NEXT: sub r3, r3, r5 ; CHECK-NEXT: addi r6, r3, 1000 ; CHECK-NEXT: addi r3, r4, -1 ; CHECK-NEXT: clrldi r3, r3, 32 ; CHECK-NEXT: addi r3, r3, 1 ; CHECK-NEXT: mtctr r3 ; CHECK-NEXT: li r3, 0 ; CHECK-NEXT: .p2align 4 ; CHECK-NEXT: .LBB1_2: # %for.body ; CHECK-NEXT: # ; CHECK-NEXT: lbzux r4, r6, r5 ; CHECK-NEXT: add r3, r4, r3 ; CHECK-NEXT: bdnz .LBB1_2 ; CHECK-NEXT: # %bb.3: # %for.cond.cleanup ; CHECK-NEXT: clrldi r3, r3, 56 ; CHECK-NEXT: blr ; CHECK-NEXT: .LBB1_4: ; CHECK-NEXT: li r3, 0 ; CHECK-NEXT: blr entry: %cmp10 = icmp sgt i32 %n, 0 br i1 %cmp10, label %for.body.preheader, label %for.cond.cleanup for.body.preheader: ; preds = %entry %0 = sext i32 %count to i64 %add.ptr = getelementptr inbounds i8, i8* %p, i64 1000 br label %for.body for.cond.cleanup: ; preds = %for.body, %entry %sum.0.lcssa = phi i8 [ 0, %entry ], [ %add, %for.body ] ret i8 %sum.0.lcssa for.body: ; preds = %for.body.preheader, %for.body %indvars.iv = phi i64 [ 0, %for.body.preheader ], [ %indvars.iv.next, %for.body ] %i.013 = phi i32 [ 0, %for.body.preheader ], [ %inc, %for.body ] %sum.012 = phi i8 [ 0, %for.body.preheader ], [ %add, %for.body ] %add.ptr1 = getelementptr inbounds i8, i8* %add.ptr, i64 %indvars.iv %1 = load i8, i8* %add.ptr1, align 1 %add = add i8 %1, %sum.012 %indvars.iv.next = add nsw i64 %indvars.iv, %0 %inc = add nuw nsw i32 %i.013, 1 %exitcond.not = icmp eq i32 %inc, %n br i1 %exitcond.not, label %for.cond.cleanup, label %for.body }