; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc -O0 < %s | FileCheck %s

; Codegen regression test: compiles the function below with llc at -O0 for
; powerpc64le and compares the emitted assembly against the assertions that
; are embedded in the function header. Those assertions are autogenerated
; (see the NOTE line at the top), so regenerate them with that script
; instead of editing them by hand.

target datalayout = "e-m:e-i64:64-n32:64"
target triple = "powerpc64le-unknown-linux-gnu"

; Multi-word unsigned arithmetic on 64-bit limbs, carried out in i128:
;   - reads a[0], a[1], b[0] and b[1];
;   - forms three 64x64 -> 128-bit products (b[0]*a[0], a[1]*a[0], b[1]*b[0]);
;   - adds the high halves of two partial sums as i64 values and stores to
;     r[0] a 0/1 flag telling whether that final 64-bit addition wrapped.
; NOTE(review): the function name suggests this was reduced from a bignum
; "comba" multiplication routine - not confirmable from this file alone.
define void @bn_mul_comba8(i64* nocapture %r, i64* nocapture readonly %a, i64* nocapture readonly %b) {
; CHECK-LABEL: bn_mul_comba8:
; CHECK: # %bb.0:
; CHECK-NEXT: std 4, -8(1) # 8-byte Folded Spill
; CHECK-NEXT: mr 4, 3
; CHECK-NEXT: ld 3, -8(1) # 8-byte Folded Reload
; CHECK-NEXT: ld 9, 0(3)
; CHECK-NEXT: ld 8, 0(5)
; CHECK-NEXT: mulhdu 7, 8, 9
; CHECK-NEXT: ld 3, 8(3)
; CHECK-NEXT: mulld 6, 3, 9
; CHECK-NEXT: mulhdu 3, 3, 9
; CHECK-NEXT: addc 6, 6, 7
; CHECK-NEXT: addze 3, 3
; CHECK-NEXT: ld 5, 8(5)
; CHECK-NEXT: mulld 7, 5, 8
; CHECK-NEXT: mulhdu 5, 5, 8
; CHECK-NEXT: addc 6, 6, 7
; CHECK-NEXT: addze 5, 5
; CHECK-NEXT: add 3, 5, 3
; CHECK-NEXT: cmpld 3, 5
; CHECK-NEXT: crmove 20, 0
; CHECK-NEXT: li 5, 0
; CHECK-NEXT: li 3, 1
; CHECK-NEXT: isel 3, 3, 5, 20
; CHECK-NEXT: std 3, 0(4)
; CHECK-NEXT: blr
  ; Load a[0] and b[0] and widen both to i128 so the products below keep all
  ; 128 bits.
  %1 = load i64, i64* %a, align 8
  %conv = zext i64 %1 to i128
  %2 = load i64, i64* %b, align 8
  %conv2 = zext i64 %2 to i128
  ; b[0] * a[0]; both operands are zero-extended 64-bit values, so the
  ; product always fits in 128 bits (hence nuw). Only the high half is used.
  %mul = mul nuw i128 %conv2, %conv
  %shr = lshr i128 %mul, 64
  ; a[1] * a[0], plus the high half of the previous product.
  %agep = getelementptr inbounds i64, i64* %a, i64 1
  %3 = load i64, i64* %agep, align 8
  %conv14 = zext i64 %3 to i128
  %mul15 = mul nuw i128 %conv14, %conv
  %add17 = add i128 %mul15, %shr
  ; High 64 bits of that sum, kept as the first i64 addend.
  %shr19 = lshr i128 %add17, 64
  %conv20 = trunc i128 %shr19 to i64
  ; b[1] * b[0], added to the low 64 bits of the previous sum
  ; (18446744073709551615 is 2^64 - 1, i.e. a mask for the low limb).
  %bgep = getelementptr inbounds i64, i64* %b, i64 1
  %4 = load i64, i64* %bgep, align 8
  %conv28 = zext i64 %4 to i128
  %mul31 = mul nuw i128 %conv28, %conv2
  %conv32 = and i128 %add17, 18446744073709551615
  %add33 = add i128 %conv32, %mul31
  ; High 64 bits of the second sum, kept as the second i64 addend.
  %shr35 = lshr i128 %add33, 64
  %conv36 = trunc i128 %shr35 to i64
  ; Add the two high halves in 64 bits. The sum being unsigned-less-than one
  ; of its addends means the addition wrapped, so the compare yields the
  ; carry-out bit.
  %add37 = add i64 %conv36, %conv20
  %cmp38 = icmp ult i64 %add37, %conv36
  ; Widen the carry flag to i64 (0 or 1) and store it to r[0].
  %conv148 = zext i1 %cmp38 to i64
  store i64 %conv148, i64* %r, align 8
  ret void
}