blob: f573fdab1b153d2eb5f77ec7e98ad8a5d96d15de [file] [log] [blame] [edit]
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mcpu=ppc -mtriple=powerpc64-unknown-linux-gnu | FileCheck %s --check-prefixes=PPC64
; RUN: llc < %s -mtriple=powerpc-unknown-linux-gnu | FileCheck %s --check-prefixes=PPC32
define { i128, i8 } @muloti_test(i128 %l, i128 %r) unnamed_addr #0 {
; PPC64-LABEL: muloti_test:
; PPC64: # %bb.0: # %start
; PPC64-NEXT: addic 9, 5, -1
; PPC64-NEXT: mulld 10, 5, 4
; PPC64-NEXT: mulld 11, 3, 6
; PPC64-NEXT: subfe 9, 9, 5
; PPC64-NEXT: add 10, 11, 10
; PPC64-NEXT: addic 11, 3, -1
; PPC64-NEXT: mulhdu 8, 3, 6
; PPC64-NEXT: subfe 3, 11, 3
; PPC64-NEXT: and 3, 3, 9
; PPC64-NEXT: addic 9, 8, -1
; PPC64-NEXT: subfe 8, 9, 8
; PPC64-NEXT: or 3, 3, 8
; PPC64-NEXT: mulhdu 5, 5, 4
; PPC64-NEXT: addic 8, 5, -1
; PPC64-NEXT: subfe 5, 8, 5
; PPC64-NEXT: li 7, 0
; PPC64-NEXT: or 5, 3, 5
; PPC64-NEXT: mulhdu 8, 4, 6
; PPC64-NEXT: addc 3, 8, 10
; PPC64-NEXT: addze 7, 7
; PPC64-NEXT: addic 8, 7, -1
; PPC64-NEXT: subfe 7, 8, 7
; PPC64-NEXT: or 5, 5, 7
; PPC64-NEXT: mulld 4, 4, 6
; PPC64-NEXT: blr
;
; PPC32-LABEL: muloti_test:
; PPC32: # %bb.0: # %start
; PPC32-NEXT: stwu 1, -64(1)
; PPC32-NEXT: stw 26, 40(1) # 4-byte Folded Spill
; PPC32-NEXT: mfcr 12
; PPC32-NEXT: stw 27, 44(1) # 4-byte Folded Spill
; PPC32-NEXT: mullw 27, 9, 4
; PPC32-NEXT: stw 21, 20(1) # 4-byte Folded Spill
; PPC32-NEXT: mr 11, 7
; PPC32-NEXT: stw 22, 24(1) # 4-byte Folded Spill
; PPC32-NEXT: li 7, 0
; PPC32-NEXT: mullw 26, 3, 10
; PPC32-NEXT: stw 23, 28(1) # 4-byte Folded Spill
; PPC32-NEXT: add 27, 26, 27
; PPC32-NEXT: stw 24, 32(1) # 4-byte Folded Spill
; PPC32-NEXT: cmpwi 7, 11, 0
; PPC32-NEXT: stw 25, 36(1) # 4-byte Folded Spill
; PPC32-NEXT: mullw 24, 11, 6
; PPC32-NEXT: stw 28, 48(1) # 4-byte Folded Spill
; PPC32-NEXT: stw 29, 52(1) # 4-byte Folded Spill
; PPC32-NEXT: stw 30, 56(1) # 4-byte Folded Spill
; PPC32-NEXT: mulhwu 0, 8, 6
; PPC32-NEXT: stw 12, 16(1)
; PPC32-NEXT: mr 12, 5
; PPC32-NEXT: mulhwu 5, 4, 10
; PPC32-NEXT: addc 5, 5, 27
; PPC32-NEXT: addze 27, 7
; PPC32-NEXT: cmpwi 2, 27, 0
; PPC32-NEXT: mullw 25, 12, 8
; PPC32-NEXT: add 26, 24, 25
; PPC32-NEXT: addc 0, 0, 26
; PPC32-NEXT: addze 26, 7
; PPC32-NEXT: mullw 23, 8, 6
; PPC32-NEXT: mullw 22, 4, 10
; PPC32-NEXT: addc 24, 22, 23
; PPC32-NEXT: adde 22, 5, 0
; PPC32-NEXT: mulhwu 29, 6, 10
; PPC32-NEXT: mullw 21, 12, 10
; PPC32-NEXT: addc 5, 21, 29
; PPC32-NEXT: mulhwu 30, 12, 10
; PPC32-NEXT: addze 0, 30
; PPC32-NEXT: mullw 23, 6, 9
; PPC32-NEXT: addc 5, 23, 5
; PPC32-NEXT: mulhwu 28, 6, 9
; PPC32-NEXT: addze 29, 28
; PPC32-NEXT: addc 0, 0, 29
; PPC32-NEXT: addze 29, 7
; PPC32-NEXT: mullw 30, 12, 9
; PPC32-NEXT: addc 0, 30, 0
; PPC32-NEXT: mulhwu 25, 12, 9
; PPC32-NEXT: adde 30, 25, 29
; PPC32-NEXT: addc 0, 0, 24
; PPC32-NEXT: adde 30, 30, 22
; PPC32-NEXT: addze. 29, 7
; PPC32-NEXT: mcrf 1, 0
; PPC32-NEXT: mulhwu. 29, 11, 6
; PPC32-NEXT: mcrf 6, 0
; PPC32-NEXT: mulhwu. 29, 12, 8
; PPC32-NEXT: mcrf 5, 0
; PPC32-NEXT: cmpwi 12, 0
; PPC32-NEXT: crnor 20, 2, 30
; PPC32-NEXT: cmpwi 3, 0
; PPC32-NEXT: cmpwi 7, 9, 0
; PPC32-NEXT: crnor 24, 30, 2
; PPC32-NEXT: mulhwu. 12, 3, 10
; PPC32-NEXT: crorc 20, 20, 26
; PPC32-NEXT: mcrf 7, 0
; PPC32-NEXT: crorc 20, 20, 22
; PPC32-NEXT: cmpwi 26, 0
; PPC32-NEXT: crorc 28, 20, 2
; PPC32-NEXT: mulhwu. 9, 9, 4
; PPC32-NEXT: mcrf 5, 0
; PPC32-NEXT: crorc 20, 24, 30
; PPC32-NEXT: or. 3, 4, 3
; PPC32-NEXT: mcrf 6, 0
; PPC32-NEXT: crorc 20, 20, 22
; PPC32-NEXT: or. 3, 8, 11
; PPC32-NEXT: crorc 20, 20, 10
; PPC32-NEXT: crnor 21, 2, 26
; PPC32-NEXT: cror 20, 21, 20
; PPC32-NEXT: cror 20, 20, 28
; PPC32-NEXT: crandc 20, 6, 20
; PPC32-NEXT: mullw 6, 6, 10
; PPC32-NEXT: bc 12, 20, .LBB0_2
; PPC32-NEXT: # %bb.1: # %start
; PPC32-NEXT: li 7, 1
; PPC32-NEXT: .LBB0_2: # %start
; PPC32-NEXT: lwz 12, 16(1)
; PPC32-NEXT: mr 3, 30
; PPC32-NEXT: mr 4, 0
; PPC32-NEXT: lwz 30, 56(1) # 4-byte Folded Reload
; PPC32-NEXT: mtcrf 32, 12 # cr2
; PPC32-NEXT: lwz 29, 52(1) # 4-byte Folded Reload
; PPC32-NEXT: lwz 28, 48(1) # 4-byte Folded Reload
; PPC32-NEXT: lwz 27, 44(1) # 4-byte Folded Reload
; PPC32-NEXT: lwz 26, 40(1) # 4-byte Folded Reload
; PPC32-NEXT: lwz 25, 36(1) # 4-byte Folded Reload
; PPC32-NEXT: lwz 24, 32(1) # 4-byte Folded Reload
; PPC32-NEXT: lwz 23, 28(1) # 4-byte Folded Reload
; PPC32-NEXT: lwz 22, 24(1) # 4-byte Folded Reload
; PPC32-NEXT: lwz 21, 20(1) # 4-byte Folded Reload
; PPC32-NEXT: addi 1, 1, 64
; PPC32-NEXT: blr
start:
%0 = tail call { i128, i1 } @llvm.umul.with.overflow.i128(i128 %l, i128 %r) #2
%1 = extractvalue { i128, i1 } %0, 0
%2 = extractvalue { i128, i1 } %0, 1
%3 = zext i1 %2 to i8
%4 = insertvalue { i128, i8 } undef, i128 %1, 0
%5 = insertvalue { i128, i8 } %4, i8 %3, 1
ret { i128, i8 } %5
}
; Function Attrs: nounwind readnone speculatable
declare { i128, i1 } @llvm.umul.with.overflow.i128(i128, i128) #1
attributes #0 = { nounwind readnone }
attributes #1 = { nounwind readnone speculatable }
attributes #2 = { nounwind }