672 lines
		
	
	
		
			19 KiB
		
	
	
	
		
			LLVM
		
	
	
	
			
		
		
	
	
			672 lines
		
	
	
		
			19 KiB
		
	
	
	
		
			LLVM
		
	
	
	
| ; RUN: llc -march=arm64 -aarch64-atomic-cfg-tidy=0 -disable-post-ra -verify-machineinstrs < %s | FileCheck %s
 | |
| ; RUN: llc -march=arm64 -aarch64-atomic-cfg-tidy=0 -fast-isel -fast-isel-abort=1 -disable-post-ra -verify-machineinstrs < %s | FileCheck %s
 | |
| 
 | |
| ;
 | |
| ; Get the actual value of the overflow bit.
 | |
| ;
 | |
| define zeroext i1 @saddo1.i32(i32 %v1, i32 %v2, i32* %res) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  saddo1.i32
 | |
| ; CHECK:        adds {{w[0-9]+}}, w0, w1
 | |
| ; CHECK-NEXT:   cset {{w[0-9]+}}, vs
 | |
|   %t = call {i32, i1} @llvm.sadd.with.overflow.i32(i32 %v1, i32 %v2)
 | |
|   %val = extractvalue {i32, i1} %t, 0
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   store i32 %val, i32* %res
 | |
|   ret i1 %obit
 | |
| }
 | |
| 
 | |
| ; Test the immediate version.
 | |
| define zeroext i1 @saddo2.i32(i32 %v1, i32* %res) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  saddo2.i32
 | |
| ; CHECK:        adds {{w[0-9]+}}, w0, #4
 | |
| ; CHECK-NEXT:   cset {{w[0-9]+}}, vs
 | |
|   %t = call {i32, i1} @llvm.sadd.with.overflow.i32(i32 %v1, i32 4)
 | |
|   %val = extractvalue {i32, i1} %t, 0
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   store i32 %val, i32* %res
 | |
|   ret i1 %obit
 | |
| }
 | |
| 
 | |
| ; Test negative immediates.
 | |
| define zeroext i1 @saddo3.i32(i32 %v1, i32* %res) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  saddo3.i32
 | |
| ; CHECK:        subs {{w[0-9]+}}, w0, #4
 | |
| ; CHECK-NEXT:   cset {{w[0-9]+}}, vs
 | |
|   %t = call {i32, i1} @llvm.sadd.with.overflow.i32(i32 %v1, i32 -4)
 | |
|   %val = extractvalue {i32, i1} %t, 0
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   store i32 %val, i32* %res
 | |
|   ret i1 %obit
 | |
| }
 | |
| 
 | |
| ; Test immediates that are too large to be encoded.
 | |
| define zeroext i1 @saddo4.i32(i32 %v1, i32* %res) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  saddo4.i32
 | |
| ; CHECK:        adds {{w[0-9]+}}, w0, {{w[0-9]+}}
 | |
| ; CHECK-NEXT:   cset {{w[0-9]+}}, vs
 | |
|   %t = call {i32, i1} @llvm.sadd.with.overflow.i32(i32 %v1, i32 16777215)
 | |
|   %val = extractvalue {i32, i1} %t, 0
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   store i32 %val, i32* %res
 | |
|   ret i1 %obit
 | |
| }
 | |
| 
 | |
| ; Test shift folding.
 | |
| define zeroext i1 @saddo5.i32(i32 %v1, i32 %v2, i32* %res) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  saddo5.i32
 | |
| ; CHECK:        adds {{w[0-9]+}}, w0, w1
 | |
| ; CHECK-NEXT:   cset {{w[0-9]+}}, vs
 | |
|   %lsl = shl i32 %v2, 16
 | |
|   %t = call {i32, i1} @llvm.sadd.with.overflow.i32(i32 %v1, i32 %lsl)
 | |
|   %val = extractvalue {i32, i1} %t, 0
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   store i32 %val, i32* %res
 | |
|   ret i1 %obit
 | |
| }
 | |
| 
 | |
| define zeroext i1 @saddo1.i64(i64 %v1, i64 %v2, i64* %res) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  saddo1.i64
 | |
| ; CHECK:        adds {{x[0-9]+}}, x0, x1
 | |
| ; CHECK-NEXT:   cset {{w[0-9]+}}, vs
 | |
|   %t = call {i64, i1} @llvm.sadd.with.overflow.i64(i64 %v1, i64 %v2)
 | |
|   %val = extractvalue {i64, i1} %t, 0
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   store i64 %val, i64* %res
 | |
|   ret i1 %obit
 | |
| }
 | |
| 
 | |
| define zeroext i1 @saddo2.i64(i64 %v1, i64* %res) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  saddo2.i64
 | |
| ; CHECK:        adds {{x[0-9]+}}, x0, #4
 | |
| ; CHECK-NEXT:   cset {{w[0-9]+}}, vs
 | |
|   %t = call {i64, i1} @llvm.sadd.with.overflow.i64(i64 %v1, i64 4)
 | |
|   %val = extractvalue {i64, i1} %t, 0
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   store i64 %val, i64* %res
 | |
|   ret i1 %obit
 | |
| }
 | |
| 
 | |
| define zeroext i1 @saddo3.i64(i64 %v1, i64* %res) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  saddo3.i64
 | |
| ; CHECK:        subs {{x[0-9]+}}, x0, #4
 | |
| ; CHECK-NEXT:   cset {{w[0-9]+}}, vs
 | |
|   %t = call {i64, i1} @llvm.sadd.with.overflow.i64(i64 %v1, i64 -4)
 | |
|   %val = extractvalue {i64, i1} %t, 0
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   store i64 %val, i64* %res
 | |
|   ret i1 %obit
 | |
| }
 | |
| 
 | |
| define zeroext i1 @uaddo.i32(i32 %v1, i32 %v2, i32* %res) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  uaddo.i32
 | |
| ; CHECK:        adds {{w[0-9]+}}, w0, w1
 | |
| ; CHECK-NEXT:   cset {{w[0-9]+}}, hs
 | |
|   %t = call {i32, i1} @llvm.uadd.with.overflow.i32(i32 %v1, i32 %v2)
 | |
|   %val = extractvalue {i32, i1} %t, 0
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   store i32 %val, i32* %res
 | |
|   ret i1 %obit
 | |
| }
 | |
| 
 | |
| define zeroext i1 @uaddo.i64(i64 %v1, i64 %v2, i64* %res) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  uaddo.i64
 | |
| ; CHECK:        adds {{x[0-9]+}}, x0, x1
 | |
| ; CHECK-NEXT:   cset {{w[0-9]+}}, hs
 | |
|   %t = call {i64, i1} @llvm.uadd.with.overflow.i64(i64 %v1, i64 %v2)
 | |
|   %val = extractvalue {i64, i1} %t, 0
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   store i64 %val, i64* %res
 | |
|   ret i1 %obit
 | |
| }
 | |
| 
 | |
| define zeroext i1 @ssubo1.i32(i32 %v1, i32 %v2, i32* %res) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  ssubo1.i32
 | |
| ; CHECK:        subs {{w[0-9]+}}, w0, w1
 | |
| ; CHECK-NEXT:   cset {{w[0-9]+}}, vs
 | |
|   %t = call {i32, i1} @llvm.ssub.with.overflow.i32(i32 %v1, i32 %v2)
 | |
|   %val = extractvalue {i32, i1} %t, 0
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   store i32 %val, i32* %res
 | |
|   ret i1 %obit
 | |
| }
 | |
| 
 | |
| define zeroext i1 @ssubo2.i32(i32 %v1, i32* %res) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  ssubo2.i32
 | |
| ; CHECK:        adds {{w[0-9]+}}, w0, #4
 | |
| ; CHECK-NEXT:   cset {{w[0-9]+}}, vs
 | |
|   %t = call {i32, i1} @llvm.ssub.with.overflow.i32(i32 %v1, i32 -4)
 | |
|   %val = extractvalue {i32, i1} %t, 0
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   store i32 %val, i32* %res
 | |
|   ret i1 %obit
 | |
| }
 | |
| 
 | |
| define zeroext i1 @ssubo.i64(i64 %v1, i64 %v2, i64* %res) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  ssubo.i64
 | |
| ; CHECK:        subs {{x[0-9]+}}, x0, x1
 | |
| ; CHECK-NEXT:   cset {{w[0-9]+}}, vs
 | |
|   %t = call {i64, i1} @llvm.ssub.with.overflow.i64(i64 %v1, i64 %v2)
 | |
|   %val = extractvalue {i64, i1} %t, 0
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   store i64 %val, i64* %res
 | |
|   ret i1 %obit
 | |
| }
 | |
| 
 | |
| define zeroext i1 @usubo.i32(i32 %v1, i32 %v2, i32* %res) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  usubo.i32
 | |
| ; CHECK:        subs {{w[0-9]+}}, w0, w1
 | |
| ; CHECK-NEXT:   cset {{w[0-9]+}}, lo
 | |
|   %t = call {i32, i1} @llvm.usub.with.overflow.i32(i32 %v1, i32 %v2)
 | |
|   %val = extractvalue {i32, i1} %t, 0
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   store i32 %val, i32* %res
 | |
|   ret i1 %obit
 | |
| }
 | |
| 
 | |
| define zeroext i1 @usubo.i64(i64 %v1, i64 %v2, i64* %res) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  usubo.i64
 | |
| ; CHECK:        subs {{x[0-9]+}}, x0, x1
 | |
| ; CHECK-NEXT:   cset {{w[0-9]+}}, lo
 | |
|   %t = call {i64, i1} @llvm.usub.with.overflow.i64(i64 %v1, i64 %v2)
 | |
|   %val = extractvalue {i64, i1} %t, 0
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   store i64 %val, i64* %res
 | |
|   ret i1 %obit
 | |
| }
 | |
| 
 | |
| define zeroext i1 @smulo.i32(i32 %v1, i32 %v2, i32* %res) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  smulo.i32
 | |
| ; CHECK:        smull x[[MREG:[0-9]+]], w0, w1
 | |
| ; CHECK-NEXT:   lsr x[[SREG:[0-9]+]], x[[MREG]], #32
 | |
| ; CHECK-NEXT:   cmp w[[SREG]], w[[MREG]], asr #31
 | |
| ; CHECK-NEXT:   cset {{w[0-9]+}}, ne
 | |
|   %t = call {i32, i1} @llvm.smul.with.overflow.i32(i32 %v1, i32 %v2)
 | |
|   %val = extractvalue {i32, i1} %t, 0
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   store i32 %val, i32* %res
 | |
|   ret i1 %obit
 | |
| }
 | |
| 
 | |
| define zeroext i1 @smulo.i64(i64 %v1, i64 %v2, i64* %res) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  smulo.i64
 | |
| ; CHECK:        mul [[MREG:x[0-9]+]], x0, x1
 | |
| ; CHECK-NEXT:   smulh [[HREG:x[0-9]+]], x0, x1
 | |
| ; CHECK-NEXT:   cmp [[HREG]], [[MREG]], asr #63
 | |
| ; CHECK-NEXT:   cset {{w[0-9]+}}, ne
 | |
|   %t = call {i64, i1} @llvm.smul.with.overflow.i64(i64 %v1, i64 %v2)
 | |
|   %val = extractvalue {i64, i1} %t, 0
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   store i64 %val, i64* %res
 | |
|   ret i1 %obit
 | |
| }
 | |
| 
 | |
| define zeroext i1 @smulo2.i64(i64 %v1, i64* %res) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  smulo2.i64
 | |
| ; CHECK:        adds [[MREG:x[0-9]+]], x0, x0
 | |
| ; CHECK-NEXT:   cset {{w[0-9]+}}, vs
 | |
|   %t = call {i64, i1} @llvm.smul.with.overflow.i64(i64 %v1, i64 2)
 | |
|   %val = extractvalue {i64, i1} %t, 0
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   store i64 %val, i64* %res
 | |
|   ret i1 %obit
 | |
| }
 | |
| 
 | |
| define zeroext i1 @umulo.i32(i32 %v1, i32 %v2, i32* %res) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  umulo.i32
 | |
| ; CHECK:        umull [[MREG:x[0-9]+]], w0, w1
 | |
| ; CHECK-NEXT:   cmp xzr, [[MREG]], lsr #32
 | |
| ; CHECK-NEXT:   cset {{w[0-9]+}}, ne
 | |
|   %t = call {i32, i1} @llvm.umul.with.overflow.i32(i32 %v1, i32 %v2)
 | |
|   %val = extractvalue {i32, i1} %t, 0
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   store i32 %val, i32* %res
 | |
|   ret i1 %obit
 | |
| }
 | |
| 
 | |
| define zeroext i1 @umulo.i64(i64 %v1, i64 %v2, i64* %res) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  umulo.i64
 | |
| ; CHECK:        umulh [[MREG:x[0-9]+]], x0, x1
 | |
| ; CHECK-NEXT:   cmp xzr, [[MREG]]
 | |
| ; CHECK-NEXT:   cset {{w[0-9]+}}, ne
 | |
|   %t = call {i64, i1} @llvm.umul.with.overflow.i64(i64 %v1, i64 %v2)
 | |
|   %val = extractvalue {i64, i1} %t, 0
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   store i64 %val, i64* %res
 | |
|   ret i1 %obit
 | |
| }
 | |
| 
 | |
| define zeroext i1 @umulo2.i64(i64 %v1, i64* %res) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  umulo2.i64
 | |
| ; CHECK:        adds [[MREG:x[0-9]+]], x0, x0
 | |
| ; CHECK-NEXT:   cset {{w[0-9]+}}, hs
 | |
|   %t = call {i64, i1} @llvm.umul.with.overflow.i64(i64 %v1, i64 2)
 | |
|   %val = extractvalue {i64, i1} %t, 0
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   store i64 %val, i64* %res
 | |
|   ret i1 %obit
 | |
| }
 | |
| 
 | |
| 
 | |
| ;
 | |
| ; Check the use of the overflow bit in combination with a select instruction.
 | |
| ;
 | |
| define i32 @saddo.select.i32(i32 %v1, i32 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  saddo.select.i32
 | |
| ; CHECK:        cmn w0, w1
 | |
| ; CHECK-NEXT:   csel w0, w0, w1, vs
 | |
|   %t = call {i32, i1} @llvm.sadd.with.overflow.i32(i32 %v1, i32 %v2)
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   %ret = select i1 %obit, i32 %v1, i32 %v2
 | |
|   ret i32 %ret
 | |
| }
 | |
| 
 | |
| define i64 @saddo.select.i64(i64 %v1, i64 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  saddo.select.i64
 | |
| ; CHECK:        cmn x0, x1
 | |
| ; CHECK-NEXT:   csel x0, x0, x1, vs
 | |
|   %t = call {i64, i1} @llvm.sadd.with.overflow.i64(i64 %v1, i64 %v2)
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   %ret = select i1 %obit, i64 %v1, i64 %v2
 | |
|   ret i64 %ret
 | |
| }
 | |
| 
 | |
| define i32 @uaddo.select.i32(i32 %v1, i32 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  uaddo.select.i32
 | |
| ; CHECK:        cmn w0, w1
 | |
| ; CHECK-NEXT:   csel w0, w0, w1, hs
 | |
|   %t = call {i32, i1} @llvm.uadd.with.overflow.i32(i32 %v1, i32 %v2)
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   %ret = select i1 %obit, i32 %v1, i32 %v2
 | |
|   ret i32 %ret
 | |
| }
 | |
| 
 | |
| define i64 @uaddo.select.i64(i64 %v1, i64 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  uaddo.select.i64
 | |
| ; CHECK:        cmn x0, x1
 | |
| ; CHECK-NEXT:   csel x0, x0, x1, hs
 | |
|   %t = call {i64, i1} @llvm.uadd.with.overflow.i64(i64 %v1, i64 %v2)
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   %ret = select i1 %obit, i64 %v1, i64 %v2
 | |
|   ret i64 %ret
 | |
| }
 | |
| 
 | |
| define i32 @ssubo.select.i32(i32 %v1, i32 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  ssubo.select.i32
 | |
| ; CHECK:        cmp w0, w1
 | |
| ; CHECK-NEXT:   csel w0, w0, w1, vs
 | |
|   %t = call {i32, i1} @llvm.ssub.with.overflow.i32(i32 %v1, i32 %v2)
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   %ret = select i1 %obit, i32 %v1, i32 %v2
 | |
|   ret i32 %ret
 | |
| }
 | |
| 
 | |
| define i64 @ssubo.select.i64(i64 %v1, i64 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  ssubo.select.i64
 | |
| ; CHECK:        cmp x0, x1
 | |
| ; CHECK-NEXT:   csel x0, x0, x1, vs
 | |
|   %t = call {i64, i1} @llvm.ssub.with.overflow.i64(i64 %v1, i64 %v2)
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   %ret = select i1 %obit, i64 %v1, i64 %v2
 | |
|   ret i64 %ret
 | |
| }
 | |
| 
 | |
| define i32 @usubo.select.i32(i32 %v1, i32 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  usubo.select.i32
 | |
| ; CHECK:        cmp w0, w1
 | |
| ; CHECK-NEXT:   csel w0, w0, w1, lo
 | |
|   %t = call {i32, i1} @llvm.usub.with.overflow.i32(i32 %v1, i32 %v2)
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   %ret = select i1 %obit, i32 %v1, i32 %v2
 | |
|   ret i32 %ret
 | |
| }
 | |
| 
 | |
| define i64 @usubo.select.i64(i64 %v1, i64 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  usubo.select.i64
 | |
| ; CHECK:        cmp x0, x1
 | |
| ; CHECK-NEXT:   csel x0, x0, x1, lo
 | |
|   %t = call {i64, i1} @llvm.usub.with.overflow.i64(i64 %v1, i64 %v2)
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   %ret = select i1 %obit, i64 %v1, i64 %v2
 | |
|   ret i64 %ret
 | |
| }
 | |
| 
 | |
| define i32 @smulo.select.i32(i32 %v1, i32 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  smulo.select.i32
 | |
| ; CHECK:        smull   x[[MREG:[0-9]+]], w0, w1
 | |
| ; CHECK-NEXT:   lsr     x[[SREG:[0-9]+]], x[[MREG]], #32
 | |
| ; CHECK-NEXT:   cmp     w[[SREG]], w[[MREG]], asr #31
 | |
| ; CHECK-NEXT:   csel    w0, w0, w1, ne
 | |
|   %t = call {i32, i1} @llvm.smul.with.overflow.i32(i32 %v1, i32 %v2)
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   %ret = select i1 %obit, i32 %v1, i32 %v2
 | |
|   ret i32 %ret
 | |
| }
 | |
| 
 | |
| define i64 @smulo.select.i64(i64 %v1, i64 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  smulo.select.i64
 | |
| ; CHECK:        mul     [[MREG:x[0-9]+]], x0, x1
 | |
| ; CHECK-NEXT:   smulh   [[HREG:x[0-9]+]], x0, x1
 | |
| ; CHECK-NEXT:   cmp     [[HREG]], [[MREG]], asr #63
 | |
| ; CHECK-NEXT:   csel    x0, x0, x1, ne
 | |
|   %t = call {i64, i1} @llvm.smul.with.overflow.i64(i64 %v1, i64 %v2)
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   %ret = select i1 %obit, i64 %v1, i64 %v2
 | |
|   ret i64 %ret
 | |
| }
 | |
| 
 | |
| define i32 @umulo.select.i32(i32 %v1, i32 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  umulo.select.i32
 | |
| ; CHECK:        umull   [[MREG:x[0-9]+]], w0, w1
 | |
| ; CHECK-NEXT:   cmp     xzr, [[MREG]], lsr #32
 | |
| ; CHECK-NEXT:   csel    w0, w0, w1, ne
 | |
|   %t = call {i32, i1} @llvm.umul.with.overflow.i32(i32 %v1, i32 %v2)
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   %ret = select i1 %obit, i32 %v1, i32 %v2
 | |
|   ret i32 %ret
 | |
| }
 | |
| 
 | |
| define i64 @umulo.select.i64(i64 %v1, i64 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  umulo.select.i64
 | |
| ; CHECK:        umulh   [[MREG:x[0-9]+]], x0, x1
 | |
| ; CHECK-NEXT:   cmp     xzr, [[MREG]]
 | |
| ; CHECK-NEXT:   csel    x0, x0, x1, ne
 | |
|   %t = call {i64, i1} @llvm.umul.with.overflow.i64(i64 %v1, i64 %v2)
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   %ret = select i1 %obit, i64 %v1, i64 %v2
 | |
|   ret i64 %ret
 | |
| }
 | |
| 
 | |
| 
 | |
| ;
 | |
| ; Check the use of the overflow bit in combination with a branch instruction.
 | |
| ;
 | |
| define zeroext i1 @saddo.br.i32(i32 %v1, i32 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  saddo.br.i32
 | |
| ; CHECK:        cmn w0, w1
 | |
| ; CHECK-NEXT:   b.vc
 | |
|   %t = call {i32, i1} @llvm.sadd.with.overflow.i32(i32 %v1, i32 %v2)
 | |
|   %val = extractvalue {i32, i1} %t, 0
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   br i1 %obit, label %overflow, label %continue
 | |
| 
 | |
| overflow:
 | |
|   ret i1 false
 | |
| 
 | |
| continue:
 | |
|   ret i1 true
 | |
| }
 | |
| 
 | |
| define zeroext i1 @saddo.br.i64(i64 %v1, i64 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  saddo.br.i64
 | |
| ; CHECK:        cmn x0, x1
 | |
| ; CHECK-NEXT:   b.vc
 | |
|   %t = call {i64, i1} @llvm.sadd.with.overflow.i64(i64 %v1, i64 %v2)
 | |
|   %val = extractvalue {i64, i1} %t, 0
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   br i1 %obit, label %overflow, label %continue
 | |
| 
 | |
| overflow:
 | |
|   ret i1 false
 | |
| 
 | |
| continue:
 | |
|   ret i1 true
 | |
| }
 | |
| 
 | |
| define zeroext i1 @uaddo.br.i32(i32 %v1, i32 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  uaddo.br.i32
 | |
| ; CHECK:        cmn w0, w1
 | |
| ; CHECK-NEXT:   b.lo
 | |
|   %t = call {i32, i1} @llvm.uadd.with.overflow.i32(i32 %v1, i32 %v2)
 | |
|   %val = extractvalue {i32, i1} %t, 0
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   br i1 %obit, label %overflow, label %continue
 | |
| 
 | |
| overflow:
 | |
|   ret i1 false
 | |
| 
 | |
| continue:
 | |
|   ret i1 true
 | |
| }
 | |
| 
 | |
| define zeroext i1 @uaddo.br.i64(i64 %v1, i64 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  uaddo.br.i64
 | |
| ; CHECK:        cmn x0, x1
 | |
| ; CHECK-NEXT:   b.lo
 | |
|   %t = call {i64, i1} @llvm.uadd.with.overflow.i64(i64 %v1, i64 %v2)
 | |
|   %val = extractvalue {i64, i1} %t, 0
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   br i1 %obit, label %overflow, label %continue
 | |
| 
 | |
| overflow:
 | |
|   ret i1 false
 | |
| 
 | |
| continue:
 | |
|   ret i1 true
 | |
| }
 | |
| 
 | |
| define zeroext i1 @ssubo.br.i32(i32 %v1, i32 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  ssubo.br.i32
 | |
| ; CHECK:        cmp w0, w1
 | |
| ; CHECK-NEXT:   b.vc
 | |
|   %t = call {i32, i1} @llvm.ssub.with.overflow.i32(i32 %v1, i32 %v2)
 | |
|   %val = extractvalue {i32, i1} %t, 0
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   br i1 %obit, label %overflow, label %continue
 | |
| 
 | |
| overflow:
 | |
|   ret i1 false
 | |
| 
 | |
| continue:
 | |
|   ret i1 true
 | |
| }
 | |
| 
 | |
| define zeroext i1 @ssubo.br.i64(i64 %v1, i64 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  ssubo.br.i64
 | |
| ; CHECK:        cmp x0, x1
 | |
| ; CHECK-NEXT:   b.vc
 | |
|   %t = call {i64, i1} @llvm.ssub.with.overflow.i64(i64 %v1, i64 %v2)
 | |
|   %val = extractvalue {i64, i1} %t, 0
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   br i1 %obit, label %overflow, label %continue
 | |
| 
 | |
| overflow:
 | |
|   ret i1 false
 | |
| 
 | |
| continue:
 | |
|   ret i1 true
 | |
| }
 | |
| 
 | |
| define zeroext i1 @usubo.br.i32(i32 %v1, i32 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  usubo.br.i32
 | |
| ; CHECK:        cmp w0, w1
 | |
| ; CHECK-NEXT:   b.hs
 | |
|   %t = call {i32, i1} @llvm.usub.with.overflow.i32(i32 %v1, i32 %v2)
 | |
|   %val = extractvalue {i32, i1} %t, 0
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   br i1 %obit, label %overflow, label %continue
 | |
| 
 | |
| overflow:
 | |
|   ret i1 false
 | |
| 
 | |
| continue:
 | |
|   ret i1 true
 | |
| }
 | |
| 
 | |
| define zeroext i1 @usubo.br.i64(i64 %v1, i64 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  usubo.br.i64
 | |
| ; CHECK:        cmp x0, x1
 | |
| ; CHECK-NEXT:   b.hs
 | |
|   %t = call {i64, i1} @llvm.usub.with.overflow.i64(i64 %v1, i64 %v2)
 | |
|   %val = extractvalue {i64, i1} %t, 0
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   br i1 %obit, label %overflow, label %continue
 | |
| 
 | |
| overflow:
 | |
|   ret i1 false
 | |
| 
 | |
| continue:
 | |
|   ret i1 true
 | |
| }
 | |
| 
 | |
| define zeroext i1 @smulo.br.i32(i32 %v1, i32 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  smulo.br.i32
 | |
| ; CHECK:        smull   x[[MREG:[0-9]+]], w0, w1
 | |
| ; CHECK-NEXT:   lsr     x[[SREG:[0-9]+]], x8, #32
 | |
| ; CHECK-NEXT:   cmp     w[[SREG]], w[[MREG]], asr #31
 | |
| ; CHECK-NEXT:   b.eq
 | |
|   %t = call {i32, i1} @llvm.smul.with.overflow.i32(i32 %v1, i32 %v2)
 | |
|   %val = extractvalue {i32, i1} %t, 0
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   br i1 %obit, label %overflow, label %continue
 | |
| 
 | |
| overflow:
 | |
|   ret i1 false
 | |
| 
 | |
| continue:
 | |
|   ret i1 true
 | |
| }
 | |
| 
 | |
| define zeroext i1 @smulo.br.i64(i64 %v1, i64 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  smulo.br.i64
 | |
| ; CHECK:        mul     [[MREG:x[0-9]+]], x0, x1
 | |
| ; CHECK-NEXT:   smulh   [[HREG:x[0-9]+]], x0, x1
 | |
| ; CHECK-NEXT:   cmp     [[HREG]], [[MREG]], asr #63
 | |
| ; CHECK-NEXT:   b.eq
 | |
|   %t = call {i64, i1} @llvm.smul.with.overflow.i64(i64 %v1, i64 %v2)
 | |
|   %val = extractvalue {i64, i1} %t, 0
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   br i1 %obit, label %overflow, label %continue
 | |
| 
 | |
| overflow:
 | |
|   ret i1 false
 | |
| 
 | |
| continue:
 | |
|   ret i1 true
 | |
| }
 | |
| 
 | |
| define zeroext i1 @smulo2.br.i64(i64 %v1) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  smulo2.br.i64
 | |
| ; CHECK:        cmn  x0, x0
 | |
| ; CHECK-NEXT:   b.vc
 | |
|   %t = call {i64, i1} @llvm.smul.with.overflow.i64(i64 %v1, i64 2)
 | |
|   %val = extractvalue {i64, i1} %t, 0
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   br i1 %obit, label %overflow, label %continue
 | |
| 
 | |
| overflow:
 | |
|   ret i1 false
 | |
| 
 | |
| continue:
 | |
|   ret i1 true
 | |
| }
 | |
| 
 | |
| define zeroext i1 @umulo.br.i32(i32 %v1, i32 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  umulo.br.i32
 | |
| ; CHECK:        umull   [[MREG:x[0-9]+]], w0, w1
 | |
| ; CHECK-NEXT:   cmp     xzr, [[MREG]], lsr #32
 | |
| ; CHECK-NEXT:   b.eq
 | |
|   %t = call {i32, i1} @llvm.umul.with.overflow.i32(i32 %v1, i32 %v2)
 | |
|   %val = extractvalue {i32, i1} %t, 0
 | |
|   %obit = extractvalue {i32, i1} %t, 1
 | |
|   br i1 %obit, label %overflow, label %continue
 | |
| 
 | |
| overflow:
 | |
|   ret i1 false
 | |
| 
 | |
| continue:
 | |
|   ret i1 true
 | |
| }
 | |
| 
 | |
| define zeroext i1 @umulo.br.i64(i64 %v1, i64 %v2) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  umulo.br.i64
 | |
| ; CHECK:        umulh   [[REG:x[0-9]+]], x0, x1
 | |
| ; CHECK-NEXT:   {{cbz|cmp}}
 | |
|   %t = call {i64, i1} @llvm.umul.with.overflow.i64(i64 %v1, i64 %v2)
 | |
|   %val = extractvalue {i64, i1} %t, 0
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   br i1 %obit, label %overflow, label %continue
 | |
| 
 | |
| overflow:
 | |
|   ret i1 false
 | |
| 
 | |
| continue:
 | |
|   ret i1 true
 | |
| }
 | |
| 
 | |
| define zeroext i1 @umulo2.br.i64(i64 %v1) {
 | |
| entry:
 | |
| ; CHECK-LABEL:  umulo2.br.i64
 | |
| ; CHECK:        cmn  x0, x0
 | |
| ; CHECK-NEXT:   b.lo
 | |
|   %t = call {i64, i1} @llvm.umul.with.overflow.i64(i64 %v1, i64 2)
 | |
|   %val = extractvalue {i64, i1} %t, 0
 | |
|   %obit = extractvalue {i64, i1} %t, 1
 | |
|   br i1 %obit, label %overflow, label %continue
 | |
| 
 | |
| overflow:
 | |
|   ret i1 false
 | |
| 
 | |
| continue:
 | |
|   ret i1 true
 | |
| }
 | |
| 
 | |
| declare {i32, i1} @llvm.sadd.with.overflow.i32(i32, i32) nounwind readnone
 | |
| declare {i64, i1} @llvm.sadd.with.overflow.i64(i64, i64) nounwind readnone
 | |
| declare {i32, i1} @llvm.uadd.with.overflow.i32(i32, i32) nounwind readnone
 | |
| declare {i64, i1} @llvm.uadd.with.overflow.i64(i64, i64) nounwind readnone
 | |
| declare {i32, i1} @llvm.ssub.with.overflow.i32(i32, i32) nounwind readnone
 | |
| declare {i64, i1} @llvm.ssub.with.overflow.i64(i64, i64) nounwind readnone
 | |
| declare {i32, i1} @llvm.usub.with.overflow.i32(i32, i32) nounwind readnone
 | |
| declare {i64, i1} @llvm.usub.with.overflow.i64(i64, i64) nounwind readnone
 | |
| declare {i32, i1} @llvm.smul.with.overflow.i32(i32, i32) nounwind readnone
 | |
| declare {i64, i1} @llvm.smul.with.overflow.i64(i64, i64) nounwind readnone
 | |
| declare {i32, i1} @llvm.umul.with.overflow.i32(i32, i32) nounwind readnone
 | |
| declare {i64, i1} @llvm.umul.with.overflow.i64(i64, i64) nounwind readnone
 | |
| 
 |