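; Check that -nvptx-fma-level controls whether the NVPTX backend emits a fused
; fma.rn instruction (level 1) or separate mul.rn and add.rn instructions
; (level 0) for a floating-point multiply followed by an add.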
; RUN: llc < %s -march=nvptx -mcpu=sm_20 -nvptx-fma-level=1 | FileCheck %s -check-prefix=FMA
; RUN: llc < %s -march=nvptx -mcpu=sm_20 -nvptx-fma-level=0 | FileCheck %s -check-prefix=MUL
; RUN: llc < %s -march=nvptx64 -mcpu=sm_20 -nvptx-fma-level=1 | FileCheck %s -check-prefix=FMA
; RUN: llc < %s -march=nvptx64 -mcpu=sm_20 -nvptx-fma-level=0 | FileCheck %s -check-prefix=MUL

; Single-precision x * y + z.
; Under the FMA prefix (-nvptx-fma-level=1) the multiply and add are expected
; to be emitted as one fma.rn.f32. Under the MUL prefix (-nvptx-fma-level=0)
; they are expected to stay separate, with no fused instruction before the
; multiply. The -LABEL checks pin every match to this function's body so a
; match cannot leak in from another function in the same output.
define ptx_device float @test_mul_add_f(float %x, float %y, float %z) {
entry:
; FMA-LABEL: test_mul_add_f(
; FMA: fma.rn.f32
; MUL-LABEL: test_mul_add_f(
; MUL-NOT: fma.rn.f32
; MUL: mul.rn.f32
; MUL: add.rn.f32
  %a = fmul float %x, %y
  %b = fadd float %a, %z
  ret float %b
}

; Double-precision x * y + z.
; Under the FMA prefix (-nvptx-fma-level=1) the multiply and add are expected
; to be emitted as one fma.rn.f64. Under the MUL prefix (-nvptx-fma-level=0)
; they are expected to stay separate, with no fused instruction before the
; multiply. The -LABEL checks pin every match to this function's body so a
; match cannot leak in from another function in the same output.
define ptx_device double @test_mul_add_d(double %x, double %y, double %z) {
entry:
; FMA-LABEL: test_mul_add_d(
; FMA: fma.rn.f64
; MUL-LABEL: test_mul_add_d(
; MUL-NOT: fma.rn.f64
; MUL: mul.rn.f64
; MUL: add.rn.f64
  %a = fmul double %x, %y
  %b = fadd double %a, %z
  ret double %b
}