You've already forked linux-packaging-mono
							
							
		
			
				
	
	
		
			68 lines
		
	
	
		
			2.6 KiB
		
	
	
	
		
			LLVM
		
	
	
	
	
	
			
		
		
	
	
			68 lines
		
	
	
		
			2.6 KiB
		
	
	
	
		
			LLVM
		
	
	
	
	
	
| ; RUN: llc -march=amdgcn < %s | FileCheck -check-prefix=SI -check-prefix=FUNC %s
 | |
| ; Make sure we don't try to form FMAX_LEGACY nodes with f64
 | |
| 
 | |
; AMDGPU intrinsic yielding an i32 work-item id (x component). Each kernel in
; this file calls it to pick the element of %in that it loads from.
declare i32 @llvm.amdgcn.workitem.id.x() #1
 | |
| 
 | |
; Kernel under test: stores (a uge b) ? a : b to %out, where a = in[tid] and
; b = in[tid + 1] are doubles and tid is the x work-item id. `uge` is the
; "unordered or greater-than-or-equal" floating-point predicate.
;
; Per the note at the top of this file, this compare+select on f64 must not be
; formed into an FMAX_LEGACY node, so no v_max_legacy instruction may show up
; anywhere in the code emitted for this function.
; FUNC-LABEL: @test_fmax_legacy_uge_f64
; SI-NOT: v_max_legacy
define amdgpu_kernel void @test_fmax_legacy_uge_f64(double addrspace(1)* %out, double addrspace(1)* %in) #0 {
  ; Address two adjacent doubles, starting at the element indexed by tid.
  %tid = call i32 @llvm.amdgcn.workitem.id.x() #1
  %gep.0 = getelementptr double, double addrspace(1)* %in, i32 %tid
  %gep.1 = getelementptr double, double addrspace(1)* %gep.0, i32 1

  %a = load double, double addrspace(1)* %gep.0, align 8
  %b = load double, double addrspace(1)* %gep.1, align 8

  ; The pattern being tested: pick %a when the compare is true, else %b.
  %cmp = fcmp uge double %a, %b
  %val = select i1 %cmp, double %a, double %b
  store double %val, double addrspace(1)* %out, align 8
  ret void
}
 | |
| 
 | |
; Kernel under test: stores (a oge b) ? a : b to %out, where a = in[tid] and
; b = in[tid + 1] are doubles and tid is the x work-item id. `oge` is the
; "ordered and greater-than-or-equal" floating-point predicate.
;
; Per the note at the top of this file, this compare+select on f64 must not be
; formed into an FMAX_LEGACY node, so no v_max_legacy instruction may show up
; anywhere in the code emitted for this function.
; FUNC-LABEL: @test_fmax_legacy_oge_f64
; SI-NOT: v_max_legacy
define amdgpu_kernel void @test_fmax_legacy_oge_f64(double addrspace(1)* %out, double addrspace(1)* %in) #0 {
  ; Address two adjacent doubles, starting at the element indexed by tid.
  %tid = call i32 @llvm.amdgcn.workitem.id.x() #1
  %gep.0 = getelementptr double, double addrspace(1)* %in, i32 %tid
  %gep.1 = getelementptr double, double addrspace(1)* %gep.0, i32 1

  %a = load double, double addrspace(1)* %gep.0, align 8
  %b = load double, double addrspace(1)* %gep.1, align 8

  ; The pattern being tested: pick %a when the compare is true, else %b.
  %cmp = fcmp oge double %a, %b
  %val = select i1 %cmp, double %a, double %b
  store double %val, double addrspace(1)* %out, align 8
  ret void
}
 | |
| 
 | |
; Kernel under test: stores (a ugt b) ? a : b to %out, where a = in[tid] and
; b = in[tid + 1] are doubles and tid is the x work-item id. `ugt` is the
; "unordered or greater-than" floating-point predicate.
;
; Per the note at the top of this file, this compare+select on f64 must not be
; formed into an FMAX_LEGACY node, so no v_max_legacy instruction may show up
; anywhere in the code emitted for this function.
; FUNC-LABEL: @test_fmax_legacy_ugt_f64
; SI-NOT: v_max_legacy
define amdgpu_kernel void @test_fmax_legacy_ugt_f64(double addrspace(1)* %out, double addrspace(1)* %in) #0 {
  ; Address two adjacent doubles, starting at the element indexed by tid.
  %tid = call i32 @llvm.amdgcn.workitem.id.x() #1
  %gep.0 = getelementptr double, double addrspace(1)* %in, i32 %tid
  %gep.1 = getelementptr double, double addrspace(1)* %gep.0, i32 1

  %a = load double, double addrspace(1)* %gep.0, align 8
  %b = load double, double addrspace(1)* %gep.1, align 8

  ; The pattern being tested: pick %a when the compare is true, else %b.
  %cmp = fcmp ugt double %a, %b
  %val = select i1 %cmp, double %a, double %b
  store double %val, double addrspace(1)* %out, align 8
  ret void
}
 | |
| 
 | |
; Kernel under test: stores (a ogt b) ? a : b to %out, where a = in[tid] and
; b = in[tid + 1] are doubles and tid is the x work-item id. `ogt` is the
; "ordered and greater-than" floating-point predicate.
;
; Per the note at the top of this file, this compare+select on f64 must not be
; formed into an FMAX_LEGACY node, so no v_max_legacy instruction may show up
; anywhere in the code emitted for this function.
; FUNC-LABEL: @test_fmax_legacy_ogt_f64
; SI-NOT: v_max_legacy
define amdgpu_kernel void @test_fmax_legacy_ogt_f64(double addrspace(1)* %out, double addrspace(1)* %in) #0 {
  ; Address two adjacent doubles, starting at the element indexed by tid.
  %tid = call i32 @llvm.amdgcn.workitem.id.x() #1
  %gep.0 = getelementptr double, double addrspace(1)* %in, i32 %tid
  %gep.1 = getelementptr double, double addrspace(1)* %gep.0, i32 1

  %a = load double, double addrspace(1)* %gep.0, align 8
  %b = load double, double addrspace(1)* %gep.1, align 8

  ; The pattern being tested: pick %a when the compare is true, else %b.
  %cmp = fcmp ogt double %a, %b
  %val = select i1 %cmp, double %a, double %b
  store double %val, double addrspace(1)* %out, align 8
  ret void
}
 | |
| 
 | |
; Attribute group #0 is attached to every kernel definition in this file.
attributes #0 = { nounwind }

; Attribute group #1 is attached to the workitem-id intrinsic declaration and
; to each call of it.
attributes #1 = { nounwind readnone }
 |