mirror of
				https://github.com/c64scene-ar/llvm-6502.git
				synced 2025-11-03 14:21:30 +00:00 
			
		
		
		
	IR for CUDA should use "nvptx[64]-nvidia-cuda", and IR for NV OpenCL should use "nvptx[64]-nvidia-nvcl" git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@184579 91177308-0d34-0410-b5e6-96231b3b80d8
		
			
				
	
	
		
			20 lines
		
	
	
		
			606 B
		
	
	
	
		
			LLVM
		
	
	
	
	
	
			
		
		
	
	
			20 lines
		
	
	
		
			606 B
		
	
	
	
		
			LLVM
		
	
	
	
	
	
; RUN: llc < %s -march=nvptx -mcpu=sm_20 | FileCheck %s
 | 
						|
 | 
						|
target datalayout = "e-p:32:32:32-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v16:16:16-v32:32:32-v64:64:64-v128:128:128-n16:32:64"
 | 
						|
target triple = "nvptx-nvidia-cuda"
 | 
						|
 | 
						|
; Make sure predicate (i1) operands to kernels get expanded out to .u8
 | 
						|
 | 
						|
; CHECK: .entry foo
 | 
						|
; CHECK:   .param .u8 foo_param_0
 | 
						|
; CHECK:   .param .u32 foo_param_1
 | 
						|
define void @foo(i1 %p, i32* %out) {
 | 
						|
  %val = zext i1 %p to i32
 | 
						|
  store i32 %val, i32* %out
 | 
						|
  ret void
 | 
						|
}
 | 
						|
 | 
						|
 | 
						|
!nvvm.annotations = !{!0}
 | 
						|
!0 = metadata !{void (i1, i32*)* @foo, metadata !"kernel", i32 1}
 |