Changeset View
Changeset View
Standalone View
Standalone View
test/GPGPU/kernel-params-only-some-arrays.ll
Show All 10 Lines | |||||
; void kernel_params_only_some_arrays(float A[], float B[]) { | ; void kernel_params_only_some_arrays(float A[], float B[]) { | ||||
; for (long i = 0; i < 32; i++) | ; for (long i = 0; i < 32; i++) | ||||
; A[i] += 42; | ; A[i] += 42; | ||||
; | ; | ||||
; for (long i = 0; i < 32; i++) | ; for (long i = 0; i < 32; i++) | ||||
; B[i] += 42; | ; B[i] += 42; | ||||
; } | ; } | ||||
; KERNEL: ; ModuleID = 'FUNC_kernel_params_only_some_arrays_KERNEL_0' | ; KERNEL: ; ModuleID = 'FUNC_kernel_params_only_some_arrays_SCOP_0_KERNEL_0' | ||||
; KERNEL-NEXT: source_filename = "FUNC_kernel_params_only_some_arrays_KERNEL_0" | ; KERNEL-NEXT: source_filename = "FUNC_kernel_params_only_some_arrays_SCOP_0_KERNEL_0" | ||||
; KERNEL-NEXT: target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v16:16:16-v32:32:32-v64:64:64-v128:128:128-n16:32:64" | ; KERNEL-NEXT: target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v16:16:16-v32:32:32-v64:64:64-v128:128:128-n16:32:64" | ||||
; KERNEL-NEXT: target triple = "nvptx64-nvidia-cuda" | ; KERNEL-NEXT: target triple = "nvptx64-nvidia-cuda" | ||||
; KERNEL: define ptx_kernel void @FUNC_kernel_params_only_some_arrays_KERNEL_0(i8 addrspace(1)* %MemRef_A) | ; KERNEL: define ptx_kernel void @FUNC_kernel_params_only_some_arrays_SCOP_0_KERNEL_0(i8 addrspace(1)* %MemRef_A) | ||||
; KERNEL-NEXT: entry: | ; KERNEL-NEXT: entry: | ||||
; KERNEL-NEXT: %0 = call i32 @llvm.nvvm.read.ptx.sreg.ctaid.x() | ; KERNEL-NEXT: %0 = call i32 @llvm.nvvm.read.ptx.sreg.ctaid.x() | ||||
; KERNEL-NEXT: %b0 = zext i32 %0 to i64 | ; KERNEL-NEXT: %b0 = zext i32 %0 to i64 | ||||
; KERNEL-NEXT: %1 = call i32 @llvm.nvvm.read.ptx.sreg.tid.x() | ; KERNEL-NEXT: %1 = call i32 @llvm.nvvm.read.ptx.sreg.tid.x() | ||||
; KERNEL-NEXT: %t0 = zext i32 %1 to i64 | ; KERNEL-NEXT: %t0 = zext i32 %1 to i64 | ||||
; KERNEL: ret void | ; KERNEL: ret void | ||||
; KERNEL-NEXT: } | ; KERNEL-NEXT: } | ||||
; KERNEL: ; ModuleID = 'FUNC_kernel_params_only_some_arrays_KERNEL_1' | ; KERNEL: ; ModuleID = 'FUNC_kernel_params_only_some_arrays_SCOP_0_KERNEL_1' | ||||
; KERNEL-NEXT: source_filename = "FUNC_kernel_params_only_some_arrays_KERNEL_1" | ; KERNEL-NEXT: source_filename = "FUNC_kernel_params_only_some_arrays_SCOP_0_KERNEL_1" | ||||
; KERNEL-NEXT: target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v16:16:16-v32:32:32-v64:64:64-v128:128:128-n16:32:64" | ; KERNEL-NEXT: target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v16:16:16-v32:32:32-v64:64:64-v128:128:128-n16:32:64" | ||||
; KERNEL-NEXT: target triple = "nvptx64-nvidia-cuda" | ; KERNEL-NEXT: target triple = "nvptx64-nvidia-cuda" | ||||
; KERNEL: define ptx_kernel void @FUNC_kernel_params_only_some_arrays_KERNEL_1(i8 addrspace(1)* %MemRef_B) | ; KERNEL: define ptx_kernel void @FUNC_kernel_params_only_some_arrays_SCOP_0_KERNEL_1(i8 addrspace(1)* %MemRef_B) | ||||
; KERNEL-NEXT: entry: | ; KERNEL-NEXT: entry: | ||||
; KERNEL-NEXT: %0 = call i32 @llvm.nvvm.read.ptx.sreg.ctaid.x() | ; KERNEL-NEXT: %0 = call i32 @llvm.nvvm.read.ptx.sreg.ctaid.x() | ||||
; KERNEL-NEXT: %b0 = zext i32 %0 to i64 | ; KERNEL-NEXT: %b0 = zext i32 %0 to i64 | ||||
; KERNEL-NEXT: %1 = call i32 @llvm.nvvm.read.ptx.sreg.tid.x() | ; KERNEL-NEXT: %1 = call i32 @llvm.nvvm.read.ptx.sreg.tid.x() | ||||
; KERNEL-NEXT: %t0 = zext i32 %1 to i64 | ; KERNEL-NEXT: %t0 = zext i32 %1 to i64 | ||||
; KERNEL: ret void | ; KERNEL: ret void | ||||
; KERNEL-NEXT: } | ; KERNEL-NEXT: } | ||||
▲ Show 20 Lines • Show All 58 Lines • Show Last 20 Lines |