summaryrefslogtreecommitdiff
path: root/polly/test/GPGPU/managed-pointers-preparation.ll
blob: 473f0c107a21c702390e6f4a75dbd9b4f3d1b6ed (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
; RUN: opt %loadPolly -polly-codegen-ppcg -polly-acc-dump-code \
; RUN: -polly-invariant-load-hoisting \
; RUN: -S -polly-acc-codegen-managed-memory < %s | FileCheck %s

; RUN: opt %loadPolly -polly-codegen-ppcg -polly-acc-dump-code \
; RUN: -polly-invariant-load-hoisting \
; RUN: -S -polly-acc-codegen-managed-memory -disable-output \
; RUN: -polly-acc-dump-code < %s | FileCheck %s -check-prefix=CODE

; REQUIRES: pollyacc

; CHECK: @polly_launchKernel
; CHECK: @polly_launchKernel
; CHECK: @polly_launchKernel
; CHECK: @polly_launchKernel
; CHECK: @polly_launchKernel
; CHECK-NOT: @polly_launchKernel


; CODE:  if (p_0_loaded_from___data_runcontrol_MOD_lmulti_layer == 1) {
; CODE-NEXT:    {
; CODE-NEXT:      dim3 k0_dimBlock;
; CODE-NEXT:      dim3 k0_dimGrid;
; CODE-NEXT:      kernel0 <<<k0_dimGrid, k0_dimBlock>>> (dev_MemRef__pn__phi, p_0_loaded_from___data_runcontrol_MOD_lmulti_layer);
; CODE-NEXT:      cudaCheckKernel();
; CODE-NEXT:    }

; CODE:  } else {
; CODE-NEXT:    {
; CODE-NEXT:      dim3 k1_dimBlock;
; CODE-NEXT:      dim3 k1_dimGrid;
; CODE-NEXT:      kernel1 <<<k1_dimGrid, k1_dimBlock>>> (dev_MemRef__pn__phi, p_0_loaded_from___data_runcontrol_MOD_lmulti_layer);
; CODE-NEXT:      cudaCheckKernel();
; CODE-NEXT:    }

; CHECK that this program is correctly code generated and does not result in
; 'instruction does not dominate use' errors. At an earlier point, such errors
; have been generated as the preparation of the managed memory pointers was
; performed right before kernel0, which does not dominate all other kernels.
; Now the preparation is performed at the very beginning of the scop.

source_filename = "bugpoint-output-c78f41e.bc"
target datalayout = "e-p:64:64:64-S128-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f16:16:16-f32:32:32-f64:64:64-f128:128:128-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64"
target triple = "x86_64-unknown-linux-gnu"

@__data_radiation_MOD_rad_csalbw = external global [10 x double], align 32
@__data_radiation_MOD_coai = external global [168 x double], align 32
@__data_runcontrol_MOD_lmulti_layer = external global i32

; Function Attrs: nounwind uwtable
define void @__radiation_interface_MOD_radiation_init() #0 {
entry:
  br label %"94"

"94":                                             ; preds = %"97", %entry
  br label %"95"

"95":                                             ; preds = %"95", %"94"
  br i1 undef, label %"97", label %"95"

"97":                                             ; preds = %"95"
  br i1 undef, label %"99", label %"94"

"99":                                             ; preds = %"97"
  br label %"102"

"102":                                            ; preds = %"102", %"99"
  %indvars.iv17 = phi i64 [ %indvars.iv.next18, %"102" ], [ 1, %"99" ]
  store double 1.000000e+00, ptr @__data_radiation_MOD_coai, align 8
  %0 = icmp eq i64 %indvars.iv17, 3
  %indvars.iv.next18 = add nuw nsw i64 %indvars.iv17, 1
  br i1 %0, label %"110", label %"102"

"110":                                            ; preds = %"102"
  %1 = load i32, ptr @__data_runcontrol_MOD_lmulti_layer, align 4, !range !0
  %2 = icmp eq i32 %1, 0
  br i1 %2, label %"112", label %"111"

"111":                                            ; preds = %"110"
  br label %"115"

"112":                                            ; preds = %"110"
  br label %"115"

"115":                                            ; preds = %"112", %"111"
  %.pn = phi double [ undef, %"112" ], [ undef, %"111" ]
  %3 = fdiv double 1.000000e+00, %.pn
  br label %"116"

"116":                                            ; preds = %"116", %"115"
  %indvars.iv = phi i64 [ %indvars.iv.next, %"116" ], [ 1, %"115" ]
  %4 = add nsw i64 %indvars.iv, -1
  %5 = fmul double %3, undef
  %6 = getelementptr [10 x double], ptr @__data_radiation_MOD_rad_csalbw, i64 0, i64 %4
  store double %5, ptr %6, align 8
  %7 = icmp eq i64 %indvars.iv, 10
  %indvars.iv.next = add nuw nsw i64 %indvars.iv, 1
  br i1 %7, label %return, label %"116"

return:                                           ; preds = %"116"
  ret void
}

attributes #0 = { nounwind uwtable }

!0 = !{i32 0, i32 2}