// RUN: %clang_cc1 -verify -fopenmp -triple x86_64-apple-darwin10.6.0 -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm-bc -o %t-host.bc %s // RUN: %clang_cc1 -verify -fopenmp -triple nvptx64-nvidia-cuda -fopenmp-targets=nvptx64-nvidia-cuda -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-host.bc -o - -disable-llvm-optzns | FileCheck %s // expected-no-diagnostics #ifndef HEADER #define HEADER #pragma omp declare target typedef void **omp_allocator_handle_t; extern const omp_allocator_handle_t omp_default_mem_alloc; extern const omp_allocator_handle_t omp_large_cap_mem_alloc; extern const omp_allocator_handle_t omp_const_mem_alloc; extern const omp_allocator_handle_t omp_high_bw_mem_alloc; extern const omp_allocator_handle_t omp_low_lat_mem_alloc; extern const omp_allocator_handle_t omp_cgroup_mem_alloc; extern const omp_allocator_handle_t omp_pteam_mem_alloc; extern const omp_allocator_handle_t omp_thread_mem_alloc; // CHECK-DAG: @{{.+}}St1{{.+}}b{{.+}} = external global i32, // CHECK-DAG: @a ={{ dso_local | }}global i32 0, // CHECK-DAG: @b ={{ dso_local | }}addrspace(4) global i32 0, // CHECK-DAG: @c ={{ dso_local | }}global i32 0, // CHECK-DAG: @d ={{ dso_local | }}global %struct.St1 zeroinitializer, // CHECK-DAG: @{{.+}}ns{{.+}}a{{.+}} ={{ dso_local | }}addrspace(3) global i32 0, // CHECK-DAG: @{{.+}}main{{.+}}a{{.*}} = internal global i32 0, // CHECK-DAG: @{{.+}}ST{{.+}}m{{.+}} = external global i32, // CHECK-DAG: @bar_c = internal global i32 0, // CHECK-DAG: @bar_b = internal addrspace(3) global double 0.000000e+00, struct St{ int a; }; struct St1{ int a; static int b; #pragma omp allocate(b) allocator(omp_default_mem_alloc) } d; int a, b, c; #pragma omp allocate(a) allocator(omp_large_cap_mem_alloc) #pragma omp allocate(b) allocator(omp_const_mem_alloc) #pragma omp allocate(d, c) allocator(omp_high_bw_mem_alloc) template struct ST { static T m; #pragma omp allocate(m) allocator(omp_low_lat_mem_alloc) }; template T foo() { T v; #pragma omp allocate(v) allocator(omp_cgroup_mem_alloc) v = ST::m; return v; } namespace ns{ int a; } #pragma omp allocate(ns::a) allocator(omp_pteam_mem_alloc) // CHECK-LABEL: @main int main () { // CHECK: alloca double, static int a; #pragma omp allocate(a) allocator(omp_thread_mem_alloc) a=2; double b = 3; float c; #pragma omp allocate(b) allocator(omp_default_mem_alloc) #pragma omp allocate(c) allocator(omp_cgroup_mem_alloc) return (foo()); } // CHECK: define {{.*}}i32 @{{.+}}foo{{.+}}() // CHECK-NOT: alloca i32, extern template int ST::m; void baz(float &); // CHECK: define{{ dso_local | }}void @{{.+}}bar{{.+}}() void bar() { // CHECK: alloca float, float bar_a; // CHECK: alloca double, double bar_b; int bar_c; #pragma omp allocate(bar_c) allocator(omp_cgroup_mem_alloc) // CHECK: call void [[OUTLINED:@.+]](i32* %{{.+}}, i32* %{{.+}}) #pragma omp parallel private(bar_a, bar_b) allocate(omp_thread_mem_alloc \ : bar_a) allocate(omp_pteam_mem_alloc \ : bar_b) { bar_b = bar_a; baz(bar_a); } // CHECK: define internal void [[OUTLINED]](i32* noalias %{{.+}}, i32* noalias %{{.+}}) // CHECK-NOT: alloca double, // CHECK: alloca float, // CHECK-NOT: alloca double, // CHECK: load float, float* % // CHECK: store double {{.+}}, double addrspace(3)* @bar_b, } #pragma omp end declare target #endif