animeshk-amd created this revision.
animeshk-amd added reviewers: saiislam, JonChesterfield.
Herald added subscribers: guansong, yaxunl.
Herald added a project: All.
animeshk-amd requested review of this revision.
Herald added a reviewer: jdoerfert.
Herald added subscribers: cfe-commits, sstefan1.
Herald added a project: clang.

This patch adds a lit test based on the tests in the
tests/5.0/metadirective directory of the SOLLVE repository:
https://github.com/SOLLVE/sollve_vv


Repository:
  rG LLVM Github Monorepo

https://reviews.llvm.org/D131763

Files:
  clang/test/OpenMP/metadirective_device_arch_codegen_amd_or_nvidia.c

Index: clang/test/OpenMP/metadirective_device_arch_codegen_amd_or_nvidia.c
===================================================================
--- /dev/null
+++ clang/test/OpenMP/metadirective_device_arch_codegen_amd_or_nvidia.c
@@ -0,0 +1,122 @@
+// REQUIRES: amdgpu-registered-target
+
+// RUN: %clang_cc1 -fopenmp -x c++ -w -std=c++11 -triple x86_64-unknown-unknown -fopenmp-targets=amdgcn-amd-amdhsa -emit-llvm-bc %s -o %t-ppc-host.bc
+// RUN: %clang_cc1 -fopenmp -x c++ -w -std=c++11 -triple amdgcn-amd-amdhsa -fopenmp-targets=amdgcn-amd-amdhsa -emit-llvm %s -fopenmp-is-device -fopenmp-host-ir-file-path %t-ppc-host.bc -target-cpu gfx906 -o - | FileCheck %s
+// expected-no-diagnostics
+
+
+/*===-----------------------------------------------------------------------=== 
+
+Inspired by SOLLVE tests:
+ - 5.0/metadirective/test_metadirective_arch_is_nvidia.c
+ - 5.0/metadirective/test_metadirective_arch_nvidia_or_amd.c
+
+===------------------------------------------------------------------------===*/
+
+
+#define N 1024
+// Codegen input: a target region whose loop directive is selected by an OpenMP metadirective keyed on the device arch.
+int metadirective1() {
+   // v1 and v2 are mapped to the device and v3 is mapped back; none of the arrays is initialized here.
+   int v1[N], v2[N], v3[N];
+   // NOTE(review): default_device is read by the device() clause below without being assigned; host_device_num is never used.
+   int target_device_num, host_device_num, default_device;
+   int errors = 0;
+   // target_device_num appears only in the map(from:) clause; nothing inside the region writes it.
+   #pragma omp target map(to:v1,v2) map(from:v3, target_device_num) device(default_device)
+   {
+      #pragma omp metadirective \
+                   when(device={arch("amdgcn")}: teams distribute parallel for) \
+                   default(parallel for)
+         // When the arch selector matches "amdgcn" this loop is a `teams distribute parallel for`; otherwise a `parallel for`.
+         for (int i = 0; i < N; i++) {
+	    #pragma omp atomic write
+            v3[i] = v1[i] * v2[i];
+         }
+   }
+   // errors is never modified above, so this always returns 0.
+   return errors;
+}
+
+// CHECK-LABEL: define weak_odr amdgpu_kernel void {{.+}}metadirective1
+// CHECK: entry:
+// CHECK: %{{[0-9]+}} = call i32 @__kmpc_target_init
+// CHECK: user_code.entry:
+// CHECK: call void @__omp_outlined__
+// CHECK-NOT: call void @__kmpc_parallel_51
+// CHECK: ret void
+
+
+// CHECK-LABEL: define internal void @__omp_outlined__
+// CHECK: entry:
+// CHECK: call void @__kmpc_distribute_static_init
+// CHECK: omp.loop.exit:  
+// CHECK: call void @__kmpc_distribute_static_fini
+
+
+// CHECK-LABEL: define internal void @__omp_outlined__.{{[0-9]+}}
+// CHECK: entry:
+// CHECK: call void @__kmpc_for_static_init_4
+// CHECK: omp.inner.for.body:
+// CHECK: store atomic {{.*}} monotonic
+// CHECK: omp.loop.exit:                                    
+// CHECK-NEXT: call void @__kmpc_distribute_static_fini
+// CHECK-NEXT: ret void
+
+
+// Codegen input: a target region whose teams construct (with its num_teams/thread_limit) is selected by implementation vendor.
+int metadirective2() {
+   int errors = 0; // never modified in this function
+   // NOTE(review): device_num is read by the device() clause without being assigned; initial_device is only named in map(from:).
+   int i, device_num, initial_device;
+   int a[N];
+   // Every vendor-specific variant requests num_teams(512); thread_limit is 32 for nvidia and 64 for amd and llvm.
+     #pragma omp target device(device_num) map(from:initial_device)
+     {
+       #pragma omp metadirective \
+                  when( implementation={vendor(nvidia)}: \
+                        teams num_teams(512) thread_limit(32) ) \
+                  when( implementation={vendor(amd)}: \
+                        teams num_teams(512) thread_limit(64) ) \
+                  when( implementation={vendor(llvm)}: \
+                        teams num_teams(512) thread_limit(64) ) \
+                  default (teams)
+       #pragma omp distribute parallel for
+         for (i = 0; i < N; i++) {
+            #pragma omp atomic write
+            a[i] = i;
+         }
+     }
+   return errors; // always 0, see above
+}
+
+
+
+
+// CHECK-LABEL: define weak_odr amdgpu_kernel void {{.+}}metadirective2
+// CHECK: entry:
+// CHECK: %{{[0-9]+}} = call i32 @__kmpc_target_init
+// CHECK: user_code.entry:
+// CHECK: call void @__omp_outlined__.{{[0-9]+}}
+// CHECK: call void @__kmpc_target_deinit
+
+
+// CHECK-LABEL: define internal void @__omp_outlined__.{{[0-9]+}}
+// CHECK: entry:
+// CHECK: call void @__kmpc_distribute_static_init_4
+// CHECK: omp.inner.for.body:
+// CHECK: call void @__kmpc_parallel_51({{.*}}ptr @__omp_outlined__.{{[0-9]+.*}})
+// CHECK: omp.loop.exit:                                    
+// CHECK-NEXT: call void @__kmpc_distribute_static_fini
+
+
+// CHECK-LABEL: define internal void @__omp_outlined__.{{[0-9]+}}
+// CHECK: entry:
+// CHECK: call void @__kmpc_for_static_init_4
+// CHECK: omp.inner.for.body:
+// CHECK: store atomic {{.*}} monotonic
+// CHECK: omp.loop.exit:                                    
+// CHECK-NEXT: call void @__kmpc_distribute_static_fini
+
+
+// CHECK: attributes #{{[0-9]+}} = {{.*}} "omp_target_num_teams"="512"
\ No newline at end of file
_______________________________________________
cfe-commits mailing list
cfe-commits@lists.llvm.org
https://lists.llvm.org/cgi-bin/mailman/listinfo/cfe-commits

Reply via email to