diff options
Diffstat (limited to 'libgomp/testsuite/libgomp.oacc-c-c++-common/loop-red-gwv-1.c')
-rw-r--r-- | libgomp/testsuite/libgomp.oacc-c-c++-common/loop-red-gwv-1.c | 56 |
1 files changed, 56 insertions, 0 deletions
diff --git a/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-red-gwv-1.c b/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-red-gwv-1.c new file mode 100644 index 00000000000..1663e65e81a --- /dev/null +++ b/libgomp/testsuite/libgomp.oacc-c-c++-common/loop-red-gwv-1.c @@ -0,0 +1,56 @@ +/* { dg-do run } */ +/* { dg-additional-options "-O2" */ + +#include <stdio.h> + +#define N (32*32*32+17) +int main () +{ + int ix; + int ondev = 0; + int t = 0, h = 0; + +#pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) copy(t) copy(ondev) + { +#pragma acc loop gang worker vector reduction(+:t) + for (unsigned ix = 0; ix < N; ix++) + { + int val = ix; + + if (__builtin_acc_on_device (5)) + { + int g = 0, w = 0, v = 0; + + __asm__ volatile ("mov.u32 %0,%%ctaid.x;" : "=r" (g)); + __asm__ volatile ("mov.u32 %0,%%tid.y;" : "=r" (w)); + __asm__ volatile ("mov.u32 %0,%%tid.x;" : "=r" (v)); + val = (g << 16) | (w << 8) | v; + ondev = 1; + } + t += val; + } + } + + for (ix = 0; ix < N; ix++) + { + int val = ix; + if(ondev) + { + int chunk_size = (N + 32*32*32 - 1) / (32*32*32); + + int g = ix / (chunk_size * 32 * 32); + int w = ix / 32 % 32; + int v = ix % 32; + + val = (g << 16) | (w << 8) | v; + } + h += val; + } + if (t != h) + { + printf ("t=%x expected %x\n", t, h); + return 1; + } + + return 0; +} |