libgomp/testsuite/libgomp.oacc-c-c++-common/loop-red-w-2.c - gcc - Git at Google

 /* This code uses nvptx inline assembly guarded with acc_on_device, which is
    not optimized away at -O0, and then confuses the target assembler.
    { dg-skip-if "" { *-*-* } { "-O0" } { "" } } */

 #include <stdio.h>

 /* Trip count shared by the offloaded reduction loop and the host-side
    check loop in main.  32*32*32+17 leaves a remainder of 17 when divided
    by 32, so it is not a multiple of the num_workers(32) /
    vector_length(32) values requested on the parallel construct.  */
 #define N (32*32*32+17)
 /* Run a worker-partitioned "+" reduction over N iterations inside an
    OpenACC parallel region, recompute the expected sum on the host and
    compare the two.  Returns 0 when the sums agree; otherwise prints both
    values in hex and returns 1.  */
 int main ()
 {
   int ix;
   /* Set to 1 inside the parallel region when the acc_on_device guard is
      taken; copied back to the host by the copy(ondev) clause.  */
   int ondev = 0;
   /* q receives the reduction result from the region, h is the host-side
      reference value.  */
   int q = 0,  h = 0;

   /* Parallel region requesting 32 workers and a vector length of 32.  */
 #pragma acc parallel num_workers(32) vector_length(32) copy(q) copy(ondev)
   {
     int t = q;

     /* Worker-partitioned loop; t is combined across workers with "+".
        Note that this loop declares its own unsigned ix, which shadows the
        int ix declared at function scope.  */
 #pragma acc loop worker reduction(+:t)
     for (unsigned ix = 0; ix < N; ix++)
       {
 	int val = ix;

 	/* NOTE(review): 5 is presumably the device-type code for nvptx,
 	   since the file header describes the asm below as nvptx assembly
 	   -- confirm against the libgomp device constants.  */
 	if (__builtin_acc_on_device (5))
 	  {
 	    int g = 0, w = 0, v = 0;

 	    /* Read the PTX special registers %ctaid.x, %tid.y and %tid.x.
 	       NOTE(review): g/w/v presumably stand for the gang, worker
 	       and vector positions -- confirm against the nvptx mapping.  */
 	    __asm__ volatile ("mov.u32 %0,%%ctaid.x;" : "=r" (g));
 	    __asm__ volatile ("mov.u32 %0,%%tid.y;" : "=r" (w));
 	    __asm__ volatile ("mov.u32 %0,%%tid.x;" : "=r" (v));
 	    /* Replace the iteration index with a packed id: g shifted left
 	       by 16, w shifted left by 8, v in the low bits.  */
 	    val = (g << 16) | (w << 8) | v;
 	    ondev = 1;
 	  }
 	t += val;
       }
     q = t;
   }

   /* Host-side reference: rebuild the value each iteration is expected to
      have contributed.  */
   for (ix = 0; ix < N; ix++)
     {
       int val = ix;
       if(ondev)
 	{
 	  /* Expected packed id when the device path ran: g == 0, v == 0 and
 	     w == ix % 32.  NOTE(review): this presumably models iterations
 	     being dealt round-robin to the 32 workers -- confirm.  */
 	  int g = 0;
 	  int w = ix % 32;
 	  int v = 0;

 	  val = (g << 16) | (w << 8) | v;
 	}
       h += val;
     }
   if (q != h)
     {
       /* The value labelled "t=" is q, the result copied back from the
          region.  */
       printf ("t=%x expected %x\n", q, h);
       return 1;
     }

   return 0;
 }
	/* This code uses nvptx inline assembly guarded with acc_on_device, which is
	not optimized away at -O0, and then confuses the target assembler.
	{ dg-skip-if "" { *-*-* } { "-O0" } { "" } } */

	#include <stdio.h>

	/* Trip count shared by the offloaded reduction loop and the host-side
	   check loop in main: 32*32*32 plus 17 (32785), which is not a
	   multiple of 32.  */
	#define N (32*32*32+17)
	/* Run a worker-partitioned "+" reduction over N iterations inside an
	   OpenACC parallel region, recompute the expected sum on the host and
	   compare the two.  Returns 0 when the sums agree; otherwise prints
	   both values in hex and returns 1.  */
	int main ()
	{
	  int ix;
	  /* Set to 1 inside the parallel region when the acc_on_device guard
	     is taken; copied back to the host by the copy(ondev) clause.  */
	  int ondev = 0;
	  /* q receives the reduction result from the region, h is the
	     host-side reference value.  */
	  int q = 0, h = 0;

	  /* Parallel region requesting 32 workers and a vector length of 32.  */
	#pragma acc parallel num_workers(32) vector_length(32) copy(q) copy(ondev)
	  {
	    int t = q;

	    /* Worker-partitioned loop; t is combined across workers with "+".
	       This loop declares its own unsigned ix, which shadows the int ix
	       declared at function scope.  */
	#pragma acc loop worker reduction(+:t)
	    for (unsigned ix = 0; ix < N; ix++)
	      {
	        int val = ix;

	        /* NOTE(review): 5 is presumably the device-type code for
	           nvptx, matching the nvptx assembly used below -- confirm
	           against the libgomp device constants.  */
	        if (__builtin_acc_on_device (5))
	          {
	            int g = 0, w = 0, v = 0;

	            /* Read the PTX special registers %ctaid.x, %tid.y and
	               %tid.x.  NOTE(review): g/w/v presumably stand for the
	               gang, worker and vector positions -- confirm.  */
	            __asm__ volatile ("mov.u32 %0,%%ctaid.x;" : "=r" (g));
	            __asm__ volatile ("mov.u32 %0,%%tid.y;" : "=r" (w));
	            __asm__ volatile ("mov.u32 %0,%%tid.x;" : "=r" (v));
	            /* Pack the three ids with bitwise OR: g shifted left by
	               16, w shifted left by 8, v in the low bits.  */
	            val = (g << 16) | (w << 8) | v;
	            ondev = 1;
	          }
	        t += val;
	      }
	    q = t;
	  }

	  /* Host-side reference: rebuild the value each iteration is expected
	     to have contributed.  */
	  for (ix = 0; ix < N; ix++)
	    {
	      int val = ix;
	      if (ondev)
	        {
	          /* Expected packed id when the device path ran: g == 0,
	             v == 0 and w == ix % 32.  NOTE(review): this presumably
	             models iterations being dealt round-robin to the 32
	             workers -- confirm.  */
	          int g = 0;
	          int w = ix % 32;
	          int v = 0;

	          val = (g << 16) | (w << 8) | v;
	        }
	      h += val;
	    }
	  if (q != h)
	    {
	      /* The value labelled "t=" is q, the result copied back from the
	         region.  */
	      printf ("t=%x expected %x\n", q, h);
	      return 1;
	    }

	  return 0;
	}