view libgomp/testsuite/libgomp.oacc-c-c++-common/gang-static-2.c @ 120:f93fa5091070

fix conv1.c
author mir3636
date Thu, 08 Mar 2018 14:53:42 +0900
parents 04ced10e8804
children 84e7813d76e9
line wrap: on
line source

/* { dg-do run { target openacc_nvidia_accel_selected } } */
/* This code uses nvptx inline assembly guarded with acc_on_device, which is
   not optimized away at -O0, and then confuses the target assembler.
   { dg-skip-if "" { *-*-* } { "-O0" } { "" } } */

#include <assert.h>
#include <openacc.h>

#define N 100

#define GANG_ID(I)						\
  (acc_on_device (acc_device_nvidia)				\
   ? ({unsigned __r;						\
       __asm__ volatile ("mov.u32 %0,%%ctaid.x;" : "=r" (__r));	\
       __r; }) : (I))

int
test_static(int *a, int num_gangs, int sarg)
{
  int i, j;

  if (sarg == 0)
    sarg = 1;

  for (i = 0; i < N / sarg; i++)
    for (j = 0; j < sarg; j++)
      assert (a[i*sarg+j] == i % num_gangs);
}

int
test_nonstatic(int *a, int gangs)
{
  int i, j;

  for (i = 0; i < N; i+=gangs)
    for (j = 0; j < gangs; j++)
      assert (a[i+j] == i/gangs);
}

int
main ()
{
  int a[N];
  int i, x;

#pragma acc parallel loop gang (static:*) num_gangs (10)
  for (i = 0; i < 100; i++)
    a[i] = GANG_ID (i);

  test_nonstatic (a, 10);

#pragma acc parallel loop gang (static:1) num_gangs (10)
  for (i = 0; i < 100; i++)
    a[i] = GANG_ID (i);

  test_static (a, 10, 1);

#pragma acc parallel loop gang (static:2) num_gangs (10)
  for (i = 0; i < 100; i++)
    a[i] = GANG_ID (i);

  test_static (a, 10, 2);

#pragma acc parallel loop gang (static:5) num_gangs (10)
  for (i = 0; i < 100; i++)
    a[i] = GANG_ID (i);

  test_static (a, 10, 5);

#pragma acc parallel loop gang (static:20) num_gangs (10)
  for (i = 0; i < 100; i++)
    a[i] = GANG_ID (i);

  test_static (a, 10, 20);

  /* Non-static gang.  */
#pragma acc parallel loop gang num_gangs (10)
  for (i = 0; i < 100; i++)
    a[i] = GANG_ID (i);

  test_nonstatic (a, 10);

  /* Static arguments with a variable expression.  */

  x = 20;
#pragma acc parallel loop gang (static:0+x) num_gangs (10)
  for (i = 0; i < 100; i++)
    a[i] = GANG_ID (i);

  test_static (a, 10, 20);

  x = 20;
#pragma acc parallel loop gang (static:x) num_gangs (10)
  for (i = 0; i < 100; i++)
    a[i] = GANG_ID (i);

  test_static (a, 10, 20);

  return 0;
}