
Some systems do not have <alloca.h> but provide alloca differently, e.g. via stdlib.h. Do it like other testcases do and use __builtin_alloca. libgomp/ChangeLog: PR testsuite/102910 * testsuite/libgomp.oacc-c-c++-common/loop-gwv-2.c: Use __builtin_alloca instead of #include <alloca.h> + alloca.
105 lines
3.4 KiB
C
105 lines
3.4 KiB
C
/* { dg-additional-options "-fopt-info-note-omp" }
|
|
{ dg-additional-options "--param=openacc-privatization=noisy" }
|
|
{ dg-additional-options "-foffload=-fopt-info-note-omp" }
|
|
{ dg-additional-options "-foffload=--param=openacc-privatization=noisy" }
|
|
for testing/documenting aspects of that functionality. */
|
|
|
|
#include <stdio.h>
|
|
#include <openacc.h>
|
|
#include <string.h>
|
|
#include <gomp-constants.h>
|
|
#include <stdlib.h>
|
|
|
|
#if 0
|
|
#define DEBUG(DIM, IDX, VAL) \
|
|
fprintf (stderr, "%sdist[%d] = %d\n", (DIM), (IDX), (VAL))
|
|
#else
|
|
#define DEBUG(DIM, IDX, VAL)
|
|
#endif
|
|
|
|
#define N (32*32*32)
|
|
|
|
int
|
|
check (const char *dim, int *dist, int dimsize)
|
|
{
|
|
int ix;
|
|
int exit = 0;
|
|
|
|
for (ix = 0; ix < dimsize; ix++)
|
|
{
|
|
DEBUG(dim, ix, dist[ix]);
|
|
if (dist[ix] < (N) / (dimsize + 0.5)
|
|
|| dist[ix] > (N) / (dimsize - 0.5))
|
|
{
|
|
fprintf (stderr, "did not distribute to %ss (%d not between %d "
|
|
"and %d)\n", dim, dist[ix], (int) ((N) / (dimsize + 0.5)),
|
|
(int) ((N) / (dimsize - 0.5)));
|
|
exit |= 1;
|
|
}
|
|
}
|
|
|
|
return exit;
|
|
}
|
|
|
|
int main ()
|
|
{
|
|
int ary[N];
|
|
int ix;
|
|
int exit = 0;
|
|
int gangsize = 0, workersize = 0, vectorsize = 0;
|
|
int *gangdist, *workerdist, *vectordist;
|
|
|
|
for (ix = 0; ix < N;ix++)
|
|
ary[ix] = -1;
|
|
|
|
#pragma acc parallel num_gangs(32) num_workers(32) vector_length(32) \
|
|
copy(ary) copyout(gangsize, workersize, vectorsize)
|
|
/* { dg-note {variable 'ix' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } .-2 } */
|
|
{
|
|
#pragma acc loop gang worker vector
|
|
/* { dg-note {variable 'ix' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } .-1 } */
|
|
/* { dg-note {variable 'g' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } .-2 } */
|
|
/* { dg-note {variable 'w' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } .-3 } */
|
|
/* { dg-note {variable 'v' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} "" { target *-*-* } .-4 } */
|
|
for (unsigned ix = 0; ix < N; ix++)
|
|
{
|
|
int g, w, v;
|
|
|
|
g = __builtin_goacc_parlevel_id (GOMP_DIM_GANG);
|
|
w = __builtin_goacc_parlevel_id (GOMP_DIM_WORKER);
|
|
v = __builtin_goacc_parlevel_id (GOMP_DIM_VECTOR);
|
|
|
|
ary[ix] = (g << 16) | (w << 8) | v;
|
|
}
|
|
|
|
gangsize = __builtin_goacc_parlevel_size (GOMP_DIM_GANG);
|
|
workersize = __builtin_goacc_parlevel_size (GOMP_DIM_WORKER);
|
|
vectorsize = __builtin_goacc_parlevel_size (GOMP_DIM_VECTOR);
|
|
}
|
|
|
|
gangdist = (int *) __builtin_alloca (gangsize * sizeof (int));
|
|
workerdist = (int *) __builtin_alloca (workersize * sizeof (int));
|
|
vectordist = (int *) __builtin_alloca (vectorsize * sizeof (int));
|
|
memset (gangdist, 0, gangsize * sizeof (int));
|
|
memset (workerdist, 0, workersize * sizeof (int));
|
|
memset (vectordist, 0, vectorsize * sizeof (int));
|
|
|
|
/* Test that work is shared approximately equally amongst each active
|
|
gang/worker/vector. */
|
|
for (ix = 0; ix < N; ix++)
|
|
{
|
|
int g = (ary[ix] >> 16) & 255;
|
|
int w = (ary[ix] >> 8) & 255;
|
|
int v = ary[ix] & 255;
|
|
|
|
gangdist[g]++;
|
|
workerdist[w]++;
|
|
vectordist[v]++;
|
|
}
|
|
|
|
exit = check ("gang", gangdist, gangsize);
|
|
exit |= check ("worker", workerdist, workersize);
|
|
exit |= check ("vector", vectordist, vectorsize);
|
|
|
|
return exit;
|
|
}
|