1 #include <stdlib.h>
2
3 #define N (1024 * 512)
4 #define COUNTERTYPE unsigned int
5
6 int
7 main (void)
8 {
9 unsigned int *__restrict a;
10 unsigned int *__restrict b;
11 unsigned int *__restrict c;
12
13 a = (unsigned int *__restrict)malloc (N * sizeof (unsigned int));
14 b = (unsigned int *__restrict)malloc (N * sizeof (unsigned int));
15 c = (unsigned int *__restrict)malloc (N * sizeof (unsigned int));
16
17 #pragma acc data copyout (a[0:N])
18 {
19 #pragma acc kernels present (a[0:N])
20 {
21 for (COUNTERTYPE i = 0; i < N; i++)
22 a[i] = i * 2;
23 }
24 }
25
26 #pragma acc data copyout (b[0:N])
27 {
28 #pragma acc kernels present (b[0:N])
29 {
30 for (COUNTERTYPE i = 0; i < N; i++)
31 b[i] = i * 4;
32 }
33 }
34
35 #pragma acc data copyin (a[0:N], b[0:N]) copyout (c[0:N])
36 {
37 #pragma acc kernels present (a[0:N], b[0:N], c[0:N])
38 {
39 for (COUNTERTYPE ii = 0; ii < N; ii++)
40 c[ii] = a[ii] + b[ii];
41 }
42 }
43
44 for (COUNTERTYPE i = 0; i < N; i++)
45 if (c[i] != a[i] + b[i])
46 abort ();
47
48 free (a);
49 free (b);
50 free (c);
51
52 return 0;
53 }