1  /* Exercise nested function decomposition, gcc/tree-nested.c.  */
       2  /* See gcc/testsuite/gfortran.dg/goacc/nested-function-1.f90 for the Fortran
       3     version.  */
       4  
       5  /* { dg-additional-options "--param=openacc-kernels=decompose" } */
       6  
       7  /* { dg-additional-options "-fopt-info-all-omp" } */
       8  
       9  /* { dg-additional-options "--param=openacc-privatization=noisy" }
      10     Prune a few: uninteresting, and potentially varying depending on GCC configuration (data types):
      11     { dg-prune-output {note: variable 'D\.[0-9]+' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} } */
      12  
      13  /* It's only with Tcl 8.5 (released in 2007) that "the variable 'varName'
      14     passed to 'incr' may be unset, and in that case, it will be set to [...]",
      15     so to maintain compatibility with earlier Tcl releases, we manually
      16     initialize counter variables:
      17     { dg-line l_dummy[variable c_compute_loop 0 c_loop 0] }
      18     { dg-message dummy {} { target iN-VAl-Id } l_dummy } to avoid
      19     "WARNING: dg-line var l_dummy defined, but not used".  */
      20  
      21  int main ()
      22  {
            /* Define two GNU C nested functions, 'local' and 'nonlocal', each
               containing two OpenACC 'kernels loop' constructs, then call both.
               'local' operates only on variables it declares itself, whereas
               'nonlocal' operates on the 'nonlocal_*' variables declared here in
               the enclosing 'main'.  */
      23  #define N 100
      24    int nonlocal_arg;
      25    int nonlocal_a[N];
      26    int nonlocal_i;
      27    int nonlocal_j;
      28  
      29    for (int i = 0; i < N; ++i)
      30      nonlocal_a[i] = 5;
      31    nonlocal_arg = 5;
      32  
            /* Nested function whose OpenACC constructs reference only variables
               declared inside the nested function itself.  */
      33    void local ()
      34    {
      35      int local_i;
      36      int local_arg;
      37      int local_a[N];
      38      int local_j;
      39  
      40      for (int i = 0; i < N; ++i)
      41        local_a[i] = 5;
      42      local_arg = 5;
      43  
              /* First construct: 'gang' takes a 'num:' argument, 'wait' has no
                 argument list, and 'async' takes an argument.  The two inner
                 loops use 'tile(*)' and 'tile(1)', respectively.  Each pragma
                 line bumps its counter so that the expected diagnostics below
                 refer to a unique line marker.  */
      44  #pragma acc kernels loop /* { dg-line l_compute_loop[incr c_compute_loop] } */ \
      45    gang(num:local_arg) worker(local_arg) vector(local_arg) \
      46    wait async(local_arg)
      47      /* { dg-note {OpenACC 'kernels' decomposition: variable 'local_arg' in 'copy' clause requested to be made addressable} {} { target *-*-* } l_compute_loop$c_compute_loop }
      48         { dg-note {variable 'local_arg' made addressable} {} { target *-*-* } l_compute_loop$c_compute_loop } */
      49      /* { dg-note {forwarded loop nest in OpenACC 'kernels' region to 'parloops' for analysis} {} { target *-*-* } l_compute_loop$c_compute_loop } */
      50      /* { dg-note {variable 'local_arg\.[0-9]+' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} {} { target *-*-* } l_compute_loop$c_compute_loop } */
      51      /* { dg-note {variable 'local_i\.[0-9]+' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} {} { target *-*-* } l_compute_loop$c_compute_loop } */
      52      /* { dg-note {variable 'local_i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} {} { target *-*-* } l_compute_loop$c_compute_loop } */
      53      /* { dg-optimized {assigned OpenACC seq loop parallelism} {} { target *-*-* } l_compute_loop$c_compute_loop } */
      54      for (local_i = 0; local_i < N; ++local_i)
      55        {
      56  #pragma acc cache (local_a[local_i:5])
      57  	local_a[local_i] = 100;
      58  #pragma acc loop seq tile(*) /* { dg-line l_loop[incr c_loop] } */
      59  	/* { dg-note {variable 'local_j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} {} { target *-*-* } l_loop$c_loop } */
      60  	for (local_j = 0; local_j < N; ++local_j)
      61  	  ;
      62  #pragma acc loop auto independent tile(1) /* { dg-line l_loop[incr c_loop] } */
      63  	/* { dg-note {variable 'local_j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} {} { target *-*-* } l_loop$c_loop } */
      64  	for (local_j = 0; local_j < N; ++local_j)
      65  	  ;
      66        }
      67  
              /* Second construct: 'gang' takes a 'static:' argument, 'wait' takes
                 an argument list, and 'async' has no argument.  The inner loops
                 use 'tile(1)' and 'tile(*)'.  Because 'local_arg' was handled by
                 the first construct, the expected note here reads "already made
                 addressable".  */
      68  #pragma acc kernels loop /* { dg-line l_compute_loop[incr c_compute_loop] } */ \
      69    gang(static:local_arg) worker(local_arg) vector(local_arg) \
      70    wait(local_arg, local_arg + 1, local_arg + 2) async
      71      /* { dg-note {OpenACC 'kernels' decomposition: variable 'local_arg' in 'copy' clause requested to be made addressable} {} { target *-*-* } l_compute_loop$c_compute_loop }
      72         { dg-note {variable 'local_arg' already made addressable} {} { target *-*-* } l_compute_loop$c_compute_loop } */
      73      /* { dg-note {forwarded loop nest in OpenACC 'kernels' region to 'parloops' for analysis} {} { target *-*-* } l_compute_loop$c_compute_loop } */
      74      /* { dg-note {variable 'local_arg\.[0-9]+' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} {} { target *-*-* } l_compute_loop$c_compute_loop } */
      75      /* { dg-note {variable 'local_i\.[0-9]+' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} {} { target *-*-* } l_compute_loop$c_compute_loop } */
      76      /* { dg-note {variable 'local_i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} {} { target *-*-* } l_compute_loop$c_compute_loop } */
      77      /* { dg-optimized {assigned OpenACC seq loop parallelism} {} { target *-*-* } l_compute_loop$c_compute_loop } */
      78      for (local_i = 0; local_i < N; ++local_i)
      79        {
      80  #pragma acc cache (local_a[local_i:4])
      81  	local_a[local_i] = 100;
      82  #pragma acc loop seq tile(1) /* { dg-line l_loop[incr c_loop] } */
      83  	/* { dg-note {variable 'local_j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} {} { target *-*-* } l_loop$c_loop } */
      84  	for (local_j = 0; local_j < N; ++local_j)
      85  	  ;
      86  #pragma acc loop auto independent tile(*) /* { dg-line l_loop[incr c_loop] } */
      87  	/* { dg-note {variable 'local_j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} {} { target *-*-* } l_loop$c_loop } */
      88  	for (local_j = 0; local_j < N; ++local_j)
      89  	  ;
      90        }
      91    }
      92  
            /* Nested function whose OpenACC constructs reference the 'nonlocal_*'
               variables of the enclosing 'main' instead of its own locals.  It
               mirrors the structure of 'local' above.  */
      93    void nonlocal ()
      94    {
      95      for (int i = 0; i < N; ++i)
      96        nonlocal_a[i] = 5;
      97      nonlocal_arg = 5;
      98  
              /* First construct: 'gang' takes a 'num:' argument, 'wait' has no
                 argument list, and 'async' takes an argument.  The inner loops
                 use 'tile(2)' and 'tile(3)'.  */
      99  #pragma acc kernels loop /* { dg-line l_compute_loop[incr c_compute_loop] } */ \
     100    gang(num:nonlocal_arg) worker(nonlocal_arg) vector(nonlocal_arg) \
     101    wait async(nonlocal_arg)
     102      /* { dg-note {OpenACC 'kernels' decomposition: variable 'nonlocal_arg' in 'copy' clause requested to be made addressable} {} { target *-*-* } l_compute_loop$c_compute_loop }
     103         { dg-note {variable 'nonlocal_arg' made addressable} {} { target *-*-* } l_compute_loop$c_compute_loop } */
     104      /* { dg-note {forwarded loop nest in OpenACC 'kernels' region to 'parloops' for analysis} {} { target *-*-* } l_compute_loop$c_compute_loop } */
     105      /* { dg-note {variable 'nonlocal_arg\.[0-9]+' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} {} { target *-*-* } l_compute_loop$c_compute_loop } */
     106      /* { dg-note {variable 'nonlocal_i\.[0-9]+' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} {} { target *-*-* } l_compute_loop$c_compute_loop } */
     107      /* { dg-note {variable 'nonlocal_i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} {} { target *-*-* } l_compute_loop$c_compute_loop } */
     108      /* { dg-optimized {assigned OpenACC seq loop parallelism} {} { target *-*-* } l_compute_loop$c_compute_loop } */
     109      for (nonlocal_i = 0; nonlocal_i < N; ++nonlocal_i)
     110        {
     111  #pragma acc cache (nonlocal_a[nonlocal_i:3])
     112  	nonlocal_a[nonlocal_i] = 100;
     113  #pragma acc loop seq tile(2) /* { dg-line l_loop[incr c_loop] } */
     114  	/* { dg-note {variable 'nonlocal_j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} {} { target *-*-* } l_loop$c_loop } */
     115  	for (nonlocal_j = 0; nonlocal_j < N; ++nonlocal_j)
     116  	  ;
     117  #pragma acc loop auto independent tile(3) /* { dg-line l_loop[incr c_loop] } */
     118  	/* { dg-note {variable 'nonlocal_j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} {} { target *-*-* } l_loop$c_loop } */
     119  	for (nonlocal_j = 0; nonlocal_j < N; ++nonlocal_j)
     120  	  ;
     121        }
     122  
              /* Second construct: 'gang' takes a 'static:' argument, 'wait' takes
                 an argument list, and 'async' has no argument.  Both inner loops
                 use 'tile(*)'.  As 'nonlocal_arg' was handled by the first
                 construct, the expected note here reads "already made
                 addressable".  */
     123  #pragma acc kernels loop /* { dg-line l_compute_loop[incr c_compute_loop] } */ \
     124    gang(static:nonlocal_arg) worker(nonlocal_arg) vector(nonlocal_arg) \
     125    wait(nonlocal_arg, nonlocal_arg + 1, nonlocal_arg + 2) async
     126      /* { dg-note {OpenACC 'kernels' decomposition: variable 'nonlocal_arg' in 'copy' clause requested to be made addressable} {} { target *-*-* } l_compute_loop$c_compute_loop }
     127         { dg-note {variable 'nonlocal_arg' already made addressable} {} { target *-*-* } l_compute_loop$c_compute_loop } */
     128      /* { dg-note {forwarded loop nest in OpenACC 'kernels' region to 'parloops' for analysis} {} { target *-*-* } l_compute_loop$c_compute_loop } */
     129      /* { dg-note {variable 'nonlocal_arg\.[0-9]+' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} {} { target *-*-* } l_compute_loop$c_compute_loop } */
     130      /* { dg-note {variable 'nonlocal_i\.[0-9]+' declared in block isn't candidate for adjusting OpenACC privatization level: not addressable} {} { target *-*-* } l_compute_loop$c_compute_loop } */
     131      /* { dg-note {variable 'nonlocal_i' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} {} { target *-*-* } l_compute_loop$c_compute_loop } */
     132      /* { dg-optimized {assigned OpenACC seq loop parallelism} {} { target *-*-* } l_compute_loop$c_compute_loop } */
     133      for (nonlocal_i = 0; nonlocal_i < N; ++nonlocal_i)
     134        {
     135  #pragma acc cache (nonlocal_a[nonlocal_i:2])
     136  	nonlocal_a[nonlocal_i] = 100;
     137  #pragma acc loop seq tile(*) /* { dg-line l_loop[incr c_loop] } */
     138  	/* { dg-note {variable 'nonlocal_j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} {} { target *-*-* } l_loop$c_loop } */
     139  	for (nonlocal_j = 0; nonlocal_j < N; ++nonlocal_j)
     140  	  ;
     141  #pragma acc loop auto independent tile(*) /* { dg-line l_loop[incr c_loop] } */
     142  	/* { dg-note {variable 'nonlocal_j' in 'private' clause isn't candidate for adjusting OpenACC privatization level: not addressable} {} { target *-*-* } l_loop$c_loop } */
     143  	for (nonlocal_j = 0; nonlocal_j < N; ++nonlocal_j)
     144  	  ;
     145        }
     146    }
     147  
            /* Call both nested functions.  */
     148    local ();
     149    nonlocal ();
     150  
     151    return 0;
     152  }