gcc/libgomp/testsuite/libgomp.oacc-fortran/parallel-dims.f90
Tobias Burnus bd7ebe9da7 OpenACC: Fix pattern in dg-bogus in Fortran testcases again
It turned out that a compiler built without offloading support
and one built with it can produce slightly different diagnostics.

Offloading support implies ENABLE_OFFLOAD which implies that
g->have_offload is set when offloading is actually needed.
In cgraphunit.c, the latter causes flag_generate_offload = 1,
which in turn affects tree.c's free_lang_data.

The result is that the front-end specific diagnostic gets reset
('tree_diagnostics_defaults (global_dc)'), which affects in this
case 'Warning' vs. 'warning' via the Fortran frontend.

Result: 'Warning:' vs. 'warning:'.
Side note: Other FEs also override the diagnostic settings, leading to
similar differences; e.g., the C++ FE outputs mangled function
names differently (cf. the patch thread).

libgomp/ChangeLog:

	* testsuite/libgomp.oacc-fortran/par-reduction-2-1.f:
	Use [Ww]arning in dg-bogus as FE diagnostic and default
	diagnostic differ and the result depends on ENABLE_OFFLOAD.
	* testsuite/libgomp.oacc-fortran/par-reduction-2-2.f: Likewise.
	* testsuite/libgomp.oacc-fortran/parallel-dims.f90: Likewise.
	* testsuite/libgomp.oacc-fortran/parallel-reduction.f90: Likewise.

gcc/testsuite/ChangeLog:

	* gfortran.dg/goacc/classify-serial.f95:
	Use [Ww]arning in dg-bogus as FE diagnostic and default
	diagnostic differ and the result depends on ENABLE_OFFLOAD.
	* gfortran.dg/goacc/kernels-decompose-2.f95: Likewise.
	* gfortran.dg/goacc/routine-module-mod-1.f90: Likewise.
2021-04-26 23:13:22 +02:00

126 lines
4.5 KiB
Fortran

! OpenACC parallelism dimensions clauses: num_gangs, num_workers,
! vector_length.
! { dg-additional-sources parallel-dims-aux.c }
! { dg-do run }
! { dg-prune-output "command-line option '-fintrinsic-modules-path=.*' is valid for Fortran but not for C" }
! { dg-additional-options "-Wopenacc-parallelism" } for testing/documenting
! aspects of that functionality.
! See also '../libgomp.oacc-c-c++-common/parallel-dims.c'.
! Explicit interfaces for three helper functions that have C binding.
! Their definitions are not part of this file; presumably they live in the
! additional source 'parallel-dims-aux.c' named in the dg-additional-sources
! directive above -- confirm there.
!
! Each function is declared as an OpenACC 'routine seq'.  The result is
! declared as 'integer(c_int)' rather than default 'integer' so that the
! interface stays interoperable with a C 'int' result even if the default
! integer kind is changed (for example by '-fdefault-integer-8').
! NOTE(review): this assumes the C definitions return 'int' -- confirm.
module acc_routines
  implicit none (type, external)

  interface
    ! Queried by the main program for the 'gangs_min'/'gangs_max' checks.
    function acc_gang() bind(C) result(gang_id)
      use, intrinsic :: iso_c_binding, only: c_int
      !$acc routine seq
      integer(c_int) :: gang_id
    end function acc_gang

    ! Queried by the main program for the 'workers_min'/'workers_max' checks.
    function acc_worker() bind(C) result(worker_id)
      use, intrinsic :: iso_c_binding, only: c_int
      !$acc routine seq
      integer(c_int) :: worker_id
    end function acc_worker

    ! Queried by the main program for the 'vectors_min'/'vectors_max' checks.
    function acc_vector() bind(C) result(vector_id)
      use, intrinsic :: iso_c_binding, only: c_int
      !$acc routine seq
      integer(c_int) :: vector_id
    end function acc_vector
  end interface
end module acc_routines
! Test driver: runs two OpenACC 'serial' regions, records the minimum and
! maximum values returned by acc_gang/acc_worker/acc_vector inside them, and
! stops with a distinct non-zero code (1..4) if the recorded values differ
! from the expected ones.
!
! NOTE: the '{ dg-... }' comments are DejaGnu directives.  The three
! 'dg-bogus' lines use relative line offsets (.-1, .-2, .-3), so they must
! stay directly below the directive line they refer to.
program main
  use iso_c_binding
  use openacc
  use acc_routines
  implicit none (type, external)

  ! Smallest/largest value seen per dimension.
  integer :: gangs_min, gangs_max
  integer :: workers_min, workers_max
  integer :: vectors_min, vectors_max
  ! Vector length the second region is expected to run with.
  integer :: vectors_actual
  ! Loop counters for the gang, worker, and vector loops.
  integer :: ig, iw, iv

  call acc_init (acc_device_default)

  ! OpenACC parallel construct.

  !TODO


  ! OpenACC kernels construct.

  !TODO


  ! OpenACC serial construct.

  ! GR, WS, VS.

  ! Start every minimum at INT_MAX and every maximum at INT_MIN so that the
  ! first value combined by the reductions replaces it.
  gangs_min = huge(gangs_min)             ! INT_MAX
  gangs_max = -huge(gangs_max) - 1        ! INT_MIN
  workers_min = huge(workers_min)         ! INT_MAX
  workers_max = -huge(workers_max) - 1    ! INT_MIN
  vectors_min = huge(vectors_min)         ! INT_MAX
  vectors_max = -huge(vectors_max) - 1    ! INT_MIN
  !$acc serial &
  !$acc reduction (min: gangs_min, workers_min, vectors_min) reduction (max: gangs_max, workers_max, vectors_max) ! { dg-warning "using vector_length \\(32\\), ignoring 1" "" { target openacc_nvidia_accel_selected } }
  do ig = 100, -99, -1
     gangs_min = acc_gang ()
     gangs_max = acc_gang ()
     workers_min = acc_worker ()
     workers_max = acc_worker ()
     vectors_min = acc_vector ()
     vectors_max = acc_vector ()
  end do
  !$acc end serial
  ! Every minimum must be 0 and every maximum must be '1 - 1'.
  if (.not. (gangs_min == 0 .and. gangs_max == 1 - 1 &
       &     .and. workers_min == 0 .and. workers_max == 1 - 1 &
       &     .and. vectors_min == 0 .and. vectors_max == 1 - 1)) then
     stop 1
  end if

  ! Composition of GP, WP, VP.

  vectors_actual = 1 ! Implicit 'vector_length (1)' clause.
  gangs_min = huge(gangs_min)             ! INT_MAX
  gangs_max = -huge(gangs_max) - 1        ! INT_MIN
  workers_min = huge(workers_min)         ! INT_MAX
  workers_max = -huge(workers_max) - 1    ! INT_MIN
  vectors_min = huge(vectors_min)         ! INT_MAX
  vectors_max = -huge(vectors_max) - 1    ! INT_MIN
  !$acc serial copy (vectors_actual) &
  !$acc copy (gangs_min, gangs_max, workers_min, workers_max, vectors_min, vectors_max) ! { dg-warning "using vector_length \\(32\\), ignoring 1" "" { target openacc_nvidia_accel_selected } }
  ! { dg-bogus "\[Ww\]arning: region contains gang partitioned code but is not gang partitioned" "TODO 'serial'" { xfail *-*-* } .-1 }
  ! { dg-bogus "\[Ww\]arning: region contains worker partitioned code but is not worker partitioned" "TODO 'serial'" { xfail *-*-* } .-2 }
  ! { dg-bogus "\[Ww\]arning: region contains vector partitioned code but is not vector partitioned" "TODO 'serial'" { xfail *-*-* } .-3 }
  ! The GCC nvptx back end enforces vector_length (32).
  ! It's unclear if that's actually permissible here;
  ! <https://github.com/OpenACC/openacc-spec/issues/238> "OpenACC 'serial'
  ! construct might not actually be serial".
  if (acc_on_device (acc_device_nvidia)) vectors_actual = 32
  !$acc loop gang reduction (min: gangs_min, workers_min, vectors_min) reduction (max: gangs_max, workers_max, vectors_max)
  do ig = 100, -99, -1
     !$acc loop worker reduction (min: gangs_min, workers_min, vectors_min) reduction (max: gangs_max, workers_max, vectors_max)
     do iw = 100, -99, -1
        !$acc loop vector reduction (min: gangs_min, workers_min, vectors_min) reduction (max: gangs_max, workers_max, vectors_max)
        ! The innermost trip count is scaled by the vector length in use.
        do iv = 100 * vectors_actual, -99 * vectors_actual, -1
           gangs_min = acc_gang ()
           gangs_max = acc_gang ()
           workers_min = acc_worker ()
           workers_max = acc_worker ()
           vectors_min = acc_vector ()
           vectors_max = acc_vector ()
        end do
     end do
  end do
  !$acc end serial
  ! The region must have recorded 32 on an nvidia device and kept 1 otherwise.
  if (acc_get_device_type () == acc_device_nvidia) then
     if (vectors_actual /= 32) stop 2
  else if (vectors_actual /= 1) then
     stop 3
  end if
  ! Only the vector maximum depends on 'vectors_actual'.
  if (.not. (gangs_min == 0 .and. gangs_max == 1 - 1 &
       &     .and. workers_min == 0 .and. workers_max == 1 - 1 &
       &     .and. vectors_min == 0 .and. vectors_max == vectors_actual - 1)) then
     stop 4
  end if
end program main