[OpenMPOpt] Make parallel regions reachable from new DeviceRTL loop functions (#150927) (333f636c) · Commits · llvm-doe / llvm-project

llvm/lib/Transforms/IPO/OpenMPOpt.cpp

+23 −0

Original line number	Diff line number	Diff line
		@@ -5021,6 +5021,29 @@ struct AAKernelInfoCallSite : AAKernelInfo {
		case OMPRTL___kmpc_free_shared:
		// Return without setting a fixpoint, to be resolved in updateImpl.
		return;
		case OMPRTL___kmpc_distribute_static_loop_4:
		case OMPRTL___kmpc_distribute_static_loop_4u:
		case OMPRTL___kmpc_distribute_static_loop_8:
		case OMPRTL___kmpc_distribute_static_loop_8u:
		case OMPRTL___kmpc_distribute_for_static_loop_4:
		case OMPRTL___kmpc_distribute_for_static_loop_4u:
		case OMPRTL___kmpc_distribute_for_static_loop_8:
		case OMPRTL___kmpc_distribute_for_static_loop_8u:
		case OMPRTL___kmpc_for_static_loop_4:
		case OMPRTL___kmpc_for_static_loop_4u:
		case OMPRTL___kmpc_for_static_loop_8:
		case OMPRTL___kmpc_for_static_loop_8u:
		// Parallel regions might be reached by these calls, as they take a
		// callback argument potentially containing arbitrary user-provided
		// code.
		ReachedUnknownParallelRegions.insert(&CB);
		// TODO: The presence of these calls on their own does not prevent a
		// kernel from being SPMD-izable. We mark it as such because we need
		// further changes in order to also consider the contents of the
		// callbacks passed to them.
		SPMDCompatibilityTracker.indicatePessimisticFixpoint();
		SPMDCompatibilityTracker.insert(&CB);
		break;
		default:
		// Unknown OpenMP runtime calls cannot be executed in SPMD-mode,
		// generally. However, they do not hide parallel regions.

offload/test/offloading/fortran/target-generic-loops.f90

0 → 100644

+130 −0

Original line number	Diff line number	Diff line
		! Offloading test for generic target regions containing different kinds of
		! loop constructs inside.
		! REQUIRES: flang, amdgpu

		! RUN: %libomptarget-compile-fortran-run-and-check-generic
		program main
		integer :: i1, i2, n1, n2, counter

		n1 = 100
		n2 = 50

		counter = 0
		!$omp target map(tofrom:counter)
		!$omp teams distribute reduction(+:counter)
		do i1=1, n1
		counter = counter + 1
		end do
		!$omp end target

		! CHECK: 1 100
		print '(I2" "I0)', 1, counter

		counter = 0
		!$omp target map(tofrom:counter)
		!$omp parallel do reduction(+:counter)
		do i1=1, n1
		counter = counter + 1
		end do
		!$omp parallel do reduction(+:counter)
		do i1=1, n1
		counter = counter + 1
		end do
		!$omp end target

		! CHECK: 2 200
		print '(I2" "I0)', 2, counter

		counter = 0
		!$omp target map(tofrom:counter)
		counter = counter + 1
		!$omp parallel do reduction(+:counter)
		do i1=1, n1
		counter = counter + 1
		end do
		counter = counter + 1
		!$omp parallel do reduction(+:counter)
		do i1=1, n1
		counter = counter + 1
		end do
		counter = counter + 1
		!$omp end target

		! CHECK: 3 203
		print '(I2" "I0)', 3, counter

		counter = 0
		!$omp target map(tofrom: counter)
		counter = counter + 1
		!$omp parallel do reduction(+:counter)
		do i1=1, n1
		counter = counter + 1
		end do
		counter = counter + 1
		!$omp end target

		! CHECK: 4 102
		print '(I2" "I0)', 4, counter


		counter = 0
		!$omp target teams distribute reduction(+:counter)
		do i1=1, n1
		!$omp parallel do reduction(+:counter)
		do i2=1, n2
		counter = counter + 1
		end do
		end do

		! CHECK: 5 5000
		print '(I2" "I0)', 5, counter

		counter = 0
		!$omp target teams distribute reduction(+:counter)
		do i1=1, n1
		counter = counter + 1
		!$omp parallel do reduction(+:counter)
		do i2=1, n2
		counter = counter + 1
		end do
		counter = counter + 1
		end do

		! CHECK: 6 5200
		print '(I2" "I0)', 6, counter

		counter = 0
		!$omp target teams distribute reduction(+:counter)
		do i1=1, n1
		!$omp parallel do reduction(+:counter)
		do i2=1, n2
		counter = counter + 1
		end do
		!$omp parallel do reduction(+:counter)
		do i2=1, n2
		counter = counter + 1
		end do
		end do

		! CHECK: 7 10000
		print '(I2" "I0)', 7, counter

		counter = 0
		!$omp target teams distribute reduction(+:counter)
		do i1=1, n1
		counter = counter + 1
		!$omp parallel do reduction(+:counter)
		do i2=1, n2
		counter = counter + 1
		end do
		counter = counter + 1
		!$omp parallel do reduction(+:counter)
		do i2=1, n2
		counter = counter + 1
		end do
		counter = counter + 1
		end do

		! CHECK: 8 10300
		print '(I2" "I0)', 8, counter
		end program

offload/test/offloading/fortran/target-spmd-loops.f90

0 → 100644

+39 −0

Original line number	Diff line number	Diff line
		! Offloading test for generic target regions containing different kinds of
		! loop constructs inside.
		! REQUIRES: flang, amdgpu

		! RUN: %libomptarget-compile-fortran-run-and-check-generic
		program main
		integer :: i1, n1, counter

		n1 = 100

		counter = 0
		!$omp target parallel do reduction(+:counter)
		do i1=1, n1
		counter = counter + 1
		end do

		! CHECK: 1 100
		print '(I2" "I0)', 1, counter

		counter = 0
		!$omp target map(tofrom:counter)
		!$omp parallel do reduction(+:counter)
		do i1=1, n1
		counter = counter + 1
		end do
		!$omp end target

		! CHECK: 2 100
		print '(I2" "I0)', 2, counter

		counter = 0
		!$omp target teams distribute parallel do reduction(+:counter)
		do i1=1, n1
		counter = counter + 1
		end do

		! CHECK: 3 100
		print '(I2" "I0)', 3, counter
		end program