[flang][OpenMP] Fix firstprivate not working with lastprivate in DO SIMD (#170163)

This fixes a bug where firstprivate was ignored when the same variable
had both firstprivate and lastprivate clauses in a do simd construct.

What was broken:
```
integer :: a
a = 10
!$omp do simd firstprivate(a) lastprivate(a)
do i = 1, 1
   print *, a  ! Should print 10, but printed garbage/0
   a = 20
end do
!$omp end do simd
print *, a  ! Correctly prints 20
```

Inside the loop, `a` wasn't being initialized from the firstprivate
clause; it just held whatever uninitialized value was already there.

The fix:

In genCompositeDoSimd(), we were using simdItemDSP to handle
privatization for the whole loop nest. This only looked at SIMD clauses
and missed the firstprivate from the DO part. Changed it to use
wsloopItemDSP instead, which handles both DO clauses (firstprivate,
lastprivate) correctly.

The change is confined to genCompositeDoSimd() in OpenMP.cpp.

Tests added:

- A lowering test that checks the generated MLIR
- A runtime test that verifies the actual values are correct
<img width="740" height="440" alt="image"
src="https://github.com/user-attachments/assets/fa911ea8-2024-4edf-b710-52c10659742e"
/>


Fixes #168306

---------

Co-authored-by: Krish Gupta <krishgupta@Krishs-MacBook-Air.local>
This commit is contained in:
Krish Gupta
2025-12-09 20:40:21 +05:30
committed by GitHub
parent db59def3b8
commit 748e7af8dd
5 changed files with 151 additions and 23 deletions

View File

@@ -3314,17 +3314,12 @@ static mlir::omp::WsloopOp genCompositeDoSimd(
genSimdClauses(converter, semaCtx, simdItem->clauses, loc, simdClauseOps,
simdReductionSyms);
DataSharingProcessor wsloopItemDSP(
converter, semaCtx, doItem->clauses, eval,
/*shouldCollectPreDeterminedSymbols=*/false,
/*useDelayedPrivatization=*/true, symTable);
DataSharingProcessor wsloopItemDSP(converter, semaCtx, doItem->clauses, eval,
/*shouldCollectPreDeterminedSymbols=*/true,
/*useDelayedPrivatization=*/true,
symTable);
wsloopItemDSP.processStep1(&wsloopClauseOps);
DataSharingProcessor simdItemDSP(converter, semaCtx, simdItem->clauses, eval,
/*shouldCollectPreDeterminedSymbols=*/true,
/*useDelayedPrivatization=*/true, symTable);
simdItemDSP.processStep1(&simdClauseOps, simdItem->id);
// Pass the innermost leaf construct's clauses because that's where COLLAPSE
// is placed by construct decomposition.
mlir::omp::LoopNestOperands loopNestClauseOps;
@@ -3343,8 +3338,9 @@ static mlir::omp::WsloopOp genCompositeDoSimd(
wsloopOp.setComposite(/*val=*/true);
EntryBlockArgs simdArgs;
simdArgs.priv.syms = simdItemDSP.getDelayedPrivSymbols();
simdArgs.priv.vars = simdClauseOps.privateVars;
// For composite 'do simd', privatization is handled by the wsloop.
// The simd does not create separate private storage for variables already
// privatized by the worksharing construct.
simdArgs.reduction.syms = simdReductionSyms;
simdArgs.reduction.vars = simdClauseOps.reductionVars;
auto simdOp =
@@ -3354,7 +3350,7 @@ static mlir::omp::WsloopOp genCompositeDoSimd(
genLoopNestOp(converter, symTable, semaCtx, eval, loc, queue, simdItem,
loopNestClauseOps, iv,
{{wsloopOp, wsloopArgs}, {simdOp, simdArgs}},
llvm::omp::Directive::OMPD_do_simd, simdItemDSP);
llvm::omp::Directive::OMPD_do_simd, wsloopItemDSP);
return wsloopOp;
}

View File

@@ -0,0 +1,48 @@
! Test runtime behavior of DO SIMD with firstprivate and lastprivate on same variable
! This is the reproducer from issue #168306
! REQUIRES: openmp-runtime
! RUN: %flang_fc1 -fopenmp -emit-llvm %s -o - | FileCheck %s --check-prefix=LLVM
! RUN: %flang -fopenmp %s -o %t && %t | FileCheck %s
! LLVM-LABEL: define {{.*}} @_QQmain
program main
  ! Runtime reproducer: a variable listed in both firstprivate and lastprivate
  ! on a composite 'do simd' must enter the loop with its original value and
  ! leave it with the value assigned in the last iteration.
  implicit none
  integer :: a
  integer :: i

  a = 10
  !$omp do simd lastprivate(a) firstprivate(a)
  do i = 1, 1
    ! Inside loop: a should be 10 (from firstprivate initialization)
    ! CHECK: main1 : a = 10
    print *, "main1 : a = ", a
    a = 20
  end do
  !$omp end do simd
  ! After loop: a should be 20 (from lastprivate copy-out)
  ! CHECK: main2 : a = 20
  print *, "main2 : a = ", a

  ! sub prints its two lines before the final 'pass' line below. Expected
  ! output is matched in the order the directives appear in this file, so the
  ! expectation for 'pass' is placed after sub, at the end of the file.
  call sub
  print *, 'pass'
end program main

subroutine sub
  ! Same scenario as in main, but inside an external subroutine.
  implicit none
  integer :: a
  integer :: i

  a = 10
  !$omp do simd lastprivate(a) firstprivate(a)
  do i = 1, 1
    ! Inside loop: a should be 10 (from firstprivate initialization)
    ! CHECK: sub1 : a = 10
    print *, "sub1 : a = ", a
    a = 20
  end do
  !$omp end do simd
  ! After loop: a should be 20 (from lastprivate copy-out)
  ! CHECK: sub2 : a = 20
  print *, "sub2 : a = ", a
end subroutine sub

! Printed by main after sub returns, so it is the last line of output.
! CHECK: pass

View File

@@ -0,0 +1,89 @@
! Test for DO SIMD with the same variable in both firstprivate and lastprivate clauses
! This tests the fix for issue #168306
! RUN: %flang_fc1 -fopenmp -mmlir --enable-delayed-privatization-staging=true -emit-hlfir %s -o - | FileCheck %s
! Test case 1: Basic test with firstprivate + lastprivate on same variable
! CHECK-LABEL: func.func @_QPdo_simd_first_last_same_var
subroutine do_simd_first_last_same_var()
  ! Lowering case: 'a' appears in both firstprivate and lastprivate, with
  ! firstprivate written first.
  implicit none
  integer :: a
  integer :: i

  a = 10
  ! Expected shape: the worksharing loop carries every privatizer (a
  ! firstprivate one for 'a', a plain one for the loop index) and the nested
  ! simd op has no privatization clause of its own.
  ! CHECK: omp.wsloop
  ! CHECK-SAME: private(@{{.*}}firstprivate{{.*}} %{{.*}} -> %[[FIRSTPRIV_A:.*]], @{{.*}}private{{.*}} %{{.*}} -> %[[PRIV_I:.*]] : !fir.ref<i32>, !fir.ref<i32>)
  ! CHECK-NEXT: omp.simd
  ! CHECK-NOT: private
  ! CHECK-NEXT: omp.loop_nest (%[[IV:.*]]) : i32
  !$omp do simd firstprivate(a) lastprivate(a)
  do i = 1, 1
    ! CHECK: %[[FIRSTPRIV_A_DECL:.*]]:2 = hlfir.declare %[[FIRSTPRIV_A]]
    ! CHECK: %[[PRIV_I_DECL:.*]]:2 = hlfir.declare %[[PRIV_I]]
    ! The private copy should be initialized from firstprivate (value 10)
    ! and then modified to 20
    a = 20
  end do
  !$omp end do simd
  ! After the loop, 'a' should be 20 due to lastprivate
end subroutine do_simd_first_last_same_var
! Test case 2: Test with lastprivate and firstprivate in reverse order
! CHECK-LABEL: func.func @_QPdo_simd_last_first_reverse
subroutine do_simd_last_first_reverse()
  ! Lowering case: same variable in both clauses, but with lastprivate written
  ! before firstprivate. The expected privatizers are the same as when the
  ! clauses appear in the opposite order.
  implicit none
  integer :: a
  integer :: i

  a = 10
  ! CHECK: omp.wsloop
  ! CHECK-SAME: private(@{{.*}}firstprivate{{.*}} %{{.*}} -> %[[FIRSTPRIV_A:.*]], @{{.*}}private{{.*}} %{{.*}} -> %[[PRIV_I:.*]] : !fir.ref<i32>, !fir.ref<i32>)
  ! CHECK-NEXT: omp.simd
  ! CHECK-NOT: private
  !$omp do simd lastprivate(a) firstprivate(a)
  do i = 1, 1
    a = 20
  end do
  !$omp end do simd
end subroutine do_simd_last_first_reverse
! Test case 3: Multiple variables with mixed privatization
! CHECK-LABEL: func.func @_QPdo_simd_multiple_vars
subroutine do_simd_multiple_vars()
  ! Lowering case: several variables with different data-sharing attributes on
  ! one composite construct ('a' firstprivate+lastprivate, 'b' firstprivate,
  ! 'c' private).
  implicit none
  integer :: a, b, c
  integer :: i

  a = 10
  b = 20
  c = 30
  ! Expected: two firstprivate privatizers followed by one plain privatizer on
  ! the worksharing loop, and none on the nested simd op.
  ! CHECK: omp.wsloop
  ! CHECK-SAME: private(@{{.*}}firstprivate{{.*}} %{{.*}} -> %{{.*}}, @{{.*}}firstprivate{{.*}} %{{.*}} -> %{{.*}}, @{{.*}}private{{.*}} %{{.*}} -> %{{.*}} : !fir.ref<i32>, !fir.ref<i32>, !fir.ref<i32>)
  ! CHECK-NEXT: omp.simd
  ! CHECK-NOT: private
  !$omp do simd firstprivate(a, b) lastprivate(a) private(c)
  do i = 1, 5
    a = a + 1
    b = b + 1
    c = i
  end do
  !$omp end do simd
end subroutine do_simd_multiple_vars
! Test case 4: Reproducer from issue #168306
! CHECK-LABEL: func.func @_QPissue_168306_reproducer
subroutine issue_168306_reproducer()
  ! Lowering counterpart of the reproducer from issue #168306: a single-trip
  ! loop with lastprivate(a) firstprivate(a) on a composite 'do simd'.
  implicit none
  integer :: a
  integer :: i

  a = 10
  ! CHECK: omp.wsloop
  ! CHECK-SAME: private(@{{.*}}firstprivate{{.*}} %{{.*}} -> %[[FIRSTPRIV_A:.*]], @{{.*}}private{{.*}} %{{.*}} -> %[[PRIV_I:.*]] : !fir.ref<i32>, !fir.ref<i32>)
  ! CHECK-NEXT: omp.simd
  ! CHECK-NOT: private
  !$omp do simd lastprivate(a) firstprivate(a)
  do i = 1, 1
    ! Inside the loop, 'a' should start at 10 (from firstprivate)
    ! This is the key behavior that was broken
    a = 20
  end do
  !$omp end do simd
  ! After the loop, 'a' should be 20 (from lastprivate)
end subroutine issue_168306_reproducer

View File

@@ -36,15 +36,15 @@ end subroutine do_order
!CHECK-LABEL: func.func @_QPdo_simd_order() {
subroutine do_simd_order
!CHECK: omp.wsloop order(reproducible:concurrent) {
!CHECK: omp.wsloop order(reproducible:concurrent)
!$omp do simd order(concurrent)
do i = 1, 10
end do
!CHECK: omp.wsloop order(reproducible:concurrent) {
!CHECK: omp.wsloop order(reproducible:concurrent)
!$omp do simd order(reproducible:concurrent)
do i = 1, 10
end do
!CHECK: omp.wsloop order(unconstrained:concurrent) {
!CHECK: omp.wsloop order(unconstrained:concurrent)
!$omp do simd order(unconstrained:concurrent)
do i = 1, 10
end do
@@ -53,7 +53,7 @@ end subroutine do_simd_order
!CHECK-LABEL: func.func @_QPdo_simd_order_parallel() {
subroutine do_simd_order_parallel
!CHECK: omp.parallel {
!CHECK: omp.wsloop order(reproducible:concurrent) {
!CHECK: omp.wsloop order(reproducible:concurrent)
!$omp parallel do simd order(reproducible:concurrent)
do i = 1, 10
end do

View File

@@ -71,16 +71,13 @@ end subroutine do_simd_reduction
subroutine do_simd_private()
integer, allocatable :: tmp
! CHECK: omp.wsloop
! CHECK-SAME: private(@[[PRIV_IVAR_SYM:.*]] %{{.*}} -> %[[PRIV_IVAR:.*]] : !fir.ref<i32>)
! CHECK-NEXT: omp.simd
! CHECK-SAME: private(@[[PRIV_BOX_SYM:.*]] %{{.*}} -> %[[PRIV_BOX:.*]], @[[PRIV_IVAR_SYM:.*]] %{{.*}} -> %[[PRIV_IVAR:.*]] : !fir.ref<!fir.box<!fir.heap<i32>>>, !fir.ref<i32>)
! CHECK-NEXT: omp.loop_nest (%[[IVAR:.*]]) : i32
!$omp do simd private(tmp)
do i=1, 10
! CHECK: %[[PRIV_BOX_DECL:.*]]:2 = hlfir.declare %[[PRIV_BOX]]
! CHECK: %[[PRIV_IVAR_DECL:.*]]:2 = hlfir.declare %[[PRIV_IVAR]]
! CHECK: hlfir.assign %[[IVAR]] to %[[PRIV_IVAR_DECL]]#0
! CHECK: %[[PRIV_BOX_LOAD:.*]] = fir.load %[[PRIV_BOX_DECL]]
! CHECK: hlfir.assign %{{.*}} to %[[PRIV_BOX_DECL]]#0
! CHECK: omp.yield
tmp = tmp + 1
end do
@@ -90,13 +87,11 @@ end subroutine do_simd_private
subroutine do_simd_lastprivate_firstprivate()
integer :: a
! CHECK: omp.wsloop
! CHECK-SAME: private(@[[FIRSTPRIVATE_A_SYM:.*]] %{{.*}} -> %[[FIRSTPRIVATE_A:.*]] : !fir.ref<i32>)
! CHECK-SAME: private(@[[FIRSTPRIVATE_A_SYM:.*]] %{{.*}} -> %[[FIRSTPRIVATE_A:.*]], @[[PRIVATE_I_SYM:.*]] %{{.*}} -> %[[PRIVATE_I:.*]] : !fir.ref<i32>, !fir.ref<i32>)
! CHECK-NEXT: omp.simd
! CHECK-SAME: private(@[[PRIVATE_A_SYM:.*]] %{{.*}} -> %[[PRIVATE_A:.*]], @[[PRIVATE_I_SYM:.*]] %{{.*}} -> %[[PRIVATE_I:.*]] : !fir.ref<i32>, !fir.ref<i32>)
!$omp do simd lastprivate(a) firstprivate(a)
do i = 1, 10
! CHECK: %[[FIRSTPRIVATE_A_DECL:.*]]:2 = hlfir.declare %[[FIRSTPRIVATE_A]]
! CHECK: %[[PRIVATE_A_DECL:.*]]:2 = hlfir.declare %[[PRIVATE_A]]
! CHECK: %[[PRIVATE_I_DECL:.*]]:2 = hlfir.declare %[[PRIVATE_I]]
a = a + 1
end do