Skip to content

Commit ebde37b

Browse files
committed
[flang][Lower][OpenMP] Don't read moldarg for static sized array
This should further reduce the number of spurious barriers
1 parent 5efc2c5 commit ebde37b

File tree

4 files changed

+51
-28
lines changed

4 files changed

+51
-28
lines changed

flang/lib/Lower/OpenMP/DataSharingProcessor.cpp

+3-2
Original file line numberDiff line numberDiff line change
@@ -508,6 +508,8 @@ void DataSharingProcessor::doPrivatize(const semantics::Symbol *sym,
508508

509509
lower::SymbolBox hsb = converter.lookupOneLevelUpSymbol(*sym);
510510
assert(hsb && "Host symbol box not found");
511+
hlfir::Entity entity{hsb.getAddr()};
512+
bool cannotHaveNonDefaultLowerBounds = !entity.mayHaveNonDefaultLowerBounds();
511513

512514
mlir::Location symLoc = hsb.getAddr().getLoc();
513515
std::string privatizerName = sym->name().ToString() + ".privatizer";
@@ -528,7 +530,6 @@ void DataSharingProcessor::doPrivatize(const semantics::Symbol *sym,
528530
// an alloca for a fir.array type there. Get around this by boxing all
529531
// arrays.
530532
if (mlir::isa<fir::SequenceType>(allocType)) {
531-
hlfir::Entity entity{hsb.getAddr()};
532533
entity = genVariableBox(symLoc, firOpBuilder, entity);
533534
privVal = entity.getBase();
534535
allocType = privVal.getType();
@@ -590,7 +591,7 @@ void DataSharingProcessor::doPrivatize(const semantics::Symbol *sym,
590591
result.getDeallocRegion(),
591592
isFirstPrivate ? DeclOperationKind::FirstPrivate
592593
: DeclOperationKind::Private,
593-
sym);
594+
sym, cannotHaveNonDefaultLowerBounds);
594595
// TODO: currently there are false positives from dead uses of the mold
595596
// arg
596597
if (!result.getInitMoldArg().getUses().empty())

flang/lib/Lower/OpenMP/PrivateReductionUtils.cpp

+41-20
Original file line numberDiff line numberDiff line change
@@ -122,25 +122,40 @@ static void createCleanupRegion(Fortran::lower::AbstractConverter &converter,
122122
typeError();
123123
}
124124

125-
fir::ShapeShiftOp Fortran::lower::omp::getShapeShift(fir::FirOpBuilder &builder,
126-
mlir::Location loc,
127-
mlir::Value box) {
125+
fir::ShapeShiftOp
126+
Fortran::lower::omp::getShapeShift(fir::FirOpBuilder &builder,
127+
mlir::Location loc, mlir::Value box,
128+
bool cannotHaveNonDefaultLowerBounds) {
128129
fir::SequenceType sequenceType = mlir::cast<fir::SequenceType>(
129130
hlfir::getFortranElementOrSequenceType(box.getType()));
130131
const unsigned rank = sequenceType.getDimension();
132+
131133
llvm::SmallVector<mlir::Value> lbAndExtents;
132134
lbAndExtents.reserve(rank * 2);
133-
134135
mlir::Type idxTy = builder.getIndexType();
135-
for (unsigned i = 0; i < rank; ++i) {
136-
// TODO: ideally we want to hoist box reads out of the critical section.
137-
// We could do this by having box dimensions in block arguments like
138-
// OpenACC does
139-
mlir::Value dim = builder.createIntegerConstant(loc, idxTy, i);
140-
auto dimInfo =
141-
builder.create<fir::BoxDimsOp>(loc, idxTy, idxTy, idxTy, box, dim);
142-
lbAndExtents.push_back(dimInfo.getLowerBound());
143-
lbAndExtents.push_back(dimInfo.getExtent());
136+
137+
if (cannotHaveNonDefaultLowerBounds && !sequenceType.hasDynamicExtents()) {
138+
// We don't need fir::BoxDimsOp if all of the extents are statically known
139+
// and we can assume default lower bounds. This helps avoid reads from the
140+
// mold arg.
141+
mlir::Value one = builder.createIntegerConstant(loc, idxTy, 1);
142+
for (int64_t extent : sequenceType.getShape()) {
143+
assert(extent != sequenceType.getUnknownExtent());
144+
mlir::Value extentVal = builder.createIntegerConstant(loc, idxTy, extent);
145+
lbAndExtents.push_back(one);
146+
lbAndExtents.push_back(extentVal);
147+
}
148+
} else {
149+
for (unsigned i = 0; i < rank; ++i) {
150+
// TODO: ideally we want to hoist box reads out of the critical section.
151+
// We could do this by having box dimensions in block arguments like
152+
// OpenACC does
153+
mlir::Value dim = builder.createIntegerConstant(loc, idxTy, i);
154+
auto dimInfo =
155+
builder.create<fir::BoxDimsOp>(loc, idxTy, idxTy, idxTy, box, dim);
156+
lbAndExtents.push_back(dimInfo.getLowerBound());
157+
lbAndExtents.push_back(dimInfo.getExtent());
158+
}
144159
}
145160

146161
auto shapeShiftTy = fir::ShapeShiftType::get(builder.getContext(), rank);
@@ -249,12 +264,13 @@ class PopulateInitAndCleanupRegionsHelper {
249264
mlir::Type argType, mlir::Value scalarInitValue,
250265
mlir::Value allocatedPrivVarArg, mlir::Value moldArg,
251266
mlir::Block *initBlock, mlir::Region &cleanupRegion,
252-
DeclOperationKind kind, const Fortran::semantics::Symbol *sym)
267+
DeclOperationKind kind, const Fortran::semantics::Symbol *sym,
268+
bool cannotHaveLowerBounds)
253269
: converter{converter}, builder{converter.getFirOpBuilder()}, loc{loc},
254270
argType{argType}, scalarInitValue{scalarInitValue},
255271
allocatedPrivVarArg{allocatedPrivVarArg}, moldArg{moldArg},
256272
initBlock{initBlock}, cleanupRegion{cleanupRegion}, kind{kind},
257-
sym{sym} {
273+
sym{sym}, cannotHaveNonDefaultLowerBounds{cannotHaveLowerBounds} {
258274
valType = fir::unwrapRefType(argType);
259275
}
260276

@@ -296,6 +312,10 @@ class PopulateInitAndCleanupRegionsHelper {
296312
/// Any length parameters which have been fetched for the type
297313
mlir::SmallVector<mlir::Value> lenParams;
298314

315+
/// If the source variable being privatized definitely can't have non-default
316+
/// lower bounds then we don't need to generate code to read them.
317+
bool cannotHaveNonDefaultLowerBounds;
318+
299319
void createYield(mlir::Value ret) {
300320
builder.create<mlir::omp::YieldOp>(loc, ret);
301321
}
@@ -433,7 +453,8 @@ void PopulateInitAndCleanupRegionsHelper::initAndCleanupBoxedArray(
433453
// Special case for (possibly allocatable) arrays of polymorphic types
434454
// e.g. !fir.class<!fir.heap<!fir.array<?x!fir.type<>>>>
435455
if (source.isPolymorphic()) {
436-
fir::ShapeShiftOp shape = getShapeShift(builder, loc, source);
456+
fir::ShapeShiftOp shape =
457+
getShapeShift(builder, loc, source, cannotHaveNonDefaultLowerBounds);
437458
mlir::Type arrayType = source.getElementOrSequenceType();
438459
mlir::Value allocatedArray = builder.create<fir::AllocMemOp>(
439460
loc, arrayType, /*typeparams=*/mlir::ValueRange{}, shape.getExtents());
@@ -472,8 +493,8 @@ void PopulateInitAndCleanupRegionsHelper::initAndCleanupBoxedArray(
472493
// Put the temporary inside of a box:
473494
// hlfir::genVariableBox doesn't handle non-default lower bounds
474495
mlir::Value box;
475-
fir::ShapeShiftOp shapeShift =
476-
getShapeShift(builder, loc, getLoadedMoldArg());
496+
fir::ShapeShiftOp shapeShift = getShapeShift(builder, loc, getLoadedMoldArg(),
497+
cannotHaveNonDefaultLowerBounds);
477498
mlir::Type boxType = getLoadedMoldArg().getType();
478499
if (mlir::isa<fir::BaseBoxType>(temp.getType()))
479500
// the box created by the declare form createTempFromMold is missing
@@ -608,10 +629,10 @@ void Fortran::lower::omp::populateByRefInitAndCleanupRegions(
608629
mlir::Type argType, mlir::Value scalarInitValue, mlir::Block *initBlock,
609630
mlir::Value allocatedPrivVarArg, mlir::Value moldArg,
610631
mlir::Region &cleanupRegion, DeclOperationKind kind,
611-
const Fortran::semantics::Symbol *sym) {
632+
const Fortran::semantics::Symbol *sym, bool cannotHaveLowerBounds) {
612633
PopulateInitAndCleanupRegionsHelper helper(
613634
converter, loc, argType, scalarInitValue, allocatedPrivVarArg, moldArg,
614-
initBlock, cleanupRegion, kind, sym);
635+
initBlock, cleanupRegion, kind, sym, cannotHaveLowerBounds);
615636
helper.populateByRefInitAndCleanupRegions();
616637

617638
// Often we load moldArg to check something (e.g. length parameters, shape)

flang/lib/Lower/OpenMP/PrivateReductionUtils.h

+4-2
Original file line numberDiff line numberDiff line change
@@ -55,11 +55,13 @@ void populateByRefInitAndCleanupRegions(
5555
mlir::Value scalarInitValue, mlir::Block *initBlock,
5656
mlir::Value allocatedPrivVarArg, mlir::Value moldArg,
5757
mlir::Region &cleanupRegion, DeclOperationKind kind,
58-
const Fortran::semantics::Symbol *sym = nullptr);
58+
const Fortran::semantics::Symbol *sym = nullptr,
59+
bool cannotHaveNonDefaultLowerBounds = false);
5960

6061
/// Generate a fir::ShapeShift op describing the provided boxed array.
6162
fir::ShapeShiftOp getShapeShift(fir::FirOpBuilder &builder, mlir::Location loc,
62-
mlir::Value box);
63+
mlir::Value box,
64+
bool cannotHaveNonDefaultLowerBounds = false);
6365

6466
} // namespace omp
6567
} // namespace lower

flang/test/Lower/OpenMP/delayed-privatization-array.f90

+3-4
Original file line numberDiff line numberDiff line change
@@ -108,15 +108,14 @@ program main
108108
! ONE_DIM_DEFAULT_LB-SAME: @[[PRIVATIZER_SYM:.*]] : [[BOX_TYPE:!fir.box<!fir.array<10xi32>>]] init {
109109

110110
! ONE_DIM_DEFAULT_LB-NEXT: ^bb0(%[[PRIV_ARG:.*]]: [[TYPE:!fir.ref<!fir.box<!fir.array<10xi32>>>]], %[[PRIV_BOX_ALLOC:.*]]: [[TYPE]]):
111-
! ONE_DIM_DEFAULT_LB-NEXT: %[[PRIV_ARG_VAL:.*]] = fir.load %[[PRIV_ARG]]
112111
! ONE_DIM_DEFAULT_LB-NEXT: %[[C10:.*]] = arith.constant 10 : index
113112
! ONE_DIM_DEFAULT_LB-NEXT: %[[SHAPE:.*]] = fir.shape %[[C10]]
114113
! ONE_DIM_DEFAULT_LB-NEXT: %[[ARRAY_ALLOC:.*]] = fir.allocmem !fir.array<10xi32>
115114
! ONE_DIM_DEFAULT_LB-NEXT: %[[TRUE:.*]] = arith.constant true
116115
! ONE_DIM_DEFAULT_LB-NEXT: %[[DECL:.*]]:2 = hlfir.declare %[[ARRAY_ALLOC]](%[[SHAPE]])
117-
! ONE_DIM_DEFAULT_LB-NEXT: %[[C0_0:.*]] = arith.constant 0
118-
! ONE_DIM_DEFAULT_LB-NEXT: %[[DIMS2:.*]]:3 = fir.box_dims %[[PRIV_ARG_VAL]], %[[C0_0]]
119-
! ONE_DIM_DEFAULT_LB-NEXT: %[[SHAPE_SHIFT:.*]] = fir.shape_shift %[[DIMS2]]#0, %[[DIMS2]]#1
116+
! ONE_DIM_DEFAULT_LB-NEXT: %[[ONE:.*]] = arith.constant 1 : index
117+
! ONE_DIM_DEFAULT_LB-NEXT: %[[TEN:.*]] = arith.constant 10 : index
118+
! ONE_DIM_DEFAULT_LB-NEXT: %[[SHAPE_SHIFT:.*]] = fir.shape_shift %[[ONE]], %[[TEN]]
120119
! ONE_DIM_DEFAULT_LB-NEXT: %[[EMBOX:.*]] = fir.embox %[[DECL]]#0(%[[SHAPE_SHIFT]])
121120
! ONE_DIM_DEFAULT_LB-NEXT: fir.store %[[EMBOX]] to %[[PRIV_BOX_ALLOC]]
122121
! ONE_DIM_DEFAULT_LB-NEXT: omp.yield(%[[PRIV_BOX_ALLOC]] : [[TYPE]])

0 commit comments

Comments
 (0)