| //===-- DataSharingProcessor.cpp --------------------------------*- C++ -*-===// |
| // |
| // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| // See https://llvm.org/LICENSE.txt for license information. |
| // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| // |
| //===----------------------------------------------------------------------===// |
| // |
| // Coding style: https://mlir.llvm.org/getting_started/DeveloperGuide/ |
| // |
| //===----------------------------------------------------------------------===// |
| |
| #include "DataSharingProcessor.h" |
| |
| #include "Utils.h" |
| #include "flang/Lower/PFTBuilder.h" |
| #include "flang/Lower/SymbolMap.h" |
| #include "flang/Optimizer/Builder/HLFIRTools.h" |
| #include "flang/Optimizer/Builder/Todo.h" |
| #include "flang/Semantics/tools.h" |
| |
| namespace Fortran { |
| namespace lower { |
| namespace omp { |
| |
| void DataSharingProcessor::processStep1( |
| mlir::omp::PrivateClauseOps *clauseOps, |
| llvm::SmallVectorImpl<const Fortran::semantics::Symbol *> *privateSyms) { |
| collectSymbolsForPrivatization(); |
| collectDefaultSymbols(); |
| collectImplicitSymbols(); |
| privatize(clauseOps, privateSyms); |
| defaultPrivatize(clauseOps, privateSyms); |
| implicitPrivatize(clauseOps, privateSyms); |
| insertBarrier(); |
| } |
| |
| void DataSharingProcessor::processStep2(mlir::Operation *op, bool isLoop) { |
| // 'sections' lastprivate is handled by genOMP() |
| if (!mlir::isa<mlir::omp::SectionsOp>(op)) { |
| insPt = firOpBuilder.saveInsertionPoint(); |
| copyLastPrivatize(op); |
| firOpBuilder.restoreInsertionPoint(insPt); |
| } |
| |
| if (isLoop) { |
| // push deallocs out of the loop |
| firOpBuilder.setInsertionPointAfter(op); |
| insertDeallocs(); |
| } else { |
| // insert dummy instruction to mark the insertion position |
| mlir::Value undefMarker = firOpBuilder.create<fir::UndefOp>( |
| op->getLoc(), firOpBuilder.getIndexType()); |
| insertDeallocs(); |
| firOpBuilder.setInsertionPointAfter(undefMarker.getDefiningOp()); |
| } |
| } |
| |
| void DataSharingProcessor::insertDeallocs() { |
| for (const Fortran::semantics::Symbol *sym : privatizedSymbols) |
| if (Fortran::semantics::IsAllocatable(sym->GetUltimate())) { |
| if (!useDelayedPrivatization) { |
| converter.createHostAssociateVarCloneDealloc(*sym); |
| return; |
| } |
| |
| Fortran::lower::SymbolBox hsb = converter.lookupOneLevelUpSymbol(*sym); |
| assert(hsb && "Host symbol box not found"); |
| mlir::Type symType = hsb.getAddr().getType(); |
| mlir::Location symLoc = hsb.getAddr().getLoc(); |
| fir::ExtendedValue symExV = converter.getSymbolExtendedValue(*sym); |
| mlir::omp::PrivateClauseOp privatizer = symToPrivatizer.at(sym); |
| |
| symTable->pushScope(); |
| |
| mlir::OpBuilder::InsertionGuard guard(firOpBuilder); |
| |
| mlir::Region &deallocRegion = privatizer.getDeallocRegion(); |
| fir::FirOpBuilder &firOpBuilder = converter.getFirOpBuilder(); |
| mlir::Block *deallocEntryBlock = firOpBuilder.createBlock( |
| &deallocRegion, /*insertPt=*/{}, symType, symLoc); |
| |
| firOpBuilder.setInsertionPointToEnd(deallocEntryBlock); |
| symTable->addSymbol(*sym, |
| fir::substBase(symExV, deallocRegion.getArgument(0))); |
| |
| converter.createHostAssociateVarCloneDealloc(*sym); |
| firOpBuilder.create<mlir::omp::YieldOp>(hsb.getAddr().getLoc()); |
| |
| symTable->popScope(); |
| } |
| } |
| |
| void DataSharingProcessor::cloneSymbol(const Fortran::semantics::Symbol *sym) { |
| // Privatization for symbols which are pre-determined (like loop index |
| // variables) happen separately, for everything else privatize here. |
| if (sym->test(Fortran::semantics::Symbol::Flag::OmpPreDetermined)) |
| return; |
| bool success = converter.createHostAssociateVarClone(*sym); |
| (void)success; |
| assert(success && "Privatization failed due to existing binding"); |
| } |
| |
| void DataSharingProcessor::copyFirstPrivateSymbol( |
| const Fortran::semantics::Symbol *sym, |
| mlir::OpBuilder::InsertPoint *copyAssignIP) { |
| if (sym->test(Fortran::semantics::Symbol::Flag::OmpFirstPrivate)) |
| converter.copyHostAssociateVar(*sym, copyAssignIP); |
| } |
| |
| void DataSharingProcessor::copyLastPrivateSymbol( |
| const Fortran::semantics::Symbol *sym, |
| [[maybe_unused]] mlir::OpBuilder::InsertPoint *lastPrivIP) { |
| if (sym->test(Fortran::semantics::Symbol::Flag::OmpLastPrivate)) |
| converter.copyHostAssociateVar(*sym, lastPrivIP); |
| } |
| |
| void DataSharingProcessor::collectOmpObjectListSymbol( |
| const omp::ObjectList &objects, |
| llvm::SetVector<const Fortran::semantics::Symbol *> &symbolSet) { |
| for (const omp::Object &object : objects) |
| symbolSet.insert(object.id()); |
| } |
| |
| void DataSharingProcessor::collectSymbolsForPrivatization() { |
| bool hasCollapse = false; |
| for (const omp::Clause &clause : clauses) { |
| if (const auto &privateClause = |
| std::get_if<omp::clause::Private>(&clause.u)) { |
| collectOmpObjectListSymbol(privateClause->v, privatizedSymbols); |
| } else if (const auto &firstPrivateClause = |
| std::get_if<omp::clause::Firstprivate>(&clause.u)) { |
| collectOmpObjectListSymbol(firstPrivateClause->v, privatizedSymbols); |
| } else if (const auto &lastPrivateClause = |
| std::get_if<omp::clause::Lastprivate>(&clause.u)) { |
| const ObjectList &objects = std::get<ObjectList>(lastPrivateClause->t); |
| collectOmpObjectListSymbol(objects, privatizedSymbols); |
| hasLastPrivateOp = true; |
| } else if (std::get_if<omp::clause::Collapse>(&clause.u)) { |
| hasCollapse = true; |
| } |
| } |
| |
| if (hasCollapse && hasLastPrivateOp) |
| TODO(converter.getCurrentLocation(), "Collapse clause with lastprivate"); |
| } |
| |
| bool DataSharingProcessor::needBarrier() { |
| // Emit implicit barrier to synchronize threads and avoid data races on |
| // initialization of firstprivate variables and post-update of lastprivate |
| // variables. |
| // Emit implicit barrier for linear clause. Maybe on somewhere else. |
| for (const Fortran::semantics::Symbol *sym : privatizedSymbols) { |
| if (sym->test(Fortran::semantics::Symbol::Flag::OmpFirstPrivate) && |
| sym->test(Fortran::semantics::Symbol::Flag::OmpLastPrivate)) |
| return true; |
| } |
| return false; |
| } |
| |
| void DataSharingProcessor::insertBarrier() { |
| if (needBarrier()) |
| firOpBuilder.create<mlir::omp::BarrierOp>(converter.getCurrentLocation()); |
| } |
| |
| void DataSharingProcessor::insertLastPrivateCompare(mlir::Operation *op) { |
| mlir::omp::LoopNestOp loopOp; |
| if (auto wrapper = mlir::dyn_cast<mlir::omp::LoopWrapperInterface>(op)) |
| loopOp = wrapper.isWrapper() |
| ? mlir::cast<mlir::omp::LoopNestOp>(wrapper.getWrappedLoop()) |
| : nullptr; |
| |
| bool cmpCreated = false; |
| mlir::OpBuilder::InsertionGuard guard(firOpBuilder); |
| for (const omp::Clause &clause : clauses) { |
| if (clause.id != llvm::omp::OMPC_lastprivate) |
| continue; |
| // TODO: Add lastprivate support for simd construct |
| if (mlir::isa<mlir::omp::WsloopOp>(op)) { |
| // Update the original variable just before exiting the worksharing |
| // loop. Conversion as follows: |
| // |
| // omp.wsloop { omp.wsloop { |
| // omp.loop_nest { omp.loop_nest { |
| // ... ... |
| // store ===> store |
| // omp.yield %v = arith.addi %iv, %step |
| // } %cmp = %step < 0 ? %v < %ub : %v > %ub |
| // omp.terminator fir.if %cmp { |
| // } fir.store %v to %loopIV |
| // ^%lpv_update_blk: |
| // } |
| // omp.yield |
| // } |
| // omp.terminator |
| // } |
| |
| // Only generate the compare once in presence of multiple LastPrivate |
| // clauses. |
| if (cmpCreated) |
| continue; |
| cmpCreated = true; |
| |
| mlir::Location loc = loopOp.getLoc(); |
| mlir::Operation *lastOper = loopOp.getRegion().back().getTerminator(); |
| firOpBuilder.setInsertionPoint(lastOper); |
| |
| mlir::Value iv = loopOp.getIVs()[0]; |
| mlir::Value ub = loopOp.getUpperBound()[0]; |
| mlir::Value step = loopOp.getStep()[0]; |
| |
| // v = iv + step |
| // cmp = step < 0 ? v < ub : v > ub |
| mlir::Value v = firOpBuilder.create<mlir::arith::AddIOp>(loc, iv, step); |
| mlir::Value zero = |
| firOpBuilder.createIntegerConstant(loc, step.getType(), 0); |
| mlir::Value negativeStep = firOpBuilder.create<mlir::arith::CmpIOp>( |
| loc, mlir::arith::CmpIPredicate::slt, step, zero); |
| mlir::Value vLT = firOpBuilder.create<mlir::arith::CmpIOp>( |
| loc, mlir::arith::CmpIPredicate::slt, v, ub); |
| mlir::Value vGT = firOpBuilder.create<mlir::arith::CmpIOp>( |
| loc, mlir::arith::CmpIPredicate::sgt, v, ub); |
| mlir::Value cmpOp = firOpBuilder.create<mlir::arith::SelectOp>( |
| loc, negativeStep, vLT, vGT); |
| |
| auto ifOp = firOpBuilder.create<fir::IfOp>(loc, cmpOp, /*else*/ false); |
| firOpBuilder.setInsertionPointToStart(&ifOp.getThenRegion().front()); |
| assert(loopIV && "loopIV was not set"); |
| firOpBuilder.create<fir::StoreOp>(loopOp.getLoc(), v, loopIV); |
| lastPrivIP = firOpBuilder.saveInsertionPoint(); |
| } else if (mlir::isa<mlir::omp::SectionsOp>(op)) { |
| // Already handled by genOMP() |
| } else { |
| TODO(converter.getCurrentLocation(), |
| "lastprivate clause in constructs other than " |
| "simd/worksharing-loop"); |
| } |
| } |
| } |
| |
| static const Fortran::parser::CharBlock * |
| getSource(const Fortran::semantics::SemanticsContext &semaCtx, |
| const Fortran::lower::pft::Evaluation &eval) { |
| const Fortran::parser::CharBlock *source = nullptr; |
| |
| auto ompConsVisit = [&](const Fortran::parser::OpenMPConstruct &x) { |
| std::visit(Fortran::common::visitors{ |
| [&](const Fortran::parser::OpenMPSectionsConstruct &x) { |
| source = &std::get<0>(x.t).source; |
| }, |
| [&](const Fortran::parser::OpenMPLoopConstruct &x) { |
| source = &std::get<0>(x.t).source; |
| }, |
| [&](const Fortran::parser::OpenMPBlockConstruct &x) { |
| source = &std::get<0>(x.t).source; |
| }, |
| [&](const Fortran::parser::OpenMPCriticalConstruct &x) { |
| source = &std::get<0>(x.t).source; |
| }, |
| [&](const Fortran::parser::OpenMPAtomicConstruct &x) { |
| std::visit([&](const auto &x) { source = &x.source; }, |
| x.u); |
| }, |
| [&](const auto &x) { source = &x.source; }, |
| }, |
| x.u); |
| }; |
| |
| eval.visit(Fortran::common::visitors{ |
| [&](const Fortran::parser::OpenMPConstruct &x) { ompConsVisit(x); }, |
| [&](const Fortran::parser::OpenMPDeclarativeConstruct &x) { |
| source = &x.source; |
| }, |
| [&](const Fortran::parser::OmpEndLoopDirective &x) { |
| source = &x.source; |
| }, |
| [&](const auto &x) {}, |
| }); |
| |
| return source; |
| } |
| |
| void DataSharingProcessor::collectSymbolsInNestedRegions( |
| Fortran::lower::pft::Evaluation &eval, |
| Fortran::semantics::Symbol::Flag flag, |
| llvm::SetVector<const Fortran::semantics::Symbol *> |
| &symbolsInNestedRegions) { |
| for (Fortran::lower::pft::Evaluation &nestedEval : |
| eval.getNestedEvaluations()) { |
| if (nestedEval.hasNestedEvaluations()) { |
| if (nestedEval.isConstruct()) |
| // Recursively look for OpenMP constructs within `nestedEval`'s region |
| collectSymbolsInNestedRegions(nestedEval, flag, symbolsInNestedRegions); |
| else |
| converter.collectSymbolSet(nestedEval, symbolsInNestedRegions, flag, |
| /*collectSymbols=*/true, |
| /*collectHostAssociatedSymbols=*/false); |
| } |
| } |
| } |
| |
| // Collect symbols to be default privatized in two steps. |
| // In step 1, collect all symbols in `eval` that match `flag` into |
| // `defaultSymbols`. In step 2, for nested constructs (if any), if and only if |
| // the nested construct is an OpenMP construct, collect those nested |
| // symbols skipping host associated symbols into `symbolsInNestedRegions`. |
| // Later, in current context, all symbols in the set |
| // `defaultSymbols` - `symbolsInNestedRegions` will be privatized. |
| void DataSharingProcessor::collectSymbols( |
| Fortran::semantics::Symbol::Flag flag, |
| llvm::SetVector<const Fortran::semantics::Symbol *> &symbols) { |
| // Collect all scopes associated with 'eval'. |
| llvm::SetVector<const Fortran::semantics::Scope *> clauseScopes; |
| std::function<void(const Fortran::semantics::Scope *)> collectScopes = |
| [&](const Fortran::semantics::Scope *scope) { |
| clauseScopes.insert(scope); |
| for (const Fortran::semantics::Scope &child : scope->children()) |
| collectScopes(&child); |
| }; |
| const Fortran::parser::CharBlock *source = |
| clauses.empty() ? getSource(semaCtx, eval) : &clauses.front().source; |
| const Fortran::semantics::Scope *curScope = nullptr; |
| if (source && !source->empty()) { |
| curScope = &semaCtx.FindScope(*source); |
| collectScopes(curScope); |
| } |
| // Collect all symbols referenced in the evaluation being processed, |
| // that matches 'flag'. |
| llvm::SetVector<const Fortran::semantics::Symbol *> allSymbols; |
| converter.collectSymbolSet(eval, allSymbols, flag, |
| /*collectSymbols=*/true, |
| /*collectHostAssociatedSymbols=*/true); |
| llvm::SetVector<const Fortran::semantics::Symbol *> symbolsInNestedRegions; |
| collectSymbolsInNestedRegions(eval, flag, symbolsInNestedRegions); |
| // Filter-out symbols that must not be privatized. |
| bool collectImplicit = flag == Fortran::semantics::Symbol::Flag::OmpImplicit; |
| auto isPrivatizable = [](const Fortran::semantics::Symbol &sym) -> bool { |
| return !Fortran::semantics::IsProcedure(sym) && |
| !sym.GetUltimate().has<Fortran::semantics::DerivedTypeDetails>() && |
| !sym.GetUltimate().has<Fortran::semantics::NamelistDetails>() && |
| !Fortran::semantics::IsImpliedDoIndex(sym.GetUltimate()); |
| }; |
| for (const auto *sym : allSymbols) { |
| assert(curScope && "couldn't find current scope"); |
| if (isPrivatizable(*sym) && !symbolsInNestedRegions.contains(sym) && |
| !privatizedSymbols.contains(sym) && |
| !sym->test(Fortran::semantics::Symbol::Flag::OmpPreDetermined) && |
| (collectImplicit || |
| !sym->test(Fortran::semantics::Symbol::Flag::OmpImplicit)) && |
| clauseScopes.contains(&sym->owner())) |
| symbols.insert(sym); |
| } |
| } |
| |
| void DataSharingProcessor::collectDefaultSymbols() { |
| using DataSharingAttribute = omp::clause::Default::DataSharingAttribute; |
| for (const omp::Clause &clause : clauses) { |
| if (const auto *defaultClause = |
| std::get_if<omp::clause::Default>(&clause.u)) { |
| if (defaultClause->v == DataSharingAttribute::Private) |
| collectSymbols(Fortran::semantics::Symbol::Flag::OmpPrivate, |
| defaultSymbols); |
| else if (defaultClause->v == DataSharingAttribute::Firstprivate) |
| collectSymbols(Fortran::semantics::Symbol::Flag::OmpFirstPrivate, |
| defaultSymbols); |
| } |
| } |
| } |
| |
| void DataSharingProcessor::collectImplicitSymbols() { |
| // There will be no implicit symbols when a default clause is present. |
| if (defaultSymbols.empty()) |
| collectSymbols(Fortran::semantics::Symbol::Flag::OmpImplicit, |
| implicitSymbols); |
| } |
| |
| void DataSharingProcessor::privatize( |
| mlir::omp::PrivateClauseOps *clauseOps, |
| llvm::SmallVectorImpl<const Fortran::semantics::Symbol *> *privateSyms) { |
| for (const Fortran::semantics::Symbol *sym : privatizedSymbols) { |
| if (const auto *commonDet = |
| sym->detailsIf<Fortran::semantics::CommonBlockDetails>()) { |
| for (const auto &mem : commonDet->objects()) |
| doPrivatize(&*mem, clauseOps, privateSyms); |
| } else |
| doPrivatize(sym, clauseOps, privateSyms); |
| } |
| } |
| |
| void DataSharingProcessor::copyLastPrivatize(mlir::Operation *op) { |
| insertLastPrivateCompare(op); |
| for (const Fortran::semantics::Symbol *sym : privatizedSymbols) |
| if (const auto *commonDet = |
| sym->detailsIf<Fortran::semantics::CommonBlockDetails>()) { |
| for (const auto &mem : commonDet->objects()) { |
| copyLastPrivateSymbol(&*mem, &lastPrivIP); |
| } |
| } else { |
| copyLastPrivateSymbol(sym, &lastPrivIP); |
| } |
| } |
| |
| void DataSharingProcessor::defaultPrivatize( |
| mlir::omp::PrivateClauseOps *clauseOps, |
| llvm::SmallVectorImpl<const Fortran::semantics::Symbol *> *privateSyms) { |
| for (const Fortran::semantics::Symbol *sym : defaultSymbols) |
| doPrivatize(sym, clauseOps, privateSyms); |
| } |
| |
| void DataSharingProcessor::implicitPrivatize( |
| mlir::omp::PrivateClauseOps *clauseOps, |
| llvm::SmallVectorImpl<const Fortran::semantics::Symbol *> *privateSyms) { |
| for (const Fortran::semantics::Symbol *sym : implicitSymbols) |
| doPrivatize(sym, clauseOps, privateSyms); |
| } |
| |
| void DataSharingProcessor::doPrivatize( |
| const Fortran::semantics::Symbol *sym, |
| mlir::omp::PrivateClauseOps *clauseOps, |
| llvm::SmallVectorImpl<const Fortran::semantics::Symbol *> *privateSyms) { |
| if (!useDelayedPrivatization) { |
| cloneSymbol(sym); |
| copyFirstPrivateSymbol(sym); |
| return; |
| } |
| |
| Fortran::lower::SymbolBox hsb = converter.lookupOneLevelUpSymbol(*sym); |
| assert(hsb && "Host symbol box not found"); |
| |
| mlir::Type symType = hsb.getAddr().getType(); |
| mlir::Location symLoc = hsb.getAddr().getLoc(); |
| std::string privatizerName = sym->name().ToString() + ".privatizer"; |
| bool isFirstPrivate = |
| sym->test(Fortran::semantics::Symbol::Flag::OmpFirstPrivate); |
| |
| mlir::omp::PrivateClauseOp privatizerOp = [&]() { |
| auto moduleOp = firOpBuilder.getModule(); |
| auto uniquePrivatizerName = fir::getTypeAsString( |
| symType, converter.getKindMap(), |
| converter.mangleName(*sym) + |
| (isFirstPrivate ? "_firstprivate" : "_private")); |
| |
| if (auto existingPrivatizer = |
| moduleOp.lookupSymbol<mlir::omp::PrivateClauseOp>( |
| uniquePrivatizerName)) |
| return existingPrivatizer; |
| |
| mlir::OpBuilder::InsertionGuard guard(firOpBuilder); |
| firOpBuilder.setInsertionPoint(&moduleOp.getBodyRegion().front(), |
| moduleOp.getBodyRegion().front().begin()); |
| auto result = firOpBuilder.create<mlir::omp::PrivateClauseOp>( |
| symLoc, uniquePrivatizerName, symType, |
| isFirstPrivate ? mlir::omp::DataSharingClauseType::FirstPrivate |
| : mlir::omp::DataSharingClauseType::Private); |
| fir::ExtendedValue symExV = converter.getSymbolExtendedValue(*sym); |
| |
| symTable->pushScope(); |
| |
| // Populate the `alloc` region. |
| { |
| mlir::Region &allocRegion = result.getAllocRegion(); |
| mlir::Block *allocEntryBlock = firOpBuilder.createBlock( |
| &allocRegion, /*insertPt=*/{}, symType, symLoc); |
| |
| firOpBuilder.setInsertionPointToEnd(allocEntryBlock); |
| |
| fir::ExtendedValue localExV = |
| hlfir::translateToExtendedValue( |
| symLoc, firOpBuilder, hlfir::Entity{allocRegion.getArgument(0)}, |
| /*contiguousHint=*/ |
| Fortran::evaluate::IsSimplyContiguous( |
| *sym, converter.getFoldingContext())) |
| .first; |
| |
| symTable->addSymbol(*sym, localExV); |
| symTable->pushScope(); |
| cloneSymbol(sym); |
| firOpBuilder.create<mlir::omp::YieldOp>( |
| hsb.getAddr().getLoc(), |
| symTable->shallowLookupSymbol(*sym).getAddr()); |
| symTable->popScope(); |
| } |
| |
| // Populate the `copy` region if this is a `firstprivate`. |
| if (isFirstPrivate) { |
| mlir::Region ©Region = result.getCopyRegion(); |
| // First block argument corresponding to the original/host value while |
| // second block argument corresponding to the privatized value. |
| mlir::Block *copyEntryBlock = firOpBuilder.createBlock( |
| ©Region, /*insertPt=*/{}, {symType, symType}, {symLoc, symLoc}); |
| firOpBuilder.setInsertionPointToEnd(copyEntryBlock); |
| |
| auto addSymbol = [&](unsigned argIdx, bool force = false) { |
| symExV.match( |
| [&](const fir::MutableBoxValue &box) { |
| symTable->addSymbol( |
| *sym, fir::substBase(box, copyRegion.getArgument(argIdx)), |
| force); |
| }, |
| [&](const auto &box) { |
| symTable->addSymbol(*sym, copyRegion.getArgument(argIdx), force); |
| }); |
| }; |
| |
| addSymbol(0, true); |
| symTable->pushScope(); |
| addSymbol(1); |
| |
| auto ip = firOpBuilder.saveInsertionPoint(); |
| copyFirstPrivateSymbol(sym, &ip); |
| |
| firOpBuilder.create<mlir::omp::YieldOp>( |
| hsb.getAddr().getLoc(), |
| symTable->shallowLookupSymbol(*sym).getAddr()); |
| symTable->popScope(); |
| } |
| |
| symTable->popScope(); |
| return result; |
| }(); |
| |
| if (clauseOps) { |
| clauseOps->privatizers.push_back(mlir::SymbolRefAttr::get(privatizerOp)); |
| clauseOps->privateVars.push_back(hsb.getAddr()); |
| } |
| |
| if (privateSyms) |
| privateSyms->push_back(sym); |
| |
| symToPrivatizer[sym] = privatizerOp; |
| } |
| |
| } // namespace omp |
| } // namespace lower |
| } // namespace Fortran |