//===-- Utils.cpp -----------------------------------------------*- C++ -*-===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// Coding style: https://mlir.llvm.org/getting_started/DeveloperGuide/
//
//===----------------------------------------------------------------------===//

#include "Utils.h"

#include "ClauseFinder.h"
#include "flang/Evaluate/fold.h"
#include "flang/Evaluate/tools.h"
#include <flang/Lower/AbstractConverter.h>
#include <flang/Lower/ConvertType.h>
#include <flang/Lower/DirectivesCommon.h>
#include <flang/Lower/OpenMP/Clauses.h>
#include <flang/Lower/PFTBuilder.h>
#include <flang/Lower/Support/PrivateReductionUtils.h>
#include <flang/Optimizer/Builder/BoxValue.h>
#include <flang/Optimizer/Builder/FIRBuilder.h>
#include <flang/Optimizer/Builder/Todo.h>
#include <flang/Optimizer/HLFIR/HLFIROps.h>
#include <flang/Parser/openmp-utils.h>
#include <flang/Parser/parse-tree.h>
#include <flang/Parser/tools.h>
#include <flang/Semantics/tools.h>
#include <flang/Semantics/type.h>
#include <flang/Utils/OpenMP.h>
#include <llvm/ADT/SmallPtrSet.h>
#include <llvm/ADT/StringRef.h>
#include <llvm/Support/CommandLine.h>

#include <functional>
#include <iterator>

template <typename T>
Fortran::semantics::MaybeIntExpr
EvaluateIntExpr(Fortran::semantics::SemanticsContext &context, const T &expr) {
  if (Fortran::semantics::MaybeExpr maybeExpr{
          Fold(context.foldingContext(), AnalyzeExpr(context, expr))}) {
    if (auto *intExpr{
            Fortran::evaluate::UnwrapExpr<Fortran::semantics::SomeIntExpr>(
                *maybeExpr)}) {
      return std::move(*intExpr);
    }
  }
  return std::nullopt;
}

template <typename T>
std::optional<std::int64_t>
EvaluateInt64(Fortran::semantics::SemanticsContext &context, const T &expr) {
  return Fortran::evaluate::ToInt64(EvaluateIntExpr(context, expr));
}

llvm::cl::opt<bool> treatIndexAsSection(
    "openmp-treat-index-as-section",
    llvm::cl::desc("In the OpenMP data clauses treat `a(N)` as `a(N:N)`."),
    llvm::cl::init(true));

namespace Fortran {
namespace lower {
namespace omp {

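/// Looks up, or lazily generates, an implicit default declare-mapper for
/// \p recordType under the symbol name \p mapperNameStr, returning a symbol
/// reference to it (or an empty attribute when no name is provided). Each
/// component of the record is mapped with implicit to/from flags, and nested
/// record components recursively receive their own default mappers.
///
/// Rough sketch of the generated IR, for orientation only (types and op
/// syntax are abbreviated and not verbatim; component names are made up):
///
///   omp.declare_mapper @<mapperNameStr> : !fir.type<dt{x:i32, y:f32}> {
///   ^bb0(%arg0: !fir.ref<!fir.type<dt{...}>>):
///     // one omp.map.info (to, from, implicit) per component of `dt`,
///     // one parent omp.map.info carrying those members,
///     // terminated by a DeclareMapperInfoOp listing the map entries
///   }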
mlir::FlatSymbolRefAttr getOrGenImplicitDefaultDeclareMapper(
    lower::AbstractConverter &converter, mlir::Location loc,
    fir::RecordType recordType, llvm::StringRef mapperNameStr) {
  if (mapperNameStr.empty())
    return {};

  if (converter.getModuleOp().lookupSymbol(mapperNameStr))
    return mlir::FlatSymbolRefAttr::get(&converter.getMLIRContext(),
                                        mapperNameStr);

  fir::FirOpBuilder &firOpBuilder = converter.getFirOpBuilder();
  mlir::OpBuilder::InsertionGuard guard(firOpBuilder);

  firOpBuilder.setInsertionPointToStart(converter.getModuleOp().getBody());
  auto declMapperOp = mlir::omp::DeclareMapperOp::create(
      firOpBuilder, loc, mapperNameStr, recordType);
  auto &region = declMapperOp.getRegion();
  firOpBuilder.createBlock(&region);
  auto mapperArg = region.addArgument(firOpBuilder.getRefType(recordType), loc);

  auto declareOp = hlfir::DeclareOp::create(firOpBuilder, loc, mapperArg,
                                            /*uniq_name=*/"");

  const auto genBoundsOps = [&](mlir::Value mapVal,
                                llvm::SmallVectorImpl<mlir::Value> &bounds) {
    fir::ExtendedValue extVal =
        hlfir::translateToExtendedValue(mapVal.getLoc(), firOpBuilder,
                                        hlfir::Entity{mapVal},
                                        /*contiguousHint=*/true)
            .first;
    fir::factory::AddrAndBoundsInfo info = fir::factory::getDataOperandBaseAddr(
        firOpBuilder, mapVal, /*isOptional=*/false, mapVal.getLoc());
    bounds = fir::factory::genImplicitBoundsOps<mlir::omp::MapBoundsOp,
                                                mlir::omp::MapBoundsType>(
        firOpBuilder, info, extVal,
        /*dataExvIsAssumedSize=*/false, mapVal.getLoc());
  };

  const auto getFieldRef = [&](mlir::Value rec, llvm::StringRef fieldName,
                               mlir::Type fieldTy, mlir::Type recType) {
    mlir::Value field = fir::FieldIndexOp::create(
        firOpBuilder, loc, fir::FieldType::get(recType.getContext()), fieldName,
        recType, fir::getTypeParams(rec));
    return fir::CoordinateOp::create(
        firOpBuilder, loc, firOpBuilder.getRefType(fieldTy), rec, field);
  };

  llvm::SmallVector<mlir::Value> clauseMapVars;
  llvm::SmallVector<llvm::SmallVector<int64_t>> memberPlacementIndices;
  llvm::SmallVector<mlir::Value> memberMapOps;

  mlir::omp::ClauseMapFlags mapFlag = mlir::omp::ClauseMapFlags::to |
                                      mlir::omp::ClauseMapFlags::from |
                                      mlir::omp::ClauseMapFlags::implicit;
  mlir::omp::VariableCaptureKind captureKind =
      mlir::omp::VariableCaptureKind::ByRef;

  for (const auto &entry : llvm::enumerate(recordType.getTypeList())) {
    const auto &memberName = entry.value().first;
    const auto &memberType = entry.value().second;
    mlir::FlatSymbolRefAttr mapperId;
    if (auto recType = mlir::dyn_cast<fir::RecordType>(
            fir::getFortranElementType(memberType))) {
      std::string mapperIdName =
          recType.getName().str() + llvm::omp::OmpDefaultMapperName;
      if (auto *sym = converter.getCurrentScope().FindSymbol(mapperIdName))
        mapperIdName = converter.mangleName(mapperIdName, sym->owner());
      else if (auto *memberSym =
                   converter.getCurrentScope().FindSymbol(memberName))
        mapperIdName = converter.mangleName(mapperIdName, memberSym->owner());

      mapperId = getOrGenImplicitDefaultDeclareMapper(converter, loc, recType,
                                                      mapperIdName);
    }

    auto ref =
        getFieldRef(declareOp.getBase(), memberName, memberType, recordType);
    llvm::SmallVector<mlir::Value> bounds;
    genBoundsOps(ref, bounds);
    mlir::Value mapOp = Fortran::utils::openmp::createMapInfoOp(
        firOpBuilder, loc, ref, /*varPtrPtr=*/mlir::Value{}, /*name=*/"",
        bounds,
        /*members=*/{},
        /*membersIndex=*/mlir::ArrayAttr{}, mapFlag, captureKind, ref.getType(),
        /*partialMap=*/false, mapperId);
    memberMapOps.emplace_back(mapOp);
    memberPlacementIndices.emplace_back(
        llvm::SmallVector<int64_t>{(int64_t)entry.index()});
  }

  llvm::SmallVector<mlir::Value> bounds;
  genBoundsOps(declareOp.getOriginalBase(), bounds);
  mlir::omp::ClauseMapFlags parentMapFlag = mlir::omp::ClauseMapFlags::implicit;
  mlir::omp::MapInfoOp mapOp = Fortran::utils::openmp::createMapInfoOp(
      firOpBuilder, loc, declareOp.getOriginalBase(),
      /*varPtrPtr=*/mlir::Value(), /*name=*/"", bounds, memberMapOps,
      firOpBuilder.create2DI64ArrayAttr(memberPlacementIndices), parentMapFlag,
      captureKind, declareOp.getType(0),
      /*partialMap=*/true);

  clauseMapVars.emplace_back(mapOp);
  mlir::omp::DeclareMapperInfoOp::create(firOpBuilder, loc, clauseMapVars);
  return mlir::FlatSymbolRefAttr::get(&converter.getMLIRContext(),
                                      mapperNameStr);
}

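/// Returns true if \p typeSpec needs an implicit default declare-mapper, i.e.
/// it is an ISO C interoperable type or it (directly or transitively)
/// contains an ALLOCATABLE component.
///
/// For example (illustrative Fortran, not tied to any particular test):
///
///   type inner
///     integer, allocatable :: buf(:)   ! triggers the mapper requirement
///   end type
///   type outer
///     type(inner) :: payload           ! outer requires one transitively
///   end type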
bool requiresImplicitDefaultDeclareMapper(
    const semantics::DerivedTypeSpec &typeSpec) {
  // ISO C interoperable types (e.g., c_ptr, c_funptr) must always have
  // implicit default mappers available so that OpenMP offloading can correctly
  // map them.
  if (semantics::IsIsoCType(&typeSpec))
    return true;

  llvm::SmallPtrSet<const semantics::DerivedTypeSpec *, 8> visited;

  std::function<bool(const semantics::DerivedTypeSpec &)> requiresMapper =
      [&](const semantics::DerivedTypeSpec &spec) -> bool {
    if (!visited.insert(&spec).second)
      return false;

    semantics::DirectComponentIterator directComponents{spec};
    for (const semantics::Symbol &component : directComponents) {
      if (component.attrs().test(semantics::Attr::ALLOCATABLE))
        return true;

      if (const semantics::DeclTypeSpec *declType = component.GetType())
        if (const auto *nested = declType->AsDerived())
          if (requiresMapper(*nested))
            return true;
    }
    return false;
  };

  return requiresMapper(typeSpec);
}

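/// Returns the value of the COLLAPSE clause in \p clauses, or 1 when the
/// clause is absent. For instance, `collapse(2)` yields 2, so two nested DO
/// loops are treated as a single logical loop nest. (Example clause shown for
/// illustration; the clause argument must fold to a constant.)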
int64_t getCollapseValue(const List<Clause> &clauses) {
  auto iter = llvm::find_if(clauses, [](const Clause &clause) {
    return clause.id == llvm::omp::Clause::OMPC_collapse;
  });
  if (iter != clauses.end()) {
    const auto &collapse = std::get<clause::Collapse>(iter->u);
    return evaluate::ToInt64(collapse.v).value();
  }
  return 1;
}

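/// Collects the MLIR values bound to the symbols in \p objects into
/// \p operands, resolving host-associated symbols to their host binding and
/// copying that binding onto the local symbol.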
void genObjectList(const ObjectList &objects,
                   lower::AbstractConverter &converter,
                   llvm::SmallVectorImpl<mlir::Value> &operands) {
  for (const Object &object : objects) {
    const semantics::Symbol *sym = object.sym();
    assert(sym && "Expected Symbol");
    if (mlir::Value variable = converter.getSymbolAddress(*sym)) {
      operands.push_back(variable);
    } else if (const auto *details =
                   sym->detailsIf<semantics::HostAssocDetails>()) {
      operands.push_back(converter.getSymbolAddress(details->symbol()));
      converter.copySymbolBinding(details->symbol(), *sym);
    }
  }
}

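/// Returns the integer type to use for an OpenMP loop induction variable whose
/// Fortran storage size is \p loopVarTypeSize bytes. The OpenMP runtime only
/// handles 32-bit and 64-bit induction variables, so smaller kinds are widened
/// and larger kinds are narrowed (with a warning). As an illustration,
/// integer(1) and integer(2) variables both lower to i32, integer(8) to i64,
/// and an integer(16) variable would be narrowed to i64.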
mlir::Type getLoopVarType(lower::AbstractConverter &converter,
                          std::size_t loopVarTypeSize) {
  // OpenMP runtime requires 32-bit or 64-bit loop variables.
  loopVarTypeSize = loopVarTypeSize * 8;
  if (loopVarTypeSize < 32) {
    loopVarTypeSize = 32;
  } else if (loopVarTypeSize > 64) {
    loopVarTypeSize = 64;
    mlir::emitWarning(converter.getCurrentLocation(),
                      "OpenMP loop iteration variable cannot have more than 64 "
                      "bits size and will be narrowed into 64 bits.");
  }
  assert((loopVarTypeSize == 32 || loopVarTypeSize == 64) &&
         "OpenMP loop iteration variable size must be transformed into 32-bit "
         "or 64-bit");
  return converter.getFirOpBuilder().getIntegerType(loopVarTypeSize);
}

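/// Returns the symbol of the iteration variable of the DO construct evaluated
/// by \p eval, or nullptr if \p eval is not a DO loop with explicit bounds
/// (e.g. a DO WHILE or an infinite DO has no such symbol).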
semantics::Symbol *
getIterationVariableSymbol(const lower::pft::Evaluation &eval) {
  return eval.visit(common::visitors{
      [&](const parser::DoConstruct &doLoop) {
        if (const auto &maybeCtrl = doLoop.GetLoopControl()) {
          using LoopControl = parser::LoopControl;
          if (auto *bounds = std::get_if<LoopControl::Bounds>(&maybeCtrl->u)) {
            static_assert(std::is_same_v<decltype(bounds->name),
                                         parser::Scalar<parser::Name>>);
            return bounds->name.thing.symbol;
          }
        }
        return static_cast<semantics::Symbol *>(nullptr);
      },
      [](auto &&) { return static_cast<semantics::Symbol *>(nullptr); },
  });
}

void gatherFuncAndVarSyms(
    const ObjectList &objects, mlir::omp::DeclareTargetCaptureClause clause,
    llvm::SmallVectorImpl<DeclareTargetCaptureInfo> &symbolAndClause,
    bool automap) {
  for (const Object &object : objects)
    symbolAndClause.emplace_back(clause, *object.sym(), automap);
}

// This function gathers the individual omp::Objects that make up a
// larger omp::Object symbol.
//
// For example, provided the larger symbol "parent%child%member", this
// function breaks it up into its constituent components ("parent",
// "child", "member") so that each individual component can be accessed
// and introspected. Note that the function breaks the symbol up from
// RHS to LHS ("member" to "parent") and then reverses the result, so the
// returned omp::ObjectList is ordered LHS to RHS, with "parent" at the
// beginning.
omp::ObjectList gatherObjectsOf(omp::Object derivedTypeMember,
                                semantics::SemanticsContext &semaCtx) {
  omp::ObjectList objList;
  std::optional<omp::Object> baseObj = derivedTypeMember;
  while (baseObj.has_value()) {
    objList.push_back(baseObj.value());
    baseObj = getBaseObject(baseObj.value(), semaCtx);
  }
  return omp::ObjectList{llvm::reverse(objList)};
}

// This function generates a series of indices from a provided omp::Object
// that devolves to an ArrayRef symbol. For example, for "array(2,3,4)" it
// generates the indices "[1][2][3]", offsetting each subscript by -1 to
// account for Fortran's one-based indexing.
//
// These indices can then be provided to a coordinate operation or other
// GEP-like operation to access the relevant positional member of the
// array.
//
// Note that the function currently only supports integer subscripts, not
// triplets, i.e. array(1:2:3).
static void generateArrayIndices(lower::AbstractConverter &converter,
                                 fir::FirOpBuilder &firOpBuilder,
                                 lower::StatementContext &stmtCtx,
                                 mlir::Location clauseLocation,
                                 llvm::SmallVectorImpl<mlir::Value> &indices,
                                 omp::Object object) {
  auto maybeRef = evaluate::ExtractDataRef(*object.ref());
  if (!maybeRef)
    return;

  auto *arr = std::get_if<evaluate::ArrayRef>(&maybeRef->u);
  if (!arr)
    return;

  for (auto v : arr->subscript()) {
    if (std::holds_alternative<Triplet>(v.u))
      TODO(clauseLocation, "Triplet indexing in map clause is unsupported");
    auto expr = std::get<Fortran::evaluate::IndirectSubscriptIntegerExpr>(v.u);
    mlir::Value subscript =
        fir::getBase(converter.genExprValue(toEvExpr(expr.value()), stmtCtx));
    indices.push_back(firOpBuilder.createConvert(
        clauseLocation, firOpBuilder.getIndexType(), subscript));
  }
}

/// When mapping members of derived types, there is a chance that one of the
/// members along the way to the mapped member is a descriptor. In that case
/// we have to make sure we generate a map for those intermediate members,
/// otherwise we would be missing a chunk of data required to actually map the
/// member type to the device. This function generates these maps and the
/// appropriate data accesses required to generate them. It avoids creating
/// duplicate maps, as duplicates are often just as bad as unmapped descriptor
/// data for the runtime (and unnecessary data movement should be avoided
/// where possible).
///
/// As an example, for the following mapping:
///
///   type :: vertexes
///     integer(4), allocatable :: vertexx(:)
///     integer(4), allocatable :: vertexy(:)
///   end type vertexes
///
///   type :: dtype
///     real(4) :: i
///     type(vertexes), allocatable :: vertexes(:)
///   end type dtype
///
///   type(dtype), allocatable :: alloca_dtype
///
///   !$omp target map(tofrom: alloca_dtype%vertexes(N1)%vertexx)
///
/// The below HLFIR/FIR is generated (trimmed for conciseness):
///
/// On the first iteration we index into the record type alloca_dtype to
/// access "vertexes"; we then generate a map for this descriptor alongside
/// bounds to indicate that we only need the one member, rather than the
/// whole array block in this case (in theory we could map its entirety at
/// the cost of data transfer bandwidth).
///
/// %13:2 = hlfir.declare ... "alloca_dtype" ...
/// %39 = fir.load %13#0 : ...
/// %40 = fir.coordinate_of %39, %c1 : ...
/// %51 = omp.map.info var_ptr(%40 : ...) map_clauses(to) capture(ByRef) ...
/// %52 = fir.load %40 : ...
///
/// Second iteration, generating the access to "vertexes(N1)" utilising the
/// N1 index:
/// %53 = load N1 ...
/// %54 = fir.convert %53 : (i32) -> i64
/// %55 = fir.convert %54 : (i64) -> index
/// %56 = arith.subi %55, %c1 : index
/// %57 = fir.coordinate_of %52, %56 : ...
///
/// Still in the second iteration we access the allocatable member "vertexx".
/// We return %58 from the function and provide it to the final and "main"
/// map of processMap (generated by the record type segment of the function
/// below). If this were not the final symbol in the list, i.e. we accessed a
/// member below vertexx, we would have generated the map below as we did in
/// the first iteration and then continued to generate further coordinates to
/// access further components as required.
///
/// %58 = fir.coordinate_of %57, %c0 : ...
/// %61 = omp.map.info var_ptr(%58 : ...) map_clauses(to) capture(ByRef) ...
///
/// The parent mapping containing the previously generated member maps is
/// generated at a later step, but is shown here to showcase the "end" result:
///
/// omp.map.info var_ptr(%13#1 : ...) map_clauses(to) capture(ByRef)
///   members(%50, %61 : [0, 1, 0], [0, 1, 0] : ...
///
/// \param objectList - The list of omp::Object symbol data for each parent
///  to the mapped member (also includes the mapped member), generated via
///  gatherObjectsOf.
/// \param indices - List of index data associated with the mapped member
///  symbol, which identifies the placement of the member in its parent;
///  this helps generate the appropriate member accesses. These indices
///  can be generated via generateMemberPlacementIndices.
/// \param asFortran - A string generated from the mapped variable to be
///  associated with the main map, generally (but not exclusively)
///  generated via gatherDataOperandAddrAndBounds or other
///  DirectivesCommon.h utilities.
/// \param mapTypeBits - The map flags that will be associated with the
///  generated maps, minus alterations of the TO and FROM bits for the
///  intermediate components to prevent accidental overwriting on device
///  write back.
mlir::Value createParentSymAndGenIntermediateMaps(
    mlir::Location clauseLocation, lower::AbstractConverter &converter,
    semantics::SemanticsContext &semaCtx, lower::StatementContext &stmtCtx,
    omp::ObjectList &objectList, llvm::SmallVectorImpl<int64_t> &indices,
    OmpMapParentAndMemberData &parentMemberIndices, llvm::StringRef asFortran,
    mlir::omp::ClauseMapFlags mapTypeBits) {
  fir::FirOpBuilder &firOpBuilder = converter.getFirOpBuilder();

  /// Checks if an omp::Object is an array expression with a subscript, e.g.
  /// array(1,2).
  auto isArrayExprWithSubscript = [](omp::Object obj) {
    if (auto maybeRef = evaluate::ExtractDataRef(obj.ref())) {
      evaluate::DataRef ref = *maybeRef;
      if (auto *arr = std::get_if<evaluate::ArrayRef>(&ref.u))
        return !arr->subscript().empty();
    }
    return false;
  };

  // Generate the access to the original parent base address.
  fir::factory::AddrAndBoundsInfo parentBaseAddr =
      lower::getDataOperandBaseAddr(converter, firOpBuilder,
                                    *objectList[0].sym(), clauseLocation);
  mlir::Value curValue = parentBaseAddr.addr;

  // Iterate over all objects in the objectList; this should consist of all
  // record types between the parent and the member being mapped (including
  // the parent). The object list may also contain array objects, which can
  // occur when specifying bounds or a specific element access within a
  // member map; we skip these.
  size_t currentIndicesIdx = 0;
  for (size_t i = 0; i < objectList.size(); ++i) {
    // If we encounter a sequence type, i.e. an array, we must generate the
    // correct coordinate operation to index into the array to proceed
    // further; this is currently only relevant in cases where we encounter
    // subscripts.
    //
    // For example, in the following case:
    //
    //   map(tofrom: array_dtype(4)%internal_dtypes(3)%float_elements(4))
    //
    // we must generate coordinate operation accesses for each subscript
    // we encounter.
    if (fir::SequenceType arrType = mlir::dyn_cast<fir::SequenceType>(
            fir::unwrapPassByRefType(curValue.getType()))) {
      if (isArrayExprWithSubscript(objectList[i])) {
        llvm::SmallVector<mlir::Value> subscriptIndices;
        generateArrayIndices(converter, firOpBuilder, stmtCtx, clauseLocation,
                             subscriptIndices, objectList[i]);
        assert(!subscriptIndices.empty() &&
               "missing expected indices for map clause");
        if (auto boxTy = llvm::dyn_cast<fir::BaseBoxType>(curValue.getType())) {
          // To accommodate indexing into box types of all dimensions,
          // including negative dimensions, we have to take into consideration
          // the lower bounds and extents of the data (stored in the box) and
          // convey them to the ArrayCoorOp so that it can appropriately
          // access the element utilising the subscript we provide and the
          // runtime sizes stored in the box. To do so we generate a
          // ShapeShiftOp which combines both the lb (ShiftOp) and extent
          // (ShapeOp) of the box, giving the ArrayCoorOp the spatial
          // information it needs to calculate the underlying address.
          mlir::Value shapeShift = Fortran::lower::getShapeShift(
              firOpBuilder, clauseLocation, curValue);
          auto addrOp =
              fir::BoxAddrOp::create(firOpBuilder, clauseLocation, curValue);
          curValue = fir::ArrayCoorOp::create(
              firOpBuilder, clauseLocation,
              firOpBuilder.getRefType(arrType.getEleTy()), addrOp, shapeShift,
              /*slice=*/mlir::Value{}, subscriptIndices,
              /*typeparms=*/mlir::ValueRange{});
        } else {
          // We subtract one from each subscript in the non-box case because,
          // unlike the box case, we do not have the shape generated from the
          // dimensions to help adjust the indexing.
          // TODO/FIXME: This may need to be adjusted to support bounds of
          // unusual dimensions; if that is the case, it is likely best to
          // fold this branch into the one above.
          mlir::Value one = firOpBuilder.createIntegerConstant(
              clauseLocation, firOpBuilder.getIndexType(), 1);
          for (auto &v : subscriptIndices)
            v = mlir::arith::SubIOp::create(firOpBuilder, clauseLocation, v,
                                            one);
          curValue = fir::CoordinateOp::create(
              firOpBuilder, clauseLocation,
              firOpBuilder.getRefType(arrType.getEleTy()), curValue,
              subscriptIndices);
        }
      }
    }

    // If we encounter a record type, we must access the subsequent member by
    // indexing into it and creating a coordinate operation to do so. We
    // utilise the index information generated previously and passed in to
    // work out the correct member to access and the corresponding member
    // type.
    if (fir::RecordType recordType = mlir::dyn_cast<fir::RecordType>(
            fir::unwrapPassByRefType(curValue.getType()))) {
      fir::IntOrValue idxConst = mlir::IntegerAttr::get(
          firOpBuilder.getI32Type(), indices[currentIndicesIdx]);
      mlir::Type memberTy = recordType.getType(indices[currentIndicesIdx]);
      curValue = fir::CoordinateOp::create(
          firOpBuilder, clauseLocation, firOpBuilder.getRefType(memberTy),
          curValue, llvm::SmallVector<fir::IntOrValue, 1>{idxConst});

      // If we're a final member, the map will be generated by the processMap
      // call that invoked this function.
      if (currentIndicesIdx == indices.size() - 1)
        break;

      // Skip the mapping and the subsequent load if we're not a type with a
      // descriptor, such as a pointer/allocatable. If we're not a type with a
      // descriptor then we have no need of generating an intermediate map for
      // it, as we only need to generate a map if a member is a descriptor
      // type (and thus obscures the members it contains via a pointer whose
      // data needs to be mapped).
      if (!fir::isTypeWithDescriptor(memberTy)) {
        currentIndicesIdx++;
        continue;
      }

      llvm::SmallVector<int64_t> interimIndices(
          indices.begin(), std::next(indices.begin(), currentIndicesIdx + 1));
      // Verify we haven't already created a map for this particular member by
      // checking the list of members already mapped for the current parent,
      // stored in the parentMemberIndices structure.
      if (!parentMemberIndices.isDuplicateMemberMapInfo(interimIndices)) {
        // Generate bounds operations using the standard lowering utility.
        // Unfortunately this currently does a bit more than just generate
        // bounds, and we discard the other bits. It may be useful to extend
        // the utility to just provide bounds in the future.
        llvm::SmallVector<mlir::Value> interimBounds;
        if (i + 1 < objectList.size() &&
            objectList[i + 1].sym()->IsObjectArray()) {
          std::stringstream interimFortran;
          Fortran::lower::gatherDataOperandAddrAndBounds<
              mlir::omp::MapBoundsOp, mlir::omp::MapBoundsType>(
              converter, converter.getFirOpBuilder(), semaCtx,
              converter.getFctCtx(), *objectList[i + 1].sym(),
              objectList[i + 1].ref(), clauseLocation, interimFortran,
              interimBounds, treatIndexAsSection);
        }

        // Remove all map-type bits (e.g. TO, FROM, etc.) from the
        // intermediate allocatable maps, as we simply wish to alloc or
        // release them. It may be safer to just pass OMP_MAP_NONE as the map
        // type, but we may still need some of the other map types the mapped
        // member utilises, so for now it's good to keep an eye on this.
        mlir::omp::ClauseMapFlags interimMapType = mapTypeBits;
        interimMapType &= ~mlir::omp::ClauseMapFlags::to;
        interimMapType &= ~mlir::omp::ClauseMapFlags::from;
        interimMapType &= ~mlir::omp::ClauseMapFlags::return_param;

        // Create a map for the intermediate member and insert it and its
        // indices into the parentMemberIndices list to track it.
        mlir::omp::MapInfoOp mapOp = utils::openmp::createMapInfoOp(
            firOpBuilder, clauseLocation, curValue,
            /*varPtrPtr=*/mlir::Value{}, asFortran,
            /*bounds=*/interimBounds,
            /*members=*/{},
            /*membersIndex=*/mlir::ArrayAttr{}, interimMapType,
            mlir::omp::VariableCaptureKind::ByRef, curValue.getType());

        parentMemberIndices.memberPlacementIndices.push_back(interimIndices);
        parentMemberIndices.memberMap.push_back(mapOp);
      }

      // Load the currently accessed member, so we can continue to access
      // further segments.
      curValue = fir::LoadOp::create(firOpBuilder, clauseLocation, curValue);
      currentIndicesIdx++;
    }
  }
  return curValue;
}

static int64_t
getComponentPlacementInParent(const semantics::Symbol *componentSym) {
  const auto *derived = componentSym->owner()
                            .derivedTypeSpec()
                            ->typeSymbol()
                            .detailsIf<semantics::DerivedTypeDetails>();
  assert(derived &&
         "expected derived type details when processing component symbol");
  for (auto [placement, name] : llvm::enumerate(derived->componentNames()))
    if (name == componentSym->name())
      return placement;
  return -1;
}

static std::optional<Object>
getComponentObject(std::optional<Object> object,
                   semantics::SemanticsContext &semaCtx) {
  if (!object)
    return std::nullopt;

  auto ref = evaluate::ExtractDataRef(object.value().ref());
  if (!ref)
    return std::nullopt;

  if (std::holds_alternative<evaluate::Component>(ref->u))
    return object;

  auto baseObj = getBaseObject(object.value(), semaCtx);
  if (!baseObj)
    return std::nullopt;

  return getComponentObject(baseObj.value(), semaCtx);
}

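/// Computes the component placement indices of \p object within its parent
/// derived type(s) and stores them, outermost first, in \p indices.
///
/// Illustrative example (made-up type layout): for "parent%child%member",
/// where `child` is the third component declared in parent's type and
/// `member` is the first component of child's type, the result is {2, 0}.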
void generateMemberPlacementIndices(const Object &object,
                                    llvm::SmallVectorImpl<int64_t> &indices,
                                    semantics::SemanticsContext &semaCtx) {
  assert(indices.empty() && "indices vector passed to "
                            "generateMemberPlacementIndices should be empty");
  auto compObj = getComponentObject(object, semaCtx);

  while (compObj) {
    int64_t index = getComponentPlacementInParent(compObj->sym());
    assert(
        index >= 0 &&
        "unexpected index value returned from getComponentPlacementInParent");
    indices.push_back(index);
    compObj =
        getComponentObject(getBaseObject(compObj.value(), semaCtx), semaCtx);
  }

  indices = llvm::SmallVector<int64_t>{llvm::reverse(indices)};
}

void OmpMapParentAndMemberData::addChildIndexAndMapToParent(
    const omp::Object &object, mlir::omp::MapInfoOp &mapOp,
    semantics::SemanticsContext &semaCtx) {
  llvm::SmallVector<int64_t> indices;
  generateMemberPlacementIndices(object, indices, semaCtx);
  memberPlacementIndices.push_back(indices);
  memberMap.push_back(mapOp);
}

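/// Returns true if \p object, or any parent component on the way to it, is an
/// ALLOCATABLE or object POINTER. For example, with the (illustrative)
/// reference "dtype%alloca_member%data", the presence of the allocatable
/// "alloca_member" in the chain makes this return true even when "data"
/// itself is neither allocatable nor a pointer.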
bool isMemberOrParentAllocatableOrPointer(
    const Object &object, semantics::SemanticsContext &semaCtx) {
  if (semantics::IsAllocatableOrObjectPointer(object.sym()))
    return true;

  auto compObj = getBaseObject(object, semaCtx);
  while (compObj) {
    if (semantics::IsAllocatableOrObjectPointer(compObj.value().sym()))
      return true;
    compObj = getBaseObject(compObj.value(), semaCtx);
  }

  return false;
}

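/// For each parent object in \p parentMemberIndices, attaches the previously
/// generated member omp.map.info operations to the parent's map. If the
/// parent was mapped explicitly, its existing map is updated in place (and
/// any default mapper on it dropped); otherwise a new parent map is created
/// and appended to \p mapOperands / \p mapSyms.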
void insertChildMapInfoIntoParent(
    lower::AbstractConverter &converter, semantics::SemanticsContext &semaCtx,
    lower::StatementContext &stmtCtx,
    std::map<Object, OmpMapParentAndMemberData> &parentMemberIndices,
    llvm::SmallVectorImpl<mlir::Value> &mapOperands,
    llvm::SmallVectorImpl<const semantics::Symbol *> &mapSyms) {
  fir::FirOpBuilder &firOpBuilder = converter.getFirOpBuilder();
  for (auto indices : parentMemberIndices) {
    auto *parentIter =
        llvm::find_if(mapSyms, [&indices](const semantics::Symbol *v) {
          return v == indices.first.sym();
        });
    if (parentIter != mapSyms.end()) {
      auto mapOp = llvm::cast<mlir::omp::MapInfoOp>(
          mapOperands[std::distance(mapSyms.begin(), parentIter)]
              .getDefiningOp());

      // Once explicit members are attached to a parent map, do not also invoke
      // a declare mapper on it, otherwise the mapper would remap the same
      // components, leading to duplicate mappings at runtime.
      if (!indices.second.memberMap.empty() && mapOp.getMapperIdAttr())
        mapOp.setMapperIdAttr(nullptr);

      // NOTE: To maintain appropriate SSA ordering, we move the parent map,
      // which will now have references to its children, after the last of its
      // members to be generated. This is necessary when a user has defined a
      // series of parent and child maps where the parent precedes the
      // children. An alternative may be to delay generation of map info
      // operations from the clauses and organize them first before
      // generation, or to use the topologicalSort utility, which would
      // enforce a stronger SSA dominance ordering at the cost of
      // efficiency/time.
      mapOp->moveAfter(indices.second.memberMap.back());

      for (mlir::omp::MapInfoOp memberMap : indices.second.memberMap)
        mapOp.getMembersMutable().append(memberMap.getResult());

      mapOp.setMembersIndexAttr(firOpBuilder.create2DI64ArrayAttr(
          indices.second.memberPlacementIndices));
    } else {
      // NOTE: We take the map type of the first child; this may not be the
      // correct thing to do, however, for the moment it allows this to work
      // with enter and exit without causing MLIR verification issues. The
      // more appropriate thing may be to take the "main" map type clause from
      // the directive being used.
      mlir::omp::ClauseMapFlags mapType =
          indices.second.memberMap[0].getMapType();

      llvm::SmallVector<mlir::Value> members;
      members.reserve(indices.second.memberMap.size());
      for (mlir::omp::MapInfoOp memberMap : indices.second.memberMap)
        members.push_back(memberMap.getResult());

      // Create the parent map to emplace and bind the members.
      llvm::SmallVector<mlir::Value> bounds;
      std::stringstream asFortran;
      fir::factory::AddrAndBoundsInfo info =
          lower::gatherDataOperandAddrAndBounds<mlir::omp::MapBoundsOp,
                                                mlir::omp::MapBoundsType>(
              converter, firOpBuilder, semaCtx, converter.getFctCtx(),
              *indices.first.sym(), indices.first.ref(),
              converter.getCurrentLocation(), asFortran, bounds,
              treatIndexAsSection);

      mlir::omp::MapInfoOp mapOp = utils::openmp::createMapInfoOp(
          firOpBuilder, info.rawInput.getLoc(), info.rawInput,
          /*varPtrPtr=*/mlir::Value(), asFortran.str(), bounds, members,
          firOpBuilder.create2DI64ArrayAttr(
              indices.second.memberPlacementIndices),
          mapType, mlir::omp::VariableCaptureKind::ByRef,
          info.rawInput.getType(),
          /*partialMap=*/true);

      mapOperands.push_back(mapOp);
      mapSyms.push_back(indices.first.sym());
    }
  }
}

void lastprivateModifierNotSupported(const omp::clause::Lastprivate &lastp,
                                     mlir::Location loc) {
  using Lastprivate = omp::clause::Lastprivate;
  auto &maybeMod =
      std::get<std::optional<Lastprivate::LastprivateModifier>>(lastp.t);
  if (maybeMod) {
    assert(*maybeMod == Lastprivate::LastprivateModifier::Conditional &&
           "Unexpected lastprivate modifier");
    TODO(loc, "lastprivate clause with CONDITIONAL modifier");
  }
}

static void convertLoopBounds(lower::AbstractConverter &converter,
                              mlir::Location loc,
                              mlir::omp::LoopRelatedClauseOps &result,
                              std::size_t loopVarTypeSize) {
  fir::FirOpBuilder &firOpBuilder = converter.getFirOpBuilder();
  // The types of lower bound, upper bound, and step are converted into the
  // type of the loop variable if necessary.
  mlir::Type loopVarType = getLoopVarType(converter, loopVarTypeSize);
  for (unsigned it = 0; it < (unsigned)result.loopLowerBounds.size(); it++) {
    result.loopLowerBounds[it] = firOpBuilder.createConvert(
        loc, loopVarType, result.loopLowerBounds[it]);
    result.loopUpperBounds[it] = firOpBuilder.createConvert(
        loc, loopVarType, result.loopUpperBounds[it]);
    result.loopSteps[it] =
        firOpBuilder.createConvert(loc, loopVarType, result.loopSteps[it]);
  }
}

// Helper function that finds the SIZES clause in an inner OMPD_tile directive
// and passes it to the callback function if found.
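//
// For example (illustrative source only; any equivalent nesting of a tile
// construct inside a loop construct behaves the same way):
//
//   !$omp do
//   !$omp tile sizes(2, 4)
//   do i = 1, n
//     do j = 1, m
//       ...
//
// Here the callback receives the SIZES clause holding the values 2 and 4.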
static void processTileSizesFromOpenMPConstruct(
    const parser::OpenMPConstruct *ompCons,
    std::function<void(const parser::OmpClause::Sizes *)> processFun) {
  if (!ompCons)
    return;
  if (auto *ompLoop{std::get_if<parser::OpenMPLoopConstruct>(&ompCons->u)}) {
    if (auto *innerConstruct = ompLoop->GetNestedConstruct()) {
      const parser::OmpDirectiveSpecification &innerBeginSpec =
          innerConstruct->BeginDir();
      if (innerBeginSpec.DirId() == llvm::omp::Directive::OMPD_tile) {
        // Get the size values from the parse tree and convert to a vector.
        for (const auto &clause : innerBeginSpec.Clauses().v) {
          if (const auto tclause{
                  std::get_if<parser::OmpClause::Sizes>(&clause.u)}) {
            processFun(tclause);
            break;
          }
        }
      }
    }
  }
}

pft::Evaluation *getNestedDoConstruct(pft::Evaluation &eval) {
  for (pft::Evaluation &nested : eval.getNestedEvaluations()) {
    // In an OpenMPConstruct there can be compiler directives:
    // 1 <<OpenMPConstruct>>
    // 2 CompilerDirective: !unroll
    //   <<DoConstruct>> -> 8
    if (nested.getIf<parser::CompilerDirective>())
      continue;
    // Within a DoConstruct, there can be compiler directives, plus
    // there is a DoStmt before the body:
    //   <<DoConstruct>> -> 8
    //   3 NonLabelDoStmt -> 7: do i = 1, n
    //     <<DoConstruct>> -> 7
    if (nested.getIf<parser::NonLabelDoStmt>())
      continue;
    assert(nested.getIf<parser::DoConstruct>() &&
           "Unexpected construct in the nested evaluations");
    return &nested;
  }
  llvm_unreachable("Expected do loop to be in the nested evaluations");
}

/// Populates the sizes vector with values if the given OpenMPConstruct
/// contains a loop construct with an inner tiling construct.
void collectTileSizesFromOpenMPConstruct(
    const parser::OpenMPConstruct *ompCons,
    llvm::SmallVectorImpl<int64_t> &tileSizes,
    Fortran::semantics::SemanticsContext &semaCtx) {
  processTileSizesFromOpenMPConstruct(
      ompCons, [&](const parser::OmpClause::Sizes *tclause) {
        for (auto &tval : tclause->v)
          if (const auto v{EvaluateInt64(semaCtx, tval)})
            tileSizes.push_back(*v);
      });
}

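/// Collects the lower/upper bounds, steps, and induction variables of the
/// loop nest associated with \p eval into \p result and \p iv, honouring the
/// COLLAPSE clause if present in \p clauses, and returns the number of
/// collapsed loops (1 when no COLLAPSE clause is given). For example, with
/// collapse(2) on a doubly nested DO loop, bounds for both loops are
/// gathered and 2 is returned.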
int64_t collectLoopRelatedInfo(
    lower::AbstractConverter &converter, mlir::Location currentLocation,
    lower::pft::Evaluation &eval, const omp::List<omp::Clause> &clauses,
    mlir::omp::LoopRelatedClauseOps &result,
    llvm::SmallVectorImpl<const semantics::Symbol *> &iv) {
  int64_t numCollapse = 1;

  // Collect the loops to collapse.
  lower::pft::Evaluation *doConstructEval = getNestedDoConstruct(eval);
  if (doConstructEval->getIf<parser::DoConstruct>()->IsDoConcurrent()) {
    TODO(currentLocation, "Do Concurrent in Worksharing loop construct");
  }

  std::int64_t collapseValue = 1l;
  if (auto *clause =
          ClauseFinder::findUniqueClause<omp::clause::Collapse>(clauses)) {
    collapseValue = evaluate::ToInt64(clause->v).value();
    numCollapse = collapseValue;
  }

  collectLoopRelatedInfo(converter, currentLocation, eval, numCollapse, result,
                         iv);
  return numCollapse;
}

void collectLoopRelatedInfo(
    lower::AbstractConverter &converter, mlir::Location currentLocation,
    lower::pft::Evaluation &eval, int64_t numCollapse,
    mlir::omp::LoopRelatedClauseOps &result,
    llvm::SmallVectorImpl<const semantics::Symbol *> &iv) {

  fir::FirOpBuilder &firOpBuilder = converter.getFirOpBuilder();

  // Collect the loops to collapse.
  lower::pft::Evaluation *doConstructEval = getNestedDoConstruct(eval);
  if (doConstructEval->getIf<parser::DoConstruct>()->IsDoConcurrent()) {
    TODO(currentLocation, "Do Concurrent in Worksharing loop construct");
  }

  // Collect sizes from the tile directive if present.
  std::int64_t sizesLengthValue = 0l;
  if (auto *ompCons{eval.getIf<parser::OpenMPConstruct>()}) {
    processTileSizesFromOpenMPConstruct(
        ompCons, [&](const parser::OmpClause::Sizes *tclause) {
          sizesLengthValue = tclause->v.size();
        });
  }

  std::int64_t collapseValue = std::max(numCollapse, sizesLengthValue);
  std::size_t loopVarTypeSize = 0;
  do {
    lower::pft::Evaluation *doLoop =
        &doConstructEval->getFirstNestedEvaluation();
    auto *doStmt = doLoop->getIf<parser::NonLabelDoStmt>();
    assert(doStmt && "Expected do loop to be in the nested evaluation");
    const auto &loopControl =
        std::get<std::optional<parser::LoopControl>>(doStmt->t);
    const parser::LoopControl::Bounds *bounds =
        std::get_if<parser::LoopControl::Bounds>(&loopControl->u);
    assert(bounds && "Expected bounds for worksharing do loop");
    lower::StatementContext stmtCtx;
    result.loopLowerBounds.push_back(fir::getBase(
        converter.genExprValue(*semantics::GetExpr(bounds->lower), stmtCtx)));
    result.loopUpperBounds.push_back(fir::getBase(
        converter.genExprValue(*semantics::GetExpr(bounds->upper), stmtCtx)));
    if (bounds->step) {
      result.loopSteps.push_back(fir::getBase(
          converter.genExprValue(*semantics::GetExpr(bounds->step), stmtCtx)));
    } else { // If `step` is not present, assume it to be `1`.
      result.loopSteps.push_back(firOpBuilder.createIntegerConstant(
          currentLocation, firOpBuilder.getIntegerType(32), 1));
    }
    iv.push_back(bounds->name.thing.symbol);
    loopVarTypeSize = std::max(loopVarTypeSize,
                               bounds->name.thing.symbol->GetUltimate().size());
    if (--collapseValue)
      doConstructEval = getNestedDoConstruct(*doConstructEval);
  } while (collapseValue > 0);

  convertLoopBounds(converter, currentLocation, result, loopVarTypeSize);
}

} // namespace omp
} // namespace lower
} // namespace Fortran