[flang-commits] [flang] 2feafd0 - [flang][hlfir] lower hlfir.sum into fir runtime call
Tom Eccles via flang-commits
flang-commits at lists.llvm.org
Mon Feb 13 02:52:18 PST 2023
Author: Tom Eccles
Date: 2023-02-13T10:50:11Z
New Revision: 2feafd059e9f569eaca02a1928109d9572c49e93
URL: https://github.com/llvm/llvm-project/commit/2feafd059e9f569eaca02a1928109d9572c49e93
DIFF: https://github.com/llvm/llvm-project/commit/2feafd059e9f569eaca02a1928109d9572c49e93.diff
LOG: [flang][hlfir] lower hlfir.sum into fir runtime call
This duplicates some argument lowering and return value processing from
flang/lib/Lower/ConvertCall.cpp. The existing code in CovertCall lowers
directly into the fir.call (without the hlfir transformational intrinsic
operation), and it is too tied to the lowering code to move into
flang/lib/Optimizer to allow for more complete re-use here.
Differential Revision: https://reviews.llvm.org/D143512
Added:
flang/test/HLFIR/sum-bufferization.fir
Modified:
flang/lib/Optimizer/HLFIR/Transforms/BufferizeHLFIR.cpp
Removed:
################################################################################
diff --git a/flang/lib/Optimizer/HLFIR/Transforms/BufferizeHLFIR.cpp b/flang/lib/Optimizer/HLFIR/Transforms/BufferizeHLFIR.cpp
index ad5c04a967586..2ada1225dabf5 100644
--- a/flang/lib/Optimizer/HLFIR/Transforms/BufferizeHLFIR.cpp
+++ b/flang/lib/Optimizer/HLFIR/Transforms/BufferizeHLFIR.cpp
@@ -15,6 +15,7 @@
#include "flang/Optimizer/Builder/Character.h"
#include "flang/Optimizer/Builder/FIRBuilder.h"
#include "flang/Optimizer/Builder/HLFIRTools.h"
+#include "flang/Optimizer/Builder/IntrinsicCall.h"
#include "flang/Optimizer/Builder/MutableBox.h"
#include "flang/Optimizer/Builder/Runtime/Assign.h"
#include "flang/Optimizer/Builder/Todo.h"
@@ -498,6 +499,155 @@ struct ElementalOpConversion
}
};
+/// Base class for passes converting transformational intrinsic operations into
+/// runtime calls
+template <class OP>
+class HlfirIntrinsicConversion : public mlir::OpConversionPattern<OP> {
+ using mlir::OpConversionPattern<OP>::OpConversionPattern;
+
+protected:
+ struct IntrinsicArgument {
+ mlir::Value val; // allowed to be null if the argument is absent
+ mlir::Type desiredType;
+ };
+
+ /// Lower the arguments to the intrinsic: adding nesecarry boxing and
+ /// conversion to match the signature of the intrinsic in the runtime library.
+ llvm::SmallVector<fir::ExtendedValue, 3>
+ lowerArguments(mlir::Operation *op,
+ const llvm::ArrayRef<IntrinsicArgument> &args,
+ mlir::ConversionPatternRewriter &rewriter,
+ const fir::IntrinsicArgumentLoweringRules *argLowering) const {
+ assert(args.size() == 3 && "Transformational intrinsics have 3 args");
+ mlir::Location loc = op->getLoc();
+ fir::KindMapping kindMapping{rewriter.getContext()};
+ fir::FirOpBuilder builder{rewriter, kindMapping};
+
+ llvm::SmallVector<fir::ExtendedValue, 3> ret;
+
+ for (size_t i = 0; i < args.size(); ++i) {
+ mlir::Value arg = args[i].val;
+ mlir::Type desiredType = args[i].desiredType;
+ if (!arg) {
+ ret.emplace_back(fir::getAbsentIntrinsicArgument());
+ continue;
+ }
+ hlfir::Entity entity{arg};
+
+ fir::ArgLoweringRule argRules =
+ fir::lowerIntrinsicArgumentAs(*argLowering, i);
+ switch (argRules.lowerAs) {
+ case fir::LowerIntrinsicArgAs::Value: {
+ if (args[i].desiredType != arg.getType()) {
+ arg = builder.createConvert(loc, desiredType, arg);
+ entity = hlfir::Entity{arg};
+ }
+ auto [exv, cleanup] = hlfir::convertToValue(loc, builder, entity);
+ if (cleanup)
+ TODO(loc, "extended value cleanup");
+ ret.emplace_back(exv);
+ } break;
+ case fir::LowerIntrinsicArgAs::Addr: {
+ auto [exv, cleanup] =
+ hlfir::convertToAddress(loc, builder, entity, desiredType);
+ if (cleanup)
+ TODO(loc, "extended value cleanup");
+ ret.emplace_back(exv);
+ } break;
+ case fir::LowerIntrinsicArgAs::Box: {
+ auto [box, cleanup] =
+ hlfir::convertToBox(loc, builder, entity, desiredType);
+ if (cleanup)
+ TODO(loc, "extended value cleanup");
+ ret.emplace_back(box);
+ } break;
+ case fir::LowerIntrinsicArgAs::Inquired: {
+ if (args[i].desiredType != arg.getType()) {
+ arg = builder.createConvert(loc, desiredType, arg);
+ entity = hlfir::Entity{arg};
+ }
+ // Place hlfir.expr in memory, and unbox fir.boxchar. Other entities
+ // are translated to fir::ExtendedValue without transofrmation (notably,
+ // pointers/allocatable are not dereferenced).
+ // TODO: once lowering to FIR retires, UBOUND and LBOUND can be
+ // simplified since the fir.box lowered here are now guarenteed to
+ // contain the local lower bounds thanks to the hlfir.declare (the extra
+ // rebox can be removed).
+ auto [exv, cleanup] =
+ hlfir::translateToExtendedValue(loc, builder, entity);
+ if (cleanup)
+ TODO(loc, "extended value cleanup");
+ ret.emplace_back(exv);
+ } break;
+ }
+ }
+
+ return ret;
+ }
+
+ void processReturnValue(mlir::Operation *op,
+ const fir::ExtendedValue &resultExv, bool mustBeFreed,
+ fir::FirOpBuilder &builder,
+ mlir::PatternRewriter &rewriter) const {
+ mlir::Location loc = op->getLoc();
+
+ mlir::Value firBase = fir::getBase(resultExv);
+ mlir::Type firBaseTy = firBase.getType();
+
+ std::optional<hlfir::EntityWithAttributes> resultEntity;
+ if (fir::isa_trivial(firBaseTy)) {
+ resultEntity = hlfir::EntityWithAttributes{firBase};
+ } else {
+ resultEntity =
+ hlfir::genDeclare(loc, builder, resultExv, ".tmp.intrinsic_result",
+ fir::FortranVariableFlagsAttr{});
+ }
+
+ if (resultEntity->isVariable()) {
+ hlfir::AsExprOp asExpr = builder.create<hlfir::AsExprOp>(
+ loc, *resultEntity, builder.createBool(loc, mustBeFreed));
+ resultEntity = hlfir::EntityWithAttributes{asExpr.getResult()};
+ }
+
+ rewriter.replaceOp(op, resultEntity->getBase());
+ }
+};
+
+struct SumOpConversion : public HlfirIntrinsicConversion<hlfir::SumOp> {
+ using HlfirIntrinsicConversion<hlfir::SumOp>::HlfirIntrinsicConversion;
+
+ mlir::LogicalResult
+ matchAndRewrite(hlfir::SumOp sum, OpAdaptor adaptor,
+ mlir::ConversionPatternRewriter &rewriter) const override {
+ fir::KindMapping kindMapping{rewriter.getContext()};
+ fir::FirOpBuilder builder{rewriter, kindMapping};
+ const mlir::Location &loc = sum->getLoc();
+ HLFIRListener listener{builder, rewriter};
+ builder.setListener(&listener);
+
+ mlir::Type i32 = builder.getI32Type();
+ mlir::Type logicalType = fir::LogicalType::get(
+ builder.getContext(), builder.getKindMap().defaultLogicalKind());
+
+ llvm::SmallVector<IntrinsicArgument, 3> inArgs;
+ inArgs.push_back({sum.getArray(), sum.getArray().getType()});
+ inArgs.push_back({sum.getDim(), i32});
+ inArgs.push_back({sum.getMask(), logicalType});
+
+ auto *argLowering = fir::getIntrinsicArgumentLowering("sum");
+ llvm::SmallVector<fir::ExtendedValue, 3> args =
+ lowerArguments(sum, inArgs, rewriter, argLowering);
+
+ mlir::Type scalarResultType = hlfir::getFortranElementType(sum.getType());
+
+ auto [resultExv, mustBeFreed] =
+ fir::genIntrinsicCall(builder, loc, "sum", scalarResultType, args);
+
+ processReturnValue(sum, resultExv, mustBeFreed, builder, rewriter);
+ return mlir::success();
+ }
+};
+
class BufferizeHLFIR : public hlfir::impl::BufferizeHLFIRBase<BufferizeHLFIR> {
public:
void runOnOperation() override {
@@ -515,7 +665,8 @@ class BufferizeHLFIR : public hlfir::impl::BufferizeHLFIRBase<BufferizeHLFIR> {
.insert<ApplyOpConversion, AsExprOpConversion, AssignOpConversion,
AssociateOpConversion, ConcatOpConversion, DestroyOpConversion,
ElementalOpConversion, EndAssociateOpConversion,
- NoReassocOpConversion, SetLengthOpConversion>(context);
+ NoReassocOpConversion, SetLengthOpConversion, SumOpConversion>(
+ context);
mlir::ConversionTarget target(*context);
target.addIllegalOp<hlfir::ApplyOp, hlfir::AssociateOp, hlfir::ElementalOp,
hlfir::EndAssociateOp, hlfir::SetLengthOp,
diff --git a/flang/test/HLFIR/sum-bufferization.fir b/flang/test/HLFIR/sum-bufferization.fir
new file mode 100644
index 0000000000000..d1bdd9fbd67a1
--- /dev/null
+++ b/flang/test/HLFIR/sum-bufferization.fir
@@ -0,0 +1,182 @@
+// Test hlfir.sum operation lowering to fir runtime call
+// RUN: fir-opt %s -bufferize-hlfir | FileCheck %s
+
+// simple one argument sum
+func.func @_QPsum1(%arg0: !fir.box<!fir.array<?xi32>> {fir.bindc_name = "a"}, %arg1: !fir.ref<i32> {fir.bindc_name = "s"}) {
+ %0:2 = hlfir.declare %arg0 {uniq_name = "_QFsum1Ea"} : (!fir.box<!fir.array<?xi32>>) -> (!fir.box<!fir.array<?xi32>>, !fir.box<!fir.array<?xi32>>)
+ %1:2 = hlfir.declare %arg1 {uniq_name = "_QFsum1Es"} : (!fir.ref<i32>) -> (!fir.ref<i32>, !fir.ref<i32>)
+ %2 = hlfir.sum %0#0 {fastmath = #arith.fastmath<contract>} : (!fir.box<!fir.array<?xi32>>) -> !hlfir.expr<i32>
+ hlfir.assign %2 to %1#0 : !hlfir.expr<i32>, !fir.ref<i32>
+ hlfir.destroy %2 : !hlfir.expr<i32>
+ return
+}
+// CHECK-LABEL: func.func @_QPsum1(
+// CHECK: %[[ARG0:.*]]: !fir.box<!fir.array<?xi32>>
+// CHECK: %[[ARG1:.*]]: !fir.ref<i32>
+// CHECK-DAG: %[[ARRAY:.*]]:2 = hlfir.declare %[[ARG0]]
+// CHECK-DAG: %[[RES:.*]]:2 = hlfir.declare %[[ARG1]]
+// CHECK-DAG: %[[MASK:.*]] = fir.absent !fir.box<i1>
+// CHECK-DAG: %[[ARRAY_ARG:.*]] = fir.convert %[[ARRAY]]#1 : (!fir.box<!fir.array<?xi32>>) -> !fir.box<none>
+// CHECK-DAG: %[[MASK_ARG:.*]] = fir.convert %[[MASK]] : (!fir.box<i1>) -> !fir.box<none>
+// CHECK: %[[RET:.*]] = fir.call @_FortranASumInteger4(%[[ARRAY_ARG]], %[[LOC_STR:.*]], %[[LOC_N:.*]], %[[INT:.*]], %[[MASK_ARG]]) : (!fir.box<none>, !fir.ref<i8>, i32, i32, !fir.box<none>) -> i32
+// CHECK-NEXT: hlfir.assign %[[RET]] to %[[RES]]#0 : i32, !fir.ref<i32>
+// CHECK-NEXT: return
+// CHECK-NEXT: }
+
+// sum with a by-ref dimension of index type
+func.func @_QPsum2(%arg0: !fir.box<!fir.array<?x?xi32>> {fir.bindc_name = "a"}, %arg1: !fir.box<!fir.array<?xi32>> {fir.bindc_name = "s"}, %arg2: !fir.ref<index> {fir.bindc_name = "d"}) {
+ %0:2 = hlfir.declare %arg0 {uniq_name = "_QFsum2Ea"} : (!fir.box<!fir.array<?x?xi32>>) -> (!fir.box<!fir.array<?x?xi32>>, !fir.box<!fir.array<?x?xi32>>)
+ %1:2 = hlfir.declare %arg2 {uniq_name = "_QFsum2Ed"} : (!fir.ref<index>) -> (!fir.ref<index>, !fir.ref<index>)
+ %2:2 = hlfir.declare %arg1 {uniq_name = "_QFsum2Es"} : (!fir.box<!fir.array<?xi32>>) -> (!fir.box<!fir.array<?xi32>>, !fir.box<!fir.array<?xi32>>)
+ %3 = fir.load %1#0 : !fir.ref<index>
+ %4 = hlfir.sum %0#0 dim %3#0 {fastmath = #arith.fastmath<contract>} : (!fir.box<!fir.array<?x?xi32>>, index) -> !hlfir.expr<?xi32>
+ hlfir.assign %4 to %2#0 : !hlfir.expr<?xi32>, !fir.box<!fir.array<?xi32>>
+ hlfir.destroy %4 : !hlfir.expr<?xi32>
+ return
+}
+// CHECK-LABEL: func.func @_QPsum2(
+// CHECK: %[[ARG0:.*]]: !fir.box<!fir.array<?x?xi32>>
+// CHECK: %[[ARG1:.*]]: !fir.box<!fir.array<?xi32>>
+// CHECK: %[[ARG2:.*]]: !fir.ref<index>
+// CHECK-DAG: %[[ARRAY:.*]]:2 = hlfir.declare %[[ARG0]]
+// CHECK-DAG: %[[RES:.*]]:2 = hlfir.declare %[[ARG1]]
+// CHECK-DAG: %[[DIM_VAR:.*]]:2 = hlfir.declare %[[ARG2]]
+
+// CHECK-DAG: %[[RET_BOX:.*]] = fir.alloca !fir.box<!fir.heap<!fir.array<?xi32>>>
+// CHECK-DAG: %[[RET_ADDR:.*]] = fir.zero_bits !fir.heap<!fir.array<?xi32>>
+// CHECK-DAG: %[[C0:.*]] = arith.constant 0 : index
+// CHECK-DAG: %[[RET_SHAPE:.*]] = fir.shape %[[C0]] : (index) -> !fir.shape<1>
+// CHECK-DAG: %[[RET_EMBOX:.*]] = fir.embox %[[RET_ADDR]](%[[RET_SHAPE]])
+// CHECK-DAG: fir.store %[[RET_EMBOX]] to %[[RET_BOX]]
+
+// CHECK-DAG: %[[MASK:.*]] = fir.absent !fir.box<i1>
+// CHECK-DAG: %[[DIM_IDX:.*]] = fir.load %[[DIM_VAR]]#0 : !fir.ref<index>
+// CHECK-DAG: %[[DIM:.*]] = fir.convert %[[DIM_IDX]] : (index) -> i32
+
+// CHECK-DAG: %[[RET_ARG:.*]] = fir.convert %[[RET_BOX]]
+// CHECK-DAG: %[[ARRAY_ARG:.*]] = fir.convert %[[ARRAY]]#1 : (!fir.box<!fir.array<?x?xi32>>) -> !fir.box<none>
+// CHECK-DAG: %[[MASK_ARG:.*]] = fir.convert %[[MASK]] : (!fir.box<i1>) -> !fir.box<none>
+// CHECK: %[[NONE:.*]] = fir.call @_FortranASumDim(%[[RET_ARG]], %[[ARRAY_ARG]], %[[DIM]], %[[LOC_STR:.*]], %[[LOC_N:.*]], %[[MASK_ARG]]) : (!fir.ref<!fir.box<none>>, !fir.box<none>, i32, !fir.ref<i8>, i32, !fir.box<none>) -> none
+
+// CHECK: %[[RET:.*]] = fir.load %[[RET_BOX]]
+// CHECK: %[[BOX_DIMS:.*]]:3 = fir.box_dims %[[RET]]
+// CHECK-NEXT: %[[ADDR:.*]] = fir.box_addr %[[RET]]
+// CHECK-NEXT: %[[SHIFT:.*]] = fir.shape_shift %[[BOX_DIMS]]#0, %[[BOX_DIMS]]#1
+// TODO: fix alias analysis in hlfir.assign bufferization
+// CHECK-NEXT: %[[TMP:.*]]:2 = hlfir.declare %[[ADDR]](%[[SHIFT]]) {uniq_name = ".tmp.intrinsic_result"}
+// CHECK: %[[TUPLE0:.*]] = fir.undefined tuple<!fir.box<!fir.array<?xi32>>, i1>
+// CHECK: %[[TUPLE1:.*]] = fir.insert_value %[[TUPLE0]], %[[TRUE:.*]], [1 : index]
+// CHECK: %[[TUPLE2:.*]] fir.insert_value %[[TUPLE1]], %[[TMP]]#0, [0 : index]
+// CHECK: hlfir.assign %[[TMP]]#0 to %[[RES]]#0
+// CHECK: fir.freemem %[[TMP]]#1
+// CHECK-NEXT: return
+// CHECK-NEXT: }
+
+// sum with scalar mask
+func.func @_QPsum3(%arg0: !fir.box<!fir.array<?xi32>> {fir.bindc_name = "a"}, %arg1: !fir.ref<i32> {fir.bindc_name = "s"}, %arg2: !fir.ref<!fir.logical<4>> {fir.bindc_name = "m"}) {
+ %0:2 = hlfir.declare %arg0 {uniq_name = "_QFsum3Ea"} : (!fir.box<!fir.array<?xi32>>) -> (!fir.box<!fir.array<?xi32>>, !fir.box<!fir.array<?xi32>>)
+ %1:2 = hlfir.declare %arg2 {uniq_name = "_QFsum3Em"} : (!fir.ref<!fir.logical<4>>) -> (!fir.ref<!fir.logical<4>>, !fir.ref<!fir.logical<4>>)
+ %2:2 = hlfir.declare %arg1 {uniq_name = "_QFsum3Es"} : (!fir.ref<i32>) -> (!fir.ref<i32>, !fir.ref<i32>)
+ %3 = hlfir.sum %0#0 mask %1#0 {fastmath = #arith.fastmath<contract>} : (!fir.box<!fir.array<?xi32>>, !fir.ref<!fir.logical<4>>) -> !hlfir.expr<i32>
+ hlfir.assign %3 to %2#0 : !hlfir.expr<i32>, !fir.ref<i32>
+ hlfir.destroy %3 : !hlfir.expr<i32>
+ return
+}
+// CHECK-LABEL: func.func @_QPsum3(
+// CHECK: %[[ARG0:.*]]: !fir.box<!fir.array<?xi32>>
+// CHECK: %[[ARG1:.*]]: !fir.ref<i32>
+// CHECK: %[[ARG2:.*]]: !fir.ref<!fir.logical<4>>
+// CHECK-DAG: %[[ARRAY:.*]]:2 = hlfir.declare %[[ARG0]]
+// CHECK-DAG: %[[RES:.*]]:2 = hlfir.declare %[[ARG1]]
+// CHECK-DAG: %[[MASK:.*]]:2 = hlfir.declare %[[ARG2]]
+// CHECK-DAG: %[[MASK_BOX:.*]] = fir.embox %[[MASK]]#1 : (!fir.ref<!fir.logical<4>>) -> !fir.box<!fir.logical<4>>
+// CHECK-DAG: %[[ARRAY_ARG:.*]] = fir.convert %[[ARRAY]]#1 : (!fir.box<!fir.array<?xi32>>) -> !fir.box<none>
+// CHECK-DAG: %[[MASK_ARG:.*]] = fir.convert %[[MASK_BOX]] : (!fir.box<!fir.logical<4>>) -> !fir.box<none>
+// CHECK: %[[RET:.*]] = fir.call @_FortranASumInteger4(%[[ARRAY_ARG]], %[[LOC_STR:.*]], %[[LOC_N:.*]], %[[INT:.*]], %[[MASK_ARG]]) : (!fir.box<none>, !fir.ref<i8>, i32, i32, !fir.box<none>) -> i32
+// CHECK-NEXT: hlfir.assign %[[RET]] to %[[RES]]#0 : i32, !fir.ref<i32>
+// CHECK-NEXT: return
+// CHECK-NEXT: }
+
+// sum with array mask
+func.func @_QPsum4(%arg0: !fir.box<!fir.array<?xi32>> {fir.bindc_name = "a"}, %arg1: !fir.ref<i32> {fir.bindc_name = "s"}, %arg2: !fir.box<!fir.array<?x!fir.logical<4>>> {fir.bindc_name = "m"}) {
+ %0:2 = hlfir.declare %arg0 {uniq_name = "_QFsum4Ea"} : (!fir.box<!fir.array<?xi32>>) -> (!fir.box<!fir.array<?xi32>>, !fir.box<!fir.array<?xi32>>)
+ %1:2 = hlfir.declare %arg2 {uniq_name = "_QFsum4Em"} : (!fir.box<!fir.array<?x!fir.logical<4>>>) -> (!fir.box<!fir.array<?x!fir.logical<4>>>, !fir.box<!fir.array<?x!fir.logical<4>>>)
+ %2:2 = hlfir.declare %arg1 {uniq_name = "_QFsum4Es"} : (!fir.ref<i32>) -> (!fir.ref<i32>, !fir.ref<i32>)
+ %3 = hlfir.sum %0#0 mask %1#0 {fastmath = #arith.fastmath<contract>} : (!fir.box<!fir.array<?xi32>>, !fir.box<!fir.array<?x!fir.logical<4>>>) -> !hlfir.expr<i32>
+ hlfir.assign %3 to %2#0 : !hlfir.expr<i32>, !fir.ref<i32>
+ hlfir.destroy %3 : !hlfir.expr<i32>
+ return
+}
+// CHECK-LABEL: func.func @_QPsum4(
+// CHECK: %[[ARG0:.*]]: !fir.box<!fir.array<?xi32>>
+// CHECK: %[[ARG1:.*]]: !fir.ref<i32>
+// CHECK: %[[ARG2:.*]]: !fir.box<!fir.array<?x!fir.logical<4>>>
+// CHECK-DAG: %[[ARRAY:.*]]:2 = hlfir.declare %[[ARG0]]
+// CHECK-DAG: %[[RES:.*]]:2 = hlfir.declare %[[ARG1]]
+// CHECK-DAG: %[[MASK:.*]]:2 = hlfir.declare %[[ARG2]]
+// CHECK-DAG: %[[ARRAY_ARG:.*]] = fir.convert %[[ARRAY]]#1 : (!fir.box<!fir.array<?xi32>>) -> !fir.box<none>
+// CHECK-DAG: %[[MASK_ARG:.*]] = fir.convert %[[MASK]]#1 : (!fir.box<!fir.array<?x!fir.logical<4>>>) -> !fir.box<none>
+// CHECK: %[[RET:.*]] = fir.call @_FortranASumInteger4(%[[ARRAY_ARG]], %[[LOC_STR:.*]], %[[LOC_N:.*]], %[[INT:.*]], %[[MASK_ARG]]) : (!fir.box<none>, !fir.ref<i8>, i32, i32, !fir.box<none>) -> i32
+// CHECK-NEXT: hlfir.assign %[[RET]] to %[[RES]]#0 : i32, !fir.ref<i32>
+// CHECK-NEXT: return
+// CHECK-NEXT: }
+
+fir.global internal @_QFsum5Ea : !fir.array<2x2xi32> {
+ %0 = fir.undefined !fir.array<2x2xi32>
+ %c1_i32 = arith.constant 1 : i32
+ %1 = fir.insert_value %0, %c1_i32, [0 : index, 0 : index] : (!fir.array<2x2xi32>, i32) -> !fir.array<2x2xi32>
+ %c2_i32 = arith.constant 2 : i32
+ %2 = fir.insert_value %1, %c2_i32, [1 : index, 0 : index] : (!fir.array<2x2xi32>, i32) -> !fir.array<2x2xi32>
+ %c3_i32 = arith.constant 3 : i32
+ %3 = fir.insert_value %2, %c3_i32, [0 : index, 1 : index] : (!fir.array<2x2xi32>, i32) -> !fir.array<2x2xi32>
+ %c4_i32 = arith.constant 4 : i32
+ %4 = fir.insert_value %3, %c4_i32, [1 : index, 1 : index] : (!fir.array<2x2xi32>, i32) -> !fir.array<2x2xi32>
+ %c2 = arith.constant 2 : index
+ %c2_0 = arith.constant 2 : index
+ fir.has_value %4 : !fir.array<2x2xi32>
+}
+
+// 3 argument sum, using local variables
+func.func @_QPsum5(%arg0: !fir.ref<!fir.array<2xi32>> {fir.bindc_name = "s"}) {
+ %0 = fir.address_of(@_QFsum5Ea) : !fir.ref<!fir.array<2x2xi32>>
+ %c2 = arith.constant 2 : index
+ %c2_0 = arith.constant 2 : index
+ %1 = fir.shape %c2, %c2_0 : (index, index) -> !fir.shape<2>
+ %2:2 = hlfir.declare %0(%1) {uniq_name = "_QFsum5Ea"} : (!fir.ref<!fir.array<2x2xi32>>, !fir.shape<2>) -> (!fir.ref<!fir.array<2x2xi32>>, !fir.ref<!fir.array<2x2xi32>>)
+ %c2_1 = arith.constant 2 : index
+ %3 = fir.shape %c2_1 : (index) -> !fir.shape<1>
+ %4:2 = hlfir.declare %arg0(%3) {uniq_name = "_QFsum5Es"} : (!fir.ref<!fir.array<2xi32>>, !fir.shape<1>) -> (!fir.ref<!fir.array<2xi32>>, !fir.ref<!fir.array<2xi32>>)
+ %c1_i32 = arith.constant 1 : i32
+ %true = arith.constant true
+ %5 = hlfir.sum %2#0 dim %c1_i32 mask %true {fastmath = #arith.fastmath<contract>} : (!fir.ref<!fir.array<2x2xi32>>, i32, i1) -> !hlfir.expr<2xi32>
+ hlfir.assign %5 to %4#0 : !hlfir.expr<2xi32>, !fir.ref<!fir.array<2xi32>>
+ hlfir.destroy %5 : !hlfir.expr<2xi32>
+ return
+}
+// CHECK-LABEL: func.func @_QPsum5(
+// CHECK: %[[ARG0:.*]]: !fir.ref<!fir.array<2xi32>>
+// CHECK-DAG: %[[RET_BOX:.*]] = fir.alloca !fir.box<!fir.heap<!fir.array<?xi32>>>
+// CHECK-DAG: %[[RET_ADDR:.*]] = fir.zero_bits !fir.heap<!fir.array<?xi32>>
+// CHECK-DAG: %[[C0:.*]] = arith.constant 0 : index
+// CHECK-DAG: %[[RET_SHAPE:.*]] = fir.shape %[[C0]] : (index) -> !fir.shape<1>
+// CHECK-DAG: %[[RET_EMBOX:.*]] = fir.embox %[[RET_ADDR]](%[[RET_SHAPE]])
+// CHECK-DAG: fir.store %[[RET_EMBOX]] to %[[RET_BOX]]
+
+// CHECK-DAG: %[[RES_VAR:.*]] = hlfir.declare %[[ARG0]](%[[RES_SHAPE:.*]])
+
+// CHECK-DAG: %[[MASK_ALLOC:.*]] = fir.alloca !fir.logical<4>
+// CHECK-DAG: %[[TRUE:.*]] = arith.constant true
+// CHECK-DAG: %[[MASK_VAL:.*]] = fir.convert %[[TRUE]] : (i1) -> !fir.logical<4>
+// CHECK-DAG: fir.store %[[MASK_VAL]] to %[[MASK_ALLOC]] : !fir.ref<!fir.logical<4>>
+// CHECK-DAG: %[[MASK_BOX:.*]] = fir.embox %[[MASK_ALLOC]]
+
+// CHECK-DAG: %[[ARRAY_ADDR:.*]] = fir.address_of
+// CHECK-DAG: %[[ARRAY_VAR:.*]]:2 = hlfir.declare %[[ARRAY_ADDR]](%[[ARRAY_SHAPE:.*]])
+// CHECK-DAG: %[[ARRAY_BOX:.*]] = fir.embox %[[ARRAY_VAR]]#1(%[[ARRAY_SHAPE:.*]])
+
+// CHECK-DAG: %[[DIM:.*]] = arith.constant 1 : i32
+
+// CHECK-DAG: %[[RET_ARG:.*]] = fir.convert %[[RET_BOX]]
+// CHECK-DAG: %[[ARRAY_ARG:.*]] = fir.convert %[[ARRAY_BOX]] : (!fir.box<!fir.array<2x2xi32>>) -> !fir.box<none>
+// CHECK-DAG: %[[MASK_ARG:.*]] = fir.convert %[[MASK_BOX]] : (!fir.box<!fir.logical<4>>) -> !fir.box<none>
+// CHECK: %[[NONE:.*]] = fir.call @_FortranASumDim(%[[RET_ARG]], %[[ARRAY_ARG]], %[[DIM]], %[[LOC_STR:.*]], %[[LOC_N:.*]], %[[MASK_ARG]]) : (!fir.ref<!fir.box<none>>, !fir.box<none>, i32, !fir.ref<i8>, i32, !fir.box<none>) -> none
More information about the flang-commits
mailing list