[flang-commits] [flang] [Flang][OpenMP]Support for lowering grainsize and num_tasks clause to… (PR #128490)
Kaviya Rajendiran via flang-commits
flang-commits at lists.llvm.org
Tue May 6 23:24:24 PDT 2025
https://github.com/kaviya2510 updated https://github.com/llvm/llvm-project/pull/128490
>From 2527a46c3b687a954dcb5b20c1c90add10796443 Mon Sep 17 00:00:00 2001
From: Kaviya Rajendiran <kaviyara2000 at gmail.com>
Date: Wed, 7 May 2025 11:53:51 +0530
Subject: [PATCH] [Flang][OpenMP] Support for lowering grainsize and num_tasks
clauses of taskloop construct to MLIR
---
flang/lib/Lower/OpenMP/ClauseProcessor.cpp | 42 +++++++++++++++
flang/lib/Lower/OpenMP/ClauseProcessor.h | 4 ++
flang/lib/Lower/OpenMP/OpenMP.cpp | 26 ++++-----
.../test/Lower/OpenMP/taskloop-grainsize.f90 | 51 ++++++++++++++++++
flang/test/Lower/OpenMP/taskloop-numtasks.f90 | 54 +++++++++++++++++++
5 files changed, 165 insertions(+), 12 deletions(-)
create mode 100644 flang/test/Lower/OpenMP/taskloop-grainsize.f90
create mode 100644 flang/test/Lower/OpenMP/taskloop-numtasks.f90
diff --git a/flang/lib/Lower/OpenMP/ClauseProcessor.cpp b/flang/lib/Lower/OpenMP/ClauseProcessor.cpp
index 77b4622547d7a..ac940b5c74152 100644
--- a/flang/lib/Lower/OpenMP/ClauseProcessor.cpp
+++ b/flang/lib/Lower/OpenMP/ClauseProcessor.cpp
@@ -365,6 +365,27 @@ bool ClauseProcessor::processHint(mlir::omp::HintClauseOps &result) const {
return false;
}
+/// Lowers the `grainsize` clause, if one is present in the clause list.
+///
+/// When the clause carries the `strict` prescriptiveness modifier,
+/// `result.grainsizeMod` is set to the `Strict` attribute. `result.grainsize`
+/// is set to the base value generated for the clause expression, evaluated in
+/// \p stmtCtx.
+///
+/// \param stmtCtx statement context used to generate the expression value.
+/// \param result  clause operands structure that receives the lowered values.
+/// \returns true if a grainsize clause was found and processed, false
+///          otherwise (in which case \p result is left untouched).
+bool ClauseProcessor::processGrainsize(
+    lower::StatementContext &stmtCtx,
+    mlir::omp::GrainsizeClauseOps &result) const {
+  using Grainsize = omp::clause::Grainsize;
+  if (auto *clause = findUniqueClause<Grainsize>()) {
+    fir::FirOpBuilder &firOpBuilder = converter.getFirOpBuilder();
+    mlir::MLIRContext *context = firOpBuilder.getContext();
+    const auto &modifier =
+        std::get<std::optional<Grainsize::Prescriptiveness>>(clause->t);
+    // Test the modifier's value, not merely its presence, so that any other
+    // prescriptiveness value is never silently lowered as `strict`.
+    if (modifier && *modifier == Grainsize::Prescriptiveness::Strict) {
+      result.grainsizeMod = mlir::omp::ClauseGrainsizeTypeAttr::get(
+          context, mlir::omp::ClauseGrainsizeType::Strict);
+    }
+    const auto &grainsizeExpr = std::get<omp::SomeExpr>(clause->t);
+    result.grainsize =
+        fir::getBase(converter.genExprValue(grainsizeExpr, stmtCtx));
+    return true;
+  }
+  return false;
+}
+
bool ClauseProcessor::processInclusive(
mlir::Location currentLocation,
mlir::omp::InclusiveClauseOps &result) const {
@@ -388,6 +409,27 @@ bool ClauseProcessor::processNowait(mlir::omp::NowaitClauseOps &result) const {
return markClauseOccurrence<omp::clause::Nowait>(result.nowait);
}
+/// Lowers the `num_tasks` clause, if one is present in the clause list.
+///
+/// When the clause carries the `strict` prescriptiveness modifier,
+/// `result.numTasksMod` is set to the `Strict` attribute. `result.numTasks`
+/// is set to the base value generated for the clause expression, evaluated in
+/// \p stmtCtx.
+///
+/// \param stmtCtx statement context used to generate the expression value.
+/// \param result  clause operands structure that receives the lowered values.
+/// \returns true if a num_tasks clause was found and processed, false
+///          otherwise (in which case \p result is left untouched).
+bool ClauseProcessor::processNumTasks(
+    lower::StatementContext &stmtCtx,
+    mlir::omp::NumTasksClauseOps &result) const {
+  using NumTasks = omp::clause::NumTasks;
+  if (auto *clause = findUniqueClause<NumTasks>()) {
+    fir::FirOpBuilder &firOpBuilder = converter.getFirOpBuilder();
+    mlir::MLIRContext *context = firOpBuilder.getContext();
+    const auto &modifier =
+        std::get<std::optional<NumTasks::Prescriptiveness>>(clause->t);
+    // Test the modifier's value, not merely its presence, so that any other
+    // prescriptiveness value is never silently lowered as `strict`.
+    if (modifier && *modifier == NumTasks::Prescriptiveness::Strict) {
+      result.numTasksMod = mlir::omp::ClauseNumTasksTypeAttr::get(
+          context, mlir::omp::ClauseNumTasksType::Strict);
+    }
+    const auto &numtasksExpr = std::get<omp::SomeExpr>(clause->t);
+    result.numTasks =
+        fir::getBase(converter.genExprValue(numtasksExpr, stmtCtx));
+    return true;
+  }
+  return false;
+}
+
bool ClauseProcessor::processNumTeams(
lower::StatementContext &stmtCtx,
mlir::omp::NumTeamsClauseOps &result) const {
diff --git a/flang/lib/Lower/OpenMP/ClauseProcessor.h b/flang/lib/Lower/OpenMP/ClauseProcessor.h
index bdddeb145b496..375e24b80fc21 100644
--- a/flang/lib/Lower/OpenMP/ClauseProcessor.h
+++ b/flang/lib/Lower/OpenMP/ClauseProcessor.h
@@ -78,10 +78,14 @@ class ClauseProcessor {
mlir::omp::HasDeviceAddrClauseOps &result,
llvm::SmallVectorImpl<const semantics::Symbol *> &hasDeviceSyms) const;
bool processHint(mlir::omp::HintClauseOps &result) const;
+ bool processGrainsize(lower::StatementContext &stmtCtx,
+ mlir::omp::GrainsizeClauseOps &result) const;
bool processInclusive(mlir::Location currentLocation,
mlir::omp::InclusiveClauseOps &result) const;
bool processMergeable(mlir::omp::MergeableClauseOps &result) const;
bool processNowait(mlir::omp::NowaitClauseOps &result) const;
+ bool processNumTasks(lower::StatementContext &stmtCtx,
+ mlir::omp::NumTasksClauseOps &result) const;
bool processNumTeams(lower::StatementContext &stmtCtx,
mlir::omp::NumTeamsClauseOps &result) const;
bool processNumThreads(lower::StatementContext &stmtCtx,
diff --git a/flang/lib/Lower/OpenMP/OpenMP.cpp b/flang/lib/Lower/OpenMP/OpenMP.cpp
index fcd3de9671098..af227b28d35b3 100644
--- a/flang/lib/Lower/OpenMP/OpenMP.cpp
+++ b/flang/lib/Lower/OpenMP/OpenMP.cpp
@@ -1806,17 +1806,19 @@ static void genTaskgroupClauses(lower::AbstractConverter &converter,
static void genTaskloopClauses(lower::AbstractConverter &converter,
semantics::SemanticsContext &semaCtx,
+ lower::StatementContext &stmtCtx,
const List<Clause> &clauses, mlir::Location loc,
mlir::omp::TaskloopOperands &clauseOps) {
ClauseProcessor cp(converter, semaCtx, clauses);
+ cp.processGrainsize(stmtCtx, clauseOps);
+ cp.processNumTasks(stmtCtx, clauseOps);
cp.processTODO<clause::Allocate, clause::Collapse, clause::Default,
- clause::Final, clause::Grainsize, clause::If,
- clause::InReduction, clause::Lastprivate, clause::Mergeable,
- clause::Nogroup, clause::NumTasks, clause::Priority,
- clause::Reduction, clause::Shared, clause::Untied>(
- loc, llvm::omp::Directive::OMPD_taskloop);
+ clause::Final, clause::If, clause::InReduction,
+ clause::Lastprivate, clause::Mergeable, clause::Nogroup,
+ clause::Priority, clause::Reduction, clause::Shared,
+ clause::Untied>(loc, llvm::omp::Directive::OMPD_taskloop);
}
static void genTaskwaitClauses(lower::AbstractConverter &converter,
@@ -3268,12 +3270,12 @@ genStandaloneSimd(lower::AbstractConverter &converter, lower::SymMap &symTable,
static mlir::omp::TaskloopOp genStandaloneTaskloop(
lower::AbstractConverter &converter, lower::SymMap &symTable,
- semantics::SemanticsContext &semaCtx, lower::pft::Evaluation &eval,
- mlir::Location loc, const ConstructQueue &queue,
- ConstructQueue::const_iterator item) {
+ lower::StatementContext &stmtCtx, semantics::SemanticsContext &semaCtx,
+ lower::pft::Evaluation &eval, mlir::Location loc,
+ const ConstructQueue &queue, ConstructQueue::const_iterator item) {
mlir::omp::TaskloopOperands taskloopClauseOps;
- genTaskloopClauses(converter, semaCtx, item->clauses, loc, taskloopClauseOps);
-
+ genTaskloopClauses(converter, semaCtx, stmtCtx, item->clauses, loc,
+ taskloopClauseOps);
DataSharingProcessor dsp(converter, semaCtx, item->clauses, eval,
/*shouldCollectPreDeterminedSymbols=*/true,
enableDelayedPrivatization, symTable);
@@ -3734,8 +3736,8 @@ static void genOMPDispatch(lower::AbstractConverter &converter,
genTaskgroupOp(converter, symTable, semaCtx, eval, loc, queue, item);
break;
case llvm::omp::Directive::OMPD_taskloop:
- newOp = genStandaloneTaskloop(converter, symTable, semaCtx, eval, loc,
- queue, item);
+ newOp = genStandaloneTaskloop(converter, symTable, stmtCtx, semaCtx, eval,
+ loc, queue, item);
break;
case llvm::omp::Directive::OMPD_taskwait:
newOp = genTaskwaitOp(converter, symTable, semaCtx, eval, loc, queue, item);
diff --git a/flang/test/Lower/OpenMP/taskloop-grainsize.f90 b/flang/test/Lower/OpenMP/taskloop-grainsize.f90
new file mode 100644
index 0000000000000..fa684ad213d0a
--- /dev/null
+++ b/flang/test/Lower/OpenMP/taskloop-grainsize.f90
@@ -0,0 +1,51 @@
+! This test checks lowering of the grainsize clause in the taskloop directive.
+
+! RUN: bbc -emit-hlfir -fopenmp -fopenmp-version=50 -o - %s 2>&1 | FileCheck %s
+! RUN: %flang_fc1 -emit-hlfir -fopenmp -fopenmp-version=50 -o - %s 2>&1 | FileCheck %s
+
+! CHECK-LABEL: omp.private
+! CHECK-SAME: {type = private} @[[I_PRIVATE_TEST2:.*]] : i32
+
+! CHECK-LABEL: omp.private
+! CHECK-SAME: {type = firstprivate} @[[X_FIRSTPRIVATE_TEST2:.*]] : i32
+! CHECK-SAME: copy {
+! CHECK: hlfir.assign
+
+! CHECK-LABEL: omp.private
+! CHECK-SAME: {type = private} @[[I_PRIVATE:.*]] : i32
+
+! CHECK-LABEL: omp.private
+! CHECK-SAME: {type = firstprivate} @[[X_FIRSTPRIVATE:.*]] : i32
+! CHECK-SAME: copy {
+! CHECK: hlfir.assign
+
+! CHECK-LABEL: func.func @_QPtest_grainsize
+! CHECK: %[[ALLOCA_I:.*]] = fir.alloca i32 {bindc_name = "i", uniq_name = "_QFtest_grainsizeEi"}
+! CHECK: %[[DECL_I:.*]]:2 = hlfir.declare %[[ALLOCA_I]] {uniq_name = "_QFtest_grainsizeEi"} : (!fir.ref<i32>) -> (!fir.ref<i32>, !fir.ref<i32>)
+! CHECK: %[[ALLOCA_X:.*]] = fir.alloca i32 {bindc_name = "x", uniq_name = "_QFtest_grainsizeEx"}
+! CHECK: %[[DECL_X:.*]]:2 = hlfir.declare %[[ALLOCA_X]] {uniq_name = "_QFtest_grainsizeEx"} : (!fir.ref<i32>) -> (!fir.ref<i32>, !fir.ref<i32>)
+! CHECK: %[[GRAINSIZE:.*]] = arith.constant 10 : i32
+! Taskloop with a plain (unmodified) grainsize(10) clause. The directives
+! inside expect the constant 10 as the grainsize operand of omp.taskloop,
+! followed by the privatizers for x and i and the wrapped omp.loop_nest.
+subroutine test_grainsize
+ integer :: i, x
+ ! CHECK: omp.taskloop grainsize(%[[GRAINSIZE]]: i32)
+ ! CHECK-SAME: private(@[[X_FIRSTPRIVATE]] %[[DECL_X]]#0 -> %[[ARG0:.*]], @[[I_PRIVATE]] %[[DECL_I]]#0 -> %[[ARG1:.*]] : !fir.ref<i32>, !fir.ref<i32>) {
+ ! CHECK: omp.loop_nest (%[[ARG2:.*]]) : i32 = (%{{.*}}) to (%{{.*}}) inclusive step (%{{.*}}) {
+ !$omp taskloop grainsize(10)
+ do i = 1, 1000
+ x = x + 1
+ end do
+ !$omp end taskloop
+end subroutine test_grainsize
+
+!CHECK-LABEL: func.func @_QPtest_grainsize_strict()
+! Taskloop with grainsize(strict:10). The directives inside expect the
+! `strict` modifier to be printed ahead of the grainsize operand, and an
+! arith.addi for the loop body's increment of x.
+subroutine test_grainsize_strict
+ integer :: i, x
+ ! CHECK: %[[GRAINSIZE:.*]] = arith.constant 10 : i32
+ ! CHECK: omp.taskloop grainsize(strict, %[[GRAINSIZE]]: i32)
+ !$omp taskloop grainsize(strict:10)
+ do i = 1, 1000
+ !CHECK: arith.addi
+ x = x + 1
+ end do
+ !$omp end taskloop
+end subroutine
\ No newline at end of file
diff --git a/flang/test/Lower/OpenMP/taskloop-numtasks.f90 b/flang/test/Lower/OpenMP/taskloop-numtasks.f90
new file mode 100644
index 0000000000000..38f3975bbd371
--- /dev/null
+++ b/flang/test/Lower/OpenMP/taskloop-numtasks.f90
@@ -0,0 +1,54 @@
+! This test checks lowering of the num_tasks clause in the taskloop directive.
+
+! RUN: bbc -emit-hlfir -fopenmp -fopenmp-version=50 -o - %s 2>&1 | FileCheck %s
+! RUN: %flang_fc1 -emit-hlfir -fopenmp -fopenmp-version=50 -o - %s 2>&1 | FileCheck %s
+
+! CHECK-LABEL: omp.private
+! CHECK-SAME: {type = private} @[[I_PRIVATE_TEST2:.*]] : i32
+
+! CHECK-LABEL: omp.private
+! CHECK-SAME: {type = firstprivate} @[[X_FIRSTPRIVATE_TEST2:.*]] : i32
+! CHECK-SAME: copy {
+! CHECK: hlfir.assign
+
+! CHECK-LABEL: omp.private
+! CHECK-SAME: {type = private} @[[I_PRIVATE:.*]] : i32
+
+! CHECK-LABEL: omp.private
+! CHECK-SAME: {type = firstprivate} @[[X_FIRSTPRIVATE:.*]] : i32
+! CHECK-SAME: copy {
+! CHECK: hlfir.assign
+
+! CHECK-LABEL: func.func @_QPtest_num_tasks
+! CHECK: %[[ALLOCA_I:.*]] = fir.alloca i32 {bindc_name = "i", uniq_name = "_QFtest_num_tasksEi"}
+! CHECK: %[[DECL_I:.*]]:2 = hlfir.declare %[[ALLOCA_I]] {uniq_name = "_QFtest_num_tasksEi"} : (!fir.ref<i32>) -> (!fir.ref<i32>, !fir.ref<i32>)
+! CHECK: %[[ALLOCA_X:.*]] = fir.alloca i32 {bindc_name = "x", uniq_name = "_QFtest_num_tasksEx"}
+! CHECK: %[[DECL_X:.*]]:2 = hlfir.declare %[[ALLOCA_X]] {uniq_name = "_QFtest_num_tasksEx"} : (!fir.ref<i32>) -> (!fir.ref<i32>, !fir.ref<i32>)
+! CHECK: %[[VAL_NUMTASKS:.*]] = arith.constant 10 : i32
+! Taskloop with a plain (unmodified) num_tasks(10) clause. The directives
+! inside expect the constant 10 as the num_tasks operand of omp.taskloop,
+! followed by the privatizers for x and i and the wrapped omp.loop_nest.
+subroutine test_num_tasks
+ integer :: i, x
+ ! CHECK: omp.taskloop num_tasks(%[[VAL_NUMTASKS]]: i32)
+ ! CHECK-SAME: private(@[[X_FIRSTPRIVATE]] %[[DECL_X]]#0 -> %[[ARG0:.*]], @[[I_PRIVATE]] %[[DECL_I]]#0 -> %[[ARG1:.*]] : !fir.ref<i32>, !fir.ref<i32>) {
+ ! CHECK: omp.loop_nest (%[[ARG2:.*]]) : i32 = (%{{.*}}) to (%{{.*}}) inclusive step (%{{.*}}) {
+ !$omp taskloop num_tasks(10)
+ do i = 1, 1000
+ x = x + 1
+ end do
+ !$omp end taskloop
+end subroutine test_num_tasks
+
+! CHECK-LABEL: func.func @_QPtest_num_tasks_strict
+! Taskloop with num_tasks(strict:10). The directives inside expect the
+! `strict` modifier to be printed ahead of the num_tasks operand, and an
+! arith.addi for the loop body's increment of x.
+subroutine test_num_tasks_strict
+ integer :: x, i
+ ! CHECK: %[[NUM_TASKS:.*]] = arith.constant 10 : i32
+ ! CHECK: omp.taskloop num_tasks(strict, %[[NUM_TASKS]]: i32)
+ !$omp taskloop num_tasks(strict:10)
+ do i = 1, 100
+ !CHECK: arith.addi
+ x = x + 1
+ end do
+ !$omp end taskloop
+end subroutine
+
+
+
More information about the flang-commits
mailing list