Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

[Flang][OpenMP]Support for lowering grainsize and num_tasks clause to… #128490

Draft
wants to merge 1 commit into
base: main
Choose a base branch
from

Conversation

kaviya2510
Copy link
Contributor

… MLIR.

Added MLIR lowering to taskloop construct.
Added MLIR lowering for grainsize and num_tasks clauses of taskloop construct.

Depends on #128477

@llvmbot llvmbot added flang Flang issues not falling into any other category flang:fir-hlfir flang:openmp labels Feb 24, 2025
@kaviya2510 kaviya2510 marked this pull request as draft February 24, 2025 11:06
@llvmbot
Copy link
Member

llvmbot commented Feb 24, 2025

@llvm/pr-subscribers-flang-fir-hlfir

@llvm/pr-subscribers-flang-openmp

Author: Kaviya Rajendiran (kaviya2510)

Changes

… MLIR.

Added MLIR lowering to taskloop construct.
Added MLIR lowering for grainsize and num_tasks clauses of taskloop construct.

Depends on #128477


Full diff: https://github.com/llvm/llvm-project/pull/128490.diff

8 Files Affected:

  • (modified) flang/lib/Lower/OpenMP/ClauseProcessor.cpp (+42)
  • (modified) flang/lib/Lower/OpenMP/ClauseProcessor.h (+4)
  • (modified) flang/lib/Lower/OpenMP/OpenMP.cpp (+38-1)
  • (removed) flang/test/Lower/OpenMP/Todo/taskloop.f90 (-13)
  • (added) flang/test/Lower/OpenMP/masked_taskloop.f90 (+49)
  • (removed) flang/test/Lower/OpenMP/master_taskloop.f90 (-14)
  • (modified) flang/test/Lower/OpenMP/parallel-master-taskloop.f90 (+39-6)
  • (added) flang/test/Lower/OpenMP/taskloop.f90 (+87)
diff --git a/flang/lib/Lower/OpenMP/ClauseProcessor.cpp b/flang/lib/Lower/OpenMP/ClauseProcessor.cpp
index e21d299570b86..9fbc5e0d5ac61 100644
--- a/flang/lib/Lower/OpenMP/ClauseProcessor.cpp
+++ b/flang/lib/Lower/OpenMP/ClauseProcessor.cpp
@@ -912,6 +912,27 @@ bool ClauseProcessor::processDepend(mlir::omp::DependClauseOps &result) const {
   return findRepeatableClause<omp::clause::Depend>(process);
 }
 
+bool ClauseProcessor::processGrainsize(
+    lower::StatementContext &stmtCtx,
+    mlir::omp::GrainsizeClauseOps &result) const {
+  using grainsize = omp::clause::Grainsize;
+  if (auto *clause = findUniqueClause<grainsize>()) {
+    fir::FirOpBuilder &firOpBuilder = converter.getFirOpBuilder();
+    mlir::MLIRContext *context = firOpBuilder.getContext();
+    const auto &modifier =
+        std::get<std::optional<grainsize::Prescriptiveness>>(clause->t);
+    if (modifier) {
+      result.grainsizeMod = mlir::omp::ClauseGrainsizeTypeAttr::get(
+          context, mlir::omp::ClauseGrainsizeType::Strict);
+    }
+    const auto &grainsizeExpr = std::get<omp::SomeExpr>(clause->t);
+    result.grainsize =
+        fir::getBase(converter.genExprValue(grainsizeExpr, stmtCtx));
+    return true;
+  }
+  return false;
+}
+
 bool ClauseProcessor::processHasDeviceAddr(
     mlir::omp::HasDeviceAddrClauseOps &result,
     llvm::SmallVectorImpl<const semantics::Symbol *> &isDeviceSyms) const {
@@ -1176,6 +1197,27 @@ bool ClauseProcessor::processNontemporal(
       });
 }
 
+bool ClauseProcessor::processNumTasks(
+    lower::StatementContext &stmtCtx,
+    mlir::omp::NumTasksClauseOps &result) const {
+  using numtasks = omp::clause::NumTasks;
+  if (auto *clause = findUniqueClause<numtasks>()) {
+    fir::FirOpBuilder &firOpBuilder = converter.getFirOpBuilder();
+    mlir::MLIRContext *context = firOpBuilder.getContext();
+    const auto &modifier =
+        std::get<std::optional<numtasks::Prescriptiveness>>(clause->t);
+    if (modifier) {
+      result.numTasksMod = mlir::omp::ClauseNumTasksTypeAttr::get(
+          context, mlir::omp::ClauseNumTasksType::Strict);
+    }
+    const auto &numtasksExpr = std::get<omp::SomeExpr>(clause->t);
+    result.numTasks =
+        fir::getBase(converter.genExprValue(numtasksExpr, stmtCtx));
+    return true;
+  }
+  return false;
+}
+
 bool ClauseProcessor::processReduction(
     mlir::Location currentLocation, mlir::omp::ReductionClauseOps &result,
     llvm::SmallVectorImpl<const semantics::Symbol *> &outReductionSyms) const {
diff --git a/flang/lib/Lower/OpenMP/ClauseProcessor.h b/flang/lib/Lower/OpenMP/ClauseProcessor.h
index 889a09a8f0cd8..738cc81348dd7 100644
--- a/flang/lib/Lower/OpenMP/ClauseProcessor.h
+++ b/flang/lib/Lower/OpenMP/ClauseProcessor.h
@@ -105,6 +105,8 @@ class ClauseProcessor {
   bool processDepend(mlir::omp::DependClauseOps &result) const;
   bool
   processEnter(llvm::SmallVectorImpl<DeclareTargetCapturePair> &result) const;
+  bool processGrainsize(lower::StatementContext &stmtCtx,
+                        mlir::omp::GrainsizeClauseOps &result) const;
   bool processIf(omp::clause::If::DirectiveNameModifier directiveName,
                  mlir::omp::IfClauseOps &result) const;
   bool processIsDevicePtr(
@@ -125,6 +127,8 @@ class ClauseProcessor {
   bool processMotionClauses(lower::StatementContext &stmtCtx,
                             mlir::omp::MapClauseOps &result);
   bool processNontemporal(mlir::omp::NontemporalClauseOps &result) const;
+  bool processNumTasks(lower::StatementContext &stmtCtx,
+                       mlir::omp::NumTasksClauseOps &result) const;
   bool processReduction(
       mlir::Location currentLocation, mlir::omp::ReductionClauseOps &result,
       llvm::SmallVectorImpl<const semantics::Symbol *> &reductionSyms) const;
diff --git a/flang/lib/Lower/OpenMP/OpenMP.cpp b/flang/lib/Lower/OpenMP/OpenMP.cpp
index e0d23fc53eeca..63acb235fca3b 100644
--- a/flang/lib/Lower/OpenMP/OpenMP.cpp
+++ b/flang/lib/Lower/OpenMP/OpenMP.cpp
@@ -1740,6 +1740,23 @@ static void genTaskgroupClauses(lower::AbstractConverter &converter,
                                         llvm::omp::Directive::OMPD_taskgroup);
 }
 
+static void genTaskloopClauses(lower::AbstractConverter &converter,
+                               semantics::SemanticsContext &semaCtx,
+                               lower::StatementContext &stmtCtx,
+                               const List<Clause> &clauses, mlir::Location loc,
+                               mlir::omp::TaskloopOperands &clauseOps) {
+  ClauseProcessor cp(converter, semaCtx, clauses);
+  cp.processGrainsize(stmtCtx, clauseOps);
+  cp.processNumTasks(stmtCtx, clauseOps);
+
+  cp.processTODO<clause::Allocate, clause::Collapse, clause::Default,
+                 clause::Final, clause::Firstprivate, clause::If,
+                 clause::InReduction, clause::Lastprivate, clause::Mergeable,
+                 clause::Nogroup, clause::Priority, clause::Private,
+                 clause::Shared, clause::Reduction, clause::Untied>(
+      loc, llvm::omp::Directive::OMPD_taskloop);
+}
+
 static void genTaskwaitClauses(lower::AbstractConverter &converter,
                                semantics::SemanticsContext &semaCtx,
                                const List<Clause> &clauses, mlir::Location loc,
@@ -2639,7 +2656,27 @@ static void genStandaloneTaskloop(lower::AbstractConverter &converter,
                                   mlir::Location loc,
                                   const ConstructQueue &queue,
                                   ConstructQueue::const_iterator item) {
-  TODO(loc, "Taskloop construct");
+  mlir::omp::TaskloopOperands taskloopClauseOps;
+  lower::StatementContext stmtCtx;
+  genTaskloopClauses(converter, semaCtx, stmtCtx, item->clauses, loc,
+                     taskloopClauseOps);
+
+  DataSharingProcessor dsp(converter, semaCtx, item->clauses, eval,
+                           /*shouldCollectPreDeterminedSymbols=*/true,
+                           /*useDelayedPrivatization=*/false, symTable);
+  dsp.processStep1();
+  mlir::omp::LoopNestOperands loopNestClauseOps;
+  llvm::SmallVector<const semantics::Symbol *> iv;
+  genLoopNestClauses(converter, semaCtx, eval, item->clauses, loc,
+                     loopNestClauseOps, iv);
+  EntryBlockArgs taskloopArgs;
+
+  auto taskLoopOp = genWrapperOp<mlir::omp::TaskloopOp>(
+      converter, loc, taskloopClauseOps, taskloopArgs);
+
+  genLoopNestOp(converter, symTable, semaCtx, eval, loc, queue, item,
+                loopNestClauseOps, iv, {{taskLoopOp, taskloopArgs}},
+                llvm::omp::Directive::OMPD_taskloop, dsp);
 }
 
 //===----------------------------------------------------------------------===//
diff --git a/flang/test/Lower/OpenMP/Todo/taskloop.f90 b/flang/test/Lower/OpenMP/Todo/taskloop.f90
deleted file mode 100644
index aca050584cbbe..0000000000000
--- a/flang/test/Lower/OpenMP/Todo/taskloop.f90
+++ /dev/null
@@ -1,13 +0,0 @@
-! RUN: %not_todo_cmd bbc -emit-fir -fopenmp -o - %s -fopenmp-version=50 2>&1 | FileCheck %s
-! RUN: %not_todo_cmd %flang_fc1 -emit-fir -fopenmp -o - %s -fopenmp-version=50 2>&1 | FileCheck %s
-
-! CHECK: not yet implemented: Taskloop construct
-subroutine omp_taskloop
-  integer :: res, i
-  !$omp taskloop
-  do i = 1, 10
-     res = res + 1
-  end do
-  !$omp end taskloop
-end subroutine omp_taskloop
-
diff --git a/flang/test/Lower/OpenMP/masked_taskloop.f90 b/flang/test/Lower/OpenMP/masked_taskloop.f90
new file mode 100644
index 0000000000000..57e8a02dbcefb
--- /dev/null
+++ b/flang/test/Lower/OpenMP/masked_taskloop.f90
@@ -0,0 +1,49 @@
+! This test checks lowering of OpenMP masked taskloop Directive.
+
+! RUN:  bbc -emit-hlfir -fopenmp -o - %s 2>&1 | FileCheck %s
+! RUN:  %flang_fc1 -emit-hlfir -fopenmp -o - %s 2>&1 | FileCheck %s
+
+! CHECK:  func.func @_QPtest_masked_taskloop() {
+! CHECK:    %[[VAL_0:.*]] = fir.alloca i32 {bindc_name = "i", uniq_name = "_QFtest_masked_taskloopEi"}
+! CHECK:    %[[VAL_1:.*]]:2 = hlfir.declare %[[VAL_0]] {uniq_name = "_QFtest_masked_taskloopEi"} : (!fir.ref<i32>) -> (!fir.ref<i32>, !fir.ref<i32>)
+! CHECK:    %[[VAL_2:.*]] = fir.address_of(@_QFtest_masked_taskloopEj) : !fir.ref<i32>
+! CHECK:    %[[VAL_3:.*]]:2 = hlfir.declare %[[VAL_2]] {uniq_name = "_QFtest_masked_taskloopEj"} : (!fir.ref<i32>) -> (!fir.ref<i32>, !fir.ref<i32>)
+! CHECK:    omp.masked {
+! CHECK:      %[[VAL_4:.*]] = fir.alloca i32 {bindc_name = "j", pinned, uniq_name = "_QFtest_masked_taskloopEj"}
+! CHECK:      %[[VAL_5:.*]]:2 = hlfir.declare %[[VAL_4]] {uniq_name = "_QFtest_masked_taskloopEj"} : (!fir.ref<i32>) -> (!fir.ref<i32>, !fir.ref<i32>)
+! CHECK:      %[[VAL_6:.*]] = fir.load %[[VAL_3]]#0 : !fir.ref<i32>
+! CHECK:      hlfir.assign %[[VAL_6]] to %[[VAL_5]]#0 : i32, !fir.ref<i32>
+! CHECK:      %[[VAL_7:.*]] = fir.alloca i32 {bindc_name = "i", pinned, uniq_name = "_QFtest_masked_taskloopEi"}
+! CHECK:      %[[VAL_8:.*]]:2 = hlfir.declare %[[VAL_7]] {uniq_name = "_QFtest_masked_taskloopEi"} : (!fir.ref<i32>) -> (!fir.ref<i32>, !fir.ref<i32>)
+! CHECK:      %[[C1_I32:.*]] = arith.constant 1 : i32
+! CHECK:      %[[C10_I32:.*]] = arith.constant 10 : i32
+! CHECK:      %[[C1_I32_0:.*]] = arith.constant 1 : i32
+! CHECK:      omp.taskloop {
+! CHECK:        omp.loop_nest (%arg0) : i32 = (%[[C1_I32]]) to (%[[C10_I32]]) inclusive step (%[[C1_I32_0]]) {
+! CHECK:          fir.store %arg0 to %[[VAL_8]]#1 : !fir.ref<i32>
+! CHECK:          %[[VAL_9:.*]] = fir.load %[[VAL_5]]#0 : !fir.ref<i32>
+! CHECK:          %[[C1_I32_1:.*]] = arith.constant 1 : i32
+! CHECK:          %[[VAL_10:.*]] = arith.addi %[[VAL_9]], %[[C1_I32_1]] : i32
+! CHECK:          hlfir.assign %[[VAL_10]] to %[[VAL_5]]#0 : i32, !fir.ref<i32>
+! CHECK:          omp.yield
+! CHECK:        }
+! CHECK:      }
+! CHECK:      omp.terminator
+! CHECK:    }
+! CHECK:    return
+! CHECK:  }
+! CHECK:  fir.global internal @_QFtest_masked_taskloopEj : i32 {
+! CHECK:    %[[C1_I32:.*]] = arith.constant 1 : i32
+! CHECK:    fir.has_value %[[C1_I32]] : i32
+! CHECK: }
+
+
+subroutine test_masked_taskloop
+  integer :: i, j = 1
+  !OpenMP directive MASKED has been deprecated, so used MASKED TASKLOOP instead.
+  !$omp masked taskloop
+  do i=1,10
+   j = j + 1
+  end do
+  !$omp end masked taskloop 
+end subroutine
diff --git a/flang/test/Lower/OpenMP/master_taskloop.f90 b/flang/test/Lower/OpenMP/master_taskloop.f90
deleted file mode 100644
index 26f664b2662dc..0000000000000
--- a/flang/test/Lower/OpenMP/master_taskloop.f90
+++ /dev/null
@@ -1,14 +0,0 @@
-! This test checks lowering of OpenMP master taskloop Directive.
-
-! RUN: %not_todo_cmd bbc -emit-fir -fopenmp -o - %s 2>&1 | FileCheck %s
-! RUN: %not_todo_cmd %flang_fc1 -emit-fir -fopenmp -o - %s 2>&1 | FileCheck %s
-
-subroutine test_master_taskloop
-  integer :: i, j = 1
-  !CHECK: not yet implemented: Taskloop construct
-  !$omp master taskloop
-  do i=1,10
-   j = j + 1
-  end do
-  !$omp end master taskloop 
-end subroutine
diff --git a/flang/test/Lower/OpenMP/parallel-master-taskloop.f90 b/flang/test/Lower/OpenMP/parallel-master-taskloop.f90
index 17ceb9496c8d3..602772f47a0e1 100644
--- a/flang/test/Lower/OpenMP/parallel-master-taskloop.f90
+++ b/flang/test/Lower/OpenMP/parallel-master-taskloop.f90
@@ -1,14 +1,47 @@
-! This test checks lowering of OpenMP parallel master taskloop Directive.
+! This test checks lowering of OpenMP parallel masked taskloop Directive.
 
-! RUN: %not_todo_cmd bbc -emit-fir -fopenmp -o - %s 2>&1 | FileCheck %s
-! RUN: %not_todo_cmd %flang_fc1 -emit-fir -fopenmp -o - %s 2>&1 | FileCheck %s
+! RUN: bbc -emit-hlfir -fopenmp -fopenmp-version=50 -o - %s 2>&1 | FileCheck %s
+! RUN: %flang_fc1 -emit-hlfir -fopenmp -fopenmp-version=50 -o - %s 2>&1 | FileCheck %s
+
+! CHECK: func.func @_QPtest_parallel_master_taskloop() {
+! CHECK:    %[[VAL_0:.*]] = fir.alloca i32 {bindc_name = "i", uniq_name = "_QFtest_parallel_master_taskloopEi"}
+! CHECK:    %[[VAL_1:.*]]:2 = hlfir.declare %[[VAL_0]] {uniq_name = "_QFtest_parallel_master_taskloopEi"} : (!fir.ref<i32>) -> (!fir.ref<i32>, !fir.ref<i32>)
+! CHECK:    %[[VAL_2:.*]] = fir.address_of(@_QFtest_parallel_master_taskloopEj) : !fir.ref<i32>
+! CHECK:    %[[VAL_3:.*]]:2 = hlfir.declare %[[VAL_2]] {uniq_name = "_QFtest_parallel_master_taskloopEj"} : (!fir.ref<i32>) -> (!fir.ref<i32>, !fir.ref<i32>)
+! CHECK:    omp.parallel {
+! CHECK:      omp.masked {
+! CHECK:        %[[VAL_4:.*]] = fir.alloca i32 {bindc_name = "i", pinned, uniq_name = "_QFtest_parallel_master_taskloopEi"}
+! CHECK:        %[[VAL_5:.*]]:2 = hlfir.declare %[[VAL_4]] {uniq_name = "_QFtest_parallel_master_taskloopEi"} : (!fir.ref<i32>) -> (!fir.ref<i32>, !fir.ref<i32>)
+! CHECK:        %[[C1_I32:.*]] = arith.constant 1 : i32
+! CHECK:        %[[C10_I32:.*]] = arith.constant 10 : i32
+! CHECK:        %[[C1_I32_0:.*]] = arith.constant 1 : i32
+! CHECK:        omp.taskloop {
+! CHECK:          omp.loop_nest (%arg0) : i32 = (%[[C1_I32]]) to (%[[C10_I32]]) inclusive step (%[[C1_I32_0]]) {
+! CHECK:            fir.store %arg0 to %[[VAL_5]]#1 : !fir.ref<i32>
+! CHECK:            %[[VAL_6:.*]] = fir.load %[[VAL_3]]#0 : !fir.ref<i32>
+! CHECK:            %[[C1_I32_1:.*]] = arith.constant 1 : i32
+! CHECK:            %[[VAL_7:.*]] = arith.addi %[[VAL_6]], %[[C1_I32_1]] : i32
+! CHECK:            hlfir.assign %[[VAL_7]] to %[[VAL_3]]#0 : i32, !fir.ref<i32>
+! CHECK:            omp.yield
+! CHECK:          }
+! CHECK:        }
+! CHECK:        omp.terminator
+! CHECK:      }
+! CHECK:      omp.terminator
+! CHECK:    }
+! CHECK:    return
+! CHECK:  }
+! CHECK:  fir.global internal @_QFtest_parallel_master_taskloopEj : i32 {
+! CHECK:    %[[C1_I32:.*]] = arith.constant 1 : i32
+! CHECK:    fir.has_value %[[C1_I32]] : i32
+! CHECK:  }
 
 subroutine test_parallel_master_taskloop
   integer :: i, j = 1
-  !CHECK: not yet implemented: Taskloop construct
-  !$omp parallel master taskloop
+  ! OpenMP directive PARALLEL MASTER TASKLOOP has been deprecated, so used PARALLEL MASKED TASKLOOP instead.
+  !$omp parallel masked taskloop
   do i=1,10
    j = j + 1
   end do
-  !$omp end parallel master taskloop 
+  !$omp end parallel masked taskloop 
 end subroutine
diff --git a/flang/test/Lower/OpenMP/taskloop.f90 b/flang/test/Lower/OpenMP/taskloop.f90
new file mode 100644
index 0000000000000..9e0f76de3a642
--- /dev/null
+++ b/flang/test/Lower/OpenMP/taskloop.f90
@@ -0,0 +1,87 @@
+! This test checks lowering of `Taskloop` directive and taskloop clauses "grainsize" and "numtasks".
+
+! RUN: bbc -emit-hlfir -fopenmp -fopenmp-version=50 -o - %s 2>&1 | FileCheck %s
+! RUN: %flang_fc1 -emit-hlfir -fopenmp -fopenmp-version=50 -o - %s 2>&1 | FileCheck %s
+
+! CHECK:  func.func @_QPomp_taskloop() {
+! CHECK:    %[[VAL_0:.*]] = fir.alloca i32 {bindc_name = "i", uniq_name = "_QFomp_taskloopEi"}
+! CHECK:    %[[VAL_1:.*]]:2 = hlfir.declare %[[VAL_0]] {uniq_name = "_QFomp_taskloopEi"} : (!fir.ref<i32>) -> (!fir.ref<i32>, !fir.ref<i32>)
+! CHECK:    %[[VAL_2:.*]] = fir.alloca i32 {bindc_name = "res", uniq_name = "_QFomp_taskloopEres"}
+! CHECK:    %[[VAL_3:.*]]:2 = hlfir.declare %[[VAL_2]] {uniq_name = "_QFomp_taskloopEres"} : (!fir.ref<i32>) -> (!fir.ref<i32>, !fir.ref<i32>)
+! CHECK:    %[[VAL_4:.*]] = fir.alloca i32 {bindc_name = "res", pinned, uniq_name = "_QFomp_taskloopEres"}
+! CHECK:    %[[VAL_5:.*]]:2 = hlfir.declare %[[VAL_4]] {uniq_name = "_QFomp_taskloopEres"} : (!fir.ref<i32>) -> (!fir.ref<i32>, !fir.ref<i32>)
+! CHECK:    %[[VAL_6:.*]] = fir.load %[[VAL_3]]#0 : !fir.ref<i32>
+! CHECK:    hlfir.assign %[[VAL_6]] to %[[VAL_5]]#0 : i32, !fir.ref<i32>
+! CHECK:    %[[VAL_7:.*]] = fir.alloca i32 {bindc_name = "i", pinned, uniq_name = "_QFomp_taskloopEi"}
+! CHECK:    %[[VAL_8:.*]]:2 = hlfir.declare %[[VAL_7]] {uniq_name = "_QFomp_taskloopEi"} : (!fir.ref<i32>) -> (!fir.ref<i32>, !fir.ref<i32>)
+! CHECK:    %[[C1_I32:.*]] = arith.constant 1 : i32
+! CHECK:    %[[C10_I32:.*]] = arith.constant 10 : i32
+! CHECK:    %[[C1_I32_0:.*]] = arith.constant 1 : i32
+! CHECK:    omp.taskloop {
+! CHECK:      omp.loop_nest (%arg0) : i32 = (%[[C1_I32]]) to (%[[C10_I32]]) inclusive step (%[[C1_I32_0]]) {
+! CHECK:        fir.store %arg0 to %[[VAL_8]]#1 : !fir.ref<i32>
+! CHECK:        %[[VAL_9:.*]] = fir.load %[[VAL_5]]#0 : !fir.ref<i32>
+! CHECK:        %[[C1_I32_1:.*]] = arith.constant 1 : i32
+! CHECK:        %[[VAL_10:.*]] = arith.addi %[[VAL_9]], %[[C1_I32_1]] : i32
+! CHECK:        hlfir.assign %[[VAL_10]] to %[[VAL_5]]#0 : i32, !fir.ref<i32>
+! CHECK:        omp.yield
+! CHECK:      }
+! CHECK:    }
+! CHECK:    return
+! CHECK:  }
+subroutine omp_taskloop
+  integer :: res, i
+  !$omp taskloop
+  do i = 1, 10
+     res = res + 1
+  end do
+  !$omp end taskloop
+end subroutine omp_taskloop
+
+!CHECK-LABEL: func.func @_QPtest_grainsize()
+subroutine test_grainsize
+  integer :: res, i
+  !CHECK: omp.taskloop grainsize(%{{.*}}: i32) {
+  !$omp taskloop grainsize(10)
+  do i = 1, 100
+     !CHECK: arith.addi
+     res = res + 1
+  end do
+  !$omp end taskloop
+end subroutine test_grainsize
+
+!CHECK-LABEL: func.func @_QPtest_grainsize_strict()
+subroutine test_grainsize_strict
+  integer :: res, i
+  !CHECK: omp.taskloop grainsize(strict: %{{.*}}: i32) {
+  !$omp taskloop grainsize(strict:10)
+  do i = 1, 100
+     !CHECK: arith.addi
+     res = res + 1
+  end do
+  !$omp end taskloop
+end subroutine
+
+!CHECK-LABEL: func.func @_QPtest_num_tasks()
+subroutine test_num_tasks
+  integer :: res, i
+  !CHECK: omp.taskloop num_tasks(strict: %{{.*}}: i32) {
+  !$omp taskloop num_tasks(strict:10)
+  do i = 1, 100
+     !CHECK: arith.addi
+     res = res + 1
+  end do
+  !$omp end taskloop
+end subroutine
+
+!CHECK-LABEL: func.func @_QPtest_num_tasks_strict()
+subroutine test_num_tasks_strict
+  integer :: res, i
+  !CHECK: omp.taskloop num_tasks(strict: %{{.*}}: i32) {
+  !$omp taskloop num_tasks(strict:10)
+  do i = 1, 100
+     !CHECK: arith.addi
+     res = res + 1
+  end do
+  !$omp end taskloop
+end subroutine
\ No newline at end of file

Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment
Labels
flang:fir-hlfir flang:openmp flang Flang issues not falling into any other category
Projects
None yet
Development

Successfully merging this pull request may close these issues.

2 participants