mirror of
https://github.com/capstone-engine/llvm-capstone.git
synced 2024-12-02 18:58:15 +00:00
[OMPT] Provide the right thread_num for ancestor levels
The current implementation always provides the thread-num for the current parallel region. This patch fixes the behavior for ancestor levels >0. Differential Revision: https://reviews.llvm.org/D46533 llvm-svn: 336085
This commit is contained in:
parent
3af2c992dc
commit
4a73ae167e
@ -341,18 +341,23 @@ int __ompt_get_task_info_internal(int ancestor_level, int *type,
|
||||
ompt_task_info_t *info = NULL;
|
||||
ompt_team_info_t *team_info = NULL;
|
||||
kmp_info_t *thr = ompt_get_thread();
|
||||
int level = ancestor_level;
|
||||
|
||||
if (thr) {
|
||||
kmp_taskdata_t *taskdata = thr->th.th_current_task;
|
||||
if (taskdata == NULL)
|
||||
return 0;
|
||||
kmp_team *team = thr->th.th_team;
|
||||
kmp_team *team = thr->th.th_team, *prev_team = NULL;
|
||||
if (team == NULL)
|
||||
return 0;
|
||||
ompt_lw_taskteam_t *lwt = NULL,
|
||||
*next_lwt = LWT_FROM_TEAM(taskdata->td_team);
|
||||
*next_lwt = LWT_FROM_TEAM(taskdata->td_team),
|
||||
*prev_lwt = NULL;
|
||||
|
||||
while (ancestor_level > 0) {
|
||||
// needed for thread_num
|
||||
prev_team = team;
|
||||
prev_lwt = lwt;
|
||||
// next lightweight team (if any)
|
||||
if (lwt)
|
||||
lwt = lwt->parent;
|
||||
@ -410,7 +415,13 @@ int __ompt_get_task_info_internal(int ancestor_level, int *type,
|
||||
*parallel_data = team_info ? &(team_info->parallel_data) : NULL;
|
||||
}
|
||||
if (thread_num) {
|
||||
*thread_num = __kmp_get_gtid();
|
||||
if (level == 0)
|
||||
*thread_num = __kmp_get_tid();
|
||||
else if (prev_lwt)
|
||||
*thread_num = 0;
|
||||
else
|
||||
*thread_num = prev_team->t.t_master_tid;
|
||||
// *thread_num = team->t.t_master_tid;
|
||||
}
|
||||
return info ? 2 : 0;
|
||||
}
|
||||
|
357
openmp/runtime/test/ompt/parallel/nested_thread_num.c
Normal file
357
openmp/runtime/test/ompt/parallel/nested_thread_num.c
Normal file
@ -0,0 +1,357 @@
|
||||
// RUN: %libomp-compile-and-run | FileCheck %s
|
||||
// RUN: %libomp-compile-and-run | %sort-threads | FileCheck --check-prefix=THREADS %s
|
||||
// REQUIRES: ompt
|
||||
// UNSUPPORTED: gcc-4, gcc-5, gcc-6, gcc-7
|
||||
#define TEST_NEED_PRINT_FRAME_FROM_OUTLINED_FN
|
||||
#include "callback.h"
|
||||
#include <omp.h>
|
||||
#include <unistd.h>
|
||||
|
||||
// Test driver: opens a 2-thread parallel region, nests a second 2-thread
// parallel region inside it, and prints frame / task information at each
// level. The CHECK/THREADS directives below match that output, so the order
// of the print calls in this function must not change.
int main() {
|
||||
// shared counter handed to OMPT_SIGNAL / OMPT_WAIT in the inner region
int condition = 0;
|
||||
// enable nested parallelism so the inner region can get its own team
omp_set_nested(1);
|
||||
// frame address of main; the THREADS checks capture it as MAIN_REENTER
print_frame(0);
|
||||
|
||||
// outer parallel region (PARALLEL_ID in the checks)
#pragma omp parallel num_threads(2)
|
||||
{
|
||||
print_frame_from_outlined_fn(1);
|
||||
// task info for the current task (level 0) and its parent (level 1);
// the checks match these as "task level 0:" / "task level 1:" lines
print_ids(0);
|
||||
print_ids(1);
|
||||
print_frame(0);
|
||||
|
||||
// get all implicit task events before starting nested:
|
||||
#pragma omp barrier
|
||||
|
||||
// inner (nested) parallel region (NESTED_PARALLEL_ID in the checks)
#pragma omp parallel num_threads(2)
|
||||
{
|
||||
print_frame_from_outlined_fn(1);
|
||||
// levels 0, 1 and 2: nested task, outer implicit task, initial task;
// the thread_num printed for levels 1 and 2 is what this test targets
print_ids(0);
|
||||
print_ids(1);
|
||||
print_ids(2);
|
||||
print_frame(0);
|
||||
// NOTE(review): OMPT_SIGNAL/OMPT_WAIT come from callback.h; presumably
// each thread bumps `condition` and then waits until all 4 nested
// threads (2 outer x 2 inner) have done so -- confirm against callback.h
OMPT_SIGNAL(condition);
|
||||
OMPT_WAIT(condition, 4);
|
||||
// explicit barrier; matched by the "explicit barrier" THREADS checks
#pragma omp barrier
|
||||
print_fuzzy_address(1);
|
||||
print_ids(0);
|
||||
}
|
||||
// printed after the nested region ends; checked against
// NESTED_RETURN_ADDRESS
print_fuzzy_address(2);
|
||||
print_ids(0);
|
||||
}
|
||||
// printed after the outer region ends; checked against RETURN_ADDRESS
print_fuzzy_address(3);
|
||||
|
||||
return 0;
|
||||
}
|
||||
// Check if libomp supports the callbacks for this test.
|
||||
// CHECK-NOT: {{^}}0: Could not register callback
|
||||
|
||||
// CHECK: 0: NULL_POINTER=[[NULL:.*$]]
|
||||
|
||||
// make sure initial data pointers are null
|
||||
// CHECK-NOT: 0: parallel_data initially not null
|
||||
// CHECK-NOT: 0: task_data initially not null
|
||||
// CHECK-NOT: 0: thread_data initially not null
|
||||
|
||||
// CHECK: {{^}}[[MASTER_ID:[0-9]+]]: ompt_event_parallel_begin:
|
||||
// CHECK-SAME: parent_task_id=[[PARENT_TASK_ID:[0-9]+]],
|
||||
// CHECK-SAME: parent_task_frame.exit=[[NULL]],
|
||||
// CHECK-SAME: parent_task_frame.reenter={{0x[0-f]+}},
|
||||
// CHECK-SAME: parallel_id=[[PARALLEL_ID:[0-9]+]],
|
||||
// CHECK-SAME: requested_team_size=2,
|
||||
// CHECK-SAME: codeptr_ra=[[RETURN_ADDRESS:0x[0-f]+]]{{[0-f][0-f]}},
|
||||
// CHECK-SAME: invoker=[[PARALLEL_INVOKER:[0-9]+]]
|
||||
|
||||
// CHECK-DAG: {{^}}[[MASTER_ID]]: ompt_event_implicit_task_begin:
|
||||
// CHECK-DAG: {{^}}[[MASTER_ID]]: ompt_event_implicit_task_end:
|
||||
|
||||
// Note that we cannot ensure that the worker threads have already called
|
||||
// barrier_end and implicit_task_end before parallel_end!
|
||||
|
||||
// CHECK-DAG: {{^}}[[THREAD_ID:[0-9]+]]: ompt_event_implicit_task_begin:
|
||||
// CHECK-DAG: {{^}}[[THREAD_ID]]: ompt_event_barrier_begin:
|
||||
|
||||
|
||||
// CHECK: ompt_event_parallel_end: parallel_id=[[PARALLEL_ID]],
|
||||
// CHECK-SAME: task_id=[[PARENT_TASK_ID]], invoker=[[PARALLEL_INVOKER]]
|
||||
// CHECK: {{^}}[[MASTER_ID]]: fuzzy_address={{.*}}[[RETURN_ADDRESS]]
|
||||
|
||||
// THREADS: {{^}}0: NULL_POINTER=[[NULL:.*$]]
|
||||
// THREADS: __builtin_frame_address(0)=[[MAIN_REENTER:0x[0-f]+]]
|
||||
// THREADS: {{^}}[[MASTER_ID:[0-9]+]]: ompt_event_parallel_begin:
|
||||
// THREADS-SAME: parent_task_id=[[PARENT_TASK_ID:[0-9]+]],
|
||||
// THREADS-SAME: parent_task_frame.exit=[[NULL]],
|
||||
// THREADS-SAME: parent_task_frame.reenter=[[MAIN_REENTER]],
|
||||
// THREADS-SAME: parallel_id=[[PARALLEL_ID:[0-9]+]], requested_team_size=2,
|
||||
// THREADS-SAME: codeptr_ra=[[RETURN_ADDRESS:0x[0-f]+]]{{[0-f][0-f]}},
|
||||
// THREADS-SAME: invoker=[[PARALLEL_INVOKER:[0-9]+]]
|
||||
|
||||
// nested parallel masters
|
||||
// THREADS: {{^}}[[MASTER_ID]]: ompt_event_implicit_task_begin:
|
||||
// THREADS-SAME: parallel_id=[[PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[IMPLICIT_TASK_ID:[0-9]+]],
|
||||
// THREADS-SAME: team_size=2, thread_num=0
|
||||
|
||||
// THREADS: __builtin_frame_address({{.}})=[[EXIT:0x[0-f]+]]
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: task level 0: parallel_id=[[PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[IMPLICIT_TASK_ID]], exit_frame=[[EXIT]],
|
||||
// THREADS-SAME: reenter_frame=[[NULL]],
|
||||
// THREADS-SAME: thread_num=0
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: task level 1:
|
||||
// THREADS-SAME: parallel_id=[[IMPLICIT_PARALLEL_ID:[0-9]+]],
|
||||
// THREADS-SAME: task_id=[[PARENT_TASK_ID]], exit_frame=[[NULL]],
|
||||
// THREADS-SAME: reenter_frame=[[MAIN_REENTER]]
|
||||
|
||||
// THREADS: __builtin_frame_address(0)=[[REENTER:0x[0-f]+]]
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: ompt_event_parallel_begin:
|
||||
// THREADS-SAME: parent_task_id=[[IMPLICIT_TASK_ID]],
|
||||
// THREADS-SAME: parent_task_frame.exit=[[EXIT]],
|
||||
// THREADS-SAME: parent_task_frame.reenter=[[REENTER]],
|
||||
// THREADS-SAME: parallel_id=[[NESTED_PARALLEL_ID:[0-9]+]],
|
||||
// THREADS-SAME: requested_team_size=2,
|
||||
// THREADS-SAME: codeptr_ra=[[NESTED_RETURN_ADDRESS:0x[0-f]+]]{{[0-f][0-f]}},
|
||||
// THREADS-SAME: invoker=[[PARALLEL_INVOKER]]
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: ompt_event_implicit_task_begin:
|
||||
// THREADS-SAME: parallel_id=[[NESTED_PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[NESTED_IMPLICIT_TASK_ID:[0-9]+]], team_size=2,
|
||||
// THREADS-SAME: thread_num=0
|
||||
|
||||
// THREADS: __builtin_frame_address({{.}})=[[NESTED_EXIT:0x[0-f]+]]
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: task level 0:
|
||||
// THREADS-SAME: parallel_id=[[NESTED_PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[NESTED_IMPLICIT_TASK_ID]],
|
||||
// THREADS-SAME: exit_frame=[[NESTED_EXIT]], reenter_frame=[[NULL]],
|
||||
// THREADS-SAME: thread_num=0
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: task level 1: parallel_id=[[PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[IMPLICIT_TASK_ID]], exit_frame=[[EXIT]],
|
||||
// THREADS-SAME: reenter_frame=[[REENTER]]
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: task level 2:
|
||||
// THREADS-SAME: parallel_id=[[IMPLICIT_PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[PARENT_TASK_ID]], exit_frame=[[NULL]],
|
||||
// THREADS-SAME: reenter_frame=[[MAIN_REENTER]]
|
||||
|
||||
// THREADS: __builtin_frame_address(0)=[[NESTED_REENTER:0x[0-f]+]]
|
||||
|
||||
// THREADS-NOT: {{^}}[[MASTER_ID]]: ompt_event_implicit_task_end
|
||||
// explicit barrier
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: ompt_event_barrier_begin:
|
||||
// THREADS-SAME: parallel_id=[[NESTED_PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[NESTED_IMPLICIT_TASK_ID]],
|
||||
// THREADS-SAME: codeptr_ra=[[BARRIER_RETURN_ADDRESS:0x[0-f]+]]{{[0-f][0-f]}}
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: task level 0:
|
||||
// THREADS-SAME: parallel_id=[[NESTED_PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[NESTED_IMPLICIT_TASK_ID]],
|
||||
// THREADS-SAME: exit_frame=[[NESTED_EXIT]], reenter_frame=[[NESTED_REENTER]]
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: ompt_event_barrier_end:
|
||||
// THREADS-SAME: parallel_id=[[NESTED_PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[NESTED_IMPLICIT_TASK_ID]]
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: fuzzy_address={{.*}}[[BARRIER_RETURN_ADDRESS]]
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: task level 0:
|
||||
// THREADS-SAME: parallel_id=[[NESTED_PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[NESTED_IMPLICIT_TASK_ID]],
|
||||
// THREADS-SAME: exit_frame=[[NESTED_EXIT]], reenter_frame=[[NULL]]
|
||||
|
||||
// implicit barrier
|
||||
// THREADS: {{^}}[[MASTER_ID]]: ompt_event_barrier_begin:
|
||||
// THREADS-SAME: parallel_id=[[NESTED_PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[NESTED_IMPLICIT_TASK_ID]],
|
||||
// THREADS-SAME: codeptr_ra=[[NESTED_RETURN_ADDRESS]]{{[0-f][0-f]}}
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: task level 0:
|
||||
// THREADS-SAME: parallel_id=[[NESTED_PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[NESTED_IMPLICIT_TASK_ID]],
|
||||
// THREADS-SAME: exit_frame=[[NULL]], reenter_frame=[[NULL]]
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: ompt_event_barrier_end:
|
||||
// THREADS-SAME: parallel_id={{[0-9]+}}, task_id=[[NESTED_IMPLICIT_TASK_ID]],
|
||||
// THREADS-SAME: codeptr_ra=[[NESTED_RETURN_ADDRESS]]{{[0-f][0-f]}}
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: ompt_event_implicit_task_end:
|
||||
// THREADS-SAME: parallel_id={{[0-9]+}}, task_id=[[NESTED_IMPLICIT_TASK_ID]]
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: ompt_event_parallel_end:
|
||||
// THREADS-SAME: parallel_id=[[NESTED_PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[IMPLICIT_TASK_ID]],
|
||||
// THREADS-SAME: invoker=[[PARALLEL_INVOKER]],
|
||||
// THREADS-SAME: codeptr_ra=[[NESTED_RETURN_ADDRESS]]{{[0-f][0-f]}}
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: fuzzy_address={{.*}}[[NESTED_RETURN_ADDRESS]]
|
||||
|
||||
// THREADS-NOT: {{^}}[[MASTER_ID]]: ompt_event_implicit_task_end
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: task level 0: parallel_id=[[PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[IMPLICIT_TASK_ID]], exit_frame=[[EXIT]],
|
||||
// THREADS-SAME: reenter_frame=[[NULL]]
|
||||
|
||||
// implicit barrier
|
||||
// THREADS: {{^}}[[MASTER_ID]]: ompt_event_barrier_begin:
|
||||
// THREADS-SAME: parallel_id=[[PARALLEL_ID]], task_id=[[IMPLICIT_TASK_ID]],
|
||||
// THREADS-SAME: codeptr_ra=[[RETURN_ADDRESS]]{{[0-f][0-f]}}
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: task level 0: parallel_id=[[PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[IMPLICIT_TASK_ID]], exit_frame=[[NULL]],
|
||||
// THREADS-SAME: reenter_frame=[[NULL]]
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: ompt_event_barrier_end:
|
||||
// THREADS-SAME: parallel_id={{[0-9]+}}, task_id=[[IMPLICIT_TASK_ID]],
|
||||
// THREADS-SAME: codeptr_ra=[[RETURN_ADDRESS]]{{[0-f][0-f]}}
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: ompt_event_implicit_task_end:
|
||||
// THREADS-SAME: parallel_id={{[0-9]+}}, task_id=[[IMPLICIT_TASK_ID]]
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: ompt_event_parallel_end:
|
||||
// THREADS-SAME: parallel_id=[[PARALLEL_ID]], task_id=[[PARENT_TASK_ID]],
|
||||
// THREADS-SAME: invoker=[[PARALLEL_INVOKER]],
|
||||
// THREADS-SAME: codeptr_ra=[[RETURN_ADDRESS]]{{[0-f][0-f]}}
|
||||
|
||||
// THREADS: {{^}}[[MASTER_ID]]: fuzzy_address={{.*}}[[RETURN_ADDRESS]]
|
||||
|
||||
// Worker of first nesting level
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID:[0-9]+]]: ompt_event_implicit_task_begin:
|
||||
// THREADS-SAME: parallel_id=[[PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[IMPLICIT_TASK_ID:[0-9]+]], team_size=2,
|
||||
// THREADS-SAME: thread_num=[[OUTER_THREADNUM:[0-9]+]]
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: task level 0: parallel_id=[[PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[IMPLICIT_TASK_ID]],
|
||||
// THREADS-SAME: thread_num=[[OUTER_THREADNUM]]
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: task level 1:
|
||||
// THREADS-SAME: parallel_id=[[IMPLICIT_PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[PARENT_TASK_ID]]
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: ompt_event_parallel_begin:
|
||||
// THREADS-SAME: parent_task_id=[[IMPLICIT_TASK_ID]],
|
||||
// THREADS-SAME: parent_task_frame.exit={{0x[0-f]+}},
|
||||
// THREADS-SAME: parent_task_frame.reenter={{0x[0-f]+}},
|
||||
// THREADS-SAME: parallel_id=[[NESTED_PARALLEL_ID:[0-9]+]], requested_team_size=2,
|
||||
// THREADS-SAME: codeptr_ra=[[NESTED_RETURN_ADDRESS]]{{[0-f][0-f]}},
|
||||
// THREADS-SAME: invoker=[[PARALLEL_INVOKER]]
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: ompt_event_implicit_task_begin:
|
||||
// THREADS-SAME: parallel_id=[[NESTED_PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[NESTED_IMPLICIT_TASK_ID:[0-9]+]], team_size=2,
|
||||
// THREADS-SAME: thread_num=[[INNER_THREADNUM:[0-9]+]]
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: task level 0:
|
||||
// THREADS-SAME: parallel_id=[[NESTED_PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[NESTED_IMPLICIT_TASK_ID]],
|
||||
// THREADS-SAME: thread_num=[[INNER_THREADNUM]]
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: task level 1: parallel_id=[[PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[IMPLICIT_TASK_ID]],
|
||||
// THREADS-SAME: thread_num=[[OUTER_THREADNUM]]
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: task level 2:
|
||||
// THREADS-SAME: parallel_id=[[IMPLICIT_PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[PARENT_TASK_ID]]
|
||||
|
||||
// THREADS-NOT: {{^}}[[THREAD_ID]]: ompt_event_implicit_task_end
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: ompt_event_barrier_begin:
|
||||
// THREADS-SAME: parallel_id=[[NESTED_PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[NESTED_IMPLICIT_TASK_ID]]
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: ompt_event_barrier_end:
|
||||
// THREADS-SAME: parallel_id={{[0-9]+}}, task_id=[[NESTED_IMPLICIT_TASK_ID]]
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: ompt_event_implicit_task_end:
|
||||
// THREADS-SAME: parallel_id={{[0-9]+}}, task_id=[[NESTED_IMPLICIT_TASK_ID]]
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: ompt_event_parallel_end:
|
||||
// THREADS-SAME: parallel_id=[[NESTED_PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[IMPLICIT_TASK_ID]], invoker=[[PARALLEL_INVOKER]]
|
||||
|
||||
// THREADS-NOT: {{^}}[[THREAD_ID]]: ompt_event_implicit_task_end
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: ompt_event_barrier_begin:
|
||||
// THREADS-SAME: parallel_id=[[PARALLEL_ID]], task_id=[[IMPLICIT_TASK_ID]]
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: ompt_event_barrier_end:
|
||||
// THREADS-SAME: parallel_id={{[0-9]+}}, task_id=[[IMPLICIT_TASK_ID]]
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: ompt_event_implicit_task_end:
|
||||
// THREADS-SAME: parallel_id={{[0-9]+}}, task_id=[[IMPLICIT_TASK_ID]]
|
||||
|
||||
// nested parallel worker threads
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID:[0-9]+]]: ompt_event_implicit_task_begin:
|
||||
// THREADS-SAME: parallel_id=[[NESTED_PARALLEL_ID:[0-9]+]],
|
||||
// THREADS-SAME: task_id=[[IMPLICIT_TASK_ID:[0-9]+]]
|
||||
// THREADS-SAME: thread_num=[[THREADNUM:[0-9]+]]
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: task level 0:
|
||||
// THREADS-SAME: parallel_id=[[NESTED_PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[IMPLICIT_TASK_ID]]
|
||||
// THREADS-SAME: thread_num=[[THREADNUM]]
|
||||
|
||||
// can't reliably tell which parallel region is the parent...
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: task level 1: parallel_id={{[0-9]+}},
|
||||
// THREADS-SAME: task_id={{[0-9]+}}
|
||||
// THREADS-SAME: thread_num={{[01]}}
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: task level 2:
|
||||
// THREADS-SAME: parallel_id=[[IMPLICIT_PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[PARENT_TASK_ID]]
|
||||
// THREADS-SAME: thread_num=0
|
||||
|
||||
// THREADS-NOT: {{^}}[[THREAD_ID]]: ompt_event_implicit_task_end
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: ompt_event_barrier_begin:
|
||||
// THREADS-SAME: parallel_id=[[NESTED_PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[IMPLICIT_TASK_ID]]
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: ompt_event_barrier_end:
|
||||
// THREADS-SAME: parallel_id={{[0-9]+}}, task_id=[[IMPLICIT_TASK_ID]]
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: ompt_event_implicit_task_end:
|
||||
// THREADS-SAME: parallel_id={{[0-9]+}}, task_id=[[IMPLICIT_TASK_ID]]
|
||||
|
||||
// other nested parallel worker threads
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID:[0-9]+]]: ompt_event_implicit_task_begin:
|
||||
// THREADS-SAME: parallel_id=[[NESTED_PARALLEL_ID:[0-9]+]],
|
||||
// THREADS-SAME: task_id=[[IMPLICIT_TASK_ID:[0-9]+]]
|
||||
// THREADS-SAME: thread_num=[[THREADNUM:[0-9]+]]
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: task level 0:
|
||||
// THREADS-SAME: parallel_id=[[NESTED_PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[IMPLICIT_TASK_ID]]
|
||||
// THREADS-SAME: thread_num=[[THREADNUM]]
|
||||
|
||||
// can't reliably tell which parallel region is the parent...
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: task level 1: parallel_id={{[0-9]+}},
|
||||
// THREADS-SAME: task_id={{[0-9]+}}
|
||||
// THREADS-SAME: thread_num={{[01]}}
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: task level 2:
|
||||
// THREADS-SAME: parallel_id=[[IMPLICIT_PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[PARENT_TASK_ID]]
|
||||
// THREADS-SAME: thread_num=0
|
||||
|
||||
// THREADS-NOT: {{^}}[[THREAD_ID]]: ompt_event_implicit_task_end
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: ompt_event_barrier_begin:
|
||||
// THREADS-SAME: parallel_id=[[NESTED_PARALLEL_ID]],
|
||||
// THREADS-SAME: task_id=[[IMPLICIT_TASK_ID]]
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: ompt_event_barrier_end:
|
||||
// THREADS-SAME: parallel_id={{[0-9]+}}, task_id=[[IMPLICIT_TASK_ID]]
|
||||
|
||||
// THREADS: {{^}}[[THREAD_ID]]: ompt_event_implicit_task_end:
|
||||
// THREADS-SAME: parallel_id={{[0-9]+}}, task_id=[[IMPLICIT_TASK_ID]]
|
||||
|
Loading…
Reference in New Issue
Block a user