1 | // RUN: %libomp-compile-and-run | FileCheck %s |
2 | // REQUIRES: ompt |
3 | |
4 | #include "callback.h" |
5 | #include <omp.h> |
6 | |
7 | |
8 | __attribute__ ((noinline)) // workaround for bug in icc |
9 | void print_task_info_at(int ancestor_level, int id) |
10 | { |
11 | #pragma omp critical |
12 | { |
13 | int task_type; |
14 | char buffer[2048]; |
15 | ompt_data_t *parallel_data; |
16 | ompt_data_t *task_data; |
17 | int thread_num; |
18 | ompt_get_task_info(ancestor_level, &task_type, &task_data, NULL, |
19 | ¶llel_data, &thread_num); |
20 | format_task_type(task_type, buffer); |
21 | printf("%" PRIu64 ": ancestor_level=%d id=%d task_type=%s=%d " |
22 | "parallel_id=%" PRIu64 " task_id=%" PRIu64 |
23 | " thread_num=%d\n" , |
24 | ompt_get_thread_data()->value, ancestor_level, id, buffer, |
25 | task_type, parallel_data->value, task_data->value, thread_num); |
26 | } |
27 | }; |
28 | |
// Prints the task info for ancestor level 0 (the innermost task of the
// calling thread), tagged with `id`, by delegating to print_task_info_at().
__attribute__ ((noinline)) // workaround for bug in icc
void print_innermost_task_info(int id)
{
  print_task_info_at(0, id);
}
34 | |
35 | |
// Test driver: opens a two-thread parallel region (region 0); the thread with
// omp_get_thread_num() == 1 then opens two nested one-thread parallel regions
// (regions 1 and 2) and prints task info at each nesting level. The FileCheck
// directives embedded below verify the thread_num reported at every level.
int main()
{

#pragma omp parallel num_threads(2)
  {
    // sync threads before checking the output
#pragma omp barrier
    // region 0
    if (omp_get_thread_num() == 1) {
      // executed by worker thread only
      // assert that thread_num is 1
      print_innermost_task_info(1);

#pragma omp parallel num_threads(1)
      {
        // serialized region 1
        // assert that thread_num is 0
        print_innermost_task_info(2);

#pragma omp parallel num_threads(1)
        {
          // serialized region 2
          // assert that thread_num is 0
          print_innermost_task_info(3);

          // Check the value of thread_num while iterating over the hierarchy
          // of active tasks.
          print_task_info_at(0, 3);
          print_task_info_at(1, 2);
          print_task_info_at(2, 1);

        }

      }
    }
  }


  // Check if libomp supports the callbacks for this test.
  // CHECK-NOT: {{^}}0: Could not register callback 'ompt_callback_task_create'
  // CHECK-NOT: {{^}}0: Could not register callback 'ompt_callback_implicit_task'


  // CHECK: {{^}}0: NULL_POINTER=[[NULL:.*$]]
  // CHECK: {{^}}[[MASTER_ID:[0-9]+]]: ompt_event_initial_task_begin: parallel_id=[[PARALLEL_ID_0:[0-9]+]], task_id=[[TASK_ID_0:[0-9]+]], actual_parallelism=1, index=1, flags=1

  // region 0
  // CHECK: {{^}}[[MASTER_ID]]: ompt_event_parallel_begin: parent_task_id=[[TASK_ID_0]],
  // CHECK-SAME: parallel_id=[[PARALLEL_ID_1:[0-9]+]]
  // CHECK-DAG: {{^}}[[MASTER_ID]]: ompt_event_implicit_task_begin: parallel_id=[[PARALLEL_ID_1]], task_id=[[TASK_ID_1:[0-9]+]]
  // CHECK-DAG: {{^}}[[WORKER_ID:[0-9]+]]: ompt_event_implicit_task_begin: parallel_id=[[PARALLEL_ID_1]], task_id=[[TASK_ID_2:[0-9]+]]
  // assert some info about implicit task executed by worker thread
  // thread_num is the most important
  // CHECK: {{^}}[[WORKER_ID]]: ancestor_level=0 id=1
  // CHECK-SAME: parallel_id=[[PARALLEL_ID_1]] task_id=[[TASK_ID_2]]
  // CHECK-SAME: thread_num=1

  // serialized region 1
  // CHECK: {{^}}[[WORKER_ID]]: ompt_event_parallel_begin: parent_task_id=[[TASK_ID_2]],
  // CHECK-SAME: parallel_id=[[PARALLEL_ID_2:[0-9]+]]
  // CHECK-DAG: {{^}}[[WORKER_ID]]: ompt_event_implicit_task_begin: parallel_id=[[PARALLEL_ID_2]], task_id=[[TASK_ID_3:[0-9]+]]
  // assert some information about the implicit task of the serialized region 1
  // pay attention that thread_num should take value 0
  // CHECK: {{^}}[[WORKER_ID]]: ancestor_level=0 id=2
  // CHECK-SAME: parallel_id=[[PARALLEL_ID_2]] task_id=[[TASK_ID_3]]
  // CHECK-SAME: thread_num=0

  // serialized region 2
  // CHECK: {{^}}[[WORKER_ID]]: ompt_event_parallel_begin: parent_task_id=[[TASK_ID_3]],
  // CHECK-SAME: parallel_id=[[PARALLEL_ID_3:[0-9]+]]
  // CHECK-DAG: {{^}}[[WORKER_ID]]: ompt_event_implicit_task_begin: parallel_id=[[PARALLEL_ID_3]], task_id=[[TASK_ID_4:[0-9]+]]
  // assert some information about the implicit task of the serialized region 2
  // pay attention that thread_num should take value 0
  // CHECK: {{^}}[[WORKER_ID]]: ancestor_level=0 id=3
  // CHECK-SAME: parallel_id=[[PARALLEL_ID_3]] task_id=[[TASK_ID_4]]
  // CHECK-SAME: thread_num=0

  // Check the value of the thread_num argument while iterating over the
  // hierarchy of active tasks. thread_num is expected to take the values
  // already checked above in this test case (0, 0, 1 - respectively).

  // Thread is the master thread of the region 2, so thread_num should be 0.
  // CHECK: {{^}}[[WORKER_ID]]: ancestor_level=0 id=3
  // CHECK-SAME: parallel_id=[[PARALLEL_ID_3]] task_id=[[TASK_ID_4]]
  // CHECK-SAME: thread_num=0

  // Thread is the master thread of the region 1, so thread_num should be 0.
  // CHECK: {{^}}[[WORKER_ID]]: ancestor_level=1 id=2
  // CHECK-SAME: parallel_id=[[PARALLEL_ID_2]] task_id=[[TASK_ID_3]]
  // CHECK-SAME: thread_num=0

  // Thread is the worker thread of the region 0, so thread_num should be 1.
  // CHECK: {{^}}[[WORKER_ID]]: ancestor_level=2 id=1
  // CHECK-SAME: parallel_id=[[PARALLEL_ID_1]] task_id=[[TASK_ID_2]]
  // CHECK-SAME: thread_num=1

  return 0;
}
134 | |