| 1 | #include "callback.h" |
| 2 | #include <omp.h> |
| 3 | #include <stdio.h> |
| 4 | |
/* Two-step stringification: STRINGIFY quotes its argument verbatim, whereas
   STR lets the argument be macro-expanded first and only then quotes it. */
#define STRINGIFY(token) #token
#define STR(token) STRINGIFY(token)

/* Text printed after "0: Schedule: ". Falls back to the expanded SCHEDULE
   macro unless SCHED_OUTPUT has already been defined. */
#if !defined(SCHED_OUTPUT)
#define SCHED_OUTPUT STR(SCHEDULE)
#endif
| 10 | |
/* With the combined parallel-for construct (base.h), the return addresses are hard to compare.
   With the separate parallel and for-nowait constructs, the addresses become more predictable,
   but the beginning of the for-loop still generates additional code, so the offset from
   loop-begin to the label is greater than 4 bytes.
*/
| 16 | |
| 17 | int main() |
| 18 | { |
| 19 | unsigned int i; |
| 20 | printf(format: "0: Schedule: " SCHED_OUTPUT "\n" ); |
| 21 | |
| 22 | #pragma omp parallel num_threads(4) |
| 23 | { |
| 24 | print_current_address(0); |
| 25 | #pragma omp for schedule(SCHEDULE) nowait |
| 26 | for (i = 0; i < 64; i++) { |
| 27 | print_fuzzy_address(1); |
| 28 | } |
| 29 | print_fuzzy_address(2); |
| 30 | } |
| 31 | print_fuzzy_address(3); |
| 32 | |
| 33 | // clang-format off |
| 34 | // Check if libomp supports the callbacks for this test. |
| 35 | // CHECK-NOT: {{^}}0: Could not register callback 'ompt_callback_parallel_begin' |
| 36 | // CHECK-NOT: {{^}}0: Could not register callback 'ompt_callback_parallel_end' |
| 37 | // CHECK-NOT: {{^}}0: Could not register callback 'ompt_callback_implicit_task' |
| 38 | // CHECK-NOT: {{^}}0: Could not register callback 'ompt_callback_work' |
| 39 | |
| 40 | |
| 41 | // CHECK: 0: NULL_POINTER=[[NULL:.*$]] |
| 42 | // CHECK: 0: Schedule: [[SCHED:[a-z]+]] |
| 43 | // CHECK: {{^}}[[MASTER_ID:[0-9]+]]: ompt_event_parallel_begin: parent_task_id={{[0-9]+}}, parent_task_frame.exit=[[NULL]], parent_task_frame.reenter={{(0x)?[0-f]+}}, parallel_id=[[PARALLEL_ID:[0-9]+]], requested_team_size=4, codeptr_ra=[[PARALLEL_RETURN_ADDRESS:(0x)?[0-f]+]]{{[0-f][0-f]}}, invoker={{[0-9]+}} |
| 44 | |
| 45 | // CHECK: {{^}}[[MASTER_ID]]: ompt_event_loop_[[SCHED]]_begin: parallel_id=[[PARALLEL_ID]], task_id={{[0-9]+}}, codeptr_ra=[[LOOP_BEGIN_RETURN_ADDRESS:(0x)?[0-f]+]]{{[0-f][0-f]}} |
| 46 | // CHECK: {{^}}[[MASTER_ID]]: ompt_event_loop_[[SCHED]]_end: parallel_id=[[PARALLEL_ID]], task_id={{[0-9]+}}, codeptr_ra=[[LOOP_END_RETURN_ADDRESS:(0x)?[0-f]+]]{{[0-f][0-f]}} |
| 47 | // CHECK: {{^}}[[MASTER_ID]]: fuzzy_address={{.*}}[[LOOP_END_RETURN_ADDRESS]] |
| 48 | |
| 49 | // CHECK: {{^}}[[MASTER_ID]]: ompt_event_parallel_end: parallel_id=[[PARALLEL_ID]], task_id={{[0-9]+}}, invoker={{[0-9]+}}, codeptr_ra=[[PARALLEL_RETURN_ADDRESS]] |
| 50 | // CHECK: {{^}}[[MASTER_ID]]: fuzzy_address={{.*}}[[PARALLEL_RETURN_ADDRESS]] |
| 51 | |
| 52 | // CHECK: {{^}}[[THREAD_ID:[0-9]+]]: ompt_event_loop_[[SCHED]]_begin: parallel_id=[[PARALLEL_ID]], task_id={{[0-9]+}}, codeptr_ra={{(0x)?[0-f]+}} |
| 53 | // CHECK: {{^}}[[THREAD_ID]]: ompt_event_loop_[[SCHED]]_end: parallel_id=[[PARALLEL_ID]], task_id={{[0-9]+}}, codeptr_ra=[[LOOP_END_RETURN_ADDRESS:(0x)?[0-f]+]]{{[0-f][0-f]}} |
| 54 | // CHECK: {{^}}[[THREAD_ID]]: fuzzy_address={{.*}}[[LOOP_END_RETURN_ADDRESS]] |
| 55 | |
| 56 | // CHECK: {{^}}[[THREAD_ID:[0-9]+]]: ompt_event_loop_[[SCHED]]_begin: parallel_id=[[PARALLEL_ID]], task_id={{[0-9]+}}, codeptr_ra={{(0x)?[0-f]+}} |
| 57 | // CHECK: {{^}}[[THREAD_ID]]: ompt_event_loop_[[SCHED]]_end: parallel_id=[[PARALLEL_ID]], task_id={{[0-9]+}}, codeptr_ra=[[LOOP_END_RETURN_ADDRESS:(0x)?[0-f]+]]{{[0-f][0-f]}} |
| 58 | // CHECK: {{^}}[[THREAD_ID]]: fuzzy_address={{.*}}[[LOOP_END_RETURN_ADDRESS]] |
| 59 | |
| 60 | // CHECK: {{^}}[[THREAD_ID:[0-9]+]]: ompt_event_loop_[[SCHED]]_begin: parallel_id=[[PARALLEL_ID]], task_id={{[0-9]+}}, codeptr_ra={{(0x)?[0-f]+}} |
| 61 | // CHECK: {{^}}[[THREAD_ID]]: ompt_event_loop_[[SCHED]]_end: parallel_id=[[PARALLEL_ID]], task_id={{[0-9]+}}, codeptr_ra=[[LOOP_END_RETURN_ADDRESS:(0x)?[0-f]+]]{{[0-f][0-f]}} |
| 62 | // CHECK: {{^}}[[THREAD_ID]]: fuzzy_address={{.*}}[[LOOP_END_RETURN_ADDRESS]] |
| 63 | |
| 64 | |
| 65 | // CHECK-LOOP: 0: NULL_POINTER=[[NULL:.*$]] |
| 66 | // CHECK-LOOP: 0: Schedule: [[SCHED:[a-z]+]] |
| 67 | // CHECK-LOOP: 0: ompt_event_runtime_shutdown |
| 68 | // CHECK-LOOP: {{^}}[[MASTER_ID:[0-9]+]]: ompt_event_parallel_begin: parent_task_id={{[0-9]+}}, parent_task_frame.exit=[[NULL]], parent_task_frame.reenter={{(0x)?[0-f]+}}, parallel_id=[[PARALLEL_ID:[0-9]+]], requested_team_size=4, codeptr_ra={{(0x)?[0-f]+}}, invoker={{[0-9]+}} |
| 69 | // CHECK-LOOP: {{^}}[[MASTER_ID]]: ompt_event_loop_[[SCHED]]_begin: parallel_id=[[PARALLEL_ID]], task_id={{[0-9]+}}, codeptr_ra=[[LOOP_BEGIN_RETURN_ADDRESS:(0x)?[0-f]+]]{{[0-f][0-f]}} |
| 70 | // CHECK-LOOP: {{^}}{{[0-9]+}}: fuzzy_address={{.*}}[[LOOP_BEGIN_RETURN_ADDRESS]] |
| 71 | // CHECK-LOOP: {{^}}{{[0-9]+}}: fuzzy_address={{.*}}[[LOOP_BEGIN_RETURN_ADDRESS]] |
| 72 | // CHECK-LOOP: {{^}}{{[0-9]+}}: fuzzy_address={{.*}}[[LOOP_BEGIN_RETURN_ADDRESS]] |
| 73 | // CHECK-LOOP: {{^}}{{[0-9]+}}: fuzzy_address={{.*}}[[LOOP_BEGIN_RETURN_ADDRESS]] |
| 74 | // clang-format on |
| 75 | |
| 76 | return 0; |
| 77 | } |
| 78 | |