1//===-- Test for the parallel scan and reduction operations on the GPU ----===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8
9#include "src/__support/CPP/bit.h"
10#include "src/__support/GPU/utils.h"
11#include "test/IntegrationTest/test.h"
12
13using namespace LIBC_NAMESPACE;
14
15static uint32_t sum(uint32_t n) { return n * (n + 1) / 2; }
16
17// Tests a reduction within a convergant warp or wavefront using some known
18// values. For example, if every element in the lane is one, then the sum should
19// be the size of the warp or wavefront, i.e. 1 + 1 + 1 ... + 1.
20static void test_reduce() {
21 uint64_t mask = gpu::get_lane_mask();
22 uint32_t x = gpu::reduce(lane_mask: mask, x: 1);
23 EXPECT_EQ(x, gpu::get_lane_size());
24
25 uint32_t y = gpu::reduce(lane_mask: mask, x: gpu::get_lane_id());
26 EXPECT_EQ(y, sum(gpu::get_lane_size() - 1));
27
28 uint32_t z = 0;
29 if (gpu::get_lane_id() % 2)
30 z = gpu::reduce(lane_mask: gpu::get_lane_mask(), x: 1);
31 gpu::sync_lane(mask);
32
33 EXPECT_EQ(z, gpu::get_lane_id() % 2 ? gpu::get_lane_size() / 2 : 0);
34}
35
36// Tests an accumulation scan within a convergent warp or wavefront using some
37// known values. For example, if every element in the lane is one, then the scan
38// should have each element be equivalent to its ID, i.e. 1, 1 + 1, ...
39static void test_scan() {
40 uint64_t mask = gpu::get_lane_mask();
41
42 uint32_t x = gpu::scan(lane_mask: mask, x: 1);
43 EXPECT_EQ(x, gpu::get_lane_id() + 1);
44
45 uint32_t y = gpu::scan(lane_mask: mask, x: gpu::get_lane_id());
46 EXPECT_EQ(y, sum(gpu::get_lane_id()));
47
48 uint32_t z = 0;
49 if (gpu::get_lane_id() % 2)
50 z = gpu::scan(lane_mask: gpu::get_lane_mask(), x: 1);
51 gpu::sync_lane(mask);
52
53 EXPECT_EQ(z, gpu::get_lane_id() % 2 ? gpu::get_lane_id() / 2 + 1 : 0);
54}
55
56TEST_MAIN(int argc, char **argv, char **envp) {
57 test_reduce();
58
59 test_scan();
60
61 return 0;
62}
63

source code of libc/test/integration/src/__support/GPU/scan_reduce.cpp