//===-- Test for parallel GPU malloc interface ----------------------------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// #include "test/IntegrationTest/test.h" #include "src/__support/GPU/utils.h" #include "src/stdlib/free.h" #include "src/stdlib/malloc.h" using namespace LIBC_NAMESPACE; static inline uint32_t entropy() { return (static_cast(gpu::processor_clock()) ^ (gpu::get_thread_id_x() * 0x632be59b) ^ (gpu::get_block_id_x() * 0x85157af5)) * 0x9e3779bb; } static inline uint32_t xorshift32(uint32_t &state) { state ^= state << 13; state ^= state >> 17; state ^= state << 5; return state * 0x9e3779bb; } static inline void use(uint8_t *ptr, uint32_t size) { EXPECT_NE(ptr, nullptr); for (int i = 0; i < size; ++i) ptr[i] = uint8_t(i + gpu::get_thread_id()); // Try to detect if some other thread manages to clobber our memory. for (int i = 0; i < size; ++i) EXPECT_EQ(ptr[i], uint8_t(i + gpu::get_thread_id())); } TEST_MAIN(int, char **, char **) { void *ptrs[256]; for (int i = 0; i < 256; ++i) ptrs[i] = malloc(gpu::get_lane_id() % 2 ? 16 : 32); for (int i = 0; i < 256; ++i) use(reinterpret_cast(ptrs[i]), gpu::get_lane_id() % 2 ? 16 : 32); for (int i = 0; i < 256; ++i) free(ptrs[i]); uint32_t state = entropy(); for (int i = 0; i < 1024; ++i) { if (xorshift32(state) % 2) { uint64_t size = xorshift32(state) % 256 + 16; uint64_t *ptr = reinterpret_cast(malloc(size)); *ptr = gpu::get_thread_id(); EXPECT_EQ(*ptr, gpu::get_thread_id()); ASSERT_TRUE(ptr); ASSERT_TRUE(__builtin_is_aligned(ptr, 16)); free(ptr); } } return 0; }