- Pass context into various functions. - Factor out some CUDA algorithms. - Use ATS only for update position.
71 lines
2.0 KiB
Plaintext
71 lines
2.0 KiB
Plaintext
/**
 * Copyright 2021-2024, XGBoost Contributors
 */
|
|
#include <gtest/gtest.h>
|
|
#include <thrust/copy.h> // thrust::copy
|
|
|
|
#include "../../../src/common/device_helpers.cuh"
|
|
#include "../../../src/common/threading_utils.cuh"
|
|
#include "../helpers.h" // for MakeCUDACtx
|
|
|
|
namespace xgboost::common {
/**
 * Exercises SegmentedTrapezoidThreads on three segments of eight elements each
 * ([0, 8), [8, 16), [16, 24)) for h = 1, 2 and 7.
 *
 * For h = 1 only the returned total is checked; for h = 2 and h = 7 the difference
 * between consecutive entries of the output pointer is checked for every segment.
 */
TEST(SegmentedTrapezoidThreads, Basic) {
  size_t constexpr kElements = 24, kGroups = 3;
  auto ctx = MakeCUDACtx(0);

  // Segment boundaries, written element by element into device memory.
  dh::device_vector<size_t> segments(kGroups + 1, 0);
  segments[0] = 0;
  segments[1] = 8;
  segments[2] = 16;
  segments[kGroups] = kElements;

  size_t h = 1;
  dh::device_vector<size_t> threads(kGroups + 1, 0);

  // h = 1: the returned total must equal kElements - kGroups.
  size_t n_threads =
      SegmentedTrapezoidThreads(&ctx, dh::ToSpan(segments), dh::ToSpan(threads), h);
  ASSERT_EQ(n_threads, kElements - kGroups);

  // Larger h: every segment is expected to receive the same number of threads.
  struct Case {
    size_t h;          // value passed to SegmentedTrapezoidThreads
    size_t per_group;  // expected thread_ptr[g] - thread_ptr[g - 1]
  };
  Case const cases[] = {{2, 13}, {7, 28}};

  std::vector<size_t> h_threads(threads.size());
  for (auto const& c : cases) {
    h = c.h;
    SegmentedTrapezoidThreads(&ctx, dh::ToSpan(segments), dh::ToSpan(threads), h);
    // Bring the device result back to the host before inspecting it.
    thrust::copy(threads.cbegin(), threads.cend(), h_threads.begin());
    for (size_t g = 1; g < h_threads.size(); ++g) {
      ASSERT_EQ(h_threads[g] - h_threads[g - 1], c.per_group);
    }
  }
}

/**
 * Checks UnravelTrapeziodIdx against hard-coded (i, j) pairs for kN = 8.
 *
 * NOTE(review): the expected values are consistent with a row-major enumeration of
 * pairs with i < j; confirm against the implementation in threading_utils.cuh.
 */
TEST(SegmentedTrapezoidThreads, Unravel) {
  size_t constexpr kN = 8;

  struct Expected {
    size_t idx;  // linear index handed to UnravelTrapeziodIdx
    size_t i;    // expected first output
    size_t j;    // expected second output
  };
  Expected const table[] = {
      {6, 0, 7}, {12, 1, 7}, {15, 2, 5}, {21, 3, 7}, {25, 5, 6}, {27, 6, 7},
  };

  // The outputs are deliberately shared across calls, as each call overwrites them.
  size_t i = 0, j = 0;
  for (auto const& e : table) {
    UnravelTrapeziodIdx(e.idx, kN, &i, &j);
    ASSERT_EQ(i, e.i);
    ASSERT_EQ(j, e.j);
  }
}
}  // namespace xgboost::common
|