- ./testxgboost (without filters) failed if run on a multi-GPU machine because the memory was allocated on the current device, but device 0 was always passed into LaunchN
372 lines
9.7 KiB
Plaintext
372 lines
9.7 KiB
Plaintext
/*!
|
|
* Copyright 2018 XGBoost contributors
|
|
*/
|
|
#include <gtest/gtest.h>
|
|
|
|
#include <thrust/host_vector.h>
|
|
#include <thrust/device_vector.h>
|
|
#include <thrust/execution_policy.h>
|
|
|
|
#include "../../../src/common/device_helpers.cuh"
|
|
#include "../../../src/common/span.h"
|
|
#include "test_span.h"
|
|
|
|
namespace xgboost {
|
|
namespace common {
|
|
|
|
struct TestStatus {
|
|
int *status_;
|
|
|
|
public:
|
|
TestStatus () {
|
|
dh::safe_cuda(cudaMalloc(&status_, sizeof(int)));
|
|
int h_status = 1;
|
|
dh::safe_cuda(cudaMemcpy(status_, &h_status,
|
|
sizeof(int), cudaMemcpyHostToDevice));
|
|
}
|
|
~TestStatus() {
|
|
dh::safe_cuda(cudaFree(status_));
|
|
}
|
|
|
|
int get() {
|
|
int h_status;
|
|
dh::safe_cuda(cudaMemcpy(&h_status, status_,
|
|
sizeof(int), cudaMemcpyDeviceToHost));
|
|
return h_status;
|
|
}
|
|
|
|
int* data() {
|
|
return status_;
|
|
}
|
|
};
|
|
|
|
__global__ void test_from_other_kernel(Span<float> span) {
|
|
// don't get optimized out
|
|
size_t idx = threadIdx.x + blockIdx.x * blockDim.x;
|
|
|
|
if (idx >= span.size())
|
|
return;
|
|
}
|
|
// Test converting different T
|
|
__global__ void test_from_other_kernel_const(Span<float const, 16> span) {
|
|
// don't get optimized out
|
|
size_t idx = threadIdx.x + blockIdx.x * blockDim.x;
|
|
|
|
if (idx >= span.size())
|
|
return;
|
|
}
|
|
|
|
/*!
|
|
* \brief Here we just test whether the code compiles.
|
|
*/
|
|
TEST(GPUSpan, FromOther) {
|
|
thrust::host_vector<float> h_vec (16);
|
|
InitializeRange(h_vec.begin(), h_vec.end());
|
|
|
|
thrust::device_vector<float> d_vec (h_vec.size());
|
|
thrust::copy(h_vec.begin(), h_vec.end(), d_vec.begin());
|
|
// dynamic extent
|
|
{
|
|
Span<float> span (d_vec.data().get(), d_vec.size());
|
|
test_from_other_kernel<<<1, 16>>>(span);
|
|
}
|
|
{
|
|
Span<float> span (d_vec.data().get(), d_vec.size());
|
|
test_from_other_kernel_const<<<1, 16>>>(span);
|
|
}
|
|
// static extent
|
|
{
|
|
Span<float, 16> span(d_vec.data().get(), d_vec.data().get() + 16);
|
|
test_from_other_kernel<<<1, 16>>>(span);
|
|
}
|
|
{
|
|
Span<float, 16> span(d_vec.data().get(), d_vec.data().get() + 16);
|
|
test_from_other_kernel_const<<<1, 16>>>(span);
|
|
}
|
|
}
|
|
|
|
TEST(GPUSpan, Assignment) {
|
|
dh::safe_cuda(cudaSetDevice(0));
|
|
TestStatus status;
|
|
dh::LaunchN(0, 16, TestAssignment{status.data()});
|
|
ASSERT_EQ(status.get(), 1);
|
|
}
|
|
|
|
TEST(GPUSpan, TestStatus) {
|
|
dh::safe_cuda(cudaSetDevice(0));
|
|
TestStatus status;
|
|
dh::LaunchN(0, 16, TestTestStatus{status.data()});
|
|
ASSERT_EQ(status.get(), -1);
|
|
}
|
|
|
|
template <typename T>
|
|
struct TestEqual {
|
|
T *lhs_, *rhs_;
|
|
int *status_;
|
|
|
|
TestEqual(T* _lhs, T* _rhs, int * _status) :
|
|
lhs_(_lhs), rhs_(_rhs), status_(_status) {}
|
|
|
|
XGBOOST_DEVICE void operator()(size_t _idx) {
|
|
bool res = lhs_[_idx] == rhs_[_idx];
|
|
SPAN_ASSERT_TRUE(res, status_);
|
|
}
|
|
};
|
|
|
|
TEST(GPUSpan, WithTrust) {
|
|
dh::safe_cuda(cudaSetDevice(0));
|
|
// Not adviced to initialize span with host_vector, since h_vec.data() is
|
|
// a host function.
|
|
thrust::host_vector<float> h_vec (16);
|
|
InitializeRange(h_vec.begin(), h_vec.end());
|
|
|
|
thrust::device_vector<float> d_vec (h_vec.size());
|
|
thrust::copy(h_vec.begin(), h_vec.end(), d_vec.begin());
|
|
|
|
// Can't initialize span with device_vector, since d_vec.data() is not raw
|
|
// pointer
|
|
{
|
|
Span<float> s (d_vec.data().get(), d_vec.size());
|
|
|
|
ASSERT_EQ(d_vec.size(), s.size());
|
|
ASSERT_EQ(d_vec.data().get(), s.data());
|
|
}
|
|
|
|
{
|
|
TestStatus status;
|
|
thrust::device_vector<float> d_vec1 (d_vec.size());
|
|
thrust::copy(thrust::device, d_vec.begin(), d_vec.end(), d_vec1.begin());
|
|
Span<float> s (d_vec1.data().get(), d_vec.size());
|
|
|
|
dh::LaunchN(0, 16, TestEqual<float>{
|
|
thrust::raw_pointer_cast(d_vec1.data()),
|
|
s.data(), status.data()});
|
|
ASSERT_EQ(status.get(), 1);
|
|
|
|
// FIXME: memory error!
|
|
// bool res = thrust::equal(thrust::device,
|
|
// d_vec.begin(), d_vec.end(),
|
|
// s.begin());
|
|
}
|
|
}
|
|
|
|
TEST(GPUSpan, BeginEnd) {
|
|
dh::safe_cuda(cudaSetDevice(0));
|
|
TestStatus status;
|
|
dh::LaunchN(0, 16, TestBeginEnd{status.data()});
|
|
ASSERT_EQ(status.get(), 1);
|
|
}
|
|
|
|
TEST(GPUSpan, RBeginREnd) {
|
|
dh::safe_cuda(cudaSetDevice(0));
|
|
TestStatus status;
|
|
dh::LaunchN(0, 16, TestRBeginREnd{status.data()});
|
|
ASSERT_EQ(status.get(), 1);
|
|
}
|
|
|
|
__global__ void test_modify_kernel(Span<float> span) {
|
|
size_t idx = threadIdx.x + blockIdx.x * blockDim.x;
|
|
|
|
if (idx >= span.size())
|
|
return;
|
|
|
|
span[idx] = span.size() - idx;
|
|
}
|
|
|
|
TEST(GPUSpan, Modify) {
|
|
thrust::host_vector<float> h_vec (16);
|
|
InitializeRange(h_vec.begin(), h_vec.end());
|
|
|
|
thrust::device_vector<float> d_vec (h_vec.size());
|
|
thrust::copy(h_vec.begin(), h_vec.end(), d_vec.begin());
|
|
|
|
Span<float> span (d_vec.data().get(), d_vec.size());
|
|
|
|
test_modify_kernel<<<1, 16>>>(span);
|
|
|
|
for (size_t i = 0; i < d_vec.size(); ++i) {
|
|
ASSERT_EQ(d_vec[i], d_vec.size() - i);
|
|
}
|
|
}
|
|
|
|
TEST(GPUSpan, Observers) {
|
|
dh::safe_cuda(cudaSetDevice(0));
|
|
TestStatus status;
|
|
dh::LaunchN(0, 16, TestObservers{status.data()});
|
|
ASSERT_EQ(status.get(), 1);
|
|
}
|
|
|
|
TEST(GPUSpan, Compare) {
|
|
dh::safe_cuda(cudaSetDevice(0));
|
|
TestStatus status;
|
|
dh::LaunchN(0, 16, TestIterCompare{status.data()});
|
|
ASSERT_EQ(status.get(), 1);
|
|
}
|
|
|
|
struct TestElementAccess {
|
|
Span<float> span_;
|
|
|
|
XGBOOST_DEVICE TestElementAccess (Span<float> _span) : span_(_span) {}
|
|
|
|
XGBOOST_DEVICE float operator()(size_t _idx) {
|
|
float tmp = span_[_idx];
|
|
return tmp;
|
|
}
|
|
};
|
|
|
|
TEST(GPUSpan, ElementAccess) {
|
|
dh::safe_cuda(cudaSetDevice(0));
|
|
EXPECT_DEATH({
|
|
thrust::host_vector<float> h_vec (16);
|
|
InitializeRange(h_vec.begin(), h_vec.end());
|
|
|
|
thrust::device_vector<float> d_vec (h_vec.size());
|
|
thrust::copy(h_vec.begin(), h_vec.end(), d_vec.begin());
|
|
|
|
Span<float> span (d_vec.data().get(), d_vec.size());
|
|
dh::LaunchN(0, 17, TestElementAccess{span});}, "");
|
|
}
|
|
|
|
__global__ void test_first_dynamic_kernel(Span<float> _span) {
|
|
_span.first<-1>();
|
|
}
|
|
__global__ void test_first_static_kernel(Span<float> _span) {
|
|
_span.first(-1);
|
|
}
|
|
__global__ void test_last_dynamic_kernel(Span<float> _span) {
|
|
_span.last<-1>();
|
|
}
|
|
__global__ void test_last_static_kernel(Span<float> _span) {
|
|
_span.last(-1);
|
|
}
|
|
|
|
TEST(GPUSpan, FirstLast) {
|
|
// We construct vectors multiple times since thrust can not recover from
|
|
// death test.
|
|
auto lambda_first_dy = []() {
|
|
thrust::host_vector<float> h_vec (4);
|
|
InitializeRange(h_vec.begin(), h_vec.end());
|
|
|
|
thrust::device_vector<float> d_vec (h_vec.size());
|
|
thrust::copy(h_vec.begin(), h_vec.end(), d_vec.begin());
|
|
|
|
Span<float> span (d_vec.data().get(), d_vec.size());
|
|
test_first_dynamic_kernel<<<1, 1>>>(span);
|
|
};
|
|
EXPECT_DEATH(lambda_first_dy(), "");
|
|
|
|
auto lambda_first_static = []() {
|
|
thrust::host_vector<float> h_vec (4);
|
|
InitializeRange(h_vec.begin(), h_vec.end());
|
|
|
|
thrust::device_vector<float> d_vec (h_vec.size());
|
|
thrust::copy(h_vec.begin(), h_vec.end(), d_vec.begin());
|
|
|
|
Span<float> span (d_vec.data().get(), d_vec.size());
|
|
test_first_static_kernel<<<1, 1>>>(span);
|
|
};
|
|
EXPECT_DEATH(lambda_first_static(), "");
|
|
|
|
auto lambda_last_dy = []() {
|
|
thrust::host_vector<float> h_vec (4);
|
|
InitializeRange(h_vec.begin(), h_vec.end());
|
|
|
|
thrust::device_vector<float> d_vec (h_vec.size());
|
|
thrust::copy(h_vec.begin(), h_vec.end(), d_vec.begin());
|
|
|
|
Span<float> span (d_vec.data().get(), d_vec.size());
|
|
test_last_dynamic_kernel<<<1, 1>>>(span);
|
|
};
|
|
EXPECT_DEATH(lambda_last_dy(), "");
|
|
|
|
auto lambda_last_static = []() {
|
|
thrust::host_vector<float> h_vec (4);
|
|
InitializeRange(h_vec.begin(), h_vec.end());
|
|
|
|
thrust::device_vector<float> d_vec (h_vec.size());
|
|
thrust::copy(h_vec.begin(), h_vec.end(), d_vec.begin());
|
|
|
|
Span<float> span (d_vec.data().get(), d_vec.size());
|
|
test_last_static_kernel<<<1, 1>>>(span);
|
|
};
|
|
EXPECT_DEATH(lambda_last_static(), "");
|
|
}
|
|
|
|
|
|
__global__ void test_subspan_dynamic_kernel(Span<float> _span) {
|
|
_span.subspan(16, 0);
|
|
}
|
|
__global__ void test_subspan_static_kernel(Span<float> _span) {
|
|
_span.subspan<16>();
|
|
}
|
|
TEST(GPUSpan, Subspan) {
|
|
auto lambda_subspan_dynamic = []() {
|
|
thrust::host_vector<float> h_vec (4);
|
|
InitializeRange(h_vec.begin(), h_vec.end());
|
|
|
|
thrust::device_vector<float> d_vec (h_vec.size());
|
|
thrust::copy(h_vec.begin(), h_vec.end(), d_vec.begin());
|
|
|
|
Span<float> span (d_vec.data().get(), d_vec.size());
|
|
test_subspan_dynamic_kernel<<<1, 1>>>(span);
|
|
};
|
|
EXPECT_DEATH(lambda_subspan_dynamic(), "");
|
|
|
|
auto lambda_subspan_static = []() {
|
|
thrust::host_vector<float> h_vec (4);
|
|
InitializeRange(h_vec.begin(), h_vec.end());
|
|
|
|
thrust::device_vector<float> d_vec (h_vec.size());
|
|
thrust::copy(h_vec.begin(), h_vec.end(), d_vec.begin());
|
|
|
|
Span<float> span (d_vec.data().get(), d_vec.size());
|
|
test_subspan_static_kernel<<<1, 1>>>(span);
|
|
};
|
|
EXPECT_DEATH(lambda_subspan_static(), "");
|
|
}
|
|
|
|
TEST(GPUSpanIter, Construct) {
|
|
dh::safe_cuda(cudaSetDevice(0));
|
|
TestStatus status;
|
|
dh::LaunchN(0, 16, TestIterConstruct{status.data()});
|
|
ASSERT_EQ(status.get(), 1);
|
|
}
|
|
|
|
TEST(GPUSpanIter, Ref) {
|
|
dh::safe_cuda(cudaSetDevice(0));
|
|
TestStatus status;
|
|
dh::LaunchN(0, 16, TestIterRef{status.data()});
|
|
ASSERT_EQ(status.get(), 1);
|
|
}
|
|
|
|
TEST(GPUSpanIter, Calculate) {
|
|
dh::safe_cuda(cudaSetDevice(0));
|
|
TestStatus status;
|
|
dh::LaunchN(0, 16, TestIterCalculate{status.data()});
|
|
ASSERT_EQ(status.get(), 1);
|
|
}
|
|
|
|
TEST(GPUSpanIter, Compare) {
|
|
dh::safe_cuda(cudaSetDevice(0));
|
|
TestStatus status;
|
|
dh::LaunchN(0, 16, TestIterCompare{status.data()});
|
|
ASSERT_EQ(status.get(), 1);
|
|
}
|
|
|
|
TEST(GPUSpan, AsBytes) {
|
|
dh::safe_cuda(cudaSetDevice(0));
|
|
TestStatus status;
|
|
dh::LaunchN(0, 16, TestAsBytes{status.data()});
|
|
ASSERT_EQ(status.get(), 1);
|
|
}
|
|
|
|
TEST(GPUSpan, AsWritableBytes) {
|
|
dh::safe_cuda(cudaSetDevice(0));
|
|
TestStatus status;
|
|
dh::LaunchN(0, 16, TestAsWritableBytes{status.data()});
|
|
ASSERT_EQ(status.get(), 1);
|
|
}
|
|
|
|
} // namespace common
|
|
} // namespace xgboost
|