/*! * Copyright 2017 XGBoost contributors */ #include #include #include "../../../src/common/device_helpers.cuh" #include "../../../src/common/timer.h" #include "gtest/gtest.h" void CreateTestData(xgboost::bst_uint num_rows, int max_row_size, thrust::host_vector *row_ptr, thrust::host_vector *rows) { row_ptr->resize(num_rows + 1); int sum = 0; for (xgboost::bst_uint i = 0; i <= num_rows; i++) { (*row_ptr)[i] = sum; sum += rand() % max_row_size; // NOLINT if (i < num_rows) { for (int j = (*row_ptr)[i]; j < sum; j++) { (*rows).push_back(i); } } } } void SpeedTest() { int num_rows = 1000000; int max_row_size = 100; dh::CubMemory temp_memory; thrust::host_vector h_row_ptr; thrust::host_vector h_rows; CreateTestData(num_rows, max_row_size, &h_row_ptr, &h_rows); thrust::device_vector row_ptr = h_row_ptr; thrust::device_vector output_row(h_rows.size()); auto d_output_row = output_row.data(); xgboost::common::Timer t; dh::TransformLbs( 0, &temp_memory, h_rows.size(), dh::raw(row_ptr), row_ptr.size() - 1, false, [=] __device__(size_t idx, size_t ridx) { d_output_row[idx] = ridx; }); dh::safe_cuda(cudaDeviceSynchronize()); double time = t.ElapsedSeconds(); const int mb_size = 1048576; size_t size = (sizeof(int) * h_rows.size()) / mb_size; printf("size: %llumb, time: %fs, bandwidth: %fmb/s\n", size, time, size / time); } void TestLbs() { srand(17); dh::CubMemory temp_memory; std::vector test_rows = {4, 100, 1000}; std::vector test_max_row_sizes = {4, 100, 1300}; for (auto num_rows : test_rows) { for (auto max_row_size : test_max_row_sizes) { thrust::host_vector h_row_ptr; thrust::host_vector h_rows; CreateTestData(num_rows, max_row_size, &h_row_ptr, &h_rows); thrust::device_vector row_ptr = h_row_ptr; thrust::device_vector output_row(h_rows.size()); auto d_output_row = output_row.data(); dh::TransformLbs(0, &temp_memory, h_rows.size(), dh::raw(row_ptr), row_ptr.size() - 1, false, [=] __device__(size_t idx, size_t ridx) { d_output_row[idx] = ridx; }); dh::safe_cuda(cudaDeviceSynchronize()); ASSERT_TRUE(h_rows == output_row); } } } TEST(cub_lbs, Test) { TestLbs(); } TEST(sumReduce, Test) { thrust::device_vector data(100, 1.0f); dh::CubMemory temp; auto sum = dh::sumReduction(temp, dh::raw(data), data.size()); ASSERT_NEAR(sum, 100.0f, 1e-5); }