// Copyright (c) 2019 by Contributors #include #include #include #include #include "../../../src/data/adapter.h" #include "../../../src/data/simple_dmatrix.h" #include "../../../src/common/timer.h" #include "../helpers.h" using namespace xgboost; // NOLINT TEST(c_api, CSRAdapter) { int m = 3; int n = 2; std::vector data = {1, 2, 3, 4, 5}; std::vector feature_idx = {0, 1, 0, 1, 1}; std::vector row_ptr = {0, 2, 4, 5}; data::CSRAdapter adapter(row_ptr.data(), feature_idx.data(), data.data(), row_ptr.size() - 1, data.size(), n); adapter.Next(); auto & batch = adapter.Value(); auto line0 = batch.GetLine(0); EXPECT_EQ(line0.GetElement(0).value, 1); EXPECT_EQ(line0.GetElement(1).value, 2); auto line1 = batch.GetLine(1); EXPECT_EQ(line1 .GetElement(0).value, 3); EXPECT_EQ(line1 .GetElement(1).value, 4); auto line2 = batch.GetLine(2); EXPECT_EQ(line2 .GetElement(0).value, 5); EXPECT_EQ(line2 .GetElement(0).row_idx, 2); EXPECT_EQ(line2 .GetElement(0).column_idx, 1); data::SimpleDMatrix dmat(&adapter, -1, std::nan("")); EXPECT_EQ(dmat.Info().num_col_, 2); EXPECT_EQ(dmat.Info().num_row_, 3); EXPECT_EQ(dmat.Info().num_nonzero_, 5); for (auto &batch : dmat.GetBatches()) { for (auto i = 0ull; i < batch.Size(); i++) { auto inst = batch[i]; for(auto j = 0ull; j < inst.size(); j++) { EXPECT_EQ(inst[j].fvalue, data[row_ptr[i] + j]); EXPECT_EQ(inst[j].index, feature_idx[row_ptr[i] + j]); } } } } TEST(c_api, DenseAdapter) { int m = 3; int n = 2; std::vector data = {1, 2, 3, 4, 5, 6}; data::DenseAdapter adapter(data.data(), m, m*n, n); data::SimpleDMatrix dmat(&adapter,-1,std::numeric_limits::quiet_NaN()); EXPECT_EQ(dmat.Info().num_col_, 2); EXPECT_EQ(dmat.Info().num_row_, 3); EXPECT_EQ(dmat.Info().num_nonzero_, 6); for (auto &batch : dmat.GetBatches()) { for (auto i = 0ull; i < batch.Size(); i++) { auto inst = batch[i]; for(auto j = 0ull; j < inst.size(); j++) { EXPECT_EQ(inst[j].fvalue, data[i*n+j]); EXPECT_EQ(inst[j].index, j); } } } } TEST(c_api, CSCAdapter) { std::vector data = {1, 3, 2, 4, 5}; std::vector row_idx = {0, 1, 0, 1, 2}; std::vector col_ptr = {0, 2, 5}; data::CSCAdapter adapter(col_ptr.data(), row_idx.data(), data.data(), 2, 3); data::SimpleDMatrix dmat(&adapter,-1,std::numeric_limits::quiet_NaN()); EXPECT_EQ(dmat.Info().num_col_, 2); EXPECT_EQ(dmat.Info().num_row_, 3); EXPECT_EQ(dmat.Info().num_nonzero_, 5); auto &batch = *dmat.GetBatches().begin(); auto inst = batch[0]; EXPECT_EQ(inst[0].fvalue, 1); EXPECT_EQ(inst[0].index, 0); EXPECT_EQ(inst[1].fvalue, 2); EXPECT_EQ(inst[1].index, 1); inst = batch[1]; EXPECT_EQ(inst[0].fvalue, 3); EXPECT_EQ(inst[0].index, 0); EXPECT_EQ(inst[1].fvalue, 4); EXPECT_EQ(inst[1].index, 1); inst = batch[2]; EXPECT_EQ(inst[0].fvalue, 5); EXPECT_EQ(inst[0].index, 1); } TEST(c_api, FileAdapter) { std::string filename = "test.libsvm"; CreateBigTestData(filename, 10); std::unique_ptr> parser(dmlc::Parser::Create(filename.c_str(), 0, 1,"auto")); data::FileAdapter adapter(parser.get()); }