Span class. (#3548)
* Add basic Span class based on ISO++20. * Use Span<Entry const> instead of Inst in SparsePage. * Add DeviceSpan in HostDeviceVector, use it in regression obj.
This commit is contained in:
committed by
Rory Mitchell
parent
2b7a1c5780
commit
2c502784ff
@@ -48,9 +48,9 @@ void HistCutMatrix::Init(DMatrix* p_fmat, uint32_t max_num_bins) {
|
||||
for (size_t i = 0; i < batch.Size(); ++i) { // NOLINT(*)
|
||||
size_t ridx = batch.base_rowid + i;
|
||||
SparsePage::Inst inst = batch[i];
|
||||
for (bst_uint j = 0; j < inst.length; ++j) {
|
||||
if (inst[j].index >= begin && inst[j].index < end) {
|
||||
sketchs[inst[j].index].Push(inst[j].fvalue, info.GetWeight(ridx));
|
||||
for (auto& ins : inst) {
|
||||
if (ins.index >= begin && ins.index < end) {
|
||||
sketchs[ins.index].Push(ins.fvalue, info.GetWeight(ridx));
|
||||
}
|
||||
}
|
||||
}
|
||||
@@ -140,7 +140,7 @@ void GHistIndexMatrix::Init(DMatrix* p_fmat, int max_num_bins) {
|
||||
auto &batch = iter->Value();
|
||||
const size_t rbegin = row_ptr.size() - 1;
|
||||
for (size_t i = 0; i < batch.Size(); ++i) {
|
||||
row_ptr.push_back(batch[i].length + row_ptr.back());
|
||||
row_ptr.push_back(batch[i].size() + row_ptr.back());
|
||||
}
|
||||
index.resize(row_ptr.back());
|
||||
|
||||
@@ -154,9 +154,11 @@ void GHistIndexMatrix::Init(DMatrix* p_fmat, int max_num_bins) {
|
||||
size_t ibegin = row_ptr[rbegin + i];
|
||||
size_t iend = row_ptr[rbegin + i + 1];
|
||||
SparsePage::Inst inst = batch[i];
|
||||
CHECK_EQ(ibegin + inst.length, iend);
|
||||
for (bst_uint j = 0; j < inst.length; ++j) {
|
||||
|
||||
CHECK_EQ(ibegin + inst.size(), iend);
|
||||
for (bst_uint j = 0; j < inst.size(); ++j) {
|
||||
uint32_t idx = cut.GetBinIdx(inst[j]);
|
||||
|
||||
index[ibegin + j] = idx;
|
||||
++hit_count_tloc_[tid * nbins + idx];
|
||||
}
|
||||
|
||||
@@ -53,6 +53,11 @@ GPUSet HostDeviceVector<T>::Devices() const { return GPUSet::Empty(); }
|
||||
template <typename T>
|
||||
T* HostDeviceVector<T>::DevicePointer(int device) { return nullptr; }
|
||||
|
||||
template <typename T>
|
||||
common::Span<T> HostDeviceVector<T>::DeviceSpan(int device) {
|
||||
return common::Span<T>();
|
||||
}
|
||||
|
||||
template <typename T>
|
||||
std::vector<T>& HostDeviceVector<T>::HostVector() { return impl_->data_h_; }
|
||||
|
||||
|
||||
@@ -156,6 +156,13 @@ struct HostDeviceVectorImpl {
|
||||
return shards_[devices_.Index(device)].data_.data().get();
|
||||
}
|
||||
|
||||
// Returns a Span over the buffer held by the shard that belongs to `device`.
//
// The device must be part of `devices_` (enforced with CHECK); the shard is
// synchronised via LazySyncDevice() before its buffer is exposed.
//
// The length of the span is taken from the shard's own buffer rather than
// from Size(): the pointer addresses only this shard's storage, so the extent
// must describe the same storage.
// NOTE(review): assumes each shard's `data_` holds just that device's slice
// of the vector -- confirm against the shard initialisation code.
common::Span<T> DeviceSpan(int device) {
  CHECK(devices_.Contains(device));
  LazySyncDevice(device);
  auto& shard_data = shards_[devices_.Index(device)].data_;
  return { shard_data.data().get(),
           static_cast<typename common::Span<T>::index_type>(shard_data.size()) };
}
|
||||
|
||||
size_t DeviceSize(int device) {
|
||||
CHECK(devices_.Contains(device));
|
||||
LazySyncDevice(device);
|
||||
@@ -323,6 +330,11 @@ GPUSet HostDeviceVector<T>::Devices() const { return impl_->Devices(); }
|
||||
template <typename T>
|
||||
T* HostDeviceVector<T>::DevicePointer(int device) { return impl_->DevicePointer(device); }
|
||||
|
||||
template <typename T>
|
||||
common::Span<T> HostDeviceVector<T>::DeviceSpan(int device) {
|
||||
return impl_->DeviceSpan(device);
|
||||
}
|
||||
|
||||
template <typename T>
|
||||
size_t HostDeviceVector<T>::DeviceStart(int device) { return impl_->DeviceStart(device); }
|
||||
|
||||
|
||||
@@ -11,6 +11,8 @@
|
||||
#include <initializer_list>
|
||||
#include <vector>
|
||||
|
||||
#include "span.h"
|
||||
|
||||
// only include thrust-related files if host_device_vector.h
|
||||
// is included from a .cu file
|
||||
#ifdef __CUDACC__
|
||||
@@ -117,6 +119,7 @@ class HostDeviceVector {
|
||||
size_t Size() const;
|
||||
GPUSet Devices() const;
|
||||
T* DevicePointer(int device);
|
||||
common::Span<T> DeviceSpan(int device);
|
||||
|
||||
T* HostPointer() { return HostVector().data(); }
|
||||
size_t DeviceStart(int device);
|
||||
|
||||
633
src/common/span.h
Normal file
633
src/common/span.h
Normal file
@@ -0,0 +1,633 @@
|
||||
/*!
|
||||
* Copyright 2018 XGBoost contributors
|
||||
* \brief span class based on ISO++20 span
|
||||
*
|
||||
* About NOLINTs in this file:
|
||||
*
|
||||
* If we want Span to work with std interface, like range for loop, the
|
||||
* naming must be consistent with std, not XGBoost. The interface also
|
||||
* conflicts with XGBoost coding style, specifically, the use of `explicit'
|
||||
* keyword.
|
||||
*
|
||||
*
|
||||
* Some of the code is copied from Guidelines Support Library, here is the
|
||||
* license:
|
||||
*
|
||||
* Copyright (c) 2015 Microsoft Corporation. All rights reserved.
|
||||
*
|
||||
* This code is licensed under the MIT License (MIT).
|
||||
*
|
||||
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
||||
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
||||
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
||||
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
||||
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
||||
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
|
||||
* THE SOFTWARE.
|
||||
*/
|
||||
|
||||
#ifndef XGBOOST_COMMON_SPAN_H_
|
||||
#define XGBOOST_COMMON_SPAN_H_
|
||||
|
||||
#include <xgboost/logging.h> // CHECK
|
||||
|
||||
#include <cinttypes> // int64_t
|
||||
#include <type_traits> // remove_cv_t
|
||||
|
||||
/*!
|
||||
* The version number 1910 is picked up from GSL.
|
||||
*
|
||||
* We might want to use MOODYCAMEL_NOEXCEPT from dmlc/concurrentqueue.h. But
|
||||
* there are a lot more definitions in that file would cause warnings/troubles
|
||||
* in MSVC 2013. Currently we try to keep the closure of Span as minimal as
|
||||
* possible.
|
||||
*
|
||||
* There are other workarounds for MSVC, like _Unwrapped, _Verify_range ...
|
||||
* Some of these are hidden MSVC magic and I tried to avoid them. Should any
|
||||
* of them become needed, please consult the source code of GSL, and possibly
|
||||
* some explanations from this thread:
|
||||
*
|
||||
* https://github.com/Microsoft/GSL/pull/664
|
||||
*
|
||||
* FIXME: Group these MSVC workarounds into a manageable place.
|
||||
*/
|
||||
#if defined(_MSC_VER) && _MSC_VER < 1910
|
||||
|
||||
#define __span_noexcept
|
||||
|
||||
#pragma push_macro("constexpr")
|
||||
#define constexpr /*constexpr*/
|
||||
|
||||
#else
|
||||
|
||||
#define __span_noexcept noexcept
|
||||
|
||||
#endif
|
||||
|
||||
namespace xgboost {
|
||||
namespace common {
|
||||
|
||||
// Usual logging facility is not available inside device code.
|
||||
// FIXME: Make dmlc check more generic.
|
||||
/*!
 * \brief Assertion for code where the usual logging macros are unavailable.
 *
 * When `cond` evaluates to false, prints the file, line, enclosing function
 * and the text of the failed expression with printf, then executes the
 * `trap` instruction.
 *
 * The body is wrapped in `do { ... } while (0)` WITHOUT a trailing semicolon
 * or line continuation, so that `KERNEL_CHECK(x);` expands to exactly one
 * statement and can be used as the unbraced branch of an if/else.
 */
#define KERNEL_CHECK(cond)                                      \
  do {                                                          \
    if (!(cond)) {                                              \
      printf("\nKernel error:\n"                                \
             "In: %s, \tline: %d\n"                             \
             "\t%s\n\tExpecting: %s\n",                         \
             __FILE__, __LINE__, __PRETTY_FUNCTION__, # cond);  \
      asm("trap;");                                             \
    }                                                           \
  } while (0)
|
||||
|
||||
#ifdef __CUDA_ARCH__
|
||||
#define SPAN_CHECK KERNEL_CHECK
|
||||
#else
|
||||
#define SPAN_CHECK CHECK // check from dmlc
|
||||
#endif
|
||||
|
||||
namespace detail {
|
||||
/*!
|
||||
* By default, XGBoost uses uint32_t for indexing data. int64_t covers all
|
||||
* values uint32_t can represent. Also, On x86-64 Linux, GCC uses long int to
|
||||
* represent ptrdiff_t, which is just int64_t. So we make it deterministic
|
||||
* here.
|
||||
*/
|
||||
using ptrdiff_t = int64_t; // NOLINT
|
||||
} // namespace detail
|
||||
|
||||
#if defined(_MSC_VER) && _MSC_VER < 1910
|
||||
constexpr const detail::ptrdiff_t dynamic_extent = -1; // NOLINT
|
||||
#else
|
||||
constexpr detail::ptrdiff_t dynamic_extent = -1; // NOLINT
|
||||
#endif
|
||||
|
||||
enum class byte : unsigned char {}; // NOLINT
|
||||
|
||||
namespace detail {
|
||||
|
||||
template <class ElementType, detail::ptrdiff_t Extent = dynamic_extent>
|
||||
class Span;
|
||||
|
||||
template <typename SpanType, bool IsConst>
|
||||
class SpanIterator {
|
||||
using ElementType = typename SpanType::element_type;
|
||||
|
||||
public:
|
||||
using iterator_category = std::random_access_iterator_tag; // NOLINT
|
||||
using value_type = typename std::remove_cv<ElementType>::type; // NOLINT
|
||||
using difference_type = typename SpanType::index_type; // NOLINT
|
||||
|
||||
using reference = typename std::conditional< // NOLINT
|
||||
IsConst, const ElementType, ElementType>::type&;
|
||||
using pointer = typename std::add_pointer<reference>::type&; // NOLINT
|
||||
|
||||
XGBOOST_DEVICE constexpr SpanIterator() : span_{nullptr}, index_{0} {}
|
||||
|
||||
XGBOOST_DEVICE constexpr SpanIterator(
|
||||
const SpanType* _span,
|
||||
typename SpanType::index_type _idx) __span_noexcept :
|
||||
span_(_span), index_(_idx) {}
|
||||
|
||||
friend SpanIterator<SpanType, true>;
|
||||
template <bool B, typename std::enable_if<!B && IsConst>::type* = nullptr>
|
||||
XGBOOST_DEVICE constexpr SpanIterator( // NOLINT
|
||||
const SpanIterator<SpanType, B>& other_) __span_noexcept
|
||||
: SpanIterator(other_.span_, other_.index_) {}
|
||||
|
||||
XGBOOST_DEVICE reference operator*() const {
|
||||
SPAN_CHECK(index_ < span_->size());
|
||||
return *(span_->data() + index_);
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE pointer operator->() const {
|
||||
SPAN_CHECK(index_ != span_->size());
|
||||
return span_->data() + index_;
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE SpanIterator& operator++() {
|
||||
SPAN_CHECK(0 <= index_ && index_ != span_->size());
|
||||
index_++;
|
||||
return *this;
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE SpanIterator operator++(int) {
|
||||
auto ret = *this;
|
||||
++(*this);
|
||||
return ret;
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE SpanIterator& operator--() {
|
||||
SPAN_CHECK(index_ != 0 && index_ <= span_->size());
|
||||
index_--;
|
||||
return *this;
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE SpanIterator operator--(int) {
|
||||
auto ret = *this;
|
||||
--(*this);
|
||||
return ret;
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE SpanIterator operator+(difference_type n) const {
|
||||
auto ret = *this;
|
||||
return ret += n;
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE SpanIterator& operator+=(difference_type n) {
|
||||
SPAN_CHECK((index_ + n) >= 0 && (index_ + n) <= span_->size());
|
||||
index_ += n;
|
||||
return *this;
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE difference_type operator-(SpanIterator rhs) const {
|
||||
SPAN_CHECK(span_ == rhs.span_);
|
||||
return index_ - rhs.index_;
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE SpanIterator operator-(difference_type n) const {
|
||||
auto ret = *this;
|
||||
return ret -= n;
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE SpanIterator& operator-=(difference_type n) {
|
||||
return *this += -n;
|
||||
}
|
||||
|
||||
// friends
|
||||
XGBOOST_DEVICE constexpr friend bool operator==(
|
||||
SpanIterator _lhs, SpanIterator _rhs) __span_noexcept {
|
||||
return _lhs.span_ == _rhs.span_ && _lhs.index_ == _rhs.index_;
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE constexpr friend bool operator!=(
|
||||
SpanIterator _lhs, SpanIterator _rhs) __span_noexcept {
|
||||
return !(_lhs == _rhs);
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE constexpr friend bool operator<(
|
||||
SpanIterator _lhs, SpanIterator _rhs) __span_noexcept {
|
||||
return _lhs.index_ < _rhs.index_;
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE constexpr friend bool operator<=(
|
||||
SpanIterator _lhs, SpanIterator _rhs) __span_noexcept {
|
||||
return !(_rhs < _lhs);
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE constexpr friend bool operator>(
|
||||
SpanIterator _lhs, SpanIterator _rhs) __span_noexcept {
|
||||
return _rhs < _lhs;
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE constexpr friend bool operator>=(
|
||||
SpanIterator _lhs, SpanIterator _rhs) __span_noexcept {
|
||||
return !(_rhs > _lhs);
|
||||
}
|
||||
|
||||
protected:
|
||||
const SpanType *span_;
|
||||
detail::ptrdiff_t index_;
|
||||
};
|
||||
|
||||
|
||||
// It's tempting to use constexpr instead of structs to do the following meta
|
||||
// programming. But remember that we are supporting MSVC 2013 here.
|
||||
|
||||
/*!
|
||||
* The extent E of the span returned by subspan is determined as follows:
|
||||
*
|
||||
* - If Count is not std::dynamic_extent, Count;
|
||||
* - Otherwise, if Extent is not std::dynamic_extent, Extent - Offset;
|
||||
* - Otherwise, std::dynamic_extent.
|
||||
*/
|
||||
template <detail::ptrdiff_t Extent,
|
||||
detail::ptrdiff_t Offset,
|
||||
detail::ptrdiff_t Count>
|
||||
struct ExtentValue : public std::integral_constant<
|
||||
detail::ptrdiff_t, Count != dynamic_extent ?
|
||||
Count : (Extent != dynamic_extent ? Extent - Offset : Extent)> {};
|
||||
|
||||
/*!
|
||||
* If N is dynamic_extent, the extent of the returned span E is also
|
||||
* dynamic_extent; otherwise it is detail::ptrdiff_t(sizeof(T)) * N.
|
||||
*/
|
||||
template <typename T, detail::ptrdiff_t Extent>
|
||||
struct ExtentAsBytesValue : public std::integral_constant<
|
||||
detail::ptrdiff_t,
|
||||
Extent == dynamic_extent ?
|
||||
Extent : static_cast<detail::ptrdiff_t>(sizeof(T) * Extent)> {};
|
||||
|
||||
template <detail::ptrdiff_t From, detail::ptrdiff_t To>
|
||||
struct IsAllowedExtentConversion : public std::integral_constant<
|
||||
bool, From == To || From == dynamic_extent || To == dynamic_extent> {};
|
||||
|
||||
template <class From, class To>
|
||||
struct IsAllowedElementTypeConversion : public std::integral_constant<
|
||||
bool, std::is_convertible<From(*)[], To(*)[]>::value> {};
|
||||
|
||||
template <class T>
|
||||
struct IsSpanOracle : std::false_type {};
|
||||
|
||||
template <class T, std::ptrdiff_t Extent>
|
||||
struct IsSpanOracle<Span<T, Extent>> : std::true_type {};
|
||||
|
||||
template <class T>
|
||||
struct IsSpan : public IsSpanOracle<typename std::remove_cv<T>::type> {};
|
||||
|
||||
// Re-implement std algorithms here to adopt CUDA.
|
||||
template <typename T>
|
||||
struct Less {
|
||||
XGBOOST_DEVICE constexpr bool operator()(const T& _x, const T& _y) const {
|
||||
return _x < _y;
|
||||
}
|
||||
};
|
||||
|
||||
template <typename T>
|
||||
struct Greater {
|
||||
XGBOOST_DEVICE constexpr bool operator()(const T& _x, const T& _y) const {
|
||||
return _x > _y;
|
||||
}
|
||||
};
|
||||
|
||||
template <class InputIt1, class InputIt2,
|
||||
class Compare =
|
||||
detail::Less<decltype(std::declval<InputIt1>().operator*())>>
|
||||
XGBOOST_DEVICE bool LexicographicalCompare(InputIt1 first1, InputIt1 last1,
|
||||
InputIt2 first2, InputIt2 last2) {
|
||||
Compare comp;
|
||||
for (; first1 != last1 && first2 != last2; ++first1, ++first2) {
|
||||
if (comp(*first1, *first2)) {
|
||||
return true;
|
||||
}
|
||||
if (comp(*first2, *first1)) {
|
||||
return false;
|
||||
}
|
||||
}
|
||||
return first1 == last1 && first2 != last2;
|
||||
}
|
||||
|
||||
} // namespace detail
|
||||
|
||||
|
||||
/*!
|
||||
* \brief span class implementation, based on ISO++20 span<T>. The interface
|
||||
* should be the same.
|
||||
*
|
||||
* What's different from span<T> in Guidelines Support Library (GSL)
|
||||
*
|
||||
* Interface might be slightly different, we stick with ISO.
|
||||
*
|
||||
* GSL uses C++14/17 features, which are not available here.
|
||||
* GSL uses constexpr extensively, which is not possible with the limitations
|
||||
* of C++11.
|
||||
* GSL doesn't concern about CUDA.
|
||||
*
|
||||
* GSL is more thoroughly implemented and tested.
|
||||
* GSL is more optimized, especially for static extent.
|
||||
*
|
||||
* GSL uses __builtin_unreachable() on error, Span<T> uses dmlc LOG and
|
||||
* customized CUDA logging.
|
||||
*
|
||||
*
|
||||
* What's different from span<T> in ISO++20 (ISO)
|
||||
*
|
||||
* ISO uses functions/structs from std library, which might be not available
|
||||
* in CUDA.
|
||||
* Initializing from std::array is not supported.
|
||||
*
|
||||
* ISO uses constexpr extensively, which is not possible with the limitations
|
||||
* of C++11.
|
||||
* ISO uses C++14/17 features, which is not available here.
|
||||
* ISO doesn't concern about CUDA.
|
||||
*
|
||||
* ISO uses std::terminate(), Span<T> uses dmlc LOG and customized CUDA
|
||||
* logging.
|
||||
*
|
||||
*
|
||||
* Limitations:
|
||||
* With thrust:
|
||||
* It's not advised to initialize Span with host_vector directly, since
|
||||
* host_vector::data() is a host function.
|
||||
* It's not possible to initialize Span with device_vector directly, since
|
||||
* device_vector::data() returns a wrapped pointer.
|
||||
* It's unclear which thrust algorithms can be used without
|
||||
* memory error. See the test case "GPUSpan.WithTrust"
|
||||
*
|
||||
* Pass iterator to kernel:
|
||||
* Not possible. Use subspan instead.
|
||||
*
|
||||
* The underlying Span in SpanIterator is a pointer, but CUDA pass kernel
|
||||
* parameter by value. If we were to hold a Span value instead of a
|
||||
* pointer, the following snippet will crash, violating the safety
|
||||
* purpose of Span:
|
||||
*
|
||||
* \code{.cpp}
|
||||
* Span<float> span {arr_a};
|
||||
* auto beg = span.begin();
|
||||
*
|
||||
* Span<float> span_b = arr_b;
|
||||
* span = span_b;
|
||||
*
|
||||
* delete arr_a;
|
||||
* beg++; // crash
|
||||
* \endcode
|
||||
*
|
||||
* While holding a pointer or reference should avoid the problem, it's a
|
||||
* compromise. Since we have subspan, it's acceptable not to support
|
||||
* passing iterator.
|
||||
*/
|
||||
template <typename T,
|
||||
detail::ptrdiff_t Extent = dynamic_extent>
|
||||
class Span {
|
||||
public:
|
||||
using element_type = T; // NOLINT
|
||||
using value_type = typename std::remove_cv<T>::type; // NOLINT
|
||||
using index_type = detail::ptrdiff_t; // NOLINT
|
||||
using difference_type = detail::ptrdiff_t; // NOLINT
|
||||
using pointer = T*; // NOLINT
|
||||
using reference = T&; // NOLINT
|
||||
|
||||
using iterator = detail::SpanIterator<Span<T, Extent>, false>; // NOLINT
|
||||
using const_iterator = const detail::SpanIterator<Span<T, Extent>, true>; // NOLINT
|
||||
using reverse_iterator = detail::SpanIterator<Span<T, Extent>, false>; // NOLINT
|
||||
using const_reverse_iterator = const detail::SpanIterator<Span<T, Extent>, true>; // NOLINT
|
||||
|
||||
// constructors
|
||||
|
||||
XGBOOST_DEVICE constexpr Span() __span_noexcept : size_(0), data_(nullptr) {}
|
||||
|
||||
XGBOOST_DEVICE Span(pointer _ptr, index_type _count) :
|
||||
size_(_count), data_(_ptr) {
|
||||
SPAN_CHECK(_count >= 0);
|
||||
SPAN_CHECK(_ptr || _count == 0);
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE Span(pointer _first, pointer _last) :
|
||||
size_(_last - _first), data_(_first) {
|
||||
SPAN_CHECK(size_ >= 0);
|
||||
SPAN_CHECK(data_ || size_ == 0);
|
||||
}
|
||||
|
||||
template <std::size_t N>
|
||||
XGBOOST_DEVICE constexpr Span(element_type (&arr)[N]) // NOLINT
|
||||
__span_noexcept : size_(N), data_(&arr[0]) {}
|
||||
|
||||
template <class Container,
|
||||
class = typename std::enable_if<
|
||||
!std::is_const<element_type>::value && !detail::IsSpan<Container>::value &&
|
||||
std::is_convertible<typename Container::pointer,
|
||||
pointer>::value &&
|
||||
std::is_convertible<
|
||||
typename Container::pointer,
|
||||
decltype(std::declval<Container>().data())>::value>>
|
||||
XGBOOST_DEVICE Span(Container& _cont) : // NOLINT
|
||||
size_(_cont.size()), data_(_cont.data()) {}
|
||||
|
||||
template <class Container,
|
||||
class = typename std::enable_if<
|
||||
std::is_const<element_type>::value && !detail::IsSpan<Container>::value &&
|
||||
std::is_convertible<typename Container::pointer, pointer>::value &&
|
||||
std::is_convertible<
|
||||
typename Container::pointer,
|
||||
decltype(std::declval<Container>().data())>::value>>
|
||||
XGBOOST_DEVICE Span(const Container& _cont) : size_(_cont.size()), // NOLINT
|
||||
data_(_cont.data()) {}
|
||||
|
||||
template <class U, ptrdiff_t OtherExtent,
|
||||
class = typename std::enable_if<
|
||||
detail::IsAllowedElementTypeConversion<U, T>::value &&
|
||||
detail::IsAllowedExtentConversion<OtherExtent, Extent>::value>>
|
||||
XGBOOST_DEVICE constexpr Span(const Span<U, OtherExtent>& _other) // NOLINT
|
||||
__span_noexcept : size_(_other.size()), data_(_other.data()) {}
|
||||
|
||||
XGBOOST_DEVICE constexpr Span(const Span& _other)
|
||||
__span_noexcept : size_(_other.size()), data_(_other.data()) {}
|
||||
|
||||
XGBOOST_DEVICE Span& operator=(const Span& _other) __span_noexcept {
|
||||
size_ = _other.size();
|
||||
data_ = _other.data();
|
||||
return *this;
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE ~Span() __span_noexcept {}; // NOLINT
|
||||
|
||||
XGBOOST_DEVICE constexpr iterator begin() const __span_noexcept { // NOLINT
|
||||
return {this, 0};
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE constexpr iterator end() const __span_noexcept { // NOLINT
|
||||
return {this, size()};
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE constexpr const_iterator cbegin() const __span_noexcept { // NOLINT
|
||||
return {this, 0};
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE constexpr const_iterator cend() const __span_noexcept { // NOLINT
|
||||
return {this, size()};
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE constexpr reverse_iterator rbegin() const __span_noexcept { // NOLINT
|
||||
return reverse_iterator{end()};
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE constexpr reverse_iterator rend() const __span_noexcept { // NOLINT
|
||||
return reverse_iterator{begin()};
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE constexpr const_reverse_iterator crbegin() const __span_noexcept { // NOLINT
|
||||
return const_reverse_iterator{cend()};
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE constexpr const_reverse_iterator crend() const __span_noexcept { // NOLINT
|
||||
return const_reverse_iterator{cbegin()};
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE reference operator[](index_type _idx) const {
|
||||
SPAN_CHECK(_idx >= 0 && _idx < size());
|
||||
return data()[_idx];
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE constexpr reference operator()(index_type _idx) const {
|
||||
return this->operator[](_idx);
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE constexpr pointer data() const __span_noexcept { // NOLINT
|
||||
return data_;
|
||||
}
|
||||
|
||||
// Observers
|
||||
XGBOOST_DEVICE constexpr index_type size() const __span_noexcept { // NOLINT
|
||||
return size_;
|
||||
}
|
||||
XGBOOST_DEVICE constexpr index_type size_bytes() const __span_noexcept { // NOLINT
|
||||
return size() * sizeof(T);
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE constexpr bool empty() const __span_noexcept { // NOLINT
|
||||
return size() == 0;
|
||||
}
|
||||
|
||||
// Subviews
|
||||
template <detail::ptrdiff_t Count >
|
||||
XGBOOST_DEVICE Span<element_type, Count> first() const { // NOLINT
|
||||
SPAN_CHECK(Count >= 0 && Count <= size());
|
||||
return {data(), Count};
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE Span<element_type, dynamic_extent> first( // NOLINT
|
||||
detail::ptrdiff_t _count) const {
|
||||
SPAN_CHECK(_count >= 0 && _count <= size());
|
||||
return {data(), _count};
|
||||
}
|
||||
|
||||
template <detail::ptrdiff_t Count >
|
||||
XGBOOST_DEVICE Span<element_type, Count> last() const { // NOLINT
|
||||
SPAN_CHECK(Count >=0 && size() - Count >= 0);
|
||||
return {data() + size() - Count, Count};
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE Span<element_type, dynamic_extent> last( // NOLINT
|
||||
detail::ptrdiff_t _count) const {
|
||||
SPAN_CHECK(_count >= 0 && _count <= size());
|
||||
return subspan(size() - _count, _count);
|
||||
}
|
||||
|
||||
/*!
|
||||
* If Count is std::dynamic_extent, r.size() == this->size() - Offset;
|
||||
* Otherwise r.size() == Count.
|
||||
*/
|
||||
template < detail::ptrdiff_t Offset,
|
||||
detail::ptrdiff_t Count = dynamic_extent >
|
||||
XGBOOST_DEVICE auto subspan() const -> // NOLINT
|
||||
Span<element_type,
|
||||
detail::ExtentValue<Extent, Offset, Count>::value> {
|
||||
SPAN_CHECK(Offset >= 0 && Offset < size());
|
||||
SPAN_CHECK(Count == dynamic_extent ||
|
||||
Count >= 0 && Offset + Count <= size());
|
||||
|
||||
return {data() + Offset, Count == dynamic_extent ? size() - Offset : Count};
|
||||
}
|
||||
|
||||
XGBOOST_DEVICE Span<element_type, dynamic_extent> subspan( // NOLINT
|
||||
detail::ptrdiff_t _offset,
|
||||
detail::ptrdiff_t _count = dynamic_extent) const {
|
||||
SPAN_CHECK(_offset >= 0 && _offset < size());
|
||||
SPAN_CHECK(_count == dynamic_extent ||
|
||||
_count >= 0 && _offset + _count <= size());
|
||||
|
||||
return {data() + _offset, _count ==
|
||||
dynamic_extent ? size() - _offset : _count};
|
||||
}
|
||||
|
||||
private:
|
||||
index_type size_;
|
||||
pointer data_;
|
||||
};
|
||||
|
||||
template <class T, detail::ptrdiff_t X, class U, detail::ptrdiff_t Y>
|
||||
XGBOOST_DEVICE bool operator==(Span<T, X> l, Span<U, Y> r) {
|
||||
if (l.size() != r.size()) {
|
||||
return false;
|
||||
}
|
||||
for (auto l_beg = l.cbegin(), r_beg = r.cbegin(); l_beg != l.cend();
|
||||
++l_beg, ++r_beg) {
|
||||
if (*l_beg != *r_beg) {
|
||||
return false;
|
||||
}
|
||||
}
|
||||
return true;
|
||||
}
|
||||
|
||||
template <class T, detail::ptrdiff_t X, class U, detail::ptrdiff_t Y>
|
||||
XGBOOST_DEVICE constexpr bool operator!=(Span<T, X> l, Span<U, Y> r) {
|
||||
return !(l == r);
|
||||
}
|
||||
|
||||
template <class T, detail::ptrdiff_t X, class U, detail::ptrdiff_t Y>
|
||||
XGBOOST_DEVICE constexpr bool operator<(Span<T, X> l, Span<U, Y> r) {
|
||||
return detail::LexicographicalCompare(l.begin(), l.end(),
|
||||
r.begin(), r.end());
|
||||
}
|
||||
|
||||
template <class T, detail::ptrdiff_t X, class U, detail::ptrdiff_t Y>
|
||||
XGBOOST_DEVICE constexpr bool operator<=(Span<T, X> l, Span<U, Y> r) {
|
||||
return !(l > r);
|
||||
}
|
||||
|
||||
template <class T, detail::ptrdiff_t X, class U, detail::ptrdiff_t Y>
|
||||
XGBOOST_DEVICE constexpr bool operator>(Span<T, X> l, Span<U, Y> r) {
|
||||
return detail::LexicographicalCompare<
|
||||
typename Span<T, X>::iterator, typename Span<U, Y>::iterator,
|
||||
detail::Greater<typename Span<T, X>::element_type>>(l.begin(), l.end(),
|
||||
r.begin(), r.end());
|
||||
}
|
||||
|
||||
template <class T, detail::ptrdiff_t X, class U, detail::ptrdiff_t Y>
|
||||
XGBOOST_DEVICE constexpr bool operator>=(Span<T, X> l, Span<U, Y> r) {
|
||||
return !(l < r);
|
||||
}
|
||||
|
||||
template <class T, detail::ptrdiff_t E>
|
||||
XGBOOST_DEVICE auto as_bytes(Span<T, E> s) __span_noexcept -> // NOLINT
|
||||
Span<const byte, detail::ExtentAsBytesValue<T, E>::value> {
|
||||
return {reinterpret_cast<const byte*>(s.data()), s.size_bytes()};
|
||||
}
|
||||
|
||||
template <class T, detail::ptrdiff_t E>
|
||||
XGBOOST_DEVICE auto as_writable_bytes(Span<T, E> s) __span_noexcept -> // NOLINT
|
||||
Span<byte, detail::ExtentAsBytesValue<T, E>::value> {
|
||||
return {reinterpret_cast<byte*>(s.data()), s.size_bytes()};
|
||||
}
|
||||
|
||||
} // namespace common
|
||||
} // namespace xgboost
|
||||
|
||||
#if defined(_MSC_VER) &&_MSC_VER < 1910
|
||||
#undef constexpr
|
||||
#pragma pop_macro("constexpr")
|
||||
#undef __span_noexcept
|
||||
#endif // _MSC_VER < 1910
|
||||
|
||||
#endif // XGBOOST_COMMON_SPAN_H_
|
||||
Reference in New Issue
Block a user