gpu_hist performance tweaks (#5707)
* Remove device vectors
* Remove allreduce synchronize
* Remove double buffer
This commit is contained in:
@@ -511,7 +511,6 @@ struct GPUHistMakerDevice {
|
||||
reinterpret_cast<typename GradientSumT::ValueT*>(d_node_hist),
|
||||
reinterpret_cast<typename GradientSumT::ValueT*>(d_node_hist),
|
||||
page->Cuts().TotalBins() * (sizeof(GradientSumT) / sizeof(typename GradientSumT::ValueT)));
|
||||
reducer->Synchronize();
|
||||
|
||||
monitor.Stop("AllReduce");
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user