impose shuffle when creating training RDD (#1531)
This commit is contained in:
parent
3f198b9fef
commit
7fb3fbf577
@@ -70,12 +70,9 @@ object XGBoost extends Serializable {
|
||||
useExternalMemory: Boolean, missing: Float = Float.NaN): RDD[Booster] = {
|
||||
import DataUtils._
|
||||
val partitionedData = {
|
||||
if (numWorkers > trainingData.partitions.length) {
|
||||
if (numWorkers != trainingData.partitions.length) {
|
||||
logger.info(s"repartitioning training set to $numWorkers partitions")
|
||||
trainingData.repartition(numWorkers)
|
||||
} else if (numWorkers < trainingData.partitions.length) {
|
||||
logger.info(s"repartitioning training set to $numWorkers partitions")
|
||||
trainingData.coalesce(numWorkers)
|
||||
} else {
|
||||
trainingData
|
||||
}
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user