XGBoost

Value Members

final def !=(arg0: Any): Boolean

Definition Classes
AnyRef → Any
final def ##(): Int

Definition Classes
AnyRef → Any
final def ==(arg0: Any): Boolean

Definition Classes
AnyRef → Any
final def asInstanceOf[T0]: T0

Definition Classes
Any
def clone(): AnyRef

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( ... )
final def eq(arg0: AnyRef): Boolean

Definition Classes
AnyRef
def equals(arg0: Any): Boolean

Definition Classes
AnyRef → Any
def finalize(): Unit

Attributes
protected[java.lang]
Definition Classes
AnyRef
Annotations
@throws( classOf[java.lang.Throwable] )
final def getClass(): Class[_]

Definition Classes
AnyRef → Any
def hashCode(): Int

Definition Classes
AnyRef → Any
final def isInstanceOf[T0]: Boolean

Definition Classes
Any
def loadModelFromHadoopFile(modelPath: String)(implicit sparkContext: SparkContext): XGBoostModel

Load XGBoost model from path in HDFS-compatible file system
Load XGBoost model from path in HDFS-compatible file system
modelPath
The path of the file representing the model
returns
The loaded model
final def ne(arg0: AnyRef): Boolean

Definition Classes
AnyRef
final def notify(): Unit

Definition Classes
AnyRef
final def notifyAll(): Unit

Definition Classes
AnyRef
final def synchronized[T0](arg0: ⇒ T0): T0

Definition Classes
AnyRef
def toString(): String

Definition Classes
AnyRef → Any
def trainWithDataFrame(trainingData: Dataset[_], params: Map[String, Any], round: Int, nWorkers: Int, obj: ObjectiveTrait = null, eval: EvalTrait = null, useExternalMemory: Boolean = false, missing: Float = Float.NaN, featureCol: String = "features", labelCol: String = "label"): XGBoostModel

Train XGBoost model with the DataFrame-represented data
Train XGBoost model with the DataFrame-represented data
trainingData
the training set represented as DataFrame
params
Map containing the parameters to configure XGBoost
round
the number of iterations
nWorkers
the number of XGBoost workers; a value of 0 means that the number of workers equals the number of partitions of trainingData
obj
An instance of ObjectiveTrait specifying a custom objective, null by default
eval
An instance of EvalTrait specifying a custom evaluation metric, null by default
useExternalMemory
indicates whether to use the external memory cache; by setting this flag to true, the user may reduce the RAM cost of running XGBoost within Spark
missing
The value which represents a missing value in the dataset
featureCol
the name of input column, "features" as default value
labelCol
the name of output column, "label" as default value
returns
the trained XGBoostModel when training succeeds

Annotations
@throws( classOf[XGBoostError] )
Exceptions thrown
ml.dmlc.xgboost4j.java.XGBoostError when the model training has failed
def trainWithRDD(trainingData: RDD[org.apache.spark.ml.feature.LabeledPoint], params: Map[String, Any], round: Int, nWorkers: Int, obj: ObjectiveTrait = null, eval: EvalTrait = null, useExternalMemory: Boolean = false, missing: Float = Float.NaN): XGBoostModel

Train XGBoost model with the RDD-represented data
Train XGBoost model with the RDD-represented data
trainingData
the training set represented as RDD
params
Map containing the configuration entries
round
the number of iterations
nWorkers
the number of XGBoost workers; a value of 0 means that the number of workers equals the number of partitions of the trainingData RDD
obj
An instance of ObjectiveTrait specifying a custom objective, null by default
eval
An instance of EvalTrait specifying a custom evaluation metric, null by default
useExternalMemory
indicates whether to use the external memory cache; by setting this flag to true, the user may reduce the RAM cost of running XGBoost within Spark
missing
The value which represents a missing value in the dataset
returns
the trained XGBoostModel when training succeeds

Annotations
@throws( classOf[XGBoostError] )
Exceptions thrown
ml.dmlc.xgboost4j.java.XGBoostError when the model training has failed
final def wait(): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long, arg1: Int): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )
final def wait(arg0: Long): Unit

Definition Classes
AnyRef
Annotations
@throws( ... )

Deprecated Value Members

def train(trainingData: RDD[org.apache.spark.ml.feature.LabeledPoint], params: Map[String, Any], round: Int, nWorkers: Int, obj: ObjectiveTrait = null, eval: EvalTrait = null, useExternalMemory: Boolean = false, missing: Float = Float.NaN): XGBoostModel

Train XGBoost model with the RDD-represented data
Train XGBoost model with the RDD-represented data
trainingData
the training set represented as RDD
params
Map containing the configuration entries
round
the number of iterations
nWorkers
the number of XGBoost workers; a value of 0 means that the number of workers equals the number of partitions of the trainingData RDD
obj
An instance of ObjectiveTrait specifying a custom objective, null by default
eval
An instance of EvalTrait specifying a custom evaluation metric, null by default
useExternalMemory
indicates whether to use the external memory cache; by setting this flag to true, the user may reduce the RAM cost of running XGBoost within Spark
missing
The value which represents a missing value in the dataset
returns
the trained XGBoostModel when training succeeds

Annotations
@deprecated
Deprecated
Use XGBoost.trainWithRDD instead.
Exceptions thrown
ml.dmlc.xgboost4j.java.XGBoostError when the model training has failed

Related Doc: package spark

object XGBoost extends Serializable

Value Members

final def !=(arg0: Any): Boolean

final def ##(): Int

final def ==(arg0: Any): Boolean

final def asInstanceOf[T0]: T0

def clone(): AnyRef

final def eq(arg0: AnyRef): Boolean

def equals(arg0: Any): Boolean

def finalize(): Unit

final def getClass(): Class[_]

def hashCode(): Int

final def isInstanceOf[T0]: Boolean

def loadModelFromHadoopFile(modelPath: String)(implicit sparkContext: SparkContext): XGBoostModel

final def ne(arg0: AnyRef): Boolean

final def notify(): Unit

final def notifyAll(): Unit

final def synchronized[T0](arg0: ⇒ T0): T0

def toString(): String

def trainWithDataFrame(trainingData: Dataset[_], params: Map[String, Any], round: Int, nWorkers: Int, obj: ObjectiveTrait = null, eval: EvalTrait = null, useExternalMemory: Boolean = false, missing: Float = Float.NaN, featureCol: String = "features", labelCol: String = "label"): XGBoostModel

def trainWithRDD(trainingData: RDD[org.apache.spark.ml.feature.LabeledPoint], params: Map[String, Any], round: Int, nWorkers: Int, obj: ObjectiveTrait = null, eval: EvalTrait = null, useExternalMemory: Boolean = false, missing: Float = Float.NaN): XGBoostModel

final def wait(): Unit

final def wait(arg0: Long, arg1: Int): Unit

final def wait(arg0: Long): Unit

Deprecated Value Members

def train(trainingData: RDD[org.apache.spark.ml.feature.LabeledPoint], params: Map[String, Any], round: Int, nWorkers: Int, obj: ObjectiveTrait = null, eval: EvalTrait = null, useExternalMemory: Boolean = false, missing: Float = Float.NaN): XGBoostModel

Inherited from Serializable

Inherited from Serializable

Inherited from AnyRef

Inherited from Any

Ungrouped