XGBoost

Value Members

final def !=(arg0: Any): Boolean

Definition Classes

AnyRef → Any
final def ##(): Int

Definition Classes

AnyRef → Any
final def ==(arg0: Any): Boolean

Definition Classes

AnyRef → Any
final def asInstanceOf[T0]: T0

Definition Classes

Any
def clone(): AnyRef

Attributes

protected[java.lang]

Definition Classes

AnyRef

Annotations

@throws( ... )
final def eq(arg0: AnyRef): Boolean

Definition Classes

AnyRef
def equals(arg0: Any): Boolean

Definition Classes

AnyRef → Any
def finalize(): Unit

Attributes

protected[java.lang]

Definition Classes

AnyRef

Annotations

@throws( classOf[java.lang.Throwable] )
final def getClass(): Class[_]

Definition Classes

AnyRef → Any
def hashCode(): Int

Definition Classes

AnyRef → Any
final def isInstanceOf[T0]: Boolean

Definition Classes

Any
def loadModelFromHadoopFile(modelPath: String)(implicit sparkContext: SparkContext): XGBoostModel

Load an XGBoost model from a path in an HDFS-compatible file system.

Load an XGBoost model from a path in an HDFS-compatible file system.

modelPath

The path of the file representing the model

returns

The loaded model
final def ne(arg0: AnyRef): Boolean

Definition Classes

AnyRef
final def notify(): Unit

Definition Classes

AnyRef
final def notifyAll(): Unit

Definition Classes

AnyRef
final def synchronized[T0](arg0: ⇒ T0): T0

Definition Classes

AnyRef
def toString(): String

Definition Classes

AnyRef → Any
def train(trainingData: RDD[org.apache.spark.ml.feature.LabeledPoint], params: Map[String, Any], round: Int, nWorkers: Int, obj: ObjectiveTrait = null, eval: EvalTrait = null, useExternalMemory: Boolean = false, missing: Float = Float.NaN): XGBoostModel

Train an XGBoost model on data represented as an RDD.

Train an XGBoost model on data represented as an RDD.

trainingData

the training set, represented as an RDD

params

Map containing the configuration entries

round

the number of iterations

nWorkers

the number of XGBoost workers; 0 by default, which means that the number of workers equals the number of partitions of the trainingData RDD

obj

the user-defined objective function, null by default

eval

the user-defined evaluation function, null by default

useExternalMemory

indicates whether to use the external memory cache; by setting this flag to true, the user may reduce the RAM cost of running XGBoost within Spark

missing

the value that represents a missing value in the dataset

returns

the XGBoostModel, when training is successful

Exceptions thrown

ml.dmlc.xgboost4j.java.XGBoostError when the model training fails
def trainWithDataFrame(trainingData: Dataset[_], params: Map[String, Any], round: Int, nWorkers: Int, obj: ObjectiveTrait = null, eval: EvalTrait = null, useExternalMemory: Boolean = false, missing: Float = Float.NaN, featureCol: String = "features", labelCol: String = "label"): XGBoostModel

Train an XGBoost model on data represented as a DataFrame.

Train an XGBoost model on data represented as a DataFrame.

trainingData

the training set, represented as a DataFrame

params

Map containing the parameters to configure XGBoost

round

the number of iterations

nWorkers

the number of XGBoost workers; 0 by default, which means that the number of workers equals the number of partitions of trainingData

obj

the user-defined objective function, null by default

eval

the user-defined evaluation function, null by default

useExternalMemory

indicates whether to use the external memory cache; by setting this flag to true, the user may reduce the RAM cost of running XGBoost within Spark

missing

the value that represents a missing value in the dataset

featureCol

the name of the input (features) column; defaults to "features"

labelCol

the name of the output (label) column; defaults to "label"

returns

the XGBoostModel, when training is successful

Annotations

@throws( classOf[XGBoostError] )

Exceptions thrown

ml.dmlc.xgboost4j.java.XGBoostError when the model training fails
def trainWithRDD(trainingData: RDD[org.apache.spark.ml.feature.LabeledPoint], params: Map[String, Any], round: Int, nWorkers: Int, obj: ObjectiveTrait = null, eval: EvalTrait = null, useExternalMemory: Boolean = false, missing: Float = Float.NaN): XGBoostModel

A variant of train().

A variant of train().

trainingData

the training set, represented as an RDD

params

Map containing the configuration entries

round

the number of iterations

nWorkers

the number of XGBoost workers; 0 by default, which means that the number of workers equals the number of partitions of the trainingData RDD

obj

the user-defined objective function, null by default

eval

the user-defined evaluation function, null by default

useExternalMemory

indicates whether to use the external memory cache; by setting this flag to true, the user may reduce the RAM cost of running XGBoost within Spark

missing

the value that represents a missing value in the dataset

returns

the XGBoostModel, when training is successful

Annotations

@throws( classOf[XGBoostError] )

Exceptions thrown

ml.dmlc.xgboost4j.java.XGBoostError when the model training fails
final def wait(): Unit

Definition Classes

AnyRef

Annotations

@throws( ... )
final def wait(arg0: Long, arg1: Int): Unit

Definition Classes

AnyRef

Annotations

@throws( ... )
final def wait(arg0: Long): Unit

Definition Classes

AnyRef

Annotations

@throws( ... )

Related Doc: package spark

object XGBoost extends Serializable

Value Members

final def !=(arg0: Any): Boolean

final def ##(): Int

final def ==(arg0: Any): Boolean

final def asInstanceOf[T0]: T0

def clone(): AnyRef

final def eq(arg0: AnyRef): Boolean

def equals(arg0: Any): Boolean

def finalize(): Unit

final def getClass(): Class[_]

def hashCode(): Int

final def isInstanceOf[T0]: Boolean

def loadModelFromHadoopFile(modelPath: String)(implicit sparkContext: SparkContext): XGBoostModel

final def ne(arg0: AnyRef): Boolean

final def notify(): Unit

final def notifyAll(): Unit

final def synchronized[T0](arg0: ⇒ T0): T0

def toString(): String

def train(trainingData: RDD[org.apache.spark.ml.feature.LabeledPoint], params: Map[String, Any], round: Int, nWorkers: Int, obj: ObjectiveTrait = null, eval: EvalTrait = null, useExternalMemory: Boolean = false, missing: Float = Float.NaN): XGBoostModel

def trainWithDataFrame(trainingData: Dataset[_], params: Map[String, Any], round: Int, nWorkers: Int, obj: ObjectiveTrait = null, eval: EvalTrait = null, useExternalMemory: Boolean = false, missing: Float = Float.NaN, featureCol: String = "features", labelCol: String = "label"): XGBoostModel

def trainWithRDD(trainingData: RDD[org.apache.spark.ml.feature.LabeledPoint], params: Map[String, Any], round: Int, nWorkers: Int, obj: ObjectiveTrait = null, eval: EvalTrait = null, useExternalMemory: Boolean = false, missing: Float = Float.NaN): XGBoostModel

final def wait(): Unit

final def wait(arg0: Long, arg1: Int): Unit

final def wait(arg0: Long): Unit

Inherited from Serializable

Inherited from Serializable

Inherited from AnyRef

Inherited from Any

Ungrouped