class CatBoostClassificationModel extends ProbabilisticClassificationModel[Vector, CatBoostClassificationModel] with CatBoostModelTrait[CatBoostClassificationModel]
Classification model trained by CatBoost. Use CatBoostClassifier to train it
Serialization
Supports standard Spark MLLib serialization. Data can be saved to distributed filesystem like HDFS or
local files.
When saved to path two files are created:
-<path>/metadata which contains Spark-specific metadata in JSON format
-<path>/model which contains model in usual CatBoost format which can be read using other local
CatBoost APIs (if stored in a distributed filesystem it has to be copied to the local filesystem first).
Save model
val trainPool : Pool = ... init Pool ... val classifier = new CatBoostClassifier val model = classifier.fit(trainPool) val path = "/home/user/catboost_spark_models/model0" model.write.save(path)
, Load model
val dataFrameForPrediction : DataFrame = ... init DataFrame ... val path = "/home/user/catboost_spark_models/model0" val model = CatBoostClassificationModel.load(path) val predictions = model.transform(dataFrameForPrediction) predictions.show()
- Alphabetic
- By Inheritance
- CatBoostClassificationModel
- CatBoostModelTrait
- MLWritable
- ProbabilisticClassificationModel
- ProbabilisticClassifierParams
- HasThresholds
- HasProbabilityCol
- ClassificationModel
- ClassifierParams
- HasRawPredictionCol
- PredictionModel
- PredictorParams
- HasPredictionCol
- HasFeaturesCol
- HasLabelCol
- Model
- Transformer
- PipelineStage
- Logging
- Params
- Serializable
- Serializable
- Identifiable
- AnyRef
- Any
- Hide All
- Show All
- Public
- All
Instance Constructors
- new CatBoostClassificationModel(nativeModel: TFullModel)
- new CatBoostClassificationModel(uid: String, nativeModel: TFullModel = null, nativeDimension: Int)
Value Members
-
final
def
!=(arg0: Any): Boolean
- Definition Classes
- AnyRef → Any
-
final
def
##(): Int
- Definition Classes
- AnyRef → Any
-
final
def
$[T](param: Param[T]): T
- Attributes
- protected
- Definition Classes
- Params
-
final
def
==(arg0: Any): Boolean
- Definition Classes
- AnyRef → Any
-
final
def
asInstanceOf[T0]: T0
- Definition Classes
- Any
-
final
def
clear(param: Param[_]): CatBoostClassificationModel.this.type
- Definition Classes
- Params
-
def
clone(): AnyRef
- Attributes
- protected[lang]
- Definition Classes
- AnyRef
- Annotations
- @throws( ... ) @native()
-
def
copy(extra: ParamMap): CatBoostClassificationModel
- Definition Classes
- CatBoostClassificationModel → Model → Transformer → PipelineStage → Params
-
def
copyValues[T <: Params](to: T, extra: ParamMap): T
- Attributes
- protected
- Definition Classes
- Params
-
final
def
defaultCopy[T <: Params](extra: ParamMap): T
- Attributes
- protected
- Definition Classes
- Params
-
final
def
eq(arg0: AnyRef): Boolean
- Definition Classes
- AnyRef
-
def
equals(arg0: Any): Boolean
- Definition Classes
- AnyRef → Any
-
def
explainParam(param: Param[_]): String
- Definition Classes
- Params
-
def
explainParams(): String
- Definition Classes
- Params
-
final
def
extractParamMap(): ParamMap
- Definition Classes
- Params
-
final
def
extractParamMap(extra: ParamMap): ParamMap
- Definition Classes
- Params
-
final
val
featuresCol: Param[String]
- Definition Classes
- HasFeaturesCol
-
def
featuresDataType: DataType
- Attributes
- protected
- Definition Classes
- PredictionModel
-
def
finalize(): Unit
- Attributes
- protected[lang]
- Definition Classes
- AnyRef
- Annotations
- @throws( classOf[java.lang.Throwable] )
-
final
def
get[T](param: Param[T]): Option[T]
- Definition Classes
- Params
-
def
getAdditionalColumnsForApply: Seq[StructField]
- Attributes
- protected
- Definition Classes
- CatBoostClassificationModel → CatBoostModelTrait
-
final
def
getClass(): Class[_]
- Definition Classes
- AnyRef → Any
- Annotations
- @native()
-
final
def
getDefault[T](param: Param[T]): Option[T]
- Definition Classes
- Params
-
final
def
getFeaturesCol: String
- Definition Classes
- HasFeaturesCol
-
final
def
getLabelCol: String
- Definition Classes
- HasLabelCol
-
final
def
getOrDefault[T](param: Param[T]): T
- Definition Classes
- Params
-
def
getParam(paramName: String): Param[Any]
- Definition Classes
- Params
-
final
def
getPredictionCol: String
- Definition Classes
- HasPredictionCol
-
final
def
getProbabilityCol: String
- Definition Classes
- HasProbabilityCol
-
final
def
getRawPredictionCol: String
- Definition Classes
- HasRawPredictionCol
-
def
getResultIteratorForApply(rawObjectsDataProvider: SWIGTYPE_p_NCB__TRawObjectsDataProviderPtr, dstRows: ArrayBuffer[Array[Any]], threadCountForTask: Int): Iterator[Row]
- Attributes
- protected
- Definition Classes
- CatBoostClassificationModel → CatBoostModelTrait
-
def
getThresholds: Array[Double]
- Definition Classes
- HasThresholds
-
final
def
hasDefault[T](param: Param[T]): Boolean
- Definition Classes
- Params
-
def
hasParam(paramName: String): Boolean
- Definition Classes
- Params
-
def
hasParent: Boolean
- Definition Classes
- Model
-
def
hashCode(): Int
- Definition Classes
- AnyRef → Any
- Annotations
- @native()
-
def
initializeLogIfNecessary(isInterpreter: Boolean, silent: Boolean): Boolean
- Attributes
- protected
- Definition Classes
- Logging
-
def
initializeLogIfNecessary(isInterpreter: Boolean): Unit
- Attributes
- protected
- Definition Classes
- Logging
-
final
def
isDefined(param: Param[_]): Boolean
- Definition Classes
- Params
-
final
def
isInstanceOf[T0]: Boolean
- Definition Classes
- Any
-
final
def
isSet(param: Param[_]): Boolean
- Definition Classes
- Params
-
def
isTraceEnabled(): Boolean
- Attributes
- protected
- Definition Classes
- Logging
-
final
val
labelCol: Param[String]
- Definition Classes
- HasLabelCol
-
def
log: Logger
- Attributes
- protected
- Definition Classes
- Logging
-
def
logDebug(msg: ⇒ String, throwable: Throwable): Unit
- Attributes
- protected
- Definition Classes
- Logging
-
def
logDebug(msg: ⇒ String): Unit
- Attributes
- protected
- Definition Classes
- Logging
-
def
logError(msg: ⇒ String, throwable: Throwable): Unit
- Attributes
- protected
- Definition Classes
- Logging
-
def
logError(msg: ⇒ String): Unit
- Attributes
- protected
- Definition Classes
- Logging
-
def
logInfo(msg: ⇒ String, throwable: Throwable): Unit
- Attributes
- protected
- Definition Classes
- Logging
-
def
logInfo(msg: ⇒ String): Unit
- Attributes
- protected
- Definition Classes
- Logging
-
def
logName: String
- Attributes
- protected
- Definition Classes
- Logging
-
def
logTrace(msg: ⇒ String, throwable: Throwable): Unit
- Attributes
- protected
- Definition Classes
- Logging
-
def
logTrace(msg: ⇒ String): Unit
- Attributes
- protected
- Definition Classes
- Logging
-
def
logWarning(msg: ⇒ String, throwable: Throwable): Unit
- Attributes
- protected
- Definition Classes
- Logging
-
def
logWarning(msg: ⇒ String): Unit
- Attributes
- protected
- Definition Classes
- Logging
-
var
nativeDimension: Int
- Attributes
- protected
- Definition Classes
- CatBoostClassificationModel → CatBoostModelTrait
-
final
def
ne(arg0: AnyRef): Boolean
- Definition Classes
- AnyRef
-
final
def
notify(): Unit
- Definition Classes
- AnyRef
- Annotations
- @native()
-
final
def
notifyAll(): Unit
- Definition Classes
- AnyRef
- Annotations
- @native()
-
def
numClasses: Int
- Definition Classes
- CatBoostClassificationModel → ClassificationModel
-
def
numFeatures: Int
- Definition Classes
- PredictionModel
- Annotations
- @Since( "1.6.0" )
-
lazy val
params: Array[Param[_]]
- Definition Classes
- Params
-
var
parent: Estimator[CatBoostClassificationModel]
- Definition Classes
- Model
-
def
predict(features: Vector): Double
- Definition Classes
- ClassificationModel → PredictionModel
-
def
predictProbability(features: Vector): Vector
- Attributes
- protected
- Definition Classes
- ProbabilisticClassificationModel
-
def
predictRaw(features: Vector): Vector
Prefer batch computations operating on datasets as a whole for efficiency
Prefer batch computations operating on datasets as a whole for efficiency
- Attributes
- protected
- Definition Classes
- CatBoostClassificationModel → ClassificationModel
-
final
def
predictRawImpl(features: Vector): Array[Double]
Prefer batch computations operating on datasets as a whole for efficiency
Prefer batch computations operating on datasets as a whole for efficiency
- Definition Classes
- CatBoostModelTrait
-
final
val
predictionCol: Param[String]
- Definition Classes
- HasPredictionCol
-
def
probability2prediction(probability: Vector): Double
- Attributes
- protected
- Definition Classes
- ProbabilisticClassificationModel
-
final
val
probabilityCol: Param[String]
- Definition Classes
- HasProbabilityCol
-
def
raw2prediction(rawPrediction: Vector): Double
- Attributes
- protected
- Definition Classes
- ProbabilisticClassificationModel → ClassificationModel
-
def
raw2probability(rawPrediction: Vector): Vector
- Attributes
- protected
- Definition Classes
- ProbabilisticClassificationModel
-
def
raw2probabilityInPlace(rawPrediction: Vector): Vector
Prefer batch computations operating on datasets as a whole for efficiency
Prefer batch computations operating on datasets as a whole for efficiency
- Attributes
- protected
- Definition Classes
- CatBoostClassificationModel → ProbabilisticClassificationModel
-
final
val
rawPredictionCol: Param[String]
- Definition Classes
- HasRawPredictionCol
-
def
save(path: String): Unit
- Definition Classes
- MLWritable
- Annotations
- @Since( "1.6.0" ) @throws( ... )
-
final
def
set(paramPair: ParamPair[_]): CatBoostClassificationModel.this.type
- Attributes
- protected
- Definition Classes
- Params
-
final
def
set(param: String, value: Any): CatBoostClassificationModel.this.type
- Attributes
- protected
- Definition Classes
- Params
-
final
def
set[T](param: Param[T], value: T): CatBoostClassificationModel.this.type
- Definition Classes
- Params
-
final
def
setDefault(paramPairs: ParamPair[_]*): CatBoostClassificationModel.this.type
- Attributes
- protected
- Definition Classes
- Params
-
final
def
setDefault[T](param: Param[T], value: T): CatBoostClassificationModel.this.type
- Attributes
- protected
- Definition Classes
- Params
-
def
setFeaturesCol(value: String): CatBoostClassificationModel
- Definition Classes
- PredictionModel
-
def
setParent(parent: Estimator[CatBoostClassificationModel]): CatBoostClassificationModel
- Definition Classes
- Model
-
def
setPredictionCol(value: String): CatBoostClassificationModel
- Definition Classes
- PredictionModel
-
def
setProbabilityCol(value: String): CatBoostClassificationModel
- Definition Classes
- ProbabilisticClassificationModel
-
def
setRawPredictionCol(value: String): CatBoostClassificationModel
- Definition Classes
- ClassificationModel
-
def
setThresholds(value: Array[Double]): CatBoostClassificationModel
- Definition Classes
- ProbabilisticClassificationModel
-
final
def
synchronized[T0](arg0: ⇒ T0): T0
- Definition Classes
- AnyRef
-
final
val
thresholds: DoubleArrayParam
- Definition Classes
- HasThresholds
-
def
toString(): String
- Definition Classes
- Identifiable → AnyRef → Any
-
def
transform(dataset: Dataset[_]): DataFrame
- Definition Classes
- CatBoostClassificationModel → ProbabilisticClassificationModel → ClassificationModel → PredictionModel → Transformer
-
def
transform(dataset: Dataset[_], paramMap: ParamMap): DataFrame
- Definition Classes
- Transformer
- Annotations
- @Since( "2.0.0" )
-
def
transform(dataset: Dataset[_], firstParamPair: ParamPair[_], otherParamPairs: ParamPair[_]*): DataFrame
- Definition Classes
- Transformer
- Annotations
- @Since( "2.0.0" ) @varargs()
-
def
transformImpl(dataset: Dataset[_]): DataFrame
- Definition Classes
- CatBoostModelTrait → PredictionModel
-
def
transformSchema(schema: StructType): StructType
- Definition Classes
- PredictionModel → PipelineStage
-
def
transformSchema(schema: StructType, logging: Boolean): StructType
- Attributes
- protected
- Definition Classes
- PipelineStage
- Annotations
- @DeveloperApi()
-
val
uid: String
- Definition Classes
- CatBoostClassificationModel → Identifiable
-
def
validateAndTransformSchema(schema: StructType, fitting: Boolean, featuresDataType: DataType): StructType
- Attributes
- protected
- Definition Classes
- ProbabilisticClassifierParams → ClassifierParams → PredictorParams
-
final
def
wait(): Unit
- Definition Classes
- AnyRef
- Annotations
- @throws( ... )
-
final
def
wait(arg0: Long, arg1: Int): Unit
- Definition Classes
- AnyRef
- Annotations
- @throws( ... )
-
final
def
wait(arg0: Long): Unit
- Definition Classes
- AnyRef
- Annotations
- @throws( ... ) @native()
-
def
write: MLWriter
- Definition Classes
- CatBoostModelTrait → MLWritable