Packages

class CatBoostClassifier extends ProbabilisticClassifier[Vector, CatBoostClassifier, CatBoostClassificationModel] with CatBoostPredictorTrait[CatBoostClassifier, CatBoostClassificationModel] with ClassifierTrainingParamsTrait

Class to train CatBoostClassificationModel

The default optimized loss function depends on various conditions:

  • Logloss — The label column has only two different values or the targetBorder parameter is specified.
  • MultiClass — The label column has more than two different values and the targetBorder parameter is not specified.
Examples

Binary classification.

val spark = SparkSession.builder()
  .master("local[*]")
  .appName("ClassifierTest")
  .getOrCreate();

val srcDataSchema = Seq(
  StructField("features", SQLDataTypes.VectorType),
  StructField("label", StringType)
)

val trainData = Seq(
  Row(Vectors.dense(0.1, 0.2, 0.11), "0"),
  Row(Vectors.dense(0.97, 0.82, 0.33), "1"),
  Row(Vectors.dense(0.13, 0.22, 0.23), "1"),
  Row(Vectors.dense(0.8, 0.62, 0.0), "0")
)

val trainDf = spark.createDataFrame(spark.sparkContext.parallelize(trainData), StructType(srcDataSchema))
val trainPool = new Pool(trainDf)

val evalData = Seq(
  Row(Vectors.dense(0.22, 0.33, 0.9), "1"),
  Row(Vectors.dense(0.11, 0.1, 0.21), "0"),
  Row(Vectors.dense(0.77, 0.0, 0.0), "1")
)

val evalDf = spark.createDataFrame(spark.sparkContext.parallelize(evalData), StructType(srcDataSchema))
val evalPool = new Pool(evalDf)

val classifier = new CatBoostClassifier
val model = classifier.fit(trainPool, Array[Pool](evalPool))
val predictions = model.transform(evalPool.data)
predictions.show()

Multiclassification.

val spark = SparkSession.builder()
  .master("local[*]")
  .appName("ClassifierTest")
  .getOrCreate();

val srcDataSchema = Seq(
  StructField("features", SQLDataTypes.VectorType),
  StructField("label", StringType)
)

val trainData = Seq(
  Row(Vectors.dense(0.1, 0.2, 0.11), "1"),
  Row(Vectors.dense(0.97, 0.82, 0.33), "2"),
  Row(Vectors.dense(0.13, 0.22, 0.23), "1"),
  Row(Vectors.dense(0.8, 0.62, 0.0), "0")
)

val trainDf = spark.createDataFrame(spark.sparkContext.parallelize(trainData), StructType(srcDataSchema))
val trainPool = new Pool(trainDf)

val evalData = Seq(
  Row(Vectors.dense(0.22, 0.33, 0.9), "2"),
  Row(Vectors.dense(0.11, 0.1, 0.21), "0"),
  Row(Vectors.dense(0.77, 0.0, 0.0), "1")
)

val evalDf = spark.createDataFrame(spark.sparkContext.parallelize(evalData), StructType(srcDataSchema))
val evalPool = new Pool(evalDf)

val classifier = new CatBoostClassifier
val model = classifier.fit(trainPool, Array[Pool](evalPool))
val predictions = model.transform(evalPool.data)
predictions.show()

Serialization

Supports standard Spark MLlib serialization. Data can be saved to a distributed filesystem such as HDFS or to local files.

Examples

Save:

val classifier = new CatBoostClassifier().setIterations(100)
val path = "/home/user/catboost_classifiers/classifier0"
classifier.write.save(path)

Load:

val path = "/home/user/catboost_classifiers/classifier0"
val classifier = CatBoostClassifier.load(path)
val trainPool : Pool = ... init Pool ...
val model = classifier.fit(trainPool)
Linear Supertypes
ClassifierTrainingParamsTrait, TrainingParamsTrait, QuantizationParamsTrait, ThreadCountParams, IgnoredFeaturesParams, CatBoostPredictorTrait[CatBoostClassifier, CatBoostClassificationModel], DefaultParamsWritable, MLWritable, DatasetParamsTrait, HasWeightCol, ProbabilisticClassifier[Vector, CatBoostClassifier, CatBoostClassificationModel], ProbabilisticClassifierParams, HasThresholds, HasProbabilityCol, Classifier[Vector, CatBoostClassifier, CatBoostClassificationModel], ClassifierParams, HasRawPredictionCol, Predictor[Vector, CatBoostClassifier, CatBoostClassificationModel], PredictorParams, HasPredictionCol, HasFeaturesCol, HasLabelCol, Estimator[CatBoostClassificationModel], PipelineStage, Logging, Params, Serializable, Serializable, Identifiable, AnyRef, Any
Ordering
  1. Alphabetic
  2. By Inheritance
Inherited
  1. CatBoostClassifier
  2. ClassifierTrainingParamsTrait
  3. TrainingParamsTrait
  4. QuantizationParamsTrait
  5. ThreadCountParams
  6. IgnoredFeaturesParams
  7. CatBoostPredictorTrait
  8. DefaultParamsWritable
  9. MLWritable
  10. DatasetParamsTrait
  11. HasWeightCol
  12. ProbabilisticClassifier
  13. ProbabilisticClassifierParams
  14. HasThresholds
  15. HasProbabilityCol
  16. Classifier
  17. ClassifierParams
  18. HasRawPredictionCol
  19. Predictor
  20. PredictorParams
  21. HasPredictionCol
  22. HasFeaturesCol
  23. HasLabelCol
  24. Estimator
  25. PipelineStage
  26. Logging
  27. Params
  28. Serializable
  29. Serializable
  30. Identifiable
  31. AnyRef
  32. Any
  1. Hide All
  2. Show All
Visibility
  1. Public
  2. All

Instance Constructors

  1. new CatBoostClassifier()
  2. new CatBoostClassifier(uid: String)

Value Members

  1. final def !=(arg0: Any): Boolean
    Definition Classes
    AnyRef → Any
  2. final def ##(): Int
    Definition Classes
    AnyRef → Any
  3. final def $[T](param: Param[T]): T
    Attributes
    protected
    Definition Classes
    Params
  4. final def ==(arg0: Any): Boolean
    Definition Classes
    AnyRef → Any
  5. def addEstimatedCtrFeatures(quantizedTrainPool: Pool, quantizedEvalPools: Array[Pool], updatedCatBoostJsonParams: JObject, classTargetPreprocessor: Option[TClassTargetPreprocessor] = None, serializedLabelConverter: TVector_i8 = new TVector_i8): (Pool, Array[Pool], CtrsContext)

    returns

    (preprocessedTrainPool, preprocessedEvalPools, ctrsContext)

    Attributes
    protected
    Definition Classes
    CatBoostPredictorTrait
  6. final val allowConstLabel: BooleanParam
    Definition Classes
    TrainingParamsTrait
  7. final val allowWritingFiles: BooleanParam
    Definition Classes
    TrainingParamsTrait
  8. final val approxOnFullHistory: BooleanParam
    Definition Classes
    TrainingParamsTrait
  9. final def asInstanceOf[T0]: T0
    Definition Classes
    Any
  10. final val autoClassWeights: EnumParam[EAutoClassWeightsType]
  11. final val baggingTemperature: FloatParam
    Definition Classes
    TrainingParamsTrait
  12. final val bestModelMinTrees: IntParam
    Definition Classes
    TrainingParamsTrait
  13. final val bootstrapType: EnumParam[EBootstrapType]
    Definition Classes
    TrainingParamsTrait
  14. final val borderCount: IntParam
    Definition Classes
    QuantizationParamsTrait
  15. final val classNames: StringArrayParam
  16. final val classWeightsList: DoubleArrayParam
  17. final val classWeightsMap: OrderedStringMapParam[Double]
  18. final val classesCount: IntParam
  19. final def clear(param: Param[_]): CatBoostClassifier.this.type
    Definition Classes
    Params
  20. def clone(): AnyRef
    Attributes
    protected[lang]
    Definition Classes
    AnyRef
    Annotations
    @throws( ... ) @native()
  21. final val connectTimeout: DurationParam
    Definition Classes
    TrainingParamsTrait
  22. def copy(extra: ParamMap): CatBoostClassifier
    Definition Classes
    CatBoostClassifier → Predictor → Estimator → PipelineStage → Params
  23. def copyValues[T <: Params](to: T, extra: ParamMap): T
    Attributes
    protected
    Definition Classes
    Params
  24. def createModel(nativeModel: TFullModel): CatBoostClassificationModel
    Attributes
    protected
    Definition Classes
    CatBoostClassifier → CatBoostPredictorTrait
  25. final val customMetric: StringArrayParam
    Definition Classes
    TrainingParamsTrait
  26. final def defaultCopy[T <: Params](extra: ParamMap): T
    Attributes
    protected
    Definition Classes
    Params
  27. final val depth: IntParam
    Definition Classes
    TrainingParamsTrait
  28. final val diffusionTemperature: FloatParam
    Definition Classes
    TrainingParamsTrait
  29. final val earlyStoppingRounds: IntParam
    Definition Classes
    TrainingParamsTrait
  30. final def eq(arg0: AnyRef): Boolean
    Definition Classes
    AnyRef
  31. def equals(arg0: Any): Boolean
    Definition Classes
    AnyRef → Any
  32. final val evalMetric: Param[String]
    Definition Classes
    TrainingParamsTrait
  33. def explainParam(param: Param[_]): String
    Definition Classes
    Params
  34. def explainParams(): String
    Definition Classes
    Params
  35. def extractInstances(dataset: Dataset[_], numClasses: Int): RDD[Instance]
    Attributes
    protected
    Definition Classes
    ClassifierParams
  36. def extractInstances(dataset: Dataset[_], validateInstance: (Instance) ⇒ Unit): RDD[Instance]
    Attributes
    protected
    Definition Classes
    PredictorParams
  37. def extractInstances(dataset: Dataset[_]): RDD[Instance]
    Attributes
    protected
    Definition Classes
    PredictorParams
  38. def extractLabeledPoints(dataset: Dataset[_], numClasses: Int): RDD[LabeledPoint]
    Attributes
    protected
    Definition Classes
    Classifier
  39. def extractLabeledPoints(dataset: Dataset[_]): RDD[LabeledPoint]
    Attributes
    protected
    Definition Classes
    Predictor
  40. final def extractParamMap(): ParamMap
    Definition Classes
    Params
  41. final def extractParamMap(extra: ParamMap): ParamMap
    Definition Classes
    Params
  42. final val featureBorderType: EnumParam[EBorderSelectionType]
    Definition Classes
    QuantizationParamsTrait
  43. final val featureWeightsList: DoubleArrayParam
    Definition Classes
    TrainingParamsTrait
  44. final val featureWeightsMap: OrderedStringMapParam[Double]
    Definition Classes
    TrainingParamsTrait
  45. final val featuresCol: Param[String]
    Definition Classes
    HasFeaturesCol
  46. def finalize(): Unit
    Attributes
    protected[lang]
    Definition Classes
    AnyRef
    Annotations
    @throws( classOf[java.lang.Throwable] )
  47. final val firstFeatureUsePenaltiesList: DoubleArrayParam
    Definition Classes
    TrainingParamsTrait
  48. final val firstFeatureUsePenaltiesMap: OrderedStringMapParam[Double]
    Definition Classes
    TrainingParamsTrait
  49. def fit(trainPool: Pool, evalPools: Array[Pool] = Array[Pool]()): CatBoostClassificationModel

    Additional variant of the fit method that accepts CatBoost's Pools and allows specifying additional datasets for computing evaluation metrics and overfitting detection, similarly to CatBoost's other APIs.

    Additional variant of the fit method that accepts CatBoost's Pools and allows specifying additional datasets for computing evaluation metrics and overfitting detection, similarly to CatBoost's other APIs.

    trainPool

    The input training dataset.

    evalPools

    The validation datasets used for the following processes:

    • overfitting detector
    • best iteration selection
    • monitoring metrics' changes
    returns

    trained model

    Definition Classes
    CatBoostPredictorTrait
  50. def fit(dataset: Dataset[_]): CatBoostClassificationModel
    Definition Classes
    Predictor → Estimator
  51. def fit(dataset: Dataset[_], paramMaps: Array[ParamMap]): Seq[CatBoostClassificationModel]
    Definition Classes
    Estimator
    Annotations
    @Since( "2.0.0" )
  52. def fit(dataset: Dataset[_], paramMap: ParamMap): CatBoostClassificationModel
    Definition Classes
    Estimator
    Annotations
    @Since( "2.0.0" )
  53. def fit(dataset: Dataset[_], firstParamPair: ParamPair[_], otherParamPairs: ParamPair[_]*): CatBoostClassificationModel
    Definition Classes
    Estimator
    Annotations
    @Since( "2.0.0" ) @varargs()
  54. final val foldLenMultiplier: FloatParam
    Definition Classes
    TrainingParamsTrait
  55. final val foldPermutationBlock: IntParam
    Definition Classes
    TrainingParamsTrait
  56. final def get[T](param: Param[T]): Option[T]
    Definition Classes
    Params
  57. final def getAllowConstLabel: Boolean
    Definition Classes
    TrainingParamsTrait
  58. final def getAllowWritingFiles: Boolean
    Definition Classes
    TrainingParamsTrait
  59. final def getApproxOnFullHistory: Boolean
    Definition Classes
    TrainingParamsTrait
  60. final def getAutoClassWeights: EAutoClassWeightsType
  61. final def getBaggingTemperature: Float
    Definition Classes
    TrainingParamsTrait
  62. final def getBestModelMinTrees: Int
    Definition Classes
    TrainingParamsTrait
  63. final def getBootstrapType: EBootstrapType
    Definition Classes
    TrainingParamsTrait
  64. final def getBorderCount: Int
    Definition Classes
    QuantizationParamsTrait
  65. final def getClass(): Class[_]
    Definition Classes
    AnyRef → Any
    Annotations
    @native()
  66. final def getClassNames: Array[String]
  67. final def getClassWeightsList: Array[Double]
  68. final def getClassWeightsMap: LinkedHashMap[String, Double]
  69. final def getClassesCount: Int
  70. final def getConnectTimeout: Duration
    Definition Classes
    TrainingParamsTrait
  71. final def getCustomMetric: Array[String]
    Definition Classes
    TrainingParamsTrait
  72. final def getDefault[T](param: Param[T]): Option[T]
    Definition Classes
    Params
  73. final def getDepth: Int
    Definition Classes
    TrainingParamsTrait
  74. final def getDiffusionTemperature: Float
    Definition Classes
    TrainingParamsTrait
  75. final def getEarlyStoppingRounds: Int
    Definition Classes
    TrainingParamsTrait
  76. final def getEvalMetric: String
    Definition Classes
    TrainingParamsTrait
  77. final def getFeatureBorderType: EBorderSelectionType
    Definition Classes
    QuantizationParamsTrait
  78. final def getFeatureWeightsList: Array[Double]
    Definition Classes
    TrainingParamsTrait
  79. final def getFeatureWeightsMap: LinkedHashMap[String, Double]
    Definition Classes
    TrainingParamsTrait
  80. final def getFeaturesCol: String
    Definition Classes
    HasFeaturesCol
  81. final def getFirstFeatureUsePenaltiesList: Array[Double]
    Definition Classes
    TrainingParamsTrait
  82. final def getFirstFeatureUsePenaltiesMap: LinkedHashMap[String, Double]
    Definition Classes
    TrainingParamsTrait
  83. final def getFoldLenMultiplier: Float
    Definition Classes
    TrainingParamsTrait
  84. final def getFoldPermutationBlock: Int
    Definition Classes
    TrainingParamsTrait
  85. final def getHasTime: Boolean
    Definition Classes
    TrainingParamsTrait
  86. final def getIgnoredFeaturesIndices: Array[Int]
    Definition Classes
    IgnoredFeaturesParams
  87. final def getIgnoredFeaturesNames: Array[String]
    Definition Classes
    IgnoredFeaturesParams
  88. final def getInputBorders: String
    Definition Classes
    QuantizationParamsTrait
  89. final def getIterations: Int
    Definition Classes
    TrainingParamsTrait
  90. final def getL2LeafReg: Float
    Definition Classes
    TrainingParamsTrait
  91. final def getLabelCol: String
    Definition Classes
    HasLabelCol
  92. final def getLeafEstimationBacktracking: ELeavesEstimationStepBacktracking
    Definition Classes
    TrainingParamsTrait
  93. final def getLeafEstimationIterations: Int
    Definition Classes
    TrainingParamsTrait
  94. final def getLeafEstimationMethod: ELeavesEstimation
    Definition Classes
    TrainingParamsTrait
  95. final def getLearningRate: Float
    Definition Classes
    TrainingParamsTrait
  96. final def getLoggingLevel: ELoggingLevel
    Definition Classes
    TrainingParamsTrait
  97. final def getLossFunction: String
    Definition Classes
    TrainingParamsTrait
  98. final def getMetricPeriod: Int
    Definition Classes
    TrainingParamsTrait
  99. final def getModelShrinkMode: EModelShrinkMode
    Definition Classes
    TrainingParamsTrait
  100. final def getModelShrinkRate: Float
    Definition Classes
    TrainingParamsTrait
  101. final def getMvsReg: Float
    Definition Classes
    TrainingParamsTrait
  102. final def getNanMode: ENanMode
    Definition Classes
    QuantizationParamsTrait
  103. def getNumClasses(dataset: Dataset[_], maxNumClasses: Int): Int
    Attributes
    protected
    Definition Classes
    Classifier
  104. final def getOdPval: Float
    Definition Classes
    TrainingParamsTrait
  105. final def getOdType: EOverfittingDetectorType
    Definition Classes
    TrainingParamsTrait
  106. final def getOdWait: Int
    Definition Classes
    TrainingParamsTrait
  107. final def getOneHotMaxSize: Int
    Definition Classes
    TrainingParamsTrait
  108. final def getOrDefault[T](param: Param[T]): T
    Definition Classes
    Params
  109. def getParam(paramName: String): Param[Any]
    Definition Classes
    Params
  110. final def getPenaltiesCoefficient: Float
    Definition Classes
    TrainingParamsTrait
  111. final def getPerFloatFeatureQuantizaton: Array[String]
    Definition Classes
    QuantizationParamsTrait
  112. final def getPerObjectFeaturePenaltiesList: Array[Double]
    Definition Classes
    TrainingParamsTrait
  113. final def getPerObjectFeaturePenaltiesMap: LinkedHashMap[String, Double]
    Definition Classes
    TrainingParamsTrait
  114. final def getPredictionCol: String
    Definition Classes
    HasPredictionCol
  115. final def getProbabilityCol: String
    Definition Classes
    HasProbabilityCol
  116. final def getRandomSeed: Int
    Definition Classes
    TrainingParamsTrait
  117. final def getRandomStrength: Float
    Definition Classes
    TrainingParamsTrait
  118. final def getRawPredictionCol: String
    Definition Classes
    HasRawPredictionCol
  119. final def getRsm: Float
    Definition Classes
    TrainingParamsTrait
  120. final def getSamplingFrequency: ESamplingFrequency
    Definition Classes
    TrainingParamsTrait
  121. final def getSamplingUnit: ESamplingUnit
    Definition Classes
    TrainingParamsTrait
  122. final def getSaveSnapshot: Boolean
    Definition Classes
    TrainingParamsTrait
  123. final def getScalePosWeight: Float
  124. final def getScoreFunction: EScoreFunction
    Definition Classes
    TrainingParamsTrait
  125. final def getSnapshotFile: String
    Definition Classes
    TrainingParamsTrait
  126. final def getSnapshotInterval: Duration
    Definition Classes
    TrainingParamsTrait
  127. final def getSparkPartitionCount: Int
    Definition Classes
    TrainingParamsTrait
  128. final def getSubsample: Float
    Definition Classes
    TrainingParamsTrait
  129. final def getTargetBorder: Float
  130. final def getThreadCount: Int
    Definition Classes
    ThreadCountParams
  131. def getThresholds: Array[Double]
    Definition Classes
    HasThresholds
  132. final def getTrainDir: String
    Definition Classes
    TrainingParamsTrait
  133. final def getUseBestModel: Boolean
    Definition Classes
    TrainingParamsTrait
  134. final def getWeightCol: String
    Definition Classes
    HasWeightCol
  135. final def getWorkerInitializationTimeout: Duration
    Definition Classes
    TrainingParamsTrait
  136. final def getWorkerMaxFailures: Int
    Definition Classes
    TrainingParamsTrait
  137. final def hasDefault[T](param: Param[T]): Boolean
    Definition Classes
    Params
  138. def hasParam(paramName: String): Boolean
    Definition Classes
    Params
  139. final val hasTime: BooleanParam
    Definition Classes
    TrainingParamsTrait
  140. def hashCode(): Int
    Definition Classes
    AnyRef → Any
    Annotations
    @native()
  141. final val ignoredFeaturesIndices: IntArrayParam
    Definition Classes
    IgnoredFeaturesParams
  142. final val ignoredFeaturesNames: StringArrayParam
    Definition Classes
    IgnoredFeaturesParams
  143. def initializeLogIfNecessary(isInterpreter: Boolean, silent: Boolean): Boolean
    Attributes
    protected
    Definition Classes
    Logging
  144. def initializeLogIfNecessary(isInterpreter: Boolean): Unit
    Attributes
    protected
    Definition Classes
    Logging
  145. final val inputBorders: Param[String]
    Definition Classes
    QuantizationParamsTrait
  146. final def isDefined(param: Param[_]): Boolean
    Definition Classes
    Params
  147. final def isInstanceOf[T0]: Boolean
    Definition Classes
    Any
  148. final def isSet(param: Param[_]): Boolean
    Definition Classes
    Params
  149. def isTraceEnabled(): Boolean
    Attributes
    protected
    Definition Classes
    Logging
  150. final val iterations: IntParam
    Definition Classes
    TrainingParamsTrait
  151. final val l2LeafReg: FloatParam
    Definition Classes
    TrainingParamsTrait
  152. final val labelCol: Param[String]
    Definition Classes
    HasLabelCol
  153. final val leafEstimationBacktracking: EnumParam[ELeavesEstimationStepBacktracking]
    Definition Classes
    TrainingParamsTrait
  154. final val leafEstimationIterations: IntParam
    Definition Classes
    TrainingParamsTrait
  155. final val leafEstimationMethod: EnumParam[ELeavesEstimation]
    Definition Classes
    TrainingParamsTrait
  156. final val learningRate: FloatParam
    Definition Classes
    TrainingParamsTrait
  157. def log: Logger
    Attributes
    protected
    Definition Classes
    Logging
  158. def logDebug(msg: ⇒ String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  159. def logDebug(msg: ⇒ String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  160. def logError(msg: ⇒ String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  161. def logError(msg: ⇒ String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  162. def logInfo(msg: ⇒ String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  163. def logInfo(msg: ⇒ String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  164. def logName: String
    Attributes
    protected
    Definition Classes
    Logging
  165. def logTrace(msg: ⇒ String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  166. def logTrace(msg: ⇒ String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  167. def logWarning(msg: ⇒ String, throwable: Throwable): Unit
    Attributes
    protected
    Definition Classes
    Logging
  168. def logWarning(msg: ⇒ String): Unit
    Attributes
    protected
    Definition Classes
    Logging
  169. final val loggingLevel: EnumParam[ELoggingLevel]
    Definition Classes
    TrainingParamsTrait
  170. final val lossFunction: Param[String]
    Definition Classes
    TrainingParamsTrait
  171. final val metricPeriod: IntParam
    Definition Classes
    TrainingParamsTrait
  172. final val modelShrinkMode: EnumParam[EModelShrinkMode]
    Definition Classes
    TrainingParamsTrait
  173. final val modelShrinkRate: FloatParam
    Definition Classes
    TrainingParamsTrait
  174. final val mvsReg: FloatParam
    Definition Classes
    TrainingParamsTrait
  175. final val nanMode: EnumParam[ENanMode]
    Definition Classes
    QuantizationParamsTrait
  176. final def ne(arg0: AnyRef): Boolean
    Definition Classes
    AnyRef
  177. final def notify(): Unit
    Definition Classes
    AnyRef
    Annotations
    @native()
  178. final def notifyAll(): Unit
    Definition Classes
    AnyRef
    Annotations
    @native()
  179. final val odPval: FloatParam
    Definition Classes
    TrainingParamsTrait
  180. final val odType: EnumParam[EOverfittingDetectorType]
    Definition Classes
    TrainingParamsTrait
  181. final val odWait: IntParam
    Definition Classes
    TrainingParamsTrait
  182. final val oneHotMaxSize: IntParam
    Definition Classes
    TrainingParamsTrait
  183. lazy val params: Array[Param[_]]
    Definition Classes
    Params
  184. final val penaltiesCoefficient: FloatParam
    Definition Classes
    TrainingParamsTrait
  185. final val perFloatFeatureQuantizaton: StringArrayParam
    Definition Classes
    QuantizationParamsTrait
  186. final val perObjectFeaturePenaltiesList: DoubleArrayParam
    Definition Classes
    TrainingParamsTrait
  187. final val perObjectFeaturePenaltiesMap: OrderedStringMapParam[Double]
    Definition Classes
    TrainingParamsTrait
  188. final val predictionCol: Param[String]
    Definition Classes
    HasPredictionCol
  189. def preprocessBeforeTraining(quantizedTrainPool: Pool, quantizedEvalPools: Array[Pool]): (Pool, Array[Pool], CatBoostTrainingContext)

    Override in descendants if necessary.

    Override in descendants if necessary.

    returns

    (preprocessedTrainPool, preprocessedEvalPools, catBoostTrainingContext)

    Attributes
    protected
    Definition Classes
    CatBoostClassifier → CatBoostPredictorTrait
  190. final val probabilityCol: Param[String]
    Definition Classes
    HasProbabilityCol
  191. final val randomSeed: IntParam
    Definition Classes
    TrainingParamsTrait
  192. final val randomStrength: FloatParam
    Definition Classes
    TrainingParamsTrait
  193. final val rawPredictionCol: Param[String]
    Definition Classes
    HasRawPredictionCol
  194. final val rsm: FloatParam
    Definition Classes
    TrainingParamsTrait
  195. final val samplingFrequency: EnumParam[ESamplingFrequency]
    Definition Classes
    TrainingParamsTrait
  196. final val samplingUnit: EnumParam[ESamplingUnit]
    Definition Classes
    TrainingParamsTrait
  197. def save(path: String): Unit
    Definition Classes
    MLWritable
    Annotations
    @Since( "1.6.0" ) @throws( ... )
  198. final val saveSnapshot: BooleanParam
    Definition Classes
    TrainingParamsTrait
  199. final val scalePosWeight: FloatParam
  200. final val scoreFunction: EnumParam[EScoreFunction]
    Definition Classes
    TrainingParamsTrait
  201. final def set(paramPair: ParamPair[_]): CatBoostClassifier.this.type
    Attributes
    protected
    Definition Classes
    Params
  202. final def set(param: String, value: Any): CatBoostClassifier.this.type
    Attributes
    protected
    Definition Classes
    Params
  203. final def set[T](param: Param[T], value: T): CatBoostClassifier.this.type
    Definition Classes
    Params
  204. final def setAllowConstLabel(value: Boolean): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  205. final def setAllowWritingFiles(value: Boolean): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  206. final def setApproxOnFullHistory(value: Boolean): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  207. final def setAutoClassWeights(value: EAutoClassWeightsType): CatBoostClassifier.this.type
  208. final def setBaggingTemperature(value: Float): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  209. final def setBestModelMinTrees(value: Int): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  210. final def setBootstrapType(value: EBootstrapType): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  211. final def setBorderCount(value: Int): CatBoostClassifier.this.type
    Definition Classes
    QuantizationParamsTrait
  212. final def setClassNames(value: Array[String]): CatBoostClassifier.this.type
  213. final def setClassWeightsList(value: Array[Double]): CatBoostClassifier.this.type
  214. final def setClassWeightsMap(value: LinkedHashMap[String, Double]): CatBoostClassifier.this.type
  215. final def setClassesCount(value: Int): CatBoostClassifier.this.type
  216. final def setConnectTimeout(value: Duration): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  217. final def setCustomMetric(value: Array[String]): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  218. final def setDefault(paramPairs: ParamPair[_]*): CatBoostClassifier.this.type
    Attributes
    protected
    Definition Classes
    Params
  219. final def setDefault[T](param: Param[T], value: T): CatBoostClassifier.this.type
    Attributes
    protected
    Definition Classes
    Params
  220. final def setDepth(value: Int): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  221. final def setDiffusionTemperature(value: Float): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  222. final def setEarlyStoppingRounds(value: Int): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  223. final def setEvalMetric(value: String): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  224. final def setFeatureBorderType(value: EBorderSelectionType): CatBoostClassifier.this.type
    Definition Classes
    QuantizationParamsTrait
  225. final def setFeatureWeightsList(value: Array[Double]): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  226. final def setFeatureWeightsMap(value: LinkedHashMap[String, Double]): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  227. def setFeaturesCol(value: String): CatBoostClassifier
    Definition Classes
    Predictor
  228. final def setFirstFeatureUsePenaltiesList(value: Array[Double]): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  229. final def setFirstFeatureUsePenaltiesMap(value: LinkedHashMap[String, Double]): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  230. final def setFoldLenMultiplier(value: Float): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  231. final def setFoldPermutationBlock(value: Int): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  232. final def setHasTime(value: Boolean): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  233. final def setIgnoredFeaturesIndices(value: Array[Int]): CatBoostClassifier.this.type
    Definition Classes
    IgnoredFeaturesParams
  234. final def setIgnoredFeaturesNames(value: Array[String]): CatBoostClassifier.this.type
    Definition Classes
    IgnoredFeaturesParams
  235. final def setInputBorders(value: String): CatBoostClassifier.this.type
    Definition Classes
    QuantizationParamsTrait
  236. final def setIterations(value: Int): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  237. final def setL2LeafReg(value: Float): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  238. def setLabelCol(value: String): CatBoostClassifier
    Definition Classes
    Predictor
  239. final def setLeafEstimationBacktracking(value: ELeavesEstimationStepBacktracking): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  240. final def setLeafEstimationIterations(value: Int): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  241. final def setLeafEstimationMethod(value: ELeavesEstimation): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  242. final def setLearningRate(value: Float): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  243. final def setLoggingLevel(value: ELoggingLevel): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  244. final def setLossFunction(value: String): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  245. final def setMetricPeriod(value: Int): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  246. final def setModelShrinkMode(value: EModelShrinkMode): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  247. final def setModelShrinkRate(value: Float): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  248. final def setMvsReg(value: Float): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  249. final def setNanMode(value: ENanMode): CatBoostClassifier.this.type
    Definition Classes
    QuantizationParamsTrait
  250. final def setOdPval(value: Float): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  251. final def setOdType(value: EOverfittingDetectorType): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  252. final def setOdWait(value: Int): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  253. final def setOneHotMaxSize(value: Int): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  254. final def setPenaltiesCoefficient(value: Float): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  255. final def setPerFloatFeatureQuantizaton(value: Array[String]): CatBoostClassifier.this.type
    Definition Classes
    QuantizationParamsTrait
  256. final def setPerObjectFeaturePenaltiesList(value: Array[Double]): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  257. final def setPerObjectFeaturePenaltiesMap(value: LinkedHashMap[String, Double]): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  258. def setPredictionCol(value: String): CatBoostClassifier
    Definition Classes
    Predictor
  259. def setProbabilityCol(value: String): CatBoostClassifier
    Definition Classes
    ProbabilisticClassifier
  260. final def setRandomSeed(value: Int): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  261. final def setRandomStrength(value: Float): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  262. def setRawPredictionCol(value: String): CatBoostClassifier
    Definition Classes
    Classifier
  263. final def setRsm(value: Float): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  264. final def setSamplingFrequency(value: ESamplingFrequency): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  265. final def setSamplingUnit(value: ESamplingUnit): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  266. final def setSaveSnapshot(value: Boolean): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  267. final def setScalePosWeight(value: Float): CatBoostClassifier.this.type
  268. final def setScoreFunction(value: EScoreFunction): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  269. final def setSnapshotFile(value: String): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  270. final def setSnapshotInterval(value: Duration): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  271. final def setSparkPartitionCount(value: Int): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  272. final def setSubsample(value: Float): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  273. final def setTargetBorder(value: Float): CatBoostClassifier.this.type
  274. final def setThreadCount(value: Int): CatBoostClassifier.this.type
    Definition Classes
    ThreadCountParams
  275. def setThresholds(value: Array[Double]): CatBoostClassifier
    Definition Classes
    ProbabilisticClassifier
  276. final def setTrainDir(value: String): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  277. final def setUseBestModel(value: Boolean): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  278. final def setWorkerInitializationTimeout(value: Duration): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  279. final def setWorkerMaxFailures(value: Int): CatBoostClassifier.this.type
    Definition Classes
    TrainingParamsTrait
  280. final val snapshotFile: Param[String]
    Definition Classes
    TrainingParamsTrait
  281. final val snapshotInterval: DurationParam
    Definition Classes
    TrainingParamsTrait
  282. final val sparkPartitionCount: IntParam
    Definition Classes
    TrainingParamsTrait
  283. final val subsample: FloatParam
    Definition Classes
    TrainingParamsTrait
  284. final def synchronized[T0](arg0: ⇒ T0): T0
    Definition Classes
    AnyRef
  285. final val targetBorder: FloatParam
  286. final val threadCount: IntParam
    Definition Classes
    ThreadCountParams
  287. val thresholds: DoubleArrayParam
    Definition Classes
    HasThresholds
  288. def toString(): String
    Definition Classes
    Identifiable → AnyRef → Any
  289. def train(dataset: Dataset[_]): CatBoostClassificationModel
    Attributes
    protected
    Definition Classes
    CatBoostPredictorTrait → Predictor
  290. final val trainDir: Param[String]
    Definition Classes
    TrainingParamsTrait
  291. def transformSchema(schema: StructType): StructType
    Definition Classes
    Predictor → PipelineStage
  292. def transformSchema(schema: StructType, logging: Boolean): StructType
    Attributes
    protected
    Definition Classes
    PipelineStage
    Annotations
    @DeveloperApi()
  293. val uid: String
    Definition Classes
    CatBoostClassifier → Identifiable
  294. final val useBestModel: BooleanParam
    Definition Classes
    TrainingParamsTrait
  295. def validateAndTransformSchema(schema: StructType, fitting: Boolean, featuresDataType: DataType): StructType
    Attributes
    protected
    Definition Classes
    ProbabilisticClassifierParams → ClassifierParams → PredictorParams
  296. def validateLabel(label: Double, numClasses: Int): Unit
    Attributes
    protected
    Definition Classes
    Classifier
  297. def validateNumClasses(numClasses: Int): Unit
    Attributes
    protected
    Definition Classes
    Classifier
  298. final def wait(): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws( classOf[java.lang.InterruptedException] )
  299. final def wait(arg0: Long, arg1: Int): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws( classOf[java.lang.InterruptedException] )
  300. final def wait(arg0: Long): Unit
    Definition Classes
    AnyRef
    Annotations
    @throws( classOf[java.lang.InterruptedException] ) @native()
  301. final val weightCol: Param[String]
    Definition Classes
    HasWeightCol
  302. final val workerInitializationTimeout: DurationParam
    Definition Classes
    TrainingParamsTrait
  303. final val workerMaxFailures: IntParam
    Definition Classes
    TrainingParamsTrait
  304. def write: MLWriter
    Definition Classes
    DefaultParamsWritable → MLWritable

Inherited from TrainingParamsTrait

Inherited from QuantizationParamsTrait

Inherited from ThreadCountParams

Inherited from IgnoredFeaturesParams

Inherited from DefaultParamsWritable

Inherited from MLWritable

Inherited from DatasetParamsTrait

Inherited from HasWeightCol

Inherited from ProbabilisticClassifier[Vector, CatBoostClassifier, CatBoostClassificationModel]

Inherited from ProbabilisticClassifierParams

Inherited from HasThresholds

Inherited from HasProbabilityCol

Inherited from Classifier[Vector, CatBoostClassifier, CatBoostClassificationModel]

Inherited from ClassifierParams

Inherited from HasRawPredictionCol

Inherited from Predictor[Vector, CatBoostClassifier, CatBoostClassificationModel]

Inherited from PredictorParams

Inherited from HasPredictionCol

Inherited from HasFeaturesCol

Inherited from HasLabelCol

Inherited from Estimator[CatBoostClassificationModel]

Inherited from PipelineStage

Inherited from Logging

Inherited from Params

Inherited from Serializable (scala.Serializable)

Inherited from Serializable (java.io.Serializable)

Inherited from Identifiable

Inherited from AnyRef

Inherited from Any

Ungrouped