All Downloads are FREE. Search and download functionalities are using the official Maven repository.

ai.catboost.spark.params.QuantizationParams.scala Maven / Gradle / Ivy

package ai.catboost.spark.params;

import org.apache.spark.ml.param._
import org.apache.spark.ml.util.Identifiable

import ai.catboost.spark.params.macros.ParamGetterSetter

import ru.yandex.catboost.spark.catboost4j_spark.core.src.native_impl.{EBorderSelectionType,ENanMode};

/** Parameters for quantization. See documentation on [[https://catboost.ai/docs/]] for details.
 *
 *  Declares the Spark ML `Param`s that describe how numerical features are quantized, on top of
 *  the parameters inherited from `IgnoredFeaturesParams` and `ThreadCountParams`.
 *
 *  Every parameter is annotated with `@ParamGetterSetter` (from `ai.catboost.spark.params.macros`),
 *  which presumably generates the matching getter/setter pair -- confirm against the macro source.
 *  For that reason each declaration is kept in the uniform shape
 *  `final val name: Type = new Type(this, "name", "description")`.
 *
 *  This trait itself does not call `setDefault`; the "Default value is ..." sentences below are
 *  descriptive text only (presumably the defaults are applied by the native library -- confirm).
 */
trait QuantizationParamsTrait
  extends Params with IgnoredFeaturesParams with ThreadCountParams
{
  /** Per-feature quantization overrides, one description string per feature (or feature group).
   *
   *  The identifier and the parameter name keep their historical spelling ("Quantizaton") because
   *  both are part of the public interface.
   */
  // NOTE(review): the `nan_mode=BorderType` placeholder in the format string looks mislabelled
  // (a NaN mode, not a border type, is expected there) -- confirm against the CatBoost docs
  // before rewording it.
  @ParamGetterSetter
  final val perFloatFeatureQuantizaton: StringArrayParam = new StringArrayParam(
    this,
    "perFloatFeatureQuantizaton",
    // Trailing space keeps the two sentences separated in the rendered parameter description.
    "The quantization description for the given list of features (one or more). "
    + "Description format for a single feature:"
    + " FeatureId[:border_count=BorderCount][:nan_mode=BorderType][:border_type=border_selection_method]"
  )

  /** Number of splits (borders) used for numerical features. */
  @ParamGetterSetter
  final val borderCount: IntParam = new IntParam(
    this,
    "borderCount",
    "The number of splits for numerical features. Allowed values are integers from 1 to 65535 inclusively. "
    + "Default value is 254."
  )

  /** Border selection (quantization) mode for numerical features, as an `EBorderSelectionType`. */
  @ParamGetterSetter
  final val featureBorderType: EnumParam[EBorderSelectionType] = new EnumParam[EBorderSelectionType](
    this,
    "featureBorderType",
    "The quantization mode for numerical features. See documentation for details. "
    + "Default value is 'GreedyLogSum'"
  )

  /** Strategy for handling missing values in the input dataset, as an `ENanMode`. */
  @ParamGetterSetter
  final val nanMode: EnumParam[ENanMode] = new EnumParam[ENanMode](
    this,
    "nanMode",
    "The method for processing missing values in the input dataset. See documentation for details. "
    + "Default value is 'Min'"
  )

  /** Location of a file with precomputed borders and missing value modes to load instead of
   *  generating them.
   */
  @ParamGetterSetter
  final val inputBorders: Param[String] = new Param[String](
    this,
    "inputBorders",
    "Load Custom quantization borders and missing value modes from a file (do not generate them)"
  )
}

/** Companion object of the `QuantizationParams` class; holds quantization-related constants. */
object QuantizationParams {
  /** Upper bound on a subset size used by the border-building algorithms, judging by the name.
   *
   *  NOTE(review): the constant is not referenced in this file, so its exact use is to be
   *  confirmed at the call sites.
   */
  val MaxSubsetSizeForBuildBordersAlgorithms: Int = 200000
}

/** Standalone, instantiable carrier of the quantization parameters declared in
 *  `QuantizationParamsTrait`. Used in [[Pool!.quantize(QuantizationParamsTrait)]].
 *  See documentation on [[https://catboost.ai/docs/]] for details.
 *
 *  @param uid unique identifier of this parameter set
 */
class QuantizationParams(override val uid: String) extends QuantizationParamsTrait {

  /** Creates an instance whose uid is generated by `Identifiable.randomUID` from the
   *  "catboostQuantizationParams" prefix.
   */
  def this() = {
    this(Identifiable.randomUID("catboostQuantizationParams"))
  }

  /** Copies this parameter set by delegating to Spark's `defaultCopy`.
   *
   *  @param extra additional parameter values handed over to `defaultCopy`
   *  @return the copy, typed as `QuantizationParams`
   */
  override def copy(extra: ParamMap): QuantizationParams = {
    defaultCopy[QuantizationParams](extra)
  }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy