ai.catboost.spark.params.QuantizationParams.scala Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of catboost-spark_3.5_2.13 Show documentation
Show all versions of catboost-spark_3.5_2.13 Show documentation
JVM module to use CatBoost on Apache Spark
The newest version!
package ai.catboost.spark.params;
import org.apache.spark.ml.param._
import org.apache.spark.ml.util.Identifiable
import ai.catboost.spark.params.macros.ParamGetterSetter
import ru.yandex.catboost.spark.catboost4j_spark.core.src.native_impl.{EBorderSelectionType,ENanMode};
/** Parameters for quantization. See documentation on [[https://catboost.ai/docs/]] for details.
 *
 *  Every param below is declared as a `final val` bound to this instance and is annotated
 *  with `@ParamGetterSetter` (imported from `ai.catboost.spark.params.macros`).
 *  NOTE(review): the annotation presumably generates the matching getter/setter methods;
 *  its expansion is not visible in this file, so confirm against the macro definition
 *  before changing the shape of any declaration.
 *
 *  Defaults mentioned in the description strings are documentation only as far as this
 *  trait shows: no `setDefault` call is made here.
 */
trait QuantizationParamsTrait
  extends Params with IgnoredFeaturesParams with ThreadCountParams
{
  // Per-feature quantization descriptions, one string per feature.
  // NOTE: the identifier and the param name are spelled "Quantizaton" (sic); both are part
  // of the public interface, so the spelling is kept.
  // NOTE(review): the format text pairs `nan_mode` with "BorderType" and `border_type` with
  // "border_selection_method"; left untouched here -- confirm against the CatBoost docs.
  @ParamGetterSetter
  final val perFloatFeatureQuantizaton: StringArrayParam = new StringArrayParam(
    this,
    "perFloatFeatureQuantizaton",
    // Trailing space keeps this sentence separated from the next concatenated fragment.
    "The quantization description for the given list of features (one or more). "
    + "Description format for a single feature:"
    + " FeatureId[:border_count=BorderCount][:nan_mode=BorderType][:border_type=border_selection_method]"
  )

  // Number of splits for numerical features (see the description string for the allowed range).
  @ParamGetterSetter
  final val borderCount: IntParam = new IntParam(
    this,
    "borderCount",
    "The number of splits for numerical features. Allowed values are integers from 1 to 65535 inclusively. "
    + "Default value is 254."
  )

  // Quantization mode for numerical features, expressed as an EBorderSelectionType value.
  @ParamGetterSetter
  final val featureBorderType: EnumParam[EBorderSelectionType] = new EnumParam[EBorderSelectionType](
    this,
    "featureBorderType",
    "The quantization mode for numerical features. See documentation for details. "
    + "Default value is 'GreedyLogSum'"
  )

  // How missing values in the input dataset are processed, expressed as an ENanMode value.
  @ParamGetterSetter
  final val nanMode: EnumParam[ENanMode] = new EnumParam[ENanMode](
    this,
    "nanMode",
    "The method for processing missing values in the input dataset. See documentation for details. "
    + "Default value is 'Min'"
  )

  // String param described as loading custom borders and missing-value modes from a file.
  // NOTE(review): presumably a file path; the expected format is not shown in this file.
  @ParamGetterSetter
  final val inputBorders: Param[String] = new Param[String](
    this,
    "inputBorders",
    "Load Custom quantization borders and missing value modes from a file (do not generate them)"
  )
}
/** Constants that accompany the quantization parameters. */
object QuantizationParams {

  /** Fixed value 200000; by its name, a cap on the subset size used by border-building
   *  algorithms. NOTE(review): the consumers of this constant are not visible in this file.
   */
  val MaxSubsetSizeForBuildBordersAlgorithms: Int = 200000
}
/** Parameters for quantization as a class. Used in [[Pool!.quantize(QuantizationParamsTrait)]].
 *  See documentation on [[https://catboost.ai/docs/]] for details.
 *
 *  @param uid identifier of this params instance
 */
class QuantizationParams(override val uid: String) extends QuantizationParamsTrait {

  /** Builds an instance whose `uid` comes from `Identifiable.randomUID`
   *  with the prefix "catboostQuantizationParams".
   */
  def this() = this(Identifiable.randomUID("catboostQuantizationParams"))

  /** Delegates to `defaultCopy`, passing `extra` through unchanged.
   *
   *  @param extra additional param map handed to `defaultCopy`
   *  @return the resulting `QuantizationParams`
   */
  override def copy(extra: ParamMap): QuantizationParams = {
    defaultCopy[QuantizationParams](extra)
  }
}
© 2015 - 2024 Weber Informatics LLC | Privacy Policy