bio.ferlab.datalake.spark3.transformation.RegexReplace.scala Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of datalake-spark3_2.12 Show documentation
Show all versions of datalake-spark3_2.12 Show documentation
Library built on top of Apache Spark to speed up data lake development.
package bio.ferlab.datalake.spark3.transformation
import org.apache.spark.sql.DataFrame
import org.apache.spark.sql.functions.{col, regexp_replace}
/**
 * Transformation that applies a regular-expression replacement to one column
 * and stores the result in another (or the same) column.
 *
 * @param sourcefield      name of the column whose value is read
 * @param destinationfield name of the column that receives the result; passed
 *                         as-is to `DataFrame.withColumn`
 * @param pattern          regular expression handed to Spark's `regexp_replace`
 * @param replacement      replacement string handed to Spark's `regexp_replace`
 */
case class RegexReplace(sourcefield: String, destinationfield: String, pattern: String, replacement: String) extends Transformation {

  /**
   * Builds the DataFrame-to-DataFrame function performing the replacement.
   *
   * @return a function that, given a DataFrame, returns it with
   *         `destinationfield` set to the regex-replaced value of `sourcefield`
   */
  override def transform: DataFrame => DataFrame = { input =>
    // The column expression is built inside the lambda so it is only
    // evaluated when the returned function is applied to a DataFrame.
    val replaced = regexp_replace(col(sourcefield), pattern, replacement)
    input.withColumn(destinationfield, replaced)
  }
}