![JAR search and dependency download from the Maven repository](/logo.png)
net.sansa_stack.owl.spark.rdd.FunctionalSyntaxOWLExpressionsRDDBuilder.scala Maven / Gradle / Ivy
package net.sansa_stack.owl.spark.rdd
import net.sansa_stack.owl.common.parsing.{FunctionalSyntaxExpressionBuilder, FunctionalSyntaxPrefixParsing}
import net.sansa_stack.owl.spark.hadoop.FunctionalSyntaxInputFormat
import org.apache.hadoop.io.{LongWritable, Text}
import org.apache.spark.sql.SparkSession
object FunctionalSyntaxOWLExpressionsRDDBuilder extends Serializable with FunctionalSyntaxPrefixParsing {
def build(spark: SparkSession, filePath: String): OWLExpressionsRDD = {
val hadoopRDD = spark.sparkContext.hadoopFile(
filePath, classOf[FunctionalSyntaxInputFormat], classOf[LongWritable],
classOf[Text], spark.sparkContext.defaultMinPartitions)
val rawRDD = hadoopRDD.map(entry => entry._2.toString)
val tmp: Array[(String, String)] =
rawRDD.filter(isPrefixDeclaration).map(parsePrefix).collect()
val prefixes: Map[String, String] = tmp.toMap
val builder = new FunctionalSyntaxExpressionBuilder(prefixes)
rawRDD.map(builder.clean).filter(_ != null)
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy