// All Downloads are FREE. Search and download functionalities are using the official Maven repository.

// com.stratio.provider.mongodb.DefaultSource.scala Maven / Gradle / Ivy

// The newest version!
/*
 *  Licensed to STRATIO (C) under one or more contributor license agreements.
 *  See the NOTICE file distributed with this work for additional information
 *  regarding copyright ownership. The STRATIO (C) licenses this file
 *  to you under the Apache License, Version 2.0 (the
 *  "License"); you may not use this file except in compliance
 *  with the License. You may obtain a copy of the License at
 *
 *  http://www.apache.org/licenses/LICENSE-2.0
 *
 *  Unless required by applicable law or agreed to in writing,
 *  software distributed under the License is distributed on an
 *  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 *  KIND, either express or implied. See the License for the
 *  specific language governing permissions and limitations
 *  under the License.
 */

package com.stratio.provider.mongodb

import com.mongodb.MongoCredential
import com.mongodb.casbah.Imports._
import com.stratio.provider.DeepConfig._
import org.apache.spark.sql.SaveMode._
import org.apache.spark.sql.sources.BaseRelation
import org.apache.spark.sql.sources.RelationProvider
import org.apache.spark.sql.sources.SchemaRelationProvider
import org.apache.spark.sql.sources.CreatableRelationProvider
import org.apache.spark.sql.types.StructType
import org.apache.spark.sql.{DataFrame, SaveMode, SQLContext}
import MongodbConfig._

/**
 * Allows creation of MongoDB based tables using
 * the syntax CREATE TEMPORARY TABLE ... USING com.stratio.provider.mongodb.
 * Required options are detailed in [[com.stratio.provider.mongodb.MongodbConfig]]
 *
 * The same option parsing is shared by the three `createRelation` overloads
 * (read, read with a user supplied schema, and write).
 */
class DefaultSource extends RelationProvider with SchemaRelationProvider with CreatableRelationProvider{

  /**
   * Creates a relation from the given options.
   *
   * @param sqlContext context the relation is bound to
   * @param parameters data source options
   * @return relation built from the parsed options
   */
  override def createRelation(
   sqlContext: SQLContext,
   parameters: Map[String, String]): BaseRelation =
    buildRelation(sqlContext, parameters)

  /**
   * Creates a relation from the given options.
   *
   * NOTE(review): `schema` is accepted but not forwarded to the relation, so
   * a user supplied schema currently has no effect here. Confirm whether
   * `MongodbRelation` can take it before changing this.
   *
   * @param sqlContext context the relation is bound to
   * @param parameters data source options
   * @param schema     user supplied schema (currently unused)
   * @return relation built from the parsed options
   */
  override def createRelation(
   sqlContext: SQLContext,
   parameters: Map[String, String],
   schema: StructType): BaseRelation =
    buildRelation(sqlContext, parameters)

  /**
   * Creates a relation from the given options and writes `data` through it
   * according to `mode`:
   *
   *  - `Append`: insert without overwriting.
   *  - `Overwrite`: insert with overwriting.
   *  - `ErrorIfExists`: insert only when the collection is empty, fail otherwise.
   *  - `Ignore`: insert only when the collection is empty, do nothing otherwise.
   *
   * @param sqlContext context the relation is bound to
   * @param mode       save mode selecting the write behaviour
   * @param parameters data source options
   * @param data       rows to write
   * @return the relation the data was written through
   * @throws UnsupportedOperationException in `ErrorIfExists` mode when the
   *                                       collection is not empty
   */
  override def createRelation(
   sqlContext: SQLContext,
   mode: SaveMode,
   parameters: Map[String, String],
   data: DataFrame): BaseRelation = {

    val mongodbRelation = buildRelation(sqlContext, parameters)

    mode match {
      case Append =>
        mongodbRelation.insert(data, overwrite = false)
      case Overwrite =>
        mongodbRelation.insert(data, overwrite = true)
      case ErrorIfExists =>
        if (mongodbRelation.isEmptyCollection) mongodbRelation.insert(data, overwrite = false)
        else throw new UnsupportedOperationException("Writing in a non-empty collection.")
      case Ignore =>
        if (mongodbRelation.isEmptyCollection) mongodbRelation.insert(data, overwrite = false)
    }

    mongodbRelation
  }

  /** Builds the relation shared by every `createRelation` overload. */
  private def buildRelation(sqlContext: SQLContext, parameters: Map[String, String]) =
    MongodbRelation(
      MongodbConfigBuilder()
        .apply(parseParameters(parameters))
        .build())(sqlContext)

  /**
   * Converts the raw string options into the typed property map handed to
   * the configuration builder.
   *
   * Host, database and collection fall back to `notFound` when missing
   * (defined elsewhere; presumably it raises - confirm). Sampling ratio and
   * read preference fall back to their defaults. Credentials, SSL options,
   * id field, search fields and language are only added when provided.
   *
   * @param parameters data source options
   * @return typed properties keyed by option name
   * @throws IllegalArgumentException when credentials or SSL options are
   *                                  provided but malformed
   */
  private def parseParameters(parameters : Map[String,String]): Map[String, Any] = {

    /** We will assume hosts are provided like 'host:port,host2:port2,...' */
    val host = parameters
      .getOrElse(Host, notFound[String](Host))
      .split(",").toList

    val database = parameters.getOrElse(Database, notFound(Database))

    val collection = parameters.getOrElse(Collection, notFound(Collection))

    val samplingRatio = parameters
      .get(SamplingRatio)
      .map(_.toDouble).getOrElse(DefaultSamplingRatio)

    val readpreference = parameters.getOrElse(readPreference, DefaultReadPreference)

    val properties: Map[String, Any] =
      Map(Host -> host, Database -> database, Collection -> collection , SamplingRatio -> samplingRatio, readPreference -> readpreference)

    // A blank value (historically a single space) means "not provided".
    def provided(key: String): Option[String] = parameters.get(key).filter(_.trim.nonEmpty)

    val optionalProperties: List[Option[(String, Any)]] = List(
      provided(Credentials).map(input => Credentials -> parseCredentials(input)),
      provided(SSLOptions).map(input => SSLOptions -> parseSSLOptions(input)),
      parameters.get(IdField).map(idField => IdField -> idField),
      /** We will assume fields are provided like 'field1,field2,...' */
      parameters.get(SearchFields).map(fields => SearchFields -> fields.split(",")),
      parameters.get(Language).map(language => Language -> language))

    properties ++ optionalProperties.flatten
  }

  /**
   * Parses credentials provided like 'user,database,password;user,database,password;...'.
   * Fields after the third one in an entry are ignored.
   * The offending value is never echoed in the error because it holds a password.
   */
  private def parseCredentials(input: String) =
    input.split(";").toList.map { credential =>
      credential.split(",") match {
        case Array(user, database, password, _*) =>
          MongodbCredentials(user, database, password.toCharArray)
        case _ =>
          throw new IllegalArgumentException(
            s"Malformed '$Credentials' option: expected 'user,database,password' entries separated by ';'")
      }
    }

  /**
   * Parses SSL options provided like
   * '/path/keystorefile,keystorepassword,/path/truststorefile,truststorepassword'.
   * Fields after the fourth one are ignored.
   * The offending value is never echoed in the error because it holds passwords.
   */
  private def parseSSLOptions(input: String) =
    input.split(",") match {
      case Array(keyStore, keyStorePassword, trustStore, trustStorePassword, _*) =>
        MongodbSSLOptions(Some(keyStore), Some(keyStorePassword), trustStore, Some(trustStorePassword))
      case _ =>
        throw new IllegalArgumentException(
          s"Malformed '$SSLOptions' option: expected " +
            "'/path/keystorefile,keystorepassword,/path/truststorefile,truststorepassword'")
    }

}




// © 2015 - 2024 Weber Informatics LLC | Privacy Policy