streaming.dsl.load.batch.AutoWorkflowExplain.scala Maven / Gradle / Ivy

Show more of this group Show more artifacts with this name
Show all versions of streamingpro-mlsql-spark_2.4 Show documentation
The newest version!
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package streaming.dsl.load.batch

import com.google.common.reflect.ClassPath
import net.csdn.common.reflect.ReflectHelper
import org.apache.spark.sql.{Row, SparkSession, _}
import org.apache.spark.sql.types.{StringType, StructField, StructType}
import scala.collection.JavaConversions._

/**
  * Created by allwefantasy on 21/9/2018.
  */
object AutoWorkflowSelfExplain {

  /**
    * Factory mirroring the class constructor, with the session passed as a
    * regular fourth argument instead of a second parameter list.
    *
    * @param format       format name handed to the explainer
    * @param path         path handed to the explainer
    * @param option       options handed to the explainer
    * @param sparkSession session the explainer uses to build DataFrames
    * @return a new, not yet evaluated [[AutoWorkflowSelfExplain]]
    */
  def apply(
             format: String,
             path: String,
             option: Map[String, String],
             sparkSession: SparkSession
           ): AutoWorkflowSelfExplain = {
    val explainer = new AutoWorkflowSelfExplain(format, path, option)(sparkSession)
    explainer
  }
}


/**
  * Fluent helper that checks whether `format` is one of the workflow help
  * formats and, if it is, builds the corresponding help table; otherwise a
  * caller-supplied fallback produces the table.
  *
  * Intended call chain: `isMatch.thenDo().orElse(() => fallback).get()`.
  *
  * @param format       format name to test against the workflow help formats
  * @param path         path forwarded to the individual explainers
  * @param option       options forwarded to the individual explainers
  * @param sparkSession session forwarded to the individual explainers
  */
class AutoWorkflowSelfExplain(format: String, path: String, option: Map[String, String])(sparkSession: SparkSession) {
  // Result of the chain. Stays null until either explain() or OrElse.orElse assigns it,
  // so get() returns null if the chain was never run.
  private var table: DataFrame = _

  /**
    * Starts the chain.
    *
    * @return a [[Then]] carrying whether `format` is one of the workflow help formats
    */
  def isMatch: Then = {
    val handled = Set("workflow", "workflowList", "workflowParams", "workflowExample", "workflowTypes")
    new Then(this, handled.contains(format))
  }

  /**
    * Runs the first explainer whose `isMatch` is true and stores its table.
    *
    * @throws NoSuchElementException when no explainer accepts the format/path
    *                                combination (for example `workflowParams`,
    *                                which `isMatch` accepts but no explainer here handles)
    */
  def explain(): Unit = {
    val explainers = List(
      new AutoWorkflowStartup(format, path, option)(sparkSession),
      new AutoWorkflowList(format, path, option)(sparkSession),
      new AutoWorkflowTypes(format, path, option)(sparkSession)
    )
    // `find` instead of `filter(...).head`: same first-match semantics, but the
    // empty case is reported with a message naming the offending input rather
    // than the bare "head of empty list". The exception type is unchanged.
    table = explainers.find(_.isMatch).map(_.explain).getOrElse(
      throw new NoSuchElementException(
        s"No workflow explainer matches format '$format' with path '$path'")
    )
  }

  /**
    * First step of the chain.
    *
    * @param parent  the explainer whose table is filled in
    * @param isMatch whether the format was recognised
    */
  class Then(parent: AutoWorkflowSelfExplain, isMatch: Boolean) {
    /**
      * Evaluates the explainers when the format was recognised.
      *
      * @return the [[OrElse]] step, carrying the same match flag
      */
    def thenDo(): OrElse = {
      if (isMatch) {
        parent.explain()
      }
      new OrElse(parent, isMatch)
    }

  }

  /**
    * Second step of the chain.
    *
    * @param parent  the explainer whose table is filled in
    * @param isMatch whether the format was recognised
    */
  class OrElse(parent: AutoWorkflowSelfExplain, isMatch: Boolean) {
    /**
      * Uses `f` to produce the table when the format was not recognised.
      * `f` is not invoked when the format matched.
      *
      * @param f fallback table producer
      * @return the parent, so `get()` can be called on it
      */
    def orElse(f: () => DataFrame): AutoWorkflowSelfExplain = {
      if (!isMatch) {
        parent.table = f()
      }
      parent
    }

  }

  /**
    * @return the table stored by the chain, or null if nothing was stored yet
    */
  def get(): DataFrame = {
    table
  }
}

/**
  * Explainer for the `workflow` format with an empty path: returns a single
  * help row that shows the command for listing workflows.
  *
  * @param format       format name; only "workflow" is accepted
  * @param path         must be empty for this explainer to match
  * @param option       unused by this explainer
  * @param sparkSession session used to build the help table
  */
class AutoWorkflowStartup(format: String, path: String, option: Map[String, String])(sparkSession: SparkSession) extends SelfExplain {

  /** True only for format "workflow" combined with an empty path. */
  override def isMatch: Boolean = {
    val isWorkflowFormat = format == "workflow"
    isWorkflowFormat && path.isEmpty
  }

  /**
    * Builds the one-row help table.
    *
    * @return a DataFrame with string columns `desc` and `command`
    */
  override def explain: DataFrame = {
    val helpSchema = StructType(Seq(
      StructField("desc", StringType),
      StructField("command", StringType)
    ))
    val helpRow = Row("command:list ", "load workflow.`list` as output;")
    // Single partition: the table only ever holds this one row.
    val helpRdd = sparkSession.sparkContext.parallelize(Seq(helpRow), 1)
    sparkSession.createDataFrame(helpRdd, helpSchema)
  }
}


/**
  * Explainer that lists workflow names, matched by `workflow` with path
  * `list` or by the `workflowList` format.
  *
  * The names come from `streaming.dsl.mmlib.algs.AutoFeature#listWorkflows`,
  * which is looked up reflectively; when that class cannot be instantiated the
  * result is an empty table.
  *
  * @param format       format name
  * @param path         path given to the format
  * @param option       unused by this explainer
  * @param sparkSession session used to build the result table
  */
class AutoWorkflowList(format: String, path: String, option: Map[String, String])(sparkSession: SparkSession) extends SelfExplain {

  /** True for (`workflow`, `list`) or for the `workflowList` format with any path. */
  override def isMatch: Boolean = {
    (format == "workflow" && path == "list") || (format == "workflowList")
  }

  /**
    * Builds the table of workflow names.
    *
    * The table always has the single string column `name`, including when it
    * is empty because `AutoFeature` is unavailable, so the schema does not
    * depend on what happens to be on the classpath.
    *
    * @return a DataFrame with one string column `name`
    */
  override def explain: DataFrame = {
    // Best effort: failing to load or instantiate the class is treated as
    // "no workflows available" rather than an error.
    val autoFeature =
      try {
        Some(Class.forName("streaming.dsl.mmlib.algs.AutoFeature").newInstance())
      } catch {
        case _: Exception => None
      }

    // The reflective call stays outside the try above, so failures inside
    // listWorkflows still propagate to the caller.
    // NOTE(review): the cast assumes listWorkflows returns Seq[String] — confirm against AutoFeature.
    val workflowNames = autoFeature
      .map(instance => ReflectHelper.method(instance, "listWorkflows").asInstanceOf[Seq[String]])
      .getOrElse(Seq.empty[String])

    val items = workflowNames.map(name => Row.fromSeq(Seq(name)))
    val rows = sparkSession.sparkContext.parallelize(items, 1)
    sparkSession.createDataFrame(rows,
      StructType(Seq(
        StructField(name = "name", dataType = StringType)
      )))
  }
}

/**
  * Explainer that lists the simple names of the top-level classes found in
  * package `com.salesforce.op.features.types`, matched by `workflow` with path
  * `types` or by the `workflowTypes` format.
  *
  * @param format       format name
  * @param path         path given to the format
  * @param option       unused by this explainer
  * @param sparkSession session used to build the result table
  */
class AutoWorkflowTypes(format: String, path: String, option: Map[String, String])(sparkSession: SparkSession) extends SelfExplain {

  /** True for (`workflow`, `types`) or for the `workflowTypes` format with any path. */
  override def isMatch: Boolean = {
    val viaWorkflowPath = format == "workflow" && path == "types"
    viaWorkflowPath || (format == "workflowTypes")
  }

  /**
    * Scans the classpath visible to this class's class loader and builds the table.
    *
    * @return a DataFrame with string columns `name` (class simple name) and
    *         `desc` (always the empty string)
    */
  override def explain: DataFrame = {
    val typeSchema = StructType(Seq(
      StructField("name", StringType),
      StructField("desc", StringType)
    ))
    val typeClasses = ClassPath.from(getClass.getClassLoader)
      .getTopLevelClasses("com.salesforce.op.features.types")
    // Mapping happens on the set view of the Java collection before it is
    // turned into a sequence, so identical rows collapse into one.
    val typeRows = typeClasses.map(info => Row(info.getSimpleName, "")).toSeq
    val typeRdd = sparkSession.sparkContext.parallelize(typeRows, 1)
    sparkSession.createDataFrame(typeRdd, typeSchema)
  }
}