// Page header from the source listing (not code): tus.sparktree.1.8.0.source-code.CovType_Unpack.scala Maven / Gradle / Ivy
/*
* Copyright (c) 2019 by Andrew Charneski.
*
* The author licenses this file to you under the
* Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance
* with the License. You may obtain a copy
* of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
import com.simiacryptus.aws.exe.EC2NodeSettings
import com.simiacryptus.sparkbook._
import com.simiacryptus.sparkbook.repl.{SparkRepl, SparkSessionProvider}
import com.simiacryptus.sparkbook.util.{LocalRunner, Logging}
import org.apache.spark.sql.SaveMode
/**
 * Spark REPL task that writes the CovType dataset to Parquet and exposes the
 * persisted copy under the temporary view name `covtype`.
 *
 * Concrete runners are expected to mix in the traits that supply the
 * execution environment.
 */
abstract class CovType_Unpack extends SparkRepl with Logging with SparkSessionProvider {

  /** Default command: a `%sql` query counting rows per `Cover_Type` in the `covtype` view. */
  override val defaultCmd: String =
    """%sql
      |SELECT COUNT(*) AS count, Cover_Type FROM covtype GROUP BY Cover_Type
      |""".stripMargin

  /** Location the Parquet copy is written to and subsequently read back from. */
  val destination: String = "s3a://simiacryptus/data/covtype/"

  /**
   * Persists the frame returned by `CovType.dataframe` to [[destination]]
   * (overwriting anything already there) and registers the re-read Parquet
   * data as the `covtype` temporary view.
   */
  override def init(): Unit = {
    // NOTE(review): fixed 30 s pause before any work is done; the reason is not
    // visible in this file — presumably it waits for the environment to settle. Confirm.
    Thread.sleep(30000)

    val covtypeData = CovType.dataframe(spark)

    // Step 1: replace whatever is stored at the destination with a fresh copy.
    val parquetWriter = covtypeData.write.mode(SaveMode.Overwrite)
    parquetWriter.parquet(destination)

    // Step 2: the view is backed by the stored Parquet files rather than by
    // the in-memory frame, so it is read back through the frame's own session.
    val persisted = covtypeData.sparkSession.sqlContext.read.parquet(destination)
    persisted.createOrReplaceTempView("covtype")
  }
}
/**
 * Runner for [[CovType_Unpack]] that combines `LocalRunner` with
 * `NotebookRunner`, overriding the HTTP port to 1081.
 */
object CovType_Unpack_Local
  extends CovType_Unpack
    with LocalRunner[Object]
    with NotebookRunner[Object] {

  /** HTTP port used by this runner. */
  override def http_port: Int = 1081
}
/**
 * Runner for [[CovType_Unpack]] that combines `EC2Runner` with
 * `AWSNotebookRunner`, using the `T2_L` node settings.
 */
object CovType_Unpack_EC2
  extends CovType_Unpack
    with EC2Runner[Object]
    with AWSNotebookRunner[Object] {

  /**
   * S3 bucket name, taken from the second element of `envTuple`.
   * NOTE(review): `envTuple` is not defined in this file — presumably inherited
   * from one of the mixed-in runner traits; confirm.
   */
  override val s3bucket: String = envTuple._2

  /** Node settings for this runner: `EC2NodeSettings.T2_L`. */
  override def nodeSettings: EC2NodeSettings = EC2NodeSettings.T2_L
}
// Page footer from the source listing (not code): © 2015 - 2025 Weber Informatics LLC | Privacy Policy