Skip to content

Commit

Permalink
Initial commit
Browse files: browse the repository at this point in the history
  • Loading branch information
andrewresearch committed Jul 1, 2020
0 parents commit 85c1c80
Show file tree
Hide file tree
Showing 4 changed files with 51 additions and 0 deletions.
5 changes: 5 additions & 0 deletions .gitignore
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
# Project exclude paths
# Each pattern starts with "/" so it is anchored to the directory holding this
# .gitignore, and ends with "/" so it only matches directories.
# Output directories under the sbt meta-build (project/) tree.
/project/project/target/
/project/target/
# Top-level target/ directory.
/target/
# NOTE(review): this path lies inside /target/, which the previous pattern
# already excludes, so this entry looks redundant.
/target/scala-2.11/classes/
15 changes: 15 additions & 0 deletions build.sbt
Original file line number Diff line number Diff line change
@@ -0,0 +1,15 @@
// Project coordinates.
name := "core"

organization := "io.nlytx"

version := "0.1"

// Scala release used to compile the project; `%%` below appends its binary
// version to each artifact name.
scalaVersion := "2.11.12"


// Spark modules all share one version, followed by the Spark NLP library.
libraryDependencies ++= {
  val sparkVersion = "2.4.6"
  val sparkModules = Seq("spark-core", "spark-sql", "spark-mllib")
    .map(module => "org.apache.spark" %% module % sparkVersion)
  sparkModules :+ ("com.johnsnowlabs.nlp" %% "spark-nlp" % "2.5.2")
}
5 changes: 5 additions & 0 deletions src/main/scala/io/nlytx/core/CoRE.scala
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
package io.nlytx.core

/** Top-level object of the `io.nlytx.core` package; it currently declares no members. */
object CoRE {}
26 changes: 26 additions & 0 deletions src/main/scala/io/nlytx/core/spark/File.scala
Original file line number Diff line number Diff line change
@@ -0,0 +1,26 @@
package io.nlytx.core.spark

import org.apache.spark.ml.PipelineModel
import org.apache.spark.sql.{DataFrame, SparkSession}

/**
  * Loads and saves Spark DataFrames and ML pipeline models under a common base path.
  *
  * DataFrames are stored at `basePath/fileName.dataframe` and pipeline models at
  * `basePath/fileName.pipelinemodel`.
  *
  * @param basePath directory (or URI prefix) that every file name is resolved against
  * @param spark    session used to read DataFrames
  */
case class File(basePath:String)(implicit val spark:SparkSession) {

  import org.apache.spark.sql.SaveMode

  /** Location of the DataFrame stored under `fileName`. */
  private def dataFramePath(fileName: String): String =
    s"${basePath}/${fileName}.dataframe"

  /** Location of the pipeline model stored under `fileName`. */
  private def pipelineModelPath(fileName: String): String =
    s"${basePath}/${fileName}.pipelinemodel"

  /**
    * Reads the DataFrame stored under `fileName`.
    *
    * No format is set on the reader, so the session's default data source is used.
    *
    * @param fileName name of the DataFrame, without the `.dataframe` suffix
    * @return the loaded DataFrame
    */
  def loadDataFrame(fileName:String): DataFrame =
    spark.read.load(dataFramePath(fileName))

  /**
    * Writes `df` under `fileName`.
    *
    * @param df        DataFrame to write
    * @param fileName  name of the DataFrame, without the `.dataframe` suffix
    * @param overwrite when true the write uses `SaveMode.Overwrite`; otherwise
    *                  `SaveMode.ErrorIfExists` is used, so an existing target makes the write fail
    */
  def saveDataFrame(df:DataFrame,fileName:String,overwrite:Boolean = false): Unit = {
    // The enum replaces the former "overwrite" / "ErrorIfExists" strings: same modes, checked at compile time.
    val saveMode = if (overwrite) SaveMode.Overwrite else SaveMode.ErrorIfExists
    df.write.mode(saveMode).save(dataFramePath(fileName))
  }

  /**
    * Loads the pipeline model stored under `fileName`.
    *
    * @param fileName name of the model, without the `.pipelinemodel` suffix
    * @return the loaded pipeline model
    */
  def loadPipelineModel(fileName:String): PipelineModel =
    PipelineModel.load(pipelineModelPath(fileName))

  /**
    * Saves `model` under `fileName`.
    *
    * @param model     fitted pipeline model to persist
    * @param fileName  name of the model, without the `.pipelinemodel` suffix
    * @param overwrite when true the writer is switched to overwrite mode before saving;
    *                  otherwise the writer's default behaviour applies
    */
  def savePipelineModel(model:PipelineModel, fileName:String, overwrite:Boolean = false): Unit = {
    // Choose the writer first so the target path is built and saved in one place.
    val writer = if (overwrite) model.write.overwrite() else model.write
    writer.save(pipelineModelPath(fileName))
  }
}

0 comments on commit 85c1c80

Please sign in to comment.