Commit 5c0919b

Update
1 parent 0fd7f4f commit 5c0919b

6 files changed: +293 −26 lines changed

simple-spark-sources/build.sbt

Lines changed: 4 additions & 4 deletions

@@ -1,5 +1,5 @@
 
-organization := "generated"
+organization := "com.example"
 
 name := "simple-spark"
 
@@ -9,7 +9,7 @@ crossPaths := true
 
 scalaVersion := "2.10.6"
 
-maintainer := "" //Docker
+maintainer := "DF" //Docker
 
 resolvers ++= Seq(
   "Maven2 Local" at "file:/Users/vidma-vinted/.m2/repository/" ,
@@ -42,7 +42,7 @@ dockerExposedPorts := Seq(9000, 9443)
 
 daemonUser in Docker := "root"
 
-packageName in Docker := "generated.simplespark"
+packageName in Docker := "com.example.simplespark"
 
 mappings in Docker ++= directory("spark-lib")
 
@@ -152,7 +152,7 @@ libraryDependencies += "com.google.guava" % "guava" % "16.0.1" force()
 test in assembly := {}
 
 //main class
-mainClass in assembly := Some("generated.Main")
+mainClass in assembly := Some("com.example.Main")
 
 artifact in (Compile, assembly) ~= { art =>
   art.copy(`classifier` = Some("assembly"))
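
The four hunks above form one coordinated rename from the scaffolded `generated` namespace to `com.example`, plus a non-empty Docker maintainer. Read together, the settings this commit touches look like the following sketch (assuming, as the surrounding build does, sbt-native-packager for the Docker keys and sbt-assembly for `mainClass in assembly`):

// Sketch: net effect of this commit on build.sbt (not the full file)
organization := "com.example"                       // was "generated"
maintainer := "DF" //Docker                         // was "", presumably to give the image a non-empty maintainer
packageName in Docker := "com.example.simplespark"  // was "generated.simplespark"
mainClass in assembly := Some("com.example.Main")   // was Some("generated.Main")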
Lines changed: 140 additions & 0 deletions

@@ -0,0 +1,140 @@
+{
+  "metadata" : {
+    "id" : "af838c83-8642-46b6-9358-12ee05e704e1",
+    "name" : "Simple Spark",
+    "user_save_timestamp" : "2014-10-11T17:33:45.703Z",
+    "auto_save_timestamp" : "2015-01-10T00:02:12.659Z",
+    "language_info" : {
+      "name" : "scala",
+      "file_extension" : "scala",
+      "codemirror_mode" : "text/x-scala"
+    },
+    "trusted" : true,
+    "sparkNotebook" : null,
+    "customLocalRepo" : null,
+    "customRepos" : null,
+    "customDeps" : null,
+    "customImports" : null,
+    "customArgs" : null,
+    "customSparkConf" : null,
+    "customVars" : null
+  },
+  "cells" : [ {
+    "metadata" : {
+      "id" : "37DEEDC733044DD9972E9E4BA2F1B126"
+    },
+    "cell_type" : "markdown",
+    "source" : "### Spark config"
+  }, {
+    "metadata" : {
+      "trusted" : true,
+      "input_collapsed" : false,
+      "collapsed" : true,
+      "id" : "2A2F6AA618AC48018D01E7D2F4183B76"
+    },
+    "cell_type" : "code",
+    "source" : "sparkContext.getConf.toDebugString",
+    "outputs" : [ ]
+  }, {
+    "metadata" : {
+      "id" : "DAFA77C3B6D140FF8AAE30B94D2FC73E"
+    },
+    "cell_type" : "markdown",
+    "source" : "#### Counting"
+  }, {
+    "metadata" : {
+      "trusted" : true,
+      "input_collapsed" : false,
+      "collapsed" : false,
+      "id" : "9088B578DE2F4BA48DF323F11895488A"
+    },
+    "cell_type" : "code",
+    "source" : "def transform(i: Int) = (i, i+1)",
+    "outputs" : [ {
+      "name" : "stdout",
+      "output_type" : "stream",
+      "text" : "transform: (i: Int)(Int, Int)\n"
+    }, {
+      "metadata" : { },
+      "data" : {
+        "text/html" : ""
+      },
+      "output_type" : "execute_result",
+      "execution_count" : 2,
+      "time" : "Took: 0.727s, at 2017-05-16 12:18"
+    } ]
+  }, {
+    "metadata" : {
+      "trusted" : true,
+      "input_collapsed" : false,
+      "collapsed" : false,
+      "presentation" : {
+        "tabs_state" : "{\n \"tab_id\": \"#tab662761867-0\"\n}",
+        "pivot_chart_state" : "{\n \"hiddenAttributes\": [],\n \"menuLimit\": 200,\n \"cols\": [],\n \"rows\": [],\n \"vals\": [],\n \"exclusions\": {},\n \"inclusions\": {},\n \"unusedAttrsVertical\": 85,\n \"autoSortUnusedAttrs\": false,\n \"inclusionsInfo\": {},\n \"aggregatorName\": \"Count\",\n \"rendererName\": \"Table\"\n}"
+      },
+      "id" : "BF434E47187740E78B7A7A521D2D87DD"
+    },
+    "cell_type" : "code",
+    "source" : "val dataset = sparkSession.createDataset(1 to 1000).map(transform)",
+    "outputs" : [ {
+      "name" : "stdout",
+      "output_type" : "stream",
+      "text" : "dataset: org.apache.spark.sql.Dataset[(Int, Int)] = [_1: int, _2: int]\n"
+    }, {
+      "metadata" : { },
+      "data" : {
+        "text/html" : ""
+      },
+      "output_type" : "execute_result",
+      "execution_count" : 9,
+      "time" : "Took: 1.466s, at 2017-05-16 12:20"
+    } ]
+  }, {
+    "metadata" : {
+      "trusted" : true,
+      "input_collapsed" : false,
+      "collapsed" : false,
+      "presentation" : {
+        "tabs_state" : "{\n \"tab_id\": \"#tab1070475139-0\"\n}",
+        "pivot_chart_state" : "{\n \"hiddenAttributes\": [],\n \"menuLimit\": 200,\n \"cols\": [],\n \"rows\": [],\n \"vals\": [],\n \"exclusions\": {},\n \"inclusions\": {},\n \"unusedAttrsVertical\": 85,\n \"autoSortUnusedAttrs\": false,\n \"inclusionsInfo\": {},\n \"aggregatorName\": \"Count\",\n \"rendererName\": \"Table\"\n}"
+      },
+      "id" : "EE80B60DB2C645D58B30EB2B793A5BEC"
+    },
+    "cell_type" : "code",
+    "source" : "display(dataset.toDF)",
+    "outputs" : [ ]
+  }, {
+    "metadata" : {
+      "trusted" : true,
+      "input_collapsed" : false,
+      "collapsed" : false,
+      "id" : "7797C8DBEB7643D788F4D14F6C8E2B40"
+    },
+    "cell_type" : "code",
+    "source" : "val sum = dataset.map(_._2).reduce(_+_)\n\nprintln(sum)",
+    "outputs" : [ {
+      "name" : "stdout",
+      "output_type" : "stream",
+      "text" : "501500\nsum: Int = 501500\n"
+    }, {
+      "metadata" : { },
+      "data" : {
+        "text/html" : ""
+      },
+      "output_type" : "execute_result",
+      "execution_count" : 11,
+      "time" : "Took: 1.146s, at 2017-05-16 12:20"
+    } ]
+  }, {
+    "metadata" : {
+      "trusted" : true,
+      "input_collapsed" : false,
+      "collapsed" : true,
+      "id" : "73F60C7C9F2945E38AC0C252F2C3AC1E"
+    },
+    "cell_type" : "code",
+    "source" : "",
+    "outputs" : [ ]
+  } ],
+  "nbformat" : 4
+}
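
A quick sanity check on the final output cell: `transform` maps each `i` in `1 to 1000` to `(i, i+1)`, so the reduce over `_._2` sums 2 through 1001. The same computation in plain Scala, no Spark required:

// Sum of (i+1) for i = 1..1000: 1000*1001/2 + 1000 = 501500
val sum = (1 to 1000).map(_ + 1).sum
println(sum)  // 501500, matching the notebook's output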

simple-spark-sources/src/main/resources/notebook.snb

Lines changed: 1 addition & 13 deletions
Large diffs are not rendered by default.

simple-spark-sources/src/main/scala/App.scala

Lines changed: 4 additions & 8 deletions

@@ -1,5 +1,5 @@
 
-package generated.simplespark
+package com.example.simplespark
 
 object Main {
 
@@ -17,12 +17,8 @@ object Main {
 
   // Spark notebook widgets (can be removed if you do not use them)
   // Dummy implementation of the most common ones (to avoid shipping 80+ MB of spark-notebook jars)
-  def display[C](originalData:C, fields:Option[(String, String)]=None, maxPoints:Int=0) = {}
-  def pairs[C](originalData:C, maxPoints:Int=0) = {}
-  def ul(capacity:Int=10, initData:Seq[String]=Nil, prefill:Option[String]=None) = {}
-  def ol(capacity:Int=10, initData:Seq[String]=Nil, prefill:Option[String]=None) = {}
-  def img(tpe:String="png", width:String="", height:String="") = {}
-  def text(value: String) = {}
+  import notebook.front.widgets.charts._
+  import notebook.front.widgets.charts.MockedCharts._
 
   // Create spark configuration holder
   val sparkConf = new SparkConf()
@@ -42,7 +38,7 @@ object Main {
   // This is needed only if not using spark-submit (comment otherwise)
 
   def setExecutorJars() = {
-    val currentProjectJars = Array("lib/generated.simple-spark-0.0.1-SNAPSHOT.jar", "target/scala-2.10/generated.simple-spark_2.10-0.0.1-SNAPSHOT.jar").map{j => new java.io.File(j)}.filter(_.exists()).map(_.getAbsolutePath)
+    val currentProjectJars = Array("lib/com.example.simple-spark-0.0.1-SNAPSHOT.jar", "target/scala-2.10/com.example.simple-spark_2.10-0.0.1-SNAPSHOT.jar").map{j => new java.io.File(j)}.filter(_.exists()).map(_.getAbsolutePath)
     val sparkLibDir = new java.io.File("spark-lib")
     val fromProjectJars = Array[String]().map{j => new java.io.File(sparkLibDir, j).getAbsolutePath}
    val jarsArray = (sparkConf.get("spark.jars", "").split(",").toArray ++ currentProjectJars ++ fromProjectJars).distinct.filter(!_.isEmpty)
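
`setExecutorJars` gathers the project jars that actually exist on disk (under the renamed `com.example` artifact names), merges them with whatever `spark.jars` already holds, and de-duplicates. A standalone sketch of that logic; the final write-back is an assumption, since the rendered hunk ends before the method does:

// Sketch of the jar-collection logic (assumes the method ends by writing
// the merged list back to spark.jars, which the hunk above does not show)
val candidates = Array(
  "lib/com.example.simple-spark-0.0.1-SNAPSHOT.jar",
  "target/scala-2.10/com.example.simple-spark_2.10-0.0.1-SNAPSHOT.jar"
)
val onDisk = candidates.map(new java.io.File(_)).filter(_.exists()).map(_.getAbsolutePath)
val merged = (sparkConf.get("spark.jars", "").split(",") ++ onDisk).distinct.filter(_.nonEmpty)
sparkConf.set("spark.jars", merged.mkString(","))  // assumed final step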

simple-spark-sources/src/main/scala/Classes.scala

Lines changed: 1 addition & 1 deletion

@@ -1,5 +1,5 @@
 
-package generated.simplespark
+package com.example.simplespark
 
 
 //---//
Lines changed: 143 additions & 0 deletions

@@ -0,0 +1,143 @@
+
+package notebook.front.widgets.charts
+
+import notebook.front.widgets.charts.MockedCharts.DEFAULT_MAX_POINTS
+
+object MockedCharts {
+  val DEFAULT_MAX_POINTS = 1000
+
+  def display[C](originalData:C, fields:Option[(String, String)]=None, maxPoints:Int=0) = {}
+  def pairs[C](originalData:C, maxPoints:Int=0) = {}
+  def ul(capacity:Int=10, initData:Seq[String]=Nil, prefill:Option[String]=None) = {}
+  def ol(capacity:Int=10, initData:Seq[String]=Nil, prefill:Option[String]=None) = {}
+  def img(tpe:String="png", width:String="", height:String="") = {}
+  def text(value: String) = {}
+}
+
+case class CustomC3Chart[C](
+  originalData: C,
+  chartOptions: String = "{}",
+  sizes: (Int, Int) = (600, 400),
+  maxPoints: Int = DEFAULT_MAX_POINTS
+)
+
+case class ScatterChart[C](
+  originalData: C,
+  fields: Option[(String, String)] = None,
+  sizes: (Int, Int) = (600, 400),
+  maxPoints: Int = DEFAULT_MAX_POINTS,
+  groupField: Option[String] = None
+)
+
+case class LineChart[C](
+  originalData: C,
+  fields: Option[(String, String)] = None,
+  sizes: (Int, Int) = (600, 400),
+  maxPoints: Int = DEFAULT_MAX_POINTS,
+  groupField: Option[String] = None
+)
+
+case class RadarChart[C](
+  originalData: C,
+  labelField: Option[String] = None,
+  sizes: (Int, Int) = (600, 400),
+  maxPoints: Int = DEFAULT_MAX_POINTS
+)
+
+
+case class ParallelCoordChart[C](
+  originalData: C,
+  sizes: (Int, Int) = (600, 400),
+  maxPoints: Int = DEFAULT_MAX_POINTS
+)
+
+case class TimeseriesChart[C](
+  originalData: C,
+  fields: Option[(String, String)] = None,
+  sizes: (Int, Int) = (600, 400),
+  maxPoints: Int = DEFAULT_MAX_POINTS,
+  groupField: Option[String] = None,
+  tickFormat: String = "%Y-%m-%d %H:%M:%S"
+)
+
+case class BarChart[C](
+  originalData: C,
+  fields: Option[(String, String)] = None,
+  sizes: (Int, Int) = (600, 400),
+  maxPoints: Int = DEFAULT_MAX_POINTS,
+  groupField: Option[String] = None
+)
+
+
+case class PieChart[C](
+  originalData: C,
+  fields: Option[(String, String)] = None,
+  sizes: (Int, Int) = (600, 400),
+  maxPoints: Int = DEFAULT_MAX_POINTS
+)
+
+case class DiyChart[C](
+  originalData: C,
+  js: String = "",
+  sizes: (Int, Int) = (600, 400),
+  maxPoints: Int = DEFAULT_MAX_POINTS
+)
+
+
+case class GeoPointsChart[C](
+  originalData: C,
+  sizes: (Int, Int) = (600, 400),
+  maxPoints: Int = DEFAULT_MAX_POINTS,
+  latLonFields: Option[(String, String)] = None,
+  rField: Option[String] = None,
+  colorField: Option[String] = None
+)
+
+
+case class GeoChart[C](
+  originalData: C,
+  sizes: (Int, Int) = (600, 400),
+  maxPoints: Int = DEFAULT_MAX_POINTS,
+  geometryField: Option[String] = None,
+  rField: Option[String] = None,
+  colorField: Option[String] = None,
+  fillColorField: Option[String] = None
+)
+
+case class GraphChart[C](
+  originalData: C,
+  sizes: (Int, Int) = (600, 400),
+  maxPoints: Int = DEFAULT_MAX_POINTS,
+  charge: Int = -30,
+  linkDistance: Int = 20,
+  linkStrength: Double = 1.0
+)
+
+
+case class PivotChart[C](
+  originalData: C,
+  sizes: (Int, Int) = (600, 400),
+  maxPoints: Int = DEFAULT_MAX_POINTS,
+  // FIXME: otherwise this would add dependency on play-json!
+  // derivedAttributes:JsObject=play.api.libs.json.Json.obj(),
+  options: Map[String, String] = Map.empty
+)
+
+
+case class CustomPlotlyChart[C](
+  originalData: C,
+  layout: String = "{}",
+  dataOptions: String = "{}",
+  dataSources: String = "{}",
+  sizes: (Int, Int) = (600, 400),
+  maxPoints: Int = DEFAULT_MAX_POINTS
+)
+
+case class TableChart[C](
+  originalData: C,
+  filterCol: Option[Seq[String]] = None,
+  sizes: (Int, Int) = (600, 400),
+  maxPoints: Int = DEFAULT_MAX_POINTS
+)
+
+
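
The point of this new file is that code exported from a spark-notebook session keeps compiling outside the notebook without pulling in the 80+ MB of spark-notebook jars: the widget methods become no-ops and the chart case classes construct inert values. A minimal sketch of exported code picking the stubs up (the `points` data and `ExportedCell` wrapper are hypothetical):

import notebook.front.widgets.charts._
import notebook.front.widgets.charts.MockedCharts._

object ExportedCell {                             // hypothetical caller, not part of the commit
  val points = Seq((1, 2), (2, 3), (3, 4))        // hypothetical data
  display(points)                                 // resolves to the no-op stub; returns Unit
  val chart = LineChart(points, maxPoints = 100)  // constructs an inert value; nothing renders
}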

0 commit comments