Added LSSVM committee model based on Spark RDDs

mandar2812 · mandar2812 · commit 00b5ff2625c2 · 2016-06-03T17:19:08.000+02:00
diff --git a/build.sbt b/build.sbt
@@ -40,8 +40,7 @@ lazy val commonSettings = Seq(
     "org.jzy3d" % "jzy3d-api" % "0.9.1" % "compile",
     "com.lihaoyi" % "ammonite-repl_2.11.7" % "0.5.8"
   ),
-  initialCommands in console :=
-    """io.github.mandar2812.dynaml.DynaML.run();"""
+  initialCommands in console := """io.github.mandar2812.dynaml.DynaML.run();"""
 )
 
 lazy val DynaML = (project in file(".")).enablePlugins(JavaAppPackaging, BuildInfoPlugin)
diff --git a/src/main/scala/io/github/mandar2812/dynaml/models/ensemble/CommitteeModel.scala b/src/main/scala/io/github/mandar2812/dynaml/models/ensemble/CommitteeModel.scala
@@ -16,62 +16,13 @@ KIND, either express or implied.  See the License for the
 specific language governing permissions and limitations
 under the License.
 * */
-package io.github.mandar2812.dynaml.models
+package io.github.mandar2812.dynaml.models.ensemble
 
 import breeze.linalg.DenseVector
-import io.github.mandar2812.dynaml.pipes.ModelPipe
-import io.github.mandar2812.dynaml.models.neuralnets.FeedForwardNetwork
 import io.github.mandar2812.dynaml.models.gp.GPRegression
-
-/**
-  *
-  * w1*y1(x) + w2*y2(x) + ... + wb*yb(x)
-  * Defines the basic skeleton of a "meta-model" or
-  * a model of models.
-  *
-  * A set of base models are trained on sub-sampled versions
-  * of the training data set and finally a predictor of the form.
-  *
-  * y(x) = f(y1(x), y2(x), ..., yb(x))
-  *
-  * Where f is some combination function and
-  * b is the number of base models used.
-  *
-  * @tparam D The type of the data structure containing the
-  *           training data set.
-  *
-  * @tparam D1 The type of data structure containing the data
-  *            of the base models.
-  *
-  * @tparam BaseModel The type of model used as base model
-  *                   for the meta model.
-  *                   example: [[FeedForwardNetwork]], [[GPRegression]], etc
-  *
-  * @tparam Pipe A sub-type of [[ModelPipe]] which yields a [[BaseModel]]
-  *              with [[D1]] as the base data structure given a
-  *              data structure of type [[D]]
-  *
-  * @param num The number of training data points.
-  *
-  * @param data The actual training data
-  *
-  * @param networks A sequence of [[Pipe]] objects yielding [[BaseModel]]
-  * */
-abstract class MetaModel[
-D, D1,
-BaseModel <: Model[D1, DenseVector[Double], Double],
-Pipe <: ModelPipe[D, D1, DenseVector[Double], Double, BaseModel]
-](num: Int, data: D, networks: Pipe*)
-  extends Model[D, DenseVector[Double], Double] {
-
-  override protected val g = data
-
-  val baseNetworks: List[BaseModel] =
-    networks.toList.map(net => net.run(g))
-
-}
-
-
+import io.github.mandar2812.dynaml.models.neuralnets.FeedForwardNetwork
+import io.github.mandar2812.dynaml.models.{LinearModel, Model}
+import io.github.mandar2812.dynaml.pipes.ModelPipe
 
 /**
   * Defines an abstract implementation of a "committee-model".
@@ -108,7 +59,7 @@ abstract class CommitteeModel[
 D, D1,
 BaseModel <: Model[D1, DenseVector[Double], Double],
 Pipe <: ModelPipe[D, D1, DenseVector[Double], Double, BaseModel]
-](num: Int, data: D, networks: Pipe*) extends
+](num: Long, data: D, networks: Pipe*) extends
 MetaModel[D,D1,BaseModel,Pipe](num, data, networks:_*) with
 LinearModel[D, DenseVector[Double], DenseVector[Double], Double, D] {
 
@@ -128,7 +79,7 @@ LinearModel[D, DenseVector[Double], DenseVector[Double], Double, D] {
     DenseVector.fill[Double](baseNetworks.length)(1.0)
 
   override def initParams(): DenseVector[Double] =
-    DenseVector.fill[Double](baseNetworks.length)(1.0)
+    DenseVector.fill[Double](baseNetworks.length)(1.0/baseNetworks.length)
 
   /**
     * Learn the parameters
@@ -138,16 +89,14 @@ LinearModel[D, DenseVector[Double], DenseVector[Double], Double, D] {
     *
     **/
   override def learn(): Unit = {
-
     params = optimizer.optimize(num_points, g, initParams())
   }
 
   override protected var params: DenseVector[Double] =
-    DenseVector.fill[Double](baseNetworks.length)(1.0)
+    initParams()
 
   featureMap = (pattern) =>
-    DenseVector(baseNetworks.map(net =>
-      net.predict(pattern)).toArray)
+    DenseVector(baseNetworks.map(_.predict(pattern)).toArray)
 
 
 }
diff --git a/src/main/scala/io/github/mandar2812/dynaml/models/ensemble/MetaModel.scala b/src/main/scala/io/github/mandar2812/dynaml/models/ensemble/MetaModel.scala
@@ -0,0 +1,67 @@
+/*
+Licensed to the Apache Software Foundation (ASF) under one
+or more contributor license agreements.  See the NOTICE file
+distributed with this work for additional information
+regarding copyright ownership.  The ASF licenses this file
+to you under the Apache License, Version 2.0 (the
+"License"); you may not use this file except in compliance
+with the License.  You may obtain a copy of the License at
+
+  http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing,
+software distributed under the License is distributed on an
+"AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+KIND, either express or implied.  See the License for the
+specific language governing permissions and limitations
+under the License.
+* */
+package io.github.mandar2812.dynaml.models.ensemble
+
+import breeze.linalg.DenseVector
+import io.github.mandar2812.dynaml.models.Model
+import io.github.mandar2812.dynaml.models.gp.GPRegression
+import io.github.mandar2812.dynaml.models.neuralnets.FeedForwardNetwork
+import io.github.mandar2812.dynaml.pipes.ModelPipe
+
+/**
+  *
+  * w1*y1(x) + w2*y2(x) + ... + wb*yb(x)
+  * Defines the basic skeleton of a "meta-model" or
+  * a model of models.
+  *
+  * A set of base models are trained on sub-sampled versions
+  * of the training data set and finally a predictor of the form.
+  *
+  * y(x) = f(y1(x), y2(x), ..., yb(x))
+  *
+  * Where f is some combination function and
+  * b is the number of base models used.
+  *
+  * @tparam D The type of the data structure containing the
+  *           training data set.
+  * @tparam D1 The type of data structure containing the data
+  *            of the base models.
+  * @tparam BaseModel The type of model used as base model
+  *                   for the meta model.
+  *                   example: [[FeedForwardNetwork]], [[GPRegression]], etc
+  * @tparam Pipe A sub-type of [[ModelPipe]] which yields a [[BaseModel]]
+  *              with [[D1]] as the base data structure given a
+  *              data structure of type [[D]]
+  * @param num The number of training data points.
+  * @param data The actual training data
+  * @param networks A sequence of [[Pipe]] objects yielding [[BaseModel]]
+  * */
+abstract class MetaModel[
+D, D1,
+BaseModel <: Model[D1, DenseVector[Double], Double],
+Pipe <: ModelPipe[D, D1, DenseVector[Double], Double, BaseModel]
+](num: Long, data: D, networks: Pipe*)
+  extends Model[D, DenseVector[Double], Double] {
+
+  override protected val g = data
+
+  val baseNetworks: List[BaseModel] =
+    networks.toList.map(_(g))
+
+}
diff --git a/src/main/scala/io/github/mandar2812/dynaml/models/neuralnets/CommitteeNetwork.scala b/src/main/scala/io/github/mandar2812/dynaml/models/neuralnets/CommitteeNetwork.scala
@@ -62,14 +62,15 @@ LinearModel[D, DenseVector[Double], DenseVector[Double],
   override def predict(point: DenseVector[Double]): Double =
     params dot featureMap(point)
 
-  override def clearParameters(): Unit =
-    DenseVector.fill[Double](baseNetworks.length)(1.0)
+  override def clearParameters(): Unit = {
+    params = initParams()
+  }
 
   override def initParams(): DenseVector[Double] =
-    DenseVector.fill[Double](baseNetworks.length)(1.0)
+    DenseVector.fill[Double](baseNetworks.length)(1.0/baseNetworks.length)
 
   featureMap = (pattern) =>
-    DenseVector(baseNetworks.map(net => net.forwardPass(pattern)(0)).toArray)
+    DenseVector(baseNetworks.map(_.forwardPass(pattern)(0)).toArray)
 
   /**
     * Learn the parameters
diff --git a/src/main/scala/io/github/mandar2812/dynaml/models/svm/AbstractDualLSSVM.scala b/src/main/scala/io/github/mandar2812/dynaml/models/svm/AbstractDualLSSVM.scala
@@ -81,5 +81,6 @@ abstract class AbstractDualLSSVM[Index](data: Stream[(Index, Double)],
     current_state += ("regularization" -> h("regularization"))
   }
 
+  def getState = current_state
 
 }
diff --git a/src/main/scala/io/github/mandar2812/dynaml/models/svm/LSSVMCommittee.scala b/src/main/scala/io/github/mandar2812/dynaml/models/svm/LSSVMCommittee.scala
@@ -0,0 +1,42 @@
+package io.github.mandar2812.dynaml.models.svm
+
+import breeze.linalg.DenseVector
+import io.github.mandar2812.dynaml.models.ensemble.CommitteeModel
+import io.github.mandar2812.dynaml.optimization.{GlobalOptimizer, GridSearch, RDDCommitteeSolver, RegularizedOptimizer}
+import io.github.mandar2812.dynaml.pipes.DLSSVMPipe
+import org.apache.spark.rdd.RDD
+
+/**
+  * Created by mandar on 3/6/16.
+  */
+
+class LSSVMCommittee(num: Long,
+                     data: RDD[(DenseVector[Double], Double)],
+                     pipes: DLSSVMPipe[RDD[(DenseVector[Double], Double)]]*) extends
+  CommitteeModel[RDD[(DenseVector[Double], Double)],
+    Stream[(DenseVector[Double], Double)],
+    DLSSVM, DLSSVMPipe[RDD[(DenseVector[Double], Double)]]] (num, data, pipes:_*){
+
+  override protected val optimizer: RegularizedOptimizer[
+    DenseVector[Double],
+    DenseVector[Double], Double,
+    RDD[(DenseVector[Double], Double)]] = new RDDCommitteeSolver
+
+  var modelTuners: List[GlobalOptimizer[DLSSVM]] =
+    baseNetworks.map(m => new GridSearch[DLSSVM](m).setGridSize(10).setStepSize(0.1))
+
+  override def learn(): Unit = {
+    //First tune and learn the base SVM models
+    (baseNetworks zip modelTuners).foreach(modelCouple => {
+      val (_, conf) = modelCouple._2.optimize(modelCouple._1.getState, Map())
+      modelCouple._1.setState(conf)
+      modelCouple._1.learn()
+    })
+    //Now learn the committee weights
+    val fMap = featureMap
+    params = optimizer.optimize(num_points,
+      g.map(patternCouple => (fMap(patternCouple._1), patternCouple._2)),
+      initParams())
+  }
+
+}
diff --git a/src/main/scala/io/github/mandar2812/dynaml/optimization/CommitteeModelSolver.scala b/src/main/scala/io/github/mandar2812/dynaml/optimization/CommitteeModelSolver.scala
@@ -18,7 +18,8 @@ under the License.
 * */
 package io.github.mandar2812.dynaml.optimization
 
-import breeze.linalg.{DenseMatrix, inv, DenseVector}
+import breeze.linalg.{DenseMatrix, DenseVector, inv}
+import org.apache.spark.rdd.RDD
 
 /**
   * Solves the optimization problem pertaining
@@ -50,3 +51,31 @@ RegularizedOptimizer[DenseVector[Double],
     ans/Z
   }
 }
+
+
+class RDDCommitteeSolver extends
+  RegularizedOptimizer[DenseVector[Double],
+    DenseVector[Double], Double,
+    RDD[(DenseVector[Double], Double)]] {
+  /**
+    * Solve the convex optimization problem.
+    *
+    * min wT.C.w    such that 1T.w = 1 (the committee weights sum to one)
+    */
+  override def optimize(nPoints: Long,
+                        ParamOutEdges: RDD[(DenseVector[Double], Double)],
+                        initialP: DenseVector[Double]): DenseVector[Double] = {
+
+    val sumMat = ParamOutEdges.map(couple => {
+      val diff = couple._1 - DenseVector.fill[Double](couple._1.length)(couple._2)
+      diff * diff.t
+    }).reduce((mat1, mat2) => mat1+mat2)
+
+    sumMat :/= nPoints.toDouble
+    val ones = DenseVector.ones[Double](initialP.length)
+    val invMat = inv(sumMat + DenseMatrix.eye[Double](initialP.length)*regParam)
+    val ans: DenseVector[Double] = invMat*ones
+    val Z: Double = ones dot ans
+    ans/Z
+  }
+}
diff --git a/src/main/scala/io/github/mandar2812/dynaml/pipes/ModelPipe.scala b/src/main/scala/io/github/mandar2812/dynaml/pipes/ModelPipe.scala
@@ -23,6 +23,7 @@ import io.github.mandar2812.dynaml.kernels.CovarianceFunction
 import io.github.mandar2812.dynaml.models._
 import io.github.mandar2812.dynaml.models.gp.AbstractGPRegressionModel
 import io.github.mandar2812.dynaml.models.lm.GeneralizedLinearModel
+import io.github.mandar2812.dynaml.models.svm.{AbstractDualLSSVM, DLSSVM}
 
 /**
   * Top level trait for Pipes involving ML models.
@@ -68,4 +69,16 @@ class GLMPipe[T, Source](pre: (Source) => Stream[(DenseVector[Double], Double)],
 
 }
 
+class DLSSVMPipe[Source](pre: (Source) => Stream[(DenseVector[Double], Double)],
+                         cov: CovarianceFunction[DenseVector[Double], Double, DenseMatrix[Double]],
+                         task: String = "regression") extends
+  ModelPipe[Source, Stream[(DenseVector[Double], Double)],
+    DenseVector[Double], Double, DLSSVM] {
+
+  override val preProcess = pre
 
+  override def run(data: Source) = {
+    val training = preProcess(data)
+    new DLSSVM(training, training.length, cov, task)
+  }
+}

Original file line number	Diff line number	Diff line change
`@@ -40,8 +40,7 @@ lazy val commonSettings = Seq(`
`40`	`40`	`"org.jzy3d" % "jzy3d-api" % "0.9.1" % "compile",`
`41`	`41`	`"com.lihaoyi" % "ammonite-repl_2.11.7" % "0.5.8"`
`42`	`42`	`),`
`43`		`- initialCommands in console :=`
`44`		`- """io.github.mandar2812.dynaml.DynaML.run();"""`
	`43`	`+ initialCommands in console := """io.github.mandar2812.dynaml.DynaML.run();"""`
`45`	`44`	`)`
`46`	`45`
`47`	`46`	`lazy val DynaML = (project in file(".")).enablePlugins(JavaAppPackaging, BuildInfoPlugin)`
Original file line number	Diff line number	Diff line change
`@@ -81,5 +81,6 @@ abstract class AbstractDualLSSVM[Index](data: Stream[(Index, Double)],`
`81`	`81`	`current_state += ("regularization" -> h("regularization"))`
`82`	`82`	`}`
`83`	`83`
	`84`	`+ def getState = current_state`
`84`	`85`
`85`	`86`	`}`