Add some benchmarks

Atry · Atry · commit 3e31ec5d6b1c · 2018-05-30T17:15:25.000+08:00
diff --git a/benchmark/build.sbt b/benchmark/build.sbt
@@ -0,0 +1,28 @@
+// Library dependencies of the benchmark. They are declared only when the Scala
+// version is older than 2.12; on 2.12 and later nothing is added.
+// NOTE(review): presumably some of these artifacts are not published for 2.12+ — confirm.
+libraryDependencies ++= {
+  import Ordering.Implicits._
+  // All three ND4J artifacts are pinned to the same release.
+  val nd4jVersion = "0.8.0"
+  val scalaVersionNumbers = VersionNumber(scalaVersion.value).numbers
+  if (scalaVersionNumbers < Seq(2, 12)) {
+    Seq(
+      "com.thoughtworks.deeplearning.etl" %% "cifar100" % "0.1.1-SNAPSHOT",
+      "ch.qos.logback" % "logback-classic" % "1.2.3" % Optional,
+      "org.nd4j" %% "nd4s" % nd4jVersion,
+      "org.nd4j" % "nd4j-api" % nd4jVersion,
+      "org.nd4j" % "nd4j-native-platform" % nd4jVersion % Optional
+    )
+  } else {
+    Nil
+  }
+}
+
+// Run tests of this project in a forked JVM.
+fork in Test := true
+
+// Enable the sbt-jmh plugin for this project.
+enablePlugins(JmhPlugin)
+
+// Do not publish any artifact for this project.
+publishArtifact := false
+
+// Compiler plugins from com.thoughtworks.dsl, together with the matching
+// domains-scalaz library; all three are pinned to 1.0.0-RC10.
+addCompilerPlugin("com.thoughtworks.dsl" %% "compilerplugins-bangnotation" % "1.0.0-RC10")
+
+addCompilerPlugin("com.thoughtworks.dsl" %% "compilerplugins-reseteverywhere" % "1.0.0-RC10")
+
+libraryDependencies += "com.thoughtworks.dsl" %% "domains-scalaz" % "1.0.0-RC10"
+
+// Compiler plugin from com.thoughtworks.import.
+// NOTE(review): presumably this is what enables the `import $exec.` URL import used in benchmark.scala — confirm.
+addCompilerPlugin("com.thoughtworks.import" %% "import" % "2.0.2")
diff --git a/benchmark/src/jmh/scala/com/thoughtworks/deeplearning/benchmark/benchmark.scala b/benchmark/src/jmh/scala/com/thoughtworks/deeplearning/benchmark/benchmark.scala
@@ -0,0 +1,181 @@
+package com.thoughtworks.deeplearning.benchmark
+
+import java.util.concurrent.{ExecutorService, Executors}
+
+import com.thoughtworks.deeplearning.DeepLearning
+import com.thoughtworks.deeplearning.etl.Cifar100
+import com.thoughtworks.deeplearning.etl.Cifar100.Batch
+import com.thoughtworks.deeplearning.plugins.Builtins
+import com.thoughtworks.feature.Factory
+import org.openjdk.jmh.annotations._
+import com.thoughtworks.future._
+import org.nd4j.linalg.api.ndarray.INDArray
+import org.nd4j.linalg.factory.Nd4j
+
+import scala.concurrent.{ExecutionContext, ExecutionContextExecutorService}
+
+/**
+  * @author 杨博 (Yang Bo)
+  */
+object benchmark {
+
+  import $exec.`https://gist.github.com/Atry/1fb0608c655e3233e68b27ba99515f16/raw/39ba06ee597839d618f2fcfe9526744c60f2f70a/FixedLearningRate.sc`
+
+  /** A layer's output bundled with its feature count and the `DeepLearning` type class
+    * instance for the output type.
+    *
+    * Nothing else in this file references this trait.
+    */
+  trait LayerOutput {
+    /** The concrete type of [[output]]. */
+    type Output
+
+    def output: Output
+
+    def numberOfFeatures: Int
+
+    def typeClassInstance: DeepLearning.Aux[Output, INDArray, INDArray]
+  }
+
+  object LayerOutput {
+
+    /** Wraps a raw `INDArray` as a [[LayerOutput]].
+      *
+      * `numberOfFeatures` is read from index 1 of the array's shape on every call.
+      *
+      * @note `typeClassInstance` is not implemented: calling it throws `NotImplementedError`.
+      */
+    def input(indArray: INDArray): LayerOutput = new LayerOutput {
+      type Output = INDArray
+
+      def output: INDArray = indArray
+
+      def numberOfFeatures: Int = indArray.shape()(1)
+
+      // Still a placeholder; see the @note above.
+      def typeClassInstance: DeepLearning.Aux[INDArray, INDArray, INDArray] = ???
+    }
+  }
+
+  @Threads(value = 1)
+  @State(Scope.Benchmark)
+  class FourLayer {
+
+    // JMH parameters. JMH injects each value listed in `@Param` into the annotated field
+    // and runs the benchmark for every combination of them.
+
+    // Passed to `Cifar100.epochByCoarseClass` when producing batches
+    // (presumably the number of samples per batch — confirm).
+    @Param(Array("4"))
+    protected var batchSize: Int = _
+
+    // Number of threads in the fixed thread pool created in `setup()`.
+    @Param(Array("1", "2", "4"))
+    protected var sizeOfThreadPool: Int = _
+
+    // Number of columns of the hidden weight matrices and biases in `Model`.
+    @Param(Array("16", "32", "64"))
+    protected var numberOfHiddenFeatures: Int = _
+
+    // Number of parallel branches built in `Model.CoarseFeatures`.
+    @Param(Array("16", "8"))
+    protected var numberOfBranches: Int = _
+
+    // Implicit execution context backed by the thread pool; assigned in `setup()`,
+    // shut down and cleared in `tearDown()`.
+    private implicit var executionContext: ExecutionContextExecutorService = _
+
+    /** Endless iterator over the elements produced by `epochByCoarseClass(batchSize)`.
+      *
+      * The data set is loaded (blocking) the first time this value is accessed; after that,
+      * a new epoch is requested from it each time the previous one is exhausted.
+      */
+    private lazy val batches = {
+      val dataset: Cifar100 = Cifar100.load().blockingAwait
+      Iterator.continually(dataset.epochByCoarseClass(batchSize)).flatten
+    }
+
+    /** The network under benchmark.
+      *
+      * It consists of a shared feature extractor ([[CoarseFeatures]]), a classifier over the
+      * coarse classes ([[CoarseProbabilityModel]]) and one classifier per coarse class over
+      * its fine classes (`fineProbabilityModel`). All weights are initialised with `Nd4j.randn`.
+      */
+    class Model {
+      // Hyperparameter plugin instance; its members (layer/weight types and operators)
+      // are imported below and used throughout the model.
+      val hyperparameters = Factory[Builtins with FixedLearningRate].newInstance(learningRate = 0.0001)
+
+      import hyperparameters._, implicits._
+
+      /** Maps the flattened input pixels to hidden features.
+        *
+        * Builds `numberOfBranches` independent branches, applies each of them to the same
+        * input and adds their outputs together.
+        */
+      object CoarseFeatures extends (INDArray => INDArrayLayer) {
+
+        // Each branch is two dense layers, each followed by `max(_, 0.0)`.
+        val branches = Seq.fill(numberOfBranches)(new (INDArray => INDArrayLayer) {
+          // First dense layer: pixels -> hidden features.
+          object Dense1 extends (INDArray => INDArrayLayer) {
+            val weight = INDArrayWeight(Nd4j.randn(Cifar100.NumberOfPixelsPerSample, numberOfHiddenFeatures))
+            val bias = INDArrayWeight(Nd4j.randn(1, numberOfHiddenFeatures))
+
+            def apply(input: INDArray) = {
+              max(input dot weight + bias, 0.0)
+            }
+          }
+
+          // Second dense layer: hidden features -> hidden features.
+          val weight = INDArrayWeight(Nd4j.randn(numberOfHiddenFeatures, numberOfHiddenFeatures))
+          val bias = INDArrayWeight(Nd4j.randn(1, numberOfHiddenFeatures))
+
+          def apply(input: INDArray) = {
+            max(Dense1(input) dot weight + bias, 0.0)
+          }
+        })
+
+        def apply(input: INDArray) = {
+          // Sum of all branch outputs.
+          branches.map(_.apply(input)).reduce(_ + _)
+        }
+      }
+
+      /** Maps hidden features to scores over the coarse classes and normalises them. */
+      object CoarseProbabilityModel {
+        val weight = INDArrayWeight(Nd4j.randn(numberOfHiddenFeatures, Cifar100.NumberOfCoarseClasses))
+        val bias = INDArrayWeight(Nd4j.randn(1, Cifar100.NumberOfCoarseClasses))
+
+        def apply(input: INDArrayLayer) = {
+          val scores = input dot weight + bias
+
+          // exp(scores) divided by its sum along dimension 1 (softmax-style normalisation).
+          val expScores = exp(scores)
+          expScores / expScores.sum(1)
+        }
+      }
+
+      /** One sub-network per coarse class, indexed by coarse label.
+        *
+        * Each sub-network applies `Dense1`, then `Dense2`, then an output layer whose
+        * exponentiated scores are normalised in the same way as in [[CoarseProbabilityModel]].
+        */
+      val fineProbabilityModel = Seq.fill(Cifar100.NumberOfCoarseClasses)(new (INDArrayLayer => INDArrayLayer) {
+        object Dense2 extends (INDArrayLayer => INDArrayLayer) {
+
+          object Dense1 extends (INDArrayLayer => INDArrayLayer) {
+            val weight = INDArrayWeight(Nd4j.randn(numberOfHiddenFeatures, numberOfHiddenFeatures))
+            val bias = INDArrayWeight(Nd4j.randn(1, numberOfHiddenFeatures))
+
+            def apply(coarseFeatures: INDArrayLayer) = {
+              max(coarseFeatures dot weight + bias, 0.0)
+            }
+          }
+
+          val weight = INDArrayWeight(Nd4j.randn(numberOfHiddenFeatures, numberOfHiddenFeatures))
+          val bias = INDArrayWeight(Nd4j.randn(1, numberOfHiddenFeatures))
+
+          def apply(coarseFeatures: INDArrayLayer) = {
+            max(Dense1(coarseFeatures) dot weight + bias, 0.0)
+          }
+        }
+
+        // Output layer: hidden features -> scores over the fine classes of one coarse class.
+        val weight = INDArrayWeight(Nd4j.randn(numberOfHiddenFeatures, Cifar100.NumberOfFineClassesPerCoarseClass))
+        val bias = INDArrayWeight(Nd4j.randn(1, Cifar100.NumberOfFineClassesPerCoarseClass))
+
+        def apply(coarseFeatures: INDArrayLayer) = {
+          val scores = Dense2(coarseFeatures) dot weight + bias
+
+          val expScores = exp(scores)
+          expScores / expScores.sum(1)
+        }
+      })
+
+      /** Builds the loss for one batch: the coarse-class cross entropy plus the fine-class
+        * cross entropy of the sub-network selected by `coarseLabel`.
+        *
+        * @param coarseLabel index into `fineProbabilityModel`
+        * @param batch       supplies `pixels`, `coarseClasses` and `localFineClasses`
+        */
+      def loss(coarseLabel: Int, batch: Batch): DoubleLayer = {
+        // Negated mean of log(prediction) * expected output.
+        def crossEntropy(prediction: INDArrayLayer, expectOutput: INDArray): DoubleLayer = {
+          -(hyperparameters.log(prediction) * expectOutput).mean
+        }
+
+        // `pixels` must be rank 4, otherwise this pattern throws a MatchError. The local
+        // `batchSize` shadows the `batchSize` parameter field of the enclosing class.
+        // NOTE(review): the names width/height/channels only label shape positions 1-3;
+        // the actual axis layout is not visible here — confirm.
+        val Array(batchSize, width, height, channels) = batch.pixels.shape()
+        // Flatten every sample into a single row before feeding the dense layers.
+        val coarseFeatures = CoarseFeatures(batch.pixels.reshape(batchSize, width * height * channels))
+        val coarseProbabilities = CoarseProbabilityModel(coarseFeatures)
+        val fineProbabilities = fineProbabilityModel(coarseLabel)(coarseFeatures)
+
+        crossEntropy(coarseProbabilities, batch.coarseClasses) + crossEntropy(fineProbabilities, batch.localFineClasses)
+      }
+
+      /** Calls `train` on the loss built by [[loss]] for the given batch. */
+      def train(coarseLabel: Int, batch: Batch) = {
+        loss(coarseLabel, batch).train
+      }
+
+    }
+
+    private var model: Model = null
+
+    /** Prepares the benchmark state before any measured invocation.
+      *
+      * Creates a fixed thread pool of `sizeOfThreadPool` threads and installs it as the
+      * implicit execution context, loads the data set behind `batches`, and builds a
+      * fresh `Model`.
+      */
+    @Setup
+    final def setup(): Unit = {
+      executionContext = ExecutionContext.fromExecutorService(Executors.newFixedThreadPool(sizeOfThreadPool))
+      // Force the lazy `batches` here: otherwise the blocking data set load would happen
+      // inside the first `deepLearningDotScala()` call and be timed as part of the benchmark.
+      // This only loads the data set; batches are still pulled by the benchmark method.
+      batches
+      model = new Model
+    }
+
+    /** Releases the benchmark state: drops the model, shuts down the thread pool behind
+      * the execution context and clears the reference to it.
+      */
+    @TearDown
+    final def tearDown(): Unit = {
+      model = null
+      val pool = executionContext
+      pool.shutdown()
+      executionContext = null
+    }
+
+    /** The measured operation: takes the next `(coarseClass, batch)` pair from `batches`,
+      * calls `model.train` on it and blocks on the result via `blockingAwait`.
+      *
+      * @return the value produced by the awaited `train` call
+      */
+    @Benchmark
+    final def deepLearningDotScala(): Double = {
+      // The iterator is mutable state, so advancing it is guarded by its own monitor.
+      val nextSample = batches.synchronized(batches.next())
+      val (coarseClass, batch) = nextSample
+      model.train(coarseClass, batch).blockingAwait
+    }
+
+  }
+
+}
diff --git a/build.sbt b/build.sbt
@@ -144,6 +144,9 @@ lazy val `plugins-Builtins` =
     `plugins-CumulativeINDArrayLayers`,
     DeepLearning % "test->test"
   )
+
+// JMH benchmark project; its settings live in benchmark/build.sbt.
+lazy val benchmark = project.dependsOn(`plugins-Builtins`)
+
 publishArtifact := false
 
 lazy val unidoc =
diff --git a/project/plugins.sbt b/project/plugins.sbt
@@ -1,3 +1,5 @@
 addSbtPlugin("com.thoughtworks.sbt-best-practice" % "sbt-best-practice" % "2.5.0")
 
 addSbtPlugin("com.thoughtworks.example" % "sbt-example" % "2.0.2")
+
+addSbtPlugin("pl.project13.scala" % "sbt-jmh" % "0.3.4")

Original file line number	Diff line number	Diff line change
@@ -144,6 +144,9 @@ lazy val `plugins-Builtins` =
`144`	`144`	`plugins-CumulativeINDArrayLayers`,
`145`	`145`	`DeepLearning % "test->test"`
`146`	`146`	`)`
	`147`	`+`
	`148`	+lazy val benchmark = project.dependsOn(`plugins-Builtins`)
	`149`	`+`
`147`	`150`	`publishArtifact := false`
`148`	`151`
`149`	`152`	`lazy val unidoc =`