[MXNET-716] Adding Scala Inference Benchmarks (#12721)

* Adding Scala Inference Benchmark base class + an example of how to run it * Fixed scalastyle issues * Added platform check to the classpath * Formatting the metrics to print upto 2 decimal digits in float * Added bash script to fetch resnet-18 data and params * Added flag for cpu/gpu for running the script * Fixed duplicate if check
apache · Oct 5, 2018 · e93af41 · e93af41
1 parent e1fe7b1
commit e93af41
Show file tree

Hide file tree

Showing 10 changed files with 476 additions and 11 deletions.
diff --git a/scala-package/examples/scripts/benchmark/run_image_inference_bm.sh b/scala-package/examples/scripts/benchmark/run_image_inference_bm.sh
@@ -0,0 +1,61 @@
+#!/bin/bash
+
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+set -e
+
+echo $OSTYPE
+
+hw_type=cpu
+if [ "$1" = "gpu" ]
+then
+    hw_type=gpu
+fi
+
+platform=linux-x86_64
+
+if [ "$OSTYPE" == "darwin"* ]
+then
+    platform=osx-x86_64
+fi
+
+MXNET_ROOT=$(cd "$(dirname $0)/../../../.."; pwd)
+CLASS_PATH=$MXNET_ROOT/scala-package/assembly/$platform-$hw_type/target/*:$MXNET_ROOT/scala-package/examples/target/*:$MXNET_ROOT/scala-package/examples/target/classes/lib/*:$MXNET_ROOT/scala-package/infer/target/*
+
+MODEL_NAME=$2
+
+RUNS=$3
+
+BATCHSIZE=$4
+
+# model dir
+MODEL_PATH_PREFIX=$5
+# input image
+INPUT_IMG=$6
+# which input image dir
+INPUT_DIR=$7
+
+java -Xmx8G -Dmxnet.traceLeakedObjects=true -cp $CLASS_PATH \
+	org.apache.mxnetexamples.benchmark.ScalaInferenceBenchmark \
+	--example $MODEL_NAME \
+	--count $RUNS \
+	--batchSize $BATCHSIZE \
+	--model-path-prefix $MODEL_PATH_PREFIX \
+	--input-image $INPUT_IMG \
+	--input-dir $INPUT_DIR \
+
diff --git a/scala-package/examples/scripts/infer/imageclassifier/get_resnet_18_data.sh b/scala-package/examples/scripts/infer/imageclassifier/get_resnet_18_data.sh
@@ -0,0 +1,41 @@
+#!/bin/bash
+
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+set -e
+
+MXNET_ROOT=$(cd "$(dirname $0)/../../.."; pwd)
+
+data_path=$MXNET_ROOT/scripts/infer/models/resnet-18/
+
+image_path=$MXNET_ROOT/scripts/infer/images/
+
+if [ ! -d "$data_path" ]; then
+  mkdir -p "$data_path"
+fi
+
+if [ ! -d "$image_path" ]; then
+  mkdir -p "$image_path"
+fi
+
+if [ ! -f "$data_path" ]; then
+  wget https://s3.us-east-2.amazonaws.com/scala-infer-models/resnet-18/resnet-18-symbol.json -P $data_path
+  wget https://s3.us-east-2.amazonaws.com/scala-infer-models/resnet-18/resnet-18-0000.params -P $data_path
+  wget https://s3.us-east-2.amazonaws.com/scala-infer-models/resnet-18/synset.txt -P $data_path
+  wget https://s3.amazonaws.com/model-server/inputs/kitten.jpg -P $image_path
+fi
diff --git a/scala-package/examples/src/main/scala/org/apache/mxnetexamples/InferBase.scala b/scala-package/examples/src/main/scala/org/apache/mxnetexamples/InferBase.scala
@@ -0,0 +1,30 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *    http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.mxnetexamples
+
+import org.apache.mxnet._
+
+trait InferBase {
+
+  def loadModel(context: Array[Context]): Any
+  def loadSingleData(): Any
+  def loadBatchFileList(batchSize: Int): List[Any]
+  def loadInputBatch(source: Any): Any
+  def runSingleInference(loadedModel: Any, input: Any): Any
+  def runBatchInference(loadedModel: Any, input: Any): Any
+}
diff --git a/scala-package/examples/src/main/scala/org/apache/mxnetexamples/benchmark/README.md b/scala-package/examples/src/main/scala/org/apache/mxnetexamples/benchmark/README.md
@@ -0,0 +1,49 @@
+# Benchmarking Scala Inference APIs 
+
+This folder contains a base class [ScalaInferenceBenchmark](https://github.com/apache/incubator-mxnet/tree/master/scala-package/examples/src/main/scala/org/apache/mxnetexamples/benchmark/) and provides a mechanism for benchmarking [MXNet Inference APIs]((https://github.com/apache/incubator-mxnet/tree/master/scala-package/infer)) in Scala.
+The benchmarking scripts provided runs an experiment for single inference calls and batch inference calls. It collects the time taken to perform an inference operation and emits the P99, P50 and Average values for these metrics.  One can easily add/modify any new/existing examples to the ScalaInferenceBenchmark framework in order to get the benchmark numbers for inference calls.
+Currently the ScalaInferenceBenchmark script supports three Scala examples : 
+1. [ImageClassification using ResNet-152](https://github.com/apache/incubator-mxnet/blob/master/scala-package/mxnet-demo/src/main/scala/sample/ImageClassificationExample.scala)
+2. [Object Detection Example](https://github.com/apache/incubator-mxnet/blob/master/scala-package/examples/src/main/scala/org/apache/mxnetexamples/infer/objectdetector/SSDClassifierExample.scala)
+3. [Text Generation through RNNs](https://github.com/apache/incubator-mxnet/blob/master/scala-package/examples/src/main/scala/org/apache/mxnetexamples/rnn/TestCharRnn.scala)
+
+This script can be easily placed in an automated environment to run benchmark regressions on the Scala APIs. The script automatically picks up whether you are running it on a CPU machine or on a GPU machine and appropriately uses that.
+
+## Contents
+
+1. [Prerequisites](#prerequisites)
+2. [Scripts](#scripts)
+
+## Prerequisites
+
+1. MXNet
+2. MXNet Scala Package
+3. [IntelliJ IDE (or alternative IDE) project setup](http://mxnet.incubator.apache.org/tutorials/scala/mxnet_scala_on_intellij.html) with the MXNet Scala Package
+4. Model files and datasets for the model one will try to benchmark
+
+## Scripts
+To help you easily run the benchmarks, a starter shell script has been provided for each of three examples mentioned above. The scripts can be found [here](https://github.com/apache/incubator-mxnet/blob/master/scala-package/examples/scripts/benchmark).
+Each of the script takes some parameters as inputs, details of which can be found either in the bash scripts or in the example classes itself. 
+
+* *ImageClassification Example*
+<br> The following shows an example of running ImageClassifier under the benchmark script. The script takes as parameters, the platform type (cpu/gpu), number of iterations for inference calls, the batch size for batch inference calls, the model path, input file, and input directory. 
+For more details to run ImageClassificationExample as a standalone file, refer to the [README](https://github.com/apache/incubator-mxnet/blob/master/scala-package/examples/src/main/scala/org/apache/mxnetexamples/infer/imageclassifier/README.md) for ImageClassifierExample.
+You may need to run ```chmod u+x run_image_inference_bm.sh``` before running this script.
+    ```bash
+    cd <Path-To-MXNET-Repo>/scala-package/examples/scripts/infer/imageclassifier
+    ./get_resnet_data.sh
+    cd <Path-To-MXNET-Repo>/scala-package/examples/scripts/benchmark
+    ./run_image_inference_bm.sh gpu ImageClassifierExample 100 10 ../infer/models/resnet-152/resnet-152 ../infer/images/kitten.jpg ../infer/images/
+    ./run_image_inference_bm.sh cpu ImageClassifierExample 100 10 ../infer/models/resnet-152/resnet-152 ../infer/images/kitten.jpg ../infer/images/
+    ```
+    Upon running this script, you might see an output like this : 
+    ```
+    [main] INFO org.apache.mxnetexamples.benchmark.CLIParserBase - 
+    single_inference_latency p99 1663, single_inference_p50 729, single_inference_average 755.17
+    ...
+
+    INFO org.apache.mxnetexamples.benchmark.CLIParserBase - 
+    batch_inference_latency p99 4241, batch_inference_p50 4241, batch_inference_average 4241.00
+    ```
+
+More examples to be added soon.
diff --git a/.../examples/src/main/scala/org/apache/mxnetexamples/benchmark/ScalaInferenceBenchmark.scala b/.../examples/src/main/scala/org/apache/mxnetexamples/benchmark/ScalaInferenceBenchmark.scala
@@ -0,0 +1,157 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *    http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.mxnetexamples.benchmark
+
+import org.apache.mxnetexamples.InferBase
+import org.apache.mxnetexamples.infer.imageclassifier.ImageClassifierExample
+import org.apache.mxnet._
+import org.kohsuke.args4j.{CmdLineParser, Option}
+import org.slf4j.LoggerFactory
+
+import scala.collection.JavaConverters._
+
+object ScalaInferenceBenchmark {
+
+  private val logger = LoggerFactory.getLogger(classOf[CLIParserBase])
+
+  def loadModel(objectToRun: InferBase, context: Array[Context]):
+  Any = {
+    objectToRun.loadModel(context)
+  }
+
+  def loadDataSet(objectToRun: InferBase):
+  Any = {
+    objectToRun.loadSingleData()
+  }
+
+  def loadBatchDataSet(objectToRun: InferBase, batchSize: Int):
+  List[Any] = {
+    objectToRun.loadBatchFileList(batchSize)
+  }
+
+  def runInference(objectToRun: InferBase, loadedModel: Any, dataSet: Any, totalRuns: Int):
+  List[Long] = {
+    var inferenceTimes: List[Long] = List()
+    for (i <- 1 to totalRuns) {
+      NDArrayCollector.auto().withScope {
+        val startTimeSingle = System.currentTimeMillis()
+        objectToRun.runSingleInference(loadedModel, dataSet)
+        val estimatedTimeSingle = System.currentTimeMillis() - startTimeSingle
+        inferenceTimes = estimatedTimeSingle :: inferenceTimes
+        logger.info("Inference time at iteration: %d is : %d \n".format(i, estimatedTimeSingle))
+      }
+    }
+
+    inferenceTimes
+  }
+
+  def runBatchInference(objecToRun: InferBase, loadedModel: Any, dataSetBatches: List[Any]):
+  List[Long] = {
+
+    var inferenceTimes: List[Long] = List()
+    for (batch <- dataSetBatches) {
+      NDArrayCollector.auto().withScope {
+        val loadedBatch = objecToRun.loadInputBatch(batch)
+        val startTimeSingle = System.currentTimeMillis()
+        objecToRun.runBatchInference(loadedModel, loadedBatch)
+        val estimatedTimeSingle = System.currentTimeMillis() - startTimeSingle
+        inferenceTimes = estimatedTimeSingle :: inferenceTimes
+        logger.info("Batch Inference time is : %d \n".format(estimatedTimeSingle))
+      }
+    }
+
+    inferenceTimes
+  }
+
+  def percentile(p: Int, seq: Seq[Long]): Long = {
+    val sorted = seq.sorted
+    val k = math.ceil((seq.length - 1) * (p / 100.0)).toInt
+    sorted(k)
+  }
+
+  def printStatistics(inferenceTimes: List[Long], metricsPrefix: String)  {
+
+    val times: Seq[Long] = inferenceTimes
+    val p50 = percentile(50, times)
+    val p99 = percentile(99, times)
+    val average = times.sum / (times.length * 1.0)
+
+    logger.info("\n%s_p99 %d, %s_p50 %d, %s_average %1.2f".format(metricsPrefix,
+      p99, metricsPrefix, p50, metricsPrefix, average))
+
+  }
+
+  def main(args: Array[String]): Unit = {
+
+    var context = Context.cpu()
+    if (System.getenv().containsKey("SCALA_TEST_ON_GPU") &&
+      System.getenv("SCALA_TEST_ON_GPU").toInt == 1) {
+      context = Context.gpu()
+    }
+    var baseCLI : CLIParserBase = null
+    try {
+      val exampleName = args(1)
+      val exampleToBenchmark : InferBase = exampleName match {
+        case "ImageClassifierExample" => {
+          val imParser = new org.apache.mxnetexamples.infer.imageclassifier.CLIParser
+          baseCLI = imParser
+          val parsedVals = new CmdLineParser(imParser).parseArgument(args.toList.asJava)
+          new ImageClassifierExample(imParser)
+        }
+        case _ => throw new Exception("Invalid example name to run")
+      }
+
+      logger.info("Running single inference call")
+      // Benchmarking single inference call
+      NDArrayCollector.auto().withScope {
+        val loadedModel = loadModel(exampleToBenchmark, context)
+        val dataSet = loadDataSet(exampleToBenchmark)
+        val inferenceTimes = runInference(exampleToBenchmark, loadedModel, dataSet, baseCLI.count)
+        printStatistics(inferenceTimes, "single_inference")
+      }
+
+      if (baseCLI.batchSize != 0) {
+        logger.info("Running for batch inference call")
+        // Benchmarking batch inference call
+        NDArrayCollector.auto().withScope {
+          val loadedModel = loadModel(exampleToBenchmark, context)
+          val batchDataSet = loadBatchDataSet(exampleToBenchmark, baseCLI.batchSize)
+          val inferenceTimes = runBatchInference(exampleToBenchmark, loadedModel, batchDataSet)
+          printStatistics(inferenceTimes, "batch_inference")
+        }
+      }
+
+    } catch {
+      case ex: Exception => {
+        logger.error(ex.getMessage, ex)
+        new CmdLineParser(baseCLI).printUsage(System.err)
+        sys.exit(1)
+      }
+    }
+  }
+
+}
+
+class CLIParserBase {
+  @Option(name = "--example", usage = "The scala example to benchmark")
+  val exampleName: String = "ImageClassifierExample"
+  @Option(name = "--count", usage = "number of times to run inference")
+  val count: Int = 1000
+  @Option(name = "--batchSize", usage = "BatchSize to run batchinference calls", required = false)
+  val batchSize: Int = 0
+}