Skip to content

Commit fb2677e

Browse files
authored
Support benchmarking models by CLI and BrowserStack (#3641)
FEATURE
1 parent a0d6250 commit fb2677e

File tree

7 files changed

+1349
-23
lines changed

7 files changed

+1349
-23
lines changed

e2e/benchmarks/benchmark_models.js

+79
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,79 @@
1+
/**
2+
* @license
3+
* Copyright 2020 Google LLC. All Rights Reserved.
4+
* Licensed under the Apache License, Version 2.0 (the "License");
5+
* you may not use this file except in compliance with the License.
6+
* You may obtain a copy of the License at
7+
*
8+
* http://www.apache.org/licenses/LICENSE-2.0
9+
*
10+
* Unless required by applicable law or agreed to in writing, software
11+
* distributed under the License is distributed on an "AS IS" BASIS,
12+
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13+
* See the License for the specific language governing permissions and
14+
* limitations under the License.
15+
* =============================================================================
16+
*/
17+
18+
/**
19+
* The purpose of this test file is to benchmark models by a test runner, such
20+
* as karma. To invoke this test, include this file in the `files` field of
21+
* `karma.conf.js`.
22+
*
23+
* This file wraps the model benchmarking into a Jasmine test and the benchmark
24+
* results will be logged to the console.
25+
*/
26+
27+
/**
 * Builds a human-readable summary of the active TensorFlow.js environment:
 * the backend name plus backend-specific details (WebGL version, or WASM
 * SIMD availability).
 *
 * @returns {Promise<string>} e.g. "webgl backend, version 2".
 */
async function getEnvSummary() {
  const backend = tf.getBackend();
  let summary = `${backend} backend`;
  switch (backend) {
    case 'webgl':
      summary += `, version ${tf.env().get('WEBGL_VERSION')}`;
      break;
    case 'wasm': {
      // SIMD support is only known asynchronously for the wasm backend.
      const simdSupported = await tf.env().getAsync('WASM_HAS_SIMD_SUPPORT');
      summary += simdSupported ? ' with SIMD' : ' without SIMD';
      break;
    }
    default:
      // Other backends (cpu, ...) have no extra details to report.
      break;
  }
  return summary;
}
37+
38+
/**
 * Composes a multi-line, human-readable summary of benchmark results for
 * logging to the console.
 *
 * @param timeInfo Timing results, with fields `times` (non-empty array),
 *     `averageTime` and `minTime`, as produced by `profileInferenceTime`.
 * @param memoryInfo Memory results with a `peakBytes` field, as produced by
 *     `profileInferenceMemory`.
 * @param modelName The model name to show in the summary text.
 * @returns {Promise<string>} The formatted benchmark summary.
 * @throws When `timeInfo` or `memoryInfo` is missing, or `timeInfo.times`
 *     is empty.
 */
async function getBenchmarkSummary(timeInfo, memoryInfo, modelName = 'model') {
  // Bug fix: the error messages were previously mismatched with their
  // conditions (the empty-times branch reported a missing memoryInfo and
  // vice versa). The memoryInfo null-check also now runs before the
  // times-length check, so each failure reports its true cause.
  if (timeInfo == null) {
    throw new Error('Missing the timeInfo parameter.');
  } else if (memoryInfo == null) {
    throw new Error('Missing the memoryInfo parameter.');
  } else if (timeInfo.times.length === 0) {
    throw new Error('The length of timeInfo.times is at least 1.');
  }

  const numRuns = timeInfo.times.length;
  const envSummary = await getEnvSummary();
  const benchmarkSummary = `
  benchmark the ${modelName} on ${envSummary}
  1st inference time: ${printTime(timeInfo.times[0])}
  Average inference time (${numRuns} runs): ${printTime(timeInfo.averageTime)}
  Best inference time: ${printTime(timeInfo.minTime)}
  Peak memory: ${printMemory(memoryInfo.peakBytes)}
  `;
  return benchmarkSummary;
}
58+
59+
/**
 * Jasmine suite that benchmarks MobileNet so a test runner (e.g. karma)
 * executes the benchmark and logs the summary to the console.
 */
describe('benchmark models', () => {
  beforeAll(() => {
    // Downloading the model and running 20 inferences can take a while,
    // so raise Jasmine's per-spec timeout.
    jasmine.DEFAULT_TIMEOUT_INTERVAL = 1000000;
  });

  it('mobile net', async () => {
    const modelUrl =
        'https://storage.googleapis.com/learnjs-data/mobilenet_v2_100_fused/model.json';
    const model = await tf.loadGraphModel(modelUrl);
    const modelInput = generateInput(model);
    const runPredict = () => model.predict(modelInput);

    const numRuns = 20;
    const timeInfo = await profileInferenceTime(runPredict, numRuns);
    const memoryInfo = await profileInferenceMemory(runPredict);

    const summaryText =
        await getBenchmarkSummary(timeInfo, memoryInfo, 'mobilenet_v2');
    console.log(summaryText);
  });
});

e2e/benchmarks/benchmark_util.js

+36-11
Original file line numberDiff line numberDiff line change
@@ -119,8 +119,12 @@ function getPredictFnForModel(model, input) {
119119
/**
120120
* Executes the predict function for `model` (`model.predict` for tf.LayersModel
121121
* and `model.executeAsync` for tf.GraphModel) and times the inference process
122-
* for `numRuns` rounds. Then returns a promise that resolves with an array of
123-
* inference times for each inference process.
122+
* for `numRuns` rounds. Then returns a promise that resolves with information
123+
* about the model's inference time:
124+
* - `times`: an array of inference time for each inference
125+
* - `averageTime`: the average time of all inferences
126+
* - `minTime`: the minimum time of all inferences
127+
* - `maxTime`: the maximum time of all inferences
124128
*
125129
* The inference time contains the time spent by both `predict()` and `data()`
126130
* called by tensors in the prediction.
@@ -130,10 +134,13 @@ function getPredictFnForModel(model, input) {
130134
* 'https://tfhub.dev/google/imagenet/mobilenet_v2_140_224/classification/2';
131135
* const model = await tf.loadGraphModel(modelUrl, {fromTFHub: true});
132136
* const zeros = tf.zeros([1, 224, 224, 3]);
133-
* const elapsedTimeArray =
137+
* const timeInfo =
134138
* await profileInferenceTimeForModel(model, zeros, 2);
135139
*
136-
* console.log(`Elapsed time array: ${elapsedTimeArray}`);
140+
* console.log(`Elapsed time array: ${timeInfo.times}`);
141+
* console.log(`Average time: ${timeInfo.averageTime}`);
142+
* console.log(`Minimum time: ${timeInfo.minTime}`);
143+
* console.log(`Maximum time: ${timeInfo.maxTime}`);
137144
* ```
138145
*
139146
* @param model An instance of tf.GraphModel or tf.LayersModel for timing the
@@ -148,8 +155,12 @@ async function profileInferenceTimeForModel(model, input, numRuns = 1) {
148155

149156
/**
150157
* Executes `predict()` and times the inference process for `numRuns` rounds.
151-
* Then returns a promise that resolves with an array of inference time for each
152-
* inference process.
158+
* Then returns a promise that resolves with information about the inference
159+
* time:
160+
* - `times`: an array of inference time for each inference
161+
* - `averageTime`: the average time of all inferences
162+
* - `minTime`: the minimum time of all inferences
163+
* - `maxTime`: the maximum time of all inferences
153164
*
154165
* The inference time contains the time spent by both `predict()` and `data()`
155166
* called by tensors in the prediction.
@@ -159,10 +170,13 @@ async function profileInferenceTimeForModel(model, input, numRuns = 1) {
159170
* 'https://tfhub.dev/google/imagenet/mobilenet_v2_140_224/classification/2';
160171
* const model = await tf.loadGraphModel(modelUrl, {fromTFHub: true});
161172
* const zeros = tf.zeros([1, 224, 224, 3]);
162-
* const elapsedTimeArray =
173+
* const timeInfo =
163174
* await profileInferenceTime(() => model.predict(zeros), 2);
164175
*
165-
* console.log(`Elapsed time array: ${elapsedTimeArray}`);
176+
* console.log(`Elapsed time array: ${timeInfo.times}`);
177+
* console.log(`Average time: ${timeInfo.averageTime}`);
178+
* console.log(`Minimum time: ${timeInfo.minTime}`);
179+
* console.log(`Maximum time: ${timeInfo.maxTime}`);
166180
* ```
167181
*
168182
* @param predict The predict function to execute and time.
@@ -175,7 +189,7 @@ async function profileInferenceTime(predict, numRuns = 1) {
175189
`a(n) ${typeof predict} is found.`);
176190
}
177191

178-
const elapsedTimeArray = [];
192+
const times = [];
179193
for (let i = 0; i < numRuns; i++) {
180194
const start = performance.now();
181195
const res = await predict();
@@ -184,9 +198,20 @@ async function profileInferenceTime(predict, numRuns = 1) {
184198
const elapsedTime = performance.now() - start;
185199

186200
tf.dispose(res);
187-
elapsedTimeArray.push(elapsedTime);
201+
times.push(elapsedTime);
188202
}
189-
return elapsedTimeArray;
203+
204+
const averageTime = times.reduce((acc, curr) => acc + curr, 0) / times.length;
205+
const minTime = Math.min(...times);
206+
const maxTime = Math.max(...times);
207+
const timeInfo = {
208+
times,
209+
averageTime,
210+
minTime,
211+
maxTime
212+
213+
};
214+
return timeInfo;
190215
}
191216

192217
/**

e2e/benchmarks/benchmark_util_test.js

+22
Original file line numberDiff line numberDiff line change
@@ -34,6 +34,28 @@ describe('benchmark_util', () => {
3434
});
3535
});
3636

37+
describe('profile inference time', () => {
38+
describe('profileInferenceTime', () => {
39+
it('throws when passing in invalid predict', async () => {
40+
const predict = {};
41+
await expectAsync(profileInferenceTime(predict)).toBeRejected();
42+
});
43+
44+
it('does not add new tensors', async () => {
45+
const model = tf.sequential(
46+
{layers: [tf.layers.dense({units: 1, inputShape: [3]})]});
47+
const input = tf.zeros([1, 3]);
48+
49+
const tensorsBefore = tf.memory().numTensors;
50+
await profileInferenceTime(() => model.predict(input));
51+
expect(tf.memory().numTensors).toEqual(tensorsBefore);
52+
53+
model.dispose();
54+
input.dispose();
55+
});
56+
});
57+
});
58+
3759
describe('Profile Memory', () => {
3860
describe('profileInferenceMemory', () => {
3961
it('pass in invalid predict', async () => {

e2e/benchmarks/index.html

+10-12
Original file line numberDiff line numberDiff line change
@@ -255,21 +255,21 @@ <h2>TensorFlow.js Model Benchmark</h2>
255255
/**
 * Runs one warm-up inference and records the backend name and the first
 * inference time in the timing table.
 */
async function warmUpAndRecordTime() {
  await showMsg('Warming up');

  let timeInfo;
  if (state.benchmark === 'custom') {
    const input = generateInput(model);
    try {
      timeInfo = await profileInferenceTimeForModel(model, input, 1);
    } finally {
      // Always release the generated input tensor, even if profiling throws.
      tf.dispose(input);
    }
  } else {
    timeInfo = await profileInferenceTime(() => predict(model), 1);
  }

  await showMsg(null);
  appendRow(timeTable, 'backend', state.backend);
  appendRow(timeTable, '1st inference', printTime(timeInfo.times[0]));
}
}
274274

275275
async function showInputs() {
@@ -340,27 +340,25 @@ <h2>TensorFlow.js Model Benchmark</h2>
340340
await showMsg(`Running predict ${state.numRuns} times`);
341341
chartWidth = document.querySelector('#perf-trendline-container').getBoundingClientRect().width;
342342

343-
let times;
343+
let timeInfo;
344344
const numRuns = state.numRuns;
345345
if (state.benchmark === 'custom') {
346346
const input = generateInput(model);
347347
try {
348-
times = await profileInferenceTimeForModel(model, input, numRuns);
348+
timeInfo = await profileInferenceTimeForModel(model, input, numRuns);
349349
} finally {
350350
tf.dispose(input);
351351
}
352352
} else {
353-
times = await profileInferenceTime(() => predict(model), numRuns);
353+
timeInfo = await profileInferenceTime(() => predict(model), numRuns);
354354
}
355355

356356
const forceInferenceTrendYMinToZero = true;
357-
populateTrendline(document.querySelector('#perf-trendline-container'), times, forceInferenceTrendYMinToZero, printTime);
357+
populateTrendline(document.querySelector('#perf-trendline-container'), timeInfo.times, forceInferenceTrendYMinToZero, printTime);
358358

359359
await showMsg(null);
360-
const average = times.reduce((acc, curr) => acc + curr, 0) / times.length;
361-
const min = Math.min(...times);
362-
appendRow(timeTable, `Subsequent average(${state.numRuns} runs)`, printTime(average));
363-
appendRow(timeTable, 'Best time', printTime(min));
360+
appendRow(timeTable, `Subsequent average(${state.numRuns} runs)`, printTime(timeInfo.averageTime));
361+
appendRow(timeTable, 'Best time', printTime(timeInfo.minTime));
364362
}
365363

366364
async function profileMemory() {

e2e/benchmarks/karma.conf.js

+98
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,98 @@
1+
/**
2+
* @license
3+
* Copyright 2020 Google LLC. All Rights Reserved.
4+
* Licensed under the Apache License, Version 2.0 (the "License");
5+
* you may not use this file except in compliance with the License.
6+
* You may obtain a copy of the License at
7+
*
8+
* http://www.apache.org/licenses/LICENSE-2.0
9+
*
10+
* Unless required by applicable law or agreed to in writing, software
11+
* distributed under the License is distributed on an "AS IS" BASIS,
12+
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13+
* See the License for the specific language governing permissions and
14+
* limitations under the License.
15+
* =============================================================================
16+
*/
17+
18+
// Karma settings for running the benchmarks on a local Chrome browser.
const localRunConfig = {
  plugins: ['karma-jasmine', 'karma-chrome-launcher'],
  reporters: ['progress'],
  browsers: ['Chrome']
};

// Karma settings for running the benchmarks on BrowserStack. Credentials
// are read from the BROWSERSTACK_USERNAME and BROWSERSTACK_ACCESS_KEY
// environment variables.
const browserstackConfig = {
  hostname: 'bs-local.com',
  plugins: ['karma-jasmine', 'karma-browserstack-launcher'],
  reporters: ['progress', 'BrowserStack'],
  browserStack: {
    username: process.env.BROWSERSTACK_USERNAME,
    accessKey: process.env.BROWSERSTACK_ACCESS_KEY,
    apiClientEndpoint: 'https://api.browserstack.com'
  },

  // The browser/OS combinations to benchmark on.
  customLaunchers: {
    bs_chrome_mac: {
      base: 'BrowserStack',
      browser: 'chrome',
      browser_version: '84.0',
      os: 'OS X',
      os_version: 'Catalina',
    },
    bs_firefox_mac: {
      base: 'BrowserStack',
      browser: 'firefox',
      browser_version: '70.0',
      os: 'OS X',
      os_version: 'Catalina',
    },
    bs_safari_mac: {
      base: 'BrowserStack',
      browser: 'Safari',
      browser_version: '13.1',
      os: 'OS X',
      os_version: 'Catalina',
    }
  },

  browsers: ['bs_chrome_mac', 'bs_firefox_mac', 'bs_safari_mac'],
};
60+
61+
module.exports = function(config) {
62+
let extraConfig = null;
63+
if (config.browserstack) {
64+
extraConfig = browserstackConfig;
65+
} else {
66+
extraConfig = localRunConfig;
67+
}
68+
69+
config.set({
70+
...extraConfig,
71+
frameworks: ['jasmine'],
72+
files: [
73+
'https://unpkg.com/@tensorflow/tfjs-core@latest/dist/tf-core.js',
74+
'https://unpkg.com/@tensorflow/tfjs-backend-cpu@latest/dist/tf-backend-cpu.js',
75+
'https://unpkg.com/@tensorflow/tfjs-backend-webgl@latest/dist/tf-backend-webgl.js',
76+
'https://unpkg.com/@tensorflow/tfjs-layers@latest/dist/tf-layers.js',
77+
'https://unpkg.com/@tensorflow/tfjs-converter@latest/dist/tf-converter.js',
78+
'https://unpkg.com/@tensorflow/tfjs-backend-wasm@latest/dist/tf-backend-wasm.js',
79+
'util.js', 'benchmark_util.js', 'benchmark_models.js'
80+
],
81+
preprocessors: {},
82+
singleRun: true,
83+
captureTimeout: 3e5,
84+
reportSlowerThan: 500,
85+
browserNoActivityTimeout: 3e5,
86+
browserDisconnectTimeout: 3e5,
87+
browserDisconnectTolerance: 0,
88+
browserSocketTimeout: 1.2e5,
89+
client: {jasmine: {random: false}},
90+
91+
// The following configurations are generated by karma
92+
port: 9876,
93+
colors: true,
94+
logLevel: config.LOG_INFO,
95+
autoWatch: false,
96+
concurrency: Infinity
97+
})
98+
}

e2e/benchmarks/package.json

+22
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,22 @@
1+
{
2+
"name": "@tensorflow/tfjs-benchmark",
3+
"version": "0.0.1",
4+
"description": "Benchmark models' and ops' performance",
5+
"private": true,
6+
"repository": {
7+
"type": "git",
8+
"url": "https://github.com/tensorflow/tfjs"
9+
},
10+
"devDependencies": {
11+
"karma": "^4.4.1",
12+
"karma-browserstack-launcher": "^1.6.0",
13+
"karma-jasmine": "^3.3.1"
14+
},
15+
"scripts": {
16+
"test": "karma start"
17+
},
18+
"license": "Apache-2.0",
19+
"engines": {
20+
"yarn": ">= 1.0.0"
21+
}
22+
}

0 commit comments

Comments
 (0)