tensorflow
diff --git a/‎lstm-text-generation/.babelrc
Lines changed: 1 addition & 1 deletion b/‎lstm-text-generation/.babelrc
Lines changed: 1 addition & 1 deletion
diff --git a/‎lstm-text-generation/.gitignore
Lines changed: 1 addition & 0 deletions b/‎lstm-text-generation/.gitignore
Lines changed: 1 addition & 0 deletions
diff --git a/‎lstm-text-generation/README.md
Lines changed: 59 additions & 0 deletions b/‎lstm-text-generation/README.md
Lines changed: 59 additions & 0 deletions
diff --git a/‎lstm-text-generation/data.js
Lines changed: 61 additions & 1 deletion b/‎lstm-text-generation/data.js
Lines changed: 61 additions & 1 deletion
diff --git a/‎lstm-text-generation/data_test.js
Lines changed: 79 additions & 0 deletions b/‎lstm-text-generation/data_test.js
Lines changed: 79 additions & 0 deletions
diff --git a/‎lstm-text-generation/gen_node.js
Lines changed: 104 additions & 0 deletions b/‎lstm-text-generation/gen_node.js
Lines changed: 104 additions & 0 deletions
@@ -13,6 +13,6 @@
     ]
   ],
   "plugins": [
-    "@babel/plugin-transform-runtime"
+    "transform-runtime"
   ]
 }
@@ -0,0 +1 @@
+*.txt
@@ -1,4 +1,6 @@
 # TensorFlow.js Example: Train LSTM to Generate Text
+ 
+[See this example live!](https://storage.googleapis.com/tfjs-examples/lstm-text-generation/dist/index.html)
 
 ## Overview
 
@@ -35,6 +37,63 @@ https://github.com/keras-team/keras/blob/master/examples/lstm_text_generation.py
 
 ## Usage
 
+### Running the Web Demo
+
+The web demo supports model training and text generation. To launch the demo, do:
+
 ```sh
 yarn && yarn watch
 ```
+
+### Training Models in Node.js
+
+Training a model in Node.js should give you faster performance than training it
+in the browser.
+
+To start a training job, enter command lines such as:
+
+```sh
+yarn
+yarn train shakespeare \
+    --lstmLayerSize 128,128 \
+    --epochs 120 \
+    --savePath ./my-shakespeare-model
+```
+
+- The first argument to `yarn train` (`shakespeare`) specifies what text corpus
+  to train the model on. See the console output of `yarn train --help` for a set
+  of supported text data.
+- The argument `--lstmLayerSize 128,128` specifies that the next-character
+  prediction model should contain two LSTM layers stacked on top of each other,
+  each with 128 units.
+- The flag `--epochs` is used to specify the number of training epochs.
+- The argument `--savePath ...` lets the training script save the model at the
+  specified path once the training completes.
+
+If you have a CUDA-enabled GPU set up properly on your system, you can
+add the `--gpu` flag to the command line to train the model on the GPU, which
+should give you a further performance boost.
+
+### Generating Text in Node.js using Saved Model Files
+
+The example command line above generates a set of model files in the 
+`./my-shakespeare-model` folder after the completion of the training. You can
+load the model and use it to generate text. For example:
+
+```sh
+yarn gen shakespeare ./my-shakespeare-model/model.json \
+    --genLength 250 \
+    --temperature 0.6
+```
+
+The command will randomly sample a snippet of text from the shakespeare
+text corpus and use it as the seed to generate text.
+
+- The first argument (`shakespeare`) specifies the text corpus.
+- The second argument specifies the path to the saved JSON file for the
+  model, which has been generated in the previous section.
+- The `--genLength` flag allows you to specify how many characters
+  to generate.
+- The `--temperature` flag allows you to specify the stochasticity (randomness)
+  of the generation process. It should be a number greater than or equal to
+  zero. The higher the value is, the more random the generated text will be.
@@ -17,6 +17,29 @@
 
 import * as tf from '@tensorflow/tfjs';
 
+/**
+ * Text corpora available to this example, keyed by dataset name.
+ *
+ * Each entry has:
+ *   - `url`: where the raw text of the corpus can be downloaded from.
+ *   - `needle`: a short descriptive string for the corpus (presumably the
+ *     label shown to the user -- confirm against the UI code).
+ */
+// TODO(cais): Support user-supplied text data.
+export const TEXT_DATA_URLS = {
+  'nietzsche': {
+    url:
+        'https://storage.googleapis.com/tfjs-examples/lstm-text-generation/data/nietzsche.txt',
+    needle: 'Nietzsche'
+  },
+  'julesverne': {
+    url:
+        'https://storage.googleapis.com/tfjs-examples/lstm-text-generation/data/t1.verne.txt',
+    needle: 'Jules Verne'
+  },
+  'shakespeare': {
+    url:
+        'https://storage.googleapis.com/tfjs-examples/lstm-text-generation/data/t8.shakespeare.txt',
+    needle: 'Shakespeare'
+  },
+  'tfjs-code': {
+    // The pinned package version matches the version named in `needle`.
+    url: 'https://cdn.jsdelivr.net/npm/@tensorflow/tfjs@0.11.7/dist/tf.js',
+    needle: 'TensorFlow.js Code (Compiled, 0.11.7)'
+  }
+};
+
+
 /**
  * A class for text data.
  *
@@ -38,6 +61,13 @@ export class TextData {
    *   example of the training data (in `textString`) to the next.
    */
   constructor(dataIdentifier, textString, sampleLen, sampleStep) {
+    tf.util.assert(
+        sampleLen > 0,
+        `Expected sampleLen to be a positive integer, but got ${sampleLen}`);
+    tf.util.assert(
+        sampleStep > 0,
+        `Expected sampleStep to be a positive integer, but got ${sampleStep}`);
+
     if (!dataIdentifier) {
       throw new Error('Model identifier is not provided.');
     }
@@ -51,7 +81,6 @@ export class TextData {
 
     this.getCharSet_();
     this.convertAllTextToIndices_();
-    this.generateExampleBeginIndices_();
   }
 
   /**
@@ -98,6 +127,12 @@ export class TextData {
    *   `ys` has the shape of `[numExamples, this.charSetSize]`.
    */
   nextDataEpoch(numExamples) {
+    this.generateExampleBeginIndices_();
+
+    if (numExamples == null) {
+      numExamples = this.exampleBeginIndices_.length;
+    }
+
     const xsBuffer = new tf.TensorBuffer([
         numExamples, this.sampleLen_, this.charSetSize_]);
     const ysBuffer  = new tf.TensorBuffer([numExamples, this.charSetSize_]);
@@ -199,3 +234,28 @@ export class TextData {
     this.examplePosition_ = 0;
   }
 }
+
+/**
+ * Get a file by downloading it if necessary.
+ *
+ * The download is skipped when `destPath` already exists and is non-empty.
+ * This function uses the Node.js built-in `fs` and `https` modules.
+ *
+ * @param {string} sourceURL URL to download the file from.
+ * @param {string} destPath Destination file path on local filesystem.
+ * @returns {Promise<void>} Resolves once the file is available at `destPath`.
+ *   Rejects if the request fails, the server does not answer with HTTP 200,
+ *   or writing to `destPath` fails.
+ */
+export async function maybeDownload(sourceURL, destPath) {
+  // Loaded lazily inside the function so that merely importing this module
+  // does not require these Node.js-only modules.
+  const fs = require('fs');
+  const https = require('https');
+
+  // Nothing to do if a non-empty copy is already on disk.
+  if (fs.existsSync(destPath) && fs.lstatSync(destPath).size !== 0) {
+    return;
+  }
+
+  console.log(`Downloading file from ${sourceURL} to ${destPath}...`);
+  await new Promise((resolve, reject) => {
+    const request = https.get(sourceURL, response => {
+      if (response.statusCode !== 200) {
+        // Drain the response so the socket is released, then fail instead of
+        // saving an error page as if it were the requested file.
+        response.resume();
+        reject(new Error(
+            `Failed to download ${sourceURL}: HTTP status ` +
+            `${response.statusCode}`));
+        return;
+      }
+      const localFile = fs.createWriteStream(destPath);
+      localFile.on('error', reject);
+      localFile.on('finish', () => localFile.close(() => resolve()));
+      response.on('error', reject);
+      response.pipe(localFile);
+    });
+    // Connection-level failures (DNS, TLS, reset) surface on the request.
+    request.on('error', reject);
+  });
+}
@@ -0,0 +1,79 @@
+/**
+ * @license
+ * Copyright 2019 Google LLC. All Rights Reserved.
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ * =============================================================================
+ */
+
+import {TextData} from './data';
+
+// tslint:disable:max-line-length
+const FAKE_TEXT = `Lorem ipsum dolor sit amet, consectetur adipiscing elit. Suspendisse tempor aliquet justo non varius. Curabitur eget convallis velit. Vivamus malesuada, tortor ut finibus posuere, libero lacus eleifend felis, sit amet tempus dolor magna id nibh. Praesent non turpis libero. Praesent luctus, neque vitae suscipit suscipit, arcu neque aliquam justo, eget gravida diam augue nec lorem. Etiam scelerisque vel nibh sit amet maximus. Praesent et dui quis elit bibendum elementum a eget velit. Mauris porta lorem ac porttitor congue. Vestibulum lobortis ultrices velit, vitae condimentum elit ultrices a. Vivamus rutrum ultrices eros ac finibus. Orci varius natoque penatibus et magnis dis parturient montes, nascetur ridiculus mus. Morbi a purus a nibh eleifend convallis. Praesent non turpis volutpat, imperdiet lacus in, cursus tellus. Etiam elit velit, ornare sit amet nulla vel, aliquam iaculis mauris.
+
+Phasellus sed sem ut justo sollicitudin cursus at sed neque. Proin tempor finibus nisl, nec aliquam leo porta at. Nullam vel mauris et neque pellentesque laoreet sit amet eu risus. Sed sed ante sed enim hendrerit commodo. Etiam blandit aliquet molestie. Nullam dictum imperdiet enim, quis scelerisque nunc ultricies sit amet. Praesent dictum dictum lobortis. Sed ut ipsum at orci commodo congue.
+
+Aenean pharetra mollis erat, id convallis ante elementum at. Cras semper turpis nec lorem tempus ultrices. Sed eget purus vel est blandit dictum. Praesent auctor, sapien non consequat pellentesque, risus orci sagittis leo, at cursus nibh nisi vel quam. Morbi et orci id quam dictum efficitur ac iaculis nisl. Donec at nunc et nibh accumsan malesuada eu in odio. Donec quis elementum turpis. Vestibulum pretium rhoncus orci, nec gravida nisl hendrerit pellentesque. Cras imperdiet odio a quam mollis, in aliquet neque efficitur. Praesent at tincidunt ipsum. Maecenas neque risus, pretium ut orci sit amet, dignissim auctor dui. Sed finibus nunc elit, rhoncus ornare dui pharetra vitae. Sed ut iaculis ex. Quisque quis molestie ligula. Vivamus egestas rhoncus mollis.
+
+Pellentesque volutpat ipsum vitae ex interdum, eu rhoncus dolor fringilla. Suspendisse potenti. Maecenas in sem leo. Curabitur vestibulum porta vulputate. Nunc quis consectetur enim. Aliquam congue, augue in commodo porttitor, sem tellus posuere augue, ut aliquam sapien massa in est. Duis convallis pellentesque vehicula. Mauris ipsum urna, congue consequat posuere sed, euismod nec mauris. Praesent sollicitudin scelerisque scelerisque. Ut commodo nisl vitae nunc feugiat auctor. Praesent imperdiet magna facilisis nunc vulputate, vel suscipit leo consequat. Duis fermentum rutrum ipsum a laoreet. Nunc dictum libero in quam pellentesque, sit amet tempus tellus suscipit. Curabitur pharetra erat bibendum malesuada rhoncus.
+
+Donec laoreet leo ligula, ut condimentum mi placerat ut. Sed pretium sollicitudin nisl quis tincidunt. Proin id nisl ornare, interdum lorem quis, posuere lacus. Cras cursus mollis scelerisque. Mauris mattis mi sed orci feugiat, et blandit velit tincidunt. Donec ultrices leo vel tellus tincidunt, id vehicula mi commodo. Nulla egestas mollis massa. Etiam blandit nisl eu risus luctus viverra. Mauris eget mi sem.
+
+`;
+// tslint:enable:max-line-length
+
+// Unit tests for TextData, all run against the lorem-ipsum fixture above.
+describe('TextData', () => {
+  const SAMPLE_LEN = 20;
+  const SAMPLE_STEP = 3;
+
+  // Builds a fresh TextData instance so that tests do not share state.
+  const createTextData = () =>
+      new TextData('LoremIpsum', FAKE_TEXT, SAMPLE_LEN, SAMPLE_STEP);
+
+  // Shape expectations common to full and partial epochs.
+  const expectEpochShapes = (xs, ys) => {
+    expect(xs.rank).toEqual(3);
+    expect(ys.rank).toEqual(2);
+    expect(xs.shape[1]).toEqual(20);
+    expect(xs.shape[2]).toEqual(ys.shape[1]);
+  };
+
+  it('Creation', () => {
+    const textData = createTextData();
+    expect(textData.sampleLen()).toEqual(20);
+    expect(textData.charSetSize()).toBeGreaterThan(0);
+  });
+
+  it('nextDataEpoch: full pass', () => {
+    // No argument: the epoch covers every available example.
+    const epoch = createTextData().nextDataEpoch();
+    const xs = epoch[0];
+    const ys = epoch[1];
+    expectEpochShapes(xs, ys);
+    expect(xs.shape[0]).toEqual(ys.shape[0]);
+  });
+
+  it('nextDataEpoch: partial pass', () => {
+    // Explicit example count: both tensors must have exactly that many rows.
+    const epoch = createTextData().nextDataEpoch(4);
+    const xs = epoch[0];
+    const ys = epoch[1];
+    expectEpochShapes(xs, ys);
+    expect(xs.shape[0]).toEqual(4);
+    expect(ys.shape[0]).toEqual(4);
+  });
+
+  it('getFromCharSet', () => {
+    const textData = createTextData();
+    const lastIndex = textData.charSetSize() - 1;
+    const firstChar = textData.getFromCharSet(0);
+    expect(firstChar).not.toEqual(textData.getFromCharSet(1));
+    expect(firstChar).not.toEqual(textData.getFromCharSet(lastIndex));
+    // Indices outside [0, charSetSize) yield undefined.
+    expect(textData.getFromCharSet(lastIndex + 1)).toBeUndefined();
+    expect(textData.getFromCharSet(-1)).toBeUndefined();
+  });
+
+  it('getRandomSlice', () => {
+    const slice = createTextData().getRandomSlice();
+    const text = slice[0];
+    const indices = slice[1];
+    expect(typeof text).toEqual('string');
+    expect(Array.isArray(indices)).toEqual(true);
+  });
+});
+
@@ -0,0 +1,104 @@
+/**
+ * @license
+ * Copyright 2019 Google LLC. All Rights Reserved.
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ * =============================================================================
+ */
+
+/**
+ * Use a trained next-character prediction model to generate some text. 
+ */
+
+import * as fs from 'fs';
+import * as os from 'os';
+import * as path from 'path';
+import * as argparse from 'argparse';
+
+import * as tf from '@tensorflow/tfjs';
+
+import {maybeDownload, TextData, TEXT_DATA_URLS} from './data';
+import {generateText} from './model';
+
+/**
+ * Parse the command-line arguments of the text-generation script.
+ *
+ * Positional arguments: `textDatasetName` (one of the keys of
+ * `TEXT_DATA_URLS`) and `modelJSONPath`. Optional flags: `--genLength`,
+ * `--temperature`, `--gpu` and `--sampleStep`.
+ *
+ * @returns {Object} The parsed arguments, as returned by `parser.parseArgs()`.
+ */
+function parseArgs() {
+  const parser = new argparse.ArgumentParser({
+    // This script only generates text; it does not train a model.
+    description:
+        'Generate text using a trained lstm-text-generation model.'
+  });
+  parser.addArgument('textDatasetName', {
+    type: 'string',
+    choices: Object.keys(TEXT_DATA_URLS),
+    help: 'Name of the text dataset'
+  });
+  parser.addArgument('modelJSONPath', {
+    type: 'string',
+    help: 'Path to the trained next-char prediction model saved on disk ' +
+    '(e.g., ./my-model/model.json)'
+  });
+  parser.addArgument('--genLength', {
+    type: 'int',
+    defaultValue: 200,
+    help: 'Length of the text to generate.'
+  });
+  parser.addArgument('--temperature', {
+    type: 'float',
+    defaultValue: 0.5,
+    help: 'Temperature value to use for text generation. Higher values ' +
+    'lead to more random-looking generation results.'
+  });
+  parser.addArgument('--gpu', {
+    action: 'storeTrue',
+    help: 'Use CUDA GPU for text generation.'
+  });
+  parser.addArgument('--sampleStep', {
+    type: 'int',
+    defaultValue: 3,
+    help: 'Step length: how many characters to skip between one example ' +
+    'extracted from the text data to the next.'
+  });
+  return parser.parseArgs();
+}
+
+/**
+ * Entry point: load a saved model, fetch the chosen text corpus, pick a
+ * random seed snippet from it and print the text generated from that seed.
+ */
+async function main() {
+  const cliArgs = parseArgs();
+
+  // The package is required only for its side effects (its exports are not
+  // used here); presumably it registers the native backend -- confirm.
+  if (!cliArgs.gpu) {
+    console.log('Using CPU');
+    require('@tensorflow/tfjs-node');
+  } else {
+    console.log('Using GPU');
+    require('@tensorflow/tfjs-node-gpu');
+  }
+
+  // Load the model from the local filesystem.
+  const modelURL = `file://${cliArgs.modelJSONPath}`;
+  const model = await tf.loadModel(modelURL);
+
+  // The second dimension of the model's first input is used as the sample
+  // length of the text data.
+  const firstInputShape = model.inputs[0].shape;
+  const sampleLen = firstInputShape[1];
+
+  // Fetch the corpus into the OS temp directory (if needed) and wrap it in
+  // a text data object.
+  const corpusURL = TEXT_DATA_URLS[cliArgs.textDatasetName].url;
+  const corpusPath = path.join(os.tmpdir(), path.basename(corpusURL));
+  await maybeDownload(corpusURL, corpusPath);
+  const corpus = fs.readFileSync(corpusPath, {encoding: 'utf-8'});
+  const textData =
+      new TextData('text-data', corpus, sampleLen, cliArgs.sampleStep);
+
+  // Get a seed text from the text data object.
+  const seedSlice = textData.getRandomSlice();
+  const seed = seedSlice[0];
+  const seedIndices = seedSlice[1];
+
+  console.log(`Seed text:\n"${seed}"\n`);
+
+  const generated = await generateText(
+      model, textData, seedIndices, cliArgs.genLength, cliArgs.temperature);
+
+  console.log(`Generated text:\n"${generated}"\n`);
+}
+
+main();
Original file line number	Diff line number	Diff line change
`@@ -13,6 +13,6 @@`
`13`	`13`	`]`
`14`	`14`	`],`
`15`	`15`	`"plugins": [`
`16`		`- "@babel/plugin-transform-runtime"`
	`16`	`+ "transform-runtime"`
`17`	`17`	`]`
`18`	`18`	`}`