tensorflow
diff --git a/‎lstm-text-generation/.babelrc
+18 b/‎lstm-text-generation/.babelrc
+18
diff --git a/‎lstm-text-generation/README.md
+40 b/‎lstm-text-generation/README.md
+40
diff --git a/‎lstm-text-generation/data.js
+201 b/‎lstm-text-generation/data.js
+201
@@ -0,0 +1,18 @@
+{
+  "presets": [
+    [
+      "env",
+      {
+        "esmodules": false,
+        "targets": {
+          "browsers": [
+            "> 3%"
+          ]
+        }
+      }
+    ]
+  ],
+  "plugins": [
+    "transform-runtime"
+  ]
+}
@@ -0,0 +1,40 @@
+# TensorFlow.js Example: Train LSTM to Generate Text
+
+## Overview
+
+This example illustrates how to use TensorFlow.js to train a LSTM model to
+generate random text based on the patterns in a text corpus such as
+Nietzsche's writing or the source code of TensorFlow.js itself.
+
+The LSTM model operates at the character level. It takes a tensor of
+shape `[numExamples, sampleLen, charSetSize]` as the input. The input is a
+one-hot encoding of sequences of `sampleLen` characters. The characters
+belong to a set of `charSetSize` unique characters. With the input, the model
+outputs a tensor of shape `[numExamples, charSetSize]`, which represents the
+model's predicted probabilites of the character that follows the input sequence.
+The application then draws a random sample based on the predicted
+probabilities to get the next character. Once the next character is obtained,
+its one-hot encoding is concatenated with the previous input sequence to form
+the input for the next time step. This process is repeated in order to generate
+a character sequence of a given length. The randomness (diversity) is controlled
+by a temperature parameter.
+
+The UI allows creation of models consisting of a single
+[LSTM layer](https://js.tensorflow.org/api/latest/#layers.lstm) or multiple,
+stacked LSTM layers.
+
+This example also illustrates how to save a trained model in the browser's
+IndexedDB using TensorFlow.js's
+[model saving API](https://js.tensorflow.org/tutorials/model-save-load.html),
+so that the result of the training
+may persist across browser sessions. Once a previously-trained model is loaded
+from the IndexedDB, it can be used in text generation and/or further training.
+
+This example is inspired by the LSTM text generation example from Keras:
+https://github.com/keras-team/keras/blob/master/examples/lstm_text_generation.py
+
+## Usage
+
+```sh
+yarn && yarn watch
+```
@@ -0,0 +1,201 @@
+/**
+ * @license
+ * Copyright 2018 Google LLC. All Rights Reserved.
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ * =============================================================================
+ */
+
+import * as tf from '@tensorflow/tfjs';
+
+/**
+ * A class for text data.
+ *
+ * This class manages the following:
+ *
+ * - Converting training data (as a string) into one-hot encoded vectors.
+ * - Drawing random slices from the training data. This is useful for training
+ *   models and obtaining the seed text for model-based text generation.
+ */
+export class TextData {
+  /**
+   * Constructor of TextData.
+   *
+   * @param {string} dataIdentifier An identifier for this instance of TextData.
+   * @param {string} textString The training text data.
+   * @param {number} sampleLen Length of each training example, i.e., the input
+   *   sequence length expected by the LSTM model.
+   * @param {number} sampleStep How many characters to skip when going from one
+   *   example of the training data (in `textString`) to the next.
+   */
+  constructor(dataIdentifier, textString, sampleLen, sampleStep) {
+    if (!dataIdentifier) {
+      throw new Error('Model identifier is not provided.');
+    }
+
+    this.dataIdentifier_ = dataIdentifier;
+
+    this.textString_ = textString;
+    this.textLen_ = textString.length;
+    this.sampleLen_ = sampleLen;
+    this.sampleStep_ = sampleStep;
+
+    this.getCharSet_();
+    this.convertAllTextToIndices_();
+    this.generateExampleBeginIndices_();
+  }
+
+  /**
+   * Get data identifier.
+   *
+   * @returns {string} The data identifier.
+   */
+  dataIdentifier() {
+    return this.dataIdentifier_;
+  }
+
+  /**
+   * Get length of the training text data.
+   *
+   * @returns {number} Length of training text data.
+   */
+  textLen() {
+    return this.textLen_;
+  }
+
+  /**
+   * Get the length of each training example.
+   */
+  sampleLen() {
+    return this.sampleLen_;
+  }
+
+  /**
+   * Get the size of the character set.
+   *
+   * @returns {number} Size of the character set, i.e., how many unique
+   *   characters there are in the training text data.
+   */
+  charSetSize() {
+    return this.charSetSize_;
+  }
+
+  /**
+   * Generate the next epoch of data for training models.
+   *
+   * @param {number} numExamples Number examples to generate.
+   * @returns {[tf.Tensor, tf.Tensor]} `xs` and `ys` Tensors.
+   *   `xs` has the shape of `[numExamples, this.sampleLen, this.charSetSize]`.
+   *   `ys` has the shape of `[numExamples, this.charSetSize]`.
+   */
+  nextDataEpoch(numExamples) {
+    const xsBuffer = new tf.TensorBuffer([
+        numExamples, this.sampleLen_, this.charSetSize_]);
+    const ysBuffer  = new tf.TensorBuffer([numExamples, this.charSetSize_]);
+    for (let i = 0; i < numExamples; ++i) {
+      const beginIndex = this.exampleBeginIndices_[
+          this.examplePosition_ % this.exampleBeginIndices_.length];
+      for (let j = 0; j < this.sampleLen_; ++j) {
+        xsBuffer.set(1, i, j, this.indices_[beginIndex + j]);
+      }
+      ysBuffer.set(1, i, this.indices_[beginIndex + this.sampleLen_]);
+      this.examplePosition_++;
+    }
+    return [xsBuffer.toTensor(), ysBuffer.toTensor()];
+  }
+
+  /**
+   * Get the unique character at given index from the character set.
+   *
+   * @param {number} index
+   * @returns {string} The unique character at `index` of the character set.
+   */
+  getFromCharSet(index) {
+    return this.charSet_[index];
+  }
+
+  /**
+   * Convert text string to integer indices.
+   *
+   * @param {string} text Input text.
+   * @returns {number[]} Indices of the characters of `text`.
+   */
+  textToIndices(text) {
+    const indices = [];
+    for (let i = 0; i < text.length; ++i) {
+      indices.push(this.charSet_.indexOf(text[i]));
+    }
+    return indices;
+  }
+
+  /**
+   * Get a random slice of text data.
+   *
+   * @returns {[string, number[]} The string and index representation of the
+   *   same slice.
+   */
+  getRandomSlice() {
+    const startIndex =
+        Math.round(Math.random() * (this.textLen_ - this.sampleLen_ - 1));
+    const textSlice = this.slice_(startIndex, startIndex + this.sampleLen_);
+    return [textSlice, this.textToIndices(textSlice)];
+  }
+
+  /**
+   * Get a slice of the training text data.
+   *
+   * @param {number} startIndex
+   * @param {number} endIndex
+   * @param {bool} useIndices Whether to return the indices instead of string.
+   * @returns {string | Uint16Array} The result of the slicing.
+   */
+  slice_(startIndex, endIndex) {
+    return this.textString_.slice(startIndex, endIndex);
+  }
+
+  /**
+   * Get the set of unique characters from text.
+   */
+  getCharSet_() {
+    this.charSet_ = [];
+    for (let i = 0; i < this.textLen_; ++i) {
+      if (this.charSet_.indexOf(this.textString_[i]) === -1) {
+        this.charSet_.push(this.textString_[i]);
+      }
+    }
+    this.charSetSize_ = this.charSet_.length;
+  }
+
+  /**
+   * Convert all training text to integer indices.
+   */
+  convertAllTextToIndices_() {
+    this.indices_ = new Uint16Array(this.textToIndices(this.textString_));
+  }
+
+  /**
+   * Generate the example-begin indices; shuffle them randomly.
+   */
+  generateExampleBeginIndices_() {
+    // Prepare beginning indices of examples.
+    this.exampleBeginIndices_ = [];
+    for (let i = 0;
+        i < this.textLen_ - this.sampleLen_ - 1;
+        i += this.sampleStep_) {
+      this.exampleBeginIndices_.push(i);
+    }
+
+    // Randomly shuffle the beginning indices.
+    tf.util.shuffle(this.exampleBeginIndices_);
+    this.examplePosition_ = 0;
+  }
+}