Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

completed lstm_cell #70

Merged
merged 2 commits into from
Apr 16, 2024
Merged
Show file tree
Hide file tree
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
67 changes: 67 additions & 0 deletions src/lib/validate-input.js
Original file line number Diff line number Diff line change
Expand Up @@ -133,6 +133,73 @@ export function validateGemmParams(a, b) {
}
}

/**
 * Validate the parameters of an lstmCell operation.
 * @param {Tensor} input - 2-D input tensor of shape [batchSize, inputSize].
 * @param {Tensor} weight - 2-D tensor of shape [4 * hiddenSize, inputSize].
 * @param {Tensor} recurrentWeight - 2-D tensor of shape [4 * hiddenSize, hiddenSize].
 * @param {Tensor} hiddenState - 2-D tensor of shape [batchSize, hiddenSize].
 * @param {Tensor} cellState - 2-D tensor of shape [batchSize, hiddenSize].
 * @param {Number} hiddenSize - A positive integer, the number of hidden units.
 * @param {Object} [options] - Optional bias, recurrentBias, peepholeWeight
 *     and layout ('iofg' or 'ifgo').
 * @throws {Error} If any parameter is inconsistent with the expected shapes.
 */
export function validateLstmCellParams(input, weight, recurrentWeight,
    hiddenState, cellState, hiddenSize,
    {bias, recurrentBias, peepholeWeight, layout = 'iofg'} = {}) {
  if (!Number.isInteger(hiddenSize) || hiddenSize <= 0) {
    throw new Error(`The hiddenSize ${hiddenSize} is invalid.`);
  }
  if (input.rank !== 2) {
    throw new Error(`The input (rank ${input.rank}) is not a 2-D tensor.`);
  }
  const batchSize = input.shape[0];
  const inputSize = input.shape[1];
  if (weight.rank !== 2) {
    throw new Error(`The weight (rank ${weight.rank}) is not a 2-D tensor.`);
  }
  if (weight.shape[0] !== 4 * hiddenSize || weight.shape[1] !== inputSize) {
    throw new Error(`The shape of weight [${weight.shape[0]}, ${weight.shape[1]}] is invalid.`);
  }
  if (recurrentWeight.rank !== 2) {
    throw new Error(`The recurrentWeight (rank ${recurrentWeight.rank}) is not a 2-D tensor.`);
  }
  if (recurrentWeight.shape[0] !== 4 * hiddenSize || recurrentWeight.shape[1] !== hiddenSize) {
    throw new Error(`The shape of recurrentWeight ` +
        `[${recurrentWeight.shape[0]}, ${recurrentWeight.shape[1]}] is invalid.`);
  }
  if (hiddenState.rank !== 2) {
    throw new Error(`The hiddenState (rank ${hiddenState.rank}) is not a 2-D tensor.`);
  }
  if (hiddenState.shape[0] !== batchSize || hiddenState.shape[1] !== hiddenSize) {
    // Concatenate the two fragments so the message stays on a single line
    // (a multi-line template literal would embed a newline and indentation).
    throw new Error(`The shape of hiddenState ` +
        `[${hiddenState.shape[0]}, ${hiddenState.shape[1]}] is invalid.`);
  }
  if (cellState.rank !== 2) {
    throw new Error(`The cellState (rank ${cellState.rank}) is not a 2-D tensor.`);
  }
  if (cellState.shape[0] !== batchSize || cellState.shape[1] !== hiddenSize) {
    throw new Error(`The shape of cellState ` +
        `[${cellState.shape[0]}, ${cellState.shape[1]}] is invalid.`);
  }
  if (bias) {
    if (bias.rank !== 1) {
      throw new Error(`The bias (rank ${bias.rank}) is not a 1-D tensor.`);
    }
    if (bias.shape[0] !== 4 * hiddenSize) {
      throw new Error(`The shape of bias [${bias.shape[0]}] is invalid.`);
    }
  }
  if (recurrentBias) {
    // Report recurrentBias's own rank (previously interpolated bias.rank,
    // which was wrong and threw a TypeError when bias was undefined).
    if (recurrentBias.rank !== 1) {
      throw new Error(`The recurrentBias (rank ${recurrentBias.rank}) is not a 1-D tensor.`);
    }
    if (recurrentBias.shape[0] !== 4 * hiddenSize) {
      throw new Error(`The shape of recurrentBias [${recurrentBias.shape[0]}] is invalid.`);
    }
  }
  if (peepholeWeight) {
    // Same copy-paste fix as above: use peepholeWeight.rank, not bias.rank.
    if (peepholeWeight.rank !== 1) {
      throw new Error(`The peepholeWeight (rank ${peepholeWeight.rank}) is not a 1-D tensor.`);
    }
    // Peephole weights cover only the i, f and o gates, hence 3 * hiddenSize.
    if (peepholeWeight.shape[0] !== 3 * hiddenSize) {
      throw new Error(`The shape of peepholeWeight [${peepholeWeight.shape[0]}] is invalid.`);
    }
  }
  if (layout !== 'iofg' && layout !== 'ifgo') {
    throw new Error(`The layout ${layout} is invalid.`);
  }
}

export function validateGruCellParams(input, weight, recurrentWeight, hiddenState, hiddenSize,
{bias, recurrentBias, layout = 'zrn'} = {}) {
if (!Number.isInteger(hiddenSize) || hiddenSize <= 0) {
Expand Down
143 changes: 143 additions & 0 deletions src/lstm_cell.js
Original file line number Diff line number Diff line change
@@ -0,0 +1,143 @@
'use strict';

import {add, mul} from './binary.js';
import {matmul} from './matmul.js';
import {Scalar} from './lib/tensor.js';
import {sigmoid} from './sigmoid.js';
import {slice} from './slice.js';
import {tanh} from './tanh.js';
import {transpose} from './transpose.js';
import {validateLstmCellParams} from './lib/validate-input.js';

/**
 * Computes a single time step of a Long Short-Term Memory (LSTM) cell.
 * @param {Tensor} input - 2-D tensor of shape [batchSize, inputSize].
 * @param {Tensor} weight - 2-D tensor of shape [4 * hiddenSize, inputSize].
 * @param {Tensor} recurrentWeight - 2-D tensor of shape [4 * hiddenSize, hiddenSize].
 * @param {Tensor} hiddenState - 2-D tensor of shape [batchSize, hiddenSize].
 * @param {Tensor} cellState - 2-D tensor of shape [batchSize, hiddenSize].
 * @param {Number} hiddenSize - The number of hidden units.
 * @param {MLLstmCellOptions} [options] - Optional bias, recurrentBias,
 *     peepholeWeight, gate layout ('iofg' or 'ifgo') and the three gate
 *     activation functions.
 * @return {Array.<Tensor>} [newHiddenState, newCellState].
 */
export function lstmCell(input, weight, recurrentWeight, hiddenState, cellState, hiddenSize,
    {bias, recurrentBias, peepholeWeight,
      layout = 'iofg', activations = [sigmoid, tanh, tanh]} = {}) {
  // Pass the validated arguments explicitly instead of `...arguments` so the
  // call stays correct if either signature evolves.
  validateLstmCellParams(input, weight, recurrentWeight, hiddenState, cellState, hiddenSize,
      {bias, recurrentBias, peepholeWeight, layout});
  const zero = new Scalar(0);
  const inputSize = input.shape[1];
  // Row offset of each gate's slice inside the packed weight/bias tensors.
  const starts = layout === 'iofg' ?
      {i: 0, o: hiddenSize, f: 2 * hiddenSize, g: 3 * hiddenSize} :
      {i: 0, f: hiddenSize, g: 2 * hiddenSize, o: 3 * hiddenSize};
  const [activation0, activation1, activation2] = activations;

  // Shared pre-activation of a gate starting at row `start`:
  // bias + recurrentBias + input x W^T + hiddenState x R^T.
  const gatePreActivation = (start) => add(
      add(
          (bias ? slice(bias, [start], [hiddenSize]) : zero),
          (recurrentBias ? slice(recurrentBias, [start], [hiddenSize]) : zero),
      ),
      add(
          matmul(
              input,
              transpose(slice(weight, [start, 0], [hiddenSize, inputSize])),
          ),
          matmul(
              hiddenState,
              transpose(slice(recurrentWeight, [start, 0], [hiddenSize, hiddenSize])),
          ),
      ),
  );
  // Adds the peephole contribution cellState * p to a gate's pre-activation
  // (the i, f and o gates only; g has no peephole connection).
  const withPeephole = (start, preActivation) => add(
      mul(
          cellState,
          (peepholeWeight ? slice(peepholeWeight, [start], [hiddenSize]) : zero),
      ),
      preActivation,
  );

  // input gate (i)
  const i = activation0(withPeephole(starts.i, gatePreActivation(starts.i)));
  // forget gate (f)
  const f = activation0(withPeephole(starts.f, gatePreActivation(starts.f)));
  // cell gate (g)
  const g = activation1(gatePreActivation(starts.g));
  // output gate (o)
  const o = activation0(withPeephole(starts.o, gatePreActivation(starts.o)));

  // New cell state: forget part of the old state, add the gated candidate.
  const cellStateNew = add(mul(f, cellState), mul(i, g));

  // New hidden state: output gate applied to the activated new cell state.
  const hiddenStateNew = mul(o, activation2(cellStateNew));

  return [hiddenStateNew, cellStateNew];
}
57 changes: 57 additions & 0 deletions test/lstm_cell_test.js
Original file line number Diff line number Diff line change
@@ -0,0 +1,57 @@
'use strict';

import {lstmCell} from '../src/lstm_cell.js';
import {relu} from '../src/relu.js';
import {Tensor} from '../src/lib/tensor.js';
import * as utils from './utils.js';

describe('test lstmCell', function() {
  // Use it() rather than it.only(): .only would silently skip every other
  // test in the whole suite.
  it('lstmCell activations=[relu, relu, relu]', function() {
    const batchSize = 2;
    const inputSize = 2;
    const hiddenSize = 2;
    const input = new Tensor([batchSize, inputSize], [1, 2, 2, 1]);
    const weight = new Tensor([4 * hiddenSize, inputSize],
        new Float32Array([
          1, -1, 2, -2, 1, -1, 2, -2,
          1, -1, 2, -2, 1, -1, 2, -2,
        ]));
    const recurrentWeight = new Tensor([4 * hiddenSize, hiddenSize],
        new Float32Array(4 * hiddenSize * hiddenSize).fill(0.1));
    // Both states start at zero.
    const hiddenState = new Tensor([batchSize, hiddenSize],
        new Float32Array(batchSize * hiddenSize).fill(0));
    const cellState = new Tensor([batchSize, hiddenSize],
        new Float32Array(batchSize * hiddenSize).fill(0));
    const bias = new Tensor([4 * hiddenSize],
        new Float32Array([1, 2, 1, 2, 1, 2, 1, 2]));
    const recurrentBias = new Tensor([4 * hiddenSize],
        new Float32Array([1, 2, 1, 2, 1, 2, 1, 2]));
    // Zero peephole weights: peephole terms contribute nothing.
    const peepholeWeight = new Tensor([3 * hiddenSize],
        new Float32Array(3 * hiddenSize).fill(0));
    const activations = [relu, relu, relu];
    const outputs = lstmCell(
        input, weight, recurrentWeight, hiddenState, cellState, hiddenSize,
        {bias, recurrentBias, peepholeWeight, activations});
    // outputs = [newHiddenState, newCellState], each [batchSize, hiddenSize].
    utils.checkShape(outputs[0], [batchSize, hiddenSize]);
    utils.checkShape(outputs[1], [batchSize, hiddenSize]);
    const expected = [
      [1, 8, 27, 216],
      [1, 4, 9, 36],
    ];
    for (let i = 0; i < expected.length; ++i) {
      utils.checkValue(outputs[i], expected[i]);
    }
  });
});
Loading