src/recurrent/lstm.test.ts

import { LSTM } from './lstm';
import { IMatrixJSON, Matrix } from './matrix';
import { RNN } from './rnn';
import { DataFormatter } from '../utilities/data-formatter';

describe('LSTM', () => {
  describe('.getHiddenLayer()', () => {
    test('overrides RNN', () => {
      expect(typeof LSTM.prototype.getHiddenLayer).toEqual('function');
      expect(LSTM.prototype.getHiddenLayer).not.toEqual(
        RNN.prototype.getHiddenLayer
      );
    });
  });
  describe('getEquation', () => {
    test('overrides RNN', () => {
      expect(typeof LSTM.prototype.getEquation).toEqual('function');
      expect(LSTM.prototype.getEquation).not.toEqual(RNN.prototype.getEquation);
    });
  });

  describe('math', () => {
    it('can predict math', () => {
      const net = new LSTM();
      const items = new Set<string>([]);
      for (let i = 0; i < 10; i++) {
        for (let j = 0; j < 10; j++) {
          items.add(`${i}+${j}=${i + j}`);
          items.add(`${j}+${i}=${i + j}`);
        }
      }
      net.train(Array.from(items), { iterations: 60, errorThresh: 0.03 });
      for (let i = 0; i < 10; i++) {
        const output = net.run(`${i}+`);
        expect(/^[0-9]+[=][0-9]+$/.test(output)).toBe(true);
      }
    });
  });

  describe('json', () => {
    describe('.toJSON', () => {
      it('can export model as json', () => {
        const net = new LSTM({
          inputSize: 6,
          inputRange: 12,
          outputSize: 6,
        });
        const json = net.toJSON();

        function compare(left: IMatrixJSON, right: Matrix) {
          left.weights.forEach((value, i) => {
            expect(value).toBe(right.weights[i]);
          });
          expect(left.rows).toBe(right.rows);
          expect(left.columns).toBe(right.columns);
        }

        compare(json.input, net.model.input);
        net.model.hiddenLayers.forEach((layer, i) => {
          for (const p in layer) {
            compare(json.hiddenLayers[i][p], layer[p]);
          }
        });
        compare(json.output, net.model.output);
        compare(json.outputConnector, net.model.outputConnector);
      });
    });

    describe('.fromJSON', () => {
      it('can import model from json', () => {
        const dataFormatter = new DataFormatter('abcdef'.split(''));
        const json = new LSTM({
          inputSize: 6, // <- length
          inputRange: dataFormatter.characters.length,
          outputSize: dataFormatter.characters.length, // <- length
        }).toJSON();

        const clone = new LSTM();
        clone.fromJSON(JSON.parse(JSON.stringify(json)));

        expect(json).toEqual(clone.toJSON());
        expect(clone.options.inputSize).toBe(6);
        expect(clone.options.inputRange).toBe(dataFormatter.characters.length);
        expect(clone.options.outputSize).toBe(dataFormatter.characters.length);
      });

      it('can train imported model from json', () => {
        const dataFormatter = new DataFormatter('abcdef'.split(''));
        const json = new LSTM({
          inputSize: 6, // <- length
          inputRange: dataFormatter.characters.length,
          outputSize: dataFormatter.characters.length, // <- length
        }).toJSON();

        const clone = new LSTM();
        clone.fromJSON(JSON.parse(JSON.stringify(json)));
        clone.trainPattern([0, 1, 2, 3, 4, 5]);

        expect(json).not.toEqual(clone.toJSON());
        expect(clone.options.inputSize).toBe(6);
        expect(clone.options.inputRange).toBe(dataFormatter.characters.length);
        expect(clone.options.outputSize).toBe(dataFormatter.characters.length);
      });
    });
  });

  describe('.toFunction', () => {
    it('can output same as run method', () => {
      const dataFormatter = new DataFormatter(['h', 'i', ' ', 'm', 'o', '!']);
      const net = new LSTM({
        inputSize: 1,
        inputRange: dataFormatter.characters.length,
        outputSize: 1,
        dataFormatter,
      });
      net.initialize();
      for (let i = 0; i < 100; i++) {
        net.trainPattern(dataFormatter.toIndexes('hi mom!'));
      }

      const lastOutput = net.run();
      expect(lastOutput).toBe('hi mom!');
    });
    it('can include the DataFormatter', () => {
      const net = new LSTM();
      net.train(['hi mom!'], { iterations: 100 });
      const expected = net.run('hi ');
      const newNet = net.toFunction();
      const output = newNet('hi ');
      expect(output).toBe(expected);
    });
  });

  describe('.run', () => {
    jest.retryTimes(5);
    it('can predict greetings in 200 trainings', () => {
      const net = new LSTM();
      const trainingData = [
        {
          input: 'hi',
          output: 'mom',
        },
        {
          input: 'howdy',
          output: 'dad',
        },
        {
          input: 'hello',
          output: 'sis',
        },
        {
          input: 'yo',
          output: 'bro',
        },
      ];
      net.train(trainingData, { iterations: 200 });
      expect(net.run('hi')).toBe('mom');
      expect(net.run('howdy')).toBe('dad');
      expect(net.run('hello')).toBe('sis');
      expect(net.run('yo')).toBe('bro');
    });
    it('can predict a string from index in 200 trainings', () => {
      const net = new LSTM();
      const transactionTypes = {
        credit: '0',
        debit: '1',
        personalCard: '2',
        other: '3',
      };
      const trainingData = [
        {
          input: transactionTypes.credit,
          output: 'credit',
        },
        {
          input: transactionTypes.debit,
          output: 'debit',
        },
        {
          input: transactionTypes.personalCard,
          output: 'personal card',
        },
        {
          input: transactionTypes.other,
          output: 'other',
        },
      ];
      net.train(trainingData, { iterations: 200 });
      expect(net.run([transactionTypes.credit])).toBe('credit');
      expect(net.run([transactionTypes.debit])).toBe('debit');
      expect(net.run([transactionTypes.personalCard])).toBe('personal card');
      expect(net.run([transactionTypes.other])).toBe('other');
    });
  });

  describe('cloned LSTM net training', () => {
    it('continues evolving from the point where the original stopped', () => {
      const net = new LSTM({ hiddenLayers: [60, 60] });
      net.maxPredictionLength = 100;

      const trainData = [
        'doe, a deer, a female deer',
        'ray, a drop of golden sun',
        'me, a name I call myself',
      ];

      // First train
      net.train(trainData, {
        iterations: 5000,
        log: true,
        logPeriod: 500,
        learningRate: 0.2,
      });

      // Clone the net:
      const net2 = new LSTM({ hiddenLayers: [60, 60] });
      net2.fromJSON(net.toJSON());

      // Both output the same text:
      expect(net.run('ray')).toBe(net2.run('ray'));

      // More training, start from the last error rate:
      net.train(trainData, {
        iterations: 30,
        log: true,
        logPeriod: 10,
        learningRate: 0.2,
      });

      // More training to the clone:
      net2.train(trainData, {
        iterations: 30,
        log: true,
        logPeriod: 10,
        learningRate: 0.2,
      });

      // The first reduced the quality, but the second is crazy:
      expect(net.run('ray')).not.toBe(net2.run('ray'));
    });
  });
});