/*******************************************************************************
 * Copyright (c) 2015-2018 Skymind, Inc.
 *
 * This program and the accompanying materials are made available under the
 * terms of the Apache License, Version 2.0 which is available at
 * https://www.apache.org/licenses/LICENSE-2.0.
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
 * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
 * License for the specific language governing permissions and limitations
 * under the License.
 *
 * SPDX-License-Identifier: Apache-2.0
 ******************************************************************************/

package org.deeplearning4j.lstm;

import org.deeplearning4j.BaseDL4JTest;
import org.deeplearning4j.TestUtils;
import org.deeplearning4j.nn.api.Layer;
import org.deeplearning4j.nn.conf.*;
import org.deeplearning4j.nn.conf.distribution.NormalDistribution;
import org.deeplearning4j.nn.conf.layers.LSTM;
import org.deeplearning4j.nn.conf.layers.RnnOutputLayer;
import org.deeplearning4j.nn.gradient.Gradient;
import org.deeplearning4j.nn.layers.recurrent.CudnnLSTMHelper;
import org.deeplearning4j.nn.multilayer.MultiLayerNetwork;
import org.junit.Test;
import org.nd4j.linalg.activations.Activation;
import org.nd4j.linalg.api.buffer.DataType;
import org.nd4j.linalg.api.ndarray.INDArray;
import org.nd4j.linalg.dataset.DataSet;
import org.nd4j.linalg.factory.Nd4j;
import org.nd4j.linalg.learning.config.NoOp;
import org.nd4j.linalg.lossfunctions.LossFunctions;

import java.lang.reflect.Field;
import java.util.Map;
import java.util.Random;

import static org.junit.Assert.*;

/**
 * Validates that the cuDNN-backed LSTM implementation ({@link CudnnLSTMHelper}) produces the same
 * outputs, scores, gradients, and parameter updates as the built-in Java LSTM implementation.
 *
 * Created by Alex on 18/07/2017.
 */
public class ValidateCudnnLSTM extends BaseDL4JTest {

    @Test
    public void validateImplSimple() throws Exception {

        Nd4j.getRandom().setSeed(12345);
        int minibatch = 10;
        int inputSize = 3;
        int lstmLayerSize = 4;
        int timeSeriesLength = 3;
        int nOut = 2;
        INDArray input = Nd4j.rand(new int[] {minibatch, inputSize, timeSeriesLength});
        INDArray labels = Nd4j.zeros(minibatch, nOut, timeSeriesLength);
        Random r = new Random(12345);
        for (int i = 0; i < minibatch; i++) {
            for (int j = 0; j < timeSeriesLength; j++) {
                labels.putScalar(i, r.nextInt(nOut), j, 1.0);
            }
        }

        MultiLayerConfiguration conf = new NeuralNetConfiguration.Builder().inferenceWorkspaceMode(WorkspaceMode.NONE)
                .trainingWorkspaceMode(WorkspaceMode.NONE).updater(new NoOp())
                .seed(12345L)
                .dist(new NormalDistribution(0, 2)).list()
                .layer(0, new LSTM.Builder().nIn(input.size(1)).nOut(lstmLayerSize)
                        .gateActivationFunction(Activation.SIGMOID).activation(Activation.TANH).build())
                .layer(1, new RnnOutputLayer.Builder(LossFunctions.LossFunction.MCXENT)
                        .activation(Activation.SOFTMAX).nIn(lstmLayerSize).nOut(nOut).build())
                .build();

        MultiLayerNetwork mln1 = new MultiLayerNetwork(conf.clone());
        mln1.init();

        MultiLayerNetwork mln2 = new MultiLayerNetwork(conf.clone());
        mln2.init();

        assertEquals(mln1.params(), mln2.params());
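
        //Remove the cuDNN helper from mln1 via reflection: mln1 then uses the built-in Java LSTM
        // implementation, while mln2 keeps its CudnnLSTMHelper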
        Field f = org.deeplearning4j.nn.layers.recurrent.LSTM.class.getDeclaredField("helper");
        f.setAccessible(true);

        Layer l0 = mln1.getLayer(0);
        f.set(l0, null);
        assertNull(f.get(l0));

        l0 = mln2.getLayer(0);
        assertTrue(f.get(l0) instanceof CudnnLSTMHelper);
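
        //Forward pass: both implementations should produce identical output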
        INDArray out1 = mln1.output(input);
        INDArray out2 = mln2.output(input);

        assertEquals(out1, out2);
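
        //Backward pass: scores and gradients should also match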
        mln1.setInput(input);
        mln1.setLabels(labels);

        mln2.setInput(input);
        mln2.setLabels(labels);

        mln1.computeGradientAndScore();
        mln2.computeGradientAndScore();

        assertEquals(mln1.score(), mln2.score(), 1e-8);

        Gradient g1 = mln1.gradient();
        Gradient g2 = mln2.gradient();

        //Check gradients parameter by parameter first, so a failure identifies the offending parameter
        for (Map.Entry<String, INDArray> entry : g1.gradientForVariable().entrySet()) {
            INDArray exp = entry.getValue();
            INDArray act = g2.gradientForVariable().get(entry.getKey());
            assertEquals(entry.getKey(), exp, act);
        }

        assertEquals(mln1.getFlattenedGradients(), mln2.getFlattenedGradients());
    }

    @Test
    public void validateImplMultiLayer() throws Exception {

        Nd4j.getRandom().setSeed(12345);
        int minibatch = 10;
        int inputSize = 3;
        int lstmLayerSize = 4;
        int timeSeriesLength = 3;
        int nOut = 2;
        INDArray input = Nd4j.rand(new int[] {minibatch, inputSize, timeSeriesLength});
        INDArray labels = Nd4j.zeros(minibatch, nOut, timeSeriesLength);
        Random r = new Random(12345);
        for (int i = 0; i < minibatch; i++) {
            for (int j = 0; j < timeSeriesLength; j++) {
                labels.putScalar(i, r.nextInt(nOut), j, 1.0);
            }
        }

        MultiLayerConfiguration conf = new NeuralNetConfiguration.Builder().updater(new NoOp())
                .dataType(DataType.DOUBLE)
                .inferenceWorkspaceMode(WorkspaceMode.NONE).trainingWorkspaceMode(WorkspaceMode.NONE)
                .seed(12345L)
                .dist(new NormalDistribution(0, 2)).list()
                .layer(0, new LSTM.Builder().nIn(input.size(1)).nOut(lstmLayerSize)
                        .gateActivationFunction(Activation.SIGMOID).activation(Activation.TANH).build())
                .layer(1, new LSTM.Builder().nIn(lstmLayerSize).nOut(lstmLayerSize)
                        .gateActivationFunction(Activation.SIGMOID).activation(Activation.TANH).build())
                .layer(2, new RnnOutputLayer.Builder(LossFunctions.LossFunction.MCXENT)
                        .activation(Activation.SOFTMAX).nIn(lstmLayerSize).nOut(nOut).build())
                .build();

        MultiLayerNetwork mln1 = new MultiLayerNetwork(conf.clone());
        mln1.init();

        MultiLayerNetwork mln2 = new MultiLayerNetwork(conf.clone());
        mln2.init();

        assertEquals(mln1.params(), mln2.params());
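
        //Remove the cuDNN helper from both LSTM layers of mln1; mln2 keeps its helpers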
        Field f = org.deeplearning4j.nn.layers.recurrent.LSTM.class.getDeclaredField("helper");
        f.setAccessible(true);

        Layer l0 = mln1.getLayer(0);
        Layer l1 = mln1.getLayer(1);
        f.set(l0, null);
        f.set(l1, null);
        assertNull(f.get(l0));
        assertNull(f.get(l1));

        l0 = mln2.getLayer(0);
        l1 = mln2.getLayer(1);
        assertTrue(f.get(l0) instanceof CudnnLSTMHelper);
        assertTrue(f.get(l1) instanceof CudnnLSTMHelper);
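
        //Forward pass should match between the two implementations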
        INDArray out1 = mln1.output(input);
        INDArray out2 = mln2.output(input);

        assertEquals(out1, out2);
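
        //Train both networks on identical data for several iterations: scores, gradients and
        // parameters should remain in sync throughout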
        for (int x = 0; x < 10; x++) {
            input = Nd4j.rand(new int[] {minibatch, inputSize, timeSeriesLength});
            labels = Nd4j.zeros(minibatch, nOut, timeSeriesLength);
            for (int i = 0; i < minibatch; i++) {
                for (int j = 0; j < timeSeriesLength; j++) {
                    labels.putScalar(i, r.nextInt(nOut), j, 1.0);
                }
            }

            mln1.setInput(input);
            mln1.setLabels(labels);

            mln2.setInput(input);
            mln2.setLabels(labels);

            mln1.computeGradientAndScore();
            mln2.computeGradientAndScore();

            assertEquals(mln1.score(), mln2.score(), 1e-5);
            assertEquals(mln1.getFlattenedGradients(), mln2.getFlattenedGradients());

            mln1.fit(new DataSet(input, labels));
            mln2.fit(new DataSet(input, labels));

            assertEquals("Iteration: " + x, mln1.params(), mln2.params());
        }
    }

    @Test
    public void validateImplMultiLayerTBPTT() throws Exception {

        Nd4j.getRandom().setSeed(12345);
        int minibatch = 10;
        int inputSize = 3;
        int lstmLayerSize = 4;
        int timeSeriesLength = 23;
        int tbpttLength = 5;
        int nOut = 2;

        MultiLayerConfiguration conf = new NeuralNetConfiguration.Builder().updater(new NoOp())
                .inferenceWorkspaceMode(WorkspaceMode.NONE).trainingWorkspaceMode(WorkspaceMode.NONE)
                .seed(12345L)
                .dist(new NormalDistribution(0, 2)).list()
                .layer(0, new LSTM.Builder().nIn(inputSize).nOut(lstmLayerSize)
                        .gateActivationFunction(Activation.SIGMOID).activation(Activation.TANH).build())
                .layer(1, new LSTM.Builder().nIn(lstmLayerSize).nOut(lstmLayerSize)
                        .gateActivationFunction(Activation.SIGMOID).activation(Activation.TANH).build())
                .layer(2, new RnnOutputLayer.Builder(LossFunctions.LossFunction.MCXENT)
                        .activation(Activation.SOFTMAX).nIn(lstmLayerSize).nOut(nOut).build())
                .backpropType(BackpropType.TruncatedBPTT)
                .tBPTTLength(tbpttLength).build();

        MultiLayerNetwork mln1 = new MultiLayerNetwork(conf.clone());
        mln1.init();

        MultiLayerNetwork mln2 = new MultiLayerNetwork(conf.clone());
        mln2.init();

        assertEquals(mln1.params(), mln2.params());
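
        //Remove the cuDNN helper from both LSTM layers of mln1; mln2 keeps its helpers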
        Field f = org.deeplearning4j.nn.layers.recurrent.LSTM.class.getDeclaredField("helper");
        f.setAccessible(true);

        Layer l0 = mln1.getLayer(0);
        Layer l1 = mln1.getLayer(1);
        f.set(l0, null);
        f.set(l1, null);
        assertNull(f.get(l0));
        assertNull(f.get(l1));

        l0 = mln2.getLayer(0);
        l1 = mln2.getLayer(1);
        assertTrue(f.get(l0) instanceof CudnnLSTMHelper);
        assertTrue(f.get(l1) instanceof CudnnLSTMHelper);
        Random r = new Random(12345);
        for (int x = 0; x < 1; x++) {
            INDArray input = Nd4j.rand(new int[] {minibatch, inputSize, timeSeriesLength});
            INDArray labels = Nd4j.zeros(minibatch, nOut, timeSeriesLength);
            for (int i = 0; i < minibatch; i++) {
                for (int j = 0; j < timeSeriesLength; j++) {
                    labels.putScalar(i, r.nextInt(nOut), j, 1.0);
                }
            }

            DataSet ds = new DataSet(input, labels);
            mln1.fit(ds);
            mln2.fit(ds);
        }

        assertEquals(mln1.params(), mln2.params());
    }

    @Test
    public void validateImplMultiLayerRnnTimeStep() throws Exception {

        for (WorkspaceMode wsm : new WorkspaceMode[]{WorkspaceMode.NONE, WorkspaceMode.ENABLED}) {
            Nd4j.getRandom().setSeed(12345);
            int minibatch = 10;
            int inputSize = 3;
            int lstmLayerSize = 4;
            int timeSeriesLength = 3;
            int tbpttLength = 5;
            int nOut = 2;

            MultiLayerConfiguration conf = new NeuralNetConfiguration.Builder().updater(new NoOp())
                    .inferenceWorkspaceMode(wsm).trainingWorkspaceMode(wsm)
                    .cacheMode(CacheMode.NONE).seed(12345L)
                    .dist(new NormalDistribution(0, 2)).list()
                    .layer(0, new LSTM.Builder().nIn(inputSize).nOut(lstmLayerSize)
                            .gateActivationFunction(Activation.SIGMOID).activation(Activation.TANH).build())
                    .layer(1, new LSTM.Builder().nIn(lstmLayerSize).nOut(lstmLayerSize)
                            .gateActivationFunction(Activation.SIGMOID).activation(Activation.TANH).build())
                    .layer(2, new RnnOutputLayer.Builder(LossFunctions.LossFunction.MCXENT)
                            .activation(Activation.SOFTMAX).nIn(lstmLayerSize).nOut(nOut).build())
                    .backpropType(BackpropType.TruncatedBPTT)
                    .tBPTTLength(tbpttLength).build();

            MultiLayerNetwork mln1 = new MultiLayerNetwork(conf.clone());
            mln1.init();

            MultiLayerNetwork mln2 = new MultiLayerNetwork(conf.clone());
            mln2.init();

            assertEquals(mln1.params(), mln2.params());
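
            //Remove the cuDNN helper from both LSTM layers of mln1; mln2 keeps its helpers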
            Field f = org.deeplearning4j.nn.layers.recurrent.LSTM.class.getDeclaredField("helper");
            f.setAccessible(true);

            Layer l0 = mln1.getLayer(0);
            Layer l1 = mln1.getLayer(1);
            f.set(l0, null);
            f.set(l1, null);
            assertNull(f.get(l0));
            assertNull(f.get(l1));

            l0 = mln2.getLayer(0);
            l1 = mln2.getLayer(1);
            assertTrue(f.get(l0) instanceof CudnnLSTMHelper);
            assertTrue(f.get(l1) instanceof CudnnLSTMHelper);
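
            //rnnTimeStep() keeps internal state between calls; outputs should match at every step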
            for (int x = 0; x < 5; x++) {
                INDArray input = Nd4j.rand(new int[]{minibatch, inputSize, timeSeriesLength});

                INDArray step1 = mln1.rnnTimeStep(input);
                INDArray step2 = mln2.rnnTimeStep(input);

                assertEquals("Step: " + x, step1, step2);
            }

            assertEquals(mln1.params(), mln2.params());

            //Also check fit (mainly as a workspaces sanity check):
            INDArray in = Nd4j.rand(new int[]{minibatch, inputSize, 3 * tbpttLength});
            INDArray label = TestUtils.randomOneHotTimeSeries(minibatch, nOut, 3 * tbpttLength);
            for (int i = 0; i < 3; i++) {
                mln1.fit(in, label);
                mln2.fit(in, label);
            }
        }
    }
}