Skip to content

Commit 1a3070c

Browse files
committed
#1. Fix Forward-LSTM crash bug
#2. Improve encoding performance by using SIMD instructions
1 parent e390b85 commit 1a3070c

11 files changed

+262
-198
lines changed

RNNSharp/BiRNN.cs

+22-17
Original file line numberDiff line numberDiff line change
@@ -3,6 +3,7 @@
33
using System.Threading.Tasks;
44
using AdvUtils;
55
using System.Collections.Generic;
6+
using System.Numerics;
67

78
/// <summary>
89
/// RNNSharp written by Zhongkai Fu ([email protected])
@@ -13,6 +14,7 @@ class BiRNN : RNN
1314
{
1415
private RNN forwardRNN;
1516
private RNN backwardRNN;
17+
private Vector<float> vecConst2 = new Vector<float>(2.0f);
1618

1719
public BiRNN(RNN s_forwardRNN, RNN s_backwardRNN)
1820
{
@@ -129,7 +131,7 @@ public override float LearningRate
129131
}
130132
}
131133

132-
public override double GradientCutoff
134+
public override float GradientCutoff
133135
{
134136
get
135137
{
@@ -209,7 +211,7 @@ public override void InitMem()
209211
backwardRNN.InitMem();
210212

211213
//Create and initialise the weights from hidden to output layer, these are just normal weights
212-
Hidden2OutputWeight = new Matrix<double>(L2, L1);
214+
Hidden2OutputWeight = new Matrix<float>(L2, L1);
213215

214216
for (int i = 0; i < Hidden2OutputWeight.Height; i++)
215217
{
@@ -222,7 +224,7 @@ public override void InitMem()
222224
Hidden2OutputWeightLearningRate = new Matrix<float>(L2, L1);
223225
}
224226

225-
public SimpleLayer[] InnerDecode(Sequence pSequence, out SimpleLayer[] outputHiddenLayer, out Matrix<double> rawOutputLayer)
227+
public SimpleLayer[] InnerDecode(Sequence pSequence, out SimpleLayer[] outputHiddenLayer, out Matrix<float> rawOutputLayer)
226228
{
227229
int numStates = pSequence.States.Length;
228230
SimpleLayer[] mForward = null;
@@ -266,14 +268,18 @@ public SimpleLayer[] InnerDecode(Sequence pSequence, out SimpleLayer[] outputHid
266268
SimpleLayer forwardCells = mForward[curState];
267269
SimpleLayer backwardCells = mBackward[curState];
268270

269-
for (int i = 0; i < forwardRNN.L1; i++)
271+
for (int i = 0; i < forwardRNN.L1; i+=Vector<float>.Count)
270272
{
271-
cells.cellOutput[i] = (forwardCells.cellOutput[i] + backwardCells.cellOutput[i]) / 2.0;
273+
Vector<float> v1 = new Vector<float>(forwardCells.cellOutput, i);
274+
Vector<float> v2 = new Vector<float>(backwardCells.cellOutput, i);
275+
Vector<float> v = (v1 + v2) / vecConst2;
276+
277+
v.CopyTo(cells.cellOutput, i);
272278
}
273279
});
274280

275281
//Calculate output layer
276-
Matrix<double> tmp_rawOutputLayer = new Matrix<double>(numStates, L2);
282+
Matrix<float> tmp_rawOutputLayer = new Matrix<float>(numStates, L2);
277283
SimpleLayer[] seqOutput = new SimpleLayer[numStates];
278284
Parallel.For(0, numStates, parallelOption, curState =>
279285
{
@@ -282,7 +288,7 @@ public SimpleLayer[] InnerDecode(Sequence pSequence, out SimpleLayer[] outputHid
282288

283289
matrixXvectorADD(outputCells, mergedHiddenLayer[curState], Hidden2OutputWeight, L2, L1, 0);
284290

285-
double[] tmp_vector = tmp_rawOutputLayer[curState];
291+
float[] tmp_vector = tmp_rawOutputLayer[curState];
286292
outputCells.cellOutput.CopyTo(tmp_vector, 0);
287293

288294
//Activation on output layer
@@ -301,7 +307,7 @@ public override int[] PredictSentenceCRF(Sequence pSequence, RunningMode running
301307
int numStates = pSequence.States.Length;
302308
//Predict output
303309
SimpleLayer[] mergedHiddenLayer = null;
304-
Matrix<double> rawOutputLayer = null;
310+
Matrix<float> rawOutputLayer = null;
305311
SimpleLayer[] seqOutput = InnerDecode(pSequence, out mergedHiddenLayer, out rawOutputLayer);
306312

307313
ForwardBackward(numStates, rawOutputLayer);
@@ -326,7 +332,7 @@ public override int[] PredictSentenceCRF(Sequence pSequence, RunningMode running
326332
{
327333
int label = pSequence.States[curState].Label;
328334
SimpleLayer layer = seqOutput[curState];
329-
double[] CRFOutputLayer = CRFSeqOutput[curState];
335+
float[] CRFOutputLayer = CRFSeqOutput[curState];
330336

331337
//For standard RNN
332338
for (int c = 0; c < L2; c++)
@@ -342,14 +348,14 @@ public override int[] PredictSentenceCRF(Sequence pSequence, RunningMode running
342348
return predict;
343349
}
344350

345-
public override Matrix<double> PredictSentence(Sequence pSequence, RunningMode runningMode)
351+
public override Matrix<float> PredictSentence(Sequence pSequence, RunningMode runningMode)
346352
{
347353
//Reset the network
348354
int numStates = pSequence.States.Length;
349355

350356
//Predict output
351357
SimpleLayer[] mergedHiddenLayer = null;
352-
Matrix<double> rawOutputLayer = null;
358+
Matrix<float> rawOutputLayer = null;
353359
SimpleLayer[] seqOutput = InnerDecode(pSequence, out mergedHiddenLayer, out rawOutputLayer);
354360

355361
if (runningMode != RunningMode.Test)
@@ -374,7 +380,7 @@ public override Matrix<double> PredictSentence(Sequence pSequence, RunningMode r
374380
{
375381
layer.er[c] = -layer.cellOutput[c];
376382
}
377-
layer.er[label] = 1.0 - layer.cellOutput[label];
383+
layer.er[label] = 1.0f - layer.cellOutput[label];
378384
}
379385

380386
LearnTwoRNN(pSequence, mergedHiddenLayer, seqOutput);
@@ -407,18 +413,17 @@ private void LearnTwoRNN(Sequence pSequence, SimpleLayer[] mergedHiddenLayer, Si
407413
for (int i = 0; i < Hidden2OutputWeight.Height; i++)
408414
{
409415
//update weights for hidden to output layer
410-
double er = outputCells.er[i];
411-
double[] vector_i = Hidden2OutputWeight[i];
416+
float er = outputCells.er[i];
417+
float[] vector_i = Hidden2OutputWeight[i];
412418
for (int k = 0; k < Hidden2OutputWeight.Width; k++)
413419
{
414420
double delta = NormalizeGradient(mergedHiddenCells.cellOutput[k] * er);
415421
double newLearningRate = UpdateLearningRate(Hidden2OutputWeightLearningRate, i, k, delta);
416422

417-
vector_i[k] += newLearningRate * delta;
423+
vector_i[k] += (float)(newLearningRate * delta);
418424
}
419425
}
420426
}
421-
422427
},
423428
()=>
424429
{
@@ -485,7 +490,7 @@ public override void computeHiddenLayer(State state, bool isTrain = true)
485490
throw new NotImplementedException("computeHiddenLayer is not implemented in BiRNN");
486491
}
487492

488-
public override void computeOutput(double[] doutput)
493+
public override void computeOutput(float[] doutput)
489494
{
490495
throw new NotImplementedException("computeOutput is not implemented in BiRNN");
491496
}

RNNSharp/LSTMRNN.cs

+33-58
Original file line numberDiff line numberDiff line change
@@ -30,10 +30,6 @@ public class LSTMCell : SimpleCell
3030
public double wCellForget;
3131
public double wCellOut;
3232

33-
public float dCellInLearningRate;
34-
public float dCellForgetLearningRate;
35-
public float dCellOutLearningRate;
36-
3733
//partial derivatives
3834
public double dSWCellIn;
3935
public double dSWCellForget;
@@ -52,22 +48,6 @@ public struct LSTMWeight
5248
public float wInputOutputGate;
5349
}
5450

55-
//public struct LSTMWeightLearningRate
56-
//{
57-
// public float dInputCellLearningRate;
58-
// public float dInputInputGateLearningRate;
59-
// public float dInputForgetGateLearningRate;
60-
// public float dInputOutputGateLearningRate;
61-
//}
62-
63-
//public struct LSTMWeightDerivative
64-
//{
65-
// //partial derivatives. don't need partial derivative for output gate as it uses BP not RTRL
66-
// public double dSInputCell;
67-
// public double dSInputInputGate;
68-
// public double dSInputForgetGate;
69-
//}
70-
7151
public class LSTMRNN : RNN
7252
{
7353
public LSTMCell[] neuHidden; //neurons in hidden layer
@@ -76,10 +56,15 @@ public class LSTMRNN : RNN
7656

7757
protected Vector4[][] Input2HiddenLearningRate;
7858
protected Vector4[][] Feature2HiddenLearningRate;
59+
protected Vector3[] CellLearningRate;
7960

8061
protected Vector3[][] input2hiddenDeri;
8162
protected Vector3[][] feature2hiddenDeri;
8263

64+
private Vector4 vecLearningRate;
65+
private Vector3 vecLearningRate3;
66+
67+
8368
public LSTMRNN()
8469
{
8570
ModelType = MODELTYPE.LSTM;
@@ -368,7 +353,7 @@ public override void SaveModel(string filename)
368353
//weight input->hidden
369354
Logger.WriteLine("Saving input2hidden weights...");
370355
saveLSTMWeight(input2hidden, fo);
371-
356+
372357
if (DenseFeatureSize > 0)
373358
{
374359
//weight fea->hidden
@@ -453,7 +438,7 @@ public override void initWeights()
453438
}
454439

455440
//Create and initialise the weights from hidden to output layer, these are just normal weights
456-
Hidden2OutputWeight = new Matrix<double>(L2, L1);
441+
Hidden2OutputWeight = new Matrix<float>(L2, L1);
457442

458443
for (int i = 0; i < Hidden2OutputWeight.Height; i++)
459444
{
@@ -499,12 +484,9 @@ public override void CleanStatus()
499484
Feature2HiddenLearningRate = new Vector4[L1][];
500485
}
501486

487+
CellLearningRate = new Vector3[L1];
502488
Parallel.For(0, L1, parallelOption, i =>
503489
{
504-
neuHidden[i].dCellForgetLearningRate = 0;
505-
neuHidden[i].dCellInLearningRate = 0;
506-
neuHidden[i].dCellOutLearningRate = 0;
507-
508490
Input2HiddenLearningRate[i] = new Vector4[L0];
509491

510492
if (DenseFeatureSize > 0)
@@ -515,6 +497,8 @@ public override void CleanStatus()
515497
});
516498

517499
Hidden2OutputWeightLearningRate = new Matrix<float>(L2, L1);
500+
vecLearningRate = new Vector4(LearningRate, LearningRate, LearningRate, LearningRate);
501+
vecLearningRate3 = new Vector3(LearningRate, LearningRate, LearningRate);
518502
}
519503

520504
public override void InitMem()
@@ -583,7 +567,7 @@ public override void ComputeHiddenLayerErr()
583567
//find the error by find the product of the output errors and their weight connection.
584568
SimpleCell cell = neuHidden[i];
585569

586-
cell.er = 0.0;
570+
cell.er = 0.0f;
587571

588572
if (cell.mask == false)
589573
{
@@ -600,30 +584,22 @@ public override void LearnOutputWeight()
600584
//update weights for hidden to output layer
601585
Parallel.For(0, L1, parallelOption, i =>
602586
{
603-
double cellOutput = neuHidden[i].cellOutput;
587+
float cellOutput = neuHidden[i].cellOutput;
604588
for (int k = 0; k < L2; k++)
605589
{
606-
double delta = NormalizeGradient(cellOutput * OutputLayer.er[k]);
607-
double newLearningRate = UpdateLearningRate(Hidden2OutputWeightLearningRate, i, k, delta);
590+
float delta = NormalizeGradient(cellOutput * OutputLayer.er[k]);
591+
double newLearningRate = UpdateLearningRate(Hidden2OutputWeightLearningRate, k, i, delta);
608592

609-
Hidden2OutputWeight[k][i] += newLearningRate * delta;
593+
Hidden2OutputWeight[k][i] += (float)(newLearningRate * delta);
610594
}
611595
});
612596
}
613597

614-
public double UpdateLearningRate(ref float mg, double delta)
615-
{
616-
double dg = mg + delta * delta;
617-
mg = (float)dg;
618-
return LearningRate / (1.0 + Math.Sqrt(dg));
619-
}
620-
621598
public override void LearnNet(State state, int numStates, int curState)
622599
{
623600
//Get sparse feature and apply it into hidden layer
624601
var sparse = state.SparseData;
625602
int sparseFeatureSize = sparse.Count;
626-
Vector4 vecLearningRate = new Vector4(LearningRate, LearningRate, LearningRate, LearningRate);
627603

628604
//put variables for derivatives in weight class and cell class
629605
Parallel.For(0, L1, parallelOption, i =>
@@ -650,8 +626,6 @@ public override void LearnNet(State state, int numStates, int curState)
650626
(float)Sigmoid2_ci_netCellState_mul_SigmoidDerivative_ci_netIn,
651627
(float)ci_previousCellState_mul_SigmoidDerivative_ci_netForget);
652628

653-
double delta = 0;
654-
double newLearningRate = 0;
655629
for (int k = 0; k < sparseFeatureSize; k++)
656630
{
657631
var entry = sparse.GetEntry(k);
@@ -673,9 +647,7 @@ public override void LearnNet(State state, int numStates, int curState)
673647
vecAlpha = wlr + vecAlpha;
674648
wlr_i[entry.Key] = vecAlpha;
675649

676-
vecAlpha = Vector4.SquareRoot(vecAlpha) + Vector4.One;
677-
vecAlpha = vecLearningRate / vecAlpha;
678-
650+
vecAlpha = vecLearningRate / (Vector4.SquareRoot(vecAlpha) + Vector4.One);
679651
vecDelta = vecAlpha * vecDelta;
680652

681653
w.wInputCell += vecDelta.X;
@@ -713,9 +685,7 @@ public override void LearnNet(State state, int numStates, int curState)
713685
vecAlpha = wlr + vecAlpha;
714686
wlr_i[j] = vecAlpha;
715687

716-
vecAlpha = Vector4.SquareRoot(vecAlpha) + Vector4.One;
717-
vecAlpha = vecLearningRate / vecAlpha;
718-
688+
vecAlpha = vecLearningRate / (Vector4.SquareRoot(vecAlpha) + Vector4.One);
719689
vecDelta = vecAlpha * vecDelta;
720690

721691
w.wInputCell += vecDelta.X;
@@ -736,17 +706,22 @@ public override void LearnNet(State state, int numStates, int curState)
736706

737707

738708
//update internal weights
739-
delta = cellStateError * c.dSWCellIn;
740-
newLearningRate = UpdateLearningRate(ref c.dCellInLearningRate, delta);
741-
c.wCellIn += newLearningRate * delta;
709+
Vector3 vecCellDelta = new Vector3((float)c.dSWCellIn, (float)c.dSWCellForget, (float)c.cellState);
710+
Vector3 vecCellErr = new Vector3(cellStateError, cellStateError, gradientOutputGate);
711+
Vector3 vecCellLearningRate = CellLearningRate[i];
712+
713+
vecCellDelta = vecCellErr * vecCellDelta;
714+
vecCellLearningRate += (vecCellDelta * vecCellDelta);
715+
CellLearningRate[i] = vecCellLearningRate;
716+
717+
//LearningRate / (1.0 + Math.Sqrt(dg));
718+
vecCellLearningRate = vecLearningRate3 / (Vector3.One + Vector3.SquareRoot(vecCellLearningRate));
719+
vecCellDelta = vecCellLearningRate * vecCellDelta;
742720

743-
delta = cellStateError * c.dSWCellForget;
744-
newLearningRate = UpdateLearningRate(ref c.dCellForgetLearningRate, delta);
745-
c.wCellForget += newLearningRate * delta;
721+
c.wCellIn += vecCellDelta.X;
722+
c.wCellForget += vecCellDelta.Y;
723+
c.wCellOut += vecCellDelta.Z;
746724

747-
delta = gradientOutputGate * c.cellState;
748-
newLearningRate = UpdateLearningRate(ref c.dCellOutLearningRate, delta);
749-
c.wCellOut += newLearningRate * delta;
750725

751726
neuHidden[i] = c;
752727
});
@@ -833,15 +808,15 @@ public override void computeHiddenLayer(State state, bool isTrain = true)
833808
//squash output gate
834809
cell_j.yOut = Sigmoid(cell_j.netOut);
835810

836-
cell_j.cellOutput = cell_j.cellState * cell_j.yOut;
811+
cell_j.cellOutput = (float)(cell_j.cellState * cell_j.yOut);
837812

838813

839814
neuHidden[j] = cell_j;
840815
});
841816
}
842817

843818

844-
public override void computeOutput(double[] doutput)
819+
public override void computeOutput(float[] doutput)
845820
{
846821
matrixXvectorADD(OutputLayer, neuHidden, Hidden2OutputWeight, L2, L1, 0);
847822
if (doutput != null)

RNNSharp/MathUtil.cs

+1-1
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@ namespace RNNSharp
77
{
88
class MathUtil
99
{
10-
public static int GetMaxProbIndex(double [] array)
10+
public static int GetMaxProbIndex(float [] array)
1111
{
1212
int dim = array.Length;
1313
double maxValue = array[0];

0 commit comments

Comments
 (0)