@@ -30,6 +30,10 @@ public class LSTMCell : SimpleCell
        public double wCellForget;
        public double wCellOut;

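+        //accumulated squared gradients (AdaGrad-style) used to derive per-weight learning rates for the internal cell weights below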
+        public float dCellInLearningRate;
+        public float dCellForgetLearningRate;
+        public float dCellOutLearningRate;
+
        //partial derivatives
        public double dSWCellIn;
        public double dSWCellForget;
@@ -48,6 +52,22 @@ public struct LSTMWeight
        public float wInputOutputGate;
    }

+    //public struct LSTMWeightLearningRate
+    //{
+    //    public float dInputCellLearningRate;
+    //    public float dInputInputGateLearningRate;
+    //    public float dInputForgetGateLearningRate;
+    //    public float dInputOutputGateLearningRate;
+    //}
+
+    //public struct LSTMWeightDerivative
+    //{
+    //    //partial derivatives. don't need partial derivative for output gate as it uses BP not RTRL
+    //    public double dSInputCell;
+    //    public double dSInputInputGate;
+    //    public double dSInputForgetGate;
+    //}
+
    public class LSTMRNN : RNN
    {
        public LSTMCell[] neuHidden;        //neurons in hidden layer
@@ -56,15 +76,10 @@ public class LSTMRNN : RNN

        protected Vector4[][] Input2HiddenLearningRate;
        protected Vector4[][] Feature2HiddenLearningRate;
-        protected Vector3[] CellLearningRate;

        protected Vector3[][] input2hiddenDeri;
        protected Vector3[][] feature2hiddenDeri;

-        private Vector4 vecLearningRate;
-        private Vector3 vecLearningRate3;
-
-
        public LSTMRNN()
        {
            ModelType = MODELTYPE.LSTM;
@@ -353,7 +368,7 @@ public override void SaveModel(string filename)
            //weight input->hidden
            Logger.WriteLine("Saving input2hidden weights...");
            saveLSTMWeight(input2hidden, fo);
-
+
            if (DenseFeatureSize > 0)
            {
                //weight fea->hidden
@@ -438,7 +453,7 @@ public override void initWeights()
            }

            //Create and initialise the weights from hidden to output layer, these are just normal weights
-            Hidden2OutputWeight = new Matrix<float>(L2, L1);
+            Hidden2OutputWeight = new Matrix<double>(L2, L1);

            for (int i = 0; i < Hidden2OutputWeight.Height; i++)
            {
@@ -484,9 +499,12 @@ public override void CleanStatus()
                Feature2HiddenLearningRate = new Vector4[L1][];
            }

-            CellLearningRate = new Vector3[L1];
            Parallel.For(0, L1, parallelOption, i =>
            {
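+                //reset the accumulated squared gradients for the internal cell weights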
+                neuHidden[i].dCellForgetLearningRate = 0;
+                neuHidden[i].dCellInLearningRate = 0;
+                neuHidden[i].dCellOutLearningRate = 0;
+
                Input2HiddenLearningRate[i] = new Vector4[L0];

                if (DenseFeatureSize > 0)
@@ -497,8 +515,6 @@ public override void CleanStatus()
            });

            Hidden2OutputWeightLearningRate = new Matrix<float>(L2, L1);
-            vecLearningRate = new Vector4(LearningRate, LearningRate, LearningRate, LearningRate);
-            vecLearningRate3 = new Vector3(LearningRate, LearningRate, LearningRate);
        }

        public override void InitMem()
@@ -567,7 +583,7 @@ public override void ComputeHiddenLayerErr()
                //find the error by finding the product of the output errors and their weight connections.
                SimpleCell cell = neuHidden[i];

-                cell.er = 0.0f;
+                cell.er = 0.0;

                if (cell.mask == false)
                {
@@ -584,22 +600,30 @@ public override void LearnOutputWeight()
            //update weights for hidden to output layer
            Parallel.For(0, L1, parallelOption, i =>
            {
-                float cellOutput = neuHidden[i].cellOutput;
+                double cellOutput = neuHidden[i].cellOutput;
                for (int k = 0; k < L2; k++)
                {
-                    float delta = NormalizeGradient(cellOutput * OutputLayer.er[k]);
-                    double newLearningRate = UpdateLearningRate(Hidden2OutputWeightLearningRate, k, i, delta);
+                    double delta = NormalizeGradient(cellOutput * OutputLayer.er[k]);
+                    double newLearningRate = UpdateLearningRate(Hidden2OutputWeightLearningRate, i, k, delta);

-                    Hidden2OutputWeight[k][i] += (float)(newLearningRate * delta);
+                    Hidden2OutputWeight[k][i] += newLearningRate * delta;
                }
            });
        }

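+        //AdaGrad-style update: accumulate the squared gradient into mg and return
+        //a per-weight step size that shrinks as the accumulated magnitude grows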
+        public double UpdateLearningRate(ref float mg, double delta)
+        {
+            double dg = mg + delta * delta;
+            mg = (float)dg;
+            return LearningRate / (1.0 + Math.Sqrt(dg));
+        }
+
        public override void LearnNet(State state, int numStates, int curState)
        {
            //Get sparse feature and apply it into hidden layer
            var sparse = state.SparseData;
            int sparseFeatureSize = sparse.Count;
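+            //broadcast the base learning rate across the four gate-weight components for SIMD updates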
+            Vector4 vecLearningRate = new Vector4(LearningRate, LearningRate, LearningRate, LearningRate);

            //put variables for derivatives in weight class and cell class
            Parallel.For(0, L1, parallelOption, i =>
@@ -626,6 +650,8 @@ public override void LearnNet(State state, int numStates, int curState)
                    (float)Sigmoid2_ci_netCellState_mul_SigmoidDerivative_ci_netIn,
                    (float)ci_previousCellState_mul_SigmoidDerivative_ci_netForget);

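+                //scratch variables reused by the adaptive updates of the internal cell weights below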
+                double delta = 0;
+                double newLearningRate = 0;
                for (int k = 0; k < sparseFeatureSize; k++)
                {
                    var entry = sparse.GetEntry(k);
@@ -647,7 +673,9 @@ public override void LearnNet(State state, int numStates, int curState)
                    vecAlpha = wlr + vecAlpha;
                    wlr_i[entry.Key] = vecAlpha;

-                    vecAlpha = vecLearningRate / (Vector4.SquareRoot(vecAlpha) + Vector4.One);
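+                    //element-wise adaptive rate: LearningRate / (1 + sqrt(accumulated squared gradient))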
+                    vecAlpha = Vector4.SquareRoot(vecAlpha) + Vector4.One;
+                    vecAlpha = vecLearningRate / vecAlpha;
+
                    vecDelta = vecAlpha * vecDelta;

                    w.wInputCell += vecDelta.X;
@@ -685,7 +713,9 @@ public override void LearnNet(State state, int numStates, int curState)
                    vecAlpha = wlr + vecAlpha;
                    wlr_i[j] = vecAlpha;

-                    vecAlpha = vecLearningRate / (Vector4.SquareRoot(vecAlpha) + Vector4.One);
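+                    //same element-wise adaptive rate for the dense feature weights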
+                    vecAlpha = Vector4.SquareRoot(vecAlpha) + Vector4.One;
+                    vecAlpha = vecLearningRate / vecAlpha;
+
                    vecDelta = vecAlpha * vecDelta;

                    w.wInputCell += vecDelta.X;
@@ -706,22 +736,17 @@ public override void LearnNet(State state, int numStates, int curState)


                //update internal weights
-                Vector3 vecCellDelta = new Vector3((float)c.dSWCellIn, (float)c.dSWCellForget, (float)c.cellState);
-                Vector3 vecCellErr = new Vector3(cellStateError, cellStateError, gradientOutputGate);
-                Vector3 vecCellLearningRate = CellLearningRate[i];
-
-                vecCellDelta = vecCellErr * vecCellDelta;
-                vecCellLearningRate += (vecCellDelta * vecCellDelta);
-                CellLearningRate[i] = vecCellLearningRate;
-
-                //LearningRate / (1.0 + Math.Sqrt(dg));
-                vecCellLearningRate = vecLearningRate3 / (Vector3.One + Vector3.SquareRoot(vecCellLearningRate));
-                vecCellDelta = vecCellLearningRate * vecCellDelta;
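+                //scalar AdaGrad-style updates for the three internal cell weights, driven by the RTRL partial derivatives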
+                delta = cellStateError * c.dSWCellIn;
+                newLearningRate = UpdateLearningRate(ref c.dCellInLearningRate, delta);
+                c.wCellIn += newLearningRate * delta;

-                c.wCellIn += vecCellDelta.X;
-                c.wCellForget += vecCellDelta.Y;
-                c.wCellOut += vecCellDelta.Z;
+                delta = cellStateError * c.dSWCellForget;
+                newLearningRate = UpdateLearningRate(ref c.dCellForgetLearningRate, delta);
+                c.wCellForget += newLearningRate * delta;

+                delta = gradientOutputGate * c.cellState;
+                newLearningRate = UpdateLearningRate(ref c.dCellOutLearningRate, delta);
+                c.wCellOut += newLearningRate * delta;

                neuHidden[i] = c;
            });
@@ -808,15 +833,15 @@ public override void computeHiddenLayer(State state, bool isTrain = true)
                //squash output gate
                cell_j.yOut = Sigmoid(cell_j.netOut);

-                cell_j.cellOutput = (float)(cell_j.cellState * cell_j.yOut);
+                cell_j.cellOutput = cell_j.cellState * cell_j.yOut;


                neuHidden[j] = cell_j;
            });
        }

-        public override void computeOutput(float[] doutput)
+        public override void computeOutput(double[] doutput)
        {
            matrixXvectorADD(OutputLayer, neuHidden, Hidden2OutputWeight, L2, L1, 0);
            if (doutput != null)