
Commit ebc087f: Code refactoring

1 parent 0b69b73 commit ebc087f

4 files changed: +25 −26 lines

RNNSharp/Layers/DropoutLayer.cs (−1 line)

@@ -38,7 +38,6 @@ public override Neuron CopyNeuronTo(Neuron neuron)
     DropoutNeuron dropoutNeuron = neuron as DropoutNeuron;
     mask.CopyTo(dropoutNeuron.mask, 0);
     Cells.CopyTo(dropoutNeuron.Cells, 0);
-    previousCellOutputs.CopyTo(dropoutNeuron.PrevCellOutputs, 0);

     return dropoutNeuron;
 }

RNNSharp/Layers/LSTMLayer.cs (+18 −17 lines)

@@ -129,12 +129,14 @@ public class LSTMLayer : SimpleLayer
     private Vector4 vecNormalLearningRate;
     private Vector3 vecNormalLearningRate3;
     private Vector<float> vecNormalLearningRateFloat;
+    // protected float[] previousCellOutputs;

     LSTMLayerConfig config;

     public LSTMLayer(LSTMLayerConfig config) : base(config)
     {
         this.config = config;
+        // previousCellOutputs = new float[LayerSize];
         LSTMCells = new LSTMCell[LayerSize];
         for (var i = 0; i < LayerSize; i++)
         {

@@ -155,7 +157,7 @@ public override Neuron CopyNeuronTo(Neuron neuron)
     LSTMNeuron lstmNeuron = neuron as LSTMNeuron;

     Cells.CopyTo(lstmNeuron.Cells, 0);
-    previousCellOutputs.CopyTo(lstmNeuron.PrevCellOutputs, 0);
+    // previousCellOutputs.CopyTo(lstmNeuron.PrevCellOutputs, 0);
     for (int i = 0; i < LayerSize; i++)
     {
         lstmNeuron.LSTMCells[i].Set(LSTMCells[i]);

@@ -168,8 +170,8 @@ public override Neuron CopyNeuronTo(Neuron neuron)
 public override void PreUpdateWeights(Neuron neuron, float[] errs)
 {
     LSTMNeuron lstmNeuron = neuron as LSTMNeuron;
-    lstmNeuron.Cells.CopyTo(Cells, 0);
-    lstmNeuron.PrevCellOutputs.CopyTo(previousCellOutputs, 0);
+    // lstmNeuron.Cells.CopyTo(Cells, 0);
+    // lstmNeuron.PrevCellOutputs.CopyTo(previousCellOutputs, 0);
     for (int i = 0; i < LayerSize; i++)
     {
         LSTMCells[i].Set(lstmNeuron.LSTMCells[i]);

@@ -726,7 +728,8 @@ public override void ForwardPass(SparseVector sparseFeature, float[] denseFeatur

     //hidden(t-1) -> hidden(t)
     cell_j.previousCellState = cell_j.cellState;
-    previousCellOutputs[j] = Cells[j];
+    cell_j.previousCellOutput = Cells[j];
+    // previousCellOutputs[j] = Cells[j];

     var vecCell_j = Vector4.Zero;

@@ -787,26 +790,24 @@ public override void ForwardPass(SparseVector sparseFeature, float[] denseFeatur
     //reset each netOut to zero
     cell_j.netOut = vecCell_j.W;

-    var cell_j_previousCellOutput = previousCellOutputs[j];
-
     //include internal connection multiplied by the previous cell state
-    cell_j.netIn += cell_j.previousCellState * cellWeight_j.wPeepholeIn + cell_j_previousCellOutput * cellWeight_j.wCellIn;
+    cell_j.netIn += cell_j.previousCellState * cellWeight_j.wPeepholeIn + cell_j.previousCellOutput * cellWeight_j.wCellIn;
     //squash input
     cell_j.yIn = Sigmoid(cell_j.netIn);

     //include internal connection multiplied by the previous cell state
     cell_j.netForget += cell_j.previousCellState * cellWeight_j.wPeepholeForget +
-                        cell_j_previousCellOutput * cellWeight_j.wCellForget;
+                        cell_j.previousCellOutput * cellWeight_j.wCellForget;
     cell_j.yForget = Sigmoid(cell_j.netForget);

-    cell_j.netCellState += cell_j_previousCellOutput * cellWeight_j.wCellState;
+    cell_j.netCellState += cell_j.previousCellOutput * cellWeight_j.wCellState;
     cell_j.yCellState = TanH(cell_j.netCellState);

     //cell state is equal to the previous cell state multipled by the forget gate and the cell inputs multiplied by the input gate
     cell_j.cellState = cell_j.yForget * cell_j.previousCellState + cell_j.yIn * cell_j.yCellState;

     ////include the internal connection multiplied by the CURRENT cell state
-    cell_j.netOut += cell_j.cellState * cellWeight_j.wPeepholeOut + cell_j_previousCellOutput * cellWeight_j.wCellOut;
+    cell_j.netOut += cell_j.cellState * cellWeight_j.wPeepholeOut + cell_j.previousCellOutput * cellWeight_j.wCellOut;

     //squash output gate
     cell_j.yOut = Sigmoid(cell_j.netOut);
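
For orientation, the arithmetic in this hunk is the standard peephole-LSTM cell update; the change only moves where the previous output is read from. Below is a minimal per-cell sketch of that update, not code from the commit: the field and weight names mirror the diff, Sigmoid/TanH stand in for the layer's own helpers, and the feed-forward input sums are assumed to already be in the net* fields.

// Sketch only (assumes LSTMCell/LSTMCellWeight shaped as in the diff, with the
// feed-forward sums already accumulated into the net* fields).
static double Sigmoid(double x) => 1.0 / (1.0 + Math.Exp(-x));
static double TanH(double x) => Math.Tanh(x);

static void CellStep(LSTMCell c, LSTMCellWeight w)
{
    // gates read the previous output via the wCell* recurrent weights
    // and the cell state via the wPeephole* connections
    c.yIn = Sigmoid(c.netIn + c.previousCellState * w.wPeepholeIn
                            + c.previousCellOutput * w.wCellIn);
    c.yForget = Sigmoid(c.netForget + c.previousCellState * w.wPeepholeForget
                                    + c.previousCellOutput * w.wCellForget);
    c.yCellState = TanH(c.netCellState + c.previousCellOutput * w.wCellState);

    // new cell state: forget-gated history plus input-gated candidate
    c.cellState = c.yForget * c.previousCellState + c.yIn * c.yCellState;

    // the output gate peeks at the CURRENT cell state
    c.yOut = Sigmoid(c.netOut + c.cellState * w.wPeepholeOut
                              + c.previousCellOutput * w.wCellOut);
}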
@@ -1001,20 +1002,18 @@ public override void BackwardPass()
     cellWeight.wPeepholeOut += vecCellDelta.Z;

     //Update cells weights
-    var c_previousCellOutput = previousCellOutputs[i];
     //partial derivatives for internal connections
     cellWeightDeri.dSWCellIn = cellWeightDeri.dSWCellIn * c.yForget +
-                               Sigmoid2_ci_netCellState_mul_SigmoidDerivative_ci_netIn * c_previousCellOutput;
+                               Sigmoid2_ci_netCellState_mul_SigmoidDerivative_ci_netIn * c.previousCellOutput;

     //partial derivatives for internal connections, initially zero as dS is zero and previous cell state is zero
     cellWeightDeri.dSWCellForget = cellWeightDeri.dSWCellForget * c.yForget +
-                                   ci_previousCellState_mul_SigmoidDerivative_ci_netForget * c_previousCellOutput;
+                                   ci_previousCellState_mul_SigmoidDerivative_ci_netForget * c.previousCellOutput;

     cellWeightDeri.dSWCellState = cellWeightDeri.dSWCellState * c.yForget +
-                                  Sigmoid2Derivative_ci_netCellState_mul_ci_yIn * c_previousCellOutput;
+                                  Sigmoid2Derivative_ci_netCellState_mul_ci_yIn * c.previousCellOutput;

-    var vecCellDelta4 = new Vector4((float)cellWeightDeri.dSWCellIn, (float)cellWeightDeri.dSWCellForget, (float)cellWeightDeri.dSWCellState,
-                                    c_previousCellOutput);
+    var vecCellDelta4 = new Vector4((float)cellWeightDeri.dSWCellIn, (float)cellWeightDeri.dSWCellForget, (float)cellWeightDeri.dSWCellState, (float)c.previousCellOutput);
     vecCellDelta4 = vecErr * vecCellDelta4;

     //Normalize err by gradient cut-off
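
A note on the Vector4 line kept here: System.Numerics.Vector4 multiplies component-wise, so packing the three partial derivatives together with previousCellOutput lets a single SIMD multiply scale all four terms by the cell's error. A self-contained illustration with made-up values (not commit code):

// Illustration only: Vector4's * operator is component-wise.
using System;
using System.Numerics;

class Vector4Demo
{
    static void Main()
    {
        var vecErr = new Vector4(0.5f);                          // error term broadcast to all four lanes
        var vecCellDelta4 = new Vector4(0.1f, 0.2f, 0.3f, 0.4f); // dSWCellIn, dSWCellForget, dSWCellState, previousCellOutput
        vecCellDelta4 = vecErr * vecCellDelta4;                  // one multiply scales all four values
        Console.WriteLine(vecCellDelta4);                        // <0.05, 0.1, 0.15, 0.2>
    }
}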
@@ -1069,7 +1068,7 @@ public override void Reset()

 private void InitializeLSTMCell(LSTMCell c, LSTMCellWeight cw, LSTMCellWeightDeri deri)
 {
-    c.previousCellState = 0;
+    // c.previousCellState = 0;
     c.cellState = 0;

     //partial derivatives

@@ -1139,6 +1138,7 @@ public class LSTMCell
 {
     //The following fields are only for forward
     public double previousCellState;
+    public double previousCellOutput;
     public double cellState;

     public double netCellState;

@@ -1164,6 +1164,7 @@ public LSTMCell(LSTMCell cell)
 public void Set(LSTMCell cell)
 {
     previousCellState = cell.previousCellState;
+    previousCellOutput = cell.previousCellOutput;
     cellState = cell.cellState;
     netCellState = cell.netCellState;
     netForget = cell.netForget;

RNNSharp/Layers/SimpleLayer.cs (−4 lines)

@@ -23,7 +23,6 @@ public class SimpleLayer
     public float[] DenseFeature { get; set; }

     protected ParallelOptions parallelOption = new ParallelOptions();
-    protected float[] previousCellOutputs;
     protected RunningMode runningMode;


@@ -34,7 +33,6 @@ public SimpleLayer(LayerConfig config)
 {
     LayerConfig = config;
     Cells = new float[LayerSize];
-    previousCellOutputs = new float[LayerSize];
     Errs = new float[LayerSize];
     LabelShortList = new List<int>();
 }

@@ -68,7 +66,6 @@ public void SetRunningMode(RunningMode mode)
 public virtual Neuron CopyNeuronTo(Neuron neuron)
 {
     Cells.CopyTo(neuron.Cells, 0);
-    previousCellOutputs.CopyTo(neuron.PrevCellOutputs, 0);

     return neuron;
 }

@@ -99,7 +96,6 @@ public virtual void ShallowCopyWeightTo(SimpleLayer destLayer)
 public virtual void PreUpdateWeights(Neuron neuron, float[] errs)
 {
     neuron.Cells.CopyTo(Cells, 0);
-    neuron.PrevCellOutputs.CopyTo(previousCellOutputs, 0);
     errs.CopyTo(Errs, 0);
 }
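
Read together with the LSTMLayer changes above, this is the whole refactoring: the layer-level previousCellOutputs array, which had to stay index-aligned with LSTMCells and be copied separately in CopyNeuronTo and PreUpdateWeights, becomes a previousCellOutput field on LSTMCell, so LSTMCell.Set moves all of a cell's recurrent state in one call. A schematic of the pattern with hypothetical names (not RNNSharp code):

// Before: per-cell state in a parallel array on the layer; every copy path
// must remember to copy the array alongside the cells.
class LayerBefore
{
    public double[] prevOutputs = new double[4]; // prevOutputs[j] belongs to cells[j]
    public Cell[] cells = new Cell[4];

    public void CopyTo(LayerBefore dst)
    {
        prevOutputs.CopyTo(dst.prevOutputs, 0);  // the extra step this commit removes
        for (int j = 0; j < cells.Length; j++) dst.cells[j].Set(cells[j]);
    }
}

// After: the state is a field of the cell, so Set copies everything at once.
class Cell
{
    public double prevOutput;
    public double state;

    public void Set(Cell other)
    {
        prevOutput = other.prevOutput;
        state = other.state;
    }
}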

RNNSharp/RNNEncoder.cs (+7 −4 lines)

@@ -217,14 +217,17 @@ public void Train()

 }

+var start = DateTime.Now;
 Logger.WriteLine($"Start to training {iter} iteration. learning rate = {RNNHelper.LearningRate}");
 Parallel.For(0, N, i =>
 {
     rnns[i].CleanStatus();
     Process(rnns[i], dataSets[i], RunningMode.Training);
 });

-Logger.WriteLine($"End {iter} iteration.");
+var duration = DateTime.Now.Subtract(start);
+
+Logger.WriteLine($"End {iter} iteration. Time duration = {duration}");
 Logger.WriteLine("");

 if (tknErrCnt >= bestTrainTknErrCnt && lastAlpha != RNNHelper.LearningRate)
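
A side note on the timing added above: subtracting DateTime.Now values works, but System.Diagnostics.Stopwatch is the usual monotonic alternative when system clock adjustments could skew the measurement. A sketch of the same logging with Stopwatch (Logger, iter, and the loop body are from the code above):

// Alternative sketch, not part of the commit: Stopwatch is monotonic.
var sw = System.Diagnostics.Stopwatch.StartNew();
Parallel.For(0, N, i =>
{
    rnns[i].CleanStatus();
    Process(rnns[i], dataSets[i], RunningMode.Training);
});
sw.Stop();
Logger.WriteLine($"End {iter} iteration. Time duration = {sw.Elapsed}");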
@@ -256,7 +259,6 @@ public void Train()
 //We got better result on validated corpus, save this model
 Logger.WriteLine($"Saving better model into file {modelFilePath}, since we got a better result on validation set.");
 Logger.WriteLine($"Error token percent: {(double)tknErrCnt / (double)processedWordCnt * 100.0}%, Error sequence percent: {(double)sentErrCnt / (double)processedSequence * 100.0}%");
-Logger.WriteLine("");

 rnn.SaveModel(modelFilePath);
 bestValidTknErrCnt = tknErrCnt;

@@ -268,11 +270,12 @@ public void Train()
 //We got better result on validated corpus, save this model
 Logger.WriteLine($"Saving better model into file {modelFilePath}, although validation set doesn't exist, we have better result on training set.");
 Logger.WriteLine($"Error token percent: {(double)trainTknErrCnt / (double)processedWordCnt * 100.0}%, Error sequence percent: {(double)sentErrCnt / (double)processedSequence * 100.0}%");
-Logger.WriteLine("");

 rnn.SaveModel(modelFilePath);
 }
-
+
+Logger.WriteLine("");
+
 if (trainTknErrCnt >= bestTrainTknErrCnt)
 {
     //We don't have better result on training set, so reduce learning rate
