
Fixed previous weight handling for DCASGD optimizer. #5140

Merged · 9 commits · Mar 5, 2017
Simplified logic and moved the weight_bak initialization back to before
updating the weight; the original bug was in the momentum == 0.0 block, it seems.
sergeykolychev committed Feb 25, 2017
commit 259d2e7f4c972499b04420c9b54983975e493bfd
python/mxnet/optimizer.py (18 changes: 6 additions & 12 deletions)
@@ -318,7 +318,7 @@ def create_state(self, index, weight):

"""
if self.momentum == 0.0:
return (None, # momentum
return (zeros(weight.shape, weight.context, dtype=weight.dtype), # placeholder
weight.copy()) # previous weight
else:
return (zeros(weight.shape, weight.context, dtype=weight.dtype), # momentum
@@ -352,17 +352,11 @@ def update(self, index, weight, grad, state):
            grad = clip(grad, -self.clip_gradient, self.clip_gradient)

        mom, previous_weight = state
[Inline review comment, Contributor] This wastes memory and compute. Better to use different states and test for momentum == 0.
-        if mom:
-            mom[:] *= self.momentum
-            mom[:] += -lr * (grad + wd * weight + self.lamda \
-                             * grad * grad * (weight - previous_weight))
-            weight[:] += mom
-            previous_weight[:] = weight
-        else:
-            assert self.momentum == 0.0
-            weight[:] += -lr * (grad + wd * weight + self.lamda \
-                                * grad * grad * (weight - previous_weight))
-            previous_weight[:] = weight
+        mom[:] *= self.momentum
+        mom[:] += -lr * (grad + wd * weight + self.lamda \
+                         * grad * grad * (weight - previous_weight))
+        previous_weight[:] = weight
+        weight[:] += mom

@register
class NAG(SGD):
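
The commit message above notes that the previous-weight snapshot has to happen before the weight itself is updated. Below is a minimal standalone sketch of that corrected ordering, assuming NumPy arrays as a stand-in for mxnet.ndarray; the hyperparameter names follow the diff, and the helper name dcasgd_step is hypothetical.

import numpy as np

def dcasgd_step(weight, grad, mom, previous_weight, lr, wd, momentum, lamda):
    # Delay-compensated step, matching the added lines in the diff above.
    mom *= momentum
    mom += -lr * (grad + wd * weight
                  + lamda * grad * grad * (weight - previous_weight))
    previous_weight[:] = weight  # snapshot BEFORE the weight moves
    weight += mom

# Toy usage: all states are plain float arrays of the same shape.
w = np.ones(3)
g = np.full(3, 0.1)
dcasgd_step(w, g, mom=np.zeros(3), previous_weight=w.copy(),
            lr=0.01, wd=0.0, momentum=0.0, lamda=0.04)

With momentum == 0.0, mom holds exactly the current step and previous_weight keeps the value the weight had before the update, which is what the old momentum == 0.0 branch got wrong.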
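
The inline review comment above suggests not allocating the zeros placeholder when momentum == 0.0. A hedged sketch of that alternative follows (not what this commit does; same NumPy-style arrays, and the helper name is again hypothetical), keeping the corrected snapshot-before-update ordering.

def dcasgd_step_no_placeholder(weight, grad, mom, previous_weight, lr, wd, momentum, lamda):
    # Reviewer's suggestion: keep mom as None when momentum == 0.0 and branch,
    # instead of allocating a zeros buffer only to multiply it by zero.
    step = -lr * (grad + wd * weight
                  + lamda * grad * grad * (weight - previous_weight))
    if mom is None:
        previous_weight[:] = weight  # still snapshot before the weight moves
        weight += step
    else:
        mom *= momentum
        mom += step
        previous_weight[:] = weight
        weight += mom

Whether the saved allocation is worth the extra branch is exactly the trade-off the reviewer raises; a later revision could keep None as the momentum state in create_state and dispatch on it here.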