add centered variant of RMS Prop
parent fb22f64716
commit c2bb2cfcd5
1 changed file with 45 additions and 2 deletions
onn_core.py
@@ -323,13 +323,56 @@ class RMSprop(Optimizer):
             self.g = np.zeros_like(dW)
 
         # basically apply a first-order low-pass filter to delta squared
-        self.g[:] = self.mu * self.g + (1 - self.mu) * dW * dW
+        self.g[:] = self.mu * self.g + (1 - self.mu) * np.square(dW)
         # equivalent (though numerically different?):
-        #self.g += (dW * dW - self.g) * (1 - self.mu)
+        #self.g += (np.square(dW) - self.g) * (1 - self.mu)
 
         # finally sqrt it to complete the running root-mean-square approximation
         return -self.lr * dW / (np.sqrt(self.g) + self.eps)
 
+class RMSpropCentered(Optimizer):
+    # referenced TensorFlow/PyTorch.
+    # paper: https://arxiv.org/pdf/1308.0850v5.pdf
+
+    def __init__(self, lr=1e-4, aleph=0.95, momentum=0.9, eps=1e-8):
+        self.aleph = _f(aleph)
+        self.momentum = _f(momentum)
+        self.eps = _f(eps)
+
+        super().__init__(lr)
+
+    def reset(self):
+        self.g = None
+        self.mt = None
+        self.vt = None
+        self.delta = None
+
+    def compute(self, dW, W):
+        if self.g is None:
+            self.g = np.zeros_like(dW)
+        if self.mt is None:
+            self.mt = np.zeros_like(dW)
+        if self.vt is None:
+            self.vt = np.zeros_like(dW)
+        if self.delta is None:
+            self.delta = np.zeros_like(dW)
+
+        self.mt[:] = self.aleph * self.mt + (1 - self.aleph) * dW
+        self.vt[:] = self.aleph * self.vt + (1 - self.aleph) * np.square(dW)
+
+        # PyTorch has the epsilon outside of the sqrt,
+        # TensorFlow and the paper have it within.
+        # in onn, we generally do it outside, as this seems to work better.
+        temp = dW / (np.sqrt(self.vt - np.square(self.mt)) + self.eps)
+
+        # TensorFlow does it this way.
+        self.delta[:] = self.momentum * self.delta + self.lr * temp
+        return -self.delta
+        # PyTorch does it this way.
+        #self.delta[:] = self.momentum * self.delta + temp
+        #return -self.lr * self.delta
+        # they are equivalent only when LR is constant, which it might not be.
+
 class Adam(Optimizer):
     # paper: https://arxiv.org/abs/1412.6980
     # Adam generalizes* RMSprop, and
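A minimal way to sanity-check the new optimizer is a hand-rolled loop on a toy quadratic. This sketch assumes onn_core.py (as committed here) is importable; the loop itself is only illustrative, not onn's actual training API:

import numpy as np
from onn_core import RMSpropCentered  # class added in this commit

# toy objective: f(W) = 0.5 * ||W||^2, whose gradient is simply W
W = np.array([3.0, -2.0], dtype=np.float32)
opt = RMSpropCentered(lr=1e-2)
opt.reset()  # ensure g/mt/vt/delta start out as None

for _ in range(2000):
    dW = W.copy()            # gradient of the toy objective
    W += opt.compute(dW, W)  # compute() returns the step to add to W

print(W)  # should have decayed toward [0, 0]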