deep-learning-algorithm
diff --git a/pynet/nn/Conv2d.py b/pynet/nn/Conv2d.py
Lines changed: 33 additions & 48 deletions
diff --git a/pynet/nn/Conv2d2.py b/pynet/nn/Conv2d2.py
Lines changed: 0 additions & 73 deletions
diff --git a/pynet/nn/GAP.py b/pynet/nn/GAP.py
Lines changed: 7 additions & 10 deletions
diff --git a/pynet/nn/Layer.py b/pynet/nn/Layer.py
Lines changed: 1 addition & 1 deletion
diff --git a/pynet/nn/MaxPool.py b/pynet/nn/MaxPool.py
Lines changed: 16 additions & 17 deletions
diff --git a/pynet/nn/MaxPool2.py b/pynet/nn/MaxPool2.py
Lines changed: 0 additions & 54 deletions
diff --git a/pynet/nn/__init__.py b/pynet/nn/__init__.py
Lines changed: 2 additions & 2 deletions
diff --git a/pynet/nn/__pycache__/Conv2d.cpython-37.pyc b/pynet/nn/__pycache__/Conv2d.cpython-37.pyc
-2.89 KB
diff --git a/pynet/nn/__pycache__/Conv2d2.cpython-37.pyc b/pynet/nn/__pycache__/Conv2d2.cpython-37.pyc
-2.38 KB
diff --git a/pynet/nn/__pycache__/MaxPool.cpython-37.pyc b/pynet/nn/__pycache__/MaxPool.cpython-37.pyc
-1.65 KB
@@ -1,6 +1,6 @@
 # -*- coding: utf-8 -*-
 
-# @Time    : 19-6-20 下午2:29
+# @Time    : 19-7-2 上午9:53
 # @Author  : zj
 
 
@@ -9,80 +9,65 @@
 from .pool2row import *
 from .Layer import *
 
-__all__ = ['Conv2d']
+__all__ = ['Conv2d2']
 
 
-class Conv2d(Layer):
+class Conv2d2:
     """
     convolutional layer
     卷积层
     """
 
-    def __init__(self, in_c, filter_h, filter_w, filter_num, stride=1, padding=0, momentum=0, nesterov=False):
-        super(Conv2d, self).__init__()
+    def __init__(self, in_c, filter_h, filter_w, filter_num, stride=1, padding=0, weight_scale=1e-2):
+        """
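+        :param in_c: number of channels in the input volume
+        :param filter_h: filter height
+        :param filter_w: filter width
+        :param filter_num: number of filters
+        :param stride: stride
+        :param padding: zero padding
+        :param weight_scale: factor multiplied into the standard-normal samples that get_params() draws for the weights and bias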
+        """
+        super(Conv2d2, self).__init__()
         self.in_c = in_c
         self.filter_h = filter_h
         self.filter_w = filter_w
         self.filter_num = filter_num
         self.stride = stride
         self.padding = padding
+        self.weight_scale = weight_scale
 
-        self.W = \
-            {'val': 0.01 * np.random.normal(loc=0, scale=1.0, size=(filter_h * filter_w * in_c, filter_num)),
-             'grad': 0,
-             'v': 0,
-             'momentum': momentum,
-             'nesterov': nesterov}
-        self.b = {'val': 0.01 * np.random.normal(loc=0, scale=1.0, size=(1, filter_num)), 'grad': 0}
-        self.a = None
-        self.input_shape = None
+    def __call__(self, inputs, w, b):
+        return self.forward(inputs, w, b)
 
-    def __call__(self, inputs):
-        return self.forward(inputs)
-
-    def forward(self, inputs):
+    def forward(self, inputs, w, b):
         # input.shape == [N, C, H, W]
         assert len(inputs.shape) == 4
         N, C, H, W = inputs.shape[:4]
         out_h = int((H - self.filter_h + 2 * self.padding) / self.stride + 1)
         out_w = int((W - self.filter_w + 2 * self.padding) / self.stride + 1)
 
         a = im2row_indices(inputs, self.filter_h, self.filter_w, stride=self.stride, padding=self.padding)
-        z = a.dot(self.W['val']) + self.b['val']
-
-        self.input_shape = inputs.shape
-        self.a = a.copy()
+        z = a.dot(w) + b
 
         out = conv_fc2output(z, N, out_h, out_w)
-        return out
+        cache = (a, inputs.shape, w, b)
+        return out, cache
 
-    def backward(self, grad_out):
+    def backward(self, grad_out, cache):
         assert len(grad_out.shape) == 4
 
-        dz = conv_output2fc(grad_out)
-        self.W['grad'] = self.a.T.dot(dz)
-        self.b['grad'] = np.sum(dz, axis=0, keepdims=True) / dz.shape[0]
-
-        da = dz.dot(self.W['val'].T)
-        return row2im_indices(da, self.input_shape, field_height=self.filter_h,
-                              field_width=self.filter_w, stride=self.stride, padding=self.padding)
-
-    def update(self, learning_rate=0, regularization_rate=0):
-        v_prev = self.W['v']
-        self.W['v'] = self.W['momentum'] * self.W['v'] - learning_rate * (
-                self.W['grad'] + regularization_rate * self.W['val'])
-        if self.W['nesterov']:
-            self.W['val'] += (1 + self.W['momentum']) * self.W['v'] - self.W['momentum'] * v_prev
-        else:
-            self.W['val'] += self.W['v']
-        self.b['val'] -= learning_rate * (self.b['grad'])
+        a, input_shape, w, b = cache
 
-    def get_params(self):
-        return {'W': self.W['val'], 'momentum': self.W['momentum'], 'nesterov': self.W['nesterov'], 'b': self.b['val']}
+        dz = conv_output2fc(grad_out)
+        grad_W = a.T.dot(dz)
+        grad_b = np.sum(dz, axis=0, keepdims=True) / dz.shape[0]
 
-    def set_params(self, params):
-        self.W['val'] = params.get('W')
-        self.b['val'] = params.get('b')
+        da = dz.dot(w.T)
+        return grad_W, grad_b, row2im_indices(da, input_shape, field_height=self.filter_h,
+                                              field_width=self.filter_w, stride=self.stride, padding=self.padding)
 
-        self.W['momentum'] = params.get('momentum', 0.0)
-        self.W['nesterov'] = params.get('nesterov', False)
+    def get_params(self):
+        return self.weight_scale * np.random.normal(loc=0, scale=1.0, size=(
+            self.filter_h * self.filter_w * self.in_c, self.filter_num)), \
+               self.weight_scale * np.random.normal(loc=0, scale=1.0, size=(1, self.filter_num))
@@ -16,10 +16,6 @@ class GAP(Layer):
     全局平均池化层
     """
 
-    def __init__(self):
-        super(GAP, self).__init__()
-        self.input_shape = None
-
     def __call__(self, inputs):
         return self.forward(inputs)
 
@@ -29,12 +25,13 @@ def forward(self, inputs):
         N, C, H, W = inputs.shape[:4]
 
         z = np.mean(inputs.reshape(N, C, -1), axis=2)
-        self.input_shape = inputs.shape
 
-        return z
+        cache = (inputs.shape)
+        return z, cache
 
-    def backward(self, grad_out):
-        N, C, H, W = self.input_shape[:4]
+    def backward(self, grad_out, cache):
+        input_shape = cache
+        N, C, H, W = input_shape[:4]
         dz = grad_out.reshape(N * C, -1)
         da = np.repeat(dz, H * W, axis=1)
 
@@ -45,9 +42,9 @@ def backward(self, grad_out):
     gap = GAP()
 
     inputs = np.arange(36).reshape(2, 2, 3, 3)
-    res = gap(inputs)
+    res, cache = gap(inputs)
     print(res)
 
     grad_out = np.arange(4).reshape(2, 2)
-    da = gap.backward(grad_out)
+    da = gap.backward(grad_out, cache)
     print(da)
@@ -15,5 +15,5 @@ def forward(self, inputs):
         pass
 
     @abstractmethod
-    def backward(self, grad_out):
+    def backward(self, grad_out, cache):
         pass
@@ -1,33 +1,28 @@
 # -*- coding: utf-8 -*-
 
-# @Time    : 19-6-20 下午3:03
+# @Time    : 19-7-2 上午10:06
 # @Author  : zj
 
-
 from .utils import *
 from .pool2row import *
 from .Layer import *
 
-__all__ = ['MaxPool']
+__all__ = ['MaxPool2']
 
 
-class MaxPool(Layer):
+class MaxPool2:
     """
     max pool layer
     池化层，执行max运算
     """
 
     def __init__(self, filter_h, filter_w, filter_num, stride=2):
-        super(MaxPool, self).__init__()
+        super(MaxPool2, self).__init__()
         self.filter_h = filter_h
         self.filter_w = filter_w
         self.filter_num = filter_num
         self.stride = stride
 
-        self.input_shape = None
-        self.a_shape = None
-        self.arg_z = None
-
     def __call__(self, inputs):
         return self.forward(inputs)
 
@@ -40,16 +35,20 @@ def forward(self, inputs):
 
         a = pool2row_indices(inputs, self.filter_h, self.filter_w, stride=self.stride)
         z = np.max(a, axis=1)
-        self.arg_z = np.argmax(a, axis=1)
-        self.input_shape = inputs.shape
-        self.a_shape = a.shape
 
-        return pool_fc2output(z, N, out_h, out_w)
+        arg_z = np.argmax(a, axis=1)
+        input_shape = inputs.shape
+        a_shape = a.shape
+        cache = (arg_z, input_shape, a_shape)
+
+        return pool_fc2output(z, N, out_h, out_w), cache
+
+    def backward(self, grad_out, cache):
+        arg_z, input_shape, a_shape = cache
 
-    def backward(self, grad_out):
         dz = pool_output2fc(grad_out)
-        da = np.zeros(self.a_shape)
-        da[range(self.a_shape[0]), self.arg_z] = dz
+        da = np.zeros(a_shape)
+        da[range(a_shape[0]), arg_z] = dz
 
-        return row2pool_indices(da, self.input_shape, field_height=self.filter_h, field_width=self.filter_w,
+        return row2pool_indices(da, input_shape, field_height=self.filter_h, field_width=self.filter_w,
                                 stride=self.stride)
@@ -8,5 +8,5 @@
 from .MaxPool import MaxPool
 from .GAP import GAP
 
-from .Conv2d2 import Conv2d2
-from .MaxPool2 import MaxPool2
+from .Conv2d import Conv2d2
+from .MaxPool import MaxPool2