SINGA-383 Add Separable Convolution for autograd

- Implement the Xception network by calling the SeparableConv2d layer. The example is added to the examples/autograd folder.
- Modified the SeparableConv2d layer API to accept a bias argument.

Project: http://git-wip-us.apache.org/repos/asf/incubator-singa/repo
Commit: http://git-wip-us.apache.org/repos/asf/incubator-singa/commit/d5422a43
Tree: http://git-wip-us.apache.org/repos/asf/incubator-singa/tree/d5422a43
Diff: http://git-wip-us.apache.org/repos/asf/incubator-singa/diff/d5422a43

Branch: refs/heads/master
Commit: d5422a432d1ad4261f3b44b1f61af5f4c2a651ec
Parents: ca70bdf
Author: xuewanqi <[email protected]>
Authored: Tue Aug 21 14:17:00 2018 +0000
Committer: xuewanqi <[email protected]>
Committed: Thu Aug 23 06:49:53 2018 +0000

----------------------------------------------------------------------
 examples/autograd/xceptionnet.py | 202 ++++++++++++++++++++++++++++++++++
 python/singa/autograd.py         |   6 +-
 2 files changed, 205 insertions(+), 3 deletions(-)
----------------------------------------------------------------------


http://git-wip-us.apache.org/repos/asf/incubator-singa/blob/d5422a43/examples/autograd/xceptionnet.py
----------------------------------------------------------------------
diff --git a/examples/autograd/xceptionnet.py b/examples/autograd/xceptionnet.py
new file mode 100755
index 0000000..f52a8ac
--- /dev/null
+++ b/examples/autograd/xceptionnet.py
@@ -0,0 +1,202 @@
+from singa import autograd
+from singa import tensor
+from singa import device
+from singa import opt
+
+import numpy as np
+from tqdm import trange
+
+
+# the code is modified from
+# https://github.com/Cadene/pretrained-models.pytorch/blob/master/pretrainedmodels/models/xception.py
+
+__all__ = ['xception']
+
+
+class Block(autograd.Layer):
+
+    def __init__(self, in_filters, out_filters, reps, strides=1, padding=0, start_with_relu=True, grow_first=True):
+        super(Block, self).__init__()
+
+        if out_filters != in_filters or strides != 1:
+            self.skip = autograd.Conv2d(in_filters, out_filters,
+                                        1, stride=strides, padding=padding, bias=False)
+            self.skipbn = autograd.BatchNorm2d(out_filters)
+        else:
+            self.skip = None
+
+        self.layers = []
+
+        filters = in_filters
+        if grow_first:
+            self.layers.append(autograd.ReLU())
+            self.layers.append(autograd.SeparableConv2d(in_filters, out_filters,
+                                                        3, stride=1, padding=1, bias=False))
+            self.layers.append(autograd.BatchNorm2d(out_filters))
+            filters = out_filters
+
+        for i in range(reps - 1):
+            self.layers.append(autograd.ReLU())
+            self.layers.append(autograd.SeparableConv2d(filters, filters,
+                                                        3, stride=1, padding=1, bias=False))
+            self.layers.append(autograd.BatchNorm2d(filters))
+
+        if not grow_first:
+            self.layers.append(autograd.ReLU())
+            self.layers.append(autograd.SeparableConv2d(in_filters, out_filters,
+                                                        3, stride=1, padding=1, bias=False))
+            self.layers.append(autograd.BatchNorm2d(out_filters))
+
+        if not start_with_relu:
+            self.layers = self.layers[1:]
+        else:
+            self.layers[0] = autograd.ReLU()
+
+        if strides != 1:
+            self.layers.append(autograd.MaxPool2d(3, strides, padding + 1))
+
+    def __call__(self, x):
+        y = self.layers[0](x)
+        for layer in self.layers[1:]:
+            if isinstance(y, tuple):
+                y = y[0]
+            y = layer(y)
+
+        if self.skip is not None:
+            skip = self.skip(x)
+            skip = self.skipbn(skip)
+        else:
+            skip = x
+        y = autograd.add(y, skip)
+        return y
+
+
+class Xception(autograd.Layer):
+    """
+    Xception optimized for the ImageNet dataset, as specified in
+    https://arxiv.org/pdf/1610.02357.pdf
+    """
+
+    def __init__(self, num_classes=1000):
+        """ Constructor
+        Args:
+            num_classes: number of classes
+        """
+        super(Xception, self).__init__()
+        self.num_classes = num_classes
+
+        self.conv1 = autograd.Conv2d(3, 32, 3, 2, 0, bias=False)
+        self.bn1 = autograd.BatchNorm2d(32)
+
+        self.conv2 = autograd.Conv2d(32, 64, 3, 1, 1, bias=False)
+        self.bn2 = autograd.BatchNorm2d(64)
+        # do relu here
+
+        self.block1 = Block(
+            64, 128, 2, 2, padding=0, start_with_relu=False, grow_first=True)
+        self.block2 = Block(
+            128, 256, 2, 2, padding=0, start_with_relu=True, grow_first=True)
+        self.block3 = Block(
+            256, 728, 2, 2, padding=0, start_with_relu=True, grow_first=True)
+
+        self.block4 = Block(
+            728, 728, 3, 1, start_with_relu=True, grow_first=True)
+        self.block5 = Block(
+            728, 728, 3, 1, start_with_relu=True, grow_first=True)
+        self.block6 = Block(
+            728, 728, 3, 1, start_with_relu=True, grow_first=True)
+        self.block7 = Block(
+            728, 728, 3, 1, start_with_relu=True, grow_first=True)
+
+        self.block8 = Block(
+            728, 728, 3, 1, start_with_relu=True, grow_first=True)
+        self.block9 = Block(
+            728, 728, 3, 1, start_with_relu=True, grow_first=True)
+        self.block10 = Block(
+            728, 728, 3, 1, start_with_relu=True, grow_first=True)
+        self.block11 = Block(
+            728, 728, 3, 1, start_with_relu=True, grow_first=True)
+
+        self.block12 = Block(
+            728, 1024, 2, 2, start_with_relu=True, grow_first=False)
+
+        self.conv3 = autograd.SeparableConv2d(1024, 1536, 3, 1, 1)
+        self.bn3 = autograd.BatchNorm2d(1536)
+
+        # do relu here
+        self.conv4 = autograd.SeparableConv2d(1536, 2048, 3, 1, 1)
+        self.bn4 = autograd.BatchNorm2d(2048)
+
+        self.globalpooling = autograd.MaxPool2d(10, 1)
+        self.fc = autograd.Linear(2048, num_classes)
+
+    def features(self, input):
+        x = self.conv1(input)
+        x = self.bn1(x)
+        x = autograd.relu(x)
+
+        x = self.conv2(x)
+        x = self.bn2(x)
+        x = autograd.relu(x)
+
+        x = self.block1(x)
+        x = self.block2(x)
+        x = self.block3(x)
+        x = self.block4(x)
+        x = self.block5(x)
+        x = self.block6(x)
+        x = self.block7(x)
+        x = self.block8(x)
+        x = self.block9(x)
+        x = self.block10(x)
+        x = self.block11(x)
+        x = self.block12(x)
+
+        x = self.conv3(x)
+        x = self.bn3(x)
+        x = autograd.relu(x)
+
+        x = self.conv4(x)
+        x = self.bn4(x)
+        return x
+
+    def logits(self, features):
+        x = autograd.relu(features)
+        x = self.globalpooling(x)
+        x = autograd.flatten(x)
+        x = self.fc(x)
+        return x
+
+    def __call__(self, input):
+        x = self.features(input)
+        x = self.logits(x)
+        return x
+
+
+if __name__ == '__main__':
+    model = Xception(num_classes=1000)
+    print('Start intialization............')
+    dev = device.create_cuda_gpu_on(0)
+    #dev = device.create_cuda_gpu()
+
+    niters = 20
+    batch_size = 16
+    IMG_SIZE = 299
+    sgd = opt.SGD(lr=0.1, momentum=0.9, weight_decay=1e-5)
+
+    tx = tensor.Tensor((batch_size, 3, IMG_SIZE, IMG_SIZE), dev)
+    ty = tensor.Tensor((batch_size,), dev, tensor.int32)
+    autograd.training = True
+    x = np.random.randn(batch_size, 3, IMG_SIZE, IMG_SIZE).astype(np.float32)
+    y = np.random.randint(0, 1000, batch_size, dtype=np.int32)
+    tx.copy_from_numpy(x)
+    ty.copy_from_numpy(y)
+
+    with trange(niters) as t:
+        for b in t:
+            x = model(tx)
+            loss = autograd.softmax_cross_entropy(x, ty)
+            for p, g in autograd.backward(loss):
+                # print(p.shape, g.shape)
+                sgd.update(p, g)
+            # pass


http://git-wip-us.apache.org/repos/asf/incubator-singa/blob/d5422a43/python/singa/autograd.py
----------------------------------------------------------------------
diff --git a/python/singa/autograd.py b/python/singa/autograd.py
index 938b813..84afcd1 100755
--- a/python/singa/autograd.py
+++ b/python/singa/autograd.py
@@ -779,12 +779,12 @@ class Conv2d(Layer):
 
 class SeparableConv2d(Layer):
 
-    def __init__(self, in_channels, out_channels, kernel_size, stride=1, padding=0):
+    def __init__(self, in_channels, out_channels, kernel_size, stride=1, padding=0, bias=False):
 
         self.mapping_spacial_conv = Conv2d(
-            in_channels, in_channels, kernel_size, stride, padding, groups=in_channels, bias=False)
+            in_channels, in_channels, kernel_size, stride, padding, groups=in_channels, bias=bias)
 
-        self.mapping_depth_conv = Conv2d(in_channels, out_channels, 1, bias=False)
+        self.mapping_depth_conv = Conv2d(in_channels, out_channels, 1, bias=bias)
 
     def __call__(self, x):
         y = self.mapping_spacial_conv(x)
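
----------------------------------------------------------------------

For a quick sanity check of the updated signature, the snippet below is a minimal sketch of calling SeparableConv2d on its own; the channel counts, input shape, and CUDA device are illustrative assumptions rather than values taken from this commit.

    import numpy as np

    from singa import autograd
    from singa import device
    from singa import tensor

    autograd.training = True
    dev = device.create_cuda_gpu_on(0)       # assumes a CUDA-enabled SINGA build

    # Depthwise (grouped) 3x3 conv followed by a 1x1 pointwise conv; the new
    # `bias` flag is forwarded to both internal Conv2d layers.
    sep = autograd.SeparableConv2d(64, 128, 3, stride=1, padding=1, bias=False)

    x = tensor.Tensor((8, 64, 32, 32), dev)  # illustrative NCHW input
    x.copy_from_numpy(np.random.randn(8, 64, 32, 32).astype(np.float32))
    y = sep(x)                               # expected shape: (8, 128, 32, 32)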
