yresnet, stem_stride_on

ayasyrev · ayasyrev · commit d1543b0d5b97 · 2020-07-28T12:33:04.000+03:00
diff --git a/model_constructor/__init__.py b/model_constructor/__init__.py
@@ -1 +1 @@
-__version__ = "0.1.1"
+__version__ = "0.1.4"
diff --git a/model_constructor/_nbdev.py b/model_constructor/_nbdev.py
@@ -31,21 +31,23 @@
          "xresnet50": "03_xresnet.ipynb",
          "init_cnn": "04_Net.ipynb",
          "NewResBlock": "04_Net.ipynb",
-         "net34": "04_Net.ipynb",
-         "net50": "04_Net.ipynb",
          "nn": "05_Twist.ipynb",
          "F": "05_Twist.ipynb",
          "ConvTwist": "05_Twist.ipynb",
          "ConvLayerTwist": "05_Twist.ipynb",
          "NewResBlockTwist": "05_Twist.ipynb",
-         "ResBlockTwist": "05_Twist.ipynb"}
+         "ResBlockTwist": "05_Twist.ipynb",
+         "YResBlock": "06_YResnet.ipynb",
+         "yresnet34": "06_YResnet.ipynb",
+         "yresnet50": "06_YResnet.ipynb"}
 
 modules = ["constructor.py",
            "layers.py",
            "resnet.py",
            "xresnet.py",
            "net.py",
-           "twist.py"]
+           "twist.py",
+           "yresnet.py"]
 
 doc_url = "https://ayasyrev.github.io/model_constructor/"
 
diff --git a/model_constructor/net.py b/model_constructor/net.py
@@ -1,13 +1,12 @@
 # AUTOGENERATED! DO NOT EDIT! File to edit: nbs/04_Net.ipynb (unless otherwise specified).
 
-__all__ = ['init_cnn', 'act_fn', 'ResBlock', 'NewResBlock', 'Net', 'net34', 'net50']
+__all__ = ['init_cnn', 'act_fn', 'ResBlock', 'NewResBlock', 'Net']
 
 # Cell
 import torch.nn as nn
 import sys, torch
 from functools import partial
 from collections import OrderedDict
-
 from .layers import *
 
 # Cell
@@ -70,7 +69,8 @@ def forward(self, x):
 # Cell
 def _make_stem(self):
         stem = [(f"conv_{i}", self.conv_layer(self.stem_sizes[i], self.stem_sizes[i+1],
-                    stride=2 if i==0 else 1,
+#                     stride=2 if i==0 else 1,
+                    stride=2 if i==self.stem_stride_on else 1,
                     bn_layer=(not self.stem_bn_end) if i==(len(self.stem_sizes)-2) else True,
                     act_fn=self.act_fn, bn_1st=self.bn_1st))
                 for i in range(len(self.stem_sizes)-1)]
@@ -105,18 +105,18 @@ def _make_head(self):
 # Cell
 # v8
 class Net():
-    def __init__(self, expansion=1, layers=[2,2,2,2], c_in=3, c_out=1000, name='Net',
-                act_fn=nn.ReLU(inplace=True), pool = nn.AvgPool2d(2, ceil_mode=True), sa=0):
+    def __init__(self, expansion=1, layers=[2,2,2,2], c_in=3, c_out=1000,
+                 name='Net', block=ResBlock,act_fn=nn.ReLU(inplace=True),
+                 pool = nn.AvgPool2d(2, ceil_mode=True), sa=0):
         super().__init__()
         self.name = name
         self.c_in, self.c_out,self.expansion,self.layers = c_in,c_out,expansion,layers # todo setter for expansion
-        self.act_fn, self.pool, self.sa = act_fn, pool, sa
+        self.block, self.act_fn, self.pool, self.sa = block, act_fn, pool, sa
         self.groups = 1
-
         self.stem_sizes = [c_in,32,32,64]
         self.stem_pool = nn.MaxPool2d(kernel_size=3, stride=2, padding=1)
+        self.stem_stride_on = 0
         self.stem_bn_end = False
-        self.block = ResBlock
         self.norm = nn.BatchNorm2d
         self.bn_1st = True
         self.zero_bn=True
@@ -155,16 +155,4 @@ def __call__(self):
         model.extra_repr = lambda : f"model {self.name}"
         return model
     def __repr__(self):
-        return f" constr {self.name}\n expansion: {self.expansion}, sa: {self.sa}, groups: {self.groups}\n stem sizes: {self.stem_sizes}\n body sizes {self.block_szs}"
-
-# Cell
-# me = sys.modules[__name__]
-# for n,e,l in [[ 18 , 1, [2,2,2 ,2] ],
-#     [ 34 , 1, [3,4,6 ,3] ],
-#     [ 50 , 4, [3,4,6 ,3] ],
-#     [ 101, 4, [3,4,23,3] ],
-#     [ 152, 4, [3,8,36,3] ],]:
-#     name = f'net{n}'
-#     setattr(me, name, partial(Net, expansion=e, layers=l, name=name))
-net34  = partial(Net, expansion=1, layers=[3, 4,  6, 3], name='xresnet34')
-net50  = partial(Net, expansion=4, layers=[3, 4,  6, 3], name='xresnet50')
+        return f"{self.name} constructor\n expansion: {self.expansion}, sa: {self.sa}, groups: {self.groups}\n stem sizes: {self.stem_sizes}\n body sizes {self.block_szs}"
diff --git a/model_constructor/yresnet.py b/model_constructor/yresnet.py
@@ -0,0 +1,41 @@
+# AUTOGENERATED! DO NOT EDIT! File to edit: nbs/06_YResnet.ipynb (unless otherwise specified).
+
+__all__ = ['YResBlock', 'yresnet34', 'yresnet50']
+
+# Cell
+import torch.nn as nn
+import sys, torch
+from functools import partial
+from collections import OrderedDict
+from .layers import *
+from .net import Net
+
+# Cell
+# YResBlock (formerly NewResBlock).
+class YResBlock(nn.Module):
+    '''Residual block that, when stride != 1, applies `pool` to its input up front; its convs are built with stride=1 or with no explicit stride.'''
+    def __init__(self, expansion, ni, nh, stride=1,
+                 conv_layer=ConvLayer, act_fn=act_fn, zero_bn=True, bn_1st=True,
+                 pool=nn.AvgPool2d(2, ceil_mode=True), sa=False,sym=False, groups=1):  # default pool is one module object created at def time
+        super().__init__()
+        nf,ni = nh*expansion,ni*expansion  # both the output width (nf) and the input width (ni) are scaled by expansion
+        self.reduce = noop if stride==1 else pool  # stride != 1 -> pool the input; otherwise `noop` from .layers (presumably identity - confirm)
+        layers  = [(f"conv_0", conv_layer(ni, nh, 3, stride=1, act_fn=act_fn, bn_1st=bn_1st)), # stride fixed at 1; spatial reduction is left to self.reduce
+                   (f"conv_1", conv_layer(nh, nf, 3, zero_bn=zero_bn, act=False, bn_1st=bn_1st))
+        ] if expansion == 1 else [  # two-conv stack for expansion == 1, three-conv stack otherwise; `groups` is only used in the latter
+                   (f"conv_0",conv_layer(ni, nh, 1, act_fn=act_fn, bn_1st=bn_1st)),
+                   (f"conv_1",conv_layer(nh, nh, 3, stride=1, act_fn=act_fn, bn_1st=bn_1st, groups=int(nh/groups))), # stride fixed at 1. NOTE(review): int(nh/groups) equals nh when groups==1 - confirm this is the intended grouping
+                   (f"conv_2",conv_layer(nh, nf, 1, zero_bn=zero_bn, act=False, bn_1st=bn_1st))
+        ]
+        if sa: layers.append(('sa', SimpleSelfAttention(nf,ks=1,sym=sym)))  # optional SimpleSelfAttention appended after the last conv
+        self.convs = nn.Sequential(OrderedDict(layers))
+        self.idconv = noop if ni==nf else conv_layer(ni, nf, 1, act=False)  # shortcut gets a conv_layer only when ni != nf
+        self.merge =act_fn  # the act_fn object itself is stored (not copied) and applied after the residual sum in forward
+
+    def forward(self, x):
+        o = self.reduce(x)  # the (possibly pooled) input feeds both the conv path and the shortcut
+        return self.merge(self.convs(o) + self.idconv(o))  # sum the two paths, then apply act_fn
+
+# Cell
+yresnet34  = partial(Net, block=YResBlock, expansion=1, layers=[3, 4,  6, 3], name='yresnet34')  # partial over Net: calling it returns a Net constructor object preset to YResBlock
+yresnet50  = partial(Net, block=YResBlock, expansion=4, layers=[3, 4,  6, 3], name='yresnet50')  # same layer counts as yresnet34, with expansion=4
diff --git a/nbs/04_Net.ipynb b/nbs/04_Net.ipynb
@@ -69,7 +69,6 @@
     "import sys, torch\n",
     "from functools import partial\n",
     "from collections import OrderedDict\n",
-    "\n",
     "from model_constructor.layers import *"
    ]
   },
@@ -496,7 +495,8 @@
     "%nbdev_export\n",
     "def _make_stem(self):\n",
     "        stem = [(f\"conv_{i}\", self.conv_layer(self.stem_sizes[i], self.stem_sizes[i+1], \n",
-    "                    stride=2 if i==0 else 1, \n",
+    "#                     stride=2 if i==0 else 1, \n",
+    "                    stride=2 if i==self.stem_stride_on else 1, \n",
     "                    bn_layer=(not self.stem_bn_end) if i==(len(self.stem_sizes)-2) else True,\n",
     "                    act_fn=self.act_fn, bn_1st=self.bn_1st))\n",
     "                for i in range(len(self.stem_sizes)-1)]\n",
@@ -566,18 +566,18 @@
     "%nbdev_export\n",
     "# v8\n",
     "class Net():\n",
-    "    def __init__(self, expansion=1, layers=[2,2,2,2], c_in=3, c_out=1000, name='Net',\n",
-    "                act_fn=nn.ReLU(inplace=True), pool = nn.AvgPool2d(2, ceil_mode=True), sa=0):\n",
+    "    def __init__(self, expansion=1, layers=[2,2,2,2], c_in=3, c_out=1000, \n",
+    "                 name='Net', block=ResBlock,act_fn=nn.ReLU(inplace=True), \n",
+    "                 pool = nn.AvgPool2d(2, ceil_mode=True), sa=0):\n",
     "        super().__init__()\n",
     "        self.name = name\n",
     "        self.c_in, self.c_out,self.expansion,self.layers = c_in,c_out,expansion,layers # todo setter for expansion\n",
-    "        self.act_fn, self.pool, self.sa = act_fn, pool, sa\n",
+    "        self.block, self.act_fn, self.pool, self.sa = block, act_fn, pool, sa\n",
     "        self.groups = 1\n",
-    "        \n",
     "        self.stem_sizes = [c_in,32,32,64]\n",
     "        self.stem_pool = nn.MaxPool2d(kernel_size=3, stride=2, padding=1)\n",
+    "        self.stem_stride_on = 0\n",
     "        self.stem_bn_end = False\n",
-    "        self.block = ResBlock\n",
     "        self.norm = nn.BatchNorm2d\n",
     "        self.bn_1st = True\n",
     "        self.zero_bn=True\n",
@@ -616,7 +616,7 @@
     "        model.extra_repr = lambda : f\"model {self.name}\"\n",
     "        return model\n",
     "    def __repr__(self):\n",
-    "        return f\" constr {self.name}\\n expansion: {self.expansion}, sa: {self.sa}, groups: {self.groups}\\n stem sizes: {self.stem_sizes}\\n body sizes {self.block_szs}\""
+    "        return f\"{self.name} constructor\\n expansion: {self.expansion}, sa: {self.sa}, groups: {self.groups}\\n stem sizes: {self.stem_sizes}\\n body sizes {self.block_szs}\""
    ]
   },
   {
@@ -636,7 +636,7 @@
     {
      "data": {
       "text/plain": [
-       " constr Net\n",
+       "Net constructor\n",
        " expansion: 1, sa: 0, groups: 1\n",
        " stem sizes: [3, 32, 32, 64]\n",
        " body sizes [64, 64, 128, 256, 512]"
@@ -709,6 +709,45 @@
     "model.stem"
    ]
   },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "Sequential(\n",
+       "  (conv_0): ConvLayer(\n",
+       "    (conv): Conv2d(3, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
+       "    (bn): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
+       "    (act_fn): ReLU(inplace=True)\n",
+       "  )\n",
+       "  (conv_1): ConvLayer(\n",
+       "    (conv): Conv2d(32, 32, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1), bias=False)\n",
+       "    (bn): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
+       "    (act_fn): ReLU(inplace=True)\n",
+       "  )\n",
+       "  (conv_2): ConvLayer(\n",
+       "    (conv): Conv2d(32, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
+       "    (bn): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
+       "    (act_fn): ReLU(inplace=True)\n",
+       "  )\n",
+       "  (stem_pool): MaxPool2d(kernel_size=3, stride=2, padding=1, dilation=1, ceil_mode=False)\n",
+       ")"
+      ]
+     },
+     "execution_count": null,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "%nbdev_collapse_output\n",
+    "model.stem_stride_on = 1\n",
+    "model.stem"
+   ]
+  },
   {
    "cell_type": "code",
    "execution_count": null,
@@ -1112,12 +1151,12 @@
       "text/plain": [
        "Sequential(\n",
        "  (conv_0): ConvLayer(\n",
-       "    (conv): Conv2d(3, 32, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1), bias=False)\n",
+       "    (conv): Conv2d(3, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
        "    (act_fn): LeakyReLU(negative_slope=0.01, inplace=True)\n",
        "    (bn): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
        "  )\n",
        "  (conv_1): ConvLayer(\n",
-       "    (conv): Conv2d(32, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
+       "    (conv): Conv2d(32, 32, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1), bias=False)\n",
        "    (act_fn): LeakyReLU(negative_slope=0.01, inplace=True)\n",
        "    (bn): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
        "  )\n",
@@ -1238,12 +1277,12 @@
        "  model Net\n",
        "  (stem): Sequential(\n",
        "    (conv_0): ConvLayer(\n",
-       "      (conv): Conv2d(3, 32, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1), bias=False)\n",
+       "      (conv): Conv2d(3, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
        "      (act_fn): LeakyReLU(negative_slope=0.01, inplace=True)\n",
        "      (bn): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
        "    )\n",
        "    (conv_1): ConvLayer(\n",
-       "      (conv): Conv2d(32, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)\n",
+       "      (conv): Conv2d(32, 32, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1), bias=False)\n",
        "      (act_fn): LeakyReLU(negative_slope=0.01, inplace=True)\n",
        "      (bn): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)\n",
        "    )\n",
@@ -1682,30 +1721,25 @@
     "assert y.shape == torch.Size([bs_test, 1000]), f\"size expected {bs_test}, 1000\""
    ]
   },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "## xresnet constructor"
-   ]
-  },
   {
    "cell_type": "code",
    "execution_count": null,
    "metadata": {},
    "outputs": [],
    "source": [
-    "%nbdev_export\n",
-    "# me = sys.modules[__name__]\n",
-    "# for n,e,l in [[ 18 , 1, [2,2,2 ,2] ],\n",
-    "#     [ 34 , 1, [3,4,6 ,3] ],\n",
-    "#     [ 50 , 4, [3,4,6 ,3] ],\n",
-    "#     [ 101, 4, [3,4,23,3] ],\n",
-    "#     [ 152, 4, [3,8,36,3] ],]:\n",
-    "#     name = f'net{n}'\n",
-    "#     setattr(me, name, partial(Net, expansion=e, layers=l, name=name))\n",
-    "net34  = partial(Net, expansion=1, layers=[3, 4,  6, 3], name='xresnet34')\n",
-    "net50  = partial(Net, expansion=4, layers=[3, 4,  6, 3], name='xresnet50')"
+    "## xresnet constructor\n",
+    "\n",
+    "# %nbdev_export\n",
+    "# # me = sys.modules[__name__]\n",
+    "# # for n,e,l in [[ 18 , 1, [2,2,2 ,2] ],\n",
+    "# #     [ 34 , 1, [3,4,6 ,3] ],\n",
+    "# #     [ 50 , 4, [3,4,6 ,3] ],\n",
+    "# #     [ 101, 4, [3,4,23,3] ],\n",
+    "# #     [ 152, 4, [3,8,36,3] ],]:\n",
+    "# #     name = f'net{n}'\n",
+    "# #     setattr(me, name, partial(Net, expansion=e, layers=l, name=name))\n",
+    "# net34  = partial(Net, expansion=1, layers=[3, 4,  6, 3], name='xresnet34')\n",
+    "# net50  = partial(Net, expansion=4, layers=[3, 4,  6, 3], name='xresnet50')"
    ]
   },
   {
@@ -1714,7 +1748,7 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "m = net50(c_out=10)"
+    "# m = net50(c_out=10)"
    ]
   },
   {
@@ -1738,7 +1772,7 @@
     }
    ],
    "source": [
-    "m, m.c_out"
+    "# m, m.c_out"
    ]
   },
   {
@@ -1765,6 +1799,7 @@
       "Converted 03_xresnet.ipynb.\n",
       "Converted 04_Net.ipynb.\n",
       "Converted 05_Twist.ipynb.\n",
+      "Converted 06_YResnet.ipynb.\n",
       "Converted index.ipynb.\n"
      ]
     }
diff --git a/nbs/06_YResnet.ipynb b/nbs/06_YResnet.ipynb

Original file line number	Diff line number	Diff line change
`@@ -1 +1 @@`
`1`		`-__version__ = "0.1.1"`
	`1`	`+__version__ = "0.1.4"`