Skip to content

Commit 14d72cb

Browse files
committed
docs and fixes at models
1 parent 2bd255a commit 14d72cb

22 files changed

+4247
-2755
lines changed

Nbs/001_Blocks.ipynb

Lines changed: 453 additions & 0 deletions
Large diffs are not rendered by default.

Nbs/00_ModelConstructor.ipynb

Lines changed: 152 additions & 590 deletions
Large diffs are not rendered by default.

Nbs/01_layers.ipynb

Lines changed: 58 additions & 97 deletions
Large diffs are not rendered by default.

Nbs/02_XResNet.ipynb

Lines changed: 903 additions & 0 deletions
Large diffs are not rendered by default.

Nbs/03_MXResNet.ipynb

Lines changed: 128 additions & 102 deletions
Large diffs are not rendered by default.

Nbs/04_YaResNet.ipynb

Lines changed: 577 additions & 118 deletions
Large diffs are not rendered by default.

Nbs/05_Twist.ipynb

Lines changed: 20 additions & 69 deletions
Original file line numberDiff line numberDiff line change
@@ -18,27 +18,9 @@
1818
"#hide\n",
1919
"import torch\n",
2020
"import torch.nn as nn\n",
21-
"import torch.nn.functional as F\n",
22-
"import numpy as np\n",
23-
"from collections import OrderedDict\n",
2421
"\n",
2522
"from model_constructor.net import Net\n",
26-
"from model_constructor.layers import ConvLayer, noop, act_fn, SimpleSelfAttention\n",
27-
"\n",
28-
"from nbdev.showdoc import show_doc\n",
29-
"from IPython.display import Markdown, display"
30-
]
31-
},
32-
{
33-
"cell_type": "code",
34-
"execution_count": null,
35-
"metadata": {},
36-
"outputs": [],
37-
"source": [
38-
"# hide\n",
39-
"def print_doc(func_name):\n",
40-
" doc = show_doc(func_name, title_level=4, disp=False)\n",
41-
" display(Markdown(doc))"
23+
"from model_constructor.layers import ConvLayer\n"
4224
]
4325
},
4426
{
@@ -57,16 +39,6 @@
5739
"from model_constructor.twist import ConvTwist"
5840
]
5941
},
60-
{
61-
"cell_type": "code",
62-
"execution_count": null,
63-
"metadata": {},
64-
"outputs": [],
65-
"source": [
66-
"# hide_input\n",
67-
"# print_doc(ConvTwist)"
68-
]
69-
},
7042
{
7143
"cell_type": "code",
7244
"execution_count": null,
@@ -150,7 +122,7 @@
150122
}
151123
],
152124
"source": [
153-
"ConvTwist(64,64)"
125+
"ConvTwist(64, 64)"
154126
]
155127
},
156128
{
@@ -175,7 +147,7 @@
175147
"source": [
176148
"ConvTwist.twist = True\n",
177149
"ConvTwist.permute = False\n",
178-
"ConvTwist(64,64)"
150+
"ConvTwist(64, 64)"
179151
]
180152
},
181153
{
@@ -219,7 +191,7 @@
219191
}
220192
],
221193
"source": [
222-
"ConvLayerTwist(64,64, stride=1)"
194+
"ConvLayerTwist(64, 64, stride=1)"
223195
]
224196
},
225197
{
@@ -558,16 +530,6 @@
558530
"from model_constructor.twist import NewResBlockTwist"
559531
]
560532
},
561-
{
562-
"cell_type": "code",
563-
"execution_count": null,
564-
"metadata": {},
565-
"outputs": [],
566-
"source": [
567-
"# hide_input\n",
568-
"# print_doc(NewResBlockTwist)"
569-
]
570-
},
571533
{
572534
"cell_type": "code",
573535
"execution_count": null,
@@ -610,7 +572,7 @@
610572
],
611573
"source": [
612574
"#collapse_output\n",
613-
"bl = NewResBlockTwist(4,64,64,sa=True)\n",
575+
"bl = NewResBlockTwist(4, 64, 64, sa=True)\n",
614576
"bl"
615577
]
616578
},
@@ -676,7 +638,7 @@
676638
],
677639
"source": [
678640
"#collapse_output\n",
679-
"bl = NewResBlockTwist(4,64,64,stride=2)\n",
641+
"bl = NewResBlockTwist(4, 64, 64, stride=2)\n",
680642
"bl"
681643
]
682644
},
@@ -746,7 +708,7 @@
746708
],
747709
"source": [
748710
"#collapse_output\n",
749-
"bl = NewResBlockTwist(4,64,128,stride=2)\n",
711+
"bl = NewResBlockTwist(4, 64, 128, stride=2)\n",
750712
"bl"
751713
]
752714
},
@@ -806,7 +768,7 @@
806768
],
807769
"source": [
808770
"#hide\n",
809-
"bl = NewResBlockTwist(1,64,64,sa=True)\n",
771+
"bl = NewResBlockTwist(1, 64, 64, sa=True)\n",
810772
"bl"
811773
]
812774
},
@@ -876,7 +838,14 @@
876838
],
877839
"source": [
878840
"#collapse_output\n",
879-
"bl = NewResBlockTwist(4,64,128,stride=2,act_fn=nn.LeakyReLU(), bn_1st=False)\n",
841+
"bl = NewResBlockTwist(\n",
842+
" 4,\n",
843+
" 64,\n",
844+
" 128,\n",
845+
" stride=2,\n",
846+
" act_fn=nn.LeakyReLU(),\n",
847+
" bn_1st=False,\n",
848+
")\n",
880849
"bl"
881850
]
882851
},
@@ -918,16 +887,6 @@
918887
"from model_constructor.twist import ResBlockTwist"
919888
]
920889
},
921-
{
922-
"cell_type": "code",
923-
"execution_count": null,
924-
"metadata": {},
925-
"outputs": [],
926-
"source": [
927-
"#hide_input\n",
928-
"# print_doc(ResBlockTwist)"
929-
]
930-
},
931890
{
932891
"cell_type": "code",
933892
"execution_count": null,
@@ -970,7 +929,7 @@
970929
],
971930
"source": [
972931
"#collapse_output\n",
973-
"bl = ResBlockTwist(4,64,64,sa=True)\n",
932+
"bl = ResBlockTwist(4, 64, 64, sa=True)\n",
974933
"bl"
975934
]
976935
},
@@ -1036,7 +995,7 @@
1036995
],
1037996
"source": [
1038997
"#collapse_output\n",
1039-
"bl = ResBlockTwist(4,64,64,stride=2)\n",
998+
"bl = ResBlockTwist(4, 64, 64, stride=2)\n",
1040999
"bl"
10411000
]
10421001
},
@@ -1106,7 +1065,7 @@
11061065
],
11071066
"source": [
11081067
"#collapse_output\n",
1109-
"bl = ResBlockTwist(4,64,128,stride=2)\n",
1068+
"bl = ResBlockTwist(4, 64, 128, stride=2)\n",
11101069
"bl"
11111070
]
11121071
},
@@ -1145,7 +1104,7 @@
11451104
"metadata": {},
11461105
"outputs": [],
11471106
"source": [
1148-
"model = Net(expansion=4, layers=[3,4,6,3])"
1107+
"model = Net(expansion=4, layers=[3, 4, 6, 3])"
11491108
]
11501109
},
11511110
{
@@ -1569,14 +1528,6 @@
15691528
"text": [
15701529
"torch.Size([16, 64, 32, 32])\n"
15711530
]
1572-
},
1573-
{
1574-
"name": "stderr",
1575-
"output_type": "stream",
1576-
"text": [
1577-
"/home/jzz/anaconda3/envs/mc_dev/lib/python3.9/site-packages/torch/nn/functional.py:718: UserWarning: Named tensors and all their associated APIs are an experimental feature and subject to change. Please do not use them for anything important until they are released as stable. (Triggered internally at /opt/conda/conda-bld/pytorch_1623448255797/work/c10/core/TensorImpl.h:1156.)\n",
1578-
" return torch.max_pool2d(input, kernel_size, stride, padding, dilation, ceil_mode)\n"
1579-
]
15801531
}
15811532
],
15821533
"source": [

0 commit comments

Comments
 (0)