'''
ResNet in PyTorch.

Reference:
[1] Kaiming He, Xiangyu Zhang, Shaoqing Ren, Jian Sun
    Deep Residual Learning for Image Recognition. arXiv:1512.03385
'''
import torch
import torch.nn as nn
class BasicBlock(nn.Module):
    """
    The basic residual block used by the shallower networks (ResNet-18/34).
    It performs no channel compression, so expansion = 1.
    """
    expansion = 1
    def __init__(self, in_channels, out_channels, stride=1):
        super(BasicBlock, self).__init__()
        self.features = nn.Sequential(
            nn.Conv2d(in_channels, out_channels, kernel_size=3, stride=stride, padding=1, bias=False),
            nn.BatchNorm2d(out_channels),
            nn.ReLU(inplace=True),
            nn.Conv2d(out_channels, out_channels, kernel_size=3, stride=1, padding=1, bias=False),
            nn.BatchNorm2d(out_channels)
        )
        # If the input and output dimensions differ, use a 1x1 convolution
        # on the shortcut path to match them.
        self.shortcut = nn.Sequential()
        if stride != 1 or in_channels != self.expansion * out_channels:
            self.shortcut = nn.Sequential(
                nn.Conv2d(in_channels, self.expansion * out_channels, kernel_size=1, stride=stride, bias=False),
                nn.BatchNorm2d(self.expansion * out_channels),
            )
    def forward(self, x):
        out = self.features(x)
        out += self.shortcut(x)
        out = torch.relu(out)
        return out

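# A quick shape sanity check for BasicBlock (an illustrative sketch; the
# 32x32 input size matches the CIFAR-10 setting used below):
#   block = BasicBlock(64, 128, stride=2)
#   y = block(torch.randn(1, 64, 32, 32))  # y.shape == (1, 128, 16, 16)
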
class Bottleneck(nn.Module):
    """
    The bottleneck block used by the deeper networks (ResNet-50/101/152). The
    paper notes it has similar computational complexity to the basic block
    while saving considerable resources.
    zip_channels: the compressed width; the block's final output width is
    expansion * zip_channels. In ResNet-50/101/152 the third conv layer has
    4x the channels of the second, hence expansion = 4.
    """
    expansion = 4

    def __init__(self, in_channels, zip_channels, stride=1):
        super(Bottleneck, self).__init__()
        out_channels = self.expansion * zip_channels
        self.features = nn.Sequential(
            nn.Conv2d(in_channels, zip_channels, kernel_size=1, bias=False),
            nn.BatchNorm2d(zip_channels),
            nn.ReLU(inplace=True),
            nn.Conv2d(zip_channels, zip_channels, kernel_size=3, stride=stride, padding=1, bias=False),
            nn.BatchNorm2d(zip_channels),
            nn.ReLU(inplace=True),
            nn.Conv2d(zip_channels, out_channels, kernel_size=1, bias=False),
            nn.BatchNorm2d(out_channels)
        )
        self.shortcut = nn.Sequential()
        if stride != 1 or in_channels != out_channels:
            self.shortcut = nn.Sequential(
                nn.Conv2d(in_channels, out_channels, kernel_size=1, stride=stride, bias=False),
                nn.BatchNorm2d(out_channels)
            )

    def forward(self, x):
        out = self.features(x)
        out += self.shortcut(x)
        out = torch.relu(out)
        return out

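# An illustrative sketch of the bottleneck's channel expansion:
# Bottleneck(64, 64) compresses to 64 channels internally and emits
# expansion * 64 = 256 channels:
#   block = Bottleneck(64, 64, stride=1)
#   y = block(torch.randn(1, 64, 32, 32))  # y.shape == (1, 256, 32, 32)
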
class ResNet(nn.Module):
    """
    Every ResNet variant shares the same skeleton: one stem convolution for
    feature extraction followed by four residual stages; the variants differ
    only in the depth of each stage. For CIFAR-10 with the BasicBlock
    variants, the feature map sizes evolve as follows:
    (32, 32, 3) -> [Conv2d] -> (32, 32, 64) -> [Res1] -> (32, 32, 64) -> [Res2]
    -> (16, 16, 128) -> [Res3] -> (8, 8, 256) -> [Res4] -> (4, 4, 512) -> [AvgPool]
    -> (1, 1, 512) -> [Reshape] -> (512) -> [Linear] -> (10)
    """
    def __init__(self, block, num_blocks, num_classes=10, verbose=False):
        super(ResNet, self).__init__()
        self.verbose = verbose
        self.in_channels = 64
        self.features = nn.Sequential(
            nn.Conv2d(3, 64, kernel_size=3, stride=1, padding=1, bias=False),
            nn.BatchNorm2d(64),
            nn.ReLU(inplace=True)
        )
        # Build the conv2_x, conv3_x, conv4_x, and conv5_x stages from the
        # paper's architecture table with _make_layer.
        self.layer1 = self._make_layer(block, 64, num_blocks[0], stride=1)
        self.layer2 = self._make_layer(block, 128, num_blocks[1], stride=2)
        self.layer3 = self._make_layer(block, 256, num_blocks[2], stride=2)
        self.layer4 = self._make_layer(block, 512, num_blocks[3], stride=2)
        # After the stages above, a CIFAR-10 feature map is
        # 4 x 4 x (512 * expansion), so a 4 x 4 average pooling is used here.
        self.avg_pool = nn.AvgPool2d(kernel_size=4)
        self.classifier = nn.Linear(512 * block.expansion, num_classes)

    def _make_layer(self, block, out_channels, num_blocks, stride):
        # Only the first block of a stage downsamples; the rest keep stride 1.
        strides = [stride] + [1] * (num_blocks - 1)
        layers = []
        for stride in strides:
            layers.append(block(self.in_channels, out_channels, stride))
            # Bottleneck blocks compress and then re-expand their channels,
            # so the input width of the next block must track the expansion.
            self.in_channels = out_channels * block.expansion
        return nn.Sequential(*layers)

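    # Illustrative trace: for ResNet-50's conv3_x stage,
    # _make_layer(Bottleneck, 128, 4, stride=2) builds blocks with strides
    # [2, 1, 1, 1], so only the first block halves the spatial size.
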
    def forward(self, x):
        out = self.features(x)
        if self.verbose:
            print('block 1 output: {}'.format(out.shape))
        out = self.layer1(out)
        if self.verbose:
            print('block 2 output: {}'.format(out.shape))
        out = self.layer2(out)
        if self.verbose:
            print('block 3 output: {}'.format(out.shape))
        out = self.layer3(out)
        if self.verbose:
            print('block 4 output: {}'.format(out.shape))
        out = self.layer4(out)
        if self.verbose:
            print('block 5 output: {}'.format(out.shape))
        out = self.avg_pool(out)
        out = out.view(out.size(0), -1)
        out = self.classifier(out)
        return out

def ResNet18(verbose=False):
    return ResNet(BasicBlock, [2, 2, 2, 2], verbose=verbose)

def ResNet34(verbose=False):
    return ResNet(BasicBlock, [3, 4, 6, 3], verbose=verbose)

def ResNet50(verbose=False):
    return ResNet(Bottleneck, [3, 4, 6, 3], verbose=verbose)

def ResNet101(verbose=False):
    return ResNet(Bottleneck, [3, 4, 23, 3], verbose=verbose)

def ResNet152(verbose=False):
    return ResNet(Bottleneck, [3, 8, 36, 3], verbose=verbose)

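# Usage sketch: with verbose=True the forward pass prints each stage's output
# shape, e.g. ResNet50(verbose=True) on a (1, 3, 32, 32) input reports
# "block 2 output: torch.Size([1, 256, 32, 32])" after the first stage.
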
def test():
    net = ResNet34()
    x = torch.randn(2, 3, 32, 32)
    y = net(x)
    print(y.size())
    # torchinfo is an optional dependency, used only for this summary.
    from torchinfo import summary
    device = 'cuda' if torch.cuda.is_available() else 'cpu'
    net = net.to(device)
    summary(net, (2, 3, 32, 32))

if __name__ == '__main__':
    test()