(구현) Rethinking the inception Architecture for computer vision

Notice

Recent Posts

Recent Comments

Link

12-20 07:43

« 2024/12 »
일	월	화	수	목	금	토
1	2	3	4	5	6	7
8	9	10	11	12	13	14
15	16	17	18	19	20	21
22	23	24	25	26	27	28
29	30	31

Tags more

Archives

Today

Total

관리 메뉴

AI 전문가가 되고싶은 사람

(구현) Rethinking the inception Architecture for computer vision 본문

논문

(구현) Rethinking the inception Architecture for computer vision

Kimseungwoo0407 2024. 9. 10. 15:43

참고 사이트 : https://medium.com/@AnasBrital98/inception-v3-cnn-architecture-explained-691cfb7bba08

Inception V3 CNN Architecture Explained .

Inception-V3 CNN Architecture illustrated and Implemented in both Keras and PyTorch .

medium.com

코드가 길어보여서 처음에는 걱정이 되었지만, 직접 작성해보니 의외로 이해하기 어렵지 않았다. 코드를 하나하나 작성하면서 각 부분의 역할을 명확히 파악할 수 있었고, 전체적인 흐름도 자연스럽게 이해할 수 있었다. 이런 과정을 통해 코드의 구조와 작동 방식에 대한 감을 잡게 된 것 같다.

import torch.nn as nn
import torch
import torch.nn.functional as F

class ConvolutionBlock(nn.Module):
    def __init__(self, in_channels, out_channels, kernel_size, stride, padding):
        super(ConvolutionBlock,self).__init__()
        self.conv = nn.Conv2d(in_channels, out_channels, kernel_size, stride, padding)
        self.batchNormalization = nn.BatchNorm2d(out_channels)
        self.activation =nn.ReLU()
    
    def forward(self, x):
        out = self.conv(x)
        out = self.batchNormalization(out)
        out = self.activation(out)
        return out

class StemBlock(nn.Module):
    def __init__(self):
        super(StemBlock, self).__init__()

        self.conv1 = ConvolutionBlock(3,32,3,2,0)
        self.conv2 = ConvolutionBlock(32,32,3,1,0)
        self.conv3 = ConvolutionBlock(32,64,3,1,1)
        self.conv4 = ConvolutionBlock(64,80,3,1,0)
        self.conv5 = ConvolutionBlock(80,192,3,1,0)
        self.maxPool = nn.MaxPool2d(kernel_size=(3,3), stride=(2,2))

    
    def forward(self, x):
        out = self.conv1(x)
        out = self.conv2(out)
        out = self.conv3(out)
        out = self.maxPool(out)
        out = self.conv4(out)
        out = self.conv5(out)
        out = self.maxPool(out)
        return out

class InceptionBlock_A(nn.Module):
    def __init__(self, in_channels, nbr_kernels):
        super(InceptionBlock_A,self).__init__()

        # 1x1 합성곱 후 3x3 합성곱 2번
        self.branch1 = nn.Sequential(
            ConvolutionBlock(in_channels, 64, 1, 1, 0),
            ConvolutionBlock(64, 96, 3, 1, 1),
            ConvolutionBlock(96, 96, 3, 1, 1)
        )
        # 1x1 합성곱 후 3x3 합성곱
        self.branch2 = nn.Sequential(
            ConvolutionBlock(in_channels, 48, 1, 1, 0),
            ConvolutionBlock(48, 64, 3, 1, 1)
        )
        # 3x3 평균 풀링 후 1x1 합성곱
        self.branch3 = nn.Sequential(
            nn.AvgPool2d(kernel_size=(3,3), stride=1, padding=1),
            ConvolutionBlock(in_channels, 64, 1, 1, 0)
        )
        # 1x1 합성곱
        self.branch4 = ConvolutionBlock(in_channels, 64, 1, 1, 0)

    def forward(self,x):
        branch1 = self.branch1(x)
        branch2 = self.branch2(x)
        branch3 = self.branch3(x)
        branch4 = self.branch4(x)

        out = torch.cat([branch1, branch2, branch3, branch4],1)

        return out

class InceptionBlock_B(nn.Module):
    def __init__(self, in_channels, nbr_kernels):
        super(InceptionBlock_B, self).__init__()

        self.branch1 = nn.Sequential(
            ConvolutionBlock(in_channels, 192, 1, 1, 0)
        )
        self.branch2 = nn.Sequential(
            ConvolutionBlock(in_channels, nbr_kernels, 1, 1, 0),
            ConvolutionBlock(nbr_kernels, nbr_kernels, (1,7), 1, (0,3)),
            ConvolutionBlock(nbr_kernels, 192, (7,1), 1, (3,0))
        )
        self.branch3 = nn.Sequential(
            ConvolutionBlock(in_channels, nbr_kernels, 1, 1, 0),
            ConvolutionBlock(nbr_kernels, nbr_kernels, (7,1), 1, (0,3)),
            ConvolutionBlock(nbr_kernels, nbr_kernels, (1,7), 1, (3,0)),
            ConvolutionBlock(nbr_kernels, nbr_kernels, (7,1), 1, (0,3)),
            ConvolutionBlock(nbr_kernels, 192, (1,7), 1, (3,0))
        )
        self.branch4 = nn.Sequential(
            nn.AvgPool2d(kernel_size=(3,3), stride=1, padding=1),
            ConvolutionBlock(in_channels, 192, 1, 1, 0)
        )
    
    def forward(self, x):
        branch1 = self.branch1(x)
        branch2 = self.branch2(x)
        branch3 = self.branch3(x)
        branch4 = self.branch4(x)
    
        out = torch.cat([branch1,branch2,branch3,branch4],1)

        return out

class InceptionBlock_C(nn.Module):
    def __init__(self,in_channels, nbr_kernels):
        super(InceptionBlock_C, self).__init__()

        self.branch1 = nn.Sequential(
            ConvolutionBlock(in_channels, 320, 1, 1, 0)
        )
        self.branch2 = nn.Sequential(
            nn.AvgPool2d(kernel_size=(3,3), stride=1, padding=1),
            ConvolutionBlock(in_channels, 192, 1, 1, 0)
        )
        self.branch3 = nn.Sequential(
            ConvolutionBlock(in_channels, 384, 1, 1, 0)
        )
        self.branch3_1 = nn.Sequential(
            ConvolutionBlock(384, 384, (1,3), 1, (0,1))
        )
        self.branch3_2 = nn.Sequential(
            ConvolutionBlock(384, 384, (3,1), 1, (1,0))
        )
        self.branch4 = nn.Sequential(
            ConvolutionBlock(in_channels, 448, 1,1,0),
            ConvolutionBlock(448, 384, 3, 1, 1)
        )
        self.branch4_1 = nn.Sequential(
            ConvolutionBlock(384, 384, (1,3) , 1, (0,1))
        )
        self.branch4_2 = nn.Sequential(
            ConvolutionBlock(384, 384, (3,1), 1, (1,0))
        )
    
    def forward(self, x):
        branch1 = self.branch1(x)
        branch2 = self.branch2(x)
        branch3 = self.branch3(x)
        branch3 = torch.cat([self.branch3_1(branch3), self.branch3_2(branch3)],1)

        branch4 = self.branch4(x)
        branch4_1 = self.branch4_1(branch4)
        branch4_2 = self.branch4_2(branch4)
        branch4 = torch.cat([branch4_1, branch4_2],1)
        
        out = torch.cat([branch1, branch2, branch3, branch4], 1)

        return out

class ReductionBlock_A(nn.Module):
    def __init__(self, in_channels):

        super(ReductionBlock_A, self).__init__()

        self.branch1 = nn.Sequential(
            ConvolutionBlock(in_channels, 64, 1, 1, 0),
            ConvolutionBlock(64, 96, 3, 1, 1),
            ConvolutionBlock(96, 96, 3, 2, 0)
        )
        self.branch2 = nn.Sequential(
            ConvolutionBlock(in_channels, 384, 3, 2, 0)
        )
        self.branch3 = nn.Sequential(
            nn.MaxPool2d(kernel_size=(3,3), stride=2, padding=0)
        )
    
    def forward(self, x):
        branch1 = self.branch1(x)
        branch2 = self.branch2(x)
        branch3 = self.branch3(x)

        out = torch.cat([branch1, branch2, branch3], 1)

        return out
    
class ReductionBlock_B(nn.Module):
    
    def __init__(self, in_channels):
        super(ReductionBlock_B, self).__init__()

        self.branch1 = nn.Sequential(
            ConvolutionBlock(in_channels, 192, 1, 1, 0),
            ConvolutionBlock(192, 192, (1,7), 1, (0,3)),
            ConvolutionBlock(192, 192, (7,1), 1, (3,0)),
            ConvolutionBlock(192, 192, 3, 2, 0)
        )

        self.branch2 = nn.Sequential(
            ConvolutionBlock(in_channels, 192, 1, 1, 0),
            ConvolutionBlock(192, 192, 3, 1, 0)
        )

        self.branch3 = nn.Sequential(
            nn.MaxPool2d(kernel_size=(3,3), stride=2)
        )
    
    def forward(self, x):
        branch1 = self.branch1(x)
        branch2 = self.branch2(x)
        branch3 = self.branch3(x)

        out = torch.cat([branch1, branch2, branch3], 1)

        return out

class Aux_Block(nn.Module):

    def __init__(self, in_channels):
        super(Aux_Block, self).__init__()

        self.avgPool = nn.AvgPool2d(kernel_size=(5,5), stride=3, padding=0)
        self.conv1 = ConvolutionBlock(in_channels, 128, 1, 1, 0)
        self.conv2 = ConvolutionBlock(128, 768, 5, 1, 0)
        self.fc1 = nn.Linear(in_features= 768, out_features= 1024)
        self.fc2 = nn.Linear(in_features= 1024, out_features = 1000)

    def forward(self, x):
        out = self.avgPool(x)
        out = self.conv1(out)
        out = self.conv2(out)
        out = torch.flatten(out,1)
        out = self.fc1(out)
        out = nn.ReLU()(out)
        out = self.fc2(out)
        out = nn.Softmax()(out)

        return out

class InceptionV3(nn.Module):
    def __init__(self):
        super(InceptionV3, self).__init__()
        self.stem = StemBlock()

        self.inceptionA_1 = InceptionBlock_A(192, 32)
        self.inceptionA_2 = InceptionBlock_A(288, 64)
        self.inceptionA_3 = InceptionBlock_A(288, 64)

        self.reductionA = ReductionBlock_A(288)

        self.inceptionB_1 = InceptionBlock_B(768, 128)
        self.inceptionB_2 = InceptionBlock_B(768, 160)
        self.inceptionB_3 = InceptionBlock_B(768, 160)
        self.inceptionB_4 = InceptionBlock_B(768, 192)

        self.aux = Aux_Block(768)

        self.reductionB = ReductionBlock_B(768)
        
        self.inceptionC_1 = InceptionBlock_C(1280)
        self.inceptionC_2 = InceptionBlock_C(2048)

        self.avgpool = nn.AdaptiveAvgPool2d((1,1))
        self.fc1 = nn.Linear(in_features=2048, out_features= 2048)
        self.fc2 = nn.Linear(in_features=2048, out_features=1000)

    def forward(self,x):
        out = self.stem(x)

        out = self.inceptionA_1(out)
        out = self.inceptionA_2(out)
        out = self.inceptionA_3(out)

        out = self.reductionA(out)

        out = self.inceptionB_1(out)
        out = self.inceptionB_2(out)
        out = self.inceptionB_3(out)
        out = self.inceptionB_4(out)

        aux = self.aux(out)

        out = self.reductionB(out)

        out = self.inceptionC_1(out)
        out = self.inceptionC_2(out)

        out = self.avgpool(out)
        out = out.reshape(out.shape[0], -1)

        out = self.fc1(out)
        out = nn.ReLU()(out)

        out = self.fc2(out)
        out = nn.ReLU()(out)

        return out, aux

'논문' 카테고리의 다른 글

(구현) Deep Residual Learning for Image Recognition (0)	2024.09.12
(공부용) Deep Residual Learning for Image Recognition (4)	2024.09.11
(공부용) Rethinking the inception Architecture for computer vision (2)	2024.09.09
(구현) VERY DEEP CONVOLUTIONAL NETWORKS FOR LARGE-SCALE IMAGE RECOGNITION (0)	2024.09.09
(공부용) VERY DEEP CONVOLUTIONAL NETWORKSFOR LARGE-SCALE IMAGE RECOGNITION (2)	2024.09.07

'논문' Related Articles

AI 전문가가 되고싶은 사람

(구현) Rethinking the inception Architecture for computer vision 본문

(구현) Rethinking the inception Architecture for computer vision

'논문' 카테고리의 다른 글

티스토리툴바