Pytorch how and when to use Module Sequential ModuleList and ModuleDict Download - Pytorch how and when to use Module Sequential ModuleList and ModuleDict ดาวน์โหลดซอร์สโค้ด

ภาษาไทย

中文(简体) 中文(繁体) 한국어 日本語 English Português Español Русский العربية Indonesia Deutsch Français ภาษาไทย

หน้าแรก>การเขียนโปรแกรมที่เกี่ยวข้อง>โค้ดแหล่งที่มา AI

Pytorch how and when to use Module Sequential ModuleList and ModuleDict

โค้ดแหล่งที่มา AI

1.0.0

ดาวน์โหลด

Pytorch: อย่างไรและเมื่อใดจึงจะใช้ Module, Sequential, ModuleList และ ModuleDict

วิธีที่มีประสิทธิภาพในการแชร์ นำมาใช้ซ้ำ และสลายความซับซ้อนของโมเดลของคุณ

อัปเดตที่ Pytorch 1.5.1

คุณสามารถค้นหารหัสได้ที่นี่

PyTorch เป็นเฟรมเวิร์กการเรียนรู้เชิงลึกแบบโอเพ่นซอร์สที่ให้วิธีที่ชาญฉลาดในการสร้างโมเดล ML แม้ว่าเอกสารประกอบจะจัดทำมาอย่างดี แต่ฉันก็ยังเห็นว่าคนส่วนใหญ่ยังเขียนโค้ด PyTorch ได้ไม่ดีและไม่เป็นระเบียบ

วันนี้เราจะมาดูวิธีใช้ Building Block หลักสี่ประการของ PyTorch: Module, Sequential, ModuleList และ ModuleDict เราจะเริ่มต้นด้วยตัวอย่างหนึ่งแล้วค่อยๆ ปรับปรุงให้ดีขึ้นทีละขั้น

ทั้งสี่คลาสนี้รวมอยู่ใน torch.nn

 import torch . nn as nn

# nn.Module
# nn.Sequential
# nn.ModuleList
# nn.ModuleDict

โมดูล: โครงสร้างหลัก

โมดูลเป็นส่วนประกอบหลัก โดยจะกำหนดคลาสพื้นฐานสำหรับโครงข่ายประสาทเทียมทั้งหมด และคุณต้องซับคลาสนั้น

มาสร้างตัวแยกประเภท CNN แบบคลาสสิกเป็นตัวอย่าง:

 import torch . nn . functional as F

class MyCNNClassifier(nn.Module):
    """Plain CNN classifier: two conv/batch-norm/ReLU stages and two linear layers.

    Args:
        in_c: number of channels of the input images.
        n_classes: number of scores produced by the last linear layer.

    The first linear layer takes 64 * 28 * 28 features and the convolutions
    (3x3, stride 1, padding 1) keep the spatial size, so inputs are expected
    to be 28x28 images.
    """

    def __init__(self, in_c, n_classes):
        super().__init__()
        conv_opts = dict(kernel_size=3, stride=1, padding=1)

        # Convolutional stages; the activation is applied in forward().
        self.conv1 = nn.Conv2d(in_c, 32, **conv_opts)
        self.bn1 = nn.BatchNorm2d(32)
        self.conv2 = nn.Conv2d(32, 64, **conv_opts)
        self.bn2 = nn.BatchNorm2d(64)

        # Fully connected head.
        self.fc1 = nn.Linear(64 * 28 * 28, 1024)
        self.fc2 = nn.Linear(1024, n_classes)

    def forward(self, x):
        """Return the un-activated class scores, shape (batch, n_classes)."""
        x = F.relu(self.bn1(self.conv1(x)))
        x = F.relu(self.bn2(self.conv2(x)))

        # Collapse everything except the batch dimension.
        flat = x.view(x.size(0), -1)

        hidden = F.sigmoid(self.fc1(flat))
        return self.fc2(hidden)

 # Instantiate the classifier for 1-channel inputs and 10 classes, then print its layer tree.
 model = MyCNNClassifier ( 1 , 10 )
print ( model )

 MyCNNClassifier(
  (conv1): Conv2d(1, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
  (bn1): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (conv2): Conv2d(32, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
  (bn2): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (fc1): Linear(in_features=50176, out_features=1024, bias=True)
  (fc2): Linear(in_features=1024, out_features=10, bias=True)
)

นี่เป็นตัวแยกประเภท (classifier) ที่เรียบง่ายมาก ประกอบด้วยส่วนเข้ารหัสที่มีสองเลเยอร์ ซึ่งแต่ละเลเยอร์คือ 3x3 conv + batchnorm + relu และส่วนถอดรหัสที่มีเลเยอร์เชิงเส้นสองชั้น หากคุณไม่ใช่มือใหม่ใน PyTorch คุณอาจเคยเห็นการเขียนโค้ดประเภทนี้มาก่อน แต่มีปัญหาสองประการ

หากเราต้องการเพิ่มเลเยอร์ เราต้องเขียนโค้ดจำนวนมากอีกครั้งใน __init__ และในฟังก์ชัน forward นอกจากนี้ หากเรามีบล็อกทั่วไปที่เราต้องการใช้ในโมเดลอื่น เช่น 3x3 Conv + Batchnorm + Relu เราจะต้องเขียนมันอีกครั้ง

Sequential: ซ้อนและรวมเลเยอร์

Sequential คือคอนเทนเนอร์ของโมดูลที่สามารถซ้อนกันและรันได้ในเวลาเดียวกัน

จะสังเกตได้ว่าเราต้องเก็บทุกอย่างไว้ใน self เราสามารถใช้ Sequential เพื่อปรับปรุงโค้ดของเราได้

 class MyCNNClassifier(nn.Module):
    """CNN classifier whose stages are grouped into ``nn.Sequential`` containers.

    Args:
        in_c: number of channels of the input images.
        n_classes: number of scores produced by the decoder.
    """

    def __init__(self, in_c, n_classes):
        super().__init__()
        conv_opts = dict(kernel_size=3, stride=1, padding=1)

        # Each convolutional stage is conv -> batch norm -> ReLU.
        self.conv_block1 = nn.Sequential(
            nn.Conv2d(in_c, 32, **conv_opts),
            nn.BatchNorm2d(32),
            nn.ReLU(),
        )
        self.conv_block2 = nn.Sequential(
            nn.Conv2d(32, 64, **conv_opts),
            nn.BatchNorm2d(64),
            nn.ReLU(),
        )

        # Linear head; its input is sized for 64 feature maps of 28x28.
        flat_features = 64 * 28 * 28
        self.decoder = nn.Sequential(
            nn.Linear(flat_features, 1024),
            nn.Sigmoid(),
            nn.Linear(1024, n_classes),
        )

    def forward(self, x):
        """Run both conv stages, flatten per sample, and apply the decoder."""
        features = self.conv_block2(self.conv_block1(x))
        flat = features.view(features.size(0), -1)
        return self.decoder(flat)

 # Build the Sequential-based classifier (1 input channel, 10 classes) and print its structure.
 model = MyCNNClassifier ( 1 , 10 )
print ( model )

 MyCNNClassifier(
  (conv_block1): Sequential(
    (0): Conv2d(1, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
    (1): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
    (2): ReLU()
  )
  (conv_block2): Sequential(
    (0): Conv2d(32, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
    (1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
    (2): ReLU()
  )
  (decoder): Sequential(
    (0): Linear(in_features=50176, out_features=1024, bias=True)
    (1): Sigmoid()
    (2): Linear(in_features=1024, out_features=10, bias=True)
  )
)

ดีขึ้นมากใช่ไหม?

คุณสังเกตเห็นว่า conv_block1 และ conv_block2 ดูเกือบจะเหมือนกันหรือไม่? เราสามารถสร้างฟังก์ชันที่ส่งคืน nn.Sequential เพื่อทำให้โค้ดง่ายขึ้น!

 def conv_block(in_f, out_f, *args, **kwargs):
    """Build a conv -> batch norm -> ReLU stage as an ``nn.Sequential``.

    Args:
        in_f: number of input channels of the convolution.
        out_f: number of output channels (also the batch-norm feature count).
        *args, **kwargs: forwarded unchanged to ``nn.Conv2d``
            (e.g. ``kernel_size``, ``padding``).

    Returns:
        The three layers wrapped in an ``nn.Sequential``.
    """
    conv = nn.Conv2d(in_f, out_f, *args, **kwargs)
    norm = nn.BatchNorm2d(out_f)
    return nn.Sequential(conv, norm, nn.ReLU())

จากนั้นเราก็สามารถเรียกใช้ฟังก์ชันนี้ในโมดูลของเราได้

 class MyCNNClassifier(nn.Module):
    """CNN classifier whose conv stages come from the ``conv_block`` factory.

    Args:
        in_c: number of channels of the input images.
        n_classes: number of scores produced by the decoder.
    """

    def __init__(self, in_c, n_classes):
        super().__init__()
        conv_opts = dict(kernel_size=3, padding=1)

        self.conv_block1 = conv_block(in_c, 32, **conv_opts)
        self.conv_block2 = conv_block(32, 64, **conv_opts)

        # Linear head; its input is sized for 64 feature maps of 28x28.
        self.decoder = nn.Sequential(
            nn.Linear(64 * 28 * 28, 1024),
            nn.Sigmoid(),
            nn.Linear(1024, n_classes),
        )

    def forward(self, x):
        """Run both conv stages, flatten per sample, and apply the decoder."""
        features = self.conv_block2(self.conv_block1(x))
        flat = features.view(features.size(0), -1)
        return self.decoder(flat)

 # Same constructor call as before; the printed tree now shows the conv_block-built stages.
 model = MyCNNClassifier ( 1 , 10 )
print ( model )

 MyCNNClassifier(
  (conv_block1): Sequential(
    (0): Conv2d(1, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
    (1): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
    (2): ReLU()
  )
  (conv_block2): Sequential(
    (0): Conv2d(32, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
    (1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
    (2): ReLU()
  )
  (decoder): Sequential(
    (0): Linear(in_features=50176, out_features=1024, bias=True)
    (1): Sigmoid()
    (2): Linear(in_features=1024, out_features=10, bias=True)
  )
)

สะอาดยิ่งขึ้น! ยังคง conv_block1 และ conv_block2 เกือบจะเหมือนกัน! เราสามารถรวมพวกมันเข้าด้วยกันโดยใช้ nn.Sequential

 class MyCNNClassifier(nn.Module):
    """CNN classifier split into an ``encoder`` (conv stages) and a ``decoder`` (linear head).

    Args:
        in_c: number of channels of the input images.
        n_classes: number of scores produced by the decoder.
    """

    def __init__(self, in_c, n_classes):
        super().__init__()
        conv_opts = dict(kernel_size=3, padding=1)

        # Both conv stages live in a single container and run back to back.
        first_stage = conv_block(in_c, 32, **conv_opts)
        second_stage = conv_block(32, 64, **conv_opts)
        self.encoder = nn.Sequential(first_stage, second_stage)

        # Linear head; its input is sized for 64 feature maps of 28x28.
        self.decoder = nn.Sequential(
            nn.Linear(64 * 28 * 28, 1024),
            nn.Sigmoid(),
            nn.Linear(1024, n_classes),
        )

    def forward(self, x):
        """Encode, flatten per sample, and decode."""
        encoded = self.encoder(x)
        flat = encoded.view(encoded.size(0), -1)
        return self.decoder(flat)

 # Build the encoder/decoder variant and print it; the conv blocks appear nested under `encoder`.
 model = MyCNNClassifier ( 1 , 10 )
print ( model )

 MyCNNClassifier(
  (encoder): Sequential(
    (0): Sequential(
      (0): Conv2d(1, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
      (1): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (2): ReLU()
    )
    (1): Sequential(
      (0): Conv2d(32, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
      (1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (2): ReLU()
    )
  )
  (decoder): Sequential(
    (0): Linear(in_features=50176, out_features=1024, bias=True)
    (1): Sigmoid()
    (2): Linear(in_features=1024, out_features=10, bias=True)
  )
)

ตอนนี้ self.encoder เก็บ conv_block ทั้งสองไว้ เราได้แยกตรรกะของโมเดลออกเป็นส่วนๆ ทำให้อ่านและนำมาใช้ซ้ำได้ง่ายขึ้น ฟังก์ชัน conv_block ของเราสามารถ import ไปใช้ในโมเดลอื่นได้

Dynamic Sequential: สร้างหลายเลเยอร์พร้อมกัน

จะเป็นอย่างไรหากเราต้องการเพิ่มเลเยอร์ใหม่ใน self.encoder? การฮาร์ดโค้ดทีละเลเยอร์นั้นไม่สะดวก:

 # Fragment of an __init__ body: every extra stage has to be written out by hand,
 # repeating the previous stage's output size as the next stage's input size.
 self . encoder = nn . Sequential (
            conv_block ( in_c , 32 , kernel_size = 3 , padding = 1 ),
            conv_block ( 32 , 64 , kernel_size = 3 , padding = 1 ),
            conv_block ( 64 , 128 , kernel_size = 3 , padding = 1 ),
            conv_block ( 128 , 256 , kernel_size = 3 , padding = 1 ),

        )

จะดีกว่าไหมถ้าเราสามารถกำหนดขนาดเป็นอาร์เรย์และสร้างเลเยอร์ทั้งหมดโดยอัตโนมัติโดยไม่ต้องเขียนแต่ละเลเยอร์ โชคดีที่เราสามารถสร้างอาร์เรย์และส่งผ่านไปยัง Sequential

 class MyCNNClassifier(nn.Module):
    """CNN classifier whose encoder is generated from a list of channel sizes.

    Args:
        in_c: number of channels of the input images.
        n_classes: number of scores produced by the decoder.
    """

    def __init__(self, in_c, n_classes):
        super().__init__()
        self.enc_sizes = [in_c, 32, 64]

        # Pair every size with its successor: (in_c, 32), (32, 64).
        size_pairs = zip(self.enc_sizes, self.enc_sizes[1:])
        stages = []
        for n_in, n_out in size_pairs:
            stages.append(conv_block(n_in, n_out, kernel_size=3, padding=1))

        # nn.Sequential takes modules as positional arguments, hence the unpacking.
        self.encoder = nn.Sequential(*stages)

        # Linear head; its input is sized for 64 feature maps of 28x28.
        self.decoder = nn.Sequential(
            nn.Linear(64 * 28 * 28, 1024),
            nn.Sigmoid(),
            nn.Linear(1024, n_classes),
        )

    def forward(self, x):
        """Encode, flatten per sample, and decode."""
        encoded = self.encoder(x)
        flat = encoded.view(encoded.size(0), -1)
        return self.decoder(flat)

 # Build the list-driven variant; the printed structure matches the hand-written encoder.
 model = MyCNNClassifier ( 1 , 10 )
print ( model )

 MyCNNClassifier(
  (encoder): Sequential(
    (0): Sequential(
      (0): Conv2d(1, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
      (1): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (2): ReLU()
    )
    (1): Sequential(
      (0): Conv2d(32, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
      (1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (2): ReLU()
    )
  )
  (decoder): Sequential(
    (0): Linear(in_features=50176, out_features=1024, bias=True)
    (1): Sigmoid()
    (2): Linear(in_features=1024, out_features=10, bias=True)
  )
)

มาแจกแจงทีละส่วนกัน เราสร้างอาร์เรย์ self.enc_sizes ที่เก็บขนาดของตัวเข้ารหัสของเรา จากนั้นเราสร้างอาร์เรย์ conv_blocks โดยการวนซ้ำขนาดเหล่านั้น เนื่องจากเราต้องกำหนดทั้งขนาดอินพุตและขนาดเอาต์พุตให้แต่ละเลเยอร์ เราจึง zip อาร์เรย์ขนาดกับตัวมันเองที่เลื่อนไปหนึ่งตำแหน่ง

เพื่อให้ชัดเจน ลองดูตัวอย่างต่อไปนี้:

 # Zipping a list with itself shifted by one yields consecutive (input, output) size pairs.
 sizes = [ 1 , 32 , 64 ]

for in_f , out_f in zip ( sizes , sizes [ 1 :]):
    print ( in_f , out_f )

 1 32
32 64

จากนั้น เนื่องจาก Sequential ไม่ยอมรับรายการ เราจึงแยกย่อยรายการโดยใช้ตัวดำเนินการ *

ทาดา! ตอนนี้ถ้าเราเพียงต้องการเพิ่มขนาด เราก็สามารถเพิ่มหมายเลขใหม่ลงในรายการได้อย่างง่ายดาย เป็นเรื่องปกติที่จะทำให้ขนาดเป็นพารามิเตอร์

 class MyCNNClassifier(nn.Module):
    """CNN classifier whose encoder widths are supplied by the caller.

    Args:
        in_c: number of channels of the input images.
        enc_sizes: output channel count of each encoder stage, in order.
        n_classes: number of scores produced by the decoder.
    """

    def __init__(self, in_c, enc_sizes, n_classes):
        super().__init__()
        self.enc_sizes = [in_c, *enc_sizes]

        # Pair every size with its successor to get each stage's (in, out) channels.
        conv_blocks = [
            conv_block(in_f, out_f, kernel_size=3, padding=1)
            for in_f, out_f in zip(self.enc_sizes, self.enc_sizes[1:])
        ]

        # nn.Sequential takes modules as positional arguments, hence the unpacking.
        self.encoder = nn.Sequential(*conv_blocks)

        # The decoder input must follow the last encoder width; a fixed 64 would
        # break forward() for any enc_sizes that does not end in 64.
        # The 28 * 28 factor still assumes 28x28 feature maps.
        self.decoder = nn.Sequential(
            nn.Linear(self.enc_sizes[-1] * 28 * 28, 1024),
            nn.Sigmoid(),
            nn.Linear(1024, n_classes),
        )

    def forward(self, x):
        """Encode, flatten per sample, and decode."""
        x = self.encoder(x)
        x = x.view(x.size(0), -1)  # flatten everything except the batch dimension
        return self.decoder(x)

 # Three encoder stages (32, 64 and 128 channels) requested through the enc_sizes argument.
 model = MyCNNClassifier ( 1 , [ 32 , 64 , 128 ], 10 )
print ( model )

 MyCNNClassifier(
  (encoder): Sequential(
    (0): Sequential(
      (0): Conv2d(1, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
      (1): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (2): ReLU()
    )
    (1): Sequential(
      (0): Conv2d(32, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
      (1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (2): ReLU()
    )
    (2): Sequential(
      (0): Conv2d(64, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
      (1): BatchNorm2d(128, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (2): ReLU()
    )
  )
  (decoder): Sequential(
    (0): Linear(in_features=50176, out_features=1024, bias=True)
    (1): Sigmoid()
    (2): Linear(in_features=1024, out_features=10, bias=True)
  )
)

เราก็ทำเช่นเดียวกันกับส่วนถอดรหัสได้

 def dec_block(in_f, out_f):
    """Build a linear -> sigmoid stage as an ``nn.Sequential``.

    Args:
        in_f: number of input features of the linear layer.
        out_f: number of output features of the linear layer.
    """
    linear = nn.Linear(in_f, out_f)
    return nn.Sequential(linear, nn.Sigmoid())

class MyCNNClassifier(nn.Module):
    """CNN classifier with caller-supplied encoder and decoder widths.

    Args:
        in_c: number of channels of the input images.
        enc_sizes: output channel count of each encoder stage, in order.
        dec_sizes: output feature count of each linear+sigmoid decoder stage.
        n_classes: number of scores produced by the final linear layer.
    """

    def __init__(self, in_c, enc_sizes, dec_sizes, n_classes):
        super().__init__()
        self.enc_sizes = [in_c, *enc_sizes]
        # The decoder input follows the last encoder width; the 28 * 28 factor
        # still assumes 28x28 feature maps.
        self.dec_sizes = [self.enc_sizes[-1] * 28 * 28, *dec_sizes]

        conv_blocks = [
            conv_block(in_f, out_f, kernel_size=3, padding=1)
            for in_f, out_f in zip(self.enc_sizes, self.enc_sizes[1:])
        ]
        self.encoder = nn.Sequential(*conv_blocks)

        dec_blocks = [
            dec_block(in_f, out_f)
            for in_f, out_f in zip(self.dec_sizes, self.dec_sizes[1:])
        ]
        self.decoder = nn.Sequential(*dec_blocks)

        # Separate output layer so the class scores are not passed through a sigmoid.
        self.last = nn.Linear(self.dec_sizes[-1], n_classes)

    def forward(self, x):
        """Encode, flatten per sample, decode, and project to ``n_classes`` scores."""
        x = self.encoder(x)
        x = x.view(x.size(0), -1)  # flatten everything except the batch dimension
        x = self.decoder(x)
        # Without this call the model would return the last hidden layer and
        # `self.last` would never be used.
        return self.last(x)

 # Two encoder stages (32, 64 channels) and two decoder stages (1024, 512 features), 10 classes.
 model = MyCNNClassifier ( 1 , [ 32 , 64 ], [ 1024 , 512 ], 10 )
print ( model )

 MyCNNClassifier(
  (encoder): Sequential(
    (0): Sequential(
      (0): Conv2d(1, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
      (1): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (2): ReLU()
    )
    (1): Sequential(
      (0): Conv2d(32, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
      (1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (2): ReLU()
    )
  )
  (decoder): Sequential(
    (0): Sequential(
      (0): Linear(in_features=50176, out_features=1024, bias=True)
      (1): Sigmoid()
    )
    (1): Sequential(
      (0): Linear(in_features=1024, out_features=512, bias=True)
      (1): Sigmoid()
    )
  )
  (last): Linear(in_features=512, out_features=10, bias=True)
)

เราทำตามรูปแบบเดียวกัน เราสร้างบล็อกใหม่สำหรับส่วนถอดรหัส คือ เชิงเส้น + ซิกมอยด์ และส่งผ่านอาร์เรย์ที่มีขนาด เราต้องเพิ่ม self.last เนื่องจากเราไม่ต้องการใช้ฟังก์ชันกระตุ้น (activation) กับเอาต์พุต

ตอนนี้เราสามารถแบ่งโมเดลของเราออกเป็นสองส่วนได้! ตัวเข้ารหัส + ตัวถอดรหัส

 class MyEncoder(nn.Module):
    """Stack of ``conv_block`` stages built from consecutive channel sizes.

    Args:
        enc_sizes: channel counts including the input, e.g. ``[1, 32, 64]``
            builds a 1->32 stage followed by a 32->64 stage.
    """

    def __init__(self, enc_sizes):
        super().__init__()
        self.conv_blocks = nn.Sequential(*[
            conv_block(in_f, out_f, kernel_size=3, padding=1)
            for in_f, out_f in zip(enc_sizes, enc_sizes[1:])
        ])

    # forward must be a method of the class; nested inside __init__ it was only
    # a local function and calling the module failed.
    def forward(self, x):
        """Apply every conv stage in order."""
        return self.conv_blocks(x)
        
class MyDecoder(nn.Module):
    """Stack of ``dec_block`` stages followed by an un-activated output layer.

    Args:
        dec_sizes: feature counts including the input, e.g. ``[50176, 1024, 512]``
            builds a 50176->1024 stage followed by a 1024->512 stage.
        n_classes: number of scores produced by the final linear layer.
    """

    def __init__(self, dec_sizes, n_classes):
        super().__init__()
        self.dec_blocks = nn.Sequential(*[
            dec_block(in_f, out_f)
            for in_f, out_f in zip(dec_sizes, dec_sizes[1:])
        ])
        self.last = nn.Linear(dec_sizes[-1], n_classes)

    def forward(self, x):
        """Run the hidden stages on ``x`` and project to ``n_classes`` scores."""
        # The input has to be passed to dec_blocks (calling it with no argument
        # raises TypeError), and `last` has to be applied to get the class scores.
        return self.last(self.dec_blocks(x))
    
    
class MyCNNClassifier(nn.Module):
    """Classifier composed of a ``MyEncoder`` and a ``MyDecoder``.

    Args:
        in_c: number of channels of the input images.
        enc_sizes: output channel count of each encoder stage, in order.
        dec_sizes: output feature count of each hidden decoder stage.
        n_classes: number of classes handed to the decoder.
    """

    def __init__(self, in_c, enc_sizes, dec_sizes, n_classes):
        super().__init__()
        self.enc_sizes = [in_c, *enc_sizes]

        # Decoder input = last encoder width times the 28x28 feature-map area.
        flat_features = self.enc_sizes[-1] * 28 * 28
        self.dec_sizes = [flat_features, *dec_sizes]

        self.encoder = MyEncoder(self.enc_sizes)
        self.decoder = MyDecoder(self.dec_sizes, n_classes)

    def forward(self, x):
        """Encode, flatten all non-batch dimensions, and decode."""
        encoded = self.encoder(x)
        return self.decoder(encoded.flatten(1))

 # Build the composed model; the printed tree shows the MyEncoder and MyDecoder submodules.
 model = MyCNNClassifier ( 1 , [ 32 , 64 ], [ 1024 , 512 ], 10 )
print ( model )

 MyCNNClassifier(
  (encoder): MyEncoder(
    (conv_blocks): Sequential(
      (0): Sequential(
        (0): Conv2d(1, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
        (1): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
        (2): ReLU()
      )
      (1): Sequential(
        (0): Conv2d(32, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
        (1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
        (2): ReLU()
      )
    )
  )
  (decoder): MyDecoder(
    (dec_blocks): Sequential(
      (0): Sequential(
        (0): Linear(in_features=50176, out_features=1024, bias=True)
        (1): Sigmoid()
      )
      (1): Sequential(
        (0): Linear(in_features=1024, out_features=512, bias=True)
        (1): Sigmoid()
      )
    )
    (last): Linear(in_features=512, out_features=10, bias=True)
  )
)

โปรดทราบว่า MyEncoder และ MyDecoder อาจเขียนเป็นฟังก์ชันที่ส่งคืน nn.Sequential ก็ได้ ฉันชอบใช้รูปแบบแรก (คลาส) สำหรับโมเดล และรูปแบบที่สอง (ฟังก์ชัน) สำหรับบล็อกส่วนประกอบ (building block)

การแบ่งโมดูลของเราออกเป็นโมดูลย่อยจะทำให้แชร์โค้ด ดีบัก และทดสอบได้ง่ายขึ้น

ModuleList : เมื่อเราต้องการวนซ้ำ

ModuleList ช่วยให้คุณสามารถจัดเก็บ Module เป็นรายการได้ มันจะมีประโยชน์เมื่อคุณต้องการวนซ้ำผ่านเลเยอร์และจัดเก็บ/ใช้ข้อมูลบางอย่าง เช่น ใน U-net

ข้อแตกต่างหลักเมื่อเทียบกับ Sequential คือ ModuleList ไม่มีเมธอด forward ดังนั้นเลเยอร์ภายในจึงไม่ได้ถูกเชื่อมต่อกัน สมมติว่าเราต้องการเอาต์พุตของแต่ละเลเยอร์ในตัวถอดรหัส เราสามารถจัดเก็บได้โดย:

 class MyModule(nn.Module):
    """Chain of linear layers that records every intermediate output.

    Args:
        sizes: feature counts including the input, e.g. ``[1, 16, 32]``
            builds a 1->16 layer followed by a 16->32 layer.

    After a forward pass, ``self.trace`` holds the output of each layer of
    that pass, in order.
    """

    def __init__(self, sizes):
        super().__init__()
        # ModuleList registers the layers but does not chain them; forward() does.
        self.layers = nn.ModuleList(
            [nn.Linear(in_f, out_f) for in_f, out_f in zip(sizes, sizes[1:])]
        )
        self.trace = []

    def forward(self, x):
        """Apply the layers in order and return the last output."""
        # Start a fresh trace on every call; otherwise the list grows without
        # bound and keeps tensors from earlier calls alive.
        self.trace = []
        for layer in self.layers:
            x = layer(x)
            self.trace.append(x)
        return x

 # Two linear layers: 1 -> 16 -> 32.
 model = MyModule ([ 1 , 16 , 32 ])
import torch

# Run a batch of 4 one-feature samples through the model to fill model.trace.
model ( torch . rand (( 4 , 1 )))

# Print the shape of every recorded output; as the last expression of a notebook
# cell, the comprehension itself is displayed as a list of None values.
[ print ( trace . shape ) for trace in model . trace ]

 torch.Size([4, 16])
torch.Size([4, 32])





[None, None]

ModuleDict: เมื่อเราต้องเลือก

จะเป็นอย่างไรหากเราต้องการเปลี่ยนมาใช้ LeakyReLU ใน conv_block ของเรา? เราสามารถใช้ ModuleDict เพื่อสร้างพจนานุกรมของ Module และสลับ Module แบบไดนามิกเมื่อเราต้องการ

 def conv_block(in_f, out_f, activation='relu', *args, **kwargs):
    """Build a conv -> batch norm -> activation stage with a selectable activation.

    Args:
        in_f: number of input channels of the convolution.
        out_f: number of output channels (also the batch-norm feature count).
        activation: key of the activation to use, ``'relu'`` or ``'lrelu'``.
        *args, **kwargs: forwarded unchanged to ``nn.Conv2d``.

    Returns:
        The three layers wrapped in an ``nn.Sequential``.

    Raises:
        KeyError: if ``activation`` is not one of the known keys.
    """
    # Registry of the available activation modules, looked up by name.
    activations = nn.ModuleDict({
        'lrelu': nn.LeakyReLU(),
        'relu': nn.ReLU(),
    })

    conv = nn.Conv2d(in_f, out_f, *args, **kwargs)
    norm = nn.BatchNorm2d(out_f)
    chosen = activations[activation]
    return nn.Sequential(conv, norm, chosen)

 # Same block built twice, once per activation key, to compare the printed last layer.
 print ( conv_block ( 1 , 32 , 'lrelu' , kernel_size = 3 , padding = 1 ))
print ( conv_block ( 1 , 32 , 'relu' , kernel_size = 3 , padding = 1 ))

 Sequential(
  (0): Conv2d(1, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
  (1): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (2): LeakyReLU(negative_slope=0.01)
)
Sequential(
  (0): Conv2d(1, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
  (1): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (2): ReLU()
)

การดำเนินการขั้นสุดท้าย

มาสรุปทุกอย่างกันเถอะ!

 def conv_block(in_f, out_f, activation='relu', *args, **kwargs):
    """Build a conv -> batch norm -> activation stage with a selectable activation.

    Args:
        in_f: number of input channels of the convolution.
        out_f: number of output channels (also the batch-norm feature count).
        activation: key of the activation to use, ``'relu'`` or ``'lrelu'``.
        *args, **kwargs: forwarded unchanged to ``nn.Conv2d``.

    Returns:
        The three layers wrapped in an ``nn.Sequential``.

    Raises:
        KeyError: if ``activation`` is not one of the known keys.
    """
    # Registry of the available activation modules, looked up by name.
    activations = nn.ModuleDict({
        'lrelu': nn.LeakyReLU(),
        'relu': nn.ReLU(),
    })

    conv = nn.Conv2d(in_f, out_f, *args, **kwargs)
    norm = nn.BatchNorm2d(out_f)
    chosen = activations[activation]
    return nn.Sequential(conv, norm, chosen)

def dec_block(in_f, out_f):
    """Build a linear -> sigmoid stage as an ``nn.Sequential``.

    Args:
        in_f: number of input features of the linear layer.
        out_f: number of output features of the linear layer.
    """
    linear = nn.Linear(in_f, out_f)
    return nn.Sequential(linear, nn.Sigmoid())

class MyEncoder(nn.Module):
    """Stack of ``conv_block`` stages built from consecutive channel sizes.

    Args:
        enc_sizes: channel counts including the input, e.g. ``[1, 32, 64]``
            builds a 1->32 stage followed by a 32->64 stage.
        *args, **kwargs: forwarded to every ``conv_block`` call
            (e.g. ``activation='lrelu'``).
    """

    def __init__(self, enc_sizes, *args, **kwargs):
        super().__init__()
        self.conv_blocks = nn.Sequential(*[
            conv_block(in_f, out_f, kernel_size=3, padding=1, *args, **kwargs)
            for in_f, out_f in zip(enc_sizes, enc_sizes[1:])
        ])

    # forward must be a method of the class; nested inside __init__ it was only
    # a local function and calling the module failed.
    def forward(self, x):
        """Apply every conv stage in order."""
        return self.conv_blocks(x)
        
class MyDecoder(nn.Module):
    """Stack of ``dec_block`` stages followed by an un-activated output layer.

    Args:
        dec_sizes: feature counts including the input, e.g. ``[50176, 1024, 512]``
            builds a 50176->1024 stage followed by a 1024->512 stage.
        n_classes: number of scores produced by the final linear layer.
    """

    def __init__(self, dec_sizes, n_classes):
        super().__init__()
        self.dec_blocks = nn.Sequential(*[
            dec_block(in_f, out_f)
            for in_f, out_f in zip(dec_sizes, dec_sizes[1:])
        ])
        self.last = nn.Linear(dec_sizes[-1], n_classes)

    def forward(self, x):
        """Run the hidden stages on ``x`` and project to ``n_classes`` scores."""
        # The input has to be passed to dec_blocks (calling it with no argument
        # raises TypeError), and `last` has to be applied to get the class scores.
        return self.last(self.dec_blocks(x))
    
    
class MyCNNClassifier(nn.Module):
    """Classifier composed of a ``MyEncoder`` and a ``MyDecoder``.

    Args:
        in_c: number of channels of the input images.
        enc_sizes: output channel count of each encoder stage, in order.
        dec_sizes: output feature count of each hidden decoder stage.
        n_classes: number of classes handed to the decoder.
        activation: activation key forwarded to the encoder's conv blocks.
    """

    def __init__(self, in_c, enc_sizes, dec_sizes, n_classes, activation='relu'):
        super().__init__()
        self.enc_sizes = [in_c, *enc_sizes]
        # Decoder input = last encoder width times the 28x28 feature-map area.
        # It must follow enc_sizes rather than a fixed channel count.
        self.dec_sizes = [self.enc_sizes[-1] * 28 * 28, *dec_sizes]

        self.encoder = MyEncoder(self.enc_sizes, activation=activation)

        # Pass the list that includes the flattened input size; the raw
        # `dec_sizes` argument would drop the first decoder layer.
        self.decoder = MyDecoder(self.dec_sizes, n_classes)

    def forward(self, x):
        """Encode, flatten all non-batch dimensions, and decode."""
        x = self.encoder(x)
        x = x.flatten(1)  # keep the batch dimension, merge the rest
        return self.decoder(x)

 # Build the final model with LeakyReLU selected through the activation keyword.
 model = MyCNNClassifier ( 1 , [ 32 , 64 ], [ 1024 , 512 ], 10 , activation = 'lrelu' )
print ( model )

 MyCNNClassifier(
  (encoder): MyEncoder(
    (conv_blocks): Sequential(
      (0): Sequential(
        (0): Conv2d(1, 32, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
        (1): BatchNorm2d(32, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
        (2): LeakyReLU(negative_slope=0.01)
      )
      (1): Sequential(
        (0): Conv2d(32, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1))
        (1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
        (2): LeakyReLU(negative_slope=0.01)
      )
    )
  )
  (decoder): MyDecoder(
    (dec_blocks): Sequential(
      (0): Sequential(
        (0): Linear(in_features=1024, out_features=512, bias=True)
        (1): Sigmoid()
      )
    )
    (last): Linear(in_features=512, out_features=10, bias=True)
  )
)

บทสรุป

ดังนั้นโดยสรุป

ใช้ Module เมื่อคุณมีบล็อกขนาดใหญ่ที่ประกอบด้วยบล็อกเล็ก ๆ หลายบล็อก
ใช้ Sequential เมื่อคุณต้องการสร้างบล็อกเล็กๆ จากเลเยอร์
ใช้ ModuleList เมื่อคุณต้องการวนซ้ำผ่านเลเยอร์หรือบล็อกส่วนประกอบ (building block) บางส่วนและดำเนินการบางอย่างกับมัน
ใช้ ModuleDict เมื่อคุณต้องการกำหนดพารามิเตอร์ให้กับบล็อกบางบล็อกของโมเดลของคุณ เช่น ฟังก์ชันการเปิดใช้งาน

เท่านี้แหละ ทุกคน!

ขอบคุณสำหรับการอ่าน

ขยาย

ข้อมูลเพิ่มเติม