.. raw:: html

.. raw:: latex

   \diilbookstyleinputcell

.. code:: python

    def nin_block(out_channels, kernel_size, strides, padding):
        """Build one NiN block: a spatial convolution plus two 1x1 convolutions.

        Each of the three convolutions produces ``out_channels`` channels and
        is followed by a ReLU. ``kernel_size``, ``strides`` and ``padding``
        configure only the first convolution; the other two use
        ``kernel_size=1``.
        """
        layers = [nn.LazyConv2d(out_channels, kernel_size, strides, padding),
                  nn.ReLU()]
        # The two 1x1 convolutions share one configuration, so append them
        # (each with its own ReLU) in a loop.
        for _ in range(2):
            layers.extend([nn.LazyConv2d(out_channels, kernel_size=1),
                           nn.ReLU()])
        return nn.Sequential(*layers)

.. raw:: html

.. raw:: html

.. raw:: latex

   \diilbookstyleinputcell

.. code:: python

    def nin_block(num_channels, kernel_size, strides, padding):
        """Build one NiN block: a spatial convolution plus two 1x1 convolutions.

        All three convolutions output ``num_channels`` channels and use a
        fused ReLU activation. ``kernel_size``, ``strides`` and ``padding``
        apply only to the first convolution.
        """
        blk = nn.Sequential()
        blk.add(nn.Conv2D(num_channels, kernel_size, strides, padding,
                          activation='relu'))
        # Two identical 1x1 convolutions follow the spatial one.
        for _ in range(2):
            blk.add(nn.Conv2D(num_channels, kernel_size=1, activation='relu'))
        return blk

.. raw:: html

.. raw:: html

.. raw:: latex

   \diilbookstyleinputcell

.. code:: python

    def nin_block(out_channels, kernel_size, strides, padding):
        """Build one NiN block: a spatial convolution plus two 1x1 convolutions.

        Each convolution yields ``out_channels`` features and is followed by
        ``nn.relu``. ``kernel_size``, ``strides`` and ``padding`` configure
        only the first convolution; the other two use a ``(1, 1)`` kernel.
        """
        layers = [nn.Conv(out_channels, kernel_size, strides, padding), nn.relu]
        # Append the two pointwise (1x1) convolutions, each with its own ReLU.
        for _ in range(2):
            layers += [nn.Conv(out_channels, kernel_size=(1, 1)), nn.relu]
        return nn.Sequential(layers)

.. raw:: html

.. raw:: html

.. raw:: latex

   \diilbookstyleinputcell

.. code:: python

    def nin_block(out_channels, kernel_size, strides, padding):
        """Build one NiN block: a spatial convolution plus two 1x1 convolutions.

        Each convolution has ``out_channels`` filters and is followed by a
        ReLU activation layer. ``kernel_size``, ``strides`` and ``padding``
        configure only the first convolution; the other two use kernel size 1.
        """
        keras_layers = tf.keras.layers
        stack = [
            keras_layers.Conv2D(out_channels, kernel_size, strides=strides,
                                padding=padding),
            keras_layers.Activation('relu'),
        ]
        # Layers are created in the same order as they are applied, so the
        # two 1x1 convolutions and their activations are appended in turn.
        for _ in range(2):
            stack.append(keras_layers.Conv2D(out_channels, 1))
            stack.append(keras_layers.Activation('relu'))
        return tf.keras.models.Sequential(stack)

.. raw:: html

.. raw:: html

pytorch mxnet jax tensorflow

.. raw:: html

.. raw:: latex

   \diilbookstyleinputcell

.. code:: python

    class NiN(d2l.Classifier):
        """Network in Network classifier assembled from ``nin_block`` stages.

        The network is three NiN blocks (96, 256 and 384 channels), each
        followed by 3x3 max pooling with stride 2. Dropout (0.5) comes next,
        then a final NiN block with ``num_classes`` channels, global average
        pooling and a flatten. Exactly one of the framework branches below is
        expected to be active, depending on ``tab.selected``.

        Args:
            lr: Learning rate; recorded by ``save_hyperparameters()``.
            num_classes: Channel count of the last NiN block, i.e. the number
                of values left per example after global pooling.
        """

        def __init__(self, lr=0.1, num_classes=10):
            super().__init__()
            self.save_hyperparameters()
            if tab.selected('mxnet'):
                # Create the container first so block creation order (and
                # with it Gluon's automatic naming) matches adding the
                # children directly.
                self.net = nn.Sequential()
                stages = [
                    nin_block(96, kernel_size=11, strides=4, padding=0),
                    nn.MaxPool2D(pool_size=3, strides=2),
                    nin_block(256, kernel_size=5, strides=1, padding=2),
                    nn.MaxPool2D(pool_size=3, strides=2),
                    nin_block(384, kernel_size=3, strides=1, padding=1),
                    nn.MaxPool2D(pool_size=3, strides=2),
                    nn.Dropout(0.5),
                    nin_block(num_classes, kernel_size=3, strides=1, padding=1),
                    nn.GlobalAvgPool2D(),
                    nn.Flatten(),
                ]
                self.net.add(*stages)
                self.net.initialize(init.Xavier())
            if tab.selected('pytorch'):
                stages = [
                    nin_block(96, kernel_size=11, strides=4, padding=0),
                    nn.MaxPool2d(3, stride=2),
                    nin_block(256, kernel_size=5, strides=1, padding=2),
                    nn.MaxPool2d(3, stride=2),
                    nin_block(384, kernel_size=3, strides=1, padding=1),
                    nn.MaxPool2d(3, stride=2),
                    nn.Dropout(0.5),
                    nin_block(num_classes, kernel_size=3, strides=1, padding=1),
                    nn.AdaptiveAvgPool2d((1, 1)),
                    nn.Flatten(),
                ]
                self.net = nn.Sequential(*stages)
                self.net.apply(d2l.init_cnn)
            if tab.selected('tensorflow'):
                keras_layers = tf.keras.layers
                stages = [
                    nin_block(96, kernel_size=11, strides=4, padding='valid'),
                    keras_layers.MaxPool2D(pool_size=3, strides=2),
                    nin_block(256, kernel_size=5, strides=1, padding='same'),
                    keras_layers.MaxPool2D(pool_size=3, strides=2),
                    nin_block(384, kernel_size=3, strides=1, padding='same'),
                    keras_layers.MaxPool2D(pool_size=3, strides=2),
                    keras_layers.Dropout(0.5),
                    nin_block(num_classes, kernel_size=3, strides=1,
                              padding='same'),
                    keras_layers.GlobalAvgPool2D(),
                    keras_layers.Flatten(),
                ]
                self.net = tf.keras.models.Sequential(stages)

.. raw:: html

.. raw:: html

.. raw:: latex

   \diilbookstyleinputcell

.. code:: python

    class NiN(d2l.Classifier):
        """Network in Network classifier (Flax), built from ``nin_block`` stages.

        The network is three NiN blocks (96, 256 and 384 features), each
        followed by 3x3 max pooling with stride 2. Dropout (0.5) comes next,
        then a final NiN block with ``num_classes`` features, global average
        pooling over the two spatial axes, and a flatten to
        ``(batch, num_classes)``.

        Attributes:
            lr: Learning rate.
            training: When False, dropout is made deterministic.
            num_classes: Feature count of the last NiN block.
        """
        lr: float = 0.1
        training: bool = True
        # Annotated so that it is a real dataclass field and can be passed to
        # the constructor (``NiN(num_classes=...)``); declared after
        # ``training`` so the existing positional order (lr, training) holds.
        num_classes: int = 10

        def setup(self):
            self.net = nn.Sequential([
                nin_block(96, kernel_size=(11, 11), strides=(4, 4),
                          padding=(0, 0)),
                lambda x: nn.max_pool(x, (3, 3), strides=(2, 2)),
                nin_block(256, kernel_size=(5, 5), strides=(1, 1),
                          padding=(2, 2)),
                lambda x: nn.max_pool(x, (3, 3), strides=(2, 2)),
                nin_block(384, kernel_size=(3, 3), strides=(1, 1),
                          padding=(1, 1)),
                lambda x: nn.max_pool(x, (3, 3), strides=(2, 2)),
                nn.Dropout(0.5, deterministic=not self.training),
                nin_block(self.num_classes, kernel_size=(3, 3), strides=(1, 1),
                          padding=(1, 1)),
                # Global average pooling: the window covers the whole spatial
                # extent (axes 1 and 2), so it is not tied to the 5x5 map that
                # a 224x224 input happens to produce.
                lambda x: nn.avg_pool(x, x.shape[1:3]),
                lambda x: x.reshape((x.shape[0], -1))  # flatten
            ])

.. raw:: html

.. raw:: html

pytorch mxnet jax tensorflow

.. raw:: html

.. raw:: latex

   \diilbookstyleinputcell

.. code:: python

    # Report the output shape of each top-level layer for a single
    # one-channel 224x224 input (channels-first layout).
    NiN().layer_summary((1, 1, 224, 224))

.. raw:: latex

   \diilbookstyleoutputcell

.. parsed-literal::
    :class: output

    Sequential output shape: torch.Size([1, 96, 54, 54])
    MaxPool2d output shape: torch.Size([1, 96, 26, 26])
    Sequential output shape: torch.Size([1, 256, 26, 26])
    MaxPool2d output shape: torch.Size([1, 256, 12, 12])
    Sequential output shape: torch.Size([1, 384, 12, 12])
    MaxPool2d output shape: torch.Size([1, 384, 5, 5])
    Dropout output shape: torch.Size([1, 384, 5, 5])
    Sequential output shape: torch.Size([1, 10, 5, 5])
    AdaptiveAvgPool2d output shape: torch.Size([1, 10, 1, 1])
    Flatten output shape: torch.Size([1, 10])

.. raw:: html

.. raw:: html

.. raw:: latex

   \diilbookstyleinputcell

.. code:: python

    # Report the output shape of each top-level layer for a single
    # one-channel 224x224 input (channels-first layout).
    NiN().layer_summary((1, 1, 224, 224))

.. raw:: latex

   \diilbookstyleoutputcell

.. parsed-literal::
    :class: output

    Sequential output shape: (1, 96, 54, 54)
    MaxPool2D output shape: (1, 96, 26, 26)
    Sequential output shape: (1, 256, 26, 26)
    MaxPool2D output shape: (1, 256, 12, 12)
    Sequential output shape: (1, 384, 12, 12)
    MaxPool2D output shape: (1, 384, 5, 5)
    Dropout output shape: (1, 384, 5, 5)
    Sequential output shape: (1, 10, 5, 5)
    GlobalAvgPool2D output shape: (1, 10, 1, 1)
    Flatten output shape: (1, 10)
    [07:48:54] ../src/storage/storage.cc:196: Using Pooled (Naive) StorageManager for CPU

.. raw:: html

.. raw:: html

.. raw:: latex

   \diilbookstyleinputcell

.. code:: python

    # Report the output shape of each top-level layer for a single
    # one-channel 224x224 input (channels-last layout). training=False
    # makes the Dropout layer deterministic for this pass.
    NiN(training=False).layer_summary((1, 224, 224, 1))

.. raw:: latex

   \diilbookstyleoutputcell

.. parsed-literal::
    :class: output

    Sequential output shape: (1, 54, 54, 96)
    function output shape: (1, 26, 26, 96)
    Sequential output shape: (1, 26, 26, 256)
    function output shape: (1, 12, 12, 256)
    Sequential output shape: (1, 12, 12, 384)
    function output shape: (1, 5, 5, 384)
    Dropout output shape: (1, 5, 5, 384)
    Sequential output shape: (1, 5, 5, 10)
    function output shape: (1, 1, 1, 10)
    function output shape: (1, 10)

.. raw:: html

.. raw:: html

.. raw:: latex

   \diilbookstyleinputcell

.. code:: python

    # Report the output shape of each top-level layer for a single
    # one-channel 224x224 input (channels-last layout).
    NiN().layer_summary((1, 224, 224, 1))

.. raw:: latex

   \diilbookstyleoutputcell

.. parsed-literal::
    :class: output

    Sequential output shape: (1, 54, 54, 96)
    MaxPooling2D output shape: (1, 26, 26, 96)
    Sequential output shape: (1, 26, 26, 256)
    MaxPooling2D output shape: (1, 12, 12, 256)
    Sequential output shape: (1, 12, 12, 384)
    MaxPooling2D output shape: (1, 5, 5, 384)
    Dropout output shape: (1, 5, 5, 384)
    Sequential output shape: (1, 5, 5, 10)
    GlobalAveragePooling2D output shape: (1, 10)
    Flatten output shape: (1, 10)

.. raw:: html

.. raw:: html

pytorch mxnet jax tensorflow

.. raw:: html

.. raw:: latex

   \diilbookstyleinputcell

.. code:: python

    # Train NiN on Fashion-MNIST, with images resized to 224x224, for ten
    # epochs on one GPU.
    model = NiN(lr=0.05)
    trainer = d2l.Trainer(max_epochs=10, num_gpus=1)
    data = d2l.FashionMNIST(batch_size=128, resize=(224, 224))
    if tab.selected('pytorch'):
        # Element 0 of the first training batch is handed to apply_init
        # together with d2l.init_cnn -- presumably so the lazy convolutions
        # can infer their input shapes before being initialized (confirm
        # against d2l's apply_init).
        train_loader = data.get_dataloader(True)
        first_batch = next(iter(train_loader))
        model.apply_init([first_batch[0]], d2l.init_cnn)
    trainer.fit(model, data)

.. figure:: output_nin_2871e8_63_0.svg

.. raw:: html

.. raw:: html

.. raw:: latex

   \diilbookstyleinputcell

.. code:: python

    # Train NiN on Fashion-MNIST, with images resized to 224x224, for ten
    # epochs.
    data = d2l.FashionMNIST(batch_size=128, resize=(224, 224))
    trainer = d2l.Trainer(max_epochs=10)
    # Both model construction and fitting run inside the d2l.try_gpu() scope.
    with d2l.try_gpu():
        model = NiN(lr=0.05)
        trainer.fit(model, data)

.. figure:: output_nin_2871e8_72_0.svg

.. raw:: html

.. raw:: html