dịch tiêu đề phía trên

:label:`sec_fcn`

dịch đoạn phía trên

%matplotlib inline
from d2l import mxnet as d2l
from mxnet import gluon, image, init, np, npx
from mxnet.gluon import nn

npx.set_np()

dịch tiêu đề phía trên

dịch đoạn phía trên

:label:`fig_fcn`

dịch đoạn phía trên

# Load ResNet-18 (v2) from the Gluon model zoo with pretrained weights.
pretrained_net = gluon.model_zoo.vision.resnet18_v2(pretrained=True)
# Notebook display: the last four entries of `features` plus the `output`
# block, i.e. the tail of the pretrained model.
pretrained_net.features[-4:], pretrained_net.output

dịch đoạn phía trên

# Build a new sequential network that reuses every layer of the pretrained
# feature extractor except its last two.
net = nn.HybridSequential()
for layer in pretrained_net.features[:-2]:
    net.add(layer)

dịch đoạn phía trên

# Forward a random input of shape (1, 3, 320, 480) through the truncated
# network and display the output shape.
# NOTE(review): axes are presumably (batch, channels, height, width) - confirm.
X = np.random.uniform(size=(1, 3, 320, 480))
net(X).shape

dịch đoạn phía trên

# Number of output channels of the prediction head.
# NOTE(review): presumably the 20 Pascal VOC classes plus background - confirm.
num_classes = 21
# Append a 1x1 convolution that maps to `num_classes` channels, followed by a
# transposed convolution. With kernel 64, padding 16 and stride 32 the
# transposed convolution maps a side of length n to
# (n - 1) * 32 - 2 * 16 + 64 = 32 * n.
net.add(nn.Conv2D(num_classes, kernel_size=1),
        nn.Conv2DTranspose(
            num_classes, kernel_size=64, padding=16, strides=32))

dịch tiêu đề phía trên

dịch đoạn phía trên

def bilinear_kernel(in_channels, out_channels, kernel_size):
    """Build a transposed-convolution weight that holds a bilinear filter.

    A 1-D triangular profile ``1 - |i - center| / factor`` is evaluated at
    the ``kernel_size`` tap positions; the 2-D filter is the product of that
    profile along rows and along columns. The filter is written to each
    paired channel index ``(i, i)`` and every other entry stays zero.

    Args:
        in_channels: Size of the first axis of the returned weight.
        out_channels: Size of the second axis of the returned weight.
            The paired index assignment walks both channel ranges in
            lockstep; every call in this file passes equal counts.
        kernel_size: Height and width of the square filter.

    Returns:
        An array of shape
        ``(in_channels, out_channels, kernel_size, kernel_size)``.
    """
    factor = (kernel_size + 1) // 2
    # Odd kernels are centred on a tap, even kernels halfway between two taps.
    center = factor - 1 if kernel_size % 2 == 1 else factor - 0.5
    taps = np.arange(kernel_size)
    profile = 1 - np.abs(taps - center) / factor
    # Column vector times row vector broadcasts to the full 2-D filter.
    filt = profile.reshape(-1, 1) * profile.reshape(1, -1)
    weight = np.zeros((in_channels, out_channels, kernel_size, kernel_size))
    weight[range(in_channels), range(out_channels), :, :] = filt
    return np.array(weight)

dịch đoạn phía trên

# Transposed convolution with 3 output channels, kernel 4, padding 1 and
# stride 2, so a side of length n becomes (n - 1) * 2 - 2 * 1 + 4 = 2 * n.
conv_trans = nn.Conv2DTranspose(3, kernel_size=4, padding=1, strides=2)
# Fill its weight with the constant bilinear kernel for 3 -> 3 channels.
conv_trans.initialize(init.Constant(bilinear_kernel(3, 3, 4)))

dịch đoạn phía trên

# Read the example image from disk.
img = image.imread('../img/catdog.jpg')
# Cast to float32, move axis 2 to the front, add a leading batch axis and
# divide by 255.
# NOTE(review): assumes `img` is laid out (height, width, channels) - confirm.
X = np.expand_dims(img.astype('float32').transpose(2, 0, 1), axis=0) / 255
Y = conv_trans(X)
# Take the first sample of the batch and move its leading axis back to the
# end so it can be plotted.
out_img = Y[0].transpose(1, 2, 0)

dịch đoạn phía trên

# Print the shapes of the input and the upsampled output and plot both.
# The trailing semicolons keep Jupyter from echoing the return value of
# `imshow` as cell output.
d2l.set_figsize()
print('input image shape:', img.shape)
d2l.plt.imshow(img.asnumpy());
print('output image shape:', out_img.shape)
d2l.plt.imshow(out_img.asnumpy());

dịch đoạn phía trên

# Constant bilinear kernel of size 64 for `num_classes` paired channels.
W = bilinear_kernel(num_classes, num_classes, 64)
# `net[-1]` is the transposed convolution appended last: initialize it with
# the bilinear kernel.
net[-1].initialize(init.Constant(W))
# `net[-2]` is the 1x1 convolution appended just before it: use Xavier
# initialization.
net[-2].initialize(init=init.Xavier())

dịch tiêu đề phía trên

dịch đoạn phía trên

# Build the training and test iterators with batch size 32 and crop size
# (320, 480).
# NOTE(review): crop size is presumably (height, width), matching the
# (1, 3, 320, 480) random input used earlier - confirm against
# d2l.load_data_voc.
batch_size, crop_size = 32, (320, 480)
train_iter, test_iter = d2l.load_data_voc(batch_size, crop_size)

dịch tiêu đề phía trên

dịch đoạn phía trên

# Hyperparameters: 5 epochs, learning rate 0.1, weight decay 1e-3; train on
# whatever devices d2l.try_all_gpus() returns.
num_epochs, lr, wd, devices = 5, 0.1, 1e-3, d2l.try_all_gpus()
# `axis=1` tells the loss which axis of the prediction holds the class scores.
loss = gluon.loss.SoftmaxCrossEntropyLoss(axis=1)
# Move all parameters (already initialized above) onto the training devices.
net.collect_params().reset_ctx(devices)
# Plain SGD with weight decay over every parameter of the network.
trainer = gluon.Trainer(net.collect_params(), 'sgd',
                        {'learning_rate': lr, 'wd': wd})
d2l.train_ch13(net, train_iter, test_iter, loss, trainer, num_epochs, devices)

dịch tiêu đề phía trên

dịch đoạn phía trên

def predict(img):
    """Run the network on a single image and return its 2-D argmax map.

    The image is normalized with the test dataset's ``normalize_image``,
    rearranged so that axis 2 comes first, given a leading batch axis and
    evaluated by ``net`` on the first device in ``devices``.

    Args:
        img: Image array accepted by ``normalize_image``.
            NOTE(review): presumably (height, width, channels) - confirm.

    Returns:
        The argmax over axis 1 of the network output, reshaped to the last
        two axes of that result.
    """
    normalized = test_iter._dataset.normalize_image(img)
    batch = np.expand_dims(normalized.transpose(2, 0, 1), axis=0)
    scores = net(batch.as_in_ctx(devices[0]))
    labels = scores.argmax(axis=1)
    # Drop the leading batch axis by reshaping to the two trailing sizes.
    rows, cols = labels.shape[1], labels.shape[2]
    return labels.reshape(rows, cols)

dịch đoạn phía trên

def label2image(pred):
    """Map an array of class indices to colors via ``d2l.VOC_COLORMAP``.

    Args:
        pred: Array of class indices; it is cast to ``int32`` before use.

    Returns:
        The rows of the ``uint8`` colormap selected by ``pred``, so the
        result has one extra trailing axis holding the color entry.
    """
    # The lookup table lives on the first device in `devices`.
    palette = np.array(d2l.VOC_COLORMAP, ctx=devices[0], dtype='uint8')
    class_ids = pred.astype('int32')
    return palette[class_ids, :]

dịch đoạn phía trên

# Download/extract the dataset and read its images and labels; the second
# argument False is presumably `is_train=False` (test split) - confirm.
voc_dir = d2l.download_extract('voc2012', 'VOCdevkit/VOC2012')
test_images, test_labels = d2l.read_voc_images(voc_dir, False)
# Visualize the first n examples.
n, imgs = 4, []
for i in range(n):
    # Arguments for image.fixed_crop: (x0, y0, width, height), i.e. a
    # 480-wide, 320-high crop anchored at the top-left corner.
    crop_rect = (0, 0, 480, 320)
    X = image.fixed_crop(test_images[i], *crop_rect)
    pred = label2image(predict(X))
    # Store each example as a triple: input crop, predicted colors, label crop.
    imgs += [X, pred, image.fixed_crop(test_labels[i], *crop_rect)]
# Regroup the interleaved triples into all inputs, then all predictions, then
# all labels, and show them on a grid of 3 by n.
d2l.show_images(imgs[::3] + imgs[1::3] + imgs[2::3], 3, n, scale=2);

Tóm tắt

dịch đoạn phía trên

Bài tập

dịch đoạn phía trên

Thảo luận

Tiếng Anh - MXNet
Tiếng Việt

Những người thực hiện

Bản dịch trong trang này được thực hiện bởi:

Đoàn Võ Duy Thanh

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

fcn_vn.md

fcn_vn.md

dịch tiêu đề phía trên

dịch tiêu đề phía trên

dịch tiêu đề phía trên

dịch tiêu đề phía trên

dịch tiêu đề phía trên

dịch tiêu đề phía trên

Tóm tắt

Bài tập

Thảo luận

Những người thực hiện

Files

fcn_vn.md

Latest commit

History

fcn_vn.md

File metadata and controls

dịch tiêu đề phía trên

dịch tiêu đề phía trên

dịch tiêu đề phía trên

dịch tiêu đề phía trên

dịch tiêu đề phía trên

dịch tiêu đề phía trên

Tóm tắt

Bài tập

Thảo luận

Những người thực hiện