-
Notifications
You must be signed in to change notification settings - Fork 0
/
train.py
76 lines (62 loc) · 2.49 KB
/
train.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
from dv.util import *
from dv.save import *
import torch
import torch.nn as nn
import torch.nn.functional as F
from PIL import Image
import os
import sys
import time
from torchvision import datasets, transforms, utils
import torchvision.models as models
import numpy as np
def train(args, train_loader, model, criterion, optimizer, epoch):
    """Run one pass over ``train_loader`` and update ``model`` after every batch.

    ``model`` must return four values per batch. The first three are each
    scored against the target with ``criterion`` and combined as
    ``loss1 + loss2 + 0.1 * loss3``; the fourth value is ignored. The same
    weighting is applied to the three outputs to build the prediction used
    for the top-1 / top-5 training metrics.

    Args:
        args: Options object. ``args.gpu`` decides whether batches are moved
            to a device (any value other than ``None`` enables the move);
            ``args.print_freq`` is the reporting interval in batches.
        train_loader: Iterable of ``(data, target)`` batches that also
            supports ``len()``.
        model: Network to train; switched to training mode here.
        criterion: Callable ``criterion(output, target)`` returning a loss.
        optimizer: Optimizer stepped once per batch.
        epoch: Epoch index, used only for reporting.

    Raises:
        SystemExit: If the most recently recorded combined loss is NaN.
    """
    # Running statistics for the combined loss, the metrics and each branch.
    losses = AverageMeter()
    top1 = AverageMeter()
    top5 = AverageMeter()
    log = Log()
    losses1 = AverageMeter()
    losses2 = AverageMeter()
    losses3 = AverageMeter()

    # The target device cannot change between batches, so resolve it once
    # instead of querying CUDA availability on every iteration.
    device = None
    if args.gpu is not None:
        device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")

    # switch to train mode
    model.train()

    for i, (data, target) in enumerate(train_loader):
        target = target.type(torch.LongTensor)
        if device is not None:
            data = data.to(device)
            target = target.to(device)

        out1, out2, out3, _ = model(data)
        out = out1 + out2 + 0.1 * out3

        loss1 = criterion(out1, target)
        loss2 = criterion(out2, target)
        loss3 = criterion(out3, target)
        loss = loss1 + loss2 + 0.1 * loss3

        # measure accuracy and record loss (metrics are on the training set)
        prec1, prec5 = accuracy(out, target, topk=(1, 5))
        batchsize = data.size(0)
        losses.update(loss.item(), batchsize)

        # Abort before stepping the optimizer: continuing with a NaN loss
        # would only propagate NaNs into the weights.
        if np.isnan(losses.val):
            sys.exit('Fuck, loss blows up!')

        losses1.update(loss1.item(), batchsize)
        losses2.update(loss2.item(), batchsize)
        losses3.update(loss3.item(), batchsize)
        top1.update(prec1[0], batchsize)
        top5.update(prec5[0], batchsize)

        # compute gradient and do SGD step
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

        if i % args.print_freq == 0:
            num_batches = len(train_loader)
            print('Deep Vision <==> Train Epoch: [{0}][{1}/{2}]\n'
                  'Loss {loss.val:.4f} ({loss.avg:.4f})\t'
                  'Loss1 {loss1.val:.4f} ({loss1.avg:.4f})\t'
                  'Loss2 {loss2.val:.4f} ({loss2.avg:.4f})\t'
                  'Loss3 {loss3.val:.4f} ({loss3.avg:.4f})\n'
                  'Top1 {top1.val:.3f} ({top1.avg:.3f})\t'
                  'Top5 {top5.val:.3f} ({top5.avg:.3f})'.format(
                      epoch, i, num_batches, loss=losses, loss1=losses1,
                      loss2=losses2, loss3=losses3, top1=top1, top5=top5))

            # Hand the same meters to the project logger.
            totalloss = [losses, losses1, losses2, losses3]
            log.save_train_info(epoch, i, num_batches, totalloss, top1, top5)