This repository has been archived by the owner on Dec 25, 2020. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 15
/
Copy pathmain.py
117 lines (87 loc) · 3.97 KB
/
main.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
import os
import argparse
import torch
import torch.optim as optim
from tensorboardX import SummaryWriter
from model import *
from utils import *
def hashing_loss(b, cls, m, alpha):
    """
    Pairwise contrastive hashing loss plus a binarization regularizer.

    Every ordered pair (i, j) of samples in the batch is scored, including
    i == j, so a batch of n samples contributes n^2 pair terms.

    Args:
        b: network outputs, one row of code values per sample
           (presumably shape (n, bits) -- confirm against the model).
        cls: per-sample labels; a pair counts as dissimilar when its
             two labels differ.
        m: margin; dissimilar pairs are penalized only while their
           squared distance is below this value.
        alpha: weight of the regularizer that pulls |b| towards 1.

    Returns:
        Scalar loss tensor.
    """
    # 1.0 where the two labels differ, 0.0 where they match
    dissimilar = (cls[None] != cls[:, None]).float().view(-1)

    # squared Euclidean distance between every pair of code rows
    pairwise_diff = b.unsqueeze(0) - b.unsqueeze(1)
    sq_dist = pairwise_diff.pow(2).sum(dim=2).view(-1)

    # similar pairs are pulled together, dissimilar ones pushed past the margin
    pull_term = (1 - dissimilar) / 2 * sq_dist
    push_term = dissimilar / 2 * torch.clamp(m - sq_dist, min=0)
    pair_loss = (pull_term + push_term).mean()

    # L1 distance of each |b| entry from 1, summed per sample, averaged over the batch
    quantization = (b.abs() - 1).abs().sum(dim=1).mean()
    return pair_loss + alpha * quantization * 2
def train(epoch, dataloader, net, optimizer, m, alpha):
    """
    Run one training epoch and return the mean per-batch hashing loss.

    Args:
        epoch: epoch index; used only in the progress line.
        dataloader: sized iterable yielding (img, cls) batches.
        net: model being optimized; it is switched to training mode.
        optimizer: optimizer that steps net's parameters.
        m: margin forwarded to hashing_loss.
        alpha: regularizer weight forwarded to hashing_loss.

    Returns:
        Sum of the batch losses divided by the number of batches, or 0.0
        when the dataloader yields no batches.
    """
    net.train()

    # Send batches to whichever device the model already lives on instead of
    # hard-coding .cuda(); a parameter-less model keeps the old CUDA default.
    first_param = next(net.parameters(), None)
    device = first_param.device if first_param is not None else torch.device('cuda')

    num_batches = len(dataloader)
    accum_loss = 0.0
    for i, (img, cls) in enumerate(dataloader):
        img, cls = img.to(device), cls.to(device)

        net.zero_grad()
        b = net(img)
        loss = hashing_loss(b, cls, m, alpha)
        loss.backward()
        optimizer.step()

        # .item() replaces `loss.data[0]`, which raises on 0-dim tensors
        # in PyTorch >= 0.5.
        batch_loss = loss.item()
        accum_loss += batch_loss
        print(f'[{epoch}][{i}/{num_batches}] loss: {batch_loss:.4f}')

    # Avoid ZeroDivisionError on an empty dataloader.
    return accum_loss / num_batches if num_batches else 0.0
def test(epoch, dataloader, net, m, alpha):
    """
    Evaluate the model on a dataloader and return the mean per-batch loss.

    Args:
        epoch: epoch index; used only in the printed summary line.
        dataloader: sized iterable yielding (img, cls) batches.
        net: model to evaluate; it is switched to eval mode.
        m: margin forwarded to hashing_loss.
        alpha: regularizer weight forwarded to hashing_loss.

    Returns:
        Sum of the batch losses divided by the number of batches, or 0.0
        when the dataloader yields no batches.
    """
    net.eval()

    # Send batches to whichever device the model already lives on instead of
    # hard-coding .cuda(); a parameter-less model keeps the old CUDA default.
    first_param = next(net.parameters(), None)
    device = first_param.device if first_param is not None else torch.device('cuda')

    num_batches = len(dataloader)
    accum_loss = 0.0
    # `volatile=True` has no effect since PyTorch 0.4; no_grad() is what
    # actually stops autograd from recording the forward pass.
    with torch.no_grad():
        for img, cls in dataloader:
            img, cls = img.to(device), cls.to(device)
            b = net(img)
            # .item() replaces `loss.data[0]`, which raises on 0-dim tensors
            # in PyTorch >= 0.5.
            accum_loss += hashing_loss(b, cls, m, alpha).item()

    # Avoid ZeroDivisionError on an empty dataloader.
    accum_loss = accum_loss / num_batches if num_batches else 0.0
    print(f'[{epoch}] val loss: {accum_loss:.4f}')
    return accum_loss
def _parse_args():
    """Define the command-line options for DSH training and parse them."""
    parser = argparse.ArgumentParser(description='train DSH')
    parser.add_argument('--cifar', default='../dataset/cifar', help='path to cifar')
    parser.add_argument('--weights', default='', help="path to weight (to continue training)")
    parser.add_argument('--outf', default='checkpoints', help='folder to output model checkpoints')
    # The value is compared against the epoch counter, not a batch counter.
    parser.add_argument('--checkpoint', type=int, default=50,
                        help='compute mAP and save a checkpoint every N epochs (0 disables)')
    parser.add_argument('--batchSize', type=int, default=256, help='input batch size')
    parser.add_argument('--ngpu', type=int, default=0, help='which GPU to use')
    parser.add_argument('--binary_bits', type=int, default=12, help='length of hashing binary')
    parser.add_argument('--alpha', type=float, default=0.01, help='weighting of regularizer')
    parser.add_argument('--niter', type=int, default=500, help='number of epochs to train for')
    parser.add_argument('--lr', type=float, default=0.001, help='learning rate')
    return parser.parse_args()


def _resume_epoch_from(weights_path):
    """
    Infer the epoch to resume at from a checkpoint named '<epoch>.<ext>'.

    Checkpoints are written after their epoch has been trained, so training
    continues with the following epoch. A file name that is not a plain
    integer gives no epoch information and restarts the count at 0.
    """
    stem = os.path.splitext(os.path.basename(weights_path))[0]
    try:
        return int(stem) + 1
    except ValueError:
        return 0


def main():
    """
    Train a DSH model from the command line.

    Parses the options, builds the CIFAR dataloaders and the network,
    optionally restores weights from a checkpoint, then alternates training
    and evaluation for each epoch while logging losses to tensorboardX.
    Every `--checkpoint` epochs it also computes retrieval mAP and writes
    the model state dict to `--outf` as '<epoch>.pth'.
    """
    opt = _parse_args()
    print(opt)

    os.makedirs(opt.outf, exist_ok=True)
    choose_gpu(opt.ngpu)
    feed_random_seed()
    train_loader, test_loader = init_cifar_dataloader(opt.cifar, opt.batchSize)

    # setup net
    net = DSH(opt.binary_bits)
    resume_epoch = 0
    print(net)
    if opt.weights:
        print(f'loading weight form {opt.weights}')
        resume_epoch = _resume_epoch_from(opt.weights)
        # NOTE: torch.load unpickles the file; only load checkpoints you trust.
        # map_location keeps tensors on CPU until net.cuda() below.
        net.load_state_dict(torch.load(opt.weights, map_location=lambda storage, location: storage))
    net.cuda()

    # setup optimizer
    optimizer = optim.Adam(net.parameters(), lr=opt.lr, weight_decay=0.004)
    margin = 2 * opt.binary_bits

    logger = SummaryWriter()
    try:
        for epoch in range(resume_epoch, opt.niter):
            train_loss = train(epoch, train_loader, net, optimizer, margin, opt.alpha)
            logger.add_scalar('train_loss', train_loss, epoch)

            test_loss = test(epoch, test_loader, net, margin, opt.alpha)
            logger.add_scalar('test_loss', test_loss, epoch)

            # A non-positive interval disables checkpointing instead of
            # failing on a modulo by zero.
            if opt.checkpoint > 0 and epoch % opt.checkpoint == 0:
                # compute mAP by searching testset images from trainset
                trn_binary, trn_label = compute_result(train_loader, net)
                tst_binary, tst_label = compute_result(test_loader, net)
                mAP = compute_mAP(trn_binary, tst_binary, trn_label, tst_label)
                print(f'[{epoch}] retrieval mAP: {mAP:.4f}')
                logger.add_scalar('retrieval_mAP', mAP, epoch)

                # save checkpoints
                torch.save(net.state_dict(), os.path.join(opt.outf, f'{epoch:03d}.pth'))
    finally:
        # Flush and release the event file even if training is interrupted.
        logger.close()
# Entry point: start training only when this file is run as a script,
# not when it is imported.
if __name__ == '__main__':
    main()