-
Notifications
You must be signed in to change notification settings - Fork 34
/
train_matterport.py
215 lines (166 loc) · 6.99 KB
/
train_matterport.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
"""
Chuhang Zou
07.2019
Code Revised from:
Finetuning Torchvision Models
=============================
**Author:** `Nathan Inkawhich <https://github.com/inkawhich>`__
"""
from __future__ import print_function
from __future__ import division
import torch
import torch.nn as nn
import torch.optim as optim
import numpy as np
from torchvision import models, transforms
import time
import copy
print("PyTorch Version: ",torch.__version__)
#import pickle
from torch.utils import data
#import scipy.io as sio
from model import *
from data_generator_matterport import *
# ---------------------------------------------------------------------------
# Experiment configuration
# ---------------------------------------------------------------------------

# Dataset locations: root folder of the data plus the text files that
# describe the training and validation splits.
data_path = './data/matterport/mp3d_align/'
train_filepath = './data/matterport/_final_label_v2/train.txt'
val_filepath = './data/matterport/_final_label_v2/val.txt'

# Checkpoint locations: `model_path` is where the best weights are written
# during training; `weight_path` is read at start-up when `Flag_loadweights`
# is set.
model_path = './model/resnet34_matterport.pth'
weight_path = './model/resnet34_matterport.pth'

# Encoder backbone; one of "resnet18", "resnet34" or "resnet50".
model_name = "resnet34"

# Whether the encoder is requested with pre-trained weights, and whether an
# existing checkpoint is loaded from `weight_path` before training.
use_pretrained = True
Flag_loadweights = True

# Number of classes handed to the encoder and the full model.
num_classes = 1024

# Optimisation schedule: batches per phase in every epoch, and epoch count.
steps_per_epoch = 20
num_epochs = 100000

# Data loading: samples per batch (lower this if memory is tight) and the
# number of DataLoader worker processes.
batch_size = 4
num_workers = 4
# Model Training and Validation Code
def train_model(model, train_generator, val_generator, optimizer, criterion, criterion2, steps=100, num_epochs=25, save_path=None, device=None):
    """Train ``model`` and checkpoint the weights with the lowest validation loss.

    Every epoch runs a 'train' phase followed by a 'val' phase.  Each phase
    consumes at most ``steps`` batches from its loader.  A batch is indexed
    as ``(inputs, labels, labels2)`` and the model must return two outputs,
    one per label tensor.

    Loss: for each head, positions whose label is > 0 get weight 1.0 and all
    other positions get weight 0.2.  The weight is multiplied into both the
    prediction and the target before the criterion is applied; the two head
    losses are summed.

    Args:
        model: Network returning ``(outputs, outputs2)`` for a batch.
        train_generator: Iterable of training batches.
        val_generator: Iterable of validation batches.
        optimizer: Optimizer stepping the trainable parameters of ``model``.
        criterion: Loss applied to the first output / ``labels``.
        criterion2: Loss applied to the second output / ``labels2``.
        steps: Maximum number of batches per phase.  The reported phase loss
            is the sum of the per-batch losses divided by ``steps``.
        num_epochs: Number of epochs to run.
        save_path: Checkpoint file for the best weights.  Defaults to the
            module-level ``model_path``.
        device: Device the batches are moved to.  Defaults to the device of
            the model's first parameter (CPU if the model has none).

    Returns:
        ``(model, val_acc_history)``.  ``model`` holds the best checkpointed
        weights if at least one checkpoint was written.  Despite its name,
        ``val_acc_history`` is the list of validation *losses* recorded each
        time a new best was reached.
    """
    if save_path is None:
        save_path = model_path
    if device is None:
        first_param = next(model.parameters(), None)
        device = first_param.device if first_param is not None else torch.device("cpu")

    since = time.time()
    val_acc_history = []
    # Lower is better: this tracks the best validation loss seen so far.
    # float("inf") replaces np.Inf, which NumPy 2.0 removed.
    best_acc = float("inf")
    checkpoint_saved = False

    for epoch in range(num_epochs):
        print('Epoch {}/{}'.format(epoch, num_epochs - 1))
        print('-' * 10)

        # Each epoch has a training and a validation phase.
        for phase in ['train', 'val']:
            if phase == 'train':
                model.train()
                dataloaders = train_generator
            else:
                model.eval()
                dataloaders = val_generator

            loss_sum = 0.0

            for step, batch in enumerate(dataloaders):
                inputs = batch[0].to(device)
                labels = batch[1].to(device)
                labels2 = batch[2].to(device)

                optimizer.zero_grad()

                # Track gradients only while training.
                with torch.set_grad_enabled(phase == 'train'):
                    outputs, outputs2 = model(inputs)

                    # Weight 1.0 where the label is positive, 0.2 elsewhere.
                    mask = (labels > 0).float()
                    mask = mask + 0.2 * (1.0 - mask)
                    mask2 = (labels2 > 0).float()
                    mask2 = mask2 + 0.2 * (1.0 - mask2)
                    loss = criterion(outputs * mask, labels * mask) + criterion2(outputs2 * mask2, labels2 * mask2)

                    if phase == 'train':
                        loss.backward()
                        torch.nn.utils.clip_grad_norm_(model.parameters(), 5.0)
                        optimizer.step()

                loss_sum += loss.item() / steps

                # Drop per-batch tensors early to keep peak memory down.
                del inputs, outputs, outputs2, mask, mask2, labels, labels2, loss

                # Stop once `steps` batches have been processed.
                if step == steps - 1:
                    break

            print('{} Loss: {:.6f}'.format(phase, loss_sum))

            if phase == 'val' and loss_sum < best_acc:
                val_acc_history.append(loss_sum)
                best_acc = loss_sum
                # Persist straight to disk instead of keeping a second copy
                # of the weights in memory.
                torch.save(model.state_dict(), save_path)
                checkpoint_saved = True
                print("Model saved ...")

        print()

    time_elapsed = time.time() - since
    print('Training complete in {:.0f}m {:.0f}s'.format(time_elapsed // 60, time_elapsed % 60))
    print('Best val Acc: {:6f}'.format(best_acc))

    # Restore the best weights from the checkpoint.  Skipped when nothing was
    # written during this call, so a stale file at `save_path` is never loaded.
    if checkpoint_saved:
        model.load_state_dict(torch.load(save_path, map_location=device))
    return model, val_acc_history
# ---------------------------------------------------------------------------
# Script body: build the model, optionally resume from a checkpoint, choose
# the trainable parameters, create the data loaders and run training.
#
# NOTE(review): the loaders use worker processes (`num_workers`).  On
# platforms that start workers by re-importing the main module, PyTorch
# recommends running code like this under `if __name__ == '__main__':` --
# confirm against the target platform.
# ---------------------------------------------------------------------------
print("Load Models...")
# Define the encoder
encoder = initialize_encoder(model_name, num_classes, use_pretrained=use_pretrained)
# Full model
model_ft = SegNet(encoder, num_classes)
# Model initialization
set_parameter_requires_grad(model_ft)

# Use the first GPU when available, otherwise fall back to the CPU.
device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
model_ft = model_ft.to(device)

# Optionally resume from an existing checkpoint.
if Flag_loadweights:
    # map_location lets a checkpoint saved on a GPU be loaded on a CPU-only
    # host (and vice versa).
    pretrained_dict = torch.load(weight_path, map_location=device)
    model_dict = model_ft.state_dict()
    # Keep only the entries whose keys exist in the current model, then
    # overlay them on the model's own state.
    pretrained_dict = {k: v for k, v in pretrained_dict.items() if k in model_dict}
    model_dict.update(pretrained_dict)
    model_ft.load_state_dict(model_dict)

# Freeze every parameter whose name contains 'bn' (presumably the batch-norm
# layers -- verify against the model definition) and list what stays trainable.
print("Params to learn:")
for name, param in model_ft.named_parameters():
    if 'bn' in name:
        param.requires_grad = False
    if param.requires_grad:
        print("\t", name)

# Gather the parameters to be optimized/updated in this run.
params_to_update = [param for name, param in model_ft.named_parameters() if param.requires_grad]

# Create the optimizer
optimizer_ft = optim.Adam(params_to_update, lr=1e-4, eps=1e-6)

# One binary cross-entropy loss per model output.
criterion = nn.BCELoss()
criterion2 = nn.BCELoss()

# Load data
print("Initializing Datasets and Dataloaders...")
train_set = ShapeNetDataset(train_filepath, data_path, 'train', transform=True)
train_generator = torch.utils.data.DataLoader(train_set, batch_size=batch_size, shuffle=True, num_workers=num_workers)
val_set = ShapeNetDataset(val_filepath, data_path, 'val', transform=True)
val_generator = torch.utils.data.DataLoader(val_set, batch_size=batch_size, shuffle=True, num_workers=num_workers)

# Train and evaluate
model_ft, hist = train_model(model_ft, train_generator, val_generator, optimizer_ft, criterion, criterion2, steps_per_epoch, num_epochs=num_epochs)
print('training done')