-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathtrain.py
105 lines (89 loc) · 3 KB
/
train.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
import os
import glob
import torch
from torch.utils.data import DataLoader
from options import opts
if opts.model_name == 'model_A':
from src.model_A import GarmentModel
elif opts.model_name == 'model_AA':
from src.model_AA import GarmentModel
elif opts.model_name == 'model_B':
from src.model_B import GarmentModel
elif opts.model_name == 'model_BB':
from src.model_BB import GarmentModel
elif opts.model_name == 'model_C':
from src.model_C import GarmentModel
elif opts.model_name == 'model_D':
from src.model_D import GarmentModel
elif opts.model_name == 'model_E':
from src.model_E import GarmentModel
elif opts.model_name == 'model_F':
from src.model_F import GarmentModel
elif opts.model_name == 'model_G':
from src.model_G import GarmentModel
elif opts.model_name == 'model_H':
from src.model_H import GarmentModel
else:
raise ValueError('opts.model_name option wrong: %s'%opts.model_name)
print ('Using model: %s'%opts.model_name)
from src.dataset import GarmentDataset
from pytorch_lightning import Trainer
from pytorch_lightning.loggers import TensorBoardLogger
from pytorch_lightning.callbacks import ModelCheckpoint
if __name__ == '__main__':
dataset_train = GarmentDataset(
data_dir=opts.data_dir,
val_path=os.path.join(opts.data_dir, 'val.txt'),
num_views=opts.num_views,
num_points=opts.num_points,
evaluate=False,
use_partial=opts.partial
)
dataset_val = GarmentDataset(
data_dir=opts.data_dir,
val_path=os.path.join(opts.data_dir, 'val.txt'),
num_views=opts.num_views,
num_points=opts.num_points,
evaluate=True,
use_partial=opts.partial
)
print ('Using partial training: ', opts.partial)
train_loader = DataLoader(
dataset=dataset_train, batch_size=opts.batch_size,
shuffle=True, num_workers=opts.num_workers
)
val_loader = DataLoader(
dataset=dataset_val, batch_size=opts.batch_size, num_workers=opts.num_workers
)
logger = TensorBoardLogger('tb_logs', name=opts.exp_name)
checkpoint_callback = ModelCheckpoint(
monitor='val_loss',
mode='min',
dirpath='saved_models',
filename='%s'%opts.exp_name
)
ckpt_path = glob.glob(
os.path.join('saved_models', '%s*.ckpt'%opts.exp_name))
if len(ckpt_path) == 0:
ckpt_path = None
else:
ckpt_path = ckpt_path[0]
print ('resuming training from %s'%ckpt_path)
trainer = Trainer(
gpus=-1,
auto_select_gpus=True,
benchmark=True,
val_check_interval=1000,
max_steps=700000,
logger=logger,
callbacks=[checkpoint_callback],
resume_from_checkpoint=ckpt_path
)
if ckpt_path is None:
model = GarmentModel()
else:
print ('resuming training from %s'%ckpt_path)
model = GarmentModel.load_from_checkpoint(ckpt_path)
# training
trainer.fit(model, train_loader, val_loader)
# trainer.validate(model, val_loader)