forked from Vipermdl/OCR_detection_IC15
-
Notifications
You must be signed in to change notification settings - Fork 23
/
train.py
93 lines (76 loc) · 3.17 KB
/
train.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
import argparse
import json
import logging
import os
import pathlib
import random
from data_loader import SynthTextDataLoaderFactory
from data_loader import OCRDataLoaderFactory
from data_loader.dataset import ICDAR, MyDataset
from logger import Logger
from model.loss import *
from model.model import *
from model.metric import *
from trainer import Trainer
from utils.bbox import Toolbox
logging.basicConfig(level=logging.DEBUG, format='')
def main(config, resume):
train_logger = Logger()
if config['data_loader']['dataset'] == 'icdar2015':
# ICDAR 2015
data_root = pathlib.Path(config['data_loader']['data_dir'])
ICDARDataset2015 = ICDAR(data_root, year='2015')
data_loader = OCRDataLoaderFactory(config, ICDARDataset2015)
train = data_loader.train()
val = data_loader.val()
elif config['data_loader']['dataset'] == 'synth800k':
data_loader = SynthTextDataLoaderFactory(config)
train = data_loader.train()
val = data_loader.val()
elif config['data_loader']['dataset'] == 'mydataset':
image_root = pathlib.Path(config['data_loader']['image_dir'])
annotation_dir = pathlib.Path(config['data_loader']['annotation_dir'])
data_loader = OCRDataLoaderFactory(config,MyDataset(image_root,annotation_dir))
train = data_loader.train()
val = data_loader.val()
os.environ['CUDA_VISIBLE_DEVICES'] = ','.join([str(i) for i in config['gpus']])
model = eval(config['arch'])(config)
model.summary()
loss = eval(config['loss'])(config['model'])
metrics = [eval(metric) for metric in config['metrics']]
finetune_model = config['finetune']
trainer = Trainer(model, loss, metrics,
finetune=finetune_model,
resume=resume,
config=config,
data_loader=train,
valid_data_loader=val,
train_logger=train_logger,
toolbox = Toolbox,
keys=getattr(common_str,config['model']['keys']))
trainer.train()
if __name__ == '__main__':
SEED = 1228
torch.manual_seed(SEED)
torch.cuda.manual_seed(SEED)
np.random.seed(SEED)
random.seed(SEED)
torch.backends.cudnn.deterministic = True
logger = logging.getLogger()
parser = argparse.ArgumentParser(description='PyTorch Template')
parser.add_argument('-c', '--config', default='./config.json', type=str,
help='config file path (default: None)')
parser.add_argument('-r', '--resume', default=None, type=str,
help='path to latest checkpoint (default: None)')
args = parser.parse_args()
config = None
if args.resume is not None:
if args.config is not None:
logger.warning('Warning: --config overridden by --resume')
config = torch.load(args.resume)['config']
elif args.config is not None:
config = json.load(open(args.config))
path = os.path.join(config['trainer']['save_dir'], config['name'])
#assert not os.path.exists(path), "Path {} already exists!".format(path)
assert config is not None
main(config, args.resume)