forked from wenwenyu/MASTER-pytorch
-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathtest.py
130 lines (112 loc) · 6.24 KB
/
test.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
# -*- coding: utf-8 -*-
# @Author: Wenwen Yu
# @Created Time: 8/17/2020 4:50 PM
import argparse
import torch
from tqdm import tqdm
from pathlib import Path
import json
import sys
from torch.utils.data.dataloader import DataLoader
import model.master as master_arch_module
from data_utils.datasets import TextDataset, ResizeWeight, DistCollateFn, CustomImagePreprocess
from utils.label_util import LabelTransformer
from utils import decode_util
def _decode_prediction(pred, prob):
    """Turn one decoded token sequence into text and a mean confidence.

    Tokens are read left to right until ``LabelTransformer.EOS`` is met.
    ``LabelTransformer.UNK`` tokens are skipped and contribute neither a
    character nor a score. The probability at the EOS position is included
    in the mean.

    Args:
        pred: 1-D sequence of token indices for a single sample.
        prob: per-position probabilities, read at the same index as ``pred``.

    Returns:
        A ``(text, score)`` tuple where ``score`` is a Python float. If no
        position contributed a score (no EOS reached and every token was
        UNK), ``score`` is ``0.0`` instead of raising ``ZeroDivisionError``.
    """
    chars = []
    scores = []
    for i, token in enumerate(pred):
        if token == LabelTransformer.EOS:
            scores.append(prob[i])
            break
        if token == LabelTransformer.UNK:
            continue
        chars.append(LabelTransformer.decode(token))
        scores.append(prob[i])

    text = "".join(chars)
    if not scores:
        # Nothing was scored for this sample; avoid dividing by zero.
        return text, 0.0
    mean_score = sum(scores) / len(scores)
    return text, mean_score.cpu().item()


def predict(args):
    """Run text recognition over a set of images and dump the results as JSON.

    Loads the checkpoint, rebuilds the model from the config stored in it,
    decodes every batch greedily and writes a list of
    ``{"filename", "result", "pred_score"}`` records to
    ``<output_folder>/<output_file_name>``.

    Args:
        args: parsed command-line namespace. The attributes read are
            ``gpu`` (``-1`` selects the CPU), ``checkpoint``, ``img_folder``,
            ``index_txt_file``, ``width``, ``height``, ``bs``,
            ``output_folder`` and ``output_file_name``.
    """
    device = torch.device(f'cuda:{args.gpu}' if args.gpu != -1 else 'cpu')
    # SECURITY NOTE: torch.load unpickles the file, and this checkpoint carries
    # a config object in addition to tensors. Only load trusted checkpoints.
    checkpoint = torch.load(args.checkpoint, map_location=device)

    config = checkpoint['config']
    state_dict = checkpoint['model_state_dict']
    monitor_best = checkpoint['monitor_best']
    print('Loading checkpoint: {} \nwith saved best metric {:.4f}'.format(args.checkpoint, monitor_best))

    # prepare model for testing
    model = config.init_obj('model_arch', master_arch_module)
    model = model.to(device)
    model.load_state_dict(state_dict)
    model.eval()
    # Unwrap once, up front, if the model exposes a wrapped ``module``.
    if hasattr(model, 'module'):
        model = model.module

    # setup dataset and data_loader instances
    # if index_txt_file is None, images are read from img_folder only
    index_txt_file = args.index_txt_file
    in_channels = config['model_arch']['args']['backbone_kwargs']['in_channels']
    # Anything other than a 3-channel backbone is fed grayscale images.
    convert_to_gray = in_channels != 3
    test_dataset = TextDataset(img_root=args.img_folder, txt_file=index_txt_file,
                               transform=ResizeWeight((args.width, args.height), gray_format=convert_to_gray),
                               img_w=args.width,
                               img_h=args.height,
                               training=False,
                               testing_with_label_file=index_txt_file is not None,
                               convert_to_gray=convert_to_gray)
    test_data_loader = DataLoader(test_dataset, batch_size=args.bs, shuffle=False,
                                  collate_fn=DistCollateFn(training=False),
                                  num_workers=1, drop_last=False)
    print(f'test data size: {len(test_dataset)} steps: {len(test_data_loader)}')

    # setup output path
    output_path = Path(args.output_folder)
    output_path.mkdir(parents=True, exist_ok=True)
    result_output_file = output_path.joinpath(args.output_file_name)

    pred_results = []
    # predict and save to file
    for input_data_item in tqdm(test_data_loader, total=len(test_data_loader)):
        if input_data_item['batch_size'] == 0:
            continue

        images = input_data_item['images']
        file_names = input_data_item['file_names']
        with torch.no_grad():
            images = images.to(device)
            # (bs, max_len)
            # TODO replace with memory-cache based decode
            outputs, probs = decode_util.greedy_decode_with_probability(model, images, LabelTransformer.max_length,
                                                                        LabelTransformer.SOS,
                                                                        LabelTransformer.EOS,
                                                                        _padding_symbol_index=LabelTransformer.PAD,
                                                                        _result_device=images.device, _is_padding=True)

        # The first output column is dropped before decoding (presumably the
        # start symbol -- confirm against decode_util).
        # NOTE(review): probs is not shifted the same way; verify that
        # outputs[:, 1:] and probs are aligned position by position.
        for pred, prob, img_name in zip(outputs[:, 1:], probs, file_names):
            predict_text, pred_score = _decode_prediction(pred, prob)
            pred_results.append({"filename": Path(img_name).name,
                                 "result": predict_text,
                                 "pred_score": pred_score})

    # json.dump escapes non-ASCII by default, so the bytes written are the
    # same under any ASCII-compatible encoding; utf-8 is stated explicitly.
    with result_output_file.open(mode='w', encoding='utf-8') as f:
        json.dump(pred_results, f)
    print(f'Predict results has written to {result_output_file.as_posix()}\n')
if __name__ == '__main__':
    # Command-line entry point: declare the options as data, register them
    # on the parser in order, then hand the parsed namespace to predict().
    parser = argparse.ArgumentParser(description='MASTER Pytorch Test')

    option_specs = (
        (('-ckpt', '--checkpoint'),
         dict(default=None, type=str, required=True,
              help='path to load checkpoint (default: None)')),
        (('-img', '--img_folder'),
         dict(default=None, type=str, required=True,
              help='image folder (default: None)')),
        (('-index_txt_file', '--index_txt_file'),
         dict(default=None, type=str, required=False,
              help='path to index txt and corresponding filename, '
                   'if None, read img from img_folder, otherwise, index_txt_file must be set (default: None)')),
        (('-width', '--width'),
         dict(default=256, type=int, required=False,
              help='resized image width (default: 256)')),
        (('-height', '--height'),
         dict(default=32, type=int, required=False,
              help='resized image height (default: 32)')),
        (('-output', '--output_folder'),
         dict(default='predict_results', type=str, required=False,
              help='output folder (default: predict_results)')),
        (('-output_file_name', '--output_file_name'),
         dict(default='predict_result.json', type=str, required=False,
              help='output file name (default: predict_result.json)')),
        (('-g', '--gpu'),
         dict(default=-1, type=int, required=False,
              help='GPU id to use. (default: -1, cpu)')),
        # Both spellings are long options; the value is stored under the
        # first one, i.e. as ``bs``.
        (('--bs', '--batch_size'),
         dict(default=1, type=int, required=False,
              help='batch size (default: 1)')),
    )
    for option_flags, option_kwargs in option_specs:
        parser.add_argument(*option_flags, **option_kwargs)

    cli_args = parser.parse_args()
    predict(cli_args)