PaddleOCR/ppocr/metrics/e2e_metric.py

87 lines
3.1 KiB
Python
Raw Normal View History

# Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
2021-03-08 14:15:47 +08:00
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function
__all__ = ['E2EMetric']
2021-04-20 19:47:19 +08:00
from ppocr.utils.e2e_metric.Deteval import get_socre_A, get_socre_B, combine_results
2021-04-11 16:40:46 +08:00
from ppocr.utils.e2e_utils.extract_textpoint_slow import get_dict
2021-03-08 14:15:47 +08:00
class E2EMetric(object):
    """Collect per-call end-to-end scoring results and combine them on demand.

    Each call scores one set of predictions and appends the result to
    ``self.results``. ``get_metric`` combines everything collected so far
    with ``combine_results`` and then clears the collection.

    Two scoring paths exist:

    * ``mode == 'A'``: ground truth is read from the batch itself and scored
      with ``get_socre_A``.
    * any other ``mode``: an image id is read from the batch and scored with
      ``get_socre_B`` against ``gt_mat_dir``.
    """

    def __init__(self,
                 mode,
                 gt_mat_dir,
                 character_dict_path,
                 main_indicator='f_score_e2e',
                 **kwargs):
        """Store the configuration and start with an empty result list.

        Args:
            mode: Scoring path selector; only the value ``'A'`` is treated
                specially, everything else takes the ``get_socre_B`` path.
            gt_mat_dir: Passed through unchanged to ``get_socre_B``.
            character_dict_path: Passed to ``get_dict`` to build the list
                used to turn label indices into characters.
            main_indicator: Stored on the instance; not read by this class.
            **kwargs: Accepted and ignored.
        """
        self.mode = mode
        self.gt_mat_dir = gt_mat_dir
        self.label_list = get_dict(character_dict_path)
        # Indices at or above this bound are dropped when decoding labels
        # (presumably padding values -- confirm against the data pipeline).
        self.max_index = len(self.label_list)
        self.main_indicator = main_indicator
        self.reset()

    def _decode_label(self, indices):
        """Join the characters for every index below ``self.max_index``."""
        return "".join(self.label_list[index] for index in indices
                       if index < self.max_index)

    @staticmethod
    def _build_e2e_info(pred):
        """Pair ``pred['points']`` with ``pred['texts']`` as record dicts."""
        return [{
            'points': det_polyon,
            'texts': pred_str
        } for det_polyon, pred_str in zip(pred['points'], pred['texts'])]

    def __call__(self, preds, batch, **kwargs):
        """Score ``preds`` against ground truth and record the result.

        Args:
            preds: Mapping with ``'points'`` and ``'texts'`` entries of
                matching order.
            batch: Indexable batch data. Mode ``'A'`` reads ``batch[2]``
                (ground-truth polygons), ``batch[3][0]`` (label index
                sequences) and ``batch[4]`` (ignore tags); the other mode
                reads ``batch[5][0]`` as the image id.
                NOTE(review): the exact batch layout is defined by the data
                pipeline, not by this file -- confirm before relying on it.
            **kwargs: Accepted and ignored.
        """
        if self.mode == 'A':
            gt_polyons_batch = batch[2]
            temp_gt_strs_batch = batch[3][0]
            ignore_tags_batch = batch[4]
            gt_strs_batch = [
                self._decode_label(temp_list)
                for temp_list in temp_gt_strs_batch
            ]

            # ``preds`` and the decoded strings are wrapped in one-element
            # lists, so this loop runs at most once per call: only the first
            # entry of the polygon and ignore-tag batches is consumed.
            for pred, gt_polyons, gt_strs, ignore_tags in zip(
                    [preds], gt_polyons_batch, [gt_strs_batch],
                    ignore_tags_batch):
                # prepare gt
                gt_info_list = [{
                    'points': gt_polyon,
                    'text': gt_str,
                    'ignore': ignore_tag
                } for gt_polyon, gt_str, ignore_tag in
                                zip(gt_polyons, gt_strs, ignore_tags)]
                # prepare det
                e2e_info_list = self._build_e2e_info(pred)
                result = get_socre_A(gt_info_list, e2e_info_list)
                self.results.append(result)
        else:
            img_id = batch[5][0]
            e2e_info_list = self._build_e2e_info(preds)
            result = get_socre_B(self.gt_mat_dir, img_id, e2e_info_list)
            self.results.append(result)

    def get_metric(self):
        """Combine all recorded results, clear them, and return the outcome.

        Returns:
            Whatever ``combine_results`` returns for the recorded results.
        """
        metrics = combine_results(self.results)
        self.reset()
        return metrics

    def reset(self):
        """Discard every recorded result."""
        self.results = []  # clear results