2020-09-19 14:41:43 +08:00
|
|
|
#Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
|
|
|
|
#
|
|
|
|
#Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
#you may not use this file except in compliance with the License.
|
|
|
|
#You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
#Unless required by applicable law or agreed to in writing, software
|
|
|
|
#distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
#WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
#See the License for the specific language governing permissions and
|
|
|
|
#limitations under the License.
|
2020-09-18 18:54:15 +08:00
|
|
|
import os
|
|
|
|
import argparse
|
2020-09-23 19:03:45 +08:00
|
|
|
import json
|
2020-09-18 18:54:15 +08:00
|
|
|
|
|
|
|
|
|
|
|
def gen_rec_label(input_path, out_label):
    """Convert a comma-separated recognition label file to tab-separated form.

    Every non-empty line of ``input_path`` is split at its FIRST comma into
    an image path and a label, and ``<image path>\\t<label>`` is written to
    ``out_label``.  All spaces and all double-quote characters are removed,
    exactly as before; commas inside the label are now preserved instead of
    truncating the label.

    Args:
        input_path: Path of the source label file (read as UTF-8; a leading
            byte-order mark is discarded).
        out_label: Path of the tab-separated file to write (UTF-8).

    Raises:
        IndexError: If a non-empty line contains no comma.
    """
    # The input is opened first so that a missing input file does not leave
    # behind a freshly truncated output file.
    with open(input_path, 'r', encoding='utf-8-sig') as in_file, \
            open(out_label, 'w', encoding='utf-8') as out_file:
        for line in in_file:
            record = line.strip('\r\n').replace(" ", "")
            if not record:
                # Blank lines (e.g. a trailing newline) carry no label.
                continue
            # maxsplit=1: only the first comma separates path from label.
            fields = record.split(',', 1)
            img_path, label = fields[0], fields[1]
            label = label.replace("\"", "")
            out_file.write(img_path + '\t' + label + '\n')
|
2020-09-18 18:54:15 +08:00
|
|
|
|
|
|
|
|
2020-09-19 14:40:13 +08:00
|
|
|
def gen_det_label(root_path, input_dir, out_label):
    """Merge per-image detection label files into one tab-separated file.

    For every file in ``input_dir`` (processed in sorted name order so the
    output is deterministic) one line is written to ``out_label``::

        <image path>\\t<JSON list of {"transcription": ..., "points": ...}>

    Each non-empty line of a label file must hold eight integer coordinates
    followed by the transcription, all comma-separated.  Only the first
    eight commas are treated as separators, so a transcription that itself
    contains commas is kept intact.

    Args:
        root_path: String prepended verbatim to the image file name; no path
            separator is inserted, so it should normally end with one.
        input_dir: Directory containing the per-image label files.
        out_label: Path of the combined label file to write (UTF-8).

    Raises:
        IndexError: If a non-empty line has fewer than nine fields.
        ValueError: If a coordinate field is not an integer.
    """
    with open(out_label, 'w', encoding='utf-8') as out_file:
        for label_file in sorted(os.listdir(input_dir)):
            # Drops the first 3 and last 4 characters of the file name --
            # presumably a "gt_" prefix and a ".txt" suffix (ICDAR-style
            # naming); verify against the dataset in use.
            img_path = root_path + label_file[3:-4] + ".jpg"
            label = []
            # utf-8-sig discards a leading byte-order mark, which would
            # otherwise make int() fail on the first coordinate.
            with open(os.path.join(input_dir, label_file), 'r',
                      encoding='utf-8-sig') as f:
                for line in f:
                    record = line.strip("\n\r")
                    if not record:
                        continue
                    # maxsplit=8: everything after the 8th comma is text.
                    fields = record.split(',', 8)
                    points = [[int(fields[i]), int(fields[i + 1])]
                              for i in range(0, 8, 2)]
                    label.append({
                        "transcription": fields[8],
                        "points": points,
                    })

            out_file.write(img_path + '\t' + json.dumps(
                label, ensure_ascii=False) + '\n')
|
2020-09-18 18:54:15 +08:00
|
|
|
|
|
|
|
|
|
|
|
if __name__ == "__main__":
    # Command-line entry point: parse the options, then dispatch to the
    # recognition ("rec") or detection ("det") label converter.
    parser = argparse.ArgumentParser()
    parser.add_argument(
        '--mode',
        type=str,
        default="rec",
        # Reject unknown modes up front; previously any other value made the
        # script exit silently without producing output.
        choices=["rec", "det"],
        help='Generate rec_label or det_label, can be set rec or det')
    parser.add_argument(
        '--root_path',
        type=str,
        default=".",
        help='The root directory of images.Only takes effect when mode=det ')
    parser.add_argument(
        '--input_path',
        type=str,
        default=".",
        help='Input_label or input path to be converted')
    parser.add_argument(
        '--output_label',
        type=str,
        default="out_label.txt",
        help='Output file name')

    args = parser.parse_args()
    if args.mode == "rec":
        print("Generate rec label")
        gen_rec_label(args.input_path, args.output_label)
    elif args.mode == "det":
        gen_det_label(args.root_path, args.input_path, args.output_label)
|