PaddleOCR/tools/test_hubserving.py

118 lines
4.0 KiB
Python
Raw Normal View History

2020-07-13 17:25:30 +08:00
# Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
import os
import sys
__dir__ = os.path.dirname(os.path.abspath(__file__))
sys.path.append(__dir__)
sys.path.append(os.path.abspath(os.path.join(__dir__, '..')))
2020-12-14 19:42:00 +08:00
from ppocr.utils.logging import get_logger
logger = get_logger()
2020-07-13 17:25:30 +08:00
import cv2
import numpy as np
import time
from PIL import Image
from ppocr.utils.utility import get_image_file_list
from tools.infer.utility import draw_ocr, draw_boxes
2020-07-09 20:34:42 +08:00
import requests
import json
import base64
2020-07-13 17:25:30 +08:00
2020-07-09 20:34:42 +08:00
def cv2_to_base64(image):
    """Encode raw image bytes as base64 text.

    Args:
        image: Bytes-like object to encode. In this script it is the raw
            content of an image file read in binary mode.

    Returns:
        str: The base64 encoding of ``image`` as a text string, suitable
        for embedding in a JSON payload.
    """
    return base64.b64encode(image).decode('utf8')
2020-07-13 17:25:30 +08:00
def draw_server_result(image_file, res):
    """Draw the results returned by the server onto the source image.

    The keys of the first entry of ``res`` select the drawing mode:
    no 'text_region' key means nothing can be drawn, 'text_region' without
    'text' draws boxes only, and otherwise boxes, texts and confidences
    are all drawn.

    Args:
        image_file: Path of the image that was sent to the server.
        res: Sequence of per-region result dicts for that image.

    Returns:
        The image produced by ``draw_boxes`` / ``draw_ocr``; the untouched
        RGB image as a numpy array when ``res`` is empty; or None when the
        image cannot be read or the results carry no 'text_region'.
    """
    img = cv2.imread(image_file)
    if img is None:
        # cv2.imread reports an unreadable file by returning None rather
        # than raising; bail out before cvtColor fails on it.
        logger.info("error in loading image:{}".format(image_file))
        return None
    image = Image.fromarray(cv2.cvtColor(img, cv2.COLOR_BGR2RGB))
    if len(res) == 0:
        return np.array(image)

    keys = res[0].keys()
    if 'text_region' not in keys:  # for ocr_rec, draw function is invalid
        logger.info("draw function is invalid for ocr_rec!")
        return None

    boxes = np.array([item['text_region'] for item in res])
    if 'text' not in keys:  # for ocr_det
        logger.info("draw text boxes only!")
        return draw_boxes(image, boxes)

    # for ocr_system
    logger.info("draw boxes and texts!")
    texts = [item['text'] for item in res]
    scores = np.array([item['confidence'] for item in res])
    return draw_ocr(
        image, boxes, texts, scores, draw_txt=True, drop_score=0.5)
def main(url, image_path, is_visualize=False):
    """Send each image under ``image_path`` to the server and log the timing.

    Every image file is read as raw bytes, base64-encoded, and POSTed as
    JSON to ``url``. The per-image latency and the first entry of the
    response's "results" field are logged, followed by the average latency
    over all processed images.

    Args:
        url: Address of the serving endpoint to POST to.
        image_path: Path handed to ``get_image_file_list`` to collect the
            image files to send.
        is_visualize: When True, draw the returned results on each image
            and save it under ``./server_results/``. Defaults to False.
    """
    image_file_list = get_image_file_list(image_path)
    headers = {"Content-type": "application/json"}
    draw_img_save = "./server_results/"
    cnt = 0
    total_time = 0
    for image_file in image_file_list:
        # Read inside a context manager so the handle is always closed;
        # an unreadable file is logged and skipped.
        try:
            with open(image_file, 'rb') as f:
                img = f.read()
        except (IOError, OSError):
            logger.info("error in loading image:{}".format(image_file))
            continue

        # Send the HTTP request
        starttime = time.time()
        data = {'images': [cv2_to_base64(img)]}
        r = requests.post(url=url, headers=headers, data=json.dumps(data))
        elapse = time.time() - starttime
        total_time += elapse
        logger.info("Predict time of %s: %.3fs" % (image_file, elapse))
        res = r.json()["results"][0]
        logger.info(res)

        if is_visualize:
            draw_img = draw_server_result(image_file, res)
            if draw_img is not None:
                if not os.path.exists(draw_img_save):
                    os.makedirs(draw_img_save)
                save_path = os.path.join(draw_img_save,
                                         os.path.basename(image_file))
                # Reverse the channel axis (RGB -> BGR) before cv2.imwrite.
                cv2.imwrite(save_path, draw_img[:, :, ::-1])
                logger.info("The visualized image saved in {}".format(
                    save_path))
        cnt += 1
        if cnt % 100 == 0:
            logger.info("{} processed".format(cnt))

    if cnt == 0:
        # Nothing was processed; avoid dividing by zero below.
        logger.info("no image was processed")
        return
    logger.info("avg time cost: {}".format(float(total_time) / cnt))
2020-07-13 17:25:30 +08:00
2020-07-16 20:14:46 +08:00
if __name__ == '__main__':
    # Expect exactly two arguments: the server URL and the image path.
    if len(sys.argv) != 3:
        logger.info("Usage: %s server_url image_path" % sys.argv[0])
    else:
        server_url = sys.argv[1]
        image_path = sys.argv[2]
        main(server_url, image_path)