| 
									
										
										
										
											2020-07-13 17:25:30 +08:00
										 |  |  | # Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved. | 
					
						
							|  |  |  | # | 
					
						
							|  |  |  | # Licensed under the Apache License, Version 2.0 (the "License"); | 
					
						
							|  |  |  | # you may not use this file except in compliance with the License. | 
					
						
							|  |  |  | # You may obtain a copy of the License at | 
					
						
							|  |  |  | # | 
					
						
							|  |  |  | #     http://www.apache.org/licenses/LICENSE-2.0 | 
					
						
							|  |  |  | # | 
					
						
							|  |  |  | # Unless required by applicable law or agreed to in writing, software | 
					
						
							|  |  |  | # distributed under the License is distributed on an "AS IS" BASIS, | 
					
						
							|  |  |  | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | 
					
						
							|  |  |  | # See the License for the specific language governing permissions and | 
					
						
							|  |  |  | # limitations under the License. | 
					
						
							|  |  |  | import os | 
					
						
							|  |  |  | import sys | 
					
						
							|  |  |  | __dir__ = os.path.dirname(os.path.abspath(__file__)) | 
					
						
							|  |  |  | sys.path.append(__dir__) | 
					
						
							|  |  |  | sys.path.append(os.path.abspath(os.path.join(__dir__, '..'))) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-12-14 11:42:00 +00:00
										 |  |  | from ppocr.utils.logging import get_logger | 
					
						
							|  |  |  | logger = get_logger() | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-07-13 17:25:30 +08:00
										 |  |  | import cv2 | 
					
						
							|  |  |  | import numpy as np | 
					
						
							|  |  |  | import time | 
					
						
							|  |  |  | from PIL import Image | 
					
						
							|  |  |  | from ppocr.utils.utility import get_image_file_list | 
					
						
							|  |  |  | from tools.infer.utility import draw_ocr, draw_boxes | 
					
						
							| 
									
										
										
										
											2020-07-09 20:34:42 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | import requests | 
					
						
							|  |  |  | import json | 
					
						
							|  |  |  | import base64 | 
					
						
							| 
									
										
										
										
											2020-07-13 17:25:30 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-07-09 20:34:42 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | def cv2_to_base64(image): | 
					
						
							|  |  |  |     return base64.b64encode(image).decode('utf8') | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-07-13 17:25:30 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | def draw_server_result(image_file, res): | 
					
						
							|  |  |  |     img = cv2.imread(image_file) | 
					
						
							|  |  |  |     image = Image.fromarray(cv2.cvtColor(img, cv2.COLOR_BGR2RGB)) | 
					
						
							|  |  |  |     if len(res) == 0: | 
					
						
							|  |  |  |         return np.array(image) | 
					
						
							|  |  |  |     keys = res[0].keys() | 
					
						
							| 
									
										
										
										
											2020-07-16 12:14:46 +00:00
										 |  |  |     if 'text_region' not in keys:  # for ocr_rec, draw function is invalid  | 
					
						
							|  |  |  |         logger.info("draw function is invalid for ocr_rec!") | 
					
						
							| 
									
										
										
										
											2020-07-13 17:25:30 +08:00
										 |  |  |         return None | 
					
						
							| 
									
										
										
										
											2020-07-16 12:14:46 +00:00
										 |  |  |     elif 'text' not in keys:  # for ocr_det | 
					
						
							|  |  |  |         logger.info("draw text boxes only!") | 
					
						
							| 
									
										
										
										
											2020-07-13 17:25:30 +08:00
										 |  |  |         boxes = [] | 
					
						
							|  |  |  |         for dno in range(len(res)): | 
					
						
							|  |  |  |             boxes.append(res[dno]['text_region']) | 
					
						
							|  |  |  |         boxes = np.array(boxes) | 
					
						
							|  |  |  |         draw_img = draw_boxes(image, boxes) | 
					
						
							|  |  |  |         return draw_img | 
					
						
							| 
									
										
										
										
											2020-07-16 12:14:46 +00:00
										 |  |  |     else:  # for ocr_system | 
					
						
							|  |  |  |         logger.info("draw boxes and texts!") | 
					
						
							| 
									
										
										
										
											2020-07-13 17:25:30 +08:00
										 |  |  |         boxes = [] | 
					
						
							|  |  |  |         texts = [] | 
					
						
							|  |  |  |         scores = [] | 
					
						
							|  |  |  |         for dno in range(len(res)): | 
					
						
							|  |  |  |             boxes.append(res[dno]['text_region']) | 
					
						
							|  |  |  |             texts.append(res[dno]['text']) | 
					
						
							|  |  |  |             scores.append(res[dno]['confidence']) | 
					
						
							|  |  |  |         boxes = np.array(boxes) | 
					
						
							|  |  |  |         scores = np.array(scores) | 
					
						
							| 
									
										
										
										
											2020-07-16 12:14:46 +00:00
										 |  |  |         draw_img = draw_ocr( | 
					
						
							|  |  |  |             image, boxes, texts, scores, draw_txt=True, drop_score=0.5) | 
					
						
							| 
									
										
										
										
											2020-07-13 17:25:30 +08:00
										 |  |  |         return draw_img | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def main(url, image_path): | 
					
						
							|  |  |  |     image_file_list = get_image_file_list(image_path) | 
					
						
							|  |  |  |     is_visualize = False | 
					
						
							|  |  |  |     headers = {"Content-type": "application/json"} | 
					
						
							|  |  |  |     cnt = 0 | 
					
						
							|  |  |  |     total_time = 0 | 
					
						
							|  |  |  |     for image_file in image_file_list: | 
					
						
							|  |  |  |         img = open(image_file, 'rb').read() | 
					
						
							|  |  |  |         if img is None: | 
					
						
							|  |  |  |             logger.info("error in loading image:{}".format(image_file)) | 
					
						
							|  |  |  |             continue | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         # 发送HTTP请求 | 
					
						
							|  |  |  |         starttime = time.time() | 
					
						
							| 
									
										
										
										
											2020-07-16 12:14:46 +00:00
										 |  |  |         data = {'images': [cv2_to_base64(img)]} | 
					
						
							| 
									
										
										
										
											2020-07-13 17:25:30 +08:00
										 |  |  |         r = requests.post(url=url, headers=headers, data=json.dumps(data)) | 
					
						
							|  |  |  |         elapse = time.time() - starttime | 
					
						
							|  |  |  |         total_time += elapse | 
					
						
							| 
									
										
										
										
											2020-07-16 12:14:46 +00:00
										 |  |  |         logger.info("Predict time of %s: %.3fs" % (image_file, elapse)) | 
					
						
							| 
									
										
										
										
											2020-07-13 17:25:30 +08:00
										 |  |  |         res = r.json()["results"][0] | 
					
						
							| 
									
										
										
										
											2020-07-16 12:14:46 +00:00
										 |  |  |         logger.info(res) | 
					
						
							| 
									
										
										
										
											2020-07-13 17:25:30 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  |         if is_visualize: | 
					
						
							|  |  |  |             draw_img = draw_server_result(image_file, res) | 
					
						
							|  |  |  |             if draw_img is not None: | 
					
						
							|  |  |  |                 draw_img_save = "./server_results/" | 
					
						
							|  |  |  |                 if not os.path.exists(draw_img_save): | 
					
						
							|  |  |  |                     os.makedirs(draw_img_save) | 
					
						
							|  |  |  |                 cv2.imwrite( | 
					
						
							|  |  |  |                     os.path.join(draw_img_save, os.path.basename(image_file)), | 
					
						
							|  |  |  |                     draw_img[:, :, ::-1]) | 
					
						
							| 
									
										
										
										
											2020-07-16 12:14:46 +00:00
										 |  |  |                 logger.info("The visualized image saved in {}".format( | 
					
						
							| 
									
										
										
										
											2020-07-13 17:25:30 +08:00
										 |  |  |                     os.path.join(draw_img_save, os.path.basename(image_file)))) | 
					
						
							|  |  |  |         cnt += 1 | 
					
						
							|  |  |  |         if cnt % 100 == 0: | 
					
						
							| 
									
										
										
										
											2020-07-16 12:14:46 +00:00
										 |  |  |             logger.info("{} processed".format(cnt)) | 
					
						
							|  |  |  |     logger.info("avg time cost: {}".format(float(total_time) / cnt)) | 
					
						
							| 
									
										
										
										
											2020-07-13 17:25:30 +08:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2020-07-16 12:14:46 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | if __name__ == '__main__': | 
					
						
							| 
									
										
										
										
											2020-07-13 17:25:30 +08:00
										 |  |  |     if len(sys.argv) != 3: | 
					
						
							| 
									
										
										
										
											2020-07-16 12:14:46 +00:00
										 |  |  |         logger.info("Usage: %s server_url image_path" % sys.argv[0]) | 
					
						
							| 
									
										
										
										
											2020-07-13 17:25:30 +08:00
										 |  |  |     else: | 
					
						
							|  |  |  |         server_url = sys.argv[1] | 
					
						
							|  |  |  |         image_path = sys.argv[2] | 
					
						
							| 
									
										
										
										
											2020-07-16 11:41:25 +08:00
										 |  |  |         main(server_url, image_path) |