| 
									
										
										
										
											2021-06-10 14:24:59 +08:00
										 |  |  | # copyright (c) 2020 PaddlePaddle Authors. All Rights Reserve. | 
					
						
							|  |  |  | # | 
					
						
							|  |  |  | # Licensed under the Apache License, Version 2.0 (the "License"); | 
					
						
							|  |  |  | # you may not use this file except in compliance with the License. | 
					
						
							|  |  |  | # You may obtain a copy of the License at | 
					
						
							|  |  |  | # | 
					
						
							|  |  |  | #    http://www.apache.org/licenses/LICENSE-2.0 | 
					
						
							|  |  |  | # | 
					
						
							|  |  |  | # Unless required by applicable law or agreed to in writing, software | 
					
						
							|  |  |  | # distributed under the License is distributed on an "AS IS" BASIS, | 
					
						
							|  |  |  | # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | 
					
						
							|  |  |  | # See the License for the specific language governing permissions and | 
					
						
							|  |  |  | # limitations under the License. | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2022-03-11 00:09:27 +00:00
										 |  |  | import ast | 
					
						
							| 
									
										
										
										
											2021-06-10 14:24:59 +08:00
										 |  |  | from PIL import Image | 
					
						
							|  |  |  | import numpy as np | 
					
						
							| 
									
										
										
										
											2022-04-22 13:24:45 +08:00
										 |  |  | from tools.infer.utility import draw_ocr_box_txt, str2bool, init_args as infer_args | 
					
						
							| 
									
										
										
										
											2021-06-10 14:24:59 +08:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def init_args(): | 
					
						
							|  |  |  |     parser = infer_args() | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     # params for output | 
					
						
							| 
									
										
										
										
											2021-12-13 07:38:05 +00:00
										 |  |  |     parser.add_argument("--output", type=str, default='./output') | 
					
						
							| 
									
										
										
										
											2021-06-10 14:24:59 +08:00
										 |  |  |     # params for table structure | 
					
						
							| 
									
										
										
										
											2021-06-23 12:28:32 +08:00
										 |  |  |     parser.add_argument("--table_max_len", type=int, default=488) | 
					
						
							|  |  |  |     parser.add_argument("--table_model_dir", type=str) | 
					
						
							| 
									
										
										
										
											2021-12-13 07:38:05 +00:00
										 |  |  |     parser.add_argument( | 
					
						
							|  |  |  |         "--table_char_dict_path", | 
					
						
							|  |  |  |         type=str, | 
					
						
							|  |  |  |         default="../ppocr/utils/dict/table_structure_dict.txt") | 
					
						
							| 
									
										
										
										
											2022-04-22 13:24:45 +08:00
										 |  |  |     # params for layout | 
					
						
							| 
									
										
										
										
											2021-12-13 07:38:05 +00:00
										 |  |  |     parser.add_argument( | 
					
						
							|  |  |  |         "--layout_path_model", | 
					
						
							|  |  |  |         type=str, | 
					
						
							|  |  |  |         default="lp://PubLayNet/ppyolov2_r50vd_dcn_365e_publaynet/config") | 
					
						
							| 
									
										
										
										
											2022-03-11 00:09:27 +00:00
										 |  |  |     parser.add_argument( | 
					
						
							|  |  |  |         "--layout_label_map", | 
					
						
							|  |  |  |         type=ast.literal_eval, | 
					
						
							|  |  |  |         default=None, | 
					
						
							|  |  |  |         help='label map according to ppstructure/layout/README_ch.md') | 
					
						
							| 
									
										
										
										
											2022-04-22 13:24:45 +08:00
										 |  |  |     # params for inference | 
					
						
							| 
									
										
										
										
											2021-12-13 07:38:05 +00:00
										 |  |  |     parser.add_argument( | 
					
						
							|  |  |  |         "--mode", | 
					
						
							|  |  |  |         type=str, | 
					
						
							|  |  |  |         default='structure', | 
					
						
							|  |  |  |         help='structure and vqa is supported') | 
					
						
							| 
									
										
										
										
											2022-04-22 13:24:45 +08:00
										 |  |  |     parser.add_argument( | 
					
						
							|  |  |  |         "--layout", | 
					
						
							|  |  |  |         type=str2bool, | 
					
						
							|  |  |  |         default=True, | 
					
						
							|  |  |  |         help='Whether to enable layout analysis') | 
					
						
							|  |  |  |     parser.add_argument( | 
					
						
							|  |  |  |         "--table", | 
					
						
							|  |  |  |         type=str2bool, | 
					
						
							|  |  |  |         default=True, | 
					
						
							|  |  |  |         help='In the forward, whether the table area uses table recognition') | 
					
						
							|  |  |  |     parser.add_argument( | 
					
						
							|  |  |  |         "--ocr", | 
					
						
							|  |  |  |         type=str2bool, | 
					
						
							|  |  |  |         default=True, | 
					
						
							|  |  |  |         help='In the forward, whether the non-table area is recognition by ocr') | 
					
						
							| 
									
										
										
										
											2021-06-10 14:24:59 +08:00
										 |  |  |     return parser | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def parse_args(): | 
					
						
							|  |  |  |     parser = init_args() | 
					
						
							|  |  |  |     return parser.parse_args() | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-08-02 15:28:07 +08:00
										 |  |  | def draw_structure_result(image, result, font_path): | 
					
						
							| 
									
										
										
										
											2021-06-10 14:24:59 +08:00
										 |  |  |     if isinstance(image, np.ndarray): | 
					
						
							|  |  |  |         image = Image.fromarray(image) | 
					
						
							|  |  |  |     boxes, txts, scores = [], [], [] | 
					
						
							|  |  |  |     for region in result: | 
					
						
							|  |  |  |         if region['type'] == 'Table': | 
					
						
							|  |  |  |             pass | 
					
						
							|  |  |  |         else: | 
					
						
							| 
									
										
										
										
											2022-03-30 14:15:12 +00:00
										 |  |  |             for text_result in region['res']: | 
					
						
							|  |  |  |                 boxes.append(np.array(text_result['text_region'])) | 
					
						
							|  |  |  |                 txts.append(text_result['text']) | 
					
						
							|  |  |  |                 scores.append(text_result['confidence']) | 
					
						
							| 
									
										
										
										
											2021-12-13 07:38:05 +00:00
										 |  |  |     im_show = draw_ocr_box_txt( | 
					
						
							|  |  |  |         image, boxes, txts, scores, font_path=font_path, drop_score=0) | 
					
						
							|  |  |  |     return im_show |