2020-07-12 17:21:47 +00:00
|
|
|
// Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
|
|
|
|
//
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
|
|
|
|
2021-08-11 13:04:47 +00:00
|
|
|
#pragma once
|
|
|
|
|
2025-05-20 15:59:59 +08:00
|
|
|
#include <fstream>
|
2023-10-18 17:37:23 +08:00
|
|
|
#include <include/preprocess_op.h>
|
2020-07-13 08:59:21 +00:00
|
|
|
#include <include/utility.h>
|
2025-05-20 15:59:59 +08:00
|
|
|
#include <iostream>
|
2025-02-05 21:24:44 +08:00
|
|
|
#include <memory>
|
2025-05-20 15:59:59 +08:00
|
|
|
#include <yaml-cpp/yaml.h>
|
2025-02-05 21:24:44 +08:00
|
|
|
|
|
|
|
// Forward declaration only: this header refers to the predictor solely through
// std::shared_ptr<paddle_infer::Predictor>, so the complete type is not
// required here.
namespace paddle_infer {
class Predictor;
} // namespace paddle_infer
|
2020-07-12 17:21:47 +00:00
|
|
|
|
|
|
|
namespace PaddleOCR {
|
|
|
|
|
|
|
|
class CRNNRecognizer {
|
|
|
|
public:
|
2020-07-13 13:05:36 +00:00
|
|
|
explicit CRNNRecognizer(const std::string &model_dir, const bool &use_gpu,
|
|
|
|
const int &gpu_id, const int &gpu_mem,
|
|
|
|
const int &cpu_math_library_num_threads,
|
2022-09-20 03:40:05 +00:00
|
|
|
const bool &use_mkldnn, const std::string &label_path,
|
2022-04-03 08:56:16 +00:00
|
|
|
const bool &use_tensorrt,
|
|
|
|
const std::string &precision,
|
2022-04-22 09:08:01 +00:00
|
|
|
const int &rec_batch_num, const int &rec_img_h,
|
2025-02-05 18:17:18 +08:00
|
|
|
const int &rec_img_w) noexcept {
|
2020-07-13 08:59:21 +00:00
|
|
|
this->use_gpu_ = use_gpu;
|
|
|
|
this->gpu_id_ = gpu_id;
|
|
|
|
this->gpu_mem_ = gpu_mem;
|
|
|
|
this->cpu_math_library_num_threads_ = cpu_math_library_num_threads;
|
2020-07-14 05:40:35 +00:00
|
|
|
this->use_mkldnn_ = use_mkldnn;
|
2020-12-27 17:48:18 +08:00
|
|
|
this->use_tensorrt_ = use_tensorrt;
|
2021-08-16 08:52:21 +00:00
|
|
|
this->precision_ = precision;
|
2021-11-03 07:20:22 +00:00
|
|
|
this->rec_batch_num_ = rec_batch_num;
|
2022-04-22 09:08:01 +00:00
|
|
|
this->rec_img_h_ = rec_img_h;
|
|
|
|
this->rec_img_w_ = rec_img_w;
|
|
|
|
std::vector<int> rec_image_shape = {3, rec_img_h, rec_img_w};
|
|
|
|
this->rec_image_shape_ = rec_image_shape;
|
2020-07-13 08:59:21 +00:00
|
|
|
|
2025-05-20 15:59:59 +08:00
|
|
|
std::string new_label_path = label_path;
|
|
|
|
std::string yaml_file_path = model_dir + "/inference.yml";
|
|
|
|
std::ifstream yaml_file(yaml_file_path);
|
|
|
|
if (yaml_file.is_open()) {
|
|
|
|
std::string model_name;
|
|
|
|
std::vector<std::string> rec_char_list;
|
|
|
|
try {
|
|
|
|
YAML::Node config = YAML::LoadFile(yaml_file_path);
|
|
|
|
if (config["Global"] && config["Global"]["model_name"]) {
|
|
|
|
model_name = config["Global"]["model_name"].as<std::string>();
|
|
|
|
}
|
2025-05-27 12:01:53 +08:00
|
|
|
if (!model_name.empty() && model_name != "PP-OCRv5_mobile_rec" &&
|
|
|
|
model_name != "PP-OCRv5_server_rec") {
|
2025-05-20 15:59:59 +08:00
|
|
|
std::cerr << "Error: " << model_name << " is currently not supported."
|
|
|
|
<< std::endl;
|
|
|
|
std::exit(EXIT_FAILURE);
|
|
|
|
}
|
|
|
|
if (config["PostProcess"] && config["PostProcess"]["character_dict"]) {
|
|
|
|
rec_char_list = config["PostProcess"]["character_dict"]
|
|
|
|
.as<std::vector<std::string>>();
|
|
|
|
}
|
|
|
|
} catch (const YAML::Exception &e) {
|
|
|
|
std::cerr << "Failed to load YAML file: " << e.what() << std::endl;
|
|
|
|
}
|
|
|
|
if (label_path == "../../ppocr/utils/ppocr_keys_v1.txt" &&
|
|
|
|
!rec_char_list.empty()) {
|
|
|
|
std::string new_rec_char_dict_path = model_dir + "/ppocr_keys.txt";
|
|
|
|
std::ofstream new_file(new_rec_char_dict_path);
|
|
|
|
if (new_file.is_open()) {
|
|
|
|
for (const auto &character : rec_char_list) {
|
|
|
|
new_file << character << '\n';
|
|
|
|
}
|
|
|
|
new_label_path = new_rec_char_dict_path;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
this->label_list_ = Utility::ReadDict(new_label_path);
|
2025-02-03 19:35:16 +08:00
|
|
|
this->label_list_.emplace(this->label_list_.begin(),
|
|
|
|
"#"); // blank char for ctc
|
|
|
|
this->label_list_.emplace_back(" ");
|
2020-07-13 13:05:36 +00:00
|
|
|
|
|
|
|
LoadModel(model_dir);
|
2020-07-12 17:21:47 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// Load Paddle inference model
|
2025-02-05 18:17:18 +08:00
|
|
|
void LoadModel(const std::string &model_dir) noexcept;
|
2020-07-12 17:21:47 +00:00
|
|
|
|
2025-02-03 19:35:16 +08:00
|
|
|
void Run(const std::vector<cv::Mat> &img_list,
|
|
|
|
std::vector<std::string> &rec_texts,
|
2025-02-05 18:17:18 +08:00
|
|
|
std::vector<float> &rec_text_scores,
|
|
|
|
std::vector<double> ×) noexcept;
|
2020-07-12 17:21:47 +00:00
|
|
|
|
|
|
|
private:
|
2022-09-20 03:40:05 +00:00
|
|
|
std::shared_ptr<paddle_infer::Predictor> predictor_;
|
2020-07-12 17:21:47 +00:00
|
|
|
|
2020-07-13 08:59:21 +00:00
|
|
|
bool use_gpu_ = false;
|
|
|
|
int gpu_id_ = 0;
|
|
|
|
int gpu_mem_ = 4000;
|
|
|
|
int cpu_math_library_num_threads_ = 4;
|
2020-07-14 05:40:35 +00:00
|
|
|
bool use_mkldnn_ = false;
|
2020-07-13 08:59:21 +00:00
|
|
|
|
2020-07-12 17:21:47 +00:00
|
|
|
std::vector<std::string> label_list_;
|
|
|
|
|
|
|
|
std::vector<float> mean_ = {0.5f, 0.5f, 0.5f};
|
|
|
|
std::vector<float> scale_ = {1 / 0.5f, 1 / 0.5f, 1 / 0.5f};
|
|
|
|
bool is_scale_ = true;
|
2020-12-27 17:48:18 +08:00
|
|
|
bool use_tensorrt_ = false;
|
2021-08-16 08:52:21 +00:00
|
|
|
std::string precision_ = "fp32";
|
2021-11-03 07:20:22 +00:00
|
|
|
int rec_batch_num_ = 6;
|
2022-04-22 09:08:01 +00:00
|
|
|
int rec_img_h_ = 32;
|
|
|
|
int rec_img_w_ = 320;
|
|
|
|
std::vector<int> rec_image_shape_ = {3, rec_img_h_, rec_img_w_};
|
2020-07-12 17:21:47 +00:00
|
|
|
// pre-process
|
|
|
|
CrnnResizeImg resize_op_;
|
|
|
|
Normalize normalize_op_;
|
2021-11-03 09:24:52 +00:00
|
|
|
PermuteBatch permute_op_;
|
2020-07-12 17:21:47 +00:00
|
|
|
|
|
|
|
}; // class CrnnRecognizer
|
|
|
|
|
2020-07-15 13:33:26 +00:00
|
|
|
} // namespace PaddleOCR
|