// Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved. // // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. #pragma once #include #include #include #include #include #include #include #include #include #include #include "opencv2/core.hpp" #include "opencv2/imgcodecs.hpp" #include "opencv2/imgproc.hpp" namespace PaddleOCR { struct OCRPredictResult { std::vector> box; std::string text; float score = -1.0; float cls_score; int cls_label = -1; }; struct StructurePredictResult { std::vector box; std::vector> cell_box; std::string type; std::vector text_res; std::string html; float html_score = -1; float confidence; }; class Utility { public: static std::vector ReadDict(const std::string &path); static void VisualizeBboxes(const cv::Mat &srcimg, const std::vector &ocr_result, const std::string &save_path); static void VisualizeBboxes(const cv::Mat &srcimg, const StructurePredictResult &structure_result, const std::string &save_path); template inline static size_t argmax(ForwardIterator first, ForwardIterator last) { return std::distance(first, std::max_element(first, last)); } static void GetAllFiles(const char *dir_name, std::vector &all_inputs); static cv::Mat GetRotateCropImage(const cv::Mat &srcimage, std::vector> box); static std::vector argsort(const std::vector &array); static std::string basename(const std::string &filename); static bool PathExists(const std::string &path); static void CreateDir(const std::string &path); static void print_result(const std::vector &ocr_result); static cv::Mat crop_image(cv::Mat &img, const std::vector &area); static cv::Mat crop_image(cv::Mat &img, const std::vector &area); static void sorted_boxes(std::vector &ocr_result); static std::vector xyxyxyxy2xyxy(std::vector> &box); static std::vector xyxyxyxy2xyxy(std::vector &box); static float fast_exp(float x); static std::vector activation_function_softmax(std::vector &src); static float iou(std::vector &box1, std::vector &box2); static float iou(std::vector &box1, std::vector &box2); private: static bool comparison_box(const OCRPredictResult &result1, const OCRPredictResult &result2) { if (result1.box[0][1] < result2.box[0][1]) { return true; } else if (result1.box[0][1] == result2.box[0][1]) { return result1.box[0][0] < result2.box[0][0]; } else { return false; } } }; } // namespace PaddleOCR