123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113 |
- // Copyright (c) 2020 PaddlePaddle Authors. All Rights Reserved.
- //
- // Licensed under the Apache License, Version 2.0 (the "License");
- // you may not use this file except in compliance with the License.
- // You may obtain a copy of the License at
- //
- // http://www.apache.org/licenses/LICENSE-2.0
- //
- // Unless required by applicable law or agreed to in writing, software
- // distributed under the License is distributed on an "AS IS" BASIS,
- // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- // See the License for the specific language governing permissions and
- // limitations under the License.
- #pragma once
- #include <chrono>
- #include <iomanip>
- #include <iostream>
- #include <ostream>
- #include <stdlib.h>
- #include <vector>
- #include <algorithm>
- #include <cstring>
- #include <fstream>
- #include <numeric>
- #include "opencv2/core.hpp"
- #include "opencv2/imgcodecs.hpp"
- #include "opencv2/imgproc.hpp"
- namespace PaddleOCR {
/// Result record for one OCR text region.
///
/// Every scalar member has a default so that a default-constructed record
/// never exposes an indeterminate value.
struct OCRPredictResult {
  /// Region outline as a list of integer points. The comparator in Utility
  /// reads box[0][0] and box[0][1], so a populated box holds at least one
  /// point with two coordinates.
  /// NOTE(review): presumably four [x, y] corners -- confirm against callers.
  std::vector<std::vector<int>> box;
  /// Text associated with the region; empty by default.
  std::string text;
  /// Score for `text`; defaults to -1.
  float score = -1.0f;
  /// Score paired with `cls_label`. Defaults to -1 like the other score and
  /// label fields (previously left uninitialized).
  float cls_score = -1.0f;
  /// Classification label; defaults to -1.
  int cls_label = -1;
};
- struct StructurePredictResult {
- std::vector<float> box;
- std::vector<std::vector<int>> cell_box;
- std::string type;
- std::vector<OCRPredictResult> text_res;
- std::string html;
- float html_score = -1;
- float confidence;
- };
- class Utility {
- public:
- static std::vector<std::string> ReadDict(const std::string &path);
- static void VisualizeBboxes(const cv::Mat &srcimg,
- const std::vector<OCRPredictResult> &ocr_result,
- const std::string &save_path);
- static void VisualizeBboxes(const cv::Mat &srcimg,
- const StructurePredictResult &structure_result,
- const std::string &save_path);
- template <class ForwardIterator>
- inline static size_t argmax(ForwardIterator first, ForwardIterator last) {
- return std::distance(first, std::max_element(first, last));
- }
- static void GetAllFiles(const char *dir_name,
- std::vector<std::string> &all_inputs);
- static cv::Mat GetRotateCropImage(const cv::Mat &srcimage,
- std::vector<std::vector<int>> box);
- static std::vector<int> argsort(const std::vector<float> &array);
- static std::string basename(const std::string &filename);
- static bool PathExists(const std::string &path);
- static void CreateDir(const std::string &path);
- static void print_result(const std::vector<OCRPredictResult> &ocr_result);
- static cv::Mat crop_image(cv::Mat &img, const std::vector<int> &area);
- static cv::Mat crop_image(cv::Mat &img, const std::vector<float> &area);
- static void sorted_boxes(std::vector<OCRPredictResult> &ocr_result);
- static std::vector<int> xyxyxyxy2xyxy(std::vector<std::vector<int>> &box);
- static std::vector<int> xyxyxyxy2xyxy(std::vector<int> &box);
- static float fast_exp(float x);
- static std::vector<float>
- activation_function_softmax(std::vector<float> &src);
- static float iou(std::vector<int> &box1, std::vector<int> &box2);
- static float iou(std::vector<float> &box1, std::vector<float> &box2);
- private:
- static bool comparison_box(const OCRPredictResult &result1,
- const OCRPredictResult &result2) {
- if (result1.box[0][1] < result2.box[0][1]) {
- return true;
- } else if (result1.box[0][1] == result2.box[0][1]) {
- return result1.box[0][0] < result2.box[0][0];
- } else {
- return false;
- }
- }
- };
- } // namespace PaddleOCR
|