Mercurial > hgrepos > Python2 > PyMuPDF
comparison mupdf-source/thirdparty/tesseract/src/textord/wordseg.h @ 2:b50eed0cc0ef upstream
ADD: MuPDF v1.26.7: the MuPDF source as downloaded by a default build of PyMuPDF 1.26.4.
The directory name has changed: no version number in the expanded directory now.
| author | Franz Glasner <fzglas.hg@dom66.de> |
|---|---|
| date | Mon, 15 Sep 2025 11:43:07 +0200 |
| parents | |
| children | |
comparison
equal
deleted
inserted
replaced
| 1:1d09e1dec1d9 | 2:b50eed0cc0ef |
|---|---|
| 1 /********************************************************************** | |
| 2 * File: wordseg.h (Formerly wspace.h) | |
| 3 * Description: Code to segment the blobs into words. | |
| 4 * Author: Ray Smith | |
| 5 * | |
| 6 * (C) Copyright 1992, Hewlett-Packard Ltd. | |
| 7 ** Licensed under the Apache License, Version 2.0 (the "License"); | |
| 8 ** you may not use this file except in compliance with the License. | |
| 9 ** You may obtain a copy of the License at | |
| 10 ** http://www.apache.org/licenses/LICENSE-2.0 | |
| 11 ** Unless required by applicable law or agreed to in writing, software | |
| 12 ** distributed under the License is distributed on an "AS IS" BASIS, | |
| 13 ** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | |
| 14 ** See the License for the specific language governing permissions and | |
| 15 ** limitations under the License. | |
| 16 * | |
| 17 **********************************************************************/ | |
| 18 | |
| 19 #ifndef WORDSEG_H | |
| 20 #define WORDSEG_H | |
| 21 | |
| 22 #include "blobbox.h" | |
| 23 #include "params.h" | |
| 24 #include "textord.h" | |
| 25 | |
| 26 namespace tesseract { | |
| 27 class Tesseract; | |
| 28 | |
| 29 extern BOOL_VAR_H(textord_force_make_prop_words); | |
| 30 extern BOOL_VAR_H(textord_chopper_test); | |
| 31 | |
| 32 void make_single_word(bool one_blob, TO_ROW_LIST *rows, ROW_LIST *real_rows); | |
| 33 void make_words(tesseract::Textord *textord, | |
| 34 ICOORD page_tr, // top right | |
| 35 float gradient, // page skew | |
| 36 BLOCK_LIST *blocks, // block list | |
| 37 TO_BLOCK_LIST *port_blocks); // output list | |
| 38 void set_row_spaces( // find space sizes | |
| 39 TO_BLOCK *block, // block to do | |
| 40 FCOORD rotation, // for drawing | |
| 41 bool testing_on // for debug | |
| 42 ); | |
| 43 int32_t row_words( // compute space size | |
| 44 TO_BLOCK *block, // block it came from | |
| 45 TO_ROW *row, // row to operate on | |
| 46 int32_t maxwidth, // max expected space size | |
| 47 FCOORD rotation, // for drawing | |
| 48 bool testing_on // for debug | |
| 49 ); | |
| 50 int32_t row_words2( // compute space size | |
| 51 TO_BLOCK *block, // block it came from | |
| 52 TO_ROW *row, // row to operate on | |
| 53 int32_t maxwidth, // max expected space size | |
| 54 FCOORD rotation, // for drawing | |
| 55 bool testing_on // for debug | |
| 56 ); | |
| 57 void make_real_words(tesseract::Textord *textord, | |
| 58 TO_BLOCK *block, // block to do | |
| 59 FCOORD rotation // for drawing | |
| 60 ); | |
| 61 ROW *make_rep_words( // make a row | |
| 62 TO_ROW *row, // row to convert | |
| 63 TO_BLOCK *block // block it lives in | |
| 64 ); | |
| 65 WERD *make_real_word( // make a WERD | |
| 66 BLOBNBOX_IT *box_it, // iterator | |
| 67 int32_t blobcount, // no of blobs to use | |
| 68 bool bol, // start of line | |
| 69 uint8_t blanks // no of blanks | |
| 70 ); | |
| 71 | |
| 72 } // namespace tesseract | |
| 73 | |
| 74 #endif | |
