Mercurial > hgrepos > Python2 > PyMuPDF
view mupdf-source/thirdparty/tesseract/src/ccstruct/ocrrow.cpp @ 46:7ee69f120f19 default tip
>>>>> tag v1.26.5+1 for changeset b74429b0f5c4
| author | Franz Glasner <fzglas.hg@dom66.de> |
|---|---|
| date | Sat, 11 Oct 2025 17:17:30 +0200 |
| parents | b50eed0cc0ef |
| children |
line wrap: on
line source
/********************************************************************** * File: ocrrow.cpp (Formerly row.c) * Description: Code for the ROW class. * Author: Ray Smith * * (C) Copyright 1991, Hewlett-Packard Ltd. ** Licensed under the Apache License, Version 2.0 (the "License"); ** you may not use this file except in compliance with the License. ** You may obtain a copy of the License at ** http://www.apache.org/licenses/LICENSE-2.0 ** Unless required by applicable law or agreed to in writing, software ** distributed under the License is distributed on an "AS IS" BASIS, ** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. ** See the License for the specific language governing permissions and ** limitations under the License. * **********************************************************************/ // Include automatically generated configuration file if running autoconf. #ifdef HAVE_CONFIG_H # include "config_auto.h" #endif #include "blobbox.h" #include "ocrrow.h" namespace tesseract { /********************************************************************** * ROW::ROW * * Constructor to build a ROW. Only the stats stuff are given here. * The words are added directly. **********************************************************************/ ROW::ROW( // constructor int32_t spline_size, // no of segments int32_t *xstarts, // segment boundaries double *coeffs, // coefficients float x_height, // line height float ascenders, // ascender size float descenders, // descender drop int16_t kern, // char gap int16_t space // word gap ) : baseline(spline_size, xstarts, coeffs), para_(nullptr) { kerning = kern; // just store stuff spacing = space; xheight = x_height; ascrise = ascenders; bodysize = 0.0f; descdrop = descenders; has_drop_cap_ = false; lmargin_ = 0; rmargin_ = 0; } /********************************************************************** * ROW::ROW * * Constructor to build a ROW. Only the stats stuff are given here. * The words are added directly. **********************************************************************/ ROW::ROW( // constructor TO_ROW *to_row, // source row int16_t kern, // char gap int16_t space // word gap ) : para_(nullptr) { kerning = kern; // just store stuff spacing = space; xheight = to_row->xheight; bodysize = to_row->body_size; ascrise = to_row->ascrise; descdrop = to_row->descdrop; baseline = to_row->baseline; has_drop_cap_ = false; lmargin_ = 0; rmargin_ = 0; } // Returns the bounding box including the desired combination of upper and // lower noise/diacritic elements. TBOX ROW::restricted_bounding_box(bool upper_dots, bool lower_dots) const { TBOX box; // This is a read-only iteration of the words in the row. WERD_IT it(const_cast<WERD_LIST *>(&words)); for (it.mark_cycle_pt(); !it.cycled_list(); it.forward()) { box += it.data()->restricted_bounding_box(upper_dots, lower_dots); } return box; } /********************************************************************** * ROW::recalc_bounding_box * * Set the bounding box correctly **********************************************************************/ void ROW::recalc_bounding_box() { // recalculate BB WERD *word; // current word WERD_IT it = &words; // words of ROW int16_t left; // of word int16_t prev_left; // old left if (!it.empty()) { word = it.data(); prev_left = word->bounding_box().left(); it.forward(); while (!it.at_first()) { word = it.data(); left = word->bounding_box().left(); if (left < prev_left) { it.move_to_first(); // words in BB order it.sort(word_comparator); break; } prev_left = left; it.forward(); } } for (it.mark_cycle_pt(); !it.cycled_list(); it.forward()) { word = it.data(); if (it.at_first()) { word->set_flag(W_BOL, true); } else { // not start of line word->set_flag(W_BOL, false); } if (it.at_last()) { word->set_flag(W_EOL, true); } else { // not end of line word->set_flag(W_EOL, false); } // extend BB as reqd bound_box += word->bounding_box(); } } /********************************************************************** * ROW::move * * Reposition row by vector **********************************************************************/ void ROW::move( // reposition row const ICOORD vec // by vector ) { WERD_IT it(&words); // word iterator for (it.mark_cycle_pt(); !it.cycled_list(); it.forward()) { it.data()->move(vec); } bound_box.move(vec); baseline.move(vec); } /********************************************************************** * ROW::print * * Display members **********************************************************************/ void ROW::print( // print FILE *fp // file to print on ) const { tprintf("Kerning= %d\n", kerning); tprintf("Spacing= %d\n", spacing); bound_box.print(); tprintf("Xheight= %f\n", xheight); tprintf("Ascrise= %f\n", ascrise); tprintf("Descdrop= %f\n", descdrop); tprintf("has_drop_cap= %d\n", has_drop_cap_); tprintf("lmargin= %d, rmargin= %d\n", lmargin_, rmargin_); } /********************************************************************** * ROW::plot * * Draw the ROW in the given colour. **********************************************************************/ #ifndef GRAPHICS_DISABLED void ROW::plot( // draw it ScrollView *window, // window to draw in ScrollView::Color colour // colour to draw in ) { WERD *word; // current word WERD_IT it = &words; // words of ROW for (it.mark_cycle_pt(); !it.cycled_list(); it.forward()) { word = it.data(); word->plot(window, colour); // all in one colour } } /********************************************************************** * ROW::plot * * Draw the ROW in rainbow colours. **********************************************************************/ void ROW::plot( // draw it ScrollView *window // window to draw in ) { WERD *word; // current word WERD_IT it = &words; // words of ROW for (it.mark_cycle_pt(); !it.cycled_list(); it.forward()) { word = it.data(); word->plot(window); // in rainbow colours } } #endif // !GRAPHICS_DISABLED /********************************************************************** * ROW::operator= * * Assign rows by duplicating the row structure but NOT the WERDLIST **********************************************************************/ ROW &ROW::operator=(const ROW &source) { this->ELIST_LINK::operator=(source); kerning = source.kerning; spacing = source.spacing; xheight = source.xheight; bodysize = source.bodysize; ascrise = source.ascrise; descdrop = source.descdrop; if (!words.empty()) { words.clear(); } baseline = source.baseline; // QSPLINES must do = bound_box = source.bound_box; has_drop_cap_ = source.has_drop_cap_; lmargin_ = source.lmargin_; rmargin_ = source.rmargin_; para_ = source.para_; return *this; } } // namespace tesseract
