Tesseract
3.02
|
00001 /********************************************************************** 00002 * File: ocrblock.cpp (Formerly block.c) 00003 * Description: BLOCK member functions and iterator functions. 00004 * Author: Ray Smith 00005 * Created: Fri Mar 15 09:41:28 GMT 1991 00006 * 00007 * (C) Copyright 1991, Hewlett-Packard Ltd. 00008 ** Licensed under the Apache License, Version 2.0 (the "License"); 00009 ** you may not use this file except in compliance with the License. 00010 ** You may obtain a copy of the License at 00011 ** http://www.apache.org/licenses/LICENSE-2.0 00012 ** Unless required by applicable law or agreed to in writing, software 00013 ** distributed under the License is distributed on an "AS IS" BASIS, 00014 ** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 00015 ** See the License for the specific language governing permissions and 00016 ** limitations under the License. 00017 * 00018 **********************************************************************/ 00019 00020 #include "mfcpch.h" 00021 #include <stdlib.h> 00022 #include "blckerr.h" 00023 #include "ocrblock.h" 00024 #include "stepblob.h" 00025 #include "tprintf.h" 00026 00027 #define BLOCK_LABEL_HEIGHT 150 //char height of block id 00028 00029 ELISTIZE (BLOCK) 00035 BLOCK::BLOCK(const char *name, //< filename 00036 BOOL8 prop, //< proportional 00037 inT16 kern, //< kerning 00038 inT16 space, //< spacing 00039 inT16 xmin, //< bottom left 00040 inT16 ymin, inT16 xmax, //< top right 00041 inT16 ymax) 00042 : PDBLK (xmin, ymin, xmax, ymax), 00043 filename(name), 00044 re_rotation_(1.0f, 0.0f), 00045 classify_rotation_(1.0f, 0.0f), 00046 skew_(1.0f, 0.0f) { 00047 ICOORDELT_IT left_it = &leftside; 00048 ICOORDELT_IT right_it = &rightside; 00049 00050 proportional = prop; 00051 right_to_left_ = false; 00052 kerning = kern; 00053 spacing = space; 00054 font_class = -1; //not assigned 00055 cell_over_xheight_ = 2.0f; 00056 hand_poly = NULL; 00057 left_it.set_to_list (&leftside); 00058 right_it.set_to_list (&rightside); 00059 //make default box 00060 left_it.add_to_end (new ICOORDELT (xmin, ymin)); 00061 left_it.add_to_end (new ICOORDELT (xmin, ymax)); 00062 right_it.add_to_end (new ICOORDELT (xmax, ymin)); 00063 right_it.add_to_end (new ICOORDELT (xmax, ymax)); 00064 } 00065 00072 int decreasing_top_order( // 00073 const void *row1, 00074 const void *row2) { 00075 return (*(ROW **) row2)->bounding_box ().top () - 00076 (*(ROW **) row1)->bounding_box ().top (); 00077 } 00078 00079 00085 void BLOCK::rotate(const FCOORD& rotation) { 00086 poly_block()->rotate(rotation); 00087 box = *poly_block()->bounding_box(); 00088 } 00089 00096 void BLOCK::reflect_polygon_in_y_axis() { 00097 poly_block()->reflect_in_y_axis(); 00098 box = *poly_block()->bounding_box(); 00099 } 00100 00107 void BLOCK::sort_rows() { // order on "top" 00108 ROW_IT row_it(&rows); 00109 00110 row_it.sort (decreasing_top_order); 00111 } 00112 00113 00121 void BLOCK::compress() { // squash it up 00122 #define ROW_SPACING 5 00123 00124 ROW_IT row_it(&rows); 00125 ROW *row; 00126 ICOORD row_spacing (0, ROW_SPACING); 00127 00128 ICOORDELT_IT icoordelt_it; 00129 00130 sort_rows(); 00131 00132 box = TBOX (box.topleft (), box.topleft ()); 00133 box.move_bottom_edge (ROW_SPACING); 00134 for (row_it.mark_cycle_pt (); !row_it.cycled_list (); row_it.forward ()) { 00135 row = row_it.data (); 00136 row->move (box.botleft () - row_spacing - 00137 row->bounding_box ().topleft ()); 00138 box += row->bounding_box (); 00139 } 00140 00141 leftside.clear (); 00142 icoordelt_it.set_to_list (&leftside); 00143 icoordelt_it.add_to_end (new ICOORDELT (box.left (), box.bottom ())); 00144 icoordelt_it.add_to_end (new ICOORDELT (box.left (), box.top ())); 00145 rightside.clear (); 00146 icoordelt_it.set_to_list (&rightside); 00147 icoordelt_it.add_to_end (new ICOORDELT (box.right (), box.bottom ())); 00148 icoordelt_it.add_to_end (new ICOORDELT (box.right (), box.top ())); 00149 } 00150 00151 00159 void BLOCK::check_pitch() { // check prop 00160 // tprintf("Missing FFT fixed pitch stuff!\n"); 00161 pitch = -1; 00162 } 00163 00164 00171 void BLOCK::compress( // squash it up 00172 const ICOORD vec // and move 00173 ) { 00174 box.move (vec); 00175 compress(); 00176 } 00177 00178 00185 void BLOCK::print( //print list of sides 00186 FILE *, //< file to print on 00187 BOOL8 dump //< print full detail 00188 ) { 00189 ICOORDELT_IT it = &leftside; //iterator 00190 00191 box.print (); 00192 tprintf ("Proportional= %s\n", proportional ? "TRUE" : "FALSE"); 00193 tprintf ("Kerning= %d\n", kerning); 00194 tprintf ("Spacing= %d\n", spacing); 00195 tprintf ("Fixed_pitch=%d\n", pitch); 00196 tprintf ("Filename= %s\n", filename.string ()); 00197 00198 if (dump) { 00199 tprintf ("Left side coords are:\n"); 00200 for (it.mark_cycle_pt (); !it.cycled_list (); it.forward ()) 00201 tprintf ("(%d,%d) ", it.data ()->x (), it.data ()->y ()); 00202 tprintf ("\n"); 00203 tprintf ("Right side coords are:\n"); 00204 it.set_to_list (&rightside); 00205 for (it.mark_cycle_pt (); !it.cycled_list (); it.forward ()) 00206 tprintf ("(%d,%d) ", it.data ()->x (), it.data ()->y ()); 00207 tprintf ("\n"); 00208 } 00209 } 00210 00217 BLOCK & BLOCK::operator= ( //assignment 00218 const BLOCK & source //from this 00219 ) { 00220 this->ELIST_LINK::operator= (source); 00221 this->PDBLK::operator= (source); 00222 proportional = source.proportional; 00223 kerning = source.kerning; 00224 spacing = source.spacing; 00225 filename = source.filename; //STRINGs assign ok 00226 if (!rows.empty ()) 00227 rows.clear (); 00228 re_rotation_ = source.re_rotation_; 00229 classify_rotation_ = source.classify_rotation_; 00230 skew_ = source.skew_; 00231 return *this; 00232 } 00233 00234 // This function is for finding the approximate (horizontal) distance from 00235 // the x-coordinate of the left edge of a symbol to the left edge of the 00236 // text block which contains it. We are passed: 00237 // segments - output of PB_LINE_IT::get_line() which contains x-coordinate 00238 // intervals for the scan line going through the symbol's y-coordinate. 00239 // Each element of segments is of the form (x()=start_x, y()=length). 00240 // x - the x coordinate of the symbol we're interested in. 00241 // margin - return value, the distance from x,y to the left margin of the 00242 // block containing it. 00243 // If all segments were to the right of x, we return false and 0. 00244 bool LeftMargin(ICOORDELT_LIST *segments, int x, int *margin) { 00245 bool found = false; 00246 *margin = 0; 00247 if (segments->empty()) 00248 return found; 00249 ICOORDELT_IT seg_it(segments); 00250 for (seg_it.mark_cycle_pt(); !seg_it.cycled_list(); seg_it.forward()) { 00251 int cur_margin = x - seg_it.data()->x(); 00252 if (cur_margin >= 0) { 00253 if (!found) { 00254 *margin = cur_margin; 00255 } else if (cur_margin < *margin) { 00256 *margin = cur_margin; 00257 } 00258 found = true; 00259 } 00260 } 00261 return found; 00262 } 00263 00264 // This function is for finding the approximate (horizontal) distance from 00265 // the x-coordinate of the right edge of a symbol to the right edge of the 00266 // text block which contains it. We are passed: 00267 // segments - output of PB_LINE_IT::get_line() which contains x-coordinate 00268 // intervals for the scan line going through the symbol's y-coordinate. 00269 // Each element of segments is of the form (x()=start_x, y()=length). 00270 // x - the x coordinate of the symbol we're interested in. 00271 // margin - return value, the distance from x,y to the right margin of the 00272 // block containing it. 00273 // If all segments were to the left of x, we return false and 0. 00274 bool RightMargin(ICOORDELT_LIST *segments, int x, int *margin) { 00275 bool found = false; 00276 *margin = 0; 00277 if (segments->empty()) 00278 return found; 00279 ICOORDELT_IT seg_it(segments); 00280 for (seg_it.mark_cycle_pt(); !seg_it.cycled_list(); seg_it.forward()) { 00281 int cur_margin = seg_it.data()->x() + seg_it.data()->y() - x; 00282 if (cur_margin >= 0) { 00283 if (!found) { 00284 *margin = cur_margin; 00285 } else if (cur_margin < *margin) { 00286 *margin = cur_margin; 00287 } 00288 found = true; 00289 } 00290 } 00291 return found; 00292 } 00293 00294 // Compute the distance from the left and right ends of each row to the 00295 // left and right edges of the block's polyblock. Illustration: 00296 // ____________________________ _______________________ 00297 // | Howdy neighbor! | |rectangular blocks look| 00298 // | This text is written to| |more like stacked pizza| 00299 // |illustrate how useful poly- |boxes. | 00300 // |blobs are in ----------- ------ The polyblob| 00301 // |dealing with| _________ |for a BLOCK rec-| 00302 // |harder layout| /===========\ |ords the possibly| 00303 // |issues. | | _ _ | |skewed pseudo-| 00304 // | You see this| | |_| \|_| | |rectangular | 00305 // |text is flowed| | } | |boundary that| 00306 // |around a mid-| \ ____ | |forms the ideal-| 00307 // |cloumn portrait._____ \ / __|ized text margin| 00308 // | Polyblobs exist| \ / |from which we should| 00309 // |to account for insets| | | |measure paragraph| 00310 // |which make otherwise| ----- |indentation. | 00311 // ----------------------- ---------------------- 00312 // 00313 // If we identify a drop-cap, we measure the left margin for the lines 00314 // below the first line relative to one space past the drop cap. The 00315 // first line's margin and those past the drop cap area are measured 00316 // relative to the enclosing polyblock. 00317 // 00318 // TODO(rays): Before this will work well, we'll need to adjust the 00319 // polyblob tighter around the text near images, as in: 00320 // UNLV_AUTO:mag.3G0 page 2 00321 // UNLV_AUTO:mag.3G4 page 16 00322 void BLOCK::compute_row_margins() { 00323 if (row_list()->empty() || row_list()->singleton()) { 00324 return; 00325 } 00326 00327 // If Layout analysis was not called, default to this. 00328 POLY_BLOCK rect_block(bounding_box(), PT_FLOWING_TEXT); 00329 POLY_BLOCK *pblock = &rect_block; 00330 if (poly_block() != NULL) { 00331 pblock = poly_block(); 00332 } 00333 00334 // Step One: Determine if there is a drop-cap. 00335 // TODO(eger): Fix up drop cap code for RTL languages. 00336 ROW_IT r_it(row_list()); 00337 ROW *first_row = r_it.data(); 00338 ROW *second_row = r_it.data_relative(1); 00339 00340 // initialize the bottom of a fictitious drop cap far above the first line. 00341 int drop_cap_bottom = first_row->bounding_box().top() + 00342 first_row->bounding_box().height(); 00343 int drop_cap_right = first_row->bounding_box().left(); 00344 int mid_second_line = second_row->bounding_box().top() - 00345 second_row->bounding_box().height() / 2; 00346 WERD_IT werd_it(r_it.data()->word_list()); // words of line one 00347 if (!werd_it.empty()) { 00348 C_BLOB_IT cblob_it(werd_it.data()->cblob_list()); 00349 for (cblob_it.mark_cycle_pt(); !cblob_it.cycled_list(); 00350 cblob_it.forward()) { 00351 TBOX bbox = cblob_it.data()->bounding_box(); 00352 if (bbox.bottom() <= mid_second_line) { 00353 // we found a real drop cap 00354 first_row->set_has_drop_cap(true); 00355 if (drop_cap_bottom > bbox.bottom()) 00356 drop_cap_bottom = bbox.bottom(); 00357 if (drop_cap_right < bbox.right()) 00358 drop_cap_right = bbox.right(); 00359 } 00360 } 00361 } 00362 00363 // Step Two: Calculate the margin from the text of each row to the block 00364 // (or drop-cap) boundaries. 00365 PB_LINE_IT lines(pblock); 00366 r_it.set_to_list(row_list()); 00367 for (r_it.mark_cycle_pt(); !r_it.cycled_list(); r_it.forward()) { 00368 ROW *row = r_it.data(); 00369 TBOX row_box = row->bounding_box(); 00370 int left_y = row->base_line(row_box.left()) + row->x_height(); 00371 int left_margin; 00372 ICOORDELT_LIST *segments = lines.get_line(left_y); 00373 LeftMargin(segments, row_box.left(), &left_margin); 00374 delete segments; 00375 00376 if (row_box.top() >= drop_cap_bottom) { 00377 int drop_cap_distance = row_box.left() - row->space() - drop_cap_right; 00378 if (drop_cap_distance < 0) 00379 drop_cap_distance = 0; 00380 if (drop_cap_distance < left_margin) 00381 left_margin = drop_cap_distance; 00382 } 00383 00384 int right_y = row->base_line(row_box.right()) + row->x_height(); 00385 int right_margin; 00386 segments = lines.get_line(right_y); 00387 RightMargin(segments, row_box.right(), &right_margin); 00388 delete segments; 00389 row->set_lmargin(left_margin); 00390 row->set_rmargin(right_margin); 00391 } 00392 } 00393 00394 /********************************************************************** 00395 * PrintSegmentationStats 00396 * 00397 * Prints segmentation stats for the given block list. 00398 **********************************************************************/ 00399 00400 void PrintSegmentationStats(BLOCK_LIST* block_list) { 00401 int num_blocks = 0; 00402 int num_rows = 0; 00403 int num_words = 0; 00404 int num_blobs = 0; 00405 BLOCK_IT block_it(block_list); 00406 for (block_it.mark_cycle_pt(); !block_it.cycled_list(); block_it.forward()) { 00407 BLOCK* block = block_it.data(); 00408 ++num_blocks; 00409 ROW_IT row_it(block->row_list()); 00410 for (row_it.mark_cycle_pt(); !row_it.cycled_list(); row_it.forward()) { 00411 ++num_rows; 00412 ROW* row = row_it.data(); 00413 // Iterate over all werds in the row. 00414 WERD_IT werd_it(row->word_list()); 00415 for (werd_it.mark_cycle_pt(); !werd_it.cycled_list(); werd_it.forward()) { 00416 WERD* werd = werd_it.data(); 00417 ++num_words; 00418 num_blobs += werd->cblob_list()->length(); 00419 } 00420 } 00421 } 00422 tprintf("Block list stats:\nBlocks = %d\nRows = %d\nWords = %d\nBlobs = %d\n", 00423 num_blocks, num_rows, num_words, num_blobs); 00424 } 00425 00426 /********************************************************************** 00427 * ExtractBlobsFromSegmentation 00428 * 00429 * Extracts blobs from the given block list and adds them to the output list. 00430 * The block list must have been created by performing a page segmentation. 00431 **********************************************************************/ 00432 00433 void ExtractBlobsFromSegmentation(BLOCK_LIST* blocks, 00434 C_BLOB_LIST* output_blob_list) { 00435 C_BLOB_IT return_list_it(output_blob_list); 00436 BLOCK_IT block_it(blocks); 00437 for (block_it.mark_cycle_pt(); !block_it.cycled_list(); block_it.forward()) { 00438 BLOCK* block = block_it.data(); 00439 ROW_IT row_it(block->row_list()); 00440 for (row_it.mark_cycle_pt(); !row_it.cycled_list(); row_it.forward()) { 00441 ROW* row = row_it.data(); 00442 // Iterate over all werds in the row. 00443 WERD_IT werd_it(row->word_list()); 00444 for (werd_it.mark_cycle_pt(); !werd_it.cycled_list(); werd_it.forward()) { 00445 WERD* werd = werd_it.data(); 00446 return_list_it.move_to_last(); 00447 return_list_it.add_list_after(werd->cblob_list()); 00448 return_list_it.move_to_last(); 00449 return_list_it.add_list_after(werd->rej_cblob_list()); 00450 } 00451 } 00452 } 00453 } 00454 00455 /********************************************************************** 00456 * RefreshWordBlobsFromNewBlobs() 00457 * 00458 * Refreshes the words in the block_list by using blobs in the 00459 * new_blobs list. 00460 * Block list must have word segmentation in it. 00461 * It consumes the blobs provided in the new_blobs list. The blobs leftover in 00462 * the new_blobs list after the call weren't matched to any blobs of the words 00463 * in block list. 00464 * The output not_found_blobs is a list of blobs from the original segmentation 00465 * in the block_list for which no corresponding new blobs were found. 00466 **********************************************************************/ 00467 00468 void RefreshWordBlobsFromNewBlobs(BLOCK_LIST* block_list, 00469 C_BLOB_LIST* new_blobs, 00470 C_BLOB_LIST* not_found_blobs) { 00471 // Now iterate over all the blobs in the segmentation_block_list_, and just 00472 // replace the corresponding c-blobs inside the werds. 00473 BLOCK_IT block_it(block_list); 00474 for (block_it.mark_cycle_pt(); !block_it.cycled_list(); block_it.forward()) { 00475 BLOCK* block = block_it.data(); 00476 // Iterate over all rows in the block. 00477 ROW_IT row_it(block->row_list()); 00478 for (row_it.mark_cycle_pt(); !row_it.cycled_list(); row_it.forward()) { 00479 ROW* row = row_it.data(); 00480 // Iterate over all werds in the row. 00481 WERD_IT werd_it(row->word_list()); 00482 WERD_LIST new_words; 00483 WERD_IT new_words_it(&new_words); 00484 for (werd_it.mark_cycle_pt(); !werd_it.cycled_list(); werd_it.forward()) { 00485 WERD* werd = werd_it.extract(); 00486 WERD* new_werd = werd->ConstructWerdWithNewBlobs(new_blobs, 00487 not_found_blobs); 00488 if (new_werd) { 00489 // Insert this new werd into the actual row's werd-list. Remove the 00490 // existing one. 00491 new_words_it.add_after_then_move(new_werd); 00492 delete werd; 00493 } else { 00494 // Reinsert the older word back, for lack of better options. 00495 // This is critical since dropping the words messes up segmentation: 00496 // eg. 1st word in the row might otherwise have W_FUZZY_NON turned on. 00497 new_words_it.add_after_then_move(werd); 00498 } 00499 } 00500 // Get rid of the old word list & replace it with the new one. 00501 row->word_list()->clear(); 00502 werd_it.move_to_first(); 00503 werd_it.add_list_after(&new_words); 00504 } 00505 } 00506 }