/********************************************************************** * File: pithsync.cpp (Formerly pitsync2.c) * Description: Code to find the optimum fixed pitch segmentation of some blobs. * Author: Ray Smith * Created: Thu Nov 19 11:48:05 GMT 1992 * * (C) Copyright 1992, Hewlett-Packard Ltd. ** Licensed under the Apache License, Version 2.0 (the "License"); ** you may not use this file except in compliance with the License. ** You may obtain a copy of the License at ** http://www.apache.org/licenses/LICENSE-2.0 ** Unless required by applicable law or agreed to in writing, software ** distributed under the License is distributed on an "AS IS" BASIS, ** WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. ** See the License for the specific language governing permissions and ** limitations under the License. * **********************************************************************/ #include "mfcpch.h" #ifdef __UNIX__ #include #endif #include #include "memry.h" #include "makerow.h" #include "pitsync1.h" #include "topitch.h" #include "pithsync.h" #include "tprintf.h" #define PROJECTION_MARGIN 10 //arbitrary #define EXTERN /********************************************************************** * FPCUTPT::setup * * Constructor to make a new FPCUTPT. **********************************************************************/ void FPCUTPT::setup( //constructor FPCUTPT *cutpts, //predecessors INT16 array_origin, //start coord STATS *projection, //vertical occupation INT16 zero_count, //official zero INT16 pitch, //proposed pitch INT16 x, //position INT16 offset //dist to gap ) { //half of pitch INT16 half_pitch = pitch / 2 - 1; UINT32 lead_flag; //new flag INT32 ind; //current position if (half_pitch > 31) half_pitch = 31; else if (half_pitch < 0) half_pitch = 0; lead_flag = 1 << half_pitch; pred = NULL; mean_sum = 0; sq_sum = offset * offset; cost = sq_sum; faked = FALSE; terminal = FALSE; fake_count = 0; xpos = x; region_index = 0; mid_cuts = 0; if (x == array_origin) { back_balance = 0; fwd_balance = 0; for (ind = 0; ind <= half_pitch; ind++) { fwd_balance >>= 1; if (projection->pile_count (ind) > zero_count) fwd_balance |= lead_flag; } } else { back_balance = cutpts[x - 1 - array_origin].back_balance << 1; back_balance &= lead_flag + lead_flag - 1; if (projection->pile_count (x) > zero_count) back_balance |= 1; fwd_balance = cutpts[x - 1 - array_origin].fwd_balance >> 1; if (projection->pile_count (x + half_pitch) > zero_count) fwd_balance |= lead_flag; } } /********************************************************************** * FPCUTPT::assign * * Constructor to make a new FPCUTPT. **********************************************************************/ void FPCUTPT::assign( //constructor FPCUTPT *cutpts, //predecessors INT16 array_origin, //start coord INT16 x, //position BOOL8 faking, //faking this one BOOL8 mid_cut, //cheap cut. INT16 offset, //dist to gap STATS *projection, //vertical occupation float projection_scale, //scaling INT16 zero_count, //official zero INT16 pitch, //proposed pitch INT16 pitch_error //allowed tolerance ) { int index; //test index int balance_index; //for balance factor INT16 balance_count; //ding factor INT16 r_index; //test cut number FPCUTPT *segpt; //segment point INT32 dist; //from prev segment double sq_dist; //squared distance double mean; //mean pitch double total; //total dists double factor; //cost function //half of pitch INT16 half_pitch = pitch / 2 - 1; UINT32 lead_flag; //new flag if (half_pitch > 31) half_pitch = 31; else if (half_pitch < 0) half_pitch = 0; lead_flag = 1 << half_pitch; back_balance = cutpts[x - 1 - array_origin].back_balance << 1; back_balance &= lead_flag + lead_flag - 1; if (projection->pile_count (x) > zero_count) back_balance |= 1; fwd_balance = cutpts[x - 1 - array_origin].fwd_balance >> 1; if (projection->pile_count (x + half_pitch) > zero_count) fwd_balance |= lead_flag; xpos = x; cost = MAX_FLOAT32; pred = NULL; faked = faking; terminal = FALSE; region_index = 0; fake_count = MAX_INT16; for (index = x - pitch - pitch_error; index <= x - pitch + pitch_error; index++) { if (index >= array_origin) { segpt = &cutpts[index - array_origin]; dist = x - segpt->xpos; if (!segpt->terminal && segpt->fake_count < MAX_INT16) { balance_count = 0; if (textord_balance_factor > 0) { if (textord_fast_pitch_test) { lead_flag = back_balance ^ segpt->fwd_balance; balance_count = 0; while (lead_flag != 0) { balance_count++; lead_flag &= lead_flag - 1; } } else { for (balance_index = 0; index + balance_index < x - balance_index; balance_index++) balance_count += (projection->pile_count (index + balance_index) <= zero_count) ^ (projection->pile_count (x - balance_index) <= zero_count); } balance_count = (INT16) (balance_count * textord_balance_factor / projection_scale); } r_index = segpt->region_index + 1; total = segpt->mean_sum + dist; balance_count += offset; sq_dist = dist * dist + segpt->sq_sum + balance_count * balance_count; mean = total / r_index; factor = mean - pitch; factor *= factor; factor += sq_dist / (r_index) - mean * mean; if (factor < cost && segpt->fake_count + faked <= fake_count) { cost = factor; //find least cost pred = segpt; //save path mean_sum = total; sq_sum = sq_dist; fake_count = segpt->fake_count + faked; mid_cuts = segpt->mid_cuts + mid_cut; region_index = r_index; } } } } } /********************************************************************** * FPCUTPT::assign_cheap * * Constructor to make a new FPCUTPT on the cheap. **********************************************************************/ void FPCUTPT::assign_cheap( //constructor FPCUTPT *cutpts, //predecessors INT16 array_origin, //start coord INT16 x, //position BOOL8 faking, //faking this one BOOL8 mid_cut, //cheap cut. INT16 offset, //dist to gap STATS *projection, //vertical occupation float projection_scale, //scaling INT16 zero_count, //official zero INT16 pitch, //proposed pitch INT16 pitch_error //allowed tolerance ) { int index; //test index INT16 balance_count; //ding factor INT16 r_index; //test cut number FPCUTPT *segpt; //segment point INT32 dist; //from prev segment double sq_dist; //squared distance double mean; //mean pitch double total; //total dists double factor; //cost function //half of pitch INT16 half_pitch = pitch / 2 - 1; UINT32 lead_flag; //new flag if (half_pitch > 31) half_pitch = 31; else if (half_pitch < 0) half_pitch = 0; lead_flag = 1 << half_pitch; back_balance = cutpts[x - 1 - array_origin].back_balance << 1; back_balance &= lead_flag + lead_flag - 1; if (projection->pile_count (x) > zero_count) back_balance |= 1; fwd_balance = cutpts[x - 1 - array_origin].fwd_balance >> 1; if (projection->pile_count (x + half_pitch) > zero_count) fwd_balance |= lead_flag; xpos = x; cost = MAX_FLOAT32; pred = NULL; faked = faking; terminal = FALSE; region_index = 0; fake_count = MAX_INT16; index = x - pitch; if (index >= array_origin) { segpt = &cutpts[index - array_origin]; dist = x - segpt->xpos; if (!segpt->terminal && segpt->fake_count < MAX_INT16) { balance_count = 0; if (textord_balance_factor > 0) { lead_flag = back_balance ^ segpt->fwd_balance; balance_count = 0; while (lead_flag != 0) { balance_count++; lead_flag &= lead_flag - 1; } balance_count = (INT16) (balance_count * textord_balance_factor / projection_scale); } r_index = segpt->region_index + 1; total = segpt->mean_sum + dist; balance_count += offset; sq_dist = dist * dist + segpt->sq_sum + balance_count * balance_count; mean = total / r_index; factor = mean - pitch; factor *= factor; factor += sq_dist / (r_index) - mean * mean; cost = factor; //find least cost pred = segpt; //save path mean_sum = total; sq_sum = sq_dist; fake_count = segpt->fake_count + faked; mid_cuts = segpt->mid_cuts + mid_cut; region_index = r_index; } } } /********************************************************************** * check_pitch_sync * * Construct the lattice of possible segmentation points and choose the * optimal path. Return the optimal path only. * The return value is a measure of goodness of the sync. **********************************************************************/ double check_pitch_sync2( //find segmentation BLOBNBOX_IT *blob_it, //blobs to do INT16 blob_count, //no of blobs INT16 pitch, //pitch estimate INT16 pitch_error, //tolerance STATS *projection, //vertical INT16 projection_left, //edges //scale factor INT16 projection_right, float projection_scale, INT16 &occupation_count, //no of occupied cells FPSEGPT_LIST *seg_list, //output list INT16 start, //start of good range INT16 end //end of good range ) { BOOL8 faking; //illegal cut pt BOOL8 mid_cut; //cheap cut pt. INT16 x; //current coord INT16 blob_index; //blob number INT16 left_edge; //of word INT16 right_edge; //of word INT16 array_origin; //x coord of array INT16 offset; //dist to legal area INT16 zero_count; //projection zero INT16 best_left_x = 0; //for equals INT16 best_right_x = 0; //right edge BOX this_box; //bounding box BOX next_box; //box of next blob FPSEGPT *segpt; //segment point FPCUTPT *cutpts; //array of points double best_cost; //best path double mean_sum; //computes result FPCUTPT *best_end; //end of best path INT16 best_fake; //best fake level INT16 best_count; //no of cuts BLOBNBOX_IT this_it; //copy iterator FPSEGPT_IT seg_it = seg_list; //output iterator // tprintf("Computing sync on word of %d blobs with pitch %d\n", // blob_count, pitch); // if (blob_count==8 && pitch==27) // projection->print(stdout,TRUE); zero_count = 0; if (pitch < 3) pitch = 3; //nothing ludicrous if ((pitch - 3) / 2 < pitch_error) pitch_error = (pitch - 3) / 2; this_it = *blob_it; this_box = box_next (&this_it);//get box // left_edge=this_box.left(); //left of word // right_edge=this_box.right(); // for (blob_index=1;blob_indexright_edge) // right_edge=this_box.right(); // } for (left_edge = projection_left; projection->pile_count (left_edge) == 0 && left_edge < projection_right; left_edge++); for (right_edge = projection_right; projection->pile_count (right_edge) == 0 && right_edge > left_edge; right_edge--); ASSERT_HOST (right_edge >= left_edge); if (pitsync_linear_version >= 4) return check_pitch_sync3 (projection_left, projection_right, zero_count, pitch, pitch_error, projection, projection_scale, occupation_count, seg_list, start, end); array_origin = left_edge - pitch; cutpts = (FPCUTPT *) alloc_mem ((right_edge - left_edge + pitch * 2 + 1) * sizeof (FPCUTPT)); for (x = array_origin; x < left_edge; x++) //free cuts cutpts[x - array_origin].setup (cutpts, array_origin, projection, zero_count, pitch, x, 0); for (offset = 0; offset <= pitch_error; offset++, x++) //not quite free cutpts[x - array_origin].setup (cutpts, array_origin, projection, zero_count, pitch, x, offset); this_it = *blob_it; best_cost = MAX_FLOAT32; best_end = NULL; this_box = box_next (&this_it);//first box next_box = box_next (&this_it);//second box blob_index = 1; while (x < right_edge - pitch_error) { if (x > this_box.right () + pitch_error && blob_index < blob_count) { this_box = next_box; next_box = box_next (&this_it); blob_index++; } faking = FALSE; mid_cut = FALSE; if (x <= this_box.left ()) offset = 0; else if (x <= this_box.left () + pitch_error) offset = x - this_box.left (); else if (x >= this_box.right ()) offset = 0; else if (x >= next_box.left () && blob_index < blob_count) { offset = x - next_box.left (); if (this_box.right () - x < offset) offset = this_box.right () - x; } else if (x >= this_box.right () - pitch_error) offset = this_box.right () - x; else if (x - this_box.left () > pitch * pitsync_joined_edge && this_box.right () - x > pitch * pitsync_joined_edge) { mid_cut = TRUE; offset = 0; } else { faking = TRUE; offset = projection->pile_count (x); } cutpts[x - array_origin].assign (cutpts, array_origin, x, faking, mid_cut, offset, projection, projection_scale, zero_count, pitch, pitch_error); x++; } best_fake = MAX_INT16; best_cost = MAX_INT32; best_count = MAX_INT16; while (x < right_edge + pitch) { offset = x < right_edge ? right_edge - x : 0; cutpts[x - array_origin].assign (cutpts, array_origin, x, FALSE, FALSE, offset, projection, projection_scale, zero_count, pitch, pitch_error); cutpts[x - array_origin].terminal = TRUE; if (cutpts[x - array_origin].index () + cutpts[x - array_origin].fake_count <= best_count + best_fake) { if (cutpts[x - array_origin].fake_count < best_fake || (cutpts[x - array_origin].fake_count == best_fake && cutpts[x - array_origin].cost_function () < best_cost)) { best_fake = cutpts[x - array_origin].fake_count; best_cost = cutpts[x - array_origin].cost_function (); best_left_x = x; best_right_x = x; best_count = cutpts[x - array_origin].index (); } else if (cutpts[x - array_origin].fake_count == best_fake && x == best_right_x + 1 && cutpts[x - array_origin].cost_function () == best_cost) { //exactly equal best_right_x = x; } } x++; } ASSERT_HOST (best_fake < MAX_INT16); best_end = &cutpts[(best_left_x + best_right_x) / 2 - array_origin]; if (this_box.right () == textord_test_x && this_box.top () == textord_test_y) { for (x = left_edge - pitch; x < right_edge + pitch; x++) { tprintf ("x=%d, C=%g, s=%g, sq=%g, prev=%d\n", x, cutpts[x - array_origin].cost_function (), cutpts[x - array_origin].sum (), cutpts[x - array_origin].squares (), cutpts[x - array_origin].previous ()->position ()); } } occupation_count = -1; do { for (x = best_end->position () - pitch + pitch_error; x < best_end->position () - pitch_error && projection->pile_count (x) == 0; x++); if (x < best_end->position () - pitch_error) occupation_count++; //copy it segpt = new FPSEGPT (best_end); seg_it.add_before_then_move (segpt); best_end = best_end->previous (); } while (best_end != NULL); seg_it.move_to_last (); mean_sum = seg_it.data ()->sum (); mean_sum = mean_sum * mean_sum / best_count; if (seg_it.data ()->squares () - mean_sum < 0) tprintf ("Impossible sqsum=%g, mean=%g, total=%d\n", seg_it.data ()->squares (), seg_it.data ()->sum (), best_count); free_mem(cutpts); // tprintf("blob_count=%d, pitch=%d, sync=%g, occ=%d\n", // blob_count,pitch,seg_it.data()->squares()-mean_sum, // occupation_count); return seg_it.data ()->squares () - mean_sum; } /********************************************************************** * check_pitch_sync * * Construct the lattice of possible segmentation points and choose the * optimal path. Return the optimal path only. * The return value is a measure of goodness of the sync. **********************************************************************/ double check_pitch_sync3( //find segmentation INT16 projection_left, //edges //to be considered 0 INT16 projection_right, INT16 zero_count, INT16 pitch, //pitch estimate INT16 pitch_error, //tolerance STATS *projection, //vertical float projection_scale, //scale factor INT16 &occupation_count, //no of occupied cells FPSEGPT_LIST *seg_list, //output list INT16 start, //start of good range INT16 end //end of good range ) { BOOL8 faking; //illegal cut pt BOOL8 mid_cut; //cheap cut pt. INT16 left_edge; //of word INT16 right_edge; //of word INT16 x; //current coord INT16 array_origin; //x coord of array INT16 offset; //dist to legal area INT16 projection_offset; //from scaled projection INT16 prev_zero; //previous zero dist INT16 next_zero; //next zero dist INT16 zero_offset; //scan window INT16 best_left_x = 0; //for equals INT16 best_right_x = 0; //right edge FPSEGPT *segpt; //segment point FPCUTPT *cutpts; //array of points BOOL8 *mins; //local min results int minindex; //next input position int test_index; //index to mins double best_cost; //best path double mean_sum; //computes result FPCUTPT *best_end; //end of best path INT16 best_fake; //best fake level INT16 best_count; //no of cuts FPSEGPT_IT seg_it = seg_list; //output iterator end = (end - start) % pitch; if (pitch < 3) pitch = 3; //nothing ludicrous if ((pitch - 3) / 2 < pitch_error) pitch_error = (pitch - 3) / 2; //min dist of zero zero_offset = (INT16) (pitch * pitsync_joined_edge); for (left_edge = projection_left; projection->pile_count (left_edge) == 0 && left_edge < projection_right; left_edge++); for (right_edge = projection_right; projection->pile_count (right_edge) == 0 && right_edge > left_edge; right_edge--); array_origin = left_edge - pitch; cutpts = (FPCUTPT *) alloc_mem ((right_edge - left_edge + pitch * 2 + 1) * sizeof (FPCUTPT)); mins = (BOOL8 *) alloc_mem ((pitch_error * 2 + 1) * sizeof (BOOL8)); for (x = array_origin; x < left_edge; x++) //free cuts cutpts[x - array_origin].setup (cutpts, array_origin, projection, zero_count, pitch, x, 0); prev_zero = left_edge - 1; for (offset = 0; offset <= pitch_error; offset++, x++) //not quite free cutpts[x - array_origin].setup (cutpts, array_origin, projection, zero_count, pitch, x, offset); best_cost = MAX_FLOAT32; best_end = NULL; for (offset = -pitch_error, minindex = 0; offset < pitch_error; offset++, minindex++) mins[minindex] = projection->local_min (x + offset); next_zero = x + zero_offset + 1; for (offset = next_zero - 1; offset >= x; offset--) { if (projection->pile_count (offset) <= zero_count) { next_zero = offset; break; } } while (x < right_edge - pitch_error) { mins[minindex] = projection->local_min (x + pitch_error); minindex++; if (minindex > pitch_error * 2) minindex = 0; faking = FALSE; mid_cut = FALSE; offset = 0; if (projection->pile_count (x) <= zero_count) { prev_zero = x; } else { for (offset = 1; offset <= pitch_error; offset++) if (projection->pile_count (x + offset) <= zero_count || projection->pile_count (x - offset) <= zero_count) break; } if (offset > pitch_error) { if (x - prev_zero > zero_offset && next_zero - x > zero_offset) { for (offset = 0; offset <= pitch_error; offset++) { test_index = minindex + pitch_error + offset; if (test_index > pitch_error * 2) test_index -= pitch_error * 2 + 1; if (mins[test_index]) break; test_index = minindex + pitch_error - offset; if (test_index > pitch_error * 2) test_index -= pitch_error * 2 + 1; if (mins[test_index]) break; } } if (offset > pitch_error) { offset = projection->pile_count (x); faking = TRUE; } else { projection_offset = (INT16) (projection->pile_count (x) / projection_scale); if (projection_offset > offset) offset = projection_offset; mid_cut = TRUE; } } if ((start == 0 && end == 0) || !textord_fast_pitch_test || (x - projection_left - start) % pitch <= end) cutpts[x - array_origin].assign (cutpts, array_origin, x, faking, mid_cut, offset, projection, projection_scale, zero_count, pitch, pitch_error); else cutpts[x - array_origin].assign_cheap (cutpts, array_origin, x, faking, mid_cut, offset, projection, projection_scale, zero_count, pitch, pitch_error); x++; if (next_zero < x || next_zero == x + zero_offset) next_zero = x + zero_offset + 1; if (projection->pile_count (x + zero_offset) <= zero_count) next_zero = x + zero_offset; } best_fake = MAX_INT16; best_cost = MAX_INT32; best_count = MAX_INT16; while (x < right_edge + pitch) { offset = x < right_edge ? right_edge - x : 0; cutpts[x - array_origin].assign (cutpts, array_origin, x, FALSE, FALSE, offset, projection, projection_scale, zero_count, pitch, pitch_error); cutpts[x - array_origin].terminal = TRUE; if (cutpts[x - array_origin].index () + cutpts[x - array_origin].fake_count <= best_count + best_fake) { if (cutpts[x - array_origin].fake_count < best_fake || (cutpts[x - array_origin].fake_count == best_fake && cutpts[x - array_origin].cost_function () < best_cost)) { best_fake = cutpts[x - array_origin].fake_count; best_cost = cutpts[x - array_origin].cost_function (); best_left_x = x; best_right_x = x; best_count = cutpts[x - array_origin].index (); } else if (cutpts[x - array_origin].fake_count == best_fake && x == best_right_x + 1 && cutpts[x - array_origin].cost_function () == best_cost) { //exactly equal best_right_x = x; } } x++; } ASSERT_HOST (best_fake < MAX_INT16); best_end = &cutpts[(best_left_x + best_right_x) / 2 - array_origin]; // for (x=left_edge-pitch;xposition()); // } occupation_count = -1; do { for (x = best_end->position () - pitch + pitch_error; x < best_end->position () - pitch_error && projection->pile_count (x) == 0; x++); if (x < best_end->position () - pitch_error) occupation_count++; //copy it segpt = new FPSEGPT (best_end); seg_it.add_before_then_move (segpt); best_end = best_end->previous (); } while (best_end != NULL); seg_it.move_to_last (); mean_sum = seg_it.data ()->sum (); mean_sum = mean_sum * mean_sum / best_count; if (seg_it.data ()->squares () - mean_sum < 0) tprintf ("Impossible sqsum=%g, mean=%g, total=%d\n", seg_it.data ()->squares (), seg_it.data ()->sum (), best_count); free_mem(mins); free_mem(cutpts); return seg_it.data ()->squares () - mean_sum; }