tesseract::Textord Class Reference

#include <textord.h>

List of all members.

Public Member Functions

 Textord (CCStruct *ccstruct)
 ~Textord ()
void TextordPage (PageSegMode pageseg_mode, int width, int height, Pix *pix, BLOCK_LIST *blocks, TO_BLOCK_LIST *to_blocks)
void CleanupSingleRowResult (PageSegMode pageseg_mode, PAGE_RES *page_res)
bool use_cjk_fp_model () const
void set_use_cjk_fp_model (bool flag)
void to_spacing (ICOORD page_tr, TO_BLOCK_LIST *blocks)
ROW * make_prop_words (TO_ROW *row, FCOORD rotation)
ROW * make_blob_words (TO_ROW *row, FCOORD rotation)
void find_components (Pix *pix, BLOCK_LIST *blocks, TO_BLOCK_LIST *to_blocks)
void filter_blobs (ICOORD page_tr, TO_BLOCK_LIST *blocks, BOOL8 testing_on)

Public Attributes

bool textord_single_height_mode = false
bool tosp_old_to_method = false
bool tosp_old_to_constrain_sp_kn = false
bool tosp_only_use_prop_rows = true
bool tosp_force_wordbreak_on_punct = false
bool tosp_use_pre_chopping = false
bool tosp_old_to_bug_fix = false
bool tosp_block_use_cert_spaces = true
bool tosp_row_use_cert_spaces = true
bool tosp_narrow_blobs_not_cert = true
bool tosp_row_use_cert_spaces1 = true
bool tosp_recovery_isolated_row_stats = true
bool tosp_only_small_gaps_for_kern = false
bool tosp_all_flips_fuzzy = false
bool tosp_fuzzy_limit_all = true
bool tosp_stats_use_xht_gaps = true
bool tosp_use_xht_gaps = true
bool tosp_only_use_xht_gaps = false
bool tosp_rule_9_test_punct = false
bool tosp_flip_fuzz_kn_to_sp = true
bool tosp_flip_fuzz_sp_to_kn = true
bool tosp_improve_thresh = false
int tosp_debug_level = 0
int tosp_enough_space_samples_for_median = 3
int tosp_redo_kern_limit = 10
int tosp_few_samples = 40
int tosp_short_row = 20
int tosp_sanity_method = 1
double tosp_old_sp_kn_th_factor = 2.0
double tosp_threshold_bias1 = 0
double tosp_threshold_bias2 = 0
double tosp_narrow_fraction = 0.3
double tosp_narrow_aspect_ratio = 0.48
double tosp_wide_fraction = 0.52
double tosp_wide_aspect_ratio = 0.0
double tosp_fuzzy_space_factor = 0.6
double tosp_fuzzy_space_factor1 = 0.5
double tosp_fuzzy_space_factor2 = 0.72
double tosp_gap_factor = 0.83
double tosp_kern_gap_factor1 = 2.0
double tosp_kern_gap_factor2 = 1.3
double tosp_kern_gap_factor3 = 2.5
double tosp_ignore_big_gaps = -1
double tosp_ignore_very_big_gaps = 3.5
double tosp_rep_space = 1.6
double tosp_enough_small_gaps = 0.65
double tosp_table_kn_sp_ratio = 2.25
double tosp_table_xht_sp_ratio = 0.33
double tosp_table_fuzzy_kn_sp_ratio = 3.0
double tosp_fuzzy_kn_fraction = 0.5
double tosp_fuzzy_sp_fraction = 0.5
double tosp_min_sane_kn_sp = 1.5
double tosp_init_guess_kn_mult = 2.2
double tosp_init_guess_xht_mult = 0.28
double tosp_max_sane_kn_thresh = 5.0
double tosp_flip_caution = 0.0
double tosp_large_kerning = 0.19
double tosp_dont_fool_with_small_kerns = -1
double tosp_near_lh_edge = 0
double tosp_silly_kn_sp_gap = 0.2
double tosp_pass_wide_fuzz_sp_to_context = 0.75
bool textord_no_rejects = false
bool textord_show_blobs = false
bool textord_show_boxes = false
int textord_max_noise_size = 7
double textord_blob_size_bigile = 95
double textord_noise_area_ratio = 0.7
double textord_blob_size_smallile = 20
double textord_initialx_ile = 0.75
double textord_initialasc_ile = 0.90
int textord_noise_sizefraction = 10
double textord_noise_sizelimit = 0.5
int textord_noise_translimit = 16
double textord_noise_normratio = 2.0
bool textord_noise_rejwords = true
bool textord_noise_rejrows = true
double textord_noise_syfract = 0.2
double textord_noise_sxfract = 0.4
double textord_noise_hfract = 1.0/64
int textord_noise_sncount = 1
double textord_noise_rowratio = 6.0
bool textord_noise_debug = FALSE
double textord_blshift_maxshift = 0.00
double textord_blshift_xfraction = 9.99

Constructor & Destructor Documentation

tesseract::Textord::Textord ( CCStruct *  ccstruct  )  [explicit]
tesseract::Textord::~Textord (  ) 

Member Function Documentation

void tesseract::Textord::CleanupSingleRowResult ( PageSegMode  pageseg_mode,
PAGE_RES *  page_res 
)
void tesseract::Textord::filter_blobs ( ICOORD  page_tr,
TO_BLOCK_LIST *  blocks,
BOOL8  testing_on 
)
void tesseract::Textord::find_components ( Pix *  pix,
BLOCK_LIST *  blocks,
TO_BLOCK_LIST *  to_blocks 
)
ROW * tesseract::Textord::make_blob_words ( TO_ROW *  row,
FCOORD  rotation 
)
ROW * tesseract::Textord::make_prop_words ( TO_ROW *  row,
FCOORD  rotation 
)
void tesseract::Textord::set_use_cjk_fp_model ( bool  flag  )  [inline]
void tesseract::Textord::TextordPage ( PageSegMode  pageseg_mode,
int  width,
int  height,
Pix *  pix,
BLOCK_LIST *  blocks,
TO_BLOCK_LIST *  to_blocks 
)
void tesseract::Textord::to_spacing ( ICOORD  page_tr,
TO_BLOCK_LIST *  blocks 
)
bool tesseract::Textord::use_cjk_fp_model (  )  const [inline]

Member Data Documentation

"Percentile for large blobs"

"Percentile for small blobs"

"Max baseline shift"

"Min size of baseline shift"

"Ile of sizes for xheight guess"

"Ile of sizes for xheight guess"

"Pixel size of noise"

"Don't remove noise blobs"

"Fraction of bounding box for noise"

"Debug row garbage detector"

"Height fraction to discard outlines as speckle noise"

"Dot to norm ratio for deletion"

"Reject noise-like rows"

"Reject noise-like words"

"Dot to norm ratio for deletion"

"Fraction of size for maxima"

"Fraction of x for big t count"

"super norm blobs to save row"

"xh fract width error for norm blobs"

"xh fract error for norm blobs"

"Transitions for normal blob"

"Display unsorted blobs"

"Display boxes"

"Script has no xheight, so use a single mode for horizontal text"

"Pass ANY flip to context?"

"Only stat OBVIOUS spaces"

"Debug data"

"Limit use of xht gap with odd small kns"

"Fract of kerns reqd for isolated row stats"

"or should we use mean"

"No.gaps reqd with 1 large gap to treat as a table"

"Dont autoflip kn to sp when large separation"

"Default flip"

"Default flip"

"Force word breaks on punct to break long lines in non-space delimited langs"

"New fuzzy kn alg"

"Dont restrict kn->sp fuzzy limit to tables"

"New fuzzy sp alg"

"Fract of xheight for fuzz sp"

"Fract of xheight for fuzz sp"

"Fract of xheight for fuzz sp"

"gap ratio to flip sp->kern"

"xht multiplier"

"xht multiplier"

"Enable improvement heuristic"

"Thresh guess - mult kn by this"

"Thresh guess - mult xht by this"

"gap ratio to flip kern->sp"

"gap ratio to flip kern->sp"

"gap ratio to flip kern->sp"

"Limit use of xht gap with large kns"

"Multiplier on kn to limit thresh"

"Dont trust spaces less than this time kn"

"narrow if w/h less than this"

"Only stat OBVIOUS spaces"

"Fract of xheight for narrow"

"Dont reduce box if the top left is non blank"

"Factor for defining space threshold in terms of space and kern sizes"

"Fix suspected bug in old code"

"Constrain relative values of inter and intra-word gaps for old_to_method."

"Space stats use prechopping?"

"Better guess"

"Block stats to use fixed pitch rows?"

"Only use within xht gap for wd breaks"

"How wide fuzzies need context"

"Use row alone when inadequate cert spaces"

"No.samples reqd to reestimate for row"

"rep gap multiplier for space"

"Only stat OBVIOUS spaces"

"Only stat OBVIOUS spaces"

"Dont chng kn to space next to punct"

"How to avoid being silly"

"No.gaps reqd with few cert spaces to use certs"

"Dont let sp minus kn get too small"

"Use within xht gap for wd breaks"

"Fuzzy if less than this"

"Min difference of kn & sp in table"

"Expect spaces bigger than this"

"how far between kern and space?"

"how far between kern and space?"

"Space stats use prechopping?"

"Use within xht gap for wd breaks"

"wide if w/h less than this"

"Fract of xheight for wide"


The documentation for this class was generated from the following files:
Generated on Thu Feb 2 08:19:27 2012 for Tesseract by  doxygen 1.6.3