#include "varable.h"
#include "ocrblock.h"
#include "ratngs.h"
#include "statistc.h"
#include "ocrshell.h"
#include "pageres.h"
#include "charsample.h"
#include "notdll.h"
Go to the source code of this file.
Module-independent matcher controller.
typedef BOOL8(* BLOB_REJECTOR)(PBLOB *, BLOB_CHOICE_IT *, void *) |
enum ACCEPTABLE_WERD_TYPE |
good chars in word
row | current row | |
fonts | font stats | |
italic | output count | |
bold | output count |
void choice_dump_tester(PBLOB *, DENORM *, BOOL8 correct, char *text, inT32 count, BLOB_CHOICE_LIST *ratings)
dump chars in word
correct | correctly segmented |
text | correct text | |
count | chars in text | |
ratings | list of results |
good chars in word
fonts | font stats | |
font_out | output font | |
font_count | output count |
void fix_hyphens(WERD_CHOICE *choice, WERD *word, BLOB_CHOICE_LIST_CLIST *blob_choices)
crunch double hyphens
choice | string to fix | |
word | word to do | |
blob_choices | char choices |
recognize one word
word | word to do |
combine 2 blobs
blob1 | dest blob | |
blob2 | source blob |
char* chs_leading_punct = "('`\"" |
"Leading punctuation"
char* chs_trailing_punct1 = ").,;:?!" |
"1st Trailing punctuation"
char* chs_trailing_punct2 = ")'`\"" |
"2nd Trailing punctuation"
bool debug_acceptable_wds = FALSE |
"Dump word pass/fail chk"
int debug_x_ht_level = 0 |
"Reestimate debug"
double quality_blob_pc = 0.0 |
"good_quality_doc gte good blobs limit"
double quality_char_pc = 0.95 |
"good_quality_doc gte good char limit"
int quality_min_initial_alphas_reqd = 2 |
"alphas in a good word"
double quality_outline_pc = 1.0 |
"good_quality_doc lte outline error limit"
double quality_rej_pc = 0.08 |
"good_quality_doc lte rejection limit"
"Individual rejection control"
bool save_best_choices = FALSE |
"Save the results of the recognition step" " (blob_choices) within the corresponding WERD_CHOICE"
bool tessedit_adaption_debug = FALSE |
"Generate and print debug information for adaption"
"Adapt using clusterer after pass 1"
"Adapt using clusterer after pass 1"
"Adapt using clusterer after pass 1"
"Adapt using clusterer before Tess adaping during pass 1"
int tessedit_cluster_adaption_mode = 0 |
"Adaptation decision algorithm for matrix matcher"
"Do our own adaption - ems only"
bool tessedit_debug_block_rejection = FALSE |
"Block and Row stats"
bool tessedit_draw_outwords = FALSE |
"Draw output words"
bool tessedit_draw_words = FALSE |
"Draw source words"
bool tessedit_dump_choices = FALSE |
"Dump char choices"
int tessedit_em_adaption_mode = 62 |
"Adaptation decision algorithm for ems matrix matcher"
"Add words to the document dictionary"
"Try to improve fuzzy spaces"
"Crunch double hyphens?"
bool tessedit_global_adaption = FALSE |
"Adapt to all docs over time"
bool tessedit_matcher_is_wiseowl = FALSE |
"Call WO to classify"
bool tessedit_matcher_log = FALSE |
"Log matcher activity"
bool tessedit_minimal_rej_pass1 = FALSE |
"Do minimal rejection on pass 1 output"
bool tessedit_print_text = FALSE |
"Write text to stdout"
"Check/Correct x-height"
bool tessedit_reject_fullstops = FALSE |
"Reject all fullstops"
"Reject suspect fullstops"
int tessedit_single_match = FALSE |
"Top choice only from CP"
bool tessedit_tess_adapt_to_rejmap = FALSE |
"Use reject map to control Tesseract adaption"
int tessedit_tess_adaption_mode = 3 |
"Adaptation decision algorithm for tess"
bool tessedit_test_adaption = FALSE |
"Test adaption criteria"
int tessedit_test_adaption_mode = 3 |
"Adaptation decision algorithm for tess"
bool tessedit_training_tess = FALSE |
"Call Tess to learn blobs"
bool tessedit_training_wiseowl = FALSE |
"Call WO to learn blobs"
bool tessedit_unrej_any_wd = FALSE |
"Dont bother with word plausibility"
"Apply xht fix up even if done"
"Apply xht fix up even in no rejects"
double test_pt_x = 99999.99 |
"xcoord"
double test_pt_y = 99999.99 |
"ycoord"
bool word_occ_first = FALSE |
"Do word occ before re-est xht"
int x_ht_check_word_occ = 2 |
"Check Char Block occupancy"
"Dont allow worse quality"
int x_ht_stringency = 1 |
"How many confirmed a/n to accept?"