tesseract-doxygen/ccmain/reject.h File Reference

#include "varable.h"
#include "pageres.h"
#include "notdll.h"

Go to the source code of this file.

Functions

void reject_blanks (WERD_RES *word)
void reject_I_1_L (WERD_RES *word)
void reject_poor_matches (WERD_RES *word, BLOB_CHOICE_LIST_CLIST *blob_choices)
float compute_reject_threshold (BLOB_CHOICE_LIST_CLIST *blob_choices)
int sort_floats (const void *arg1, const void *arg2)
void reject_edge_blobs (WERD_RES *word)
BOOL8 word_contains_non_1_digit (const char *word, const char *word_lengths)
inT16 nn_match_char (IMAGE &scaled_image, float baseline_pos, BOOL8 dict_word, BOOL8 checked_dict_word, BOOL8 sensible_word, BOOL8 centre, BOOL8 good_quality_word, char tess_ch)
inT16 evaluate_net_match (char top, float top_score, char next, float next_score, char tess_ch, BOOL8 dict_word, BOOL8 checked_dict_word, BOOL8 sensible_word, BOOL8 centre, BOOL8 good_quality_word)
void dont_allow_dubious_chars (WERD_RES *word)
void dont_allow_1Il (WERD_RES *word)
void reject_mostly_rejects (WERD_RES *word)
void flip_hyphens (WERD_RES *word)
void flip_0O (WERD_RES *word)
BOOL8 non_0_digit (const char *str, int length)

Variables

int tessedit_reject_mode = 5
int tessedit_ok_mode = 5
bool tessedit_use_nn = TRUE
bool tessedit_rejection_debug = FALSE
bool tessedit_rejection_stats = FALSE
bool tessedit_flip_0O = TRUE
double tessedit_lower_flip_hyphen = 1.5
double tessedit_upper_flip_hyphen = 1.8
bool rej_trust_doc_dawg = FALSE
bool rej_1Il_use_dict_word = FALSE
bool rej_1Il_trust_permuter_type = TRUE
bool one_ell_conflict_default = TRUE
bool show_char_clipping = FALSE
bool nn_debug = FALSE
bool nn_reject_debug = FALSE
bool nn_lax = FALSE
bool nn_double_check_dict = FALSE
bool nn_conf_double_check_dict = TRUE
bool nn_conf_1Il = TRUE
bool nn_conf_Ss = TRUE
bool nn_conf_hyphen = TRUE
bool nn_conf_test_good_qual = FALSE
bool nn_conf_test_dict = TRUE
bool nn_conf_test_sensible = TRUE
bool nn_conf_strict_on_dodgy_chs = TRUE
double nn_dodgy_char_threshold = 0.99
int nn_conf_accept_level = 4
int nn_conf_initial_i_level = 3
bool no_unrej_dubious_chars = TRUE
bool no_unrej_no_alphanum_wds = TRUE
bool no_unrej_1Il = FALSE
bool rej_use_tess_accepted = TRUE
bool rej_use_tess_blanks = TRUE
bool rej_use_good_perm = TRUE
bool rej_use_sensible_wd = FALSE
bool rej_alphas_in_number_perm = FALSE
double rej_whole_of_mostly_reject_word_fract = 0.85
int rej_mostly_reject_mode = 1
double tessed_fullstop_aspect_ratio = 1.2
int net_image_width = 40
int net_image_height = 36
int net_image_x_height = 22
int tessedit_image_border = 2
int net_bl_nodes = 20
double nn_reject_threshold = 0.5
double nn_reject_head_and_shoulders = 0.6
char * ok_single_ch_non_alphanum_wds = "-?\075"
char * ok_repeated_ch_non_alphanum_wds = "-?*\075"
char * conflict_set_I_l_1 = "Il1[]"
char * conflict_set_S_s = "Ss$"
char * conflict_set_hyphen = "-_~"
char * dubious_chars_left_of_reject = "!'+`()-./\<>;:^_,~\""
char * dubious_chars_right_of_reject = "!'+`()-./\<>;:^_,~\""
int min_sane_x_ht_pixels = 8

Function Documentation

float compute_reject_threshold ( BLOB_CHOICE_LIST_CLIST *  blob_choices  ) 
void dont_allow_1Il ( WERD_RES *  word  ) 
void dont_allow_dubious_chars ( WERD_RES *  word  ) 
inT16 evaluate_net_match ( char  top,
float  top_score,
char  next,
float  next_score,
char  tess_ch,
BOOL8  dict_word,
BOOL8  checked_dict_word,
BOOL8  sensible_word,
BOOL8  centre,
BOOL8  good_quality_word 
)
void flip_0O ( WERD_RES *  word  ) 
void flip_hyphens ( WERD_RES *  word  ) 
inT16 nn_match_char ( IMAGE &  scaled_image,
float  baseline_pos,
BOOL8  dict_word,
BOOL8  checked_dict_word,
BOOL8  sensible_word,
BOOL8  centre,
BOOL8  good_quality_word,
char  tess_ch 
)
BOOL8 non_0_digit ( const char *  str,
int  length 
)
void reject_blanks ( WERD_RES *  word  ) 
void reject_edge_blobs ( WERD_RES *  word  ) 
void reject_I_1_L ( WERD_RES *  word  ) 
void reject_mostly_rejects ( WERD_RES *  word  ) 
void reject_poor_matches ( WERD_RES *  word,
BLOB_CHOICE_LIST_CLIST *  blob_choices 
)
int sort_floats ( const void *  arg1,
const void *  arg2 
) [inline]
BOOL8 word_contains_non_1_digit ( const char *  word,
const char *  word_lengths 
)

Variable Documentation

char* conflict_set_hyphen = "-_~"

"hyphen conflict set"

char* conflict_set_I_l_1 = "Il1[]"

"Il1 conflict set"

char* conflict_set_S_s = "Ss$"

"Ss conflict set"

char* dubious_chars_left_of_reject = "!'+`()-./\<>;:^_,~\""

"Unreliable chars"

char* dubious_chars_right_of_reject = "!'+`()-./\<>;:^_,~\""

"Unreliable chars"

int min_sane_x_ht_pixels = 8

"Reject any x-ht lt or eq than this"

int net_bl_nodes = 20

"Number of baseline nodes"

int net_image_height = 36

"NN input image height"

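int net_image_width = 40

"NN input image width"

int net_image_x_height = 22

"NN input image x_height"

bool nn_conf_1Il = TRUE

"NN use 1Il conflicts"

int nn_conf_accept_level = 4

"NN accept dodgy 1Il matches? "

bool nn_conf_double_check_dict = TRUE

"Double check for confusions"

bool nn_conf_hyphen = TRUE

"NN hyphen conflicts"

int nn_conf_initial_i_level = 3

"NN accept initial Ii match level "

bool nn_conf_Ss = TRUE

"NN use Ss conflicts"

bool nn_conf_strict_on_dodgy_chs = TRUE

"Require stronger NN match"

bool nn_conf_test_dict = TRUE

"NN dodgy 1Il cross check"

bool nn_conf_test_good_qual = FALSE

"NN dodgy 1Il cross check"

bool nn_conf_test_sensible = TRUE

"NN dodgy 1Il cross check"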

bool nn_debug = FALSE

"NN DEBUGGING?"

double nn_dodgy_char_threshold = 0.99

"min accept score"

bool nn_double_check_dict = FALSE

"Double check"

bool nn_lax = FALSE

"Use 2nd rate matches"

bool nn_reject_debug = FALSE

"NN DEBUG each char?"

double nn_reject_head_and_shoulders = 0.6

"top scores sep factor"

double nn_reject_threshold = 0.5

"NN min accept score"

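bool no_unrej_1Il = FALSE

"Stop unrej of 1Ilchars?"

bool no_unrej_dubious_chars = TRUE

"Dubious chars next to reject?"

bool no_unrej_no_alphanum_wds = TRUE

"Stop unrej of non A/N wds?"

char* ok_repeated_ch_non_alphanum_wds = "-?*\075"

"Allow NN to unrej"

char* ok_single_ch_non_alphanum_wds = "-?\075"

"Allow NN to unrej"

bool one_ell_conflict_default = TRUE

"one_ell_conflict default"

bool rej_1Il_trust_permuter_type = TRUE

"Dont double check"

bool rej_1Il_use_dict_word = FALSE

"Use dictword test"

bool rej_alphas_in_number_perm = FALSE

"Extend permuter check"

int rej_mostly_reject_mode = 1

"0-never, 1-afterNN, 2-after new xht"

bool rej_trust_doc_dawg = FALSE

"Use DOC dawg in 11l conf. detector"

bool rej_use_good_perm = TRUE

"Individual rejection control"

bool rej_use_sensible_wd = FALSE

"Extend permuter check"

bool rej_use_tess_accepted = TRUE

"Individual rejection control"

bool rej_use_tess_blanks = TRUE

"Individual rejection control"

double rej_whole_of_mostly_reject_word_fract = 0.85

"if >this fract"

bool show_char_clipping = FALSE

"Show clip image window?"

double tessed_fullstop_aspect_ratio = 1.2

"if >this fract then reject"

bool tessedit_flip_0O = TRUE

"Contextual 0O O0 flips"

int tessedit_image_border = 2

"Rej blbs near image edge limit"

double tessedit_lower_flip_hyphen = 1.5

"Aspect ratio dot/hyphen test"

int tessedit_ok_mode = 5

"Acceptance decision algorithm"

int tessedit_reject_mode = 5

"Rejection algorithm"

bool tessedit_rejection_debug = FALSE

"Adaption debug"

bool tessedit_rejection_stats = FALSE

"Show NN stats"

double tessedit_upper_flip_hyphen = 1.8

"Aspect ratio dot/hyphen test"

bool tessedit_use_nn = TRUE

""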

Generated on Sun Jul 18 17:10:49 2010 for Tesseract by  doxygen 1.6.3