#include "control.h"
#include "notdll.h"
Go to the source code of this file.
enum GARBAGE_LEVEL |
void print_boxes(WERD *word)
void reject_whole_page(PAGE_RES_IT &page_res_it)
BOOL8 terrible_word_crunch(WERD_RES *word, GARBAGE_LEVEL garbage_level)
void word_char_quality(WERD_RES *word, ROW *row, inT16 *match_count, inT16 *accepted_match_count)
Blob seg changes
CRUNCH_MODE word_deletable(WERD_RES *word, inT16 &delete_mode)
bool bland_unrej = FALSE |
"unrej potential with no checks"
"Use acceptability in okstring"
int crunch_debug = 0 |
"As it says"
double crunch_del_cert = -10.0 |
"POTENTIAL crunch cert lt this"
double crunch_del_high_word = 1.5 |
"Del if word gt xht x this above bl"
double crunch_del_low_word = 0.5 |
"Del if word gt xht x this below bl"
double crunch_del_max_ht = 3.0 |
"Del if word ht gt xht x this"
double crunch_del_min_ht = 0.7 |
"Del if word ht lt xht x this"
double crunch_del_min_width = 3.0 |
"Del if word width lt xht x this"
double crunch_del_rating = 60 |
"POTENTIAL crunch rating lt this"
"Take out ~^ early?"
"Before word crunch?"
bool crunch_include_numerals = FALSE |
"Fiddle alpha figures"
bool crunch_leave_accept_strings = FALSE |
"Dont pot crunch sensible strings"
int crunch_leave_lc_strings = 4 |
"Dont crunch words with long lower case strings"
"Dont touch sensible strings"
int crunch_leave_uc_strings = 4 |
"Dont crunch words with long upper case strings"
int crunch_long_repetitions = 3 |
"Crunch words with long repetitions"
double crunch_poor_garbage_cert = -9.0 |
"crunch garbage cert lt this"
double crunch_poor_garbage_rate = 60 |
"crunch garbage rating lt this"
"POTENTIAL crunch garbage"
int crunch_pot_indicators = 1 |
"How many potential indicators needed"
double crunch_pot_poor_cert = -8.0 |
"POTENTIAL crunch cert lt this"
double crunch_pot_poor_rate = 40 |
"POTENTIAL crunch rating lt this"
int crunch_rating_max = 10 |
"For adj length in rating per ch"
double crunch_small_outlines_size = 0.6 |
"Small if lt xht x this"
"As it says"
double crunch_terrible_rating = 80.0 |
"crunch rating lt this"
bool docqual_excuse_outline_errs = FALSE |
"Allow outline errs in unrejection?"
char* outlines_2 = "ij!?%\":;" |
"Non standard number of outlines"
char* outlines_odd = "%| " |
"Non standard number of outlines"
double quality_rowrej_pc = 1.1 |
"good_quality_doc gte good char limit"
bool tessedit_debug_doc_rejection = FALSE |
"Page stats"
bool tessedit_debug_quality_metrics = FALSE |
"Output data to debug file"
bool tessedit_dont_blkrej_good_wds = FALSE |
"Use word segmentation quality metric"
bool tessedit_dont_rowrej_good_wds = FALSE |
"Use word segmentation quality metric"
double tessedit_good_doc_still_rowrej_wd = 1.1 |
"rej good doc wd if more than this fraction rejected"
"Reduce rejection on good docs"
"Only rej partially rejected words in block rejection"
int tessedit_preserve_min_wd_len = 2 |
"Only preserve wds longer than this"
"Only rej partially rejected words in row rejection"
"Reject all bad quality wds"
double tessedit_reject_block_percent = 45.00 |
"%rej allowed before rej whole block"
double tessedit_reject_doc_percent = 65.00 |
"%rej allowed before rej whole doc"
double tessedit_reject_row_percent = 40.00 |
"%rej allowed before rej whole row"
"Apply row rejection to good docs"
"Reject spaces?"
double tessedit_whole_wd_rej_row_percent = 70.00 |
"%of row rejects in whole word rejects which prevents whole row rejection"
"Mark v.bad words for tilde crunch"