#include "varable.h"
#include "pageres.h"
#include "notdll.h"
Go to the source code of this file.
Functions | |
BOOL_EVAR_H (tessedit_write_block_separators, TRUE,"Write block separators in output") | |
BOOL_EVAR_H (tessedit_write_output, TRUE,"Write text to name.txt") | |
BOOL_EVAR_H (tessedit_write_txt_map, TRUE,"Write .txt to .etx map file") | |
BOOL_EVAR_H (tessedit_write_rep_codes, TRUE,"Write repetition char code") | |
BOOL_EVAR_H (tessedit_write_unlv, FALSE,"Write .unlv output file") | |
STRING_EVAR_H (unrecognised_char,"|","Output char for unidentified blobs") | |
INT_EVAR_H (suspect_level, 99,"Suspect marker level") | |
BOOL_EVAR_H (tessedit_minimal_rejection, FALSE,"Only reject tess failures") | |
void | write_results (PAGE_RES_IT &page_res_it, char newline_type, BOOL8 force_eol, BOOL8 write_to_shm) |
WERD_CHOICE * | make_epaper_choice (WERD_RES *word, char newline_type) |
inT16 | make_reject (TBOX *inset_box, inT16 prevright, inT16 nextleft, DENORM *denorm, char word_string[]) |
char | determine_newline_type (WERD *word, BLOCK *block, WERD *next_word, BLOCK *next_block) |
void | write_cooked_text (WERD *word, const STRING &text, BOOL8 acceptable, BOOL8 pass2, FILE *fp) |
void | write_shm_text (WERD_RES *word, BLOCK *block, ROW_RES *row, const STRING &text, const STRING &text_lengths) |
void | write_map (FILE *mapfile, WERD_RES *word) |
void | write_unlv_text (WERD_RES *word) |
void | ensure_rep_chars_are_consistent (WERD_RES *word) |
Variables | |
bool | tessedit_write_raw_output = FALSE |
int | suspect_space_level = 100 |
int | suspect_short_words = 2 |
bool | suspect_constrain_1Il = FALSE |
double | suspect_rating_per_ch = 999.9 |
double | suspect_accept_rating = -999.9 |
bool | tessedit_zero_rejection = FALSE |
bool | tessedit_word_for_word = FALSE |
bool | tessedit_consistent_reps = TRUE |
BOOL_EVAR_H (tessedit_minimal_rejection, FALSE, "Only reject tess failures")
BOOL_EVAR_H (tessedit_write_unlv, FALSE, "Write .unlv output file")
BOOL_EVAR_H (tessedit_write_rep_codes, TRUE, "Write repetition char code")
BOOL_EVAR_H (tessedit_write_txt_map, TRUE, "Write .txt to .etx map file")
BOOL_EVAR_H (tessedit_write_output, TRUE, "Write text to name.txt")
BOOL_EVAR_H (tessedit_write_block_separators, TRUE, "Write block separators in output")
char determine_newline_type (WERD *word, BLOCK *block, WERD *next_word, BLOCK *next_block)
test line ends
word | word to do | |
block | current block | |
next_word | next word | |
next_block | block of next word |
void ensure_rep_chars_are_consistent (WERD_RES *word)
INT_EVAR_H (suspect_level, 99, "Suspect marker level")
WERD_CHOICE * make_epaper_choice (WERD_RES *word, char newline_type)
convert one word
word | word to do | |
newline_type | type of newline |
inT16 make_reject (TBOX *inset_box, inT16 prevright, inT16 nextleft, DENORM *denorm, char word_string[])
make reject code
inset_box | bounding box | |
prevright | previous char | |
nextleft | next char | |
denorm | de-normalizer | |
word_string | output string |
STRING_EVAR_H (unrecognised_char, "|", "Output char for unidentified blobs")
void write_cooked_text (WERD *word, const STRING &text, BOOL8 acceptable, BOOL8 pass2, FILE *fp)
write output
word | word to do | |
text | text to write | |
acceptable | good stuff | |
pass2 | done on pass2 | |
fp | file to write |
void write_map (FILE *mapfile, WERD_RES *word)
output a map file
mapfile | mapfile to write to |
void write_results (PAGE_RES_IT &page_res_it, char newline_type, BOOL8 force_eol, BOOL8 write_to_shm)
output a word
page_res_it | full info | |
newline_type | type of newline | |
force_eol | override tilde crunch? | |
write_to_shm | send to api |
void write_shm_text (WERD_RES *word, BLOCK *block, ROW_RES *row, const STRING &text, const STRING &text_lengths)
write output
word | word to do | |
block | block it is from | |
row | row it is from | |
text | text to write |
void write_unlv_text (WERD_RES *word)
double suspect_accept_rating = -999.9 |
"Accept good rating limit"
bool suspect_constrain_1Il = FALSE |
"UNLV keep 1Il chars rejected"
double suspect_rating_per_ch = 999.9 |
"Dont touch bad rating limit"
int suspect_short_words = 2 |
"Dont Suspect dict wds longer than this"
int suspect_space_level = 100 |
"Min suspect level for rejecting spaces"
bool tessedit_consistent_reps = TRUE |
"Force all rep chars the same"
bool tessedit_word_for_word = FALSE |
"Make output have exactly one word per WERD"
bool tessedit_write_raw_output = FALSE |
"Write raw stuff to name.raw"
bool tessedit_zero_rejection = FALSE |
"Dont reject ANYTHING"