tesseract-doxygen/dict/permute.h File Reference

#include "choicearr.h"
#include "choices.h"
#include "ratngs.h"
#include "varable.h"

Go to the source code of this file.

Defines

#define RATING_PAD   4.0

Functions

void adjust_non_word (const char *word, const char *word_lengths, float rating, float *new_rating, float *adjust_factor)
const char * choose_il1 (const char *first_char, const char *second_char, const char *third_char, const char *prev_char, const char *next_char, const char *next_next_char)

Variables

int fragments_debug = 0
bool segment_debug = 0
bool permute_debug = 0
bool permute_script_word = 0
bool segment_segcost_rating = 0
double segment_reward_script = 0.95
double segment_penalty_garbage = 1.5
double segment_penalty_dict_nonword = 1.25
int permute_only_top
float wordseg_rating_adjust_factor

Define Documentation

#define RATING_PAD   4.0

Function Documentation

void adjust_non_word ( const char *  word,
const char *  word_lengths,
float  rating,
float *  new_rating,
float *  adjust_factor 
)
const char* choose_il1 ( const char *  first_char,
const char *  second_char,
const char *  third_char,
const char *  prev_char,
const char *  next_char,
const char *  next_next_char 
)

Variable Documentation

int fragments_debug = 0

"Debug character fragments"

"char permutation debug"

"Debug char permutation process"

"Turn on word script consistency permuter"

"Debug the whole segmentation process"

"Score multiplier for glyph fragment segmentations which " "do not match a dictionary word (lower is better)."

"Score multiplier for glyph fragment segmentations which do not " "match a dictionary word (lower is better)."

"Score multiplier for poorly cased strings that are not " "in the dictionary and generally look like garbage " "(lower is better)."

"Score multiplier for poorly cased strings that are not in the " "dictionary and generally look like garbage (lower is better)."

double segment_reward_script = 0.95

"Score multiplier for script consistency within a word. Being a 'reward' factor, it should be <= 1. Smaller value implies bigger reward."

"incorporate segmentation cost in word rating?"

Generated on Sun Jul 18 17:10:51 2010 for Tesseract by  doxygen 1.6.3