tesseract  v4.0.0-17-g361f3264
Open Source OCR Engine
tesseract::Dict Member List

This is the complete list of members for tesseract::Dict, including all inherited members.

absolute_garbage(const WERD_CHOICE &word, const UNICHARSET &unicharset)  tesseract::Dict
AcceptableChoice(const WERD_CHOICE &best_choice, XHeightConsistencyEnum xheight_consistency)  tesseract::Dict
AcceptableResult(WERD_RES *word) const  tesseract::Dict
add_document_word(const WERD_CHOICE &best_choice)  tesseract::Dict
adjust_word(WERD_CHOICE *word, bool nonword, XHeightConsistencyEnum xheight_consistency, float additional_adjust, bool modify_rating, bool debug)  tesseract::Dict
apostrophe_unichar_id_  tesseract::Dict  private
append_choices(const char *debug, const BLOB_CHOICE_LIST_VECTOR &char_choices, const BLOB_CHOICE &blob_choice, int char_choice_index, const CHAR_FRAGMENT_INFO *prev_char_frag_info, WERD_CHOICE *word, float certainties[], float *limit, WERD_CHOICE *best_choice, int *attempts_left, void *more_args)  tesseract::Dict
bigram_dawg_  tesseract::Dict  private
BOOL_VAR_H(load_system_dawg, true, "Load system word dawg.")  tesseract::Dict
BOOL_VAR_H(load_freq_dawg, true, "Load frequent word dawg.")  tesseract::Dict
BOOL_VAR_H(load_unambig_dawg, true, "Load unambiguous word dawg.")  tesseract::Dict
BOOL_VAR_H(load_punc_dawg, true, "Load dawg with punctuation patterns.")  tesseract::Dict
BOOL_VAR_H(load_number_dawg, true, "Load dawg with number patterns.")  tesseract::Dict
BOOL_VAR_H(load_bigram_dawg, true, "Load dawg with special word bigrams.")  tesseract::Dict
BOOL_VAR_H(use_only_first_uft8_step, false, "Use only the first UTF8 step of the given string" " when computing log probabilities.")  tesseract::Dict
BOOL_VAR_H(stopper_no_acceptable_choices, false, "Make AcceptableChoice() always return false. Useful" " when there is a need to explore all segmentations")  tesseract::Dict
BOOL_VAR_H(segment_nonalphabetic_script, false, "Don't use any alphabetic-specific tricks." "Set to true in the traineddata config file for" " scripts that are cursive or inherently fixed-pitch")  tesseract::Dict
BOOL_VAR_H(save_doc_words, 0, "Save Document Words")  tesseract::Dict
CallParamsModelClassify(void *path)  tesseract::Dict  inline
case_ok(const WERD_CHOICE &word, const UNICHARSET &unicharset) const  tesseract::Dict
ccutil_  tesseract::Dict  private
char_for_dawg(const UNICHARSET &unicharset, UNICHAR_ID ch, const Dawg *dawg) const  tesseract::Dict  inline
compound_marker(UNICHAR_ID unichar_id)  tesseract::Dict  inline
copy_hyphen_info(WERD_CHOICE *word) const  tesseract::Dict  inline
dang_ambigs_table_  tesseract::Dict  private
dawg_cache_  tesseract::Dict  private
dawg_cache_is_ours_  tesseract::Dict  private
dawg_permute_and_select(const BLOB_CHOICE_LIST_VECTOR &char_choices, float rating_limit)  tesseract::Dict
dawgs_  tesseract::Dict  private
DebugWordChoices()  tesseract::Dict
def_letter_is_okay(void *void_dawg_args, const UNICHARSET &unicharset, UNICHAR_ID unichar_id, bool word_end) const  tesseract::Dict
def_probability_in_context(const char *lang, const char *context, int context_bytes, const char *character, int character_bytes)  tesseract::Dict  inline
default_dawgs(DawgPositionVector *anylength_dawgs, bool suppress_patterns) const  tesseract::Dict
Dict(CCUtil *image_ptr)  tesseract::Dict
document_words_  tesseract::Dict  private
double_VAR_H(xheight_penalty_subscripts, 0.125, "Score penalty (0.1 = 10%) added if there are subscripts " "or superscripts in a word, but it is otherwise OK.")  tesseract::Dict
double_VAR_H(xheight_penalty_inconsistent, 0.25, "Score penalty (0.1 = 10%) added if an xheight is " "inconsistent.")  tesseract::Dict
double_VAR_H(segment_penalty_dict_frequent_word, 1.0, "Score multiplier for word matches which have good case and" "are frequent in the given language (lower is better).")  tesseract::Dict
double_VAR_H(segment_penalty_dict_case_ok, 1.1, "Score multiplier for word matches that have good case " "(lower is better).")  tesseract::Dict
double_VAR_H(segment_penalty_dict_case_bad, 1.3125, "Default score multiplier for word matches, which may have " "case issues (lower is better).")  tesseract::Dict
double_VAR_H(segment_penalty_dict_nonword, 1.25, "Score multiplier for glyph fragment segmentations which " "do not match a dictionary word (lower is better).")  tesseract::Dict
double_VAR_H(segment_penalty_garbage, 1.50, "Score multiplier for poorly cased strings that are not in" " the dictionary and generally look like garbage (lower is" " better).")  tesseract::Dict
double_VAR_H(certainty_scale, 20.0, "Certainty scaling factor")  tesseract::Dict
double_VAR_H(stopper_nondict_certainty_base, -2.50, "Certainty threshold for non-dict words")  tesseract::Dict
double_VAR_H(stopper_phase2_certainty_rejection_offset, 1.0, "Reject certainty offset")  tesseract::Dict
double_VAR_H(stopper_certainty_per_char, -0.50, "Certainty to add for each dict char above small word size.")  tesseract::Dict
double_VAR_H(stopper_allowable_character_badness, 3.0, "Max certaintly variation allowed in a word (in sigma)")  tesseract::Dict
double_VAR_H(doc_dict_pending_threshold, 0.0, "Worst certainty for using pending dictionary")  tesseract::Dict
double_VAR_H(doc_dict_certainty_threshold, -2.25, "Worst certainty" " for words that can be inserted into the document dictionary")  tesseract::Dict
End()  tesseract::Dict
EndDangerousAmbigs()  tesseract::Dict
equivalent_symbols_  tesseract::Dict  private
FinishLoad()  tesseract::Dict
fragment_state_okay(UNICHAR_ID curr_unichar_id, float curr_rating, float curr_certainty, const CHAR_FRAGMENT_INFO *prev_char_frag_info, const char *debug, int word_ending, CHAR_FRAGMENT_INFO *char_frag_info)  tesseract::Dict
freq_dawg_  tesseract::Dict  private
getCCUtil() const  tesseract::Dict  inline
getCCUtil()  tesseract::Dict  inline
GetDawg(int index) const  tesseract::Dict  inline
GetPuncDawg() const  tesseract::Dict  inline
GetStartingNode(const Dawg *dawg, EDGE_REF edge_ref)  tesseract::Dict  inline static
GetUnambigDawg() const  tesseract::Dict  inline
getUnicharAmbigs() const  tesseract::Dict  inline
getUnicharset() const  tesseract::Dict  inline
getUnicharset()  tesseract::Dict  inline
GlobalDawgCache()  tesseract::Dict  static
go_deeper_dawg_fxn(const char *debug, const BLOB_CHOICE_LIST_VECTOR &char_choices, int char_choice_index, const CHAR_FRAGMENT_INFO *prev_char_frag_info, bool word_ending, WERD_CHOICE *word, float certainties[], float *limit, WERD_CHOICE *best_choice, int *attempts_left, void *void_more_args)  tesseract::Dict
go_deeper_fxn_  tesseract::Dict
good_choice(const WERD_CHOICE &choice)  tesseract::Dict
has_hyphen_end(UNICHAR_ID unichar_id, bool first_pos) const  tesseract::Dict  inline
has_hyphen_end(const WERD_CHOICE &word) const  tesseract::Dict  inline
hyphen_active_dawgs_  tesseract::Dict  private
hyphen_base_size() const  tesseract::Dict  inline
hyphen_unichar_id_  tesseract::Dict  private
hyphen_word_  tesseract::Dict  private
hyphenated() const  tesseract::Dict  inline
init_active_dawgs(DawgPositionVector *active_dawgs, bool ambigs_mode) const  tesseract::Dict
INT_VAR_H(dawg_debug_level, 0, "Set to 1 for general debug info" ", to 2 for more details, to 3 to see all the debug messages")  tesseract::Dict
INT_VAR_H(hyphen_debug_level, 0, "Debug level for hyphenated words.")  tesseract::Dict
INT_VAR_H(max_viterbi_list_size, 10, "Maximum size of viterbi list.")  tesseract::Dict
INT_VAR_H(stopper_smallword_size, 2, "Size of dict word to be treated as non-dict word")  tesseract::Dict
INT_VAR_H(stopper_debug_level, 0, "Stopper debug level")  tesseract::Dict
INT_VAR_H(tessedit_truncate_wordchoice_log, 10, "Max words to keep in list")  tesseract::Dict
INT_VAR_H(fragments_debug, 0, "Debug character fragments")  tesseract::Dict
INT_VAR_H(max_permuter_attempts, 10000, "Maximum number of different" " character choices to consider during permutation." " This limit is especially useful when user patterns" " are specified, since overly generic patterns can result in" " dawg search exploring an overly large number of options.")  tesseract::Dict
is_apostrophe(UNICHAR_ID unichar_id)  tesseract::Dict  inline
IsSpaceDelimitedLang() const  tesseract::Dict
last_word_on_line_  tesseract::Dict  private
LengthOfShortestAlphaRun(const WERD_CHOICE &WordChoice) const  tesseract::Dict
letter_is_okay_  tesseract::Dict
LetterIsOkay(void *void_dawg_args, const UNICHARSET &unicharset, UNICHAR_ID unichar_id, bool word_end) const  tesseract::Dict  inline
Load(const STRING &lang, TessdataManager *data_file)  tesseract::Dict
LoadLSTM(const STRING &lang, TessdataManager *data_file)  tesseract::Dict
ngram_probability_in_context(const char *lang, const char *context, int context_bytes, const char *character, int character_bytes)  tesseract::Dict
NoDangerousAmbig(WERD_CHOICE *BestChoice, DANGERR *fixpt, bool fix_replaceable, MATRIX *ratings)  tesseract::Dict
NumDawgs() const  tesseract::Dict  inline
output_ambig_words_file_  tesseract::Dict  private
params_model_classify_  tesseract::Dict
ParamsModelClassify(const char *lang, void *path)  tesseract::Dict
pending_words_  tesseract::Dict  private
permute_choices(const char *debug, const BLOB_CHOICE_LIST_VECTOR &char_choices, int char_choice_index, const CHAR_FRAGMENT_INFO *prev_char_frag_info, WERD_CHOICE *word, float certainties[], float *limit, WERD_CHOICE *best_choice, int *attempts_left, void *more_args)  tesseract::Dict
probability_in_context_  tesseract::Dict
ProbabilityInContext(const char *context, int context_bytes, const char *character, int character_bytes)  tesseract::Dict  inline
ProcessPatternEdges(const Dawg *dawg, const DawgPosition &info, UNICHAR_ID unichar_id, bool word_end, DawgArgs *dawg_args, PermuterType *current_permuter) const  tesseract::Dict
punc_dawg_  tesseract::Dict  private
question_unichar_id_  tesseract::Dict  private
reject_offset_  tesseract::Dict  private
replace_ambigs_table_  tesseract::Dict  private
ReplaceAmbig(int wrong_ngram_begin_index, int wrong_ngram_size, UNICHAR_ID correct_ngram_id, WERD_CHOICE *werd_choice, MATRIX *ratings)  tesseract::Dict
reset_hyphen_vars(bool last_word_on_line)  tesseract::Dict
ResetDocumentDictionary()  tesseract::Dict  inline
set_hyphen_word(const WERD_CHOICE &word, const DawgPositionVector &active_dawgs)  tesseract::Dict
SettupStopperPass1()  tesseract::Dict
SettupStopperPass2()  tesseract::Dict
SetupForLoad(DawgCache *dawg_cache)  tesseract::Dict
SetWildcardID(UNICHAR_ID id)  tesseract::Dict  inline
SetWordsegRatingAdjustFactor(float f)  tesseract::Dict  inline
slash_unichar_id_  tesseract::Dict  private
STRING_VAR_H(user_words_file, "", "A filename of user-provided words.")  tesseract::Dict
STRING_VAR_H(user_words_suffix, "", "A suffix of user-provided words located in tessdata.")  tesseract::Dict
STRING_VAR_H(user_patterns_file, "", "A filename of user-provided patterns.")  tesseract::Dict
STRING_VAR_H(user_patterns_suffix, "", "A suffix of user-provided patterns located in tessdata.")  tesseract::Dict
STRING_VAR_H(output_ambig_words_file, "", "Output file for ambiguities found in the dictionary")  tesseract::Dict
STRING_VAR_H(word_to_debug, "", "Word for which stopper debug information" " should be printed to stdout")  tesseract::Dict
STRING_VAR_H(word_to_debug_lengths, "", "Lengths of unichars in word_to_debug")  tesseract::Dict
successors_  tesseract::Dict  private
unambig_dawg_  tesseract::Dict  private
UniformCertainties(const WERD_CHOICE &word)  tesseract::Dict
update_best_choice(const WERD_CHOICE &word, WERD_CHOICE *best_choice)  tesseract::Dict  inline
valid_bigram(const WERD_CHOICE &word1, const WERD_CHOICE &word2) const  tesseract::Dict
valid_punctuation(const WERD_CHOICE &word)  tesseract::Dict
valid_word(const WERD_CHOICE &word, bool numbers_ok) const  tesseract::Dict
valid_word(const WERD_CHOICE &word) const  tesseract::Dict  inline
valid_word(const char *string) const  tesseract::Dict  inline
valid_word_or_number(const WERD_CHOICE &word) const  tesseract::Dict  inline
valid_word_permuter(uint8_t perm, bool numbers_ok)  tesseract::Dict  inline static
wildcard_unichar_id_  tesseract::Dict  private
WildcardID() const  tesseract::Dict  inline
wordseg_rating_adjust_factor_  tesseract::Dict  private
~Dict()  tesseract::Dict