#include "control.h"
#include "notdll.h"

Go to the source code of this file.
| enum GARBAGE_LEVEL |
| void print_boxes(WERD *word) |
| void reject_whole_page(PAGE_RES_IT &page_res_it) |
| BOOL8 terrible_word_crunch(WERD_RES *word, GARBAGE_LEVEL garbage_level) |
| void word_char_quality(WERD_RES *word, ROW *row, inT16 *match_count, inT16 *accepted_match_count) |
Blob seg changes
| CRUNCH_MODE word_deletable(WERD_RES *word, inT16 &delete_mode) |
| bool bland_unrej = FALSE |
"unrej potential with no checks"
"Use acceptability in okstring"
| int crunch_debug = 0 |
"As it says"
| double crunch_del_cert = -10.0 |
"POTENTIAL crunch cert lt this"
| double crunch_del_high_word = 1.5 |
"Del if word gt xht x this above bl"
| double crunch_del_low_word = 0.5 |
"Del if word gt xht x this below bl"
| double crunch_del_max_ht = 3.0 |
"Del if word ht gt xht x this"
| double crunch_del_min_ht = 0.7 |
"Del if word ht lt xht x this"
| double crunch_del_min_width = 3.0 |
"Del if word width lt xht x this"
| double crunch_del_rating = 60 |
"POTENTIAL crunch rating lt this"
"Take out ~^ early?"
"Before word crunch?"
| bool crunch_include_numerals = FALSE |
"Fiddle alpha figures"
| bool crunch_leave_accept_strings = FALSE |
"Dont pot crunch sensible strings"
| int crunch_leave_lc_strings = 4 |
"Dont crunch words with long lower case strings"
"Dont touch sensible strings"
| int crunch_leave_uc_strings = 4 |
"Dont crunch words with long upper case strings"
| int crunch_long_repetitions = 3 |
"Crunch words with long repetitions"
| double crunch_poor_garbage_cert = -9.0 |
"crunch garbage cert lt this"
| double crunch_poor_garbage_rate = 60 |
"crunch garbage rating lt this"
"POTENTIAL crunch garbage"
| int crunch_pot_indicators = 1 |
"How many potential indicators needed"
| double crunch_pot_poor_cert = -8.0 |
"POTENTIAL crunch cert lt this"
| double crunch_pot_poor_rate = 40 |
"POTENTIAL crunch rating lt this"
| int crunch_rating_max = 10 |
"For adj length in rating per ch"
| double crunch_small_outlines_size = 0.6 |
"Small if lt xht x this"
"As it says"
| double crunch_terrible_rating = 80.0 |
"crunch rating lt this"
| bool docqual_excuse_outline_errs = FALSE |
"Allow outline errs in unrejection?"
| char* outlines_2 = "ij!?%\":;" |
"Non standard number of outlines"
| char* outlines_odd = "%| " |
"Non standard number of outlines"
| double quality_rowrej_pc = 1.1 |
"good_quality_doc gte good char limit"
| bool tessedit_debug_doc_rejection = FALSE |
"Page stats"
| bool tessedit_debug_quality_metrics = FALSE |
"Output data to debug file"
| bool tessedit_dont_blkrej_good_wds = FALSE |
"Use word segmentation quality metric"
| bool tessedit_dont_rowrej_good_wds = FALSE |
"Use word segmentation quality metric"
| double tessedit_good_doc_still_rowrej_wd = 1.1 |
"rej good doc wd if more than this fraction rejected"
"Reduce rejection on good docs"
"Only rej partially rejected words in block rejection"
| int tessedit_preserve_min_wd_len = 2 |
"Only preserve wds longer than this"
"Only rej partially rejected words in row rejection"
"Reject all bad quality wds"
| double tessedit_reject_block_percent = 45.00 |
"%rej allowed before rej whole block"
| double tessedit_reject_doc_percent = 65.00 |
"%rej allowed before rej whole doc"
| double tessedit_reject_row_percent = 40.00 |
"%rej allowed before rej whole row"
"Apply row rejection to good docs"
"Reject spaces?"
| double tessedit_whole_wd_rej_row_percent = 70.00 |
"%of row rejects in whole word rejects which prevents whole row rejection"
"Mark v.bad words for tilde crunch"
1.6.3