Skip to content

Commit

Permalink
Adding tesseract back
Browse files Browse the repository at this point in the history
  • Loading branch information
astutejoe committed Jul 6, 2021
1 parent 76a8849 commit 39536ab
Show file tree
Hide file tree
Showing 38 changed files with 146 additions and 0 deletions.
8 changes: 8 additions & 0 deletions tesseract/tessdata/configs/Makefile.am
Original file line number Diff line number Diff line change
@@ -0,0 +1,8 @@
# Redirect datadir so that everything listed in data_DATA is installed
# into the tessdata/configs subdirectory of the configured data directory.
datadir = @datadir@/tessdata/configs

data_DATA = \
  inter makebox box.train unlv ambigs.train lstm.train lstmdebug \
  api_config kannada box.train.stderr quiet logfile digits get.images \
  lstmbox wordstrbox

# Configurations for OCR output.
data_DATA += alto hocr pdf tsv txt

data_DATA += linebox rebox strokewidth bigram

# NOTE(review): a `bazaar` config file also lives in this directory but is
# not listed above, so it is neither installed nor distributed -- confirm
# whether that omission is intentional.

# Ship every installed config file in the distribution tarball as well.
EXTRA_DIST = $(data_DATA)
1 change: 1 addition & 0 deletions tesseract/tessdata/configs/alto
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
tessedit_create_alto 1
7 changes: 7 additions & 0 deletions tesseract/tessdata/configs/ambigs.train
Original file line number Diff line number Diff line change
@@ -0,0 +1,7 @@
tessedit_ambigs_training 1
load_freq_dawg 0
load_punc_dawg 0
load_system_dawg 0
load_number_dawg 0
ambigs_debug_level 3
load_fixed_length_dawgs 0
1 change: 1 addition & 0 deletions tesseract/tessdata/configs/api_config
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
tessedit_zero_rejection T
4 changes: 4 additions & 0 deletions tesseract/tessdata/configs/bazaar
Original file line number Diff line number Diff line change
@@ -0,0 +1,4 @@
load_system_dawg F
load_freq_dawg F
user_words_suffix user-words
user_patterns_suffix user-patterns
5 changes: 5 additions & 0 deletions tesseract/tessdata/configs/bigram
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
load_bigram_dawg True
tessedit_enable_bigram_correction True
tessedit_bigram_debug 3
save_raw_choices True
save_alt_choices True
12 changes: 12 additions & 0 deletions tesseract/tessdata/configs/box.train
Original file line number Diff line number Diff line change
@@ -0,0 +1,12 @@
disable_character_fragments T
file_type .bl
textord_fast_pitch_test T
tessedit_zero_rejection T
tessedit_minimal_rejection F
tessedit_write_rep_codes F
edges_children_fix F
edges_childarea 0.65
edges_boxarea 0.9
tessedit_resegment_from_boxes T
tessedit_train_from_boxes T
textord_no_rejects T
13 changes: 13 additions & 0 deletions tesseract/tessdata/configs/box.train.stderr
Original file line number Diff line number Diff line change
@@ -0,0 +1,13 @@
file_type .bl
#tessedit_use_nn F
textord_fast_pitch_test T
tessedit_zero_rejection T
tessedit_minimal_rejection F
tessedit_write_rep_codes F
edges_children_fix F
edges_childarea 0.65
edges_boxarea 0.9
tessedit_resegment_from_boxes T
tessedit_train_from_boxes T
#textord_repeat_extraction F
textord_no_rejects T
1 change: 1 addition & 0 deletions tesseract/tessdata/configs/digits
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
tessedit_char_whitelist 0123456789-.
1 change: 1 addition & 0 deletions tesseract/tessdata/configs/get.images
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
tessedit_write_images T
2 changes: 2 additions & 0 deletions tesseract/tessdata/configs/hocr
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
tessedit_create_hocr 1
hocr_font_info 0
2 changes: 2 additions & 0 deletions tesseract/tessdata/configs/inter
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
interactive_display_mode T
tessedit_display_outwords T
4 changes: 4 additions & 0 deletions tesseract/tessdata/configs/kannada
Original file line number Diff line number Diff line change
@@ -0,0 +1,4 @@
textord_skewsmooth_offset 8
textord_skewsmooth_offset2 8
textord_merge_desc 0.5
textord_no_rejects 1
2 changes: 2 additions & 0 deletions tesseract/tessdata/configs/linebox
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
tessedit_resegment_from_line_boxes 1
tessedit_make_boxes_from_boxes 1
1 change: 1 addition & 0 deletions tesseract/tessdata/configs/logfile
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
debug_file tesseract.log
11 changes: 11 additions & 0 deletions tesseract/tessdata/configs/lstm.train
Original file line number Diff line number Diff line change
@@ -0,0 +1,11 @@
file_type .bl
textord_fast_pitch_test T
tessedit_zero_rejection T
tessedit_minimal_rejection F
tessedit_write_rep_codes F
edges_children_fix F
edges_childarea 0.65
edges_boxarea 0.9
tessedit_train_line_recognizer T
textord_no_rejects T
tessedit_init_config_only T
1 change: 1 addition & 0 deletions tesseract/tessdata/configs/lstmbox
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
tessedit_create_lstmbox 1
4 changes: 4 additions & 0 deletions tesseract/tessdata/configs/lstmdebug
Original file line number Diff line number Diff line change
@@ -0,0 +1,4 @@
stopper_debug_level 1
classify_debug_level 1
segsearch_debug_level 1
language_model_debug_level 3
1 change: 1 addition & 0 deletions tesseract/tessdata/configs/makebox
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
tessedit_create_boxfile 1
1 change: 1 addition & 0 deletions tesseract/tessdata/configs/pdf
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
tessedit_create_pdf 1
1 change: 1 addition & 0 deletions tesseract/tessdata/configs/quiet
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
debug_file /dev/null
2 changes: 2 additions & 0 deletions tesseract/tessdata/configs/rebox
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
tessedit_resegment_from_boxes 1
tessedit_make_boxes_from_boxes 1
12 changes: 12 additions & 0 deletions tesseract/tessdata/configs/strokewidth
Original file line number Diff line number Diff line change
@@ -0,0 +1,12 @@
textord_show_blobs 0
textord_debug_tabfind 3
textord_tabfind_show_partitions 1
textord_tabfind_show_initial_partitions 1
textord_tabfind_show_columns 1
textord_tabfind_show_blocks 1
textord_tabfind_show_initialtabs 1
textord_tabfind_show_finaltabs 1
textord_tabfind_show_strokewidths 1
textord_tabfind_show_vlines 0
textord_tabfind_show_images 1
tessedit_dump_pageseg_images 0
1 change: 1 addition & 0 deletions tesseract/tessdata/configs/tsv
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
tessedit_create_tsv 1
3 changes: 3 additions & 0 deletions tesseract/tessdata/configs/txt
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
# This config file should be used with other config files which create renderers.
# usage example: tesseract eurotext.tif eurotext txt hocr pdf
tessedit_create_txt 1
2 changes: 2 additions & 0 deletions tesseract/tessdata/configs/unlv
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
tessedit_write_unlv 1
unlv_tilde_crunching T
1 change: 1 addition & 0 deletions tesseract/tessdata/configs/wordstrbox
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
tessedit_create_wordstrbox 1
Binary file added tesseract/tessdata/eng.traineddata
Binary file not shown.
2 changes: 2 additions & 0 deletions tesseract/tessdata/eng.user-patterns
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
1-\d\d\d-GOOG-411
www.\n\\\*.com
5 changes: 5 additions & 0 deletions tesseract/tessdata/eng.user-words
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
the
quick
brown
fox
jumped
Binary file added tesseract/tessdata/pdf.ttf
Binary file not shown.
3 changes: 3 additions & 0 deletions tesseract/tessdata/tessconfigs/Makefile.am
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
# Redirect datadir so that everything listed in data_DATA is installed
# into the tessdata/tessconfigs subdirectory of the configured data directory.
datadir = @datadir@/tessdata/tessconfigs
data_DATA = batch batch.nochop nobatch matdemo segdemo msdemo
# Distribute exactly the files that are installed. Referencing data_DATA
# instead of repeating the names keeps the two lists from drifting apart.
EXTRA_DIST = $(data_DATA)
1 change: 1 addition & 0 deletions tesseract/tessdata/tessconfigs/batch
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
# No content needed as all defaults are correct.
2 changes: 2 additions & 0 deletions tesseract/tessdata/tessconfigs/batch.nochop
Original file line number Diff line number Diff line change
@@ -0,0 +1,2 @@
chop_enable 0
wordrec_enable_assoc 0
7 changes: 7 additions & 0 deletions tesseract/tessdata/tessconfigs/matdemo
Original file line number Diff line number Diff line change
@@ -0,0 +1,7 @@
#################################################
# Adaptive Matcher Using PreAdapted Templates
#################################################

classify_enable_adaptive_debugger 1
matcher_debug_flags 6
matcher_debug_level 1
12 changes: 12 additions & 0 deletions tesseract/tessdata/tessconfigs/msdemo
Original file line number Diff line number Diff line change
@@ -0,0 +1,12 @@
#################################################
# Adaptive Matcher Using PreAdapted Templates
#################################################

classify_enable_adaptive_debugger 1
matcher_debug_flags 6
matcher_debug_level 1

wordrec_display_splits 0
wordrec_display_all_blobs 1
wordrec_display_segmentations 2
classify_debug_level 1
1 change: 1 addition & 0 deletions tesseract/tessdata/tessconfigs/nobatch
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@

9 changes: 9 additions & 0 deletions tesseract/tessdata/tessconfigs/segdemo
Original file line number Diff line number Diff line change
@@ -0,0 +1,9 @@
#################################################
# Adaptive Matcher Using PreAdapted Templates
#################################################

wordrec_display_splits 0
wordrec_display_all_blobs 1
wordrec_display_segmentations 2
classify_debug_level 1
stopper_debug_level 1

0 comments on commit 39536ab

Please sign in to comment.