Fixed issue 6

jeff-cn · Dec 19, 2016 · cbbbf96 · cbbbf96
1 parent 0f0d6e9
commit cbbbf96
Show file tree

Hide file tree

Showing 3 changed files with 69 additions and 0 deletions.
diff --git a/mar/mar.config b/mar/mar.config
@@ -0,0 +1,23 @@
+# Use Tesseract/LSTM combiner
+# (see OcrEngineMode enum in third_party/tesseract/ccstruct/publictypes.h).
+tessedit_ocr_engine_mode	2
+
+# Devanagari configuration variables
+
+# Preprocess images to split shiro rekha
+pageseg_devanagari_split_strategy 1
+segment_nonalphabetic_script 1
+
+# Avoid over-estimating intra-word spacing at both row and
+# block levels when using the old "to" method (tosp_old_to_method)
+tosp_old_to_method T
+tosp_old_to_constrain_sp_kn T
+tosp_old_sp_kn_th_factor 4.0
+
+tosp_only_small_gaps_for_kern T
+tosp_use_pre_chopping T
+
+# Add a penalty for non-alphanumerics that are vertically badly positioned.
+classify_misfit_junk_penalty 0.125
+
+merge_fragments_in_matrix F
diff --git a/nep/nep.config b/nep/nep.config
@@ -0,0 +1,23 @@
+# Use Tesseract/LSTM combiner
+# (see OcrEngineMode enum in third_party/tesseract/ccstruct/publictypes.h).
+tessedit_ocr_engine_mode	2
+
+# Devanagari configuration variables
+
+# Preprocess images to split shiro rekha
+pageseg_devanagari_split_strategy 1
+segment_nonalphabetic_script 1
+
+# Avoid over-estimating intra-word spacing at both row and
+# block levels when using the old "to" method (tosp_old_to_method)
+tosp_old_to_method T
+tosp_old_to_constrain_sp_kn T
+tosp_old_sp_kn_th_factor 4.0
+
+tosp_only_small_gaps_for_kern T
+tosp_use_pre_chopping T
+
+# Add a penalty for non-alphanumerics that are vertically badly positioned.
+classify_misfit_junk_penalty 0.125
+
+merge_fragments_in_matrix F
diff --git a/san/san.config b/san/san.config
@@ -0,0 +1,23 @@
+# Use Tesseract/LSTM combiner
+# (see OcrEngineMode enum in third_party/tesseract/ccstruct/publictypes.h).
+tessedit_ocr_engine_mode	2
+
+# Devanagari configuration variables
+
+# Preprocess images to split shiro rekha
+pageseg_devanagari_split_strategy 1
+segment_nonalphabetic_script 1
+
+# Avoid over-estimating intra-word spacing at both row and
+# block levels when using the old "to" method (tosp_old_to_method)
+tosp_old_to_method T
+tosp_old_to_constrain_sp_kn T
+tosp_old_sp_kn_th_factor 4.0
+
+tosp_only_small_gaps_for_kern T
+tosp_use_pre_chopping T
+
+# Add a penalty for non-alphanumerics that are vertically badly positioned.
+classify_misfit_junk_penalty 0.125
+
+merge_fragments_in_matrix F