Skip to content
GitLab
Menu
Projects
Groups
Snippets
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Sign in
Toggle navigation
Menu
Open sidebar
smarthec
smarthec_backend
Commits
4024f970
Commit
4024f970
authored
Jul 08, 2021
by
Robert Sachunsky
Browse files
workflow: use wolf binarization, fix whitelisting
parent
c5b7ddbb
Changes
1
Hide whitespace changes
Inline
Side-by-side
smarthec-sparse-tesseract-deu.mk
View file @
4024f970
...
...
@@ -102,15 +102,17 @@ $(RECOGNIZED): OPTIONS = -P model deu \
-P textequiv_level glyph
\
-P xpath_parameters
\
'{ "contains(@custom
,
\"
zeitraum
\"
)":
\
{ "char_whitelist": "0123456789.
,
-" }
,
\
{ "
tessedit_
char_whitelist": "0123456789.
,
-
" }
,
\
"contains(@custom
,
\"
kost
\"
) and not(contains(@custom
,
\"
anteil
\"
))":
\
{ "char_whitelist": "0123456789.
,
" }
,
\
"contains(@custom
,
\"
einheiten
\"
) or contains(@custom
,
\"
temperatur
\"
)":
\
{ "char_whitelist": "0123456789." }
,
\
{ "tessedit_char_whitelist": "0123456789.
,
€" }
,
\
"contains(@custom
,
\"
einheiten
\"
) or contains(@custom
,
\"
_flaeche
\"
) or contains(@custom
,
\"
_verbrauch
\"
) and not(contains(@custom(
\"
_einheit
\"
)))":
\
{ "tessedit_char_whitelist": "0123456789.
,
" }
,
\
"contains(@custom
,
\"
temperatur
\"
)":
\
{ "tessedit_char_whitelist": "0123456789" }
,
\
"contains(@custom
,
\"
anteil
\"
)":
\
{ "char_whitelist": "0123456789%" }
,
\
{ "
tessedit_
char_whitelist": "0123456789%" }
,
\
"contains(@custom
,
\"
_einheit
\"
)":
\
{ "char_whitelist": "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz23²³." }
\
{ "
tessedit_
char_whitelist": "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz23²³." }
\
}'
.DEFAULT_GOAL
=
$(RECOGNIZED)
...
...
Robert Sachunsky
@sachunsky
mentioned in commit
12934c0e
·
Aug 24, 2021
mentioned in commit
12934c0e
mentioned in commit 12934c0e92181f00561eaacb4840ed7a5008f45a
Toggle commit list
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment