@@ -12,23 +12,6 @@ all: all-tess all-hunspell
12
12
13
13
TESS_MODELS := frak2021 GT4HistOCR ONB Fraktur_5000000 german_print frk Fraktur
14
14
15
- get-tess : $(TESS_MODELS:%=%.traineddata )
16
-
17
- all-tess : $(foreach MODEL, $(TESS_MODELS ) , $(MODEL ) _dta10.traineddata $(MODEL ) _dta50.traineddata $(MODEL ) _dta100.traineddata)
18
-
19
- % _dta10.traineddata : dta_lexdb_10.words
20
- % _dta50.traineddata : dta_lexdb_50.words
21
- % _dta100.traineddata : dta_lexdb_100.words
22
- % _dta10.traineddata % _dta50.traineddata % _dta100.traineddata : % .traineddata
23
- cp $< $@
24
- ./combine_tessdata.sh $@ dta_lexdb_$(patsubst $* _dta% .traineddata,% ,$@ ) .words
25
-
26
- dta_lexdb_% .words : dta_lexdb.sqlite
27
- ./sql2wordlist.sh $< $@ $*
28
-
29
- dta_lexdb.sqlite :
30
- wget -O $@ https://www.dwds.de/dwds_static/lexdb/dta/lexdb.sqlite
31
-
32
15
GT4HistOCR.traineddata :
33
16
wget -O $@ https://ub-backup.bib.uni-mannheim.de/~stweil/tesstrain/GT4HistOCR/tessdata_best/GT4HistOCR.traineddata
34
17
@@ -50,6 +33,28 @@ frk.traineddata:
50
33
Fraktur.traineddata :
51
34
wget -O $@ https://github.com/tesseract-ocr/tessdata_fast/raw/main/script/Fraktur.traineddata
52
35
36
+ get-tess : $(TESS_MODELS:%=%.traineddata )
37
+
38
+ all-tess : $(foreach MODEL, $(TESS_MODELS ) , $(MODEL ) _dta10.traineddata $(MODEL ) _dta50.traineddata $(MODEL ) _dta100.traineddata)
39
+
40
+ % _dta10.traineddata : % .traineddata dta_lexdb_10.words
41
+ cp $< $@
42
+ ./combine_tessdata.sh $@ dta_lexdb_10.words
43
+
44
+ % _dta50.traineddata : % .traineddata dta_lexdb_50.words
45
+ cp $< $@
46
+ ./combine_tessdata.sh $@ dta_lexdb_50.words
47
+
48
+ % _dta100.traineddata : % .traineddata dta_lexdb_100.words
49
+ cp $< $@
50
+ ./combine_tessdata.sh $@ dta_lexdb_100.words
51
+
52
+ dta_lexdb_% .words : dta_lexdb.sqlite
53
+ ./sql2wordlist.sh $< $@ $*
54
+
55
+ dta_lexdb.sqlite :
56
+ wget -O $@ https://www.dwds.de/dwds_static/lexdb/dta/lexdb.sqlite
57
+
53
58
all-hunspell : de-dta.dic
54
59
55
60
de-dta.dic : dta_lexdb_10.words
0 commit comments