diff options
Diffstat (limited to 'cmd/rescribe/main.go')
-rw-r--r-- | cmd/rescribe/main.go | 13 |
1 files changed, 7 insertions, 6 deletions
diff --git a/cmd/rescribe/main.go b/cmd/rescribe/main.go index ea2590f..889a3d2 100644 --- a/cmd/rescribe/main.go +++ b/cmd/rescribe/main.go @@ -38,11 +38,6 @@ Process and OCR a book using the Rescribe pipeline on a local machine. OCR results are saved into the bookdir directory unless savedir is specified. - -Note that embedded Tesseract includes these training files: -- carolinemsv1_fast.traineddata (Caroline Miniscule) -- rescribefrav2_fast.traineddata (French historic printing) -- rescribev8_fast.traineddata (Latin historic printing) ` //go:embed tessdata.20210622.zip @@ -146,7 +141,13 @@ func main() { verbose := flag.Bool("v", false, "verbose") systess := flag.Bool("systess", false, "Use the system installed Tesseract, rather than the copy embedded in rescribe.") - training := flag.String("t", "trainings/rescribev8_fast.traineddata", "path to the tesseract training file to use") + training := flag.String("t", "rescribev8_fast.traineddata", `Path to the tesseract training file to use. +These training files are included in rescribe, and are always available: +- carolinemsv1_fast.traineddata (Caroline Miniscule) +- eng.traineddata (Modern English) +- rescribefrav2_fast.traineddata (French historic printing) +- rescribev8_fast.traineddata (Latin historic printing) + `) tesscmd := flag.String("tesscmd", deftesscmd, "The Tesseract executable to run. You may need to set this to the full path of Tesseract.exe if you're on Windows.") flag.Usage = func() { |