diff options
author | Nick White <git@njw.name> | 2019-10-09 16:41:26 +0100 |
---|---|---|
committer | Nick White <git@njw.name> | 2019-10-09 16:41:26 +0100 |
commit | 8908fc011f83aee2a958d798648d08a0d04fa55b (patch) | |
tree | 861a1048011ebb3249f5ae3fc3de411b92077d47 | |
parent | 26e869f09a94153d8e1c323373180b55e06698cb (diff) |
Match prebinarised presegmented output from ocropus in wipepattern (named like "010001.bin.png")
-rw-r--r-- | cmd/bookpipeline/main.go | 4 |
1 file changed, 2 insertions, 2 deletions
```diff
diff --git a/cmd/bookpipeline/main.go b/cmd/bookpipeline/main.go
index 62d3115..2179549 100644
--- a/cmd/bookpipeline/main.go
+++ b/cmd/bookpipeline/main.go
@@ -383,8 +383,8 @@ func main() {
 		verboselog = log.New(n, "", 0)
 	}
 
-	origPattern := regexp.MustCompile(`[0-9]{4}.jpg$`) // TODO: match alternative file naming
-	wipePattern := regexp.MustCompile(`[0-9]{4}.png$`)
+	origPattern := regexp.MustCompile(`[0-9]{4}.jpg$`)
+	wipePattern := regexp.MustCompile(`[0-9]{4,6}(.bin)?.png$`)
 	preprocessedPattern := regexp.MustCompile(`_bin[0-9].[0-9].png$`)
 	ocredPattern := regexp.MustCompile(`.hocr$`)
 
```