summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author Nick White <git@njw.name> 2019-10-09 16:41:26 +0100
committer Nick White <git@njw.name> 2019-10-09 16:41:26 +0100
commit 8908fc011f83aee2a958d798648d08a0d04fa55b (patch)
tree 861a1048011ebb3249f5ae3fc3de411b92077d47
parent 26e869f09a94153d8e1c323373180b55e06698cb (diff)
Match prebinarised presegmented output from ocropus in wipepattern (named like "010001.bin.png")
-rw-r--r-- cmd/bookpipeline/main.go 4
1 files changed, 2 insertions, 2 deletions
diff --git a/cmd/bookpipeline/main.go b/cmd/bookpipeline/main.go
index 62d3115..2179549 100644
--- a/cmd/bookpipeline/main.go
+++ b/cmd/bookpipeline/main.go
@@ -383,8 +383,8 @@ func main() {
verboselog = log.New(n, "", 0)
}
- origPattern := regexp.MustCompile(`[0-9]{4}.jpg$`) // TODO: match alternative file naming
- wipePattern := regexp.MustCompile(`[0-9]{4}.png$`)
+ origPattern := regexp.MustCompile(`[0-9]{4}.jpg$`)
+ wipePattern := regexp.MustCompile(`[0-9]{4,6}(.bin)?.png$`)
preprocessedPattern := regexp.MustCompile(`_bin[0-9].[0-9].png$`)
ocredPattern := regexp.MustCompile(`.hocr$`)