diff options
author | Nick White <git@njw.name> | 2019-09-05 22:20:35 +0100 |
---|---|---|
committer | Nick White <git@njw.name> | 2019-09-05 22:20:35 +0100 |
commit | 60a198f7ee5843a0f77b6dfb845c3b0413e83705 (patch) | |
tree | 5463522ac03b512ffe0f6e7c111cb904a4f5e3a4 | |
parent | 7c897a13ad90bdcaffccf74d43cc4fd20f150226 (diff) |
Don't abort analysis if we encounter a hocr with no words, just skip it
-rw-r--r-- | bookpipeline/cmd/bookpipeline/main.go | 3 | ||||
-rw-r--r-- | lib/hocr/hocr.go | 2 |
2 files changed, 4 insertions, 1 deletion
```diff
diff --git a/bookpipeline/cmd/bookpipeline/main.go b/bookpipeline/cmd/bookpipeline/main.go
index 520311b..97f4109 100644
--- a/bookpipeline/cmd/bookpipeline/main.go
+++ b/bookpipeline/cmd/bookpipeline/main.go
@@ -156,6 +156,9 @@ func analyse(toanalyse chan string, up chan string, errc chan error, logger *log
 			errc <- errors.New(fmt.Sprintf("Error retreiving confidence for %s: %s", path, err))
 			return
 		}
+		if avg == 0 {
+			continue
+		}
 		base := filepath.Base(path)
 		codestart := strings.Index(base, "_bin")
 		name := base[0:codestart]
diff --git a/lib/hocr/hocr.go b/lib/hocr/hocr.go
index dcd0494..052aa19 100644
--- a/lib/hocr/hocr.go
+++ b/lib/hocr/hocr.go
@@ -123,7 +123,7 @@ func GetAvgConf(hocrfn string) (float64, error) {
 		}
 	}
 	if num == 0 {
-		return 0, errors.New("No words found")
+		return 0, nil
 	}
 	return total / num, nil
 }
```