diff options
author | Nick White <git@njw.name> | 2020-04-14 11:56:56 +0100 |
---|---|---|
committer | Nick White <git@njw.name> | 2020-04-14 11:56:56 +0100 |
commit | 848f961c277525ebba3ab08fadc116970bcfed24 (patch) | |
tree | 00a6883568c29ac34d56f958f7d3479e372d8c31 /pkg/hocr/hocr.go | |
parent | d9612a98ab66409858e07a9a430d40beac1b17b8 (diff) |
Add godoc documentation
Diffstat (limited to 'pkg/hocr/hocr.go')
-rw-r--r-- | pkg/hocr/hocr.go | 9 |
1 files changed, 8 insertions, 1 deletions
diff --git a/pkg/hocr/hocr.go b/pkg/hocr/hocr.go index 9dea49c..6b43558 100644 --- a/pkg/hocr/hocr.go +++ b/pkg/hocr/hocr.go @@ -2,6 +2,8 @@ // Use of this source code is governed by the GPLv3 // license that can be found in the LICENSE file. +// hocr contains structures and functions for parsing and analysing +// hocr files package hocr import ( @@ -51,6 +53,7 @@ func wordConf(s string) (float64, error) { return strconv.ParseFloat(conf[1], 64) } +// BoxCoords parses bbox coordinate strings func BoxCoords(s string) ([4]int, error) { var coords [4]int re, err := regexp.Compile(`bbox ([0-9]+) ([0-9]+) ([0-9]+) ([0-9]+)`) @@ -73,6 +76,7 @@ func noText(s string) bool { return len(t) == 0 } +// Parse parses a hOCR file func Parse(b []byte) (Hocr, error) { var hocr Hocr @@ -84,6 +88,7 @@ func Parse(b []byte) (Hocr, error) { return hocr, nil } +// GetText parses a hOCR file and extracts the text from it func GetText(hocrfn string) (string, error) { var s string @@ -104,6 +109,8 @@ func GetText(hocrfn string) (string, error) { return s, nil } +// GetAvgConf calculates the average confidence of a hOCR file from +// confidences embedded in each word func GetAvgConf(hocrfn string) (float64, error) { file, err := ioutil.ReadFile(hocrfn) if err != nil { @@ -134,7 +141,7 @@ func GetAvgConf(hocrfn string) (float64, error) { // GetWordConfs is a utility function that parses a hocr // file and returns an array containing the confidences -// of each word therein. +// of each word therein func GetWordConfs(hocrfn string) ([]float64, error) { var confs []float64 |