summary refs log tree commit diff
path: root/parse/hocr
diff options
context:
space:
mode:
author Nick White <git@njw.name> 2019-01-24 17:56:14 +0000
committer Nick White <git@njw.name> 2019-01-24 17:56:14 +0000
commit 6e08494a8883a8e304ef02ea352a11776ab2294c (patch)
tree 47ca50fefafa5f8381dc2237792aff11a9b2c085 /parse/hocr
parent 010255d2c19bbd06ca7e5ce92d8f98f3c12e0ad3 (diff)
Merge bucket-lines-{prob,hocr} into one tool called bucket-lines, that uses the filename extension to determine how to process the lines
Diffstat (limited to 'parse/hocr')
-rw-r--r-- parse/hocr/hocr.go 9
1 files changed, 5 insertions, 4 deletions
diff --git a/parse/hocr/hocr.go b/parse/hocr/hocr.go
index f7cac05..c03b73a 100644
--- a/parse/hocr/hocr.go
+++ b/parse/hocr/hocr.go
@@ -1,9 +1,10 @@
package hocr
-// TODO: consider making GetLineDetails() a function of Hocr, so could do a
-// similar thing with prob format files too, and then fire them both
-// off a generic interface, potentially.
-// TODO: Parse line name to zero pad line numbers, so they come out in the correct order
+// TODO: Parse line name to zero pad line numbers, so they can
+// be sorted easily
+// TODO: have same filename format as .prob uses, so include base
+// dirname, and don't include line numbers if there's only
+// one line in the hocr
import (
"encoding/xml"