#!/bin/sh
# bookgraphv2.sh - graph the average confidence of each page in a book.
#
# Provenance: added in commit 28091bd3a22de816aa12c8e96636384d9a516fea
# (Nick White, Tue, 14 May 2019 17:34:50 +0100):
# "Add bookgraphv2, to go hand in hand with fullocrdir".
#
# Usage: bookgraphv2.sh bookdir
#
# Runs pgconf on every *.hocr file directly inside bookdir/best, collects
# one "page<TAB>confidence" row per file, and has gnuplot render them to
# bookdir/<basename of bookdir>_bookgraph.png.
#
# Requires: pgconf and gnuplot on PATH.
# Exit status: 1 on usage/setup errors, otherwise gnuplot's exit status.

usage="$0 bookdir

Creates a graph showing the average confidence of each page in a book."

if test $# -ne 1; then
  echo "$usage" >&2
  exit 1
fi

# Both external tools are mandatory; fail early with a clear message.
for tool in pgconf gnuplot; do
  if ! command -v "$tool" > /dev/null; then
    echo "Error: no $tool tool found" >&2
    exit 1
  fi
done

bookdir=$1

if ! test -d "$bookdir/best"; then
  echo "Error: no directory $bookdir/best" >&2
  exit 1
fi

# t holds the plot data, gp the generated gnuplot script.
t=$(mktemp) || exit 1
gp=$(mktemp) || { rm -f "$t"; exit 1; }

# Remove the temporary files on every exit path. Signals are mapped to a
# plain exit so that the EXIT trap also runs under shells that do not fire
# it on a fatal signal.
trap 'rm -f "$t" "$gp"' EXIT
trap 'exit 1' HUP INT TERM

# find returns files in arbitrary order, while gnuplot joins the points in
# the order they appear in the data file, so the rows are sorted
# numerically by page before plotting.
find "$bookdir/best" -maxdepth 1 -type f -name '*.hocr' | while IFS= read -r i; do
  # A failed or empty pgconf result would otherwise be plotted as 0%.
  if ! c=$(pgconf "$i") || test -z "$c"; then
    echo "Warning: pgconf failed for $i, skipping" >&2
    continue
  fi
  # Page label: file name without .hocr and without anything from the
  # first underscore onwards.
  n=$(basename "$i" .hocr | sed 's/_.*//')
  # %d: the confidence is expected to be an integer (assumption carried
  # over from the original script; pgconf itself is not visible here).
  printf '%s\t%d\n' "$n" "$c"
done | sort -n > "$t"

if ! test -s "$t"; then
  echo "Error: no page confidences found in $bookdir/best" >&2
  exit 1
fi

b=$(basename "$bookdir")

# In the printf format below, %% yields a literal % for gnuplot, \\ yields
# the single backslash gnuplot needs for line continuation, and $1 is
# gnuplot's column 1 (single quotes keep the shell from expanding it).
printf '

set style data lines
set title "Book Confidence for %s"
set xlabel "Page Number"
set ylabel "Page Confidence %%"
set mxtics
set terminal png truecolor size 4600,1700
set output "%s"
plot "%s" using 1:2 with lines title "Confidence",\\
     "" using 1:2:(sprintf("%%d", $1)) with labels point pt 2 notitle
quit
' "$b" "$bookdir/${b}_bookgraph.png" "$t" > "$gp"

gnuplot "$gp"