summary | refs | log | tree | commit | diff
path: root/snippets
diff options
context:
space:
mode:
Diffstat (limited to 'snippets')
-rw-r--r-- snippets/tessfortesting 22
1 files changed, 22 insertions, 0 deletions
diff --git a/snippets/tessfortesting b/snippets/tessfortesting
new file mode 100644
index 0000000..daec106
--- /dev/null
+++ b/snippets/tessfortesting
@@ -0,0 +1,22 @@
+#!/bin/sh
+
+# rename NAME.gt.txt files to NAME.txt; only a trailing .gt.txt is stripped, and an unmatched glob is skipped
+for i in *.gt.txt; do [ -e "$i" ] || continue; mv -- "$i" "${i%.gt.txt}.txt"; done
+
+# create boxes for all lines
+for i in *png; do b=`basename "$i" .png`; python ../../generate_line_box.py -i "$b.png" -t "$b.txt" > "$b.box"; done
+
+# back up ground truth .txt (the lstm.train step wipes it); an existing .bak is kept, since it is presumably left over from an interrupted run and still holds the real text
+for i in *.txt; do [ -e "$i" ] || continue; [ -e "$i.bak" ] || cp -- "$i" "$i.bak"; done
+
+# create lstmf counterparts to all files: run tesseract with the lstm.train config on each .png, using the name without .png as output base
+for i in *.png; do [ -e "$i" ] || continue; tesseract "$i" "${i%.png}" --psm 6 lstm.train; done
+
+# restore ground truth .txt
+for i in *.bak; do b=`basename "$i" .bak`; mv "$i" "$b"; done
+
+# create list of lstmf files
+ls *lstmf > all-files.txt
+
+# evaluate the model on the listed files; stdout and stderr are merged, shown, and saved to "evaluation" (verbosity 2 prints correct lines as well as incorrect ones)
+{ lstmeval --model ../rescribealphav4.traineddata --eval_listfile all-files.txt --verbosity 2; } 2>&1 | tee evaluation