1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
|
// Copyright 2019 Nick White.
// Use of this source code is governed by the GPLv3
// license that can be found in the LICENSE file.
// preprocmulti runs binarisation with a variety of different binarisation
// levels, preprocessing and saving each version
package main
// TODO: come up with a way to set a good ksize automatically
import (
"flag"
"fmt"
"image"
"image/draw"
_ "image/jpeg"
"image/png"
"log"
"os"
"rescribe.xyz/preproc"
"rescribe.xyz/integral"
)
// TODO: do more testing to see how good this assumption is
func autowsize(bounds image.Rectangle) int {
return bounds.Dx() / 60
}
func main() {
ksizes := []float64{0.1, 0.2, 0.4, 0.5}
flag.Usage = func() {
fmt.Fprintf(os.Stderr, "Usage: preprocmulti [-bt bintype] [-bw winsize] [-m minperc] [-nowipe] [-ws wipesize] inimg outbase\n")
fmt.Fprintf(os.Stderr, "Binarize and preprocess an image, with multiple binarisation levels,\n")
fmt.Fprintf(os.Stderr, "saving images to outbase_bin{k}.png.\n")
fmt.Fprintf(os.Stderr, "Binarises with these levels for k: %v.\n", ksizes)
flag.PrintDefaults()
}
binwsize := flag.Int("bw", 0, "Window size for sauvola binarization algorithm. Set automatically based on resolution if not set.")
btype := flag.String("bt", "binary", "Type of binarization threshold. binary or zeroinv are currently implemented.")
min := flag.Int("m", 30, "Minimum percentage of the image width for the content width calculation to be considered valid.")
nowipe := flag.Bool("nowipe", false, "Disable wiping completely.")
wipewsize := flag.Int("ws", 5, "Window size for wiping algorithm.")
vmin := flag.Int("vm", 30, "Minimum percentage of the image height for the content width calculation to be considered valid.")
vthresh := flag.Float64("vt", 0.005, "Threshold for the proportion of black pixels below which a vertical wipe window is determined to be the edge. Higher means more aggressive wiping.")
vwsize := flag.Int("vw", 120, "Window size for vertical mask finding algorithm. Should be set to approximately line height + largest expected gap.")
flag.Parse()
if flag.NArg() < 2 {
flag.Usage()
os.Exit(1)
}
log.Printf("Opening %s\n", flag.Arg(0))
f, err := os.Open(flag.Arg(0))
defer f.Close()
if err != nil {
log.Fatalf("Could not open file %s: %v\n", flag.Arg(0), err)
}
img, _, err := image.Decode(f)
if err != nil {
log.Fatalf("Could not decode image: %v\n", err)
}
b := img.Bounds()
if *binwsize == 0 {
*binwsize = autowsize(b)
}
if *binwsize%2 == 0 {
*binwsize++
}
var clean, threshimg, vclean image.Image
log.Print("Precalculating integral images")
intImg := integral.NewImage(b)
draw.Draw(intImg, b, img, b.Min, draw.Src)
intSqImg := integral.NewSqImage(b)
draw.Draw(intSqImg, b, img, b.Min, draw.Src)
for _, k := range ksizes {
log.Print("Binarising")
threshimg = preproc.PreCalcedSauvola(*intImg, *intSqImg, img, k, *binwsize)
if *btype == "zeroinv" {
threshimg, err = preproc.BinToZeroInv(threshimg.(*image.Gray), img.(*image.RGBA))
if err != nil {
log.Fatal(err)
}
}
if !*nowipe {
log.Print("Wiping sides")
vclean = preproc.VWipe(threshimg.(*image.Gray), *vwsize, *vthresh, *vmin)
clean = preproc.Wipe(vclean.(*image.Gray), *wipewsize, k*0.02, *min)
} else {
clean = threshimg
}
savefn := fmt.Sprintf("%s_bin%0.1f.png", flag.Arg(1), k)
log.Printf("Saving %s\n", savefn)
f, err = os.Create(savefn)
if err != nil {
log.Fatalf("Could not create file %s: %v\n", savefn, err)
}
defer f.Close()
err = png.Encode(f, clean)
if err != nil {
log.Fatalf("Could not encode image: %v\n", err)
}
}
}
|