diff options
Diffstat (limited to 'preproc')
| -rw-r--r-- | preproc/cmd/preproc/main.go | 6 | ||||
| -rw-r--r-- | preproc/cmd/preprocmulti/main.go | 6 | ||||
| -rw-r--r-- | preproc/cmd/wipe/main.go | 9 | ||||
| -rw-r--r-- | preproc/wipesides.go | 19 | 
4 files changed, 27 insertions, 13 deletions
| diff --git a/preproc/cmd/preproc/main.go b/preproc/cmd/preproc/main.go index 053de8f..d8d5b66 100644 --- a/preproc/cmd/preproc/main.go +++ b/preproc/cmd/preproc/main.go @@ -1,7 +1,6 @@  package main  // TODO: come up with a way to set a good ksize automatically -// TODO: add minimum size variable (default ~30%?) for wipe  import (  	"flag" @@ -23,13 +22,14 @@ func autowsize(bounds image.Rectangle) int {  func main() {  	flag.Usage = func() { -		fmt.Fprintf(os.Stderr, "Usage: preproc [-bt bintype] [-bw winsize] [-k num] [-wt wipethresh] [-ws wipesize] inimg outimg\n") +		fmt.Fprintf(os.Stderr, "Usage: preproc [-bt bintype] [-bw winsize] [-k num] [-m minperc] [-wt wipethresh] [-ws wipesize] inimg outimg\n")  		fmt.Fprintf(os.Stderr, "Binarize and preprocess an image\n")  		flag.PrintDefaults()  	}  	binwsize := flag.Int("bw", 0, "Window size for sauvola binarization algorithm. Set automatically based on resolution if not set.")  	ksize := flag.Float64("k", 0.5, "K for sauvola binarization algorithm. This controls the overall threshold level. Set it lower for very light text (try 0.1 or 0.2).")  	btype := flag.String("bt", "binary", "Type of binarization threshold. binary or zeroinv are currently implemented.") +	min := flag.Int("m", 30, "Minimum percentage of the image width for the content width calculation to be considered valid.")  	wipewsize := flag.Int("ws", 5, "Window size for wiping algorithm.")  	thresh := flag.Float64("wt", 0.05, "Threshold for the wiping algorithm to determine the proportion of black pixels below which a window is determined to be the edge.")  	flag.Parse() @@ -71,7 +71,7 @@ func main() {  	}  	log.Print("Wiping sides") -	clean := preproc.Wipe(threshimg.(*image.Gray), *wipewsize, *thresh) +	clean := preproc.Wipe(threshimg.(*image.Gray), *wipewsize, *thresh, *min)  	f, err = os.Create(flag.Arg(1))  	if err != nil { diff --git a/preproc/cmd/preprocmulti/main.go b/preproc/cmd/preprocmulti/main.go index eea7ab4..947625e 100644 --- a/preproc/cmd/preprocmulti/main.go +++ b/preproc/cmd/preprocmulti/main.go @@ -1,7 +1,6 @@  package main  // TODO: come up with a way to set a good ksize automatically -// TODO: add minimum size variable (default ~30%?) for wipe  import (  	"flag" @@ -26,7 +25,7 @@ func main() {  	ksizes := []float64{0.2, 0.3, 0.4, 0.5, 0.6}  	flag.Usage = func() { -		fmt.Fprintf(os.Stderr, "Usage: preproc [-bt bintype] [-bw winsize] [-wt wipethresh] [-ws wipesize] inimg outbase\n") +		fmt.Fprintf(os.Stderr, "Usage: preproc [-bt bintype] [-bw winsize] [-m minperc] [-wt wipethresh] [-ws wipesize] inimg outbase\n")  		fmt.Fprintf(os.Stderr, "Binarize and preprocess an image, with multiple binarisation levels,\n")  		fmt.Fprintf(os.Stderr, "saving images to outbase_bin{k}.png.\n")  		fmt.Fprintf(os.Stderr, "Binarises with these levels for k: %v.\n", ksizes) @@ -34,6 +33,7 @@ func main() {  	}  	binwsize := flag.Int("bw", 0, "Window size for sauvola binarization algorithm. Set automatically based on resolution if not set.")  	btype := flag.String("bt", "binary", "Type of binarization threshold. binary or zeroinv are currently implemented.") +	min := flag.Int("m", 30, "Minimum percentage of the image width for the content width calculation to be considered valid.")  	wipewsize := flag.Int("ws", 5, "Window size for wiping algorithm.")  	thresh := flag.Float64("wt", 0.05, "Threshold for the wiping algorithm to determine the proportion of black pixels below which a window is determined to be the edge.")  	flag.Parse() @@ -80,7 +80,7 @@ func main() {  		}  		log.Print("Wiping sides") -		clean := preproc.Wipe(threshimg.(*image.Gray), *wipewsize, *thresh) +		clean := preproc.Wipe(threshimg.(*image.Gray), *wipewsize, *thresh, *min)  		savefn := fmt.Sprintf("%s_bin%0.1f.png", flag.Arg(1), k)  		log.Printf("Saving %s\n", savefn) diff --git a/preproc/cmd/wipe/main.go b/preproc/cmd/wipe/main.go index e735a0a..ceff2e7 100644 --- a/preproc/cmd/wipe/main.go +++ b/preproc/cmd/wipe/main.go @@ -1,7 +1,5 @@  package main -// TODO: add minimum size variable (default ~30%?) -  import (  	"flag"  	"fmt" @@ -17,12 +15,13 @@ import (  func main() {  	flag.Usage = func() { -		fmt.Fprintf(os.Stderr, "Usage: wipe [-t thresh] [-w winsize] inimg outimg\n") +		fmt.Fprintf(os.Stderr, "Usage: wipe [-m minperc] [-t thresh] [-w winsize] inimg outimg\n")  		fmt.Fprintf(os.Stderr, "Wipes the sections of an image which are outside the content area.\n")  		flag.PrintDefaults()  	} -	wsize := flag.Int("w", 5, "Window size for mask finding algorithm.") +	min := flag.Int("m", 30, "Minimum percentage of the image width for the content width calculation to be considered valid.")  	thresh := flag.Float64("t", 0.05, "Threshold for the proportion of black pixels below which a window is determined to be the edge.") +	wsize := flag.Int("w", 5, "Window size for mask finding algorithm.")  	flag.Parse()  	if flag.NArg() < 2 {  		flag.Usage() @@ -42,7 +41,7 @@ func main() {  	gray := image.NewGray(image.Rect(0, 0, b.Dx(), b.Dy()))  	draw.Draw(gray, b, img, b.Min, draw.Src) -	clean := preproc.Wipe(gray, *wsize, *thresh) +	clean := preproc.Wipe(gray, *wsize, *thresh, *min)  	f, err = os.Create(flag.Arg(1))  	if err != nil { diff --git a/preproc/wipesides.go b/preproc/wipesides.go index 04bfa11..9b8387a 100644 --- a/preproc/wipesides.go +++ b/preproc/wipesides.go @@ -90,10 +90,25 @@ func wipesides(img *image.Gray, lowedge int, highedge int) *image.Gray {  	return new  } +// toonarrow checks whether the area between lowedge and highedge is +// less than min % of the total image width +func toonarrow(img *image.Gray, lowedge int, highedge int, min int) bool { +	b := img.Bounds() +	imgw := b.Max.X - b.Min.X +	wipew := highedge - lowedge +	if float64(wipew) / float64(imgw) * 100 < float64(min) { +		return true +	} +	return false +} +  // wipe fills the sections of image which fall outside the content -// area with white -func Wipe(img *image.Gray, wsize int, thresh float64) *image.Gray { +// area with white, providing the content area is above min % +func Wipe(img *image.Gray, wsize int, thresh float64, min int) *image.Gray {  	integral := integralimg.ToIntegralImg(img)  	lowedge, highedge := findedges(integral, wsize, thresh) +	if toonarrow(img, lowedge, highedge, min) { +		return img +	}  	return wipesides(img, lowedge, highedge)  } | 
