diff options
Diffstat (limited to 'preproc')
| -rw-r--r-- | preproc/cmd/cleanup/main.go | 62 | ||||
| -rw-r--r-- | preproc/testdata/pg1.png | bin | 0 -> 30803 bytes | |||
| -rw-r--r-- | preproc/testdata/pg1_integralwipesides_t0.02_w5.png | bin | 0 -> 33595 bytes | |||
| -rw-r--r-- | preproc/testdata/pg1_integralwipesides_t0.05_w25.png | bin | 0 -> 33432 bytes | |||
| -rw-r--r-- | preproc/testdata/pg1_integralwipesides_t0.05_w5.png | bin | 0 -> 14546 bytes | |||
| -rw-r--r-- | preproc/wipesides.go | 122 | ||||
| -rw-r--r-- | preproc/wipesides_test.go | 105 | 
7 files changed, 289 insertions, 0 deletions
diff --git a/preproc/cmd/cleanup/main.go b/preproc/cmd/cleanup/main.go new file mode 100644 index 0000000..7ea0c84 --- /dev/null +++ b/preproc/cmd/cleanup/main.go @@ -0,0 +1,62 @@ +package main + +// TODO: add minimum size variable (default ~30%?) +// TODO: make into a small library +// TODO: have the integral image specific stuff done by interface functions + +import ( +	"flag" +	"fmt" +	"image" +	"image/draw" +	_ "image/jpeg" +	"image/png" +	"log" +	"os" + +	"rescribe.xyz/go.git/binarize" +	"rescribe.xyz/go.git/preproc" +) + +func main() { +	flag.Usage = func() { +		fmt.Fprintf(os.Stderr, "Usage: cleanup [-t thresh] [-w winsize] inimg outimg\n") +		flag.PrintDefaults() +	} +	wsize := flag.Int("w", 5, "Window size for mask finding algorithm.") +	thresh := flag.Float64("t", 0.05, "Threshold for the proportion of black pixels below which a window is determined to be the edge.") +	flag.Parse() +	if flag.NArg() < 2 { +		flag.Usage() +		os.Exit(1) +	} + +	f, err := os.Open(flag.Arg(0)) +	defer f.Close() +	if err != nil { +		log.Fatalf("Could not open file %s: %v\n", flag.Arg(0), err) +	} +	img, _, err := image.Decode(f) +	if err != nil { +		log.Fatalf("Could not decode image: %v\n", err) +	} +	b := img.Bounds() +	gray := image.NewGray(image.Rect(0, 0, b.Dx(), b.Dy())) +	draw.Draw(gray, b, img, b.Min, draw.Src) + +	integral := binarize.Integralimg(gray) + +	lowedge, highedge := preproc.Findedges(integral, *wsize, *thresh) + +	clean := preproc.Wipesides(gray, lowedge, highedge) + +	f, err = os.Create(flag.Arg(1)) +	if err != nil { +		log.Fatalf("Could not create file %s: %v\n", flag.Arg(1), err) +	} +	defer f.Close() +	err = png.Encode(f, clean) +	if err != nil { +		log.Fatalf("Could not encode image: %v\n", err) +	} +} diff --git a/preproc/testdata/pg1.png b/preproc/testdata/pg1.png Binary files differnew file mode 100644 index 0000000..c7c4249 --- /dev/null +++ b/preproc/testdata/pg1.png diff --git a/preproc/testdata/pg1_integralwipesides_t0.02_w5.png b/preproc/testdata/pg1_integralwipesides_t0.02_w5.png Binary files differnew file mode 100644 index 0000000..6b4ccb2 --- /dev/null +++ b/preproc/testdata/pg1_integralwipesides_t0.02_w5.png diff --git a/preproc/testdata/pg1_integralwipesides_t0.05_w25.png b/preproc/testdata/pg1_integralwipesides_t0.05_w25.png Binary files differnew file mode 100644 index 0000000..39dc88d --- /dev/null +++ b/preproc/testdata/pg1_integralwipesides_t0.05_w25.png diff --git a/preproc/testdata/pg1_integralwipesides_t0.05_w5.png b/preproc/testdata/pg1_integralwipesides_t0.05_w5.png Binary files differnew file mode 100644 index 0000000..50df855 --- /dev/null +++ b/preproc/testdata/pg1_integralwipesides_t0.05_w5.png diff --git a/preproc/wipesides.go b/preproc/wipesides.go new file mode 100644 index 0000000..2afe1d2 --- /dev/null +++ b/preproc/wipesides.go @@ -0,0 +1,122 @@ +package preproc + +// TODO: add minimum size variable (default ~30%?) +// TODO: have the integral image specific stuff done by interface functions + +import ( +	"image" +	"image/color" +) + +type windowslice struct { +	topleft     uint64 +	topright    uint64 +	bottomleft  uint64 +	bottomright uint64 +} + +func getwindowslice(i [][]uint64, x int, size int) windowslice { +	maxy := len(i) - 1 +	maxx := x + size +	if maxx > len(i[0])-1 { +		maxx = len(i[0]) - 1 +	} + +	return windowslice{i[0][x], i[0][maxx], i[maxy][x], i[maxy][maxx]} +} + +// checkwindow checks the window from x to see whether more than +// thresh proportion of the pixels are white, if so it returns true. +func checkwindow(integral [][]uint64, x int, size int, thresh float64) bool { +	height := len(integral) +	window := getwindowslice(integral, x, size) +	// divide by 255 as each on pixel has the value of 255 +	sum := (window.bottomright + window.topleft - window.topright - window.bottomleft) / 255 +	area := size * height +	proportion := float64(area)/float64(sum) - 1 +	return proportion <= thresh +} + +// returns the proportion of the given window that is black pixels +func proportion(integral [][]uint64, x int, size int) float64 { +	height := len(integral) +	window := getwindowslice(integral, x, size) +	// divide by 255 as each on pixel has the value of 255 +	sum := (window.bottomright + window.topleft - window.topright - window.bottomleft) / 255 +	area := size * height +	return float64(area)/float64(sum) - 1 +} + +// findbestedge goes through every vertical line from x to x+w to +// find the one with the lowest proportion of black pixels. +func findbestedge(integral [][]uint64, x int, w int) int { +	var bestx int +	var best float64 + +	if w == 1 { +		return x +	} + +	right := x + w +	for ; x < right; x++ { +		prop := proportion(integral, x, 1) +		if prop > best { +			best = prop +			bestx = x +		} +	} + +	return bestx +} + +// Findedges finds the edges of the main content, by moving a window of wsize +// from the middle of the image to the left and right, stopping when it reaches +// a point at which there is a lower proportion of black pixels than thresh. +func Findedges(integral [][]uint64, wsize int, thresh float64) (int, int) { +	maxx := len(integral[0]) - 1 +	var lowedge, highedge int = 0, maxx + +	for x := maxx / 2; x < maxx-wsize; x++ { +		if checkwindow(integral, x, wsize, thresh) { +			highedge = findbestedge(integral, x, wsize) +			break +		} +	} + +	for x := maxx / 2; x > 0; x-- { +		if checkwindow(integral, x, wsize, thresh) { +			lowedge = findbestedge(integral, x, wsize) +			break +		} +	} + +	return lowedge, highedge +} + +// Wipesides fills the sections of image not within the boundaries +// of lowedge and highedge with white +func Wipesides(img *image.Gray, lowedge int, highedge int) *image.Gray { +	b := img.Bounds() +	new := image.NewGray(b) + +	// set left edge white +	for x := b.Min.X; x < lowedge; x++ { +		for y := b.Min.Y; y < b.Max.Y; y++ { +			new.SetGray(x, y, color.Gray{255}) +		} +	} +	// copy middle +	for x := lowedge; x < highedge; x++ { +		for y := b.Min.Y; y < b.Max.Y; y++ { +			new.SetGray(x, y, img.GrayAt(x, y)) +		} +	} +	// set right edge white +	for x := highedge; x < b.Max.X; x++ { +		for y := b.Min.Y; y < b.Max.Y; y++ { +			new.SetGray(x, y, color.Gray{255}) +		} +	} + +	return new +} diff --git a/preproc/wipesides_test.go b/preproc/wipesides_test.go new file mode 100644 index 0000000..76151fb --- /dev/null +++ b/preproc/wipesides_test.go @@ -0,0 +1,105 @@ +package preproc + +// TODO: add different pages as test cases +// TODO: test non integral img version + +import ( +	"flag" +	"fmt" +	"image" +	"image/draw" +	"image/png" +	"os" +	"testing" + +	"rescribe.xyz/go.git/binarize" +) + +var update = flag.Bool("update", false, "update golden files") + +func decode(s string) (*image.Gray, error) { +	f, err := os.Open(s) +	defer f.Close() +	if err != nil { +		return nil, err +	} +	img, err := png.Decode(f) +	if err != nil { +		return nil, err +	} +	b := img.Bounds() +	gray := image.NewGray(image.Rect(0, 0, b.Dx(), b.Dy())) +	draw.Draw(gray, b, img, b.Min, draw.Src) +	return gray, nil +} + +func imgsequal(img1 *image.Gray, img2 *image.Gray) bool { +	b := img1.Bounds() +	if !b.Eq(img2.Bounds()) { +		return false +	} +	for y := b.Min.Y; y < b.Max.Y; y++ { +		for x := b.Min.X; x < b.Max.X; x++ { +			r0, g0, b0, a0 := img1.At(x, y).RGBA() +			r1, g1, b1, a1 := img2.At(x, y).RGBA() +			if r0 != r1 { +				return false +			} +			if g0 != g1 { +				return false +			} +			if b0 != b1 { +				return false +			} +			if a0 != a1 { +				return false +			} +		} +	} +	return true +} + +func TestWipeSides(t *testing.T) { +	cases := []struct { +		name   string +		orig   string +		golden string +		thresh float64 +		wsize  int +	}{ +		{"integralwipesides", "testdata/pg1.png", "testdata/pg1_integralwipesides_t0.02_w5.png", 0.02, 5}, +		{"integralwipesides", "testdata/pg1.png", "testdata/pg1_integralwipesides_t0.05_w5.png", 0.05, 5}, +		{"integralwipesides", "testdata/pg1.png", "testdata/pg1_integralwipesides_t0.05_w25.png", 0.05, 25}, +	} + +	for _, c := range cases { +		t.Run(fmt.Sprintf("%s_%0.2f_%d", c.name, c.thresh, c.wsize), func(t *testing.T) { +			var actual *image.Gray +			orig, err := decode(c.orig) +			if err != nil { +				t.Fatalf("Could not open file %s: %v\n", c.orig, err) +			} +			integral := binarize.Integralimg(orig) +			lowedge, highedge := Findedges(integral, c.wsize, c.thresh) +			actual = Wipesides(orig, lowedge, highedge) +			if *update { +				f, err := os.Create(c.golden) +				defer f.Close() +				if err != nil { +					t.Fatalf("Could not open file %s to update: %v\n", c.golden, err) +				} +				err = png.Encode(f, actual) +				if err != nil { +					t.Fatalf("Could not encode update of %s: %v\n", c.golden, err) +				} +			} +			golden, err := decode(c.golden) +			if err != nil { +				t.Fatalf("Could not open file %s: %v\n", c.golden, err) +			} +			if !imgsequal(golden, actual) { +				t.Errorf("Processed %s differs to %s\n", c.orig, c.golden) +			} +		}) +	} +}  | 
