diff options
| -rw-r--r-- | aws.go | 10 | ||||
| -rw-r--r-- | cmd/getsamplepages/main.go | 4 | ||||
| -rw-r--r-- | cmd/getstats/main.go | 16 | ||||
| -rw-r--r-- | cmd/rescribe/getembeds.go | 4 | ||||
| -rw-r--r-- | cmd/rescribe/main.go | 7 | ||||
| -rw-r--r-- | cmd/rmbook/main.go | 4 | ||||
| -rw-r--r-- | internal/pipeline/pipeline_test.go | 36 | 
7 files changed, 41 insertions, 40 deletions
@@ -383,8 +383,8 @@ func (a *AwsConn) ListObjectsWithMeta(bucket string, prefix string) ([]ObjMeta,  func (a *AwsConn) ListObjectWithMeta(bucket string, prefix string) (ObjMeta, error) {  	var obj ObjMeta  	err := a.s3svc.ListObjectsV2Pages(&s3.ListObjectsV2Input{ -		Bucket: aws.String(bucket), -		Prefix: aws.String(prefix), +		Bucket:  aws.String(bucket), +		Prefix:  aws.String(prefix),  		MaxKeys: aws.Int64(1),  	}, func(page *s3.ListObjectsV2Output, last bool) bool {  		for _, r := range page.Contents { @@ -421,12 +421,12 @@ func (a *AwsConn) DeleteObjects(bucket string, keys []string) error {  		// s3.DeleteObjects can only take up to 1000 keys at a time,  		// so if necessary delete those collected so far and empty  		// the objs queue -		if i % 1000 == 1 { +		if i%1000 == 1 {  			_, err := a.s3svc.DeleteObjects(&s3.DeleteObjectsInput{  				Bucket: aws.String(bucket),  				Delete: &s3.Delete{  					Objects: objs, -					Quiet: aws.Bool(true), +					Quiet:   aws.Bool(true),  				},  			})  			if err != nil { @@ -439,7 +439,7 @@ func (a *AwsConn) DeleteObjects(bucket string, keys []string) error {  		Bucket: aws.String(bucket),  		Delete: &s3.Delete{  			Objects: objs, -			Quiet: aws.Bool(true), +			Quiet:   aws.Bool(true),  		},  	})  	return err diff --git a/cmd/getsamplepages/main.go b/cmd/getsamplepages/main.go index 8e35055..cb32700 100644 --- a/cmd/getsamplepages/main.go +++ b/cmd/getsamplepages/main.go @@ -74,7 +74,7 @@ func main() {  		err = conn.Download(conn.WIPStorageId(), p+"best", name+"best")  		if err != nil {  		} -		b, err := ioutil.ReadFile(name+"best") +		b, err := ioutil.ReadFile(name + "best")  		if err != nil {  			log.Fatalf("Failed to read file %s\n", name+"best")  		} @@ -85,7 +85,7 @@ func main() {  		}  		pg := strings.TrimSuffix(lines[0], ".hocr") -		err = os.Remove(name+"best") +		err = os.Remove(name + "best")  		if err != nil {  			log.Fatalf("Failed to remove temporary best file for %s", name)  		} diff --git a/cmd/getstats/main.go b/cmd/getstats/main.go index 5ed1414..b51be2a 100644 --- a/cmd/getstats/main.go +++ b/cmd/getstats/main.go @@ -62,16 +62,16 @@ func main() {  	log.Println("Downloading all best and conf files found")  	for _, i := range objs {  		parts := strings.Split(i, "/") -		if parts[len(parts) - 1] == "best" { -			fmt.Printf("Downloading %s to %s\n", i, parts[0] + "-best") -			err = conn.Download(conn.WIPStorageId(), i, parts[0] + "-best") +		if parts[len(parts)-1] == "best" { +			fmt.Printf("Downloading %s to %s\n", i, parts[0]+"-best") +			err = conn.Download(conn.WIPStorageId(), i, parts[0]+"-best")  			if err != nil {  				log.Fatalln("Failed to download file", i, err)  			}  		} -		if parts[len(parts) - 1] == "conf" { -			fmt.Printf("Downloading %s to %s\n", i, parts[0] + "-conf") -			err = conn.Download(conn.WIPStorageId(), i, parts[0] + "-conf") +		if parts[len(parts)-1] == "conf" { +			fmt.Printf("Downloading %s to %s\n", i, parts[0]+"-conf") +			err = conn.Download(conn.WIPStorageId(), i, parts[0]+"-conf")  			if err != nil {  				log.Fatalln("Failed to download file", i, err)  			} @@ -99,8 +99,8 @@ func main() {  		}  		if strings.HasSuffix(parts[1], ".hocr") { -			fmt.Printf("Downloading %s to %s\n", i, parts[0] + "-hocr") -			err = conn.Download(conn.WIPStorageId(), i, parts[0] + "-hocr") +			fmt.Printf("Downloading %s to %s\n", i, parts[0]+"-hocr") +			err = conn.Download(conn.WIPStorageId(), i, parts[0]+"-hocr")  			if err != nil {  				log.Fatalln("Failed to download file", i, err)  			} diff --git a/cmd/rescribe/getembeds.go b/cmd/rescribe/getembeds.go index a3edaf2..1747d82 100644 --- a/cmd/rescribe/getembeds.go +++ b/cmd/rescribe/getembeds.go @@ -11,9 +11,9 @@ package main  import (  	"fmt"  	"io" +	"net/http"  	"os"  	"path" -	"net/http"  )  func dl(url string) error { @@ -40,7 +40,7 @@ func dl(url string) error {  }  func main() { -	urls := []string { +	urls := []string{  		"https://rescribe.xyz/rescribe/embeds/tessdata.20210622.zip",  		"https://rescribe.xyz/rescribe/embeds/tesseract-linux-v5.0.0-alpha.20210510.zip",  		"https://rescribe.xyz/rescribe/embeds/tesseract-osx-v4.1.1.20191227.zip", diff --git a/cmd/rescribe/main.go b/cmd/rescribe/main.go index 4404789..db8eb41 100644 --- a/cmd/rescribe/main.go +++ b/cmd/rescribe/main.go @@ -46,6 +46,7 @@ var tessdatazip []byte  const QueueTimeoutSecs = 2 * 60  const PauseBetweenChecks = 1 * time.Second  const LogSaveTime = 1 * time.Minute +  var thresholds = []float64{0.1, 0.2, 0.3}  // null writer to enable non-verbose logging to be discarded @@ -322,8 +323,8 @@ These training files are included in rescribe, and are always available:  	}  	// For simplicity, remove .binarised.pdf and rename .colour.pdf to .pdf -	_ = os.Remove(filepath.Join(savedir, bookname + ".binarised.pdf")) -	_ = os.Rename(filepath.Join(savedir, bookname + ".colour.pdf"), filepath.Join(savedir, bookname + ".pdf")) +	_ = os.Remove(filepath.Join(savedir, bookname+".binarised.pdf")) +	_ = os.Rename(filepath.Join(savedir, bookname+".colour.pdf"), filepath.Join(savedir, bookname+".pdf"))  }  func addTxtVersion(hocrfn string) error { @@ -342,7 +343,7 @@ func addTxtVersion(hocrfn string) error {  	for _, v := range thresholds {  		basefn = strings.TrimSuffix(basefn, fmt.Sprintf("_bin%.1f.hocr", v))  	} -	fn := filepath.Join(dir, "text", basefn + ".txt") +	fn := filepath.Join(dir, "text", basefn+".txt")  	err = ioutil.WriteFile(fn, []byte(t), 0644)  	if err != nil { diff --git a/cmd/rmbook/main.go b/cmd/rmbook/main.go index fcacc2e..a26c553 100644 --- a/cmd/rmbook/main.go +++ b/cmd/rmbook/main.go @@ -26,8 +26,8 @@ func (w NullWriter) Write(p []byte) (n int, err error) {  }  type RmPipeliner interface { -        MinimalInit() error -        WIPStorageId() string +	MinimalInit() error +	WIPStorageId() string  	DeleteObjects(bucket string, keys []string) error  	ListObjects(bucket string, prefix string) ([]string, error)  } diff --git a/internal/pipeline/pipeline_test.go b/internal/pipeline/pipeline_test.go index 806f9be..4a08d3b 100644 --- a/internal/pipeline/pipeline_test.go +++ b/internal/pipeline/pipeline_test.go @@ -36,7 +36,7 @@ type PipelineTester interface {  type connection struct {  	name string -	c PipelineTester +	c    PipelineTester  }  // Test_download tests the download() function inside the pipeline @@ -53,11 +53,11 @@ func Test_download(t *testing.T) {  	}  	cases := []struct { -		dl string +		dl       string  		contents []byte -		process string -		errs []error -	} { +		process  string +		errs     []error +	}{  		{"notpresent", []byte(""), "", []error{errors.New("no such file or directory"), errors.New("NoSuchKey: The specified key does not exist")}},  		{"empty", []byte{}, "empty", []error{}},  		{"justastring", []byte("I am just a basic string"), "justastring", []error{}}, @@ -73,7 +73,7 @@ func Test_download(t *testing.T) {  				slog.log = ""  				tempDir := filepath.Join(os.TempDir(), "pipelinetest")  				err = os.MkdirAll(tempDir, 0700) -				if err != nil && ! os.IsExist(err) { +				if err != nil && !os.IsExist(err) {  					t.Fatalf("Could not create temporary directory %s: %v\nLog: %s", tempDir, err, slog.log)  				} @@ -174,11 +174,11 @@ func Test_up(t *testing.T) {  	}  	cases := []struct { -		ul string +		ul       string  		contents []byte -		process string -		errs []error -	} { +		process  string +		errs     []error +	}{  		{"notpresent", []byte(""), "", []error{errors.New("no such file or directory"), errors.New("NoSuchKey: The specified key does not exist")}},  		{"empty", []byte{}, "empty", []error{}},  		{"justastring", []byte("I am just a basic string"), "justastring", []error{}}, @@ -194,7 +194,7 @@ func Test_up(t *testing.T) {  				slog.log = ""  				tempDir := filepath.Join(os.TempDir(), "pipelinetest")  				err = os.MkdirAll(tempDir, 0700) -				if err != nil && ! os.IsExist(err) { +				if err != nil && !os.IsExist(err) {  					t.Fatalf("Could not create temporary directory %s: %v\nLog: %s", tempDir, err, slog.log)  				} @@ -244,7 +244,7 @@ func Test_up(t *testing.T) {  					t.Fatalf("Uploaded file not removed as it should have been after uploading %s: %v\nLog: %s", tempFile, err, slog.log)  				} -				err = conn.c.Download(conn.c.WIPStorageId(), "pipelinetest/" + c.ul, tempFile) +				err = conn.c.Download(conn.c.WIPStorageId(), "pipelinetest/"+c.ul, tempFile)  				if err != nil {  					t.Fatalf("Could not download file %s: %v\nLog: %s", tempFile, err, slog.log)  				} @@ -292,11 +292,11 @@ func Test_upAndQueue(t *testing.T) {  	}  	cases := []struct { -		ul string +		ul       string  		contents []byte -		process string -		errs []error -	} { +		process  string +		errs     []error +	}{  		{"notpresent", []byte(""), "", []error{errors.New("no such file or directory"), errors.New("NoSuchKey: The specified key does not exist")}},  		{"empty", []byte{}, "empty", []error{}},  		{"justastring", []byte("I am just a basic string"), "justastring", []error{}}, @@ -312,7 +312,7 @@ func Test_upAndQueue(t *testing.T) {  				slog.log = ""  				tempDir := filepath.Join(os.TempDir(), "pipelinetest")  				err = os.MkdirAll(tempDir, 0700) -				if err != nil && ! os.IsExist(err) { +				if err != nil && !os.IsExist(err) {  					t.Fatalf("Could not create temporary directory %s: %v\nLog: %s", tempDir, err, slog.log)  				} @@ -376,7 +376,7 @@ func Test_upAndQueue(t *testing.T) {  					t.Fatalf("Uploaded file not removed as it should have been after uploading %s: %v\nLog: %s", tempFile, err, slog.log)  				} -				err = conn.c.Download(conn.c.WIPStorageId(), "pipelinetest/" + c.ul, tempFile) +				err = conn.c.Download(conn.c.WIPStorageId(), "pipelinetest/"+c.ul, tempFile)  				if err != nil {  					t.Fatalf("Could not download file %s: %v\nLog: %s", tempFile, err, slog.log)  				}  | 
