-
Notifications
You must be signed in to change notification settings - Fork 225
/
tesseract_engine_test.go
96 lines (74 loc) · 2.76 KB
/
tesseract_engine_test.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
package ocrworker
import (
"encoding/json"
"testing"
"io/ioutil"
"github.com/couchbaselabs/go.assert"
"github.com/couchbaselabs/logg"
)
func TestTesseractEngineWithRequest(t *testing.T) {
if testing.Short() {
t.Skip("skipping test in short mode.")
}
engine := TesseractEngine{}
bytes, err := ioutil.ReadFile("docs/testimage.png")
assert.True(t, err == nil)
cFlags := make(map[string]interface{})
cFlags["tessedit_char_whitelist"] = "0123456789"
ocrRequest := OcrRequest{
ImgBytes: bytes,
EngineType: ENGINE_TESSERACT,
EngineArgs: cFlags,
}
assert.True(t, err == nil)
result, err := engine.ProcessRequest(ocrRequest)
assert.True(t, err == nil)
logg.LogTo("TEST", "result: %v", result)
}
func TestTesseractEngineWithJson(t *testing.T) {
if testing.Short() {
t.Skip("skipping test in short mode.")
}
testJsons := []string{}
testJsons = append(testJsons, `{"engine":"tesseract"}`)
testJsons = append(testJsons, `{"engine":"tesseract", "engine_args":{}}`)
testJsons = append(testJsons, `{"engine":"tesseract", "engine_args":null}`)
testJsons = append(testJsons, `{"engine":"tesseract", "engine_args":{"config_vars":{"tessedit_char_whitelist":"0123456789"}, "psm":"1"}}`)
testJsons = append(testJsons, `{"engine":"tesseract", "engine_args":{"config_vars":{"tessedit_create_hocr":"1", "tessedit_pageseg_mode":"1"}, "psm":"3"}}`)
for _, testJson := range testJsons {
logg.LogTo("TEST", "testJson: %v", testJson)
ocrRequest := OcrRequest{}
err := json.Unmarshal([]byte(testJson), &ocrRequest)
assert.True(t, err == nil)
bytes, err := ioutil.ReadFile("docs/testimage.png")
assert.True(t, err == nil)
ocrRequest.ImgBytes = bytes
engine := NewOcrEngine(ocrRequest.EngineType)
result, err := engine.ProcessRequest(ocrRequest)
logg.LogTo("TEST", "err: %v", err)
assert.True(t, err == nil)
logg.LogTo("TEST", "result: %v", result)
}
}
func TestNewTesseractEngineArgs(t *testing.T) {
testJson := `{"engine":"tesseract", "engine_args":{"config_vars":{"tessedit_char_whitelist":"0123456789"}, "psm":"0", "lang":"jpn"}}`
ocrRequest := OcrRequest{}
err := json.Unmarshal([]byte(testJson), &ocrRequest)
assert.True(t, err == nil)
engineArgs, err := NewTesseractEngineArgs(ocrRequest)
assert.True(t, err == nil)
assert.Equals(t, len(engineArgs.configVars), 1)
assert.Equals(t, engineArgs.configVars["tessedit_char_whitelist"], "0123456789")
assert.Equals(t, engineArgs.pageSegMode, "0")
assert.Equals(t, engineArgs.lang, "jpn")
}
func TestTesseractEngineWithFile(t *testing.T) {
if testing.Short() {
t.Skip("skipping test in short mode.")
}
engine := TesseractEngine{}
engineArgs := TesseractEngineArgs{}
result, err := engine.processImageFile("docs/testimage.png", engineArgs)
assert.True(t, err == nil)
logg.LogTo("TEST", "result: %v", result)
}