Skip to content

Commit e700173

Browse files
committedMar 17, 2019
Add typos tests
Signed-off-by: Vadim Markovtsev <vadim@sourced.tech>
1 parent 92ca68a commit e700173

File tree

2 files changed

+224
-2
lines changed

2 files changed

+224
-2
lines changed
 

‎leaves/research/typos.go

+17-2
Original file line numberDiff line numberDiff line change
@@ -55,6 +55,10 @@ const (
5555
// DefaultMaximumAllowedTypoDistance is the default value of the maximum Levenshtein distance
5656
// between two identifiers to consider them a typo-fix pair.
5757
DefaultMaximumAllowedTypoDistance = 4
58+
// ConfigTyposDatasetMaximumAllowedDistance is the name of the configuration option
59+
// (`TyposDatasetBuilder.Configure()`) which sets the maximum Levenshtein distance between
60+
// two identifiers to consider them a typo-fix pair.
61+
ConfigTyposDatasetMaximumAllowedDistance = "TyposDatasetBuilder.MaximumAllowedDistance"
5862
)
5963

6064
// Name of this PipelineItem. Uniquely identifies the type, used for mapping keys, etc.
@@ -80,11 +84,22 @@ func (tdb *TyposDatasetBuilder) Requires() []string {
8084

8185
// ListConfigurationOptions returns the list of changeable public properties of this PipelineItem.
8286
func (tdb *TyposDatasetBuilder) ListConfigurationOptions() []core.ConfigurationOption {
83-
return nil
87+
options := [...]core.ConfigurationOption{{
88+
Name: ConfigTyposDatasetMaximumAllowedDistance,
89+
Description: "Maximum Levenshtein distance between two identifiers to consider them " +
90+
"a typo-fix pair.",
91+
Flag: "typos-max-distance",
92+
Type: core.IntConfigurationOption,
93+
Default: DefaultMaximumAllowedTypoDistance},
94+
}
95+
return options[:]
8496
}
8597

8698
// Configure sets the properties previously published by ListConfigurationOptions().
8799
func (tdb *TyposDatasetBuilder) Configure(facts map[string]interface{}) error {
100+
if val, exists := facts[ConfigTyposDatasetMaximumAllowedDistance].(int); exists {
101+
tdb.MaximumAllowedDistance = val
102+
}
88103
return nil
89104
}
90105

@@ -101,7 +116,7 @@ func (tdb *TyposDatasetBuilder) Description() string {
101116
// Initialize resets the temporary caches and prepares this PipelineItem for a series of Consume()
102117
// calls. The repository which is going to be analysed is supplied as an argument.
103118
func (tdb *TyposDatasetBuilder) Initialize(repository *git.Repository) error {
104-
if tdb.MaximumAllowedDistance == 0 {
119+
if tdb.MaximumAllowedDistance <= 0 {
105120
tdb.MaximumAllowedDistance = DefaultMaximumAllowedTypoDistance
106121
}
107122
tdb.lcontext = &levenshtein.Context{}

‎leaves/research/typos_test.go

+207
Original file line numberDiff line numberDiff line change
@@ -1 +1,208 @@
11
package research
2+
3+
import (
4+
"bytes"
5+
"testing"
6+
7+
"github.com/gogo/protobuf/proto"
8+
"github.com/stretchr/testify/assert"
9+
"gopkg.in/src-d/go-git.v4/plumbing"
10+
"gopkg.in/src-d/go-git.v4/plumbing/object"
11+
"gopkg.in/src-d/hercules.v9/internal/core"
12+
"gopkg.in/src-d/hercules.v9/internal/pb"
13+
items "gopkg.in/src-d/hercules.v9/internal/plumbing"
14+
uast_items "gopkg.in/src-d/hercules.v9/internal/plumbing/uast"
15+
"gopkg.in/src-d/hercules.v9/internal/test"
16+
)
17+
18+
func TestTyposDatasetMeta(t *testing.T) {
19+
tdb := TyposDatasetBuilder{}
20+
assert.Equal(t, tdb.Name(), "TyposDataset")
21+
assert.Len(t, tdb.Provides(), 0)
22+
required := [...]string{
23+
uast_items.DependencyUastChanges, items.DependencyFileDiff, items.DependencyBlobCache}
24+
for _, name := range required {
25+
assert.Contains(t, tdb.Requires(), name)
26+
}
27+
opts := tdb.ListConfigurationOptions()
28+
assert.Len(t, opts, 1)
29+
assert.Equal(t, opts[0].Name, ConfigTyposDatasetMaximumAllowedDistance)
30+
assert.Equal(t, opts[0].Type, core.IntConfigurationOption)
31+
assert.Equal(t, tdb.Flag(), "typos-dataset")
32+
}
33+
34+
func TestTyposDatasetRegistration(t *testing.T) {
35+
summoned := core.Registry.Summon((&TyposDatasetBuilder{}).Name())
36+
assert.Len(t, summoned, 1)
37+
assert.Equal(t, summoned[0].Name(), "TyposDataset")
38+
leaves := core.Registry.GetLeaves()
39+
matched := false
40+
for _, tp := range leaves {
41+
if tp.Flag() == (&TyposDatasetBuilder{}).Flag() {
42+
matched = true
43+
break
44+
}
45+
}
46+
assert.True(t, matched)
47+
}
48+
49+
func TestTyposDatasetConfigure(t *testing.T) {
50+
tdb := TyposDatasetBuilder{}
51+
facts := map[string]interface{}{}
52+
facts[ConfigTyposDatasetMaximumAllowedDistance] = 5
53+
assert.Nil(t, tdb.Configure(facts))
54+
assert.Equal(t, tdb.MaximumAllowedDistance, 5)
55+
facts = map[string]interface{}{}
56+
assert.Nil(t, tdb.Configure(facts))
57+
assert.Equal(t, tdb.MaximumAllowedDistance, 5)
58+
}
59+
60+
func AddHash(t *testing.T, cache map[plumbing.Hash]*items.CachedBlob, hash string) {
61+
objhash := plumbing.NewHash(hash)
62+
blob, err := test.Repository.BlobObject(objhash)
63+
assert.Nil(t, err)
64+
cb := &items.CachedBlob{Blob: *blob}
65+
err = cb.Cache()
66+
assert.Nil(t, err)
67+
cache[objhash] = cb
68+
}
69+
70+
func TestTyposDatasetConsume(t *testing.T) {
71+
deps := map[string]interface{}{}
72+
cache := map[plumbing.Hash]*items.CachedBlob{}
73+
AddHash(t, cache, "b9a12fd144274c99c7c9a0a32a0268f8b36d2f2c")
74+
AddHash(t, cache, "d5f8e61069136f3578457a3131800ede353527b8")
75+
AddHash(t, cache, "75bb0a09fc01db55d7322f0fae523453edba7846")
76+
deps[items.DependencyBlobCache] = cache
77+
changes := make(object.Changes, 2)
78+
treeFrom, _ := test.Repository.TreeObject(plumbing.NewHash(
79+
"eac25f9126db00e38fa72a59d49773a84580d4ce"))
80+
treeTo, _ := test.Repository.TreeObject(plumbing.NewHash(
81+
"828467b465864b1f757dcec9a034be49030fc8b9"))
82+
changes[0] = &object.Change{From: object.ChangeEntry{
83+
Name: "file_test.go",
84+
Tree: treeFrom,
85+
TreeEntry: object.TreeEntry{
86+
Name: "file_test.go",
87+
Mode: 0100644,
88+
Hash: plumbing.NewHash("75bb0a09fc01db55d7322f0fae523453edba7846"),
89+
},
90+
}, To: object.ChangeEntry{
91+
Name: "file_test.go",
92+
Tree: treeTo,
93+
TreeEntry: object.TreeEntry{
94+
Name: "file_test.go",
95+
Mode: 0100644,
96+
Hash: plumbing.NewHash("75bb0a09fc01db55d7322f0fae523453edba7846"),
97+
},
98+
}}
99+
changes[1] = &object.Change{From: object.ChangeEntry{}, To: object.ChangeEntry{
100+
Name: "blob_cache_test.go",
101+
Tree: treeTo,
102+
TreeEntry: object.TreeEntry{
103+
Name: "blob_cache_test.go",
104+
Mode: 0100644,
105+
Hash: plumbing.NewHash("b9a12fd144274c99c7c9a0a32a0268f8b36d2f2c"),
106+
},
107+
},
108+
}
109+
deps[items.DependencyTreeChanges] = changes
110+
deps[core.DependencyCommit], _ = test.Repository.CommitObject(plumbing.NewHash(
111+
"84165d3b02647fae12cc026c7a580045246e8c98"))
112+
deps[core.DependencyIsMerge] = false
113+
uastItem := &uast_items.Extractor{}
114+
assert.Nil(t, uastItem.Initialize(test.Repository))
115+
uastResult, err := uastItem.Consume(deps)
116+
assert.Nil(t, err)
117+
deps[uast_items.DependencyUasts] = uastResult[uast_items.DependencyUasts]
118+
uastChanges := &uast_items.Changes{}
119+
assert.Nil(t, uastChanges.Initialize(test.Repository))
120+
_, err = uastChanges.Consume(deps)
121+
assert.Nil(t, err)
122+
changes[0].To.TreeEntry.Hash = plumbing.NewHash("d5f8e61069136f3578457a3131800ede353527b8")
123+
uastResult, err = uastItem.Consume(deps)
124+
assert.Nil(t, err)
125+
deps[uast_items.DependencyUasts] = uastResult[uast_items.DependencyUasts]
126+
changesResult, err := uastChanges.Consume(deps)
127+
assert.Nil(t, err)
128+
deps[uast_items.DependencyUastChanges] = changesResult[uast_items.DependencyUastChanges]
129+
fd := &items.FileDiff{}
130+
assert.Nil(t, fd.Initialize(test.Repository))
131+
diffResult, err := fd.Consume(deps)
132+
assert.Nil(t, err)
133+
deps[items.DependencyFileDiff] = diffResult[items.DependencyFileDiff]
134+
135+
tbd := &TyposDatasetBuilder{}
136+
assert.Nil(t, tbd.Initialize(test.Repository))
137+
res, err := tbd.Consume(deps)
138+
assert.Nil(t, res)
139+
assert.Nil(t, err)
140+
assert.Len(t, tbd.typos, 4)
141+
assert.Equal(t, tbd.typos[0].Wrong, "TestZeroInitializeFile")
142+
assert.Equal(t, tbd.typos[0].Correct, "TestZeroInitialize")
143+
assert.Equal(t, tbd.typos[0].Commit, plumbing.NewHash(
144+
"84165d3b02647fae12cc026c7a580045246e8c98"))
145+
assert.Equal(t, tbd.typos[0].File, "file_test.go")
146+
assert.Equal(t, tbd.typos[0].Line, 74)
147+
148+
deps[core.DependencyIsMerge] = true
149+
res, err = tbd.Consume(deps)
150+
assert.Nil(t, res)
151+
assert.Nil(t, err)
152+
assert.Len(t, tbd.typos, 4)
153+
}
154+
155+
func fixtureTyposDataset() *TyposDatasetBuilder {
156+
tdb := TyposDatasetBuilder{}
157+
tdb.Initialize(test.Repository)
158+
tdb.typos = append(tdb.typos, Typo{
159+
Wrong: "Fo",
160+
Correct: "Foo",
161+
Commit: plumbing.ZeroHash,
162+
File: "bar.go",
163+
Line: 7,
164+
})
165+
return &tdb
166+
}
167+
168+
func TestTyposDatasetFinalize(t *testing.T) {
169+
tdb := fixtureTyposDataset()
170+
tdb.typos = append(tdb.typos, tdb.typos[0])
171+
x := tdb.Finalize().(TyposResult)
172+
assert.Len(t, x.Typos, 1)
173+
assert.Equal(t, x.Typos[0], Typo{
174+
Wrong: "Fo",
175+
Correct: "Foo",
176+
Commit: plumbing.ZeroHash,
177+
File: "bar.go",
178+
Line: 7,
179+
})
180+
}
181+
182+
func TestTyposDatasetSerialize(t *testing.T) {
183+
ca := fixtureTyposDataset()
184+
res := ca.Finalize().(TyposResult)
185+
buffer := &bytes.Buffer{}
186+
err := ca.Serialize(res, false, buffer)
187+
assert.Nil(t, err)
188+
assert.Equal(t, ` - wrong: Fo
189+
correct: Foo
190+
commit: 0000000000000000000000000000000000000000
191+
file: bar.go
192+
line: 7
193+
`, buffer.String())
194+
195+
buffer = &bytes.Buffer{}
196+
err = ca.Serialize(res, true, buffer)
197+
assert.Nil(t, err)
198+
msg := pb.TyposDataset{}
199+
assert.Nil(t, proto.Unmarshal(buffer.Bytes(), &msg))
200+
assert.Len(t, msg.Typos, 1)
201+
assert.Equal(t, *msg.Typos[0], pb.Typo{
202+
Wrong: "Fo",
203+
Correct: "Foo",
204+
Commit: "0000000000000000000000000000000000000000",
205+
File: "bar.go",
206+
Line: 7,
207+
})
208+
}

0 commit comments

Comments
 (0)
Please sign in to comment.