File tree Expand file tree Collapse file tree 1 file changed +7
-12
lines changed
Expand file tree Collapse file tree 1 file changed +7
-12
lines changed Original file line number Diff line number Diff line change 11class Tokenizer (object ):
2- """ A class to turn arbitrary inputs into integer classes. """
2+ """A class to turn arbitrary inputs into integer classes."""
33
44 def __init__ (self ):
55 # the default class for an unseen entry during test-time
6- self ._data = {' unk' : 1 }
7- self ._num_classes = 1
6+ self ._data = {" unk" : 1 }
7+ self .num_classes = 1
88 self .train = True
99 self .unknown = []
1010
1111 def __call__ (self , item ):
12- """ Check to see if the Tokenizer has seen `item` before, and if so,
12+ """Check to see if the Tokenizer has seen `item` before, and if so,
1313 return the integer class associated with it. Otherwise, if we're
1414 training, create a new integer class, otherwise return the 'unknown'
1515 class.
@@ -26,13 +26,8 @@ def __call__(self, item):
2626 else :
2727 # Record the unknown item, then return the unknown label
2828 self .unknown += [item ]
29- return self ._data ['unk' ]
30-
31- @property
32- def num_classes (self ) -> int :
33- """The maximum number of assigned classes"""
34- return self ._num_classes
29+ return self ._data ["unk" ]
3530
3631 def _add_token (self , item ):
37- self ._num_classes += 1
38- self ._data [item ] = self ._num_classes
32+ self .num_classes += 1
33+ self ._data [item ] = self .num_classes
You can’t perform that action at this time.
0 commit comments