stringcompare.preprocessing package

class stringcompare.preprocessing.DeepparseAddressTagger(deepparse_handle)[source]

Bases: Tagger

LABELS = ['StreetNumber', 'StreetName', 'Unit', 'Municipality', 'Province', 'PostalCode', 'Orientation', 'GeneralDelivery']
batch_tag(objs: List) → List[Dict][source]
tag(obj) → Dict[source]
class stringcompare.preprocessing.DelimTokenizer(delim=' ')[source]

Bases: Tokenizer

tokenize(sentence)[source]
class stringcompare.preprocessing.NGramTokenizer(n)[source]

Bases: Tokenizer

tokenize(sentence)[source]
class stringcompare.preprocessing.Tagger[source]

Bases: ABC

abstract property LABELS
batch_tag(objs: List) → List[Dict][source]
abstractmethod tag(obj) → Dict[source]
class stringcompare.preprocessing.Tokenizer[source]

Bases: ABC

String tokenization interface.

batch_tokenize(sentences)[source]
abstractmethod tokenize(sentence)[source]
class stringcompare.preprocessing.WhitespaceTokenizer[source]

Bases: DelimTokenizer

Submodules

stringcompare.preprocessing.tagger module

class stringcompare.preprocessing.tagger.DeepparseAddressTagger(deepparse_handle)[source]

Bases: Tagger

LABELS = ['StreetNumber', 'StreetName', 'Unit', 'Municipality', 'Province', 'PostalCode', 'Orientation', 'GeneralDelivery']
batch_tag(objs: List) → List[Dict][source]
tag(obj) → Dict[source]
class stringcompare.preprocessing.tagger.Tagger[source]

Bases: ABC

abstract property LABELS
batch_tag(objs: List) → List[Dict][source]
abstractmethod tag(obj) → Dict[source]

stringcompare.preprocessing.tokenizer module

class stringcompare.preprocessing.tokenizer.DelimTokenizer(delim=' ')[source]

Bases: Tokenizer

tokenize(sentence)[source]
class stringcompare.preprocessing.tokenizer.NGramTokenizer(n)[source]

Bases: Tokenizer

tokenize(sentence)[source]
class stringcompare.preprocessing.tokenizer.Tokenizer[source]

Bases: ABC

String tokenization interface.

batch_tokenize(sentences)[source]
abstractmethod tokenize(sentence)[source]
class stringcompare.preprocessing.tokenizer.WhitespaceTokenizer[source]

Bases: DelimTokenizer