AUTHORS.rst
CONTRIBUTING.rst
HISTORY.rst
LICENSE
MANIFEST.in
README.md
setup.cfg
setup.py
MicroTokenizer/__init__.py
MicroTokenizer/pipeline.py
MicroTokenizer.egg-info/PKG-INFO
MicroTokenizer.egg-info/SOURCES.txt
MicroTokenizer.egg-info/dependency_links.txt
MicroTokenizer.egg-info/entry_points.txt
MicroTokenizer.egg-info/not-zip-safe
MicroTokenizer.egg-info/requires.txt
MicroTokenizer.egg-info/top_level.txt
MicroTokenizer/cli/__init__.py
MicroTokenizer/cli/main.py
MicroTokenizer/cli/commands/__init__.py
MicroTokenizer/cli/commands/train.py
MicroTokenizer/data_structures/__init__.py
MicroTokenizer/data_structures/dictionary.py
MicroTokenizer/data_structures/graph_builder.py
MicroTokenizer/data_structures/non_recursive_algorithm.py
MicroTokenizer/data_structures/train_dictionary.py
MicroTokenizer/data_structures/trie_algorithm.py
MicroTokenizer/encoding/BMES.py
MicroTokenizer/encoding/__init__.py
MicroTokenizer/ensemble/__init__.py
MicroTokenizer/ensemble/merge_solutions.py
MicroTokenizer/experimental/__init__.py
MicroTokenizer/model_data/A.pickle
MicroTokenizer/model_data/B.pickle
MicroTokenizer/model_data/dict.txt
MicroTokenizer/model_data/feature_func_list.pickle
MicroTokenizer/model_data/model.crfsuite
MicroTokenizer/model_data/vocabulary.pickle
MicroTokenizer/tokenizers/BMES.py
MicroTokenizer/tokenizers/__init__.py
MicroTokenizer/tokenizers/base_tokenizer.py
MicroTokenizer/tokenizers/dag_tokenizer.py
MicroTokenizer/tokenizers/hmm_tokenizer.py
MicroTokenizer/tokenizers/load_tokenizers.py
MicroTokenizer/tokenizers/whitespace_split_tokenizer.py
MicroTokenizer/tokenizers/crf/__init__.py
MicroTokenizer/tokenizers/crf/tokenizer.py
MicroTokenizer/tokenizers/crf/trainer.py
MicroTokenizer/tokenizers/ensemble/__init__.py
MicroTokenizer/tokenizers/ensemble/tokenizer.py
MicroTokenizer/tokenizers/max_match/__init__.py
MicroTokenizer/tokenizers/max_match/backward.py
MicroTokenizer/tokenizers/max_match/bidirectional.py
MicroTokenizer/tokenizers/max_match/forward.py
docs/Makefile
docs/authors.rst
docs/conf.py
docs/contributing.rst
docs/history.rst
docs/index.rst
docs/installation.rst
docs/make.bat
docs/readme.rst
docs/usage.rst
tests/__init__.py
tests/conftest.py
tests/test_pipeline.py
tests/tokenizers/__init__.py
tests/tokenizers/test_BaseTokenizerV2.py
tests/tokenizers/test_dag_tokenizer.py
tests/tokenizers/test_hmm_tokenizer.py
tests/tokenizers/crf/__init__.py
tests/tokenizers/crf/test_tokenizer.py
tests/tokenizers/ensemble/__init__.py
tests/tokenizers/ensemble/test_tokenizer.py
tests/tokenizers/max_match/__init__.py
tests/tokenizers/max_match/test_backward.py
tests/tokenizers/max_match/test_bidirectional.py
tests/tokenizers/max_match/test_forward.py
tests/tokenizers/unicode_script/__init__.py
tests/tokenizers/unicode_script/test_tokenizer.py
tests/training/__init__.py
tests/training/test_train.py
tests/training/test_train/data.txt