LICENSE
MANIFEST.in
README.md
pyproject.toml
setup.py
compressor/__init__.py
compressor/semantic.py
compressor/minbpe/__init__.py
compressor/minbpe/base.py
compressor/minbpe/basic.py
compressor/minbpe/regex.py
compressor/resources/__init__.py
compressor/resources/en_stopwords.pkl
compressor/resources/lid.176.ftz
compressor/resources/pt_stopwords.pkl
compressor/resources/nltk_data/corpora/stopwords.zip
compressor/resources/nltk_data/corpora/wordnet.zip
compressor/resources/nltk_data/corpora/stopwords/README
compressor/resources/nltk_data/corpora/stopwords/albanian
compressor/resources/nltk_data/corpora/stopwords/arabic
compressor/resources/nltk_data/corpora/stopwords/azerbaijani
compressor/resources/nltk_data/corpora/stopwords/basque
compressor/resources/nltk_data/corpora/stopwords/belarusian
compressor/resources/nltk_data/corpora/stopwords/bengali
compressor/resources/nltk_data/corpora/stopwords/catalan
compressor/resources/nltk_data/corpora/stopwords/chinese
compressor/resources/nltk_data/corpora/stopwords/danish
compressor/resources/nltk_data/corpora/stopwords/dutch
compressor/resources/nltk_data/corpora/stopwords/english
compressor/resources/nltk_data/corpora/stopwords/finnish
compressor/resources/nltk_data/corpora/stopwords/french
compressor/resources/nltk_data/corpora/stopwords/german
compressor/resources/nltk_data/corpora/stopwords/greek
compressor/resources/nltk_data/corpora/stopwords/hebrew
compressor/resources/nltk_data/corpora/stopwords/hinglish
compressor/resources/nltk_data/corpora/stopwords/hungarian
compressor/resources/nltk_data/corpora/stopwords/indonesian
compressor/resources/nltk_data/corpora/stopwords/italian
compressor/resources/nltk_data/corpora/stopwords/kazakh
compressor/resources/nltk_data/corpora/stopwords/nepali
compressor/resources/nltk_data/corpora/stopwords/norwegian
compressor/resources/nltk_data/corpora/stopwords/portuguese
compressor/resources/nltk_data/corpora/stopwords/romanian
compressor/resources/nltk_data/corpora/stopwords/russian
compressor/resources/nltk_data/corpora/stopwords/slovene
compressor/resources/nltk_data/corpora/stopwords/spanish
compressor/resources/nltk_data/corpora/stopwords/swedish
compressor/resources/nltk_data/corpora/stopwords/tajik
compressor/resources/nltk_data/corpora/stopwords/tamil
compressor/resources/nltk_data/corpora/stopwords/turkish
compressor/resources/nltk_data/corpora/words/README
compressor/resources/nltk_data/corpora/words/en
compressor/resources/nltk_data/corpora/words/en-basic
compressor/resources/nltk_data/stemmers/rslp.zip
compressor/resources/nltk_data/stemmers/rslp/step0.pt
compressor/resources/nltk_data/stemmers/rslp/step1.pt
compressor/resources/nltk_data/stemmers/rslp/step2.pt
compressor/resources/nltk_data/stemmers/rslp/step3.pt
compressor/resources/nltk_data/stemmers/rslp/step4.pt
compressor/resources/nltk_data/stemmers/rslp/step5.pt
compressor/resources/nltk_data/stemmers/rslp/step6.pt
compressor/resources/nltk_data/taggers/averaged_perceptron_tagger/averaged_perceptron_tagger.pickle
compressor/resources/nltk_data/tokenizers/punkt.zip
compressor/resources/nltk_data/tokenizers/punkt/.DS_Store
compressor/resources/nltk_data/tokenizers/punkt/README
compressor/resources/nltk_data/tokenizers/punkt/czech.pickle
compressor/resources/nltk_data/tokenizers/punkt/danish.pickle
compressor/resources/nltk_data/tokenizers/punkt/dutch.pickle
compressor/resources/nltk_data/tokenizers/punkt/english.pickle
compressor/resources/nltk_data/tokenizers/punkt/estonian.pickle
compressor/resources/nltk_data/tokenizers/punkt/finnish.pickle
compressor/resources/nltk_data/tokenizers/punkt/french.pickle
compressor/resources/nltk_data/tokenizers/punkt/german.pickle
compressor/resources/nltk_data/tokenizers/punkt/greek.pickle
compressor/resources/nltk_data/tokenizers/punkt/italian.pickle
compressor/resources/nltk_data/tokenizers/punkt/malayalam.pickle
compressor/resources/nltk_data/tokenizers/punkt/norwegian.pickle
compressor/resources/nltk_data/tokenizers/punkt/polish.pickle
compressor/resources/nltk_data/tokenizers/punkt/portuguese.pickle
compressor/resources/nltk_data/tokenizers/punkt/russian.pickle
compressor/resources/nltk_data/tokenizers/punkt/slovene.pickle
compressor/resources/nltk_data/tokenizers/punkt/spanish.pickle
compressor/resources/nltk_data/tokenizers/punkt/swedish.pickle
compressor/resources/nltk_data/tokenizers/punkt/turkish.pickle
compressor/resources/nltk_data/tokenizers/punkt/PY3/README
compressor/resources/nltk_data/tokenizers/punkt/PY3/czech.pickle
compressor/resources/nltk_data/tokenizers/punkt/PY3/danish.pickle
compressor/resources/nltk_data/tokenizers/punkt/PY3/dutch.pickle
compressor/resources/nltk_data/tokenizers/punkt/PY3/english.pickle
compressor/resources/nltk_data/tokenizers/punkt/PY3/estonian.pickle
compressor/resources/nltk_data/tokenizers/punkt/PY3/finnish.pickle
compressor/resources/nltk_data/tokenizers/punkt/PY3/french.pickle
compressor/resources/nltk_data/tokenizers/punkt/PY3/german.pickle
compressor/resources/nltk_data/tokenizers/punkt/PY3/greek.pickle
compressor/resources/nltk_data/tokenizers/punkt/PY3/italian.pickle
compressor/resources/nltk_data/tokenizers/punkt/PY3/malayalam.pickle
compressor/resources/nltk_data/tokenizers/punkt/PY3/norwegian.pickle
compressor/resources/nltk_data/tokenizers/punkt/PY3/polish.pickle
compressor/resources/nltk_data/tokenizers/punkt/PY3/portuguese.pickle
compressor/resources/nltk_data/tokenizers/punkt/PY3/russian.pickle
compressor/resources/nltk_data/tokenizers/punkt/PY3/slovene.pickle
compressor/resources/nltk_data/tokenizers/punkt/PY3/spanish.pickle
compressor/resources/nltk_data/tokenizers/punkt/PY3/swedish.pickle
compressor/resources/nltk_data/tokenizers/punkt/PY3/turkish.pickle
semantic_compressor.egg-info/PKG-INFO
semantic_compressor.egg-info/SOURCES.txt
semantic_compressor.egg-info/dependency_links.txt
semantic_compressor.egg-info/requires.txt
semantic_compressor.egg-info/top_level.txt