.gitignore
.gitmodules
CHANGELOG.md
LICENSE
README.md
requirements.txt
setup.py
.github/stale.yml
bicleaner_hardrules.egg-info/PKG-INFO
bicleaner_hardrules.egg-info/SOURCES.txt
bicleaner_hardrules.egg-info/dependency_links.txt
bicleaner_hardrules.egg-info/requires.txt
bicleaner_hardrules.egg-info/top_level.txt
hardrules/__init__.py
hardrules/bicleaner_hardrules.py
hardrules/hardrules.py
hardrules/lm.py
hardrules/tokenizer.py
hardrules/training.py
hardrules/unicodedata2.py
hardrules/util.py
hardrules/../requirements.txt
kenlm/.gitignore
kenlm/BUILDING
kenlm/CMakeLists.txt
kenlm/COPYING
kenlm/COPYING.3
kenlm/COPYING.LESSER.3
kenlm/Doxyfile
kenlm/LICENSE
kenlm/MANIFEST.in
kenlm/README.md
kenlm/clean_query_only.sh
kenlm/compile_query_only.sh
kenlm/setup.py
kenlm/.github/workflows/mac.yml
kenlm/.github/workflows/ubuntu.yml
kenlm/.github/workflows/windows.yml
kenlm/cmake/KenLMFunctions.cmake
kenlm/cmake/kenlmConfig.cmake.in
kenlm/cmake/modules/FindEigen3.cmake
kenlm/lm/CMakeLists.txt
kenlm/lm/bhiksha.cc
kenlm/lm/bhiksha.hh
kenlm/lm/binary_format.cc
kenlm/lm/binary_format.hh
kenlm/lm/blank.hh
kenlm/lm/build_binary_main.cc
kenlm/lm/config.cc
kenlm/lm/config.hh
kenlm/lm/enumerate_vocab.hh
kenlm/lm/facade.hh
kenlm/lm/fragment_main.cc
kenlm/lm/kenlm_benchmark_main.cc
kenlm/lm/left.hh
kenlm/lm/left_test.cc
kenlm/lm/lm_exception.cc
kenlm/lm/lm_exception.hh
kenlm/lm/max_order.hh
kenlm/lm/model.cc
kenlm/lm/model.hh
kenlm/lm/model_test.cc
kenlm/lm/model_type.hh
kenlm/lm/ngram_query.hh
kenlm/lm/partial.hh
kenlm/lm/partial_test.cc
kenlm/lm/quantize.cc
kenlm/lm/quantize.hh
kenlm/lm/query_main.cc
kenlm/lm/read_arpa.cc
kenlm/lm/read_arpa.hh
kenlm/lm/return.hh
kenlm/lm/search_hashed.cc
kenlm/lm/search_hashed.hh
kenlm/lm/search_trie.cc
kenlm/lm/search_trie.hh
kenlm/lm/sizes.cc
kenlm/lm/sizes.hh
kenlm/lm/state.hh
kenlm/lm/test.arpa
kenlm/lm/test_nounk.arpa
kenlm/lm/trie.cc
kenlm/lm/trie.hh
kenlm/lm/trie_sort.cc
kenlm/lm/trie_sort.hh
kenlm/lm/value.hh
kenlm/lm/value_build.cc
kenlm/lm/value_build.hh
kenlm/lm/virtual_interface.cc
kenlm/lm/virtual_interface.hh
kenlm/lm/vocab.cc
kenlm/lm/vocab.hh
kenlm/lm/weights.hh
kenlm/lm/word_index.hh
kenlm/lm/builder/CMakeLists.txt
kenlm/lm/builder/README.md
kenlm/lm/builder/TODO
kenlm/lm/builder/adjust_counts.cc
kenlm/lm/builder/adjust_counts.hh
kenlm/lm/builder/adjust_counts_test.cc
kenlm/lm/builder/combine_counts.hh
kenlm/lm/builder/corpus_count.cc
kenlm/lm/builder/corpus_count.hh
kenlm/lm/builder/corpus_count_test.cc
kenlm/lm/builder/count_ngrams_main.cc
kenlm/lm/builder/debug_print.hh
kenlm/lm/builder/discount.hh
kenlm/lm/builder/dump_counts_main.cc
kenlm/lm/builder/hash_gamma.hh
kenlm/lm/builder/header_info.hh
kenlm/lm/builder/initial_probabilities.cc
kenlm/lm/builder/initial_probabilities.hh
kenlm/lm/builder/interpolate.cc
kenlm/lm/builder/interpolate.hh
kenlm/lm/builder/lmplz_main.cc
kenlm/lm/builder/output.cc
kenlm/lm/builder/output.hh
kenlm/lm/builder/payload.hh
kenlm/lm/builder/pipeline.cc
kenlm/lm/builder/pipeline.hh
kenlm/lm/common/CMakeLists.txt
kenlm/lm/common/compare.hh
kenlm/lm/common/joint_order.hh
kenlm/lm/common/model_buffer.cc
kenlm/lm/common/model_buffer.hh
kenlm/lm/common/model_buffer_test.cc
kenlm/lm/common/ngram.hh
kenlm/lm/common/ngram_stream.hh
kenlm/lm/common/print.cc
kenlm/lm/common/print.hh
kenlm/lm/common/renumber.cc
kenlm/lm/common/renumber.hh
kenlm/lm/common/size_option.cc
kenlm/lm/common/size_option.hh
kenlm/lm/common/special.hh
kenlm/lm/common/test_data/generate.sh
kenlm/lm/common/test_data/toy0.arpa
kenlm/lm/common/test_data/toy1.arpa
kenlm/lm/common/test_data/bigendian/toy0.1
kenlm/lm/common/test_data/bigendian/toy0.2
kenlm/lm/common/test_data/bigendian/toy0.3
kenlm/lm/common/test_data/bigendian/toy0.kenlm_intermediate
kenlm/lm/common/test_data/bigendian/toy0.vocab
kenlm/lm/common/test_data/bigendian/toy1.1
kenlm/lm/common/test_data/bigendian/toy1.2
kenlm/lm/common/test_data/bigendian/toy1.3
kenlm/lm/common/test_data/bigendian/toy1.kenlm_intermediate
kenlm/lm/common/test_data/bigendian/toy1.vocab
kenlm/lm/common/test_data/littleendian/toy0.1
kenlm/lm/common/test_data/littleendian/toy0.2
kenlm/lm/common/test_data/littleendian/toy0.3
kenlm/lm/common/test_data/littleendian/toy0.kenlm_intermediate
kenlm/lm/common/test_data/littleendian/toy0.vocab
kenlm/lm/common/test_data/littleendian/toy1.1
kenlm/lm/common/test_data/littleendian/toy1.2
kenlm/lm/common/test_data/littleendian/toy1.3
kenlm/lm/common/test_data/littleendian/toy1.kenlm_intermediate
kenlm/lm/common/test_data/littleendian/toy1.vocab
kenlm/lm/filter/CMakeLists.txt
kenlm/lm/filter/arpa_io.cc
kenlm/lm/filter/arpa_io.hh
kenlm/lm/filter/count_io.hh
kenlm/lm/filter/filter_main.cc
kenlm/lm/filter/format.hh
kenlm/lm/filter/phrase.cc
kenlm/lm/filter/phrase.hh
kenlm/lm/filter/phrase_table_vocab_main.cc
kenlm/lm/filter/thread.hh
kenlm/lm/filter/vocab.cc
kenlm/lm/filter/vocab.hh
kenlm/lm/filter/wrapper.hh
kenlm/lm/interpolate/CMakeLists.txt
kenlm/lm/interpolate/backoff_matrix.hh
kenlm/lm/interpolate/backoff_reunification.cc
kenlm/lm/interpolate/backoff_reunification.hh
kenlm/lm/interpolate/backoff_reunification_test.cc
kenlm/lm/interpolate/bounded_sequence_encoding.cc
kenlm/lm/interpolate/bounded_sequence_encoding.hh
kenlm/lm/interpolate/bounded_sequence_encoding_test.cc
kenlm/lm/interpolate/interpolate_info.hh
kenlm/lm/interpolate/interpolate_main.cc
kenlm/lm/interpolate/merge_probabilities.cc
kenlm/lm/interpolate/merge_probabilities.hh
kenlm/lm/interpolate/merge_vocab.cc
kenlm/lm/interpolate/merge_vocab.hh
kenlm/lm/interpolate/merge_vocab_test.cc
kenlm/lm/interpolate/normalize.cc
kenlm/lm/interpolate/normalize.hh
kenlm/lm/interpolate/normalize_test.cc
kenlm/lm/interpolate/pipeline.cc
kenlm/lm/interpolate/pipeline.hh
kenlm/lm/interpolate/split_worker.cc
kenlm/lm/interpolate/split_worker.hh
kenlm/lm/interpolate/streaming_example_main.cc
kenlm/lm/interpolate/tune_derivatives.cc
kenlm/lm/interpolate/tune_derivatives.hh
kenlm/lm/interpolate/tune_derivatives_test.cc
kenlm/lm/interpolate/tune_instances.cc
kenlm/lm/interpolate/tune_instances.hh
kenlm/lm/interpolate/tune_instances_test.cc
kenlm/lm/interpolate/tune_matrix.hh
kenlm/lm/interpolate/tune_weights.cc
kenlm/lm/interpolate/tune_weights.hh
kenlm/lm/interpolate/universal_vocab.cc
kenlm/lm/interpolate/universal_vocab.hh
kenlm/lm/wrappers/README
kenlm/lm/wrappers/nplm.cc
kenlm/lm/wrappers/nplm.hh
kenlm/python/CMakeLists.txt
kenlm/python/_kenlm.pxd
kenlm/python/example.py
kenlm/python/kenlm.cpp
kenlm/python/kenlm.pyx
kenlm/python/score_sentence.cc
kenlm/python/score_sentence.hh
kenlm/util/CMakeLists.txt
kenlm/util/bit_packing.cc
kenlm/util/bit_packing.hh
kenlm/util/bit_packing_test.cc
kenlm/util/cat_compressed_main.cc
kenlm/util/ersatz_progress.cc
kenlm/util/ersatz_progress.hh
kenlm/util/exception.cc
kenlm/util/exception.hh
kenlm/util/fake_ostream.hh
kenlm/util/file.cc
kenlm/util/file.hh
kenlm/util/file_piece.cc
kenlm/util/file_piece.hh
kenlm/util/file_piece_test.cc
kenlm/util/file_stream.hh
kenlm/util/fixed_array.hh
kenlm/util/float_to_string.cc
kenlm/util/float_to_string.hh
kenlm/util/getopt.c
kenlm/util/getopt.hh
kenlm/util/have.hh
kenlm/util/integer_to_string.cc
kenlm/util/integer_to_string.hh
kenlm/util/integer_to_string_test.cc
kenlm/util/joint_sort.hh
kenlm/util/joint_sort_test.cc
kenlm/util/mmap.cc
kenlm/util/mmap.hh
kenlm/util/multi_intersection.hh
kenlm/util/multi_intersection_test.cc
kenlm/util/murmur_hash.cc
kenlm/util/murmur_hash.hh
kenlm/util/parallel_read.cc
kenlm/util/parallel_read.hh
kenlm/util/pcqueue.hh
kenlm/util/pcqueue_test.cc
kenlm/util/pool.cc
kenlm/util/pool.hh
kenlm/util/probing_hash_table.hh
kenlm/util/probing_hash_table_benchmark_main.cc
kenlm/util/probing_hash_table_test.cc
kenlm/util/proxy_iterator.hh
kenlm/util/read_compressed.cc
kenlm/util/read_compressed.hh
kenlm/util/read_compressed_test.cc
kenlm/util/scoped.cc
kenlm/util/scoped.hh
kenlm/util/sized_iterator.hh
kenlm/util/sized_iterator_test.cc
kenlm/util/sorted_uniform.hh
kenlm/util/sorted_uniform_test.cc
kenlm/util/spaces.cc
kenlm/util/spaces.hh
kenlm/util/string_piece.cc
kenlm/util/string_piece.hh
kenlm/util/string_piece_hash.hh
kenlm/util/string_stream.hh
kenlm/util/string_stream_test.cc
kenlm/util/thread_pool.hh
kenlm/util/tokenize_piece.hh
kenlm/util/tokenize_piece_test.cc
kenlm/util/usage.cc
kenlm/util/usage.hh
kenlm/util/double-conversion/CMakeLists.txt
kenlm/util/double-conversion/LICENSE
kenlm/util/double-conversion/bignum-dtoa.cc
kenlm/util/double-conversion/bignum-dtoa.h
kenlm/util/double-conversion/bignum.cc
kenlm/util/double-conversion/bignum.h
kenlm/util/double-conversion/cached-powers.cc
kenlm/util/double-conversion/cached-powers.h
kenlm/util/double-conversion/diy-fp.h
kenlm/util/double-conversion/double-conversion.h
kenlm/util/double-conversion/double-to-string.cc
kenlm/util/double-conversion/double-to-string.h
kenlm/util/double-conversion/fast-dtoa.cc
kenlm/util/double-conversion/fast-dtoa.h
kenlm/util/double-conversion/fixed-dtoa.cc
kenlm/util/double-conversion/fixed-dtoa.h
kenlm/util/double-conversion/ieee.h
kenlm/util/double-conversion/string-to-double.cc
kenlm/util/double-conversion/string-to-double.h
kenlm/util/double-conversion/strtod.cc
kenlm/util/double-conversion/strtod.h
kenlm/util/double-conversion/utils.h
kenlm/util/stream/CMakeLists.txt
kenlm/util/stream/block.hh
kenlm/util/stream/chain.cc
kenlm/util/stream/chain.hh
kenlm/util/stream/config.hh
kenlm/util/stream/count_records.cc
kenlm/util/stream/count_records.hh
kenlm/util/stream/io.cc
kenlm/util/stream/io.hh
kenlm/util/stream/io_test.cc
kenlm/util/stream/line_input.cc
kenlm/util/stream/line_input.hh
kenlm/util/stream/multi_progress.cc
kenlm/util/stream/multi_progress.hh
kenlm/util/stream/multi_stream.hh
kenlm/util/stream/rewindable_stream.cc
kenlm/util/stream/rewindable_stream.hh
kenlm/util/stream/rewindable_stream_test.cc
kenlm/util/stream/sort.hh
kenlm/util/stream/sort_test.cc
kenlm/util/stream/stream.hh
kenlm/util/stream/stream_test.cc
kenlm/util/stream/typed_stream.hh
scripts/bicleaner-hardrules
tests/hardrules_test.py
tests/test-corpus.en-de
utils/download-pack.sh