├── .clang-format ├── CMakeLists.txt ├── LICENSE ├── README.md ├── automata ├── CMakeLists.txt ├── ac_iterator.h ├── aho_corasick.h ├── attr_fsm.h ├── automata.cpp ├── automata.h ├── compact_trie.h ├── flat_transitions.h ├── flex_transitions.h ├── fsm.h ├── fsm_defs.h ├── nfa.h ├── nfa_operations.h ├── nfa_printer.h ├── serializer.h ├── test │ ├── CMakeLists.txt │ ├── ac_test.cpp │ └── trie_test.cpp └── trie.h ├── cmake ├── AddBoostTests.cmake ├── Build.cmake └── FindLog4cplus.cmake ├── encode ├── CMakeLists.txt ├── char_iterator.h ├── char_unicode32_decoder.cpp ├── char_unicode32_decoder.h ├── test │ ├── CMakeLists.txt │ ├── char_iterator_test.cpp │ └── utf8_iterator_test.cpp ├── utf8_generator.h └── utf8_iterator.h ├── examples ├── CMakeLists.txt ├── morpher.cpp └── symbol_iterator.cpp ├── morpho ├── CMakeLists.txt ├── alphabets │ ├── alphabet.h │ ├── eng_alphabet.h │ └── rus_alphabet.h ├── aot │ ├── CMakeLists.txt │ ├── aot_parser.h │ ├── eng_aot_parser.h │ ├── eng_morphs.txt │ ├── eng_tabs.txt │ ├── main.cpp │ ├── rus_aot_parser.h │ ├── rus_morphs.txt │ └── rus_tabs.txt ├── models │ ├── CMakeLists.txt │ ├── eng_model.h │ ├── eng_model_description.h │ ├── model.h │ ├── rus_model.h │ ├── rus_model_description.h │ └── test │ │ ├── CMakeLists.txt │ │ └── rus_model_test.cpp └── morpholib │ ├── CMakeLists.txt │ ├── base_storage.cpp │ ├── base_storage.h │ ├── morpho.cpp │ ├── morpho.h │ ├── morpho_modifier.h │ ├── suffix_storage.cpp │ ├── suffix_storage.h │ └── test │ ├── CMakeLists.txt │ └── test.cpp ├── style ├── cpplint.py ├── style_check.sh └── style_check_dir.sh ├── symbols ├── CMakeLists.txt ├── UnicodeData.txt ├── Unihan_Readings.txt ├── st_generator.py ├── symbols.h ├── test │ ├── CMakeLists.txt │ └── test.cpp ├── unihan_generator.py └── unihan_table.cpp ├── ut-data └── ut_main.cpp └── utility ├── filter_iterator.h ├── ngram_iterator.h ├── symbol_iterator.h ├── test ├── CMakeLists.txt └── test.cpp └── word_iterator.h /.clang-format: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/.clang-format -------------------------------------------------------------------------------- /CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/CMakeLists.txt -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/README.md -------------------------------------------------------------------------------- /automata/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/automata/CMakeLists.txt -------------------------------------------------------------------------------- /automata/ac_iterator.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/automata/ac_iterator.h -------------------------------------------------------------------------------- /automata/aho_corasick.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/automata/aho_corasick.h -------------------------------------------------------------------------------- /automata/attr_fsm.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/automata/attr_fsm.h -------------------------------------------------------------------------------- /automata/automata.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/automata/automata.cpp -------------------------------------------------------------------------------- /automata/automata.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/automata/automata.h -------------------------------------------------------------------------------- /automata/compact_trie.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/automata/compact_trie.h -------------------------------------------------------------------------------- /automata/flat_transitions.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/automata/flat_transitions.h -------------------------------------------------------------------------------- /automata/flex_transitions.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/automata/flex_transitions.h -------------------------------------------------------------------------------- /automata/fsm.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/automata/fsm.h -------------------------------------------------------------------------------- /automata/fsm_defs.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/automata/fsm_defs.h -------------------------------------------------------------------------------- /automata/nfa.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/automata/nfa.h -------------------------------------------------------------------------------- /automata/nfa_operations.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/automata/nfa_operations.h -------------------------------------------------------------------------------- /automata/nfa_printer.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/automata/nfa_printer.h -------------------------------------------------------------------------------- /automata/serializer.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/automata/serializer.h -------------------------------------------------------------------------------- /automata/test/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/automata/test/CMakeLists.txt -------------------------------------------------------------------------------- /automata/test/ac_test.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/automata/test/ac_test.cpp -------------------------------------------------------------------------------- /automata/test/trie_test.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/automata/test/trie_test.cpp -------------------------------------------------------------------------------- /automata/trie.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/automata/trie.h -------------------------------------------------------------------------------- /cmake/AddBoostTests.cmake: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/cmake/AddBoostTests.cmake -------------------------------------------------------------------------------- /cmake/Build.cmake: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/cmake/Build.cmake -------------------------------------------------------------------------------- /cmake/FindLog4cplus.cmake: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/cmake/FindLog4cplus.cmake -------------------------------------------------------------------------------- /encode/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/encode/CMakeLists.txt -------------------------------------------------------------------------------- /encode/char_iterator.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/encode/char_iterator.h -------------------------------------------------------------------------------- /encode/char_unicode32_decoder.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/encode/char_unicode32_decoder.cpp -------------------------------------------------------------------------------- /encode/char_unicode32_decoder.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/encode/char_unicode32_decoder.h -------------------------------------------------------------------------------- /encode/test/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/encode/test/CMakeLists.txt -------------------------------------------------------------------------------- /encode/test/char_iterator_test.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/encode/test/char_iterator_test.cpp -------------------------------------------------------------------------------- /encode/test/utf8_iterator_test.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/encode/test/utf8_iterator_test.cpp -------------------------------------------------------------------------------- /encode/utf8_generator.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/encode/utf8_generator.h -------------------------------------------------------------------------------- /encode/utf8_iterator.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/encode/utf8_iterator.h -------------------------------------------------------------------------------- /examples/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/examples/CMakeLists.txt -------------------------------------------------------------------------------- /examples/morpher.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/examples/morpher.cpp -------------------------------------------------------------------------------- /examples/symbol_iterator.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/examples/symbol_iterator.cpp -------------------------------------------------------------------------------- /morpho/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/CMakeLists.txt -------------------------------------------------------------------------------- /morpho/alphabets/alphabet.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/alphabets/alphabet.h -------------------------------------------------------------------------------- /morpho/alphabets/eng_alphabet.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/alphabets/eng_alphabet.h -------------------------------------------------------------------------------- /morpho/alphabets/rus_alphabet.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/alphabets/rus_alphabet.h -------------------------------------------------------------------------------- /morpho/aot/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/aot/CMakeLists.txt -------------------------------------------------------------------------------- /morpho/aot/aot_parser.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/aot/aot_parser.h -------------------------------------------------------------------------------- /morpho/aot/eng_aot_parser.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/aot/eng_aot_parser.h -------------------------------------------------------------------------------- /morpho/aot/eng_morphs.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/aot/eng_morphs.txt -------------------------------------------------------------------------------- /morpho/aot/eng_tabs.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/aot/eng_tabs.txt -------------------------------------------------------------------------------- /morpho/aot/main.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/aot/main.cpp -------------------------------------------------------------------------------- /morpho/aot/rus_aot_parser.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/aot/rus_aot_parser.h -------------------------------------------------------------------------------- /morpho/aot/rus_morphs.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/aot/rus_morphs.txt -------------------------------------------------------------------------------- /morpho/aot/rus_tabs.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/aot/rus_tabs.txt -------------------------------------------------------------------------------- /morpho/models/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/models/CMakeLists.txt -------------------------------------------------------------------------------- /morpho/models/eng_model.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/models/eng_model.h -------------------------------------------------------------------------------- /morpho/models/eng_model_description.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/models/eng_model_description.h -------------------------------------------------------------------------------- /morpho/models/model.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/models/model.h -------------------------------------------------------------------------------- /morpho/models/rus_model.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/models/rus_model.h -------------------------------------------------------------------------------- /morpho/models/rus_model_description.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/models/rus_model_description.h -------------------------------------------------------------------------------- /morpho/models/test/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/models/test/CMakeLists.txt -------------------------------------------------------------------------------- /morpho/models/test/rus_model_test.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/models/test/rus_model_test.cpp -------------------------------------------------------------------------------- /morpho/morpholib/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/morpholib/CMakeLists.txt -------------------------------------------------------------------------------- /morpho/morpholib/base_storage.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/morpholib/base_storage.cpp -------------------------------------------------------------------------------- /morpho/morpholib/base_storage.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/morpholib/base_storage.h -------------------------------------------------------------------------------- /morpho/morpholib/morpho.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/morpholib/morpho.cpp -------------------------------------------------------------------------------- /morpho/morpholib/morpho.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/morpholib/morpho.h -------------------------------------------------------------------------------- /morpho/morpholib/morpho_modifier.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/morpholib/morpho_modifier.h -------------------------------------------------------------------------------- /morpho/morpholib/suffix_storage.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/morpholib/suffix_storage.cpp -------------------------------------------------------------------------------- /morpho/morpholib/suffix_storage.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/morpholib/suffix_storage.h -------------------------------------------------------------------------------- /morpho/morpholib/test/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/morpholib/test/CMakeLists.txt -------------------------------------------------------------------------------- /morpho/morpholib/test/test.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/morpho/morpholib/test/test.cpp -------------------------------------------------------------------------------- /style/cpplint.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/style/cpplint.py -------------------------------------------------------------------------------- /style/style_check.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/style/style_check.sh -------------------------------------------------------------------------------- /style/style_check_dir.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/style/style_check_dir.sh -------------------------------------------------------------------------------- /symbols/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/symbols/CMakeLists.txt -------------------------------------------------------------------------------- /symbols/UnicodeData.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/symbols/UnicodeData.txt -------------------------------------------------------------------------------- /symbols/Unihan_Readings.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/symbols/Unihan_Readings.txt -------------------------------------------------------------------------------- /symbols/st_generator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/symbols/st_generator.py -------------------------------------------------------------------------------- /symbols/symbols.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/symbols/symbols.h -------------------------------------------------------------------------------- /symbols/test/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/symbols/test/CMakeLists.txt -------------------------------------------------------------------------------- /symbols/test/test.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/symbols/test/test.cpp -------------------------------------------------------------------------------- /symbols/unihan_generator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/symbols/unihan_generator.py -------------------------------------------------------------------------------- /symbols/unihan_table.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/symbols/unihan_table.cpp -------------------------------------------------------------------------------- /ut-data/ut_main.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/ut-data/ut_main.cpp -------------------------------------------------------------------------------- /utility/filter_iterator.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/utility/filter_iterator.h -------------------------------------------------------------------------------- /utility/ngram_iterator.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/utility/ngram_iterator.h -------------------------------------------------------------------------------- /utility/symbol_iterator.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/utility/symbol_iterator.h -------------------------------------------------------------------------------- /utility/test/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/utility/test/CMakeLists.txt -------------------------------------------------------------------------------- /utility/test/test.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/utility/test/test.cpp -------------------------------------------------------------------------------- /utility/word_iterator.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/merfill/strutext/HEAD/utility/word_iterator.h --------------------------------------------------------------------------------