├── .formatter ├── eclipse-formatter.xml └── license-header ├── .gitattributes ├── .github ├── FUNDING.yml └── workflows │ ├── build.yml │ ├── publish.yml │ └── release.yml ├── .gitignore ├── CHANGELOG.md ├── LICENSE-2.0.txt ├── README.md ├── benchmark ├── .gitignore ├── README.md ├── benchmark_multithread.sh ├── benchmark_run.sh ├── benchmark_setup.sh ├── commoncrawl.sh ├── jawikipedia.sh ├── kyoto-leads-corpus.sh ├── process_warc.py └── src │ └── com │ └── worksap │ └── nlp │ └── sudachi │ └── benchmark │ └── TokenizeMultiThread.java ├── docs ├── Sudachi.png ├── Sudachi.svg ├── _config.yml ├── _layouts │ └── default.html ├── development.md ├── favicon.ico ├── index.en.md ├── index.md ├── oov_handlers.md ├── tutorial.md ├── tutorial_plugin.md └── user_dict.md ├── gradle.properties ├── gradle └── wrapper │ ├── gradle-wrapper.jar │ └── gradle-wrapper.properties ├── gradlew ├── gradlew.bat ├── licenses └── javax.json-1.1.txt ├── settings.gradle └── src ├── jmh └── java │ └── com │ └── worksap │ └── nlp │ └── sudachi │ └── dictionary │ ├── DictionaryBuilderPerformanceTest.java │ ├── DoubleArrayLookupBench.java │ └── MemChannelJmh.kt ├── main ├── java │ └── com │ │ └── worksap │ │ └── nlp │ │ └── sudachi │ │ ├── Config.java │ │ ├── DefaultInputTextPlugin.java │ │ ├── Dictionary.java │ │ ├── DictionaryFactory.java │ │ ├── EditConnectionCostPlugin.java │ │ ├── IOTools.java │ │ ├── IgnoreYomiganaPlugin.java │ │ ├── InhibitConnectionPlugin.java │ │ ├── InputText.java │ │ ├── InputTextBuilder.java │ │ ├── InputTextPlugin.java │ │ ├── JapaneseDictionary.java │ │ ├── JapaneseTokenizer.java │ │ ├── JoinKatakanaOovPlugin.java │ │ ├── JoinNumericPlugin.java │ │ ├── Lattice.java │ │ ├── LatticeImpl.java │ │ ├── LatticeNode.java │ │ ├── LatticeNodeImpl.java │ │ ├── MMap.java │ │ ├── MeCabOovProviderPlugin.java │ │ ├── Morpheme.java │ │ ├── MorphemeFormatterPlugin.java │ │ ├── MorphemeImpl.java │ │ ├── MorphemeList.java │ │ ├── NumericParser.java │ │ ├── OovProviderPlugin.java │ │ ├── PartialPOS.java │ │ ├── PathAnchor.java │ │ ├── PathRewritePlugin.java │ │ ├── Plugin.java │ │ ├── PosMatcher.java │ │ ├── ProlongedSoundMarkInputTextPlugin.java │ │ ├── RegexOovProvider.java │ │ ├── SentenceSplittingAnalysis.java │ │ ├── SentenceSplittingLazyAnalysis.java │ │ ├── Settings.java │ │ ├── SimpleMorphemeFormatter.java │ │ ├── SimpleOovProviderPlugin.java │ │ ├── StringUtil.java │ │ ├── SudachiCommandLine.java │ │ ├── TextNormalizer.java │ │ ├── Tokenizer.java │ │ ├── UTF8InputText.java │ │ ├── UTF8InputTextBuilder.java │ │ ├── WordId.java │ │ ├── WordMask.java │ │ ├── WordSegmentationFormatter.java │ │ ├── dictionary │ │ ├── BinaryDictionary.java │ │ ├── CSVParser.java │ │ ├── CategoryType.java │ │ ├── CharacterCategory.java │ │ ├── Connection.java │ │ ├── DictionaryAccess.java │ │ ├── DictionaryBuilder.java │ │ ├── DictionaryHeader.java │ │ ├── DictionaryHeaderPrinter.java │ │ ├── DictionaryPrinter.java │ │ ├── DictionaryVersion.java │ │ ├── DoubleArrayLexicon.java │ │ ├── DoubleArrayLookup.java │ │ ├── Grammar.java │ │ ├── GrammarImpl.java │ │ ├── Lexicon.java │ │ ├── LexiconSet.java │ │ ├── POS.java │ │ ├── UserDictionaryBuilder.java │ │ ├── WordIdTable.java │ │ ├── WordInfo.java │ │ ├── WordInfoList.java │ │ ├── WordLookup.java │ │ ├── WordParameterList.java │ │ └── build │ │ │ ├── BuildStats.java │ │ │ ├── ConnectionMatrix.java │ │ │ ├── CsvLexicon.java │ │ │ ├── DicBuffer.java │ │ │ ├── DicBuilder.java │ │ │ ├── Index.java │ │ │ ├── InputFileException.java │ │ │ ├── ModelOutput.java │ │ │ ├── POSTable.java │ │ │ ├── Parameters.java │ │ │ ├── Progress.java │ │ │ ├── TrackingInputStream.java │ │ │ ├── WordIdResolver.java │ │ │ ├── WordLookup.java │ │ │ └── WriteDictionary.java │ │ └── sentdetect │ │ └── SentenceDetector.java └── resources │ ├── char.def │ ├── rewrite.def │ ├── sudachi.json │ ├── sudachi.logging.properties │ └── unk.def └── test ├── dict ├── lex.csv ├── matrix.def ├── user.csv └── user2.csv ├── java └── com │ └── worksap │ └── nlp │ └── sudachi │ ├── ConfigTest.kt │ ├── DefaultInputTextPluginTest.java │ ├── DictionaryFactoryTest.kt │ ├── IgnoreYomiganaPluginTest.java │ ├── InhibitConnectionPluginTest.java │ ├── JapaneseDictionaryTest.java │ ├── JapaneseTokenizerMaskTest.kt │ ├── JapaneseTokenizerStreamingTest.kt │ ├── JapaneseTokenizerTest.java │ ├── JoinKatakanaOovPluginTest.java │ ├── JoinNumericPluginTest.java │ ├── MMapTest.java │ ├── MeCabOovProviderPluginTest.java │ ├── MockGrammar.java │ ├── MockInputText.java │ ├── MorphemeImplTest.kt │ ├── NumericParserTest.java │ ├── OovProviderPluginTest.kt │ ├── PathAnchorTest.kt │ ├── PosMatcherTest.kt │ ├── ProlongedSoundMarkInputTextPluginTest.java │ ├── RegexOovProviderTest.kt │ ├── SettingsTest.java │ ├── StringUtilTest.kt │ ├── SudachiCommandLineTest.java │ ├── TestDictionary.kt │ ├── TestLoggingConfig.java │ ├── TextNormalizerTest.kt │ ├── UTF8InputTextTest.java │ ├── UserDictionaryTest.java │ ├── Utils.java │ ├── WordIdTest.kt │ ├── WordMaskTest.kt │ ├── dictionary │ ├── CSVParserTest.java │ ├── CharacterCategoryTest.java │ ├── DictionaryBuilderTest.java │ ├── DictionaryHeaderPrinterTest.java │ ├── DictionaryHeaderTest.java │ ├── DictionaryPrinterTest.java │ ├── DictionaryReader.java │ ├── DoubleArrayLexiconTest.java │ ├── GrammarImplTest.java │ ├── UserDictionaryBuilderTest.java │ └── build │ │ ├── ConnectionMatrixTest.kt │ │ ├── CsvLexiconTest.kt │ │ ├── DicBufferTest.kt │ │ ├── GrammarTest.kt │ │ ├── MemChannel.kt │ │ ├── ParametersTest.kt │ │ ├── SystemDicTest.kt │ │ └── UserDicTest.kt │ └── sentdetect │ └── SentenceDetectorTest.java └── resources ├── char.def ├── com └── worksap │ └── nlp │ └── sudachi │ └── dictionary │ └── build │ ├── one.csv │ ├── sudachi_dic_build.json │ └── test.matrix ├── dict ├── lex.csv ├── matrix.def ├── user.csv └── user2.csv ├── joinnumeric └── char.def ├── logging.properties ├── rewrite.def ├── rewrite_error_dup.def ├── rewrite_error_ignorelist.def ├── rewrite_error_replacelist.def ├── sudachi.json ├── sudachi_minimum.json └── sudachi_test_empty.json /.formatter/eclipse-formatter.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/.formatter/eclipse-formatter.xml -------------------------------------------------------------------------------- /.formatter/license-header: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/.formatter/license-header -------------------------------------------------------------------------------- /.gitattributes: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/.gitattributes -------------------------------------------------------------------------------- /.github/FUNDING.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/.github/FUNDING.yml -------------------------------------------------------------------------------- /.github/workflows/build.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/.github/workflows/build.yml -------------------------------------------------------------------------------- /.github/workflows/publish.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/.github/workflows/publish.yml -------------------------------------------------------------------------------- /.github/workflows/release.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/.github/workflows/release.yml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/.gitignore -------------------------------------------------------------------------------- /CHANGELOG.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/CHANGELOG.md -------------------------------------------------------------------------------- /LICENSE-2.0.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/LICENSE-2.0.txt -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/README.md -------------------------------------------------------------------------------- /benchmark/.gitignore: -------------------------------------------------------------------------------- 1 | data/ 2 | -------------------------------------------------------------------------------- /benchmark/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/benchmark/README.md -------------------------------------------------------------------------------- /benchmark/benchmark_multithread.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/benchmark/benchmark_multithread.sh -------------------------------------------------------------------------------- /benchmark/benchmark_run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/benchmark/benchmark_run.sh -------------------------------------------------------------------------------- /benchmark/benchmark_setup.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/benchmark/benchmark_setup.sh -------------------------------------------------------------------------------- /benchmark/commoncrawl.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/benchmark/commoncrawl.sh -------------------------------------------------------------------------------- /benchmark/jawikipedia.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/benchmark/jawikipedia.sh -------------------------------------------------------------------------------- /benchmark/kyoto-leads-corpus.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/benchmark/kyoto-leads-corpus.sh -------------------------------------------------------------------------------- /benchmark/process_warc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/benchmark/process_warc.py -------------------------------------------------------------------------------- /benchmark/src/com/worksap/nlp/sudachi/benchmark/TokenizeMultiThread.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/benchmark/src/com/worksap/nlp/sudachi/benchmark/TokenizeMultiThread.java -------------------------------------------------------------------------------- /docs/Sudachi.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/docs/Sudachi.png -------------------------------------------------------------------------------- /docs/Sudachi.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/docs/Sudachi.svg -------------------------------------------------------------------------------- /docs/_config.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/docs/_config.yml -------------------------------------------------------------------------------- /docs/_layouts/default.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/docs/_layouts/default.html -------------------------------------------------------------------------------- /docs/development.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/docs/development.md -------------------------------------------------------------------------------- /docs/favicon.ico: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/docs/favicon.ico -------------------------------------------------------------------------------- /docs/index.en.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/docs/index.en.md -------------------------------------------------------------------------------- /docs/index.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/docs/index.md -------------------------------------------------------------------------------- /docs/oov_handlers.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/docs/oov_handlers.md -------------------------------------------------------------------------------- /docs/tutorial.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/docs/tutorial.md -------------------------------------------------------------------------------- /docs/tutorial_plugin.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/docs/tutorial_plugin.md -------------------------------------------------------------------------------- /docs/user_dict.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/docs/user_dict.md -------------------------------------------------------------------------------- /gradle.properties: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/gradle.properties -------------------------------------------------------------------------------- /gradle/wrapper/gradle-wrapper.jar: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/gradle/wrapper/gradle-wrapper.jar -------------------------------------------------------------------------------- /gradle/wrapper/gradle-wrapper.properties: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/gradle/wrapper/gradle-wrapper.properties -------------------------------------------------------------------------------- /gradlew: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/gradlew -------------------------------------------------------------------------------- /gradlew.bat: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/gradlew.bat -------------------------------------------------------------------------------- /licenses/javax.json-1.1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/licenses/javax.json-1.1.txt -------------------------------------------------------------------------------- /settings.gradle: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/settings.gradle -------------------------------------------------------------------------------- /src/jmh/java/com/worksap/nlp/sudachi/dictionary/DictionaryBuilderPerformanceTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/jmh/java/com/worksap/nlp/sudachi/dictionary/DictionaryBuilderPerformanceTest.java -------------------------------------------------------------------------------- /src/jmh/java/com/worksap/nlp/sudachi/dictionary/DoubleArrayLookupBench.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/jmh/java/com/worksap/nlp/sudachi/dictionary/DoubleArrayLookupBench.java -------------------------------------------------------------------------------- /src/jmh/java/com/worksap/nlp/sudachi/dictionary/MemChannelJmh.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/jmh/java/com/worksap/nlp/sudachi/dictionary/MemChannelJmh.kt -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/Config.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/Config.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/DefaultInputTextPlugin.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/DefaultInputTextPlugin.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/Dictionary.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/Dictionary.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/DictionaryFactory.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/DictionaryFactory.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/EditConnectionCostPlugin.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/EditConnectionCostPlugin.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/IOTools.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/IOTools.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/IgnoreYomiganaPlugin.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/IgnoreYomiganaPlugin.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/InhibitConnectionPlugin.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/InhibitConnectionPlugin.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/InputText.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/InputText.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/InputTextBuilder.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/InputTextBuilder.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/InputTextPlugin.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/InputTextPlugin.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/JapaneseDictionary.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/JapaneseDictionary.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/JapaneseTokenizer.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/JapaneseTokenizer.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/JoinKatakanaOovPlugin.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/JoinKatakanaOovPlugin.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/JoinNumericPlugin.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/JoinNumericPlugin.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/Lattice.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/Lattice.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/LatticeImpl.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/LatticeImpl.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/LatticeNode.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/LatticeNode.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/LatticeNodeImpl.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/LatticeNodeImpl.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/MMap.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/MMap.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/MeCabOovProviderPlugin.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/MeCabOovProviderPlugin.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/Morpheme.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/Morpheme.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/MorphemeFormatterPlugin.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/MorphemeFormatterPlugin.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/MorphemeImpl.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/MorphemeImpl.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/MorphemeList.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/MorphemeList.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/NumericParser.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/NumericParser.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/OovProviderPlugin.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/OovProviderPlugin.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/PartialPOS.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/PartialPOS.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/PathAnchor.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/PathAnchor.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/PathRewritePlugin.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/PathRewritePlugin.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/Plugin.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/Plugin.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/PosMatcher.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/PosMatcher.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/ProlongedSoundMarkInputTextPlugin.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/ProlongedSoundMarkInputTextPlugin.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/RegexOovProvider.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/RegexOovProvider.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/SentenceSplittingAnalysis.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/SentenceSplittingAnalysis.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/SentenceSplittingLazyAnalysis.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/SentenceSplittingLazyAnalysis.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/Settings.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/Settings.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/SimpleMorphemeFormatter.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/SimpleMorphemeFormatter.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/SimpleOovProviderPlugin.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/SimpleOovProviderPlugin.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/StringUtil.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/StringUtil.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/SudachiCommandLine.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/SudachiCommandLine.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/TextNormalizer.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/TextNormalizer.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/Tokenizer.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/Tokenizer.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/UTF8InputText.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/UTF8InputText.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/UTF8InputTextBuilder.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/UTF8InputTextBuilder.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/WordId.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/WordId.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/WordMask.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/WordMask.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/WordSegmentationFormatter.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/WordSegmentationFormatter.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/BinaryDictionary.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/BinaryDictionary.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/CSVParser.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/CSVParser.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/CategoryType.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/CategoryType.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/CharacterCategory.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/CharacterCategory.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/Connection.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/Connection.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/DictionaryAccess.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/DictionaryAccess.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/DictionaryBuilder.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/DictionaryBuilder.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/DictionaryHeader.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/DictionaryHeader.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/DictionaryHeaderPrinter.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/DictionaryHeaderPrinter.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/DictionaryPrinter.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/DictionaryPrinter.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/DictionaryVersion.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/DictionaryVersion.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/DoubleArrayLexicon.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/DoubleArrayLexicon.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/DoubleArrayLookup.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/DoubleArrayLookup.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/Grammar.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/Grammar.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/GrammarImpl.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/GrammarImpl.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/Lexicon.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/Lexicon.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/LexiconSet.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/LexiconSet.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/POS.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/POS.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/UserDictionaryBuilder.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/UserDictionaryBuilder.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/WordIdTable.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/WordIdTable.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/WordInfo.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/WordInfo.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/WordInfoList.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/WordInfoList.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/WordLookup.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/WordLookup.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/WordParameterList.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/WordParameterList.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/build/BuildStats.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/build/BuildStats.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/build/ConnectionMatrix.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/build/ConnectionMatrix.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/build/CsvLexicon.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/build/CsvLexicon.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/build/DicBuffer.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/build/DicBuffer.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/build/DicBuilder.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/build/DicBuilder.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/build/Index.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/build/Index.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/build/InputFileException.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/build/InputFileException.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/build/ModelOutput.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/build/ModelOutput.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/build/POSTable.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/build/POSTable.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/build/Parameters.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/build/Parameters.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/build/Progress.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/build/Progress.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/build/TrackingInputStream.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/build/TrackingInputStream.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/build/WordIdResolver.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/build/WordIdResolver.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/build/WordLookup.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/build/WordLookup.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/dictionary/build/WriteDictionary.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/dictionary/build/WriteDictionary.java -------------------------------------------------------------------------------- /src/main/java/com/worksap/nlp/sudachi/sentdetect/SentenceDetector.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/java/com/worksap/nlp/sudachi/sentdetect/SentenceDetector.java -------------------------------------------------------------------------------- /src/main/resources/char.def: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/resources/char.def -------------------------------------------------------------------------------- /src/main/resources/rewrite.def: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/resources/rewrite.def -------------------------------------------------------------------------------- /src/main/resources/sudachi.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/resources/sudachi.json -------------------------------------------------------------------------------- /src/main/resources/sudachi.logging.properties: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/resources/sudachi.logging.properties -------------------------------------------------------------------------------- /src/main/resources/unk.def: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/main/resources/unk.def -------------------------------------------------------------------------------- /src/test/dict/lex.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/dict/lex.csv -------------------------------------------------------------------------------- /src/test/dict/matrix.def: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/dict/matrix.def -------------------------------------------------------------------------------- /src/test/dict/user.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/dict/user.csv -------------------------------------------------------------------------------- /src/test/dict/user2.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/dict/user2.csv -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/ConfigTest.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/ConfigTest.kt -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/DefaultInputTextPluginTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/DefaultInputTextPluginTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/DictionaryFactoryTest.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/DictionaryFactoryTest.kt -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/IgnoreYomiganaPluginTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/IgnoreYomiganaPluginTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/InhibitConnectionPluginTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/InhibitConnectionPluginTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/JapaneseDictionaryTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/JapaneseDictionaryTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/JapaneseTokenizerMaskTest.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/JapaneseTokenizerMaskTest.kt -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/JapaneseTokenizerStreamingTest.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/JapaneseTokenizerStreamingTest.kt -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/JapaneseTokenizerTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/JapaneseTokenizerTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/JoinKatakanaOovPluginTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/JoinKatakanaOovPluginTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/JoinNumericPluginTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/JoinNumericPluginTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/MMapTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/MMapTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/MeCabOovProviderPluginTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/MeCabOovProviderPluginTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/MockGrammar.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/MockGrammar.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/MockInputText.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/MockInputText.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/MorphemeImplTest.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/MorphemeImplTest.kt -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/NumericParserTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/NumericParserTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/OovProviderPluginTest.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/OovProviderPluginTest.kt -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/PathAnchorTest.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/PathAnchorTest.kt -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/PosMatcherTest.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/PosMatcherTest.kt -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/ProlongedSoundMarkInputTextPluginTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/ProlongedSoundMarkInputTextPluginTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/RegexOovProviderTest.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/RegexOovProviderTest.kt -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/SettingsTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/SettingsTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/StringUtilTest.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/StringUtilTest.kt -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/SudachiCommandLineTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/SudachiCommandLineTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/TestDictionary.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/TestDictionary.kt -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/TestLoggingConfig.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/TestLoggingConfig.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/TextNormalizerTest.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/TextNormalizerTest.kt -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/UTF8InputTextTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/UTF8InputTextTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/UserDictionaryTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/UserDictionaryTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/Utils.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/Utils.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/WordIdTest.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/WordIdTest.kt -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/WordMaskTest.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/WordMaskTest.kt -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/dictionary/CSVParserTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/dictionary/CSVParserTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/dictionary/CharacterCategoryTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/dictionary/CharacterCategoryTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/dictionary/DictionaryBuilderTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/dictionary/DictionaryBuilderTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/dictionary/DictionaryHeaderPrinterTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/dictionary/DictionaryHeaderPrinterTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/dictionary/DictionaryHeaderTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/dictionary/DictionaryHeaderTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/dictionary/DictionaryPrinterTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/dictionary/DictionaryPrinterTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/dictionary/DictionaryReader.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/dictionary/DictionaryReader.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/dictionary/DoubleArrayLexiconTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/dictionary/DoubleArrayLexiconTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/dictionary/GrammarImplTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/dictionary/GrammarImplTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/dictionary/UserDictionaryBuilderTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/dictionary/UserDictionaryBuilderTest.java -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/dictionary/build/ConnectionMatrixTest.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/dictionary/build/ConnectionMatrixTest.kt -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/dictionary/build/CsvLexiconTest.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/dictionary/build/CsvLexiconTest.kt -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/dictionary/build/DicBufferTest.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/dictionary/build/DicBufferTest.kt -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/dictionary/build/GrammarTest.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/dictionary/build/GrammarTest.kt -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/dictionary/build/MemChannel.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/dictionary/build/MemChannel.kt -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/dictionary/build/ParametersTest.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/dictionary/build/ParametersTest.kt -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/dictionary/build/SystemDicTest.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/dictionary/build/SystemDicTest.kt -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/dictionary/build/UserDicTest.kt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/dictionary/build/UserDicTest.kt -------------------------------------------------------------------------------- /src/test/java/com/worksap/nlp/sudachi/sentdetect/SentenceDetectorTest.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/java/com/worksap/nlp/sudachi/sentdetect/SentenceDetectorTest.java -------------------------------------------------------------------------------- /src/test/resources/char.def: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/resources/char.def -------------------------------------------------------------------------------- /src/test/resources/com/worksap/nlp/sudachi/dictionary/build/one.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/resources/com/worksap/nlp/sudachi/dictionary/build/one.csv -------------------------------------------------------------------------------- /src/test/resources/com/worksap/nlp/sudachi/dictionary/build/sudachi_dic_build.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/resources/com/worksap/nlp/sudachi/dictionary/build/sudachi_dic_build.json -------------------------------------------------------------------------------- /src/test/resources/com/worksap/nlp/sudachi/dictionary/build/test.matrix: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/resources/com/worksap/nlp/sudachi/dictionary/build/test.matrix -------------------------------------------------------------------------------- /src/test/resources/dict/lex.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/resources/dict/lex.csv -------------------------------------------------------------------------------- /src/test/resources/dict/matrix.def: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/resources/dict/matrix.def -------------------------------------------------------------------------------- /src/test/resources/dict/user.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/resources/dict/user.csv -------------------------------------------------------------------------------- /src/test/resources/dict/user2.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/resources/dict/user2.csv -------------------------------------------------------------------------------- /src/test/resources/joinnumeric/char.def: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/resources/joinnumeric/char.def -------------------------------------------------------------------------------- /src/test/resources/logging.properties: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/resources/logging.properties -------------------------------------------------------------------------------- /src/test/resources/rewrite.def: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/resources/rewrite.def -------------------------------------------------------------------------------- /src/test/resources/rewrite_error_dup.def: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/resources/rewrite_error_dup.def -------------------------------------------------------------------------------- /src/test/resources/rewrite_error_ignorelist.def: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/resources/rewrite_error_ignorelist.def -------------------------------------------------------------------------------- /src/test/resources/rewrite_error_replacelist.def: -------------------------------------------------------------------------------- 1 | # there are three columns in replace list 2 | 12 21 31 3 | -------------------------------------------------------------------------------- /src/test/resources/sudachi.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/resources/sudachi.json -------------------------------------------------------------------------------- /src/test/resources/sudachi_minimum.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/WorksApplications/Sudachi/HEAD/src/test/resources/sudachi_minimum.json -------------------------------------------------------------------------------- /src/test/resources/sudachi_test_empty.json: -------------------------------------------------------------------------------- 1 | {} --------------------------------------------------------------------------------