├── .formatter.exs ├── .github └── workflows │ └── ci.yml ├── .gitignore ├── CHANGELOG.md ├── LICENSE.md ├── README.md ├── benchee ├── casing.exs ├── compare.exs └── next.exs ├── config └── config.exs ├── lib ├── tasks │ └── download_dictionaries.ex └── unicode │ ├── break.ex │ ├── case │ ├── folding.ex │ ├── greek_upper.ex │ └── mapping.ex │ ├── dictionary.ex │ ├── segment.ex │ ├── string.ex │ └── trie.ex ├── logo.png ├── mix.exs ├── mix.lock ├── mix └── myapp_backend.ex ├── priv ├── dictionaries │ └── .gitkeep └── segments │ ├── de.xml │ ├── el.xml │ ├── en.xml │ ├── en_US.xml │ ├── en_US_POSIX.xml │ ├── es.xml │ ├── fi.xml │ ├── fr.xml │ ├── it.xml │ ├── ja.xml │ ├── pt.xml │ ├── root.xml │ ├── ru.xml │ ├── sv.xml │ ├── zh.xml │ └── zh_Hant.xml ├── test ├── casing_test.exs ├── line_break_test.exs ├── segment_test.exs ├── sentence_break_test.exs ├── support │ ├── test_data │ │ ├── grapheme_break_test.txt │ │ ├── line_break_test.txt │ │ ├── sentence_break_test.txt │ │ └── word_break_test.txt │ └── test_data_parser.ex ├── test_helper.exs ├── unicode_string_test.exs └── word_break_test.exs ├── update_segment_data └── update_test_data /.formatter.exs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/.formatter.exs -------------------------------------------------------------------------------- /.github/workflows/ci.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/.github/workflows/ci.yml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/.gitignore -------------------------------------------------------------------------------- /CHANGELOG.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/CHANGELOG.md -------------------------------------------------------------------------------- /LICENSE.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/LICENSE.md -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/README.md -------------------------------------------------------------------------------- /benchee/casing.exs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/benchee/casing.exs -------------------------------------------------------------------------------- /benchee/compare.exs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/benchee/compare.exs -------------------------------------------------------------------------------- /benchee/next.exs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/benchee/next.exs -------------------------------------------------------------------------------- /config/config.exs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/config/config.exs -------------------------------------------------------------------------------- /lib/tasks/download_dictionaries.ex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/lib/tasks/download_dictionaries.ex -------------------------------------------------------------------------------- /lib/unicode/break.ex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/lib/unicode/break.ex -------------------------------------------------------------------------------- /lib/unicode/case/folding.ex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/lib/unicode/case/folding.ex -------------------------------------------------------------------------------- /lib/unicode/case/greek_upper.ex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/lib/unicode/case/greek_upper.ex -------------------------------------------------------------------------------- /lib/unicode/case/mapping.ex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/lib/unicode/case/mapping.ex -------------------------------------------------------------------------------- /lib/unicode/dictionary.ex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/lib/unicode/dictionary.ex -------------------------------------------------------------------------------- /lib/unicode/segment.ex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/lib/unicode/segment.ex -------------------------------------------------------------------------------- /lib/unicode/string.ex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/lib/unicode/string.ex -------------------------------------------------------------------------------- /lib/unicode/trie.ex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/lib/unicode/trie.ex -------------------------------------------------------------------------------- /logo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/logo.png -------------------------------------------------------------------------------- /mix.exs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/mix.exs -------------------------------------------------------------------------------- /mix.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/mix.lock -------------------------------------------------------------------------------- /mix/myapp_backend.ex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/mix/myapp_backend.ex -------------------------------------------------------------------------------- /priv/dictionaries/.gitkeep: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /priv/segments/de.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/priv/segments/de.xml -------------------------------------------------------------------------------- /priv/segments/el.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/priv/segments/el.xml -------------------------------------------------------------------------------- /priv/segments/en.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/priv/segments/en.xml -------------------------------------------------------------------------------- /priv/segments/en_US.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/priv/segments/en_US.xml -------------------------------------------------------------------------------- /priv/segments/en_US_POSIX.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/priv/segments/en_US_POSIX.xml -------------------------------------------------------------------------------- /priv/segments/es.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/priv/segments/es.xml -------------------------------------------------------------------------------- /priv/segments/fi.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/priv/segments/fi.xml -------------------------------------------------------------------------------- /priv/segments/fr.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/priv/segments/fr.xml -------------------------------------------------------------------------------- /priv/segments/it.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/priv/segments/it.xml -------------------------------------------------------------------------------- /priv/segments/ja.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/priv/segments/ja.xml -------------------------------------------------------------------------------- /priv/segments/pt.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/priv/segments/pt.xml -------------------------------------------------------------------------------- /priv/segments/root.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/priv/segments/root.xml -------------------------------------------------------------------------------- /priv/segments/ru.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/priv/segments/ru.xml -------------------------------------------------------------------------------- /priv/segments/sv.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/priv/segments/sv.xml -------------------------------------------------------------------------------- /priv/segments/zh.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/priv/segments/zh.xml -------------------------------------------------------------------------------- /priv/segments/zh_Hant.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/priv/segments/zh_Hant.xml -------------------------------------------------------------------------------- /test/casing_test.exs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/test/casing_test.exs -------------------------------------------------------------------------------- /test/line_break_test.exs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/test/line_break_test.exs -------------------------------------------------------------------------------- /test/segment_test.exs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/test/segment_test.exs -------------------------------------------------------------------------------- /test/sentence_break_test.exs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/test/sentence_break_test.exs -------------------------------------------------------------------------------- /test/support/test_data/grapheme_break_test.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/test/support/test_data/grapheme_break_test.txt -------------------------------------------------------------------------------- /test/support/test_data/line_break_test.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/test/support/test_data/line_break_test.txt -------------------------------------------------------------------------------- /test/support/test_data/sentence_break_test.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/test/support/test_data/sentence_break_test.txt -------------------------------------------------------------------------------- /test/support/test_data/word_break_test.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/test/support/test_data/word_break_test.txt -------------------------------------------------------------------------------- /test/support/test_data_parser.ex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/test/support/test_data_parser.ex -------------------------------------------------------------------------------- /test/test_helper.exs: -------------------------------------------------------------------------------- 1 | ExUnit.start() 2 | -------------------------------------------------------------------------------- /test/unicode_string_test.exs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/test/unicode_string_test.exs -------------------------------------------------------------------------------- /test/word_break_test.exs: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/test/word_break_test.exs -------------------------------------------------------------------------------- /update_segment_data: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/update_segment_data -------------------------------------------------------------------------------- /update_test_data: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/elixir-unicode/unicode_string/HEAD/update_test_data --------------------------------------------------------------------------------