├── .gitignore ├── .travis.yml ├── LICENSE.txt ├── Makefile ├── README.md ├── test_wcwidth.c ├── wcwidth.c └── wcwidth.h /.gitignore: -------------------------------------------------------------------------------- 1 | test_wcwidth 2 | -------------------------------------------------------------------------------- /.travis.yml: -------------------------------------------------------------------------------- 1 | sudo: false 2 | language: c 3 | compiler: 4 | - clang 5 | - gcc 6 | os: 7 | - linux 8 | - osx 9 | script: make test 10 | -------------------------------------------------------------------------------- /LICENSE.txt: -------------------------------------------------------------------------------- 1 | This project is licensed for use as follows: 2 | 3 | """ 4 | The MIT License (MIT) 5 | 6 | Copyright (c) 2016 Fredrik Fornwall 7 | 8 | Permission is hereby granted, free of charge, to any person obtaining a copy 9 | of this software and associated documentation files (the "Software"), to deal 10 | in the Software without restriction, including without limitation the rights 11 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 12 | copies of the Software, and to permit persons to whom the Software is 13 | furnished to do so, subject to the following conditions: 14 | 15 | The above copyright notice and this permission notice shall be included in all 16 | copies or substantial portions of the Software. 17 | 18 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 19 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 20 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 21 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 22 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 23 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 24 | SOFTWARE. 25 | """ 26 | 27 | This license applies to parts originating from the 28 | https://github.com/jquast/wcwidth repository: 29 | 30 | """ 31 | The MIT License (MIT) 32 | 33 | Copyright (c) 2014 Jeff Quast 34 | 35 | Permission is hereby granted, free of charge, to any person obtaining a copy 36 | of this software and associated documentation files (the "Software"), to deal 37 | in the Software without restriction, including without limitation the rights 38 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 39 | copies of the Software, and to permit persons to whom the Software is 40 | furnished to do so, subject to the following conditions: 41 | 42 | The above copyright notice and this permission notice shall be included in all 43 | copies or substantial portions of the Software. 44 | 45 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 46 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 47 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 48 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 49 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 50 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 51 | SOFTWARE. 52 | 53 | Markus Kuhn -- 2007-05-26 (Unicode 5.0) 54 | 55 | Permission to use, copy, modify, and distribute this software 56 | for any purpose and without fee is hereby granted. The author 57 | disclaims all warranties with regard to this software. 58 | """ 59 | -------------------------------------------------------------------------------- /Makefile: -------------------------------------------------------------------------------- 1 | CFLAGS = -O2 -Werror -Wall -Wextra -pedantic -std=c99 2 | 3 | test: test_wcwidth 4 | @./test_wcwidth 5 | 6 | test_wcwidth: test_wcwidth.c wcwidth.c wcwidth.h 7 | $(CC) $(CFLAGS) -o $@ test_wcwidth.c wcwidth.c 8 | 9 | clean: 10 | rm -f test_wcwidth 11 | 12 | .PHONY: clean test 13 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | A wcwidth implementation in C 2 | ============================= 3 | [![Travis build status](https://travis-ci.org/termux/wcwidth.svg?branch=master)](https://travis-ci.org/termux/wcwidth) 4 | 5 | A simple implementation of [wcwidth(3)](http://pubs.opengroup.org/onlinepubs/009695399/functions/wcwidth.html) 6 | in C as a port of [wcwidth.py](https://github.com/jquast/wcwidth/blob/master/wcwidth/wcwidth.py). 7 | 8 | Used in [Termux](https://termux.com) as part of the `libandroid-support.so` shared library. 9 | -------------------------------------------------------------------------------- /test_wcwidth.c: -------------------------------------------------------------------------------- 1 | #include 2 | #include 3 | #include 4 | 5 | #include "wcwidth.h" 6 | 7 | static int tests_run; 8 | static int test_failures; 9 | 10 | void assertWidthIs(int expected_width, wchar_t c) { 11 | tests_run++; 12 | int actual_width = wcwidth(c); 13 | if (actual_width != expected_width) { 14 | fprintf(stderr, "ERROR: wcwidth(U+%04x) returned %d, expected %d\n", c, actual_width, expected_width); 15 | test_failures++; 16 | } 17 | } 18 | 19 | int main() { 20 | assertWidthIs(1, 'a'); 21 | assertWidthIs(1, L'ö'); 22 | 23 | // Some wide: 24 | assertWidthIs(2, L'A'); 25 | assertWidthIs(2, L'B'); 26 | assertWidthIs(2, L'C'); 27 | assertWidthIs(2, L'中'); 28 | assertWidthIs(2, L'文'); 29 | assertWidthIs(2, 0x679C); 30 | assertWidthIs(2, 0x679D); 31 | assertWidthIs(2, 0x2070E); 32 | assertWidthIs(2, 0x20731); 33 | 34 | assertWidthIs(1, 0x11A3); 35 | 36 | assertWidthIs(2, 0x1F428); // Koala emoji. 37 | assertWidthIs(2, 0x231a); // Watch emoji. 38 | 39 | if (test_failures > 0) printf("%d tests FAILED, ", test_failures); 40 | printf("%d tests OK\n", tests_run); 41 | return (test_failures == 0) ? 0 : 1; 42 | } 43 | 44 | -------------------------------------------------------------------------------- /wcwidth.c: -------------------------------------------------------------------------------- 1 | /* 2 | * Copyright (C) Fredrik Fornwall 2016. 3 | * Distributed under the MIT License. 4 | * 5 | * Implementation of wcwidth(3) as a C port of: 6 | * https://github.com/jquast/wcwidth 7 | * 8 | * Report issues at: 9 | * https://github.com/termux/wcwidth 10 | * 11 | * IMPORTANT: 12 | * Must be kept in sync with the following: 13 | * https://github.com/termux/termux-app/blob/master/terminal-emulator/src/main/java/com/termux/terminal/WcWidth.java 14 | * https://github.com/termux/libandroid-support 15 | * https://github.com/termux/termux-packages/tree/master/packages/libandroid-support 16 | */ 17 | 18 | #include 19 | #include 20 | 21 | struct width_interval { 22 | int start; 23 | int end; 24 | }; 25 | 26 | // From https://github.com/jquast/wcwidth/blob/master/wcwidth/table_zero.py 27 | // from https://github.com/jquast/wcwidth/pull/64 28 | // at commit 1b9b6585b0080ea5cb88dc9815796505724793fe (2022-12-16): 29 | static struct width_interval ZERO_WIDTH[] = { 30 | {0x00300, 0x0036f}, // Combining Grave Accent ..Combining Latin Small Le 31 | {0x00483, 0x00489}, // Combining Cyrillic Titlo..Combining Cyrillic Milli 32 | {0x00591, 0x005bd}, // Hebrew Accent Etnahta ..Hebrew Point Meteg 33 | {0x005bf, 0x005bf}, // Hebrew Point Rafe ..Hebrew Point Rafe 34 | {0x005c1, 0x005c2}, // Hebrew Point Shin Dot ..Hebrew Point Sin Dot 35 | {0x005c4, 0x005c5}, // Hebrew Mark Upper Dot ..Hebrew Mark Lower Dot 36 | {0x005c7, 0x005c7}, // Hebrew Point Qamats Qata..Hebrew Point Qamats Qata 37 | {0x00610, 0x0061a}, // Arabic Sign Sallallahou ..Arabic Small Kasra 38 | {0x0064b, 0x0065f}, // Arabic Fathatan ..Arabic Wavy Hamza Below 39 | {0x00670, 0x00670}, // Arabic Letter Superscrip..Arabic Letter Superscrip 40 | {0x006d6, 0x006dc}, // Arabic Small High Ligatu..Arabic Small High Seen 41 | {0x006df, 0x006e4}, // Arabic Small High Rounde..Arabic Small High Madda 42 | {0x006e7, 0x006e8}, // Arabic Small High Yeh ..Arabic Small High Noon 43 | {0x006ea, 0x006ed}, // Arabic Empty Centre Low ..Arabic Small Low Meem 44 | {0x00711, 0x00711}, // Syriac Letter Superscrip..Syriac Letter Superscrip 45 | {0x00730, 0x0074a}, // Syriac Pthaha Above ..Syriac Barrekh 46 | {0x007a6, 0x007b0}, // Thaana Abafili ..Thaana Sukun 47 | {0x007eb, 0x007f3}, // Nko Combining Short High..Nko Combining Double Dot 48 | {0x007fd, 0x007fd}, // Nko Dantayalan ..Nko Dantayalan 49 | {0x00816, 0x00819}, // Samaritan Mark In ..Samaritan Mark Dagesh 50 | {0x0081b, 0x00823}, // Samaritan Mark Epentheti..Samaritan Vowel Sign A 51 | {0x00825, 0x00827}, // Samaritan Vowel Sign Sho..Samaritan Vowel Sign U 52 | {0x00829, 0x0082d}, // Samaritan Vowel Sign Lon..Samaritan Mark Nequdaa 53 | {0x00859, 0x0085b}, // Mandaic Affrication Mark..Mandaic Gemination Mark 54 | {0x00898, 0x0089f}, // Arabic Small High Word A..Arabic Half Madda Over M 55 | {0x008ca, 0x008e1}, // Arabic Small High Farsi ..Arabic Small High Sign S 56 | {0x008e3, 0x00902}, // Arabic Turned Damma Belo..Devanagari Sign Anusvara 57 | {0x0093a, 0x0093a}, // Devanagari Vowel Sign Oe..Devanagari Vowel Sign Oe 58 | {0x0093c, 0x0093c}, // Devanagari Sign Nukta ..Devanagari Sign Nukta 59 | {0x00941, 0x00948}, // Devanagari Vowel Sign U ..Devanagari Vowel Sign Ai 60 | {0x0094d, 0x0094d}, // Devanagari Sign Virama ..Devanagari Sign Virama 61 | {0x00951, 0x00957}, // Devanagari Stress Sign U..Devanagari Vowel Sign Uu 62 | {0x00962, 0x00963}, // Devanagari Vowel Sign Vo..Devanagari Vowel Sign Vo 63 | {0x00981, 0x00981}, // Bengali Sign Candrabindu..Bengali Sign Candrabindu 64 | {0x009bc, 0x009bc}, // Bengali Sign Nukta ..Bengali Sign Nukta 65 | {0x009c1, 0x009c4}, // Bengali Vowel Sign U ..Bengali Vowel Sign Vocal 66 | {0x009cd, 0x009cd}, // Bengali Sign Virama ..Bengali Sign Virama 67 | {0x009e2, 0x009e3}, // Bengali Vowel Sign Vocal..Bengali Vowel Sign Vocal 68 | {0x009fe, 0x009fe}, // Bengali Sandhi Mark ..Bengali Sandhi Mark 69 | {0x00a01, 0x00a02}, // Gurmukhi Sign Adak Bindi..Gurmukhi Sign Bindi 70 | {0x00a3c, 0x00a3c}, // Gurmukhi Sign Nukta ..Gurmukhi Sign Nukta 71 | {0x00a41, 0x00a42}, // Gurmukhi Vowel Sign U ..Gurmukhi Vowel Sign Uu 72 | {0x00a47, 0x00a48}, // Gurmukhi Vowel Sign Ee ..Gurmukhi Vowel Sign Ai 73 | {0x00a4b, 0x00a4d}, // Gurmukhi Vowel Sign Oo ..Gurmukhi Sign Virama 74 | {0x00a51, 0x00a51}, // Gurmukhi Sign Udaat ..Gurmukhi Sign Udaat 75 | {0x00a70, 0x00a71}, // Gurmukhi Tippi ..Gurmukhi Addak 76 | {0x00a75, 0x00a75}, // Gurmukhi Sign Yakash ..Gurmukhi Sign Yakash 77 | {0x00a81, 0x00a82}, // Gujarati Sign Candrabind..Gujarati Sign Anusvara 78 | {0x00abc, 0x00abc}, // Gujarati Sign Nukta ..Gujarati Sign Nukta 79 | {0x00ac1, 0x00ac5}, // Gujarati Vowel Sign U ..Gujarati Vowel Sign Cand 80 | {0x00ac7, 0x00ac8}, // Gujarati Vowel Sign E ..Gujarati Vowel Sign Ai 81 | {0x00acd, 0x00acd}, // Gujarati Sign Virama ..Gujarati Sign Virama 82 | {0x00ae2, 0x00ae3}, // Gujarati Vowel Sign Voca..Gujarati Vowel Sign Voca 83 | {0x00afa, 0x00aff}, // Gujarati Sign Sukun ..Gujarati Sign Two-circle 84 | {0x00b01, 0x00b01}, // Oriya Sign Candrabindu ..Oriya Sign Candrabindu 85 | {0x00b3c, 0x00b3c}, // Oriya Sign Nukta ..Oriya Sign Nukta 86 | {0x00b3f, 0x00b3f}, // Oriya Vowel Sign I ..Oriya Vowel Sign I 87 | {0x00b41, 0x00b44}, // Oriya Vowel Sign U ..Oriya Vowel Sign Vocalic 88 | {0x00b4d, 0x00b4d}, // Oriya Sign Virama ..Oriya Sign Virama 89 | {0x00b55, 0x00b56}, // Oriya Sign Overline ..Oriya Ai Length Mark 90 | {0x00b62, 0x00b63}, // Oriya Vowel Sign Vocalic..Oriya Vowel Sign Vocalic 91 | {0x00b82, 0x00b82}, // Tamil Sign Anusvara ..Tamil Sign Anusvara 92 | {0x00bc0, 0x00bc0}, // Tamil Vowel Sign Ii ..Tamil Vowel Sign Ii 93 | {0x00bcd, 0x00bcd}, // Tamil Sign Virama ..Tamil Sign Virama 94 | {0x00c00, 0x00c00}, // Telugu Sign Combining Ca..Telugu Sign Combining Ca 95 | {0x00c04, 0x00c04}, // Telugu Sign Combining An..Telugu Sign Combining An 96 | {0x00c3c, 0x00c3c}, // Telugu Sign Nukta ..Telugu Sign Nukta 97 | {0x00c3e, 0x00c40}, // Telugu Vowel Sign Aa ..Telugu Vowel Sign Ii 98 | {0x00c46, 0x00c48}, // Telugu Vowel Sign E ..Telugu Vowel Sign Ai 99 | {0x00c4a, 0x00c4d}, // Telugu Vowel Sign O ..Telugu Sign Virama 100 | {0x00c55, 0x00c56}, // Telugu Length Mark ..Telugu Ai Length Mark 101 | {0x00c62, 0x00c63}, // Telugu Vowel Sign Vocali..Telugu Vowel Sign Vocali 102 | {0x00c81, 0x00c81}, // Kannada Sign Candrabindu..Kannada Sign Candrabindu 103 | {0x00cbc, 0x00cbc}, // Kannada Sign Nukta ..Kannada Sign Nukta 104 | {0x00cbf, 0x00cbf}, // Kannada Vowel Sign I ..Kannada Vowel Sign I 105 | {0x00cc6, 0x00cc6}, // Kannada Vowel Sign E ..Kannada Vowel Sign E 106 | {0x00ccc, 0x00ccd}, // Kannada Vowel Sign Au ..Kannada Sign Virama 107 | {0x00ce2, 0x00ce3}, // Kannada Vowel Sign Vocal..Kannada Vowel Sign Vocal 108 | {0x00d00, 0x00d01}, // Malayalam Sign Combining..Malayalam Sign Candrabin 109 | {0x00d3b, 0x00d3c}, // Malayalam Sign Vertical ..Malayalam Sign Circular 110 | {0x00d41, 0x00d44}, // Malayalam Vowel Sign U ..Malayalam Vowel Sign Voc 111 | {0x00d4d, 0x00d4d}, // Malayalam Sign Virama ..Malayalam Sign Virama 112 | {0x00d62, 0x00d63}, // Malayalam Vowel Sign Voc..Malayalam Vowel Sign Voc 113 | {0x00d81, 0x00d81}, // Sinhala Sign Candrabindu..Sinhala Sign Candrabindu 114 | {0x00dca, 0x00dca}, // Sinhala Sign Al-lakuna ..Sinhala Sign Al-lakuna 115 | {0x00dd2, 0x00dd4}, // Sinhala Vowel Sign Ketti..Sinhala Vowel Sign Ketti 116 | {0x00dd6, 0x00dd6}, // Sinhala Vowel Sign Diga ..Sinhala Vowel Sign Diga 117 | {0x00e31, 0x00e31}, // Thai Character Mai Han-a..Thai Character Mai Han-a 118 | {0x00e34, 0x00e3a}, // Thai Character Sara I ..Thai Character Phinthu 119 | {0x00e47, 0x00e4e}, // Thai Character Maitaikhu..Thai Character Yamakkan 120 | {0x00eb1, 0x00eb1}, // Lao Vowel Sign Mai Kan ..Lao Vowel Sign Mai Kan 121 | {0x00eb4, 0x00ebc}, // Lao Vowel Sign I ..Lao Semivowel Sign Lo 122 | {0x00ec8, 0x00ece}, // Lao Tone Mai Ek ..(nil) 123 | {0x00f18, 0x00f19}, // Tibetan Astrological Sig..Tibetan Astrological Sig 124 | {0x00f35, 0x00f35}, // Tibetan Mark Ngas Bzung ..Tibetan Mark Ngas Bzung 125 | {0x00f37, 0x00f37}, // Tibetan Mark Ngas Bzung ..Tibetan Mark Ngas Bzung 126 | {0x00f39, 0x00f39}, // Tibetan Mark Tsa -phru ..Tibetan Mark Tsa -phru 127 | {0x00f71, 0x00f7e}, // Tibetan Vowel Sign Aa ..Tibetan Sign Rjes Su Nga 128 | {0x00f80, 0x00f84}, // Tibetan Vowel Sign Rever..Tibetan Mark Halanta 129 | {0x00f86, 0x00f87}, // Tibetan Sign Lci Rtags ..Tibetan Sign Yang Rtags 130 | {0x00f8d, 0x00f97}, // Tibetan Subjoined Sign L..Tibetan Subjoined Letter 131 | {0x00f99, 0x00fbc}, // Tibetan Subjoined Letter..Tibetan Subjoined Letter 132 | {0x00fc6, 0x00fc6}, // Tibetan Symbol Padma Gda..Tibetan Symbol Padma Gda 133 | {0x0102d, 0x01030}, // Myanmar Vowel Sign I ..Myanmar Vowel Sign Uu 134 | {0x01032, 0x01037}, // Myanmar Vowel Sign Ai ..Myanmar Sign Dot Below 135 | {0x01039, 0x0103a}, // Myanmar Sign Virama ..Myanmar Sign Asat 136 | {0x0103d, 0x0103e}, // Myanmar Consonant Sign M..Myanmar Consonant Sign M 137 | {0x01058, 0x01059}, // Myanmar Vowel Sign Vocal..Myanmar Vowel Sign Vocal 138 | {0x0105e, 0x01060}, // Myanmar Consonant Sign M..Myanmar Consonant Sign M 139 | {0x01071, 0x01074}, // Myanmar Vowel Sign Geba ..Myanmar Vowel Sign Kayah 140 | {0x01082, 0x01082}, // Myanmar Consonant Sign S..Myanmar Consonant Sign S 141 | {0x01085, 0x01086}, // Myanmar Vowel Sign Shan ..Myanmar Vowel Sign Shan 142 | {0x0108d, 0x0108d}, // Myanmar Sign Shan Counci..Myanmar Sign Shan Counci 143 | {0x0109d, 0x0109d}, // Myanmar Vowel Sign Aiton..Myanmar Vowel Sign Aiton 144 | {0x0135d, 0x0135f}, // Ethiopic Combining Gemin..Ethiopic Combining Gemin 145 | {0x01712, 0x01714}, // Tagalog Vowel Sign I ..Tagalog Sign Virama 146 | {0x01732, 0x01733}, // Hanunoo Vowel Sign I ..Hanunoo Vowel Sign U 147 | {0x01752, 0x01753}, // Buhid Vowel Sign I ..Buhid Vowel Sign U 148 | {0x01772, 0x01773}, // Tagbanwa Vowel Sign I ..Tagbanwa Vowel Sign U 149 | {0x017b4, 0x017b5}, // Khmer Vowel Inherent Aq ..Khmer Vowel Inherent Aa 150 | {0x017b7, 0x017bd}, // Khmer Vowel Sign I ..Khmer Vowel Sign Ua 151 | {0x017c6, 0x017c6}, // Khmer Sign Nikahit ..Khmer Sign Nikahit 152 | {0x017c9, 0x017d3}, // Khmer Sign Muusikatoan ..Khmer Sign Bathamasat 153 | {0x017dd, 0x017dd}, // Khmer Sign Atthacan ..Khmer Sign Atthacan 154 | {0x0180b, 0x0180d}, // Mongolian Free Variation..Mongolian Free Variation 155 | {0x0180f, 0x0180f}, // Mongolian Free Variation..Mongolian Free Variation 156 | {0x01885, 0x01886}, // Mongolian Letter Ali Gal..Mongolian Letter Ali Gal 157 | {0x018a9, 0x018a9}, // Mongolian Letter Ali Gal..Mongolian Letter Ali Gal 158 | {0x01920, 0x01922}, // Limbu Vowel Sign A ..Limbu Vowel Sign U 159 | {0x01927, 0x01928}, // Limbu Vowel Sign E ..Limbu Vowel Sign O 160 | {0x01932, 0x01932}, // Limbu Small Letter Anusv..Limbu Small Letter Anusv 161 | {0x01939, 0x0193b}, // Limbu Sign Mukphreng ..Limbu Sign Sa-i 162 | {0x01a17, 0x01a18}, // Buginese Vowel Sign I ..Buginese Vowel Sign U 163 | {0x01a1b, 0x01a1b}, // Buginese Vowel Sign Ae ..Buginese Vowel Sign Ae 164 | {0x01a56, 0x01a56}, // Tai Tham Consonant Sign ..Tai Tham Consonant Sign 165 | {0x01a58, 0x01a5e}, // Tai Tham Sign Mai Kang L..Tai Tham Consonant Sign 166 | {0x01a60, 0x01a60}, // Tai Tham Sign Sakot ..Tai Tham Sign Sakot 167 | {0x01a62, 0x01a62}, // Tai Tham Vowel Sign Mai ..Tai Tham Vowel Sign Mai 168 | {0x01a65, 0x01a6c}, // Tai Tham Vowel Sign I ..Tai Tham Vowel Sign Oa B 169 | {0x01a73, 0x01a7c}, // Tai Tham Vowel Sign Oa A..Tai Tham Sign Khuen-lue 170 | {0x01a7f, 0x01a7f}, // Tai Tham Combining Crypt..Tai Tham Combining Crypt 171 | {0x01ab0, 0x01ace}, // Combining Doubled Circum..Combining Latin Small Le 172 | {0x01b00, 0x01b03}, // Balinese Sign Ulu Ricem ..Balinese Sign Surang 173 | {0x01b34, 0x01b34}, // Balinese Sign Rerekan ..Balinese Sign Rerekan 174 | {0x01b36, 0x01b3a}, // Balinese Vowel Sign Ulu ..Balinese Vowel Sign Ra R 175 | {0x01b3c, 0x01b3c}, // Balinese Vowel Sign La L..Balinese Vowel Sign La L 176 | {0x01b42, 0x01b42}, // Balinese Vowel Sign Pepe..Balinese Vowel Sign Pepe 177 | {0x01b6b, 0x01b73}, // Balinese Musical Symbol ..Balinese Musical Symbol 178 | {0x01b80, 0x01b81}, // Sundanese Sign Panyecek ..Sundanese Sign Panglayar 179 | {0x01ba2, 0x01ba5}, // Sundanese Consonant Sign..Sundanese Vowel Sign Pan 180 | {0x01ba8, 0x01ba9}, // Sundanese Vowel Sign Pam..Sundanese Vowel Sign Pan 181 | {0x01bab, 0x01bad}, // Sundanese Sign Virama ..Sundanese Consonant Sign 182 | {0x01be6, 0x01be6}, // Batak Sign Tompi ..Batak Sign Tompi 183 | {0x01be8, 0x01be9}, // Batak Vowel Sign Pakpak ..Batak Vowel Sign Ee 184 | {0x01bed, 0x01bed}, // Batak Vowel Sign Karo O ..Batak Vowel Sign Karo O 185 | {0x01bef, 0x01bf1}, // Batak Vowel Sign U For S..Batak Consonant Sign H 186 | {0x01c2c, 0x01c33}, // Lepcha Vowel Sign E ..Lepcha Consonant Sign T 187 | {0x01c36, 0x01c37}, // Lepcha Sign Ran ..Lepcha Sign Nukta 188 | {0x01cd0, 0x01cd2}, // Vedic Tone Karshana ..Vedic Tone Prenkha 189 | {0x01cd4, 0x01ce0}, // Vedic Sign Yajurvedic Mi..Vedic Tone Rigvedic Kash 190 | {0x01ce2, 0x01ce8}, // Vedic Sign Visarga Svari..Vedic Sign Visarga Anuda 191 | {0x01ced, 0x01ced}, // Vedic Sign Tiryak ..Vedic Sign Tiryak 192 | {0x01cf4, 0x01cf4}, // Vedic Tone Candra Above ..Vedic Tone Candra Above 193 | {0x01cf8, 0x01cf9}, // Vedic Tone Ring Above ..Vedic Tone Double Ring A 194 | {0x01dc0, 0x01dff}, // Combining Dotted Grave A..Combining Right Arrowhea 195 | {0x020d0, 0x020f0}, // Combining Left Harpoon A..Combining Asterisk Above 196 | {0x02cef, 0x02cf1}, // Coptic Combining Ni Abov..Coptic Combining Spiritu 197 | {0x02d7f, 0x02d7f}, // Tifinagh Consonant Joine..Tifinagh Consonant Joine 198 | {0x02de0, 0x02dff}, // Combining Cyrillic Lette..Combining Cyrillic Lette 199 | {0x0302a, 0x0302d}, // Ideographic Level Tone M..Ideographic Entering Ton 200 | {0x03099, 0x0309a}, // Combining Katakana-hirag..Combining Katakana-hirag 201 | {0x0a66f, 0x0a672}, // Combining Cyrillic Vzmet..Combining Cyrillic Thous 202 | {0x0a674, 0x0a67d}, // Combining Cyrillic Lette..Combining Cyrillic Payer 203 | {0x0a69e, 0x0a69f}, // Combining Cyrillic Lette..Combining Cyrillic Lette 204 | {0x0a6f0, 0x0a6f1}, // Bamum Combining Mark Koq..Bamum Combining Mark Tuk 205 | {0x0a802, 0x0a802}, // Syloti Nagri Sign Dvisva..Syloti Nagri Sign Dvisva 206 | {0x0a806, 0x0a806}, // Syloti Nagri Sign Hasant..Syloti Nagri Sign Hasant 207 | {0x0a80b, 0x0a80b}, // Syloti Nagri Sign Anusva..Syloti Nagri Sign Anusva 208 | {0x0a825, 0x0a826}, // Syloti Nagri Vowel Sign ..Syloti Nagri Vowel Sign 209 | {0x0a82c, 0x0a82c}, // Syloti Nagri Sign Altern..Syloti Nagri Sign Altern 210 | {0x0a8c4, 0x0a8c5}, // Saurashtra Sign Virama ..Saurashtra Sign Candrabi 211 | {0x0a8e0, 0x0a8f1}, // Combining Devanagari Dig..Combining Devanagari Sig 212 | {0x0a8ff, 0x0a8ff}, // Devanagari Vowel Sign Ay..Devanagari Vowel Sign Ay 213 | {0x0a926, 0x0a92d}, // Kayah Li Vowel Ue ..Kayah Li Tone Calya Plop 214 | {0x0a947, 0x0a951}, // Rejang Vowel Sign I ..Rejang Consonant Sign R 215 | {0x0a980, 0x0a982}, // Javanese Sign Panyangga ..Javanese Sign Layar 216 | {0x0a9b3, 0x0a9b3}, // Javanese Sign Cecak Telu..Javanese Sign Cecak Telu 217 | {0x0a9b6, 0x0a9b9}, // Javanese Vowel Sign Wulu..Javanese Vowel Sign Suku 218 | {0x0a9bc, 0x0a9bd}, // Javanese Vowel Sign Pepe..Javanese Consonant Sign 219 | {0x0a9e5, 0x0a9e5}, // Myanmar Sign Shan Saw ..Myanmar Sign Shan Saw 220 | {0x0aa29, 0x0aa2e}, // Cham Vowel Sign Aa ..Cham Vowel Sign Oe 221 | {0x0aa31, 0x0aa32}, // Cham Vowel Sign Au ..Cham Vowel Sign Ue 222 | {0x0aa35, 0x0aa36}, // Cham Consonant Sign La ..Cham Consonant Sign Wa 223 | {0x0aa43, 0x0aa43}, // Cham Consonant Sign Fina..Cham Consonant Sign Fina 224 | {0x0aa4c, 0x0aa4c}, // Cham Consonant Sign Fina..Cham Consonant Sign Fina 225 | {0x0aa7c, 0x0aa7c}, // Myanmar Sign Tai Laing T..Myanmar Sign Tai Laing T 226 | {0x0aab0, 0x0aab0}, // Tai Viet Mai Kang ..Tai Viet Mai Kang 227 | {0x0aab2, 0x0aab4}, // Tai Viet Vowel I ..Tai Viet Vowel U 228 | {0x0aab7, 0x0aab8}, // Tai Viet Mai Khit ..Tai Viet Vowel Ia 229 | {0x0aabe, 0x0aabf}, // Tai Viet Vowel Am ..Tai Viet Tone Mai Ek 230 | {0x0aac1, 0x0aac1}, // Tai Viet Tone Mai Tho ..Tai Viet Tone Mai Tho 231 | {0x0aaec, 0x0aaed}, // Meetei Mayek Vowel Sign ..Meetei Mayek Vowel Sign 232 | {0x0aaf6, 0x0aaf6}, // Meetei Mayek Virama ..Meetei Mayek Virama 233 | {0x0abe5, 0x0abe5}, // Meetei Mayek Vowel Sign ..Meetei Mayek Vowel Sign 234 | {0x0abe8, 0x0abe8}, // Meetei Mayek Vowel Sign ..Meetei Mayek Vowel Sign 235 | {0x0abed, 0x0abed}, // Meetei Mayek Apun Iyek ..Meetei Mayek Apun Iyek 236 | {0x0fb1e, 0x0fb1e}, // Hebrew Point Judeo-spani..Hebrew Point Judeo-spani 237 | {0x0fe00, 0x0fe0f}, // Variation Selector-1 ..Variation Selector-16 238 | {0x0fe20, 0x0fe2f}, // Combining Ligature Left ..Combining Cyrillic Titlo 239 | {0x101fd, 0x101fd}, // Phaistos Disc Sign Combi..Phaistos Disc Sign Combi 240 | {0x102e0, 0x102e0}, // Coptic Epact Thousands M..Coptic Epact Thousands M 241 | {0x10376, 0x1037a}, // Combining Old Permic Let..Combining Old Permic Let 242 | {0x10a01, 0x10a03}, // Kharoshthi Vowel Sign I ..Kharoshthi Vowel Sign Vo 243 | {0x10a05, 0x10a06}, // Kharoshthi Vowel Sign E ..Kharoshthi Vowel Sign O 244 | {0x10a0c, 0x10a0f}, // Kharoshthi Vowel Length ..Kharoshthi Sign Visarga 245 | {0x10a38, 0x10a3a}, // Kharoshthi Sign Bar Abov..Kharoshthi Sign Dot Belo 246 | {0x10a3f, 0x10a3f}, // Kharoshthi Virama ..Kharoshthi Virama 247 | {0x10ae5, 0x10ae6}, // Manichaean Abbreviation ..Manichaean Abbreviation 248 | {0x10d24, 0x10d27}, // Hanifi Rohingya Sign Har..Hanifi Rohingya Sign Tas 249 | {0x10eab, 0x10eac}, // Yezidi Combining Hamza M..Yezidi Combining Madda M 250 | {0x10efd, 0x10eff}, // (nil) ..(nil) 251 | {0x10f46, 0x10f50}, // Sogdian Combining Dot Be..Sogdian Combining Stroke 252 | {0x10f82, 0x10f85}, // Old Uyghur Combining Dot..Old Uyghur Combining Two 253 | {0x11001, 0x11001}, // Brahmi Sign Anusvara ..Brahmi Sign Anusvara 254 | {0x11038, 0x11046}, // Brahmi Vowel Sign Aa ..Brahmi Virama 255 | {0x11070, 0x11070}, // Brahmi Sign Old Tamil Vi..Brahmi Sign Old Tamil Vi 256 | {0x11073, 0x11074}, // Brahmi Vowel Sign Old Ta..Brahmi Vowel Sign Old Ta 257 | {0x1107f, 0x11081}, // Brahmi Number Joiner ..Kaithi Sign Anusvara 258 | {0x110b3, 0x110b6}, // Kaithi Vowel Sign U ..Kaithi Vowel Sign Ai 259 | {0x110b9, 0x110ba}, // Kaithi Sign Virama ..Kaithi Sign Nukta 260 | {0x110c2, 0x110c2}, // Kaithi Vowel Sign Vocali..Kaithi Vowel Sign Vocali 261 | {0x11100, 0x11102}, // Chakma Sign Candrabindu ..Chakma Sign Visarga 262 | {0x11127, 0x1112b}, // Chakma Vowel Sign A ..Chakma Vowel Sign Uu 263 | {0x1112d, 0x11134}, // Chakma Vowel Sign Ai ..Chakma Maayyaa 264 | {0x11173, 0x11173}, // Mahajani Sign Nukta ..Mahajani Sign Nukta 265 | {0x11180, 0x11181}, // Sharada Sign Candrabindu..Sharada Sign Anusvara 266 | {0x111b6, 0x111be}, // Sharada Vowel Sign U ..Sharada Vowel Sign O 267 | {0x111c9, 0x111cc}, // Sharada Sandhi Mark ..Sharada Extra Short Vowe 268 | {0x111cf, 0x111cf}, // Sharada Sign Inverted Ca..Sharada Sign Inverted Ca 269 | {0x1122f, 0x11231}, // Khojki Vowel Sign U ..Khojki Vowel Sign Ai 270 | {0x11234, 0x11234}, // Khojki Sign Anusvara ..Khojki Sign Anusvara 271 | {0x11236, 0x11237}, // Khojki Sign Nukta ..Khojki Sign Shadda 272 | {0x1123e, 0x1123e}, // Khojki Sign Sukun ..Khojki Sign Sukun 273 | {0x11241, 0x11241}, // (nil) ..(nil) 274 | {0x112df, 0x112df}, // Khudawadi Sign Anusvara ..Khudawadi Sign Anusvara 275 | {0x112e3, 0x112ea}, // Khudawadi Vowel Sign U ..Khudawadi Sign Virama 276 | {0x11300, 0x11301}, // Grantha Sign Combining A..Grantha Sign Candrabindu 277 | {0x1133b, 0x1133c}, // Combining Bindu Below ..Grantha Sign Nukta 278 | {0x11340, 0x11340}, // Grantha Vowel Sign Ii ..Grantha Vowel Sign Ii 279 | {0x11366, 0x1136c}, // Combining Grantha Digit ..Combining Grantha Digit 280 | {0x11370, 0x11374}, // Combining Grantha Letter..Combining Grantha Letter 281 | {0x11438, 0x1143f}, // Newa Vowel Sign U ..Newa Vowel Sign Ai 282 | {0x11442, 0x11444}, // Newa Sign Virama ..Newa Sign Anusvara 283 | {0x11446, 0x11446}, // Newa Sign Nukta ..Newa Sign Nukta 284 | {0x1145e, 0x1145e}, // Newa Sandhi Mark ..Newa Sandhi Mark 285 | {0x114b3, 0x114b8}, // Tirhuta Vowel Sign U ..Tirhuta Vowel Sign Vocal 286 | {0x114ba, 0x114ba}, // Tirhuta Vowel Sign Short..Tirhuta Vowel Sign Short 287 | {0x114bf, 0x114c0}, // Tirhuta Sign Candrabindu..Tirhuta Sign Anusvara 288 | {0x114c2, 0x114c3}, // Tirhuta Sign Virama ..Tirhuta Sign Nukta 289 | {0x115b2, 0x115b5}, // Siddham Vowel Sign U ..Siddham Vowel Sign Vocal 290 | {0x115bc, 0x115bd}, // Siddham Sign Candrabindu..Siddham Sign Anusvara 291 | {0x115bf, 0x115c0}, // Siddham Sign Virama ..Siddham Sign Nukta 292 | {0x115dc, 0x115dd}, // Siddham Vowel Sign Alter..Siddham Vowel Sign Alter 293 | {0x11633, 0x1163a}, // Modi Vowel Sign U ..Modi Vowel Sign Ai 294 | {0x1163d, 0x1163d}, // Modi Sign Anusvara ..Modi Sign Anusvara 295 | {0x1163f, 0x11640}, // Modi Sign Virama ..Modi Sign Ardhacandra 296 | {0x116ab, 0x116ab}, // Takri Sign Anusvara ..Takri Sign Anusvara 297 | {0x116ad, 0x116ad}, // Takri Vowel Sign Aa ..Takri Vowel Sign Aa 298 | {0x116b0, 0x116b5}, // Takri Vowel Sign U ..Takri Vowel Sign Au 299 | {0x116b7, 0x116b7}, // Takri Sign Nukta ..Takri Sign Nukta 300 | {0x1171d, 0x1171f}, // Ahom Consonant Sign Medi..Ahom Consonant Sign Medi 301 | {0x11722, 0x11725}, // Ahom Vowel Sign I ..Ahom Vowel Sign Uu 302 | {0x11727, 0x1172b}, // Ahom Vowel Sign Aw ..Ahom Sign Killer 303 | {0x1182f, 0x11837}, // Dogra Vowel Sign U ..Dogra Sign Anusvara 304 | {0x11839, 0x1183a}, // Dogra Sign Virama ..Dogra Sign Nukta 305 | {0x1193b, 0x1193c}, // Dives Akuru Sign Anusvar..Dives Akuru Sign Candrab 306 | {0x1193e, 0x1193e}, // Dives Akuru Virama ..Dives Akuru Virama 307 | {0x11943, 0x11943}, // Dives Akuru Sign Nukta ..Dives Akuru Sign Nukta 308 | {0x119d4, 0x119d7}, // Nandinagari Vowel Sign U..Nandinagari Vowel Sign V 309 | {0x119da, 0x119db}, // Nandinagari Vowel Sign E..Nandinagari Vowel Sign A 310 | {0x119e0, 0x119e0}, // Nandinagari Sign Virama ..Nandinagari Sign Virama 311 | {0x11a01, 0x11a0a}, // Zanabazar Square Vowel S..Zanabazar Square Vowel L 312 | {0x11a33, 0x11a38}, // Zanabazar Square Final C..Zanabazar Square Sign An 313 | {0x11a3b, 0x11a3e}, // Zanabazar Square Cluster..Zanabazar Square Cluster 314 | {0x11a47, 0x11a47}, // Zanabazar Square Subjoin..Zanabazar Square Subjoin 315 | {0x11a51, 0x11a56}, // Soyombo Vowel Sign I ..Soyombo Vowel Sign Oe 316 | {0x11a59, 0x11a5b}, // Soyombo Vowel Sign Vocal..Soyombo Vowel Length Mar 317 | {0x11a8a, 0x11a96}, // Soyombo Final Consonant ..Soyombo Sign Anusvara 318 | {0x11a98, 0x11a99}, // Soyombo Gemination Mark ..Soyombo Subjoiner 319 | {0x11c30, 0x11c36}, // Bhaiksuki Vowel Sign I ..Bhaiksuki Vowel Sign Voc 320 | {0x11c38, 0x11c3d}, // Bhaiksuki Vowel Sign E ..Bhaiksuki Sign Anusvara 321 | {0x11c3f, 0x11c3f}, // Bhaiksuki Sign Virama ..Bhaiksuki Sign Virama 322 | {0x11c92, 0x11ca7}, // Marchen Subjoined Letter..Marchen Subjoined Letter 323 | {0x11caa, 0x11cb0}, // Marchen Subjoined Letter..Marchen Vowel Sign Aa 324 | {0x11cb2, 0x11cb3}, // Marchen Vowel Sign U ..Marchen Vowel Sign E 325 | {0x11cb5, 0x11cb6}, // Marchen Sign Anusvara ..Marchen Sign Candrabindu 326 | {0x11d31, 0x11d36}, // Masaram Gondi Vowel Sign..Masaram Gondi Vowel Sign 327 | {0x11d3a, 0x11d3a}, // Masaram Gondi Vowel Sign..Masaram Gondi Vowel Sign 328 | {0x11d3c, 0x11d3d}, // Masaram Gondi Vowel Sign..Masaram Gondi Vowel Sign 329 | {0x11d3f, 0x11d45}, // Masaram Gondi Vowel Sign..Masaram Gondi Virama 330 | {0x11d47, 0x11d47}, // Masaram Gondi Ra-kara ..Masaram Gondi Ra-kara 331 | {0x11d90, 0x11d91}, // Gunjala Gondi Vowel Sign..Gunjala Gondi Vowel Sign 332 | {0x11d95, 0x11d95}, // Gunjala Gondi Sign Anusv..Gunjala Gondi Sign Anusv 333 | {0x11d97, 0x11d97}, // Gunjala Gondi Virama ..Gunjala Gondi Virama 334 | {0x11ef3, 0x11ef4}, // Makasar Vowel Sign I ..Makasar Vowel Sign U 335 | {0x11f00, 0x11f01}, // (nil) ..(nil) 336 | {0x11f36, 0x11f3a}, // (nil) ..(nil) 337 | {0x11f40, 0x11f40}, // (nil) ..(nil) 338 | {0x11f42, 0x11f42}, // (nil) ..(nil) 339 | {0x13440, 0x13440}, // (nil) ..(nil) 340 | {0x13447, 0x13455}, // (nil) ..(nil) 341 | {0x16af0, 0x16af4}, // Bassa Vah Combining High..Bassa Vah Combining High 342 | {0x16b30, 0x16b36}, // Pahawh Hmong Mark Cim Tu..Pahawh Hmong Mark Cim Ta 343 | {0x16f4f, 0x16f4f}, // Miao Sign Consonant Modi..Miao Sign Consonant Modi 344 | {0x16f8f, 0x16f92}, // Miao Tone Right ..Miao Tone Below 345 | {0x16fe4, 0x16fe4}, // Khitan Small Script Fill..Khitan Small Script Fill 346 | {0x1bc9d, 0x1bc9e}, // Duployan Thick Letter Se..Duployan Double Mark 347 | {0x1cf00, 0x1cf2d}, // Znamenny Combining Mark ..Znamenny Combining Mark 348 | {0x1cf30, 0x1cf46}, // Znamenny Combining Tonal..Znamenny Priznak Modifie 349 | {0x1d167, 0x1d169}, // Musical Symbol Combining..Musical Symbol Combining 350 | {0x1d17b, 0x1d182}, // Musical Symbol Combining..Musical Symbol Combining 351 | {0x1d185, 0x1d18b}, // Musical Symbol Combining..Musical Symbol Combining 352 | {0x1d1aa, 0x1d1ad}, // Musical Symbol Combining..Musical Symbol Combining 353 | {0x1d242, 0x1d244}, // Combining Greek Musical ..Combining Greek Musical 354 | {0x1da00, 0x1da36}, // Signwriting Head Rim ..Signwriting Air Sucking 355 | {0x1da3b, 0x1da6c}, // Signwriting Mouth Closed..Signwriting Excitement 356 | {0x1da75, 0x1da75}, // Signwriting Upper Body T..Signwriting Upper Body T 357 | {0x1da84, 0x1da84}, // Signwriting Location Hea..Signwriting Location Hea 358 | {0x1da9b, 0x1da9f}, // Signwriting Fill Modifie..Signwriting Fill Modifie 359 | {0x1daa1, 0x1daaf}, // Signwriting Rotation Mod..Signwriting Rotation Mod 360 | {0x1e000, 0x1e006}, // Combining Glagolitic Let..Combining Glagolitic Let 361 | {0x1e008, 0x1e018}, // Combining Glagolitic Let..Combining Glagolitic Let 362 | {0x1e01b, 0x1e021}, // Combining Glagolitic Let..Combining Glagolitic Let 363 | {0x1e023, 0x1e024}, // Combining Glagolitic Let..Combining Glagolitic Let 364 | {0x1e026, 0x1e02a}, // Combining Glagolitic Let..Combining Glagolitic Let 365 | {0x1e08f, 0x1e08f}, // (nil) ..(nil) 366 | {0x1e130, 0x1e136}, // Nyiakeng Puachue Hmong T..Nyiakeng Puachue Hmong T 367 | {0x1e2ae, 0x1e2ae}, // Toto Sign Rising Tone ..Toto Sign Rising Tone 368 | {0x1e2ec, 0x1e2ef}, // Wancho Tone Tup ..Wancho Tone Koini 369 | {0x1e4ec, 0x1e4ef}, // (nil) ..(nil) 370 | {0x1e8d0, 0x1e8d6}, // Mende Kikakui Combining ..Mende Kikakui Combining 371 | {0x1e944, 0x1e94a}, // Adlam Alif Lengthener ..Adlam Nukta 372 | {0xe0100, 0xe01ef}, // Variation Selector-17 ..Variation Selector-256 373 | }; 374 | 375 | // https://github.com/jquast/wcwidth/blob/master/wcwidth/table_wide.py 376 | // from https://github.com/jquast/wcwidth/pull/64 377 | // at commit 1b9b6585b0080ea5cb88dc9815796505724793fe (2022-12-16): 378 | static struct width_interval WIDE_EASTASIAN[] = { 379 | {0x01100, 0x0115f}, // Hangul Choseong Kiyeok ..Hangul Choseong Filler 380 | {0x0231a, 0x0231b}, // Watch ..Hourglass 381 | {0x02329, 0x0232a}, // Left-pointing Angle Brac..Right-pointing Angle Bra 382 | {0x023e9, 0x023ec}, // Black Right-pointing Dou..Black Down-pointing Doub 383 | {0x023f0, 0x023f0}, // Alarm Clock ..Alarm Clock 384 | {0x023f3, 0x023f3}, // Hourglass With Flowing S..Hourglass With Flowing S 385 | {0x025fd, 0x025fe}, // White Medium Small Squar..Black Medium Small Squar 386 | {0x02614, 0x02615}, // Umbrella With Rain Drops..Hot Beverage 387 | {0x02648, 0x02653}, // Aries ..Pisces 388 | {0x0267f, 0x0267f}, // Wheelchair Symbol ..Wheelchair Symbol 389 | {0x02693, 0x02693}, // Anchor ..Anchor 390 | {0x026a1, 0x026a1}, // High Voltage Sign ..High Voltage Sign 391 | {0x026aa, 0x026ab}, // Medium White Circle ..Medium Black Circle 392 | {0x026bd, 0x026be}, // Soccer Ball ..Baseball 393 | {0x026c4, 0x026c5}, // Snowman Without Snow ..Sun Behind Cloud 394 | {0x026ce, 0x026ce}, // Ophiuchus ..Ophiuchus 395 | {0x026d4, 0x026d4}, // No Entry ..No Entry 396 | {0x026ea, 0x026ea}, // Church ..Church 397 | {0x026f2, 0x026f3}, // Fountain ..Flag In Hole 398 | {0x026f5, 0x026f5}, // Sailboat ..Sailboat 399 | {0x026fa, 0x026fa}, // Tent ..Tent 400 | {0x026fd, 0x026fd}, // Fuel Pump ..Fuel Pump 401 | {0x02705, 0x02705}, // White Heavy Check Mark ..White Heavy Check Mark 402 | {0x0270a, 0x0270b}, // Raised Fist ..Raised Hand 403 | {0x02728, 0x02728}, // Sparkles ..Sparkles 404 | {0x0274c, 0x0274c}, // Cross Mark ..Cross Mark 405 | {0x0274e, 0x0274e}, // Negative Squared Cross M..Negative Squared Cross M 406 | {0x02753, 0x02755}, // Black Question Mark Orna..White Exclamation Mark O 407 | {0x02757, 0x02757}, // Heavy Exclamation Mark S..Heavy Exclamation Mark S 408 | {0x02795, 0x02797}, // Heavy Plus Sign ..Heavy Division Sign 409 | {0x027b0, 0x027b0}, // Curly Loop ..Curly Loop 410 | {0x027bf, 0x027bf}, // Double Curly Loop ..Double Curly Loop 411 | {0x02b1b, 0x02b1c}, // Black Large Square ..White Large Square 412 | {0x02b50, 0x02b50}, // White Medium Star ..White Medium Star 413 | {0x02b55, 0x02b55}, // Heavy Large Circle ..Heavy Large Circle 414 | {0x02e80, 0x02e99}, // Cjk Radical Repeat ..Cjk Radical Rap 415 | {0x02e9b, 0x02ef3}, // Cjk Radical Choke ..Cjk Radical C-simplified 416 | {0x02f00, 0x02fd5}, // Kangxi Radical One ..Kangxi Radical Flute 417 | {0x02ff0, 0x02ffb}, // Ideographic Description ..Ideographic Description 418 | {0x03000, 0x0303e}, // Ideographic Space ..Ideographic Variation In 419 | {0x03041, 0x03096}, // Hiragana Letter Small A ..Hiragana Letter Small Ke 420 | {0x03099, 0x030ff}, // Combining Katakana-hirag..Katakana Digraph Koto 421 | {0x03105, 0x0312f}, // Bopomofo Letter B ..Bopomofo Letter Nn 422 | {0x03131, 0x0318e}, // Hangul Letter Kiyeok ..Hangul Letter Araeae 423 | {0x03190, 0x031e3}, // Ideographic Annotation L..Cjk Stroke Q 424 | {0x031f0, 0x0321e}, // Katakana Letter Small Ku..Parenthesized Korean Cha 425 | {0x03220, 0x03247}, // Parenthesized Ideograph ..Circled Ideograph Koto 426 | {0x03250, 0x04dbf}, // Partnership Sign ..Cjk Unified Ideograph-4d 427 | {0x04e00, 0x0a48c}, // Cjk Unified Ideograph-4e..Yi Syllable Yyr 428 | {0x0a490, 0x0a4c6}, // Yi Radical Qot ..Yi Radical Ke 429 | {0x0a960, 0x0a97c}, // Hangul Choseong Tikeut-m..Hangul Choseong Ssangyeo 430 | {0x0ac00, 0x0d7a3}, // Hangul Syllable Ga ..Hangul Syllable Hih 431 | {0x0f900, 0x0faff}, // Cjk Compatibility Ideogr..(nil) 432 | {0x0fe10, 0x0fe19}, // Presentation Form For Ve..Presentation Form For Ve 433 | {0x0fe30, 0x0fe52}, // Presentation Form For Ve..Small Full Stop 434 | {0x0fe54, 0x0fe66}, // Small Semicolon ..Small Equals Sign 435 | {0x0fe68, 0x0fe6b}, // Small Reverse Solidus ..Small Commercial At 436 | {0x0ff01, 0x0ff60}, // Fullwidth Exclamation Ma..Fullwidth Right White Pa 437 | {0x0ffe0, 0x0ffe6}, // Fullwidth Cent Sign ..Fullwidth Won Sign 438 | {0x16fe0, 0x16fe4}, // Tangut Iteration Mark ..Khitan Small Script Fill 439 | {0x16ff0, 0x16ff1}, // Vietnamese Alternate Rea..Vietnamese Alternate Rea 440 | {0x17000, 0x187f7}, // (nil) ..(nil) 441 | {0x18800, 0x18cd5}, // Tangut Component-001 ..Khitan Small Script Char 442 | {0x18d00, 0x18d08}, // (nil) ..(nil) 443 | {0x1aff0, 0x1aff3}, // Katakana Letter Minnan T..Katakana Letter Minnan T 444 | {0x1aff5, 0x1affb}, // Katakana Letter Minnan T..Katakana Letter Minnan N 445 | {0x1affd, 0x1affe}, // Katakana Letter Minnan N..Katakana Letter Minnan N 446 | {0x1b000, 0x1b122}, // Katakana Letter Archaic ..Katakana Letter Archaic 447 | {0x1b132, 0x1b132}, // (nil) ..(nil) 448 | {0x1b150, 0x1b152}, // Hiragana Letter Small Wi..Hiragana Letter Small Wo 449 | {0x1b155, 0x1b155}, // (nil) ..(nil) 450 | {0x1b164, 0x1b167}, // Katakana Letter Small Wi..Katakana Letter Small N 451 | {0x1b170, 0x1b2fb}, // Nushu Character-1b170 ..Nushu Character-1b2fb 452 | {0x1f004, 0x1f004}, // Mahjong Tile Red Dragon ..Mahjong Tile Red Dragon 453 | {0x1f0cf, 0x1f0cf}, // Playing Card Black Joker..Playing Card Black Joker 454 | {0x1f18e, 0x1f18e}, // Negative Squared Ab ..Negative Squared Ab 455 | {0x1f191, 0x1f19a}, // Squared Cl ..Squared Vs 456 | {0x1f200, 0x1f202}, // Square Hiragana Hoka ..Squared Katakana Sa 457 | {0x1f210, 0x1f23b}, // Squared Cjk Unified Ideo..Squared Cjk Unified Ideo 458 | {0x1f240, 0x1f248}, // Tortoise Shell Bracketed..Tortoise Shell Bracketed 459 | {0x1f250, 0x1f251}, // Circled Ideograph Advant..Circled Ideograph Accept 460 | {0x1f260, 0x1f265}, // Rounded Symbol For Fu ..Rounded Symbol For Cai 461 | {0x1f300, 0x1f320}, // Cyclone ..Shooting Star 462 | {0x1f32d, 0x1f335}, // Hot Dog ..Cactus 463 | {0x1f337, 0x1f37c}, // Tulip ..Baby Bottle 464 | {0x1f37e, 0x1f393}, // Bottle With Popping Cork..Graduation Cap 465 | {0x1f3a0, 0x1f3ca}, // Carousel Horse ..Swimmer 466 | {0x1f3cf, 0x1f3d3}, // Cricket Bat And Ball ..Table Tennis Paddle And 467 | {0x1f3e0, 0x1f3f0}, // House Building ..European Castle 468 | {0x1f3f4, 0x1f3f4}, // Waving Black Flag ..Waving Black Flag 469 | {0x1f3f8, 0x1f43e}, // Badminton Racquet And Sh..Paw Prints 470 | {0x1f440, 0x1f440}, // Eyes ..Eyes 471 | {0x1f442, 0x1f4fc}, // Ear ..Videocassette 472 | {0x1f4ff, 0x1f53d}, // Prayer Beads ..Down-pointing Small Red 473 | {0x1f54b, 0x1f54e}, // Kaaba ..Menorah With Nine Branch 474 | {0x1f550, 0x1f567}, // Clock Face One Oclock ..Clock Face Twelve-thirty 475 | {0x1f57a, 0x1f57a}, // Man Dancing ..Man Dancing 476 | {0x1f595, 0x1f596}, // Reversed Hand With Middl..Raised Hand With Part Be 477 | {0x1f5a4, 0x1f5a4}, // Black Heart ..Black Heart 478 | {0x1f5fb, 0x1f64f}, // Mount Fuji ..Person With Folded Hands 479 | {0x1f680, 0x1f6c5}, // Rocket ..Left Luggage 480 | {0x1f6cc, 0x1f6cc}, // Sleeping Accommodation ..Sleeping Accommodation 481 | {0x1f6d0, 0x1f6d2}, // Place Of Worship ..Shopping Trolley 482 | {0x1f6d5, 0x1f6d7}, // Hindu Temple ..Elevator 483 | {0x1f6dc, 0x1f6df}, // (nil) ..Ring Buoy 484 | {0x1f6eb, 0x1f6ec}, // Airplane Departure ..Airplane Arriving 485 | {0x1f6f4, 0x1f6fc}, // Scooter ..Roller Skate 486 | {0x1f7e0, 0x1f7eb}, // Large Orange Circle ..Large Brown Square 487 | {0x1f7f0, 0x1f7f0}, // Heavy Equals Sign ..Heavy Equals Sign 488 | {0x1f90c, 0x1f93a}, // Pinched Fingers ..Fencer 489 | {0x1f93c, 0x1f945}, // Wrestlers ..Goal Net 490 | {0x1f947, 0x1f9ff}, // First Place Medal ..Nazar Amulet 491 | {0x1fa70, 0x1fa7c}, // Ballet Shoes ..Crutch 492 | {0x1fa80, 0x1fa88}, // Yo-yo ..(nil) 493 | {0x1fa90, 0x1fabd}, // Ringed Planet ..(nil) 494 | {0x1fabf, 0x1fac5}, // (nil) ..Person With Crown 495 | {0x1face, 0x1fadb}, // (nil) ..(nil) 496 | {0x1fae0, 0x1fae8}, // Melting Face ..(nil) 497 | {0x1faf0, 0x1faf8}, // Hand With Index Finger A..(nil) 498 | {0x20000, 0x2fffd}, // Cjk Unified Ideograph-20..(nil) 499 | {0x30000, 0x3fffd}, // Cjk Unified Ideograph-30..(nil) 500 | }; 501 | 502 | static bool intable(struct width_interval* table, int table_length, int c) { 503 | // First quick check for Latin1 etc. characters. 504 | if (c < table[0].start) return false; 505 | 506 | // Binary search in table. 507 | int bot = 0; 508 | int top = table_length - 1; 509 | while (top >= bot) { 510 | int mid = (bot + top) / 2; 511 | if (table[mid].end < c) { 512 | bot = mid + 1; 513 | } else if (table[mid].start > c) { 514 | top = mid - 1; 515 | } else { 516 | return true; 517 | } 518 | } 519 | return false; 520 | } 521 | 522 | int wcwidth(wchar_t ucs) { 523 | // NOTE: created by hand, there isn't anything identifiable other than 524 | // general Cf category code to identify these, and some characters in Cf 525 | // category code are of non-zero width. 526 | if (ucs == 0 || 527 | ucs == 0x034F || 528 | (0x200B <= ucs && ucs <= 0x200F) || 529 | ucs == 0x2028 || 530 | ucs == 0x2029 || 531 | (0x202A <= ucs && ucs <= 0x202E) || 532 | (0x2060 <= ucs && ucs <= 0x2063)) { 533 | return 0; 534 | } 535 | 536 | // C0/C1 control characters. 537 | if (ucs < 32 || (0x07F <= ucs && ucs < 0x0A0)) return -1; 538 | 539 | // Combining characters with zero width. 540 | if (intable(ZERO_WIDTH, sizeof(ZERO_WIDTH)/sizeof(struct width_interval), ucs)) return 0; 541 | 542 | return intable(WIDE_EASTASIAN, sizeof(WIDE_EASTASIAN)/sizeof(struct width_interval), ucs) ? 2 : 1; 543 | } 544 | -------------------------------------------------------------------------------- /wcwidth.h: -------------------------------------------------------------------------------- 1 | #ifndef WCWIDTH_H_INCLUDED 2 | #define WCWIDTH_H_INCLUDED 3 | 4 | #include 5 | 6 | __BEGIN_DECLS 7 | 8 | int wcwidth(wchar_t ucs); 9 | 10 | __END_DECLS 11 | 12 | #endif 13 | --------------------------------------------------------------------------------