├── .github ├── dependabot.yml └── workflows │ ├── ci.yml │ └── release.yml ├── CHANGELOG.md ├── LICENSE ├── README.md ├── default.nix ├── dev ├── .gitignore ├── Cargo.lock ├── Cargo.toml ├── flake.lock ├── flake.nix ├── rustfmt.toml ├── src │ └── main.rs └── tests │ ├── _snapshots │ ├── ascii │ ├── basic │ └── length │ ├── ascii │ └── expr.nix │ ├── basic │ └── expr.nix │ └── length │ └── expr.nix ├── flake.nix ├── namaka.toml └── table.nix /.github/dependabot.yml: -------------------------------------------------------------------------------- 1 | version: 2 2 | 3 | updates: 4 | - package-ecosystem: github-actions 5 | directory: / 6 | schedule: 7 | interval: daily 8 | -------------------------------------------------------------------------------- /.github/workflows/ci.yml: -------------------------------------------------------------------------------- 1 | name: ci 2 | 3 | on: 4 | push: 5 | branches: 6 | - main 7 | pull_request: 8 | 9 | jobs: 10 | check: 11 | name: check 12 | runs-on: ubuntu-latest 13 | steps: 14 | - name: Checkout 15 | uses: actions/checkout@v4 16 | 17 | - name: Install nix 18 | uses: cachix/install-nix-action@v25 19 | 20 | - name: Run checks 21 | run: nix flake check ./dev 22 | -------------------------------------------------------------------------------- /.github/workflows/release.yml: -------------------------------------------------------------------------------- 1 | name: release 2 | 3 | on: 4 | push: 5 | tags: 6 | - v[0-9]+.[0-9]+.[0-9]+ 7 | workflow_dispatch: 8 | inputs: 9 | tag: 10 | description: The existing tag to publish to FlakeHub 11 | type: string 12 | required: true 13 | 14 | jobs: 15 | release: 16 | runs-on: ubuntu-latest 17 | if: github.event_name != 'workflow_dispatch' 18 | steps: 19 | - uses: softprops/action-gh-release@v1 20 | with: 21 | body: "[CHANGELOG.md](https://github.com/figsoda/utf8/blob/main/CHANGELOG.md)" 22 | 23 | flakehub: 24 | runs-on: ubuntu-latest 25 | permissions: 26 | id-token: write 27 | contents: read 28 
| steps: 29 | - uses: actions/checkout@v4 30 | with: 31 | ref: ${{ inputs.tag != null && format('refs/tags/{0}', inputs.tag) || '' }} 32 | - uses: DeterminateSystems/nix-installer-action@v9 33 | - uses: DeterminateSystems/flakehub-push@v3 34 | with: 35 | visibility: public 36 | tag: ${{ inputs.tag }} 37 | -------------------------------------------------------------------------------- /CHANGELOG.md: -------------------------------------------------------------------------------- 1 | # Changelog 2 | 3 | ## v0.1.0 - 2023-05-28 4 | 5 | First release 6 | -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | Mozilla Public License Version 2.0 2 | ================================== 3 | 4 | 1. Definitions 5 | -------------- 6 | 7 | 1.1. "Contributor" 8 | means each individual or legal entity that creates, contributes to 9 | the creation of, or owns Covered Software. 10 | 11 | 1.2. "Contributor Version" 12 | means the combination of the Contributions of others (if any) used 13 | by a Contributor and that particular Contributor's Contribution. 14 | 15 | 1.3. "Contribution" 16 | means Covered Software of a particular Contributor. 17 | 18 | 1.4. "Covered Software" 19 | means Source Code Form to which the initial Contributor has attached 20 | the notice in Exhibit A, the Executable Form of such Source Code 21 | Form, and Modifications of such Source Code Form, in each case 22 | including portions thereof. 23 | 24 | 1.5. "Incompatible With Secondary Licenses" 25 | means 26 | 27 | (a) that the initial Contributor has attached the notice described 28 | in Exhibit B to the Covered Software; or 29 | 30 | (b) that the Covered Software was made available under the terms of 31 | version 1.1 or earlier of the License, but not also under the 32 | terms of a Secondary License. 33 | 34 | 1.6. 
"Executable Form" 35 | means any form of the work other than Source Code Form. 36 | 37 | 1.7. "Larger Work" 38 | means a work that combines Covered Software with other material, in 39 | a separate file or files, that is not Covered Software. 40 | 41 | 1.8. "License" 42 | means this document. 43 | 44 | 1.9. "Licensable" 45 | means having the right to grant, to the maximum extent possible, 46 | whether at the time of the initial grant or subsequently, any and 47 | all of the rights conveyed by this License. 48 | 49 | 1.10. "Modifications" 50 | means any of the following: 51 | 52 | (a) any file in Source Code Form that results from an addition to, 53 | deletion from, or modification of the contents of Covered 54 | Software; or 55 | 56 | (b) any new file in Source Code Form that contains any Covered 57 | Software. 58 | 59 | 1.11. "Patent Claims" of a Contributor 60 | means any patent claim(s), including without limitation, method, 61 | process, and apparatus claims, in any patent Licensable by such 62 | Contributor that would be infringed, but for the grant of the 63 | License, by the making, using, selling, offering for sale, having 64 | made, import, or transfer of either its Contributions or its 65 | Contributor Version. 66 | 67 | 1.12. "Secondary License" 68 | means either the GNU General Public License, Version 2.0, the GNU 69 | Lesser General Public License, Version 2.1, the GNU Affero General 70 | Public License, Version 3.0, or any later versions of those 71 | licenses. 72 | 73 | 1.13. "Source Code Form" 74 | means the form of the work preferred for making modifications. 75 | 76 | 1.14. "You" (or "Your") 77 | means an individual or a legal entity exercising rights under this 78 | License. For legal entities, "You" includes any entity that 79 | controls, is controlled by, or is under common control with You. 
For 80 | purposes of this definition, "control" means (a) the power, direct 81 | or indirect, to cause the direction or management of such entity, 82 | whether by contract or otherwise, or (b) ownership of more than 83 | fifty percent (50%) of the outstanding shares or beneficial 84 | ownership of such entity. 85 | 86 | 2. License Grants and Conditions 87 | -------------------------------- 88 | 89 | 2.1. Grants 90 | 91 | Each Contributor hereby grants You a world-wide, royalty-free, 92 | non-exclusive license: 93 | 94 | (a) under intellectual property rights (other than patent or trademark) 95 | Licensable by such Contributor to use, reproduce, make available, 96 | modify, display, perform, distribute, and otherwise exploit its 97 | Contributions, either on an unmodified basis, with Modifications, or 98 | as part of a Larger Work; and 99 | 100 | (b) under Patent Claims of such Contributor to make, use, sell, offer 101 | for sale, have made, import, and otherwise transfer either its 102 | Contributions or its Contributor Version. 103 | 104 | 2.2. Effective Date 105 | 106 | The licenses granted in Section 2.1 with respect to any Contribution 107 | become effective for each Contribution on the date the Contributor first 108 | distributes such Contribution. 109 | 110 | 2.3. Limitations on Grant Scope 111 | 112 | The licenses granted in this Section 2 are the only rights granted under 113 | this License. No additional rights or licenses will be implied from the 114 | distribution or licensing of Covered Software under this License. 
115 | Notwithstanding Section 2.1(b) above, no patent license is granted by a 116 | Contributor: 117 | 118 | (a) for any code that a Contributor has removed from Covered Software; 119 | or 120 | 121 | (b) for infringements caused by: (i) Your and any other third party's 122 | modifications of Covered Software, or (ii) the combination of its 123 | Contributions with other software (except as part of its Contributor 124 | Version); or 125 | 126 | (c) under Patent Claims infringed by Covered Software in the absence of 127 | its Contributions. 128 | 129 | This License does not grant any rights in the trademarks, service marks, 130 | or logos of any Contributor (except as may be necessary to comply with 131 | the notice requirements in Section 3.4). 132 | 133 | 2.4. Subsequent Licenses 134 | 135 | No Contributor makes additional grants as a result of Your choice to 136 | distribute the Covered Software under a subsequent version of this 137 | License (see Section 10.2) or under the terms of a Secondary License (if 138 | permitted under the terms of Section 3.3). 139 | 140 | 2.5. Representation 141 | 142 | Each Contributor represents that the Contributor believes its 143 | Contributions are its original creation(s) or it has sufficient rights 144 | to grant the rights to its Contributions conveyed by this License. 145 | 146 | 2.6. Fair Use 147 | 148 | This License is not intended to limit any rights You have under 149 | applicable copyright doctrines of fair use, fair dealing, or other 150 | equivalents. 151 | 152 | 2.7. Conditions 153 | 154 | Sections 3.1, 3.2, 3.3, and 3.4 are conditions of the licenses granted 155 | in Section 2.1. 156 | 157 | 3. Responsibilities 158 | ------------------- 159 | 160 | 3.1. Distribution of Source Form 161 | 162 | All distribution of Covered Software in Source Code Form, including any 163 | Modifications that You create or to which You contribute, must be under 164 | the terms of this License. 
You must inform recipients that the Source 165 | Code Form of the Covered Software is governed by the terms of this 166 | License, and how they can obtain a copy of this License. You may not 167 | attempt to alter or restrict the recipients' rights in the Source Code 168 | Form. 169 | 170 | 3.2. Distribution of Executable Form 171 | 172 | If You distribute Covered Software in Executable Form then: 173 | 174 | (a) such Covered Software must also be made available in Source Code 175 | Form, as described in Section 3.1, and You must inform recipients of 176 | the Executable Form how they can obtain a copy of such Source Code 177 | Form by reasonable means in a timely manner, at a charge no more 178 | than the cost of distribution to the recipient; and 179 | 180 | (b) You may distribute such Executable Form under the terms of this 181 | License, or sublicense it under different terms, provided that the 182 | license for the Executable Form does not attempt to limit or alter 183 | the recipients' rights in the Source Code Form under this License. 184 | 185 | 3.3. Distribution of a Larger Work 186 | 187 | You may create and distribute a Larger Work under terms of Your choice, 188 | provided that You also comply with the requirements of this License for 189 | the Covered Software. If the Larger Work is a combination of Covered 190 | Software with a work governed by one or more Secondary Licenses, and the 191 | Covered Software is not Incompatible With Secondary Licenses, this 192 | License permits You to additionally distribute such Covered Software 193 | under the terms of such Secondary License(s), so that the recipient of 194 | the Larger Work may, at their option, further distribute the Covered 195 | Software under the terms of either this License or such Secondary 196 | License(s). 197 | 198 | 3.4. 
Notices 199 | 200 | You may not remove or alter the substance of any license notices 201 | (including copyright notices, patent notices, disclaimers of warranty, 202 | or limitations of liability) contained within the Source Code Form of 203 | the Covered Software, except that You may alter any license notices to 204 | the extent required to remedy known factual inaccuracies. 205 | 206 | 3.5. Application of Additional Terms 207 | 208 | You may choose to offer, and to charge a fee for, warranty, support, 209 | indemnity or liability obligations to one or more recipients of Covered 210 | Software. However, You may do so only on Your own behalf, and not on 211 | behalf of any Contributor. You must make it absolutely clear that any 212 | such warranty, support, indemnity, or liability obligation is offered by 213 | You alone, and You hereby agree to indemnify every Contributor for any 214 | liability incurred by such Contributor as a result of warranty, support, 215 | indemnity or liability terms You offer. You may include additional 216 | disclaimers of warranty and limitations of liability specific to any 217 | jurisdiction. 218 | 219 | 4. Inability to Comply Due to Statute or Regulation 220 | --------------------------------------------------- 221 | 222 | If it is impossible for You to comply with any of the terms of this 223 | License with respect to some or all of the Covered Software due to 224 | statute, judicial order, or regulation then You must: (a) comply with 225 | the terms of this License to the maximum extent possible; and (b) 226 | describe the limitations and the code they affect. Such description must 227 | be placed in a text file included with all distributions of the Covered 228 | Software under this License. Except to the extent prohibited by statute 229 | or regulation, such description must be sufficiently detailed for a 230 | recipient of ordinary skill to be able to understand it. 231 | 232 | 5. 
Termination 233 | -------------- 234 | 235 | 5.1. The rights granted under this License will terminate automatically 236 | if You fail to comply with any of its terms. However, if You become 237 | compliant, then the rights granted under this License from a particular 238 | Contributor are reinstated (a) provisionally, unless and until such 239 | Contributor explicitly and finally terminates Your grants, and (b) on an 240 | ongoing basis, if such Contributor fails to notify You of the 241 | non-compliance by some reasonable means prior to 60 days after You have 242 | come back into compliance. Moreover, Your grants from a particular 243 | Contributor are reinstated on an ongoing basis if such Contributor 244 | notifies You of the non-compliance by some reasonable means, this is the 245 | first time You have received notice of non-compliance with this License 246 | from such Contributor, and You become compliant prior to 30 days after 247 | Your receipt of the notice. 248 | 249 | 5.2. If You initiate litigation against any entity by asserting a patent 250 | infringement claim (excluding declaratory judgment actions, 251 | counter-claims, and cross-claims) alleging that a Contributor Version 252 | directly or indirectly infringes any patent, then the rights granted to 253 | You by any and all Contributors for the Covered Software under Section 254 | 2.1 of this License shall terminate. 255 | 256 | 5.3. In the event of termination under Sections 5.1 or 5.2 above, all 257 | end user license agreements (excluding distributors and resellers) which 258 | have been validly granted by You or Your distributors under this License 259 | prior to termination shall survive termination. 260 | 261 | ************************************************************************ 262 | * * 263 | * 6. 
Disclaimer of Warranty * 264 | * ------------------------- * 265 | * * 266 | * Covered Software is provided under this License on an "as is" * 267 | * basis, without warranty of any kind, either expressed, implied, or * 268 | * statutory, including, without limitation, warranties that the * 269 | * Covered Software is free of defects, merchantable, fit for a * 270 | * particular purpose or non-infringing. The entire risk as to the * 271 | * quality and performance of the Covered Software is with You. * 272 | * Should any Covered Software prove defective in any respect, You * 273 | * (not any Contributor) assume the cost of any necessary servicing, * 274 | * repair, or correction. This disclaimer of warranty constitutes an * 275 | * essential part of this License. No use of any Covered Software is * 276 | * authorized under this License except under this disclaimer. * 277 | * * 278 | ************************************************************************ 279 | 280 | ************************************************************************ 281 | * * 282 | * 7. Limitation of Liability * 283 | * -------------------------- * 284 | * * 285 | * Under no circumstances and under no legal theory, whether tort * 286 | * (including negligence), contract, or otherwise, shall any * 287 | * Contributor, or anyone who distributes Covered Software as * 288 | * permitted above, be liable to You for any direct, indirect, * 289 | * special, incidental, or consequential damages of any character * 290 | * including, without limitation, damages for lost profits, loss of * 291 | * goodwill, work stoppage, computer failure or malfunction, or any * 292 | * and all other commercial damages or losses, even if such party * 293 | * shall have been informed of the possibility of such damages. 
This * 294 | * limitation of liability shall not apply to liability for death or * 295 | * personal injury resulting from such party's negligence to the * 296 | * extent applicable law prohibits such limitation. Some * 297 | * jurisdictions do not allow the exclusion or limitation of * 298 | * incidental or consequential damages, so this exclusion and * 299 | * limitation may not apply to You. * 300 | * * 301 | ************************************************************************ 302 | 303 | 8. Litigation 304 | ------------- 305 | 306 | Any litigation relating to this License may be brought only in the 307 | courts of a jurisdiction where the defendant maintains its principal 308 | place of business and such litigation shall be governed by laws of that 309 | jurisdiction, without reference to its conflict-of-law provisions. 310 | Nothing in this Section shall prevent a party's ability to bring 311 | cross-claims or counter-claims. 312 | 313 | 9. Miscellaneous 314 | ---------------- 315 | 316 | This License represents the complete agreement concerning the subject 317 | matter hereof. If any provision of this License is held to be 318 | unenforceable, such provision shall be reformed only to the extent 319 | necessary to make it enforceable. Any law or regulation which provides 320 | that the language of a contract shall be construed against the drafter 321 | shall not be used to construe this License against a Contributor. 322 | 323 | 10. Versions of the License 324 | --------------------------- 325 | 326 | 10.1. New Versions 327 | 328 | Mozilla Foundation is the license steward. Except as provided in Section 329 | 10.3, no one other than the license steward has the right to modify or 330 | publish new versions of this License. Each version will be given a 331 | distinguishing version number. 332 | 333 | 10.2. 
Effect of New Versions 334 | 335 | You may distribute the Covered Software under the terms of the version 336 | of the License under which You originally received the Covered Software, 337 | or under the terms of any subsequent version published by the license 338 | steward. 339 | 340 | 10.3. Modified Versions 341 | 342 | If you create software not governed by this License, and you want to 343 | create a new license for such software, you may create and use a 344 | modified version of this License if you rename the license and remove 345 | any references to the name of the license steward (except to note that 346 | such modified license differs from this License). 347 | 348 | 10.4. Distributing Source Code Form that is Incompatible With Secondary 349 | Licenses 350 | 351 | If You choose to distribute Source Code Form that is Incompatible With 352 | Secondary Licenses under the terms of this version of the License, the 353 | notice described in Exhibit B of this License must be attached. 354 | 355 | Exhibit A - Source Code Form License Notice 356 | ------------------------------------------- 357 | 358 | This Source Code Form is subject to the terms of the Mozilla Public 359 | License, v. 2.0. If a copy of the MPL was not distributed with this 360 | file, You can obtain one at http://mozilla.org/MPL/2.0/. 361 | 362 | If it is not possible or desirable to put the notice in a particular 363 | file, then You may include the notice in a location (such as a LICENSE 364 | file in a relevant directory) where a recipient would be likely to look 365 | for such a notice. 366 | 367 | You may add additional accurate notices of copyright ownership. 368 | 369 | Exhibit B - "Incompatible With Secondary Licenses" Notice 370 | --------------------------------------------------------- 371 | 372 | This Source Code Form is "Incompatible With Secondary Licenses", as 373 | defined by the Mozilla Public License, v. 2.0. 
374 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | # utf8 2 | 3 | UTF-8 support for Nix 4 | 5 | ## Why 6 | 7 | Strings in Nix are byte strings, and builtin functions like `substring` 8 | (and by extension some `lib` functions in [nixpkgs](https://github.com/nixos/nixpkgs)) 9 | process bytes instead of UTF-8 code points. 10 | That means these functions can create invalid strings when given strings containing multi-byte UTF-8 characters. 11 | This library basically allows you to convert a string to a list of UTF-8 code points. 12 | 13 | ## Usage 14 | 15 | Try it out with flakes 16 | 17 | ```bash 18 | nix repl github:figsoda/utf8#lib --extra-experimental-features "flakes nix-command repl-flake" 19 | ``` 20 | 21 | or locally 22 | 23 | ```bash 24 | nix repl -f . 25 | ``` 26 | 27 | ### `chars` 28 | 29 | Type: `String -> [ String ]` 30 | 31 | Split a string into a list of code points 32 | 33 | ``` 34 | nix-repl> chars "你好,世界!" 35 | [ "你" "好" "," "世" "界" "!" ] 36 | ``` 37 | 38 | ### `head` 39 | 40 | Type: `String -> String` 41 | 42 | Return the first code point of the string 43 | 44 | ``` 45 | nix-repl> head "你好,世界!" 46 | "你" 47 | ``` 48 | 49 | ### `tail` 50 | 51 | Type: `String -> String` 52 | 53 | Return the string without the first code point 54 | 55 | ``` 56 | nix-repl> tail "你好,世界!" 57 | "好,世界!" 58 | ``` 59 | 60 | ### `length` 61 | 62 | Type: `String -> Int` 63 | 64 | Return the number of code points in the string 65 | 66 | ``` 67 | nix-repl> length "你好,世界!" 
68 | 6 69 | ``` 70 | 71 | ## Development 72 | 73 | ```bash 74 | nix run ./dev # regenerate table.nix 75 | 76 | nix develop ./dev 77 | namaka check # run tests 78 | namaka review # review pending snapshots 79 | ``` 80 | -------------------------------------------------------------------------------- /default.nix: -------------------------------------------------------------------------------- 1 | let 2 | inherit (builtins) 3 | substring 4 | ; 5 | 6 | table = import ./table.nix; 7 | 8 | head = str: substring 0 table.${substring 0 1 str} str; 9 | 10 | tail = str: substring table.${substring 0 1 str} (-1) str; 11 | 12 | chars = str: if str == "" then [ ] else [ (head str) ] ++ chars (tail str); 13 | 14 | length = str: if str == "" then 0 else 1 + length (tail str); 15 | in 16 | 17 | { 18 | inherit chars head length tail; 19 | } 20 | -------------------------------------------------------------------------------- /dev/.gitignore: -------------------------------------------------------------------------------- 1 | /target 2 | -------------------------------------------------------------------------------- /dev/Cargo.lock: -------------------------------------------------------------------------------- 1 | # This file is automatically @generated by Cargo. 2 | # It is not intended for manual editing. 
3 | version = 3 4 | 5 | [[package]] 6 | name = "utf8-gen" 7 | version = "0.1.0" 8 | -------------------------------------------------------------------------------- /dev/Cargo.toml: -------------------------------------------------------------------------------- 1 | [package] 2 | name = "utf8-gen" 3 | version = "0.1.0" 4 | edition = "2021" 5 | -------------------------------------------------------------------------------- /dev/flake.lock: -------------------------------------------------------------------------------- 1 | { 2 | "nodes": { 3 | "fenix": { 4 | "inputs": { 5 | "nixpkgs": [ 6 | "nixpkgs" 7 | ], 8 | "rust-analyzer-src": "rust-analyzer-src" 9 | }, 10 | "locked": { 11 | "lastModified": 1685686868, 12 | "narHash": "sha256-PFcFAdzA5yYP1m2eFuVlgtJeVnmkckUtCTTo+2wyc1s=", 13 | "owner": "nix-community", 14 | "repo": "fenix", 15 | "rev": "3ba3e566c85c2a07e1152cfa758fa727052ae8b1", 16 | "type": "github" 17 | }, 18 | "original": { 19 | "owner": "nix-community", 20 | "repo": "fenix", 21 | "type": "github" 22 | } 23 | }, 24 | "flake-parts": { 25 | "inputs": { 26 | "nixpkgs-lib": [ 27 | "nixpkgs" 28 | ] 29 | }, 30 | "locked": { 31 | "lastModified": 1685662779, 32 | "narHash": "sha256-cKDDciXGpMEjP1n6HlzKinN0H+oLmNpgeCTzYnsA2po=", 33 | "owner": "hercules-ci", 34 | "repo": "flake-parts", 35 | "rev": "71fb97f0d875fd4de4994dfb849f2c75e17eb6c3", 36 | "type": "github" 37 | }, 38 | "original": { 39 | "owner": "hercules-ci", 40 | "repo": "flake-parts", 41 | "type": "github" 42 | } 43 | }, 44 | "haumea": { 45 | "inputs": { 46 | "nixpkgs": [ 47 | "namaka", 48 | "nixpkgs" 49 | ] 50 | }, 51 | "locked": { 52 | "lastModified": 1685133229, 53 | "narHash": "sha256-FePm/Gi9PBSNwiDFq3N+DWdfxFq0UKsVVTJS3cQPn94=", 54 | "owner": "nix-community", 55 | "repo": "haumea", 56 | "rev": "34dd58385092a23018748b50f9b23de6266dffc2", 57 | "type": "github" 58 | }, 59 | "original": { 60 | "owner": "nix-community", 61 | "ref": "v0.2.2", 62 | "repo": "haumea", 63 | "type": "github" 64 | } 65 | }, 66 | 
"namaka": { 67 | "inputs": { 68 | "haumea": "haumea", 69 | "nixpkgs": [ 70 | "nixpkgs" 71 | ] 72 | }, 73 | "locked": { 74 | "lastModified": 1685739139, 75 | "narHash": "sha256-CLGEW11Fo1v4vj0XSqiyW1EbhRZFO7dkgM43eKwItrk=", 76 | "owner": "nix-community", 77 | "repo": "namaka", 78 | "rev": "d9a2cc83c1d0f68bd613f1fc909d0ef2cfffcf2e", 79 | "type": "github" 80 | }, 81 | "original": { 82 | "owner": "nix-community", 83 | "ref": "v0.2.0", 84 | "repo": "namaka", 85 | "type": "github" 86 | } 87 | }, 88 | "nixpkgs": { 89 | "locked": { 90 | "lastModified": 1685655444, 91 | "narHash": "sha256-6EujQNAeaUkWvpEZZcVF8qSfQrNVWFNNGbUJxv/A5a8=", 92 | "owner": "nixos", 93 | "repo": "nixpkgs", 94 | "rev": "e635192892f5abbc2289eaac3a73cdb249abaefd", 95 | "type": "github" 96 | }, 97 | "original": { 98 | "owner": "nixos", 99 | "ref": "nixos-unstable", 100 | "repo": "nixpkgs", 101 | "type": "github" 102 | } 103 | }, 104 | "root": { 105 | "inputs": { 106 | "fenix": "fenix", 107 | "flake-parts": "flake-parts", 108 | "namaka": "namaka", 109 | "nixpkgs": "nixpkgs" 110 | } 111 | }, 112 | "rust-analyzer-src": { 113 | "flake": false, 114 | "locked": { 115 | "lastModified": 1685637732, 116 | "narHash": "sha256-MN+gEn1S8NAq3SW9sqxcI0+xBRNUJAPzv6z7hU7LDQE=", 117 | "owner": "rust-lang", 118 | "repo": "rust-analyzer", 119 | "rev": "0b4c09b1d2d3e6be0499f2683743716661821bf2", 120 | "type": "github" 121 | }, 122 | "original": { 123 | "owner": "rust-lang", 124 | "ref": "nightly", 125 | "repo": "rust-analyzer", 126 | "type": "github" 127 | } 128 | } 129 | }, 130 | "root": "root", 131 | "version": 7 132 | } 133 | -------------------------------------------------------------------------------- /dev/flake.nix: -------------------------------------------------------------------------------- 1 | { 2 | inputs = { 3 | fenix = { 4 | url = "github:nix-community/fenix"; 5 | inputs.nixpkgs.follows = "nixpkgs"; 6 | }; 7 | flake-parts = { 8 | url = "github:hercules-ci/flake-parts"; 9 | inputs.nixpkgs-lib.follows = 
"nixpkgs"; 10 | }; 11 | namaka = { 12 | url = "github:nix-community/namaka/v0.2.0"; 13 | inputs.nixpkgs.follows = "nixpkgs"; 14 | }; 15 | nixpkgs.url = "github:nixos/nixpkgs/nixos-unstable"; 16 | }; 17 | 18 | outputs = inputs@{ flake-parts, namaka, ... }: 19 | flake-parts.lib.mkFlake { inherit inputs; } { 20 | flake.checks = namaka.lib.load { 21 | src = ./tests; 22 | inputs = { 23 | utf8 = import ../.; 24 | }; 25 | }; 26 | 27 | systems = [ 28 | "aarch64-darwin" 29 | "aarch64-linux" 30 | "x86_64-darwin" 31 | "x86_64-linux" 32 | ]; 33 | 34 | perSystem = { inputs', pkgs, ... }: 35 | let 36 | rust = inputs'.fenix.packages.minimal.toolchain; 37 | rustPlatform = pkgs.makeRustPlatform { 38 | cargo = rust; 39 | rustc = rust; 40 | }; 41 | in 42 | { 43 | devShells.default = pkgs.mkShell { 44 | packages = [ 45 | inputs'.namaka.packages.default 46 | ]; 47 | }; 48 | 49 | packages.default = rustPlatform.buildRustPackage { 50 | pname = "utf8-gen"; 51 | version = "0.1.0"; 52 | src = ./.; 53 | cargoLock.lockFile = ./Cargo.lock; 54 | }; 55 | }; 56 | }; 57 | } 58 | -------------------------------------------------------------------------------- /dev/rustfmt.toml: -------------------------------------------------------------------------------- 1 | unstable_features = true 2 | 3 | condense_wildcard_suffixes = true 4 | format_code_in_doc_comments = true 5 | group_imports = "StdExternalCrate" 6 | imports_granularity = "Crate" 7 | newline_style = "Unix" 8 | normalize_comments = true 9 | normalize_doc_attributes = true 10 | reorder_impl_items = true 11 | spaces_around_ranges = true 12 | use_field_init_shorthand = true 13 | use_try_shorthand = true 14 | -------------------------------------------------------------------------------- /dev/src/main.rs: -------------------------------------------------------------------------------- 1 | #![feature(array_windows)] 2 | 3 | use std::{ 4 | fs::File, 5 | io::{self, Write}, 6 | }; 7 | 8 | fn main() -> io::Result<()> { 9 | let mut out = 
File::create("table.nix")?; 10 | writeln!(out, "# generated with `nix run ./dev`")?; 11 | writeln!(out, "{{")?; 12 | 13 | for (i, &[start, end]) in [0u8, 0b1100_0000, 0b1110_0000, 0b1111_0000, 0] 14 | .array_windows() 15 | .enumerate() 16 | { 17 | for x in start ..= end.wrapping_sub(1) { 18 | let esc = x.escape_ascii().to_string(); 19 | write!(out, " \"")?; 20 | if esc.contains("\\x") { 21 | out.write_all(&[x])?; 22 | } else { 23 | write!(out, "{esc}")?; 24 | } 25 | writeln!(out, "\" = {};", i + 1)?; 26 | } 27 | } 28 | 29 | writeln!(out, "}}")?; 30 | Ok(()) 31 | } 32 | -------------------------------------------------------------------------------- /dev/tests/_snapshots/ascii: -------------------------------------------------------------------------------- 1 | #json 2 | ["H","e","l","l","o",","," ","w","o","r","l","d","!"] -------------------------------------------------------------------------------- /dev/tests/_snapshots/basic: -------------------------------------------------------------------------------- 1 | #json 2 | ["你","好",",","世","界","!"] -------------------------------------------------------------------------------- /dev/tests/_snapshots/length: -------------------------------------------------------------------------------- 1 | #json 2 | 6 -------------------------------------------------------------------------------- /dev/tests/ascii/expr.nix: -------------------------------------------------------------------------------- 1 | { utf8 }: 2 | 3 | utf8.chars "Hello, world!" 4 | -------------------------------------------------------------------------------- /dev/tests/basic/expr.nix: -------------------------------------------------------------------------------- 1 | { utf8 }: 2 | 3 | utf8.chars "你好,世界!" 4 | -------------------------------------------------------------------------------- /dev/tests/length/expr.nix: -------------------------------------------------------------------------------- 1 | { utf8 }: 2 | 3 | utf8.length "你好,世界!" 
4 | -------------------------------------------------------------------------------- /flake.nix: -------------------------------------------------------------------------------- 1 | { 2 | outputs = { self }: { 3 | lib = import self; 4 | }; 5 | } 6 | -------------------------------------------------------------------------------- /namaka.toml: -------------------------------------------------------------------------------- 1 | [check] 2 | cmd = ["nix", "eval", "./dev#checks"] 3 | 4 | [eval] 5 | cmd = ["nix", "eval", "./dev#checks"] 6 | -------------------------------------------------------------------------------- /table.nix: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/figsoda/utf8/ce04eef066a4a682f2ef0eba8e56e4da9b8f14aa/table.nix --------------------------------------------------------------------------------