├── .gitignore
├── .vscode
    ├── extensions.json
    ├── tasks.json
    └── settings.json
├── .gitattributes
├── .github
    └── workflows
    │   ├── build.yml
    │   └── pr.yml
├── .yo-rc.json
├── package.json
├── table-nonbinary-unicode-properties.html
├── gulpfile.js
├── LICENSE
├── table-unicode-general-category-values.html
├── README.md
├── table-binary-unicode-properties.html
├── table-unicode-script-values.html
└── spec.emu


/.gitignore:
--------------------------------------------------------------------------------
1 | node_modules
2 | coverage
3 | docs


--------------------------------------------------------------------------------
/.vscode/extensions.json:
--------------------------------------------------------------------------------
1 | {
2 | 	"recommendations": [
3 | 		"rbuckton.ecmarkup-vscode"
4 | 	]
5 | }


--------------------------------------------------------------------------------
/.gitattributes:
--------------------------------------------------------------------------------
1 | index.html  -diff merge=ours
2 | spec.js     -diff merge=ours
3 | spec.css    -diff merge=ours


--------------------------------------------------------------------------------
/.vscode/tasks.json:
--------------------------------------------------------------------------------
 1 | {
 2 |     // See https://go.microsoft.com/fwlink/?LinkId=733558
 3 |     // for the documentation about the tasks.json format
 4 |     "version": "2.0.0",
 5 |     "tasks": [
 6 |         {
 7 |             "type": "gulp",
 8 |             "task": "build",
 9 |             "group": {
10 |                 "kind": "build",
11 |                 "isDefault": true
12 |             }
13 |         }
14 |     ]
15 | }


--------------------------------------------------------------------------------
/.vscode/settings.json:
--------------------------------------------------------------------------------
 1 | {
 2 |     "[markdown]": {
 3 |         "files.trimTrailingWhitespace": false
 4 |     },
 5 |     "[html]": {
 6 |         "editor.insertSpaces": true,
 7 |         "editor.tabSize": 2,
 8 |     },
 9 |     "[ecmarkup]": {
10 |         "editor.insertSpaces": true,
11 |         "editor.tabSize": 2,
12 |     },
13 |     "files.associations": {
14 |         "*.html": "ecmarkup",
15 |         "*.emu": "ecmarkup"
16 |     }
17 | }


--------------------------------------------------------------------------------
/.github/workflows/build.yml:
--------------------------------------------------------------------------------
 1 | name: Publish Spec to gh-pages
 2 | on:
 3 |   push:
 4 |     branches: [ main ]
 5 | jobs:
 6 |   build:
 7 |     runs-on: ubuntu-latest
 8 |     steps:
 9 |       - uses: actions/checkout@v2
10 |       - run: npm install --legacy-peer-deps
11 |       - run: npm run compile
12 |       - name: Deploy
13 |         uses: JamesIves/github-pages-deploy-action@4.1.4
14 |         with:
15 |           branch: gh-pages
16 |           folder: docs
17 |           clean-exclude: |
18 |             pr           
19 | 


--------------------------------------------------------------------------------
/.yo-rc.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "generator-ecmascript-proposal": {
 3 |     "promptValues": {
 4 |       "hasChampion": true,
 5 |       "championName": "Ron Buckton",
 6 |       "championGithub": "rbuckton",
 7 |       "spec": "https://rbuckton.github.io/proposal-regexp-modifiers",
 8 |       "stage": "0",
 9 |       "sections": [
10 |         "prior-art",
11 |         "syntax",
12 |         "semantics",
13 |         "examples",
14 |         "grammar",
15 |         "references",
16 |         "prior-discussion"
17 |       ],
18 |       "vscode": true,
19 |       "build": "gulp",
20 |       "githubWorkflowCI": true,
21 |       "githubWorkflowPR": true
22 |     }
23 |   }
24 | }
25 | 


--------------------------------------------------------------------------------
/package.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "name": "proposal-regexp-modifiers",
 3 |   "version": "0.0.0",
 4 |   "private": true,
 5 |   "description": "Regular Expression Pattern Modifiers for ECMAScript",
 6 |   "homepage": "https://github.com/rbuckton/proposal-regexp-modifiers#readme",
 7 |   "author": {
 8 |     "name": "Ron Buckton",
 9 |     "email": "ron.buckton@microsoft.com"
10 |   },
11 |   "keywords": [
12 |     "javascript",
13 |     "ecmascript"
14 |   ],
15 |   "scripts": {
16 |     "compile": "gulp build",
17 |     "start": "gulp start"
18 |   },
19 |   "license": "SEE LICENSE IN https://tc39.github.io/ecma262/#sec-copyright-and-software-license",
20 |   "devDependencies": {
21 |     "@tc39/ecma262-biblio": "^2.0.2322",
22 |     "del": "^6.0.0",
23 |     "ecmarkup": "^12.1.0",
24 |     "gulp": "^4.0.2",
25 |     "gulp-emu": "^2.1.0",
26 |     "gulp-live-server": "0.0.31",
27 |     "gulp-rename": "^2.0.0"
28 |   }
29 | }
30 | 


--------------------------------------------------------------------------------
/table-nonbinary-unicode-properties.html:
--------------------------------------------------------------------------------
 1 | <emu-table id="table-nonbinary-unicode-properties">
 2 |   <emu-caption>Non-binary Unicode property aliases and their canonical property names</emu-caption>
 3 |   <table class="real-table unicode-property-table">
 4 |     <thead>
 5 |       <tr>
 6 |         <th>Property name and aliases</th>
 7 |         <th>Canonical property name</th>
 8 |       </tr>
 9 |     </thead>
10 |     <tr>
11 |       <td>`General_Category`</td>
12 |       <td rowspan="2"><a href="https://unicode.org/reports/tr18/#General_Category_Property">`General_Category`</a></td>
13 |     </tr>
14 |     <tr>
15 |       <td>`gc`</td>
16 |     </tr>
17 |     <tr>
18 |       <td>`Script`</td>
19 |       <td rowspan="2"><a href="https://unicode.org/reports/tr24/#Script">`Script`</a></td>
20 |     </tr>
21 |     <tr>
22 |       <td>`sc`</td>
23 |     </tr>
24 |     <tr>
25 |       <td>`Script_Extensions`</td>
26 |       <td rowspan="2"><a href="https://unicode.org/reports/tr24/#Script_Extensions">`Script_Extensions`</a></td>
27 |     </tr>
28 |     <tr>
29 |       <td>`scx`</td>
30 |     </tr>
31 |   </table>
32 | </emu-table>
33 | 


--------------------------------------------------------------------------------
/.github/workflows/pr.yml:
--------------------------------------------------------------------------------
 1 | name: Publish PR to gh-pages/pr/
 2 | on:
 3 |   pull_request:
 4 |     branches: [ main ]
 5 | jobs:
 6 |   build:
 7 |     runs-on: ubuntu-latest
 8 |     if: ${{ github.event.number }}
 9 |     steps:
10 |       - uses: actions/checkout@v2
11 |       - run: npm install --legacy-peer-deps
12 |       - run: npm run compile
13 |       - name: Deploy
14 |         uses: JamesIves/github-pages-deploy-action@4.1.4
15 |         with:
16 |           branch: gh-pages
17 |           folder: docs
18 |           target-folder: pr/${{ github.event.number }}/
19 |       - id: get-preview-url  # exposes the `preview-url` step output read by the comment step below
20 |         name: Get preview url
21 |         run: echo "preview-url=https://tc39.es/$(basename $GITHUB_REPOSITORY)/pr/${{ github.event.number }}" >> "$GITHUB_OUTPUT"  # GITHUB_OUTPUT file replaces the deprecated ::set-output command
22 |         shell: bash
23 |       - name: Post Preview Comment
24 |         uses: phulsechinmay/rewritable-pr-comment@v0.3.0
25 |         with:
26 |           GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
27 |           COMMENT_IDENTIFIER: tc39_pr_preview_comment
28 |           message: |
29 |             A preview of this PR can be found at ${{ steps.get-preview-url.outputs.preview-url }}.
30 | 


--------------------------------------------------------------------------------
/gulpfile.js:
--------------------------------------------------------------------------------
 1 | const del = require("del");
 2 | const path = require("path");
 3 | const gulp = require("gulp");
 4 | const emu = require("gulp-emu");
 5 | const rename = require("gulp-rename");
 6 | const gls = require("gulp-live-server");
 7 | 
 8 | gulp.task("clean", () => del("docs/**/*")); // "clean": delete the contents of docs/
 9 | // "build": run spec.emu through gulp-emu, rename the output to index.html, and write it to docs/.
10 | gulp.task("build", () => gulp
11 |     .src(["spec.emu"])
12 |     .pipe(emu({
13 |         log: require("ecmarkup/lib/utils").logVerbose,
14 |         warn: err => { // reformat each warning as "Warning: <path>:<line>:<column>: <message>"
15 |             const file = path.resolve(err.file || "spec.emu"); // absolute path; falls back to spec.emu when err.file is falsy
16 |             const message = `Warning: ${file}:${typeof err.line === "number" ? `${err.line}:${err.column}:` : ""} ${err.message}`; // line:column only when err.line is a number
17 |             require("ecmarkup/lib/utils").logWarning(message);
18 |         },
19 |         ecma262Biblio: false, // NOTE(review): presumably turns off the built-in ECMA-262 biblio - confirm against the ecmarkup/gulp-emu version in use
20 |     }))
21 |     .pipe(rename("index.html"))
22 |     .pipe(gulp.dest("docs")));
23 | // "watch": re-run the "build" task whenever spec.emu changes.
24 | gulp.task("watch", () => gulp
25 |     .watch(["spec.emu"], gulp.task("build")));
26 | // "start": run "watch" in parallel with a gulp-live-server static server for docs/.
27 | gulp.task("start", gulp.parallel("watch", () => {
28 |     const server = gls.static("docs", 8080); // serves docs/; 8080 is the port argument
29 |     const promise = server.start();
30 |     (/** @type {import("chokidar").FSWatcher}*/(gulp.watch(["docs/**/*"])))
31 |         .on("change", file => {
32 |             server.notify({ path: path.resolve(file) }); // report the changed file (absolute path) to the server; presumably triggers a live reload - confirm
33 |         });
34 |     return promise; // hand server.start()'s result back to gulp as the task's completion signal
35 | }));
36 | // "default": alias for the "build" task.
37 | gulp.task("default", gulp.task("build"));


--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
 1 | BSD 3-Clause License
 2 | 
 3 | Copyright (c) 2017, Ron Buckton, Ecma International
 4 | All rights reserved.
 5 | 
 6 | Redistribution and use in source and binary forms, with or without
 7 | modification, are permitted provided that the following conditions are met:
 8 | 
 9 | * Redistributions of source code must retain the above copyright notice, this
10 |   list of conditions and the following disclaimer.
11 | 
12 | * Redistributions in binary form must reproduce the above copyright notice,
13 |   this list of conditions and the following disclaimer in the documentation
14 |   and/or other materials provided with the distribution.
15 | 
16 | * Neither the name of the copyright holder nor the names of its
17 |   contributors may be used to endorse or promote products derived from
18 |   this software without specific prior written permission.
19 | 
20 | THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
21 | AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
22 | IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
23 | DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
24 | FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
25 | DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
26 | SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
27 | CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
28 | OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
29 | OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
30 | 


--------------------------------------------------------------------------------
/table-unicode-general-category-values.html:
--------------------------------------------------------------------------------
  1 | <emu-table id="table-unicode-general-category-values">
  2 |   <emu-caption>Value aliases and canonical values for the Unicode property <a href="https://unicode.org/reports/tr18/#General_Category_Property">`General_Category`</a></emu-caption>
  3 |   <table class="real-table unicode-property-table">
  4 |     <thead>
  5 |       <tr>
  6 |         <th>Property value and aliases</th>
  7 |         <th>Canonical property value</th>
  8 |       </tr>
  9 |     </thead>
 10 |     <tr>
 11 |       <td>`Cased_Letter`</td>
 12 |       <td rowspan="2">`Cased_Letter`</td>
 13 |     </tr>
 14 |     <tr>
 15 |       <td>`LC`</td>
 16 |     </tr>
 17 |     <tr>
 18 |       <td>`Close_Punctuation`</td>
 19 |       <td rowspan="2">`Close_Punctuation`</td>
 20 |     </tr>
 21 |     <tr>
 22 |       <td>`Pe`</td>
 23 |     </tr>
 24 |     <tr>
 25 |       <td>`Connector_Punctuation`</td>
 26 |       <td rowspan="2">`Connector_Punctuation`</td>
 27 |     </tr>
 28 |     <tr>
 29 |       <td>`Pc`</td>
 30 |     </tr>
 31 |     <tr>
 32 |       <td>`Control`</td>
 33 |       <td rowspan="3">`Control`</td>
 34 |     </tr>
 35 |     <tr>
 36 |       <td>`Cc`</td>
 37 |     </tr>
 38 |     <tr>
 39 |       <td>`cntrl`</td>
 40 |     </tr>
 41 |     <tr>
 42 |       <td>`Currency_Symbol`</td>
 43 |       <td rowspan="2">`Currency_Symbol`</td>
 44 |     </tr>
 45 |     <tr>
 46 |       <td>`Sc`</td>
 47 |     </tr>
 48 |     <tr>
 49 |       <td>`Dash_Punctuation`</td>
 50 |       <td rowspan="2">`Dash_Punctuation`</td>
 51 |     </tr>
 52 |     <tr>
 53 |       <td>`Pd`</td>
 54 |     </tr>
 55 |     <tr>
 56 |       <td>`Decimal_Number`</td>
 57 |       <td rowspan="3">`Decimal_Number`</td>
 58 |     </tr>
 59 |     <tr>
 60 |       <td>`Nd`</td>
 61 |     </tr>
 62 |     <tr>
 63 |       <td>`digit`</td>
 64 |     </tr>
 65 |     <tr>
 66 |       <td>`Enclosing_Mark`</td>
 67 |       <td rowspan="2">`Enclosing_Mark`</td>
 68 |     </tr>
 69 |     <tr>
 70 |       <td>`Me`</td>
 71 |     </tr>
 72 |     <tr>
 73 |       <td>`Final_Punctuation`</td>
 74 |       <td rowspan="2">`Final_Punctuation`</td>
 75 |     </tr>
 76 |     <tr>
 77 |       <td>`Pf`</td>
 78 |     </tr>
 79 |     <tr>
 80 |       <td>`Format`</td>
 81 |       <td rowspan="2">`Format`</td>
 82 |     </tr>
 83 |     <tr>
 84 |       <td>`Cf`</td>
 85 |     </tr>
 86 |     <tr>
 87 |       <td>`Initial_Punctuation`</td>
 88 |       <td rowspan="2">`Initial_Punctuation`</td>
 89 |     </tr>
 90 |     <tr>
 91 |       <td>`Pi`</td>
 92 |     </tr>
 93 |     <tr>
 94 |       <td>`Letter`</td>
 95 |       <td rowspan="2">`Letter`</td>
 96 |     </tr>
 97 |     <tr>
 98 |       <td>`L`</td>
 99 |     </tr>
100 |     <tr>
101 |       <td>`Letter_Number`</td>
102 |       <td rowspan="2">`Letter_Number`</td>
103 |     </tr>
104 |     <tr>
105 |       <td>`Nl`</td>
106 |     </tr>
107 |     <tr>
108 |       <td>`Line_Separator`</td>
109 |       <td rowspan="2">`Line_Separator`</td>
110 |     </tr>
111 |     <tr>
112 |       <td>`Zl`</td>
113 |     </tr>
114 |     <tr>
115 |       <td>`Lowercase_Letter`</td>
116 |       <td rowspan="2">`Lowercase_Letter`</td>
117 |     </tr>
118 |     <tr>
119 |       <td>`Ll`</td>
120 |     </tr>
121 |     <tr>
122 |       <td>`Mark`</td>
123 |       <td rowspan="3">`Mark`</td>
124 |     </tr>
125 |     <tr>
126 |       <td>`M`</td>
127 |     </tr>
128 |     <tr>
129 |       <td>`Combining_Mark`</td>
130 |     </tr>
131 |     <tr>
132 |       <td>`Math_Symbol`</td>
133 |       <td rowspan="2">`Math_Symbol`</td>
134 |     </tr>
135 |     <tr>
136 |       <td>`Sm`</td>
137 |     </tr>
138 |     <tr>
139 |       <td>`Modifier_Letter`</td>
140 |       <td rowspan="2">`Modifier_Letter`</td>
141 |     </tr>
142 |     <tr>
143 |       <td>`Lm`</td>
144 |     </tr>
145 |     <tr>
146 |       <td>`Modifier_Symbol`</td>
147 |       <td rowspan="2">`Modifier_Symbol`</td>
148 |     </tr>
149 |     <tr>
150 |       <td>`Sk`</td>
151 |     </tr>
152 |     <tr>
153 |       <td>`Nonspacing_Mark`</td>
154 |       <td rowspan="2">`Nonspacing_Mark`</td>
155 |     </tr>
156 |     <tr>
157 |       <td>`Mn`</td>
158 |     </tr>
159 |     <tr>
160 |       <td>`Number`</td>
161 |       <td rowspan="2">`Number`</td>
162 |     </tr>
163 |     <tr>
164 |       <td>`N`</td>
165 |     </tr>
166 |     <tr>
167 |       <td>`Open_Punctuation`</td>
168 |       <td rowspan="2">`Open_Punctuation`</td>
169 |     </tr>
170 |     <tr>
171 |       <td>`Ps`</td>
172 |     </tr>
173 |     <tr>
174 |       <td>`Other`</td>
175 |       <td rowspan="2">`Other`</td>
176 |     </tr>
177 |     <tr>
178 |       <td>`C`</td>
179 |     </tr>
180 |     <tr>
181 |       <td>`Other_Letter`</td>
182 |       <td rowspan="2">`Other_Letter`</td>
183 |     </tr>
184 |     <tr>
185 |       <td>`Lo`</td>
186 |     </tr>
187 |     <tr>
188 |       <td>`Other_Number`</td>
189 |       <td rowspan="2">`Other_Number`</td>
190 |     </tr>
191 |     <tr>
192 |       <td>`No`</td>
193 |     </tr>
194 |     <tr>
195 |       <td>`Other_Punctuation`</td>
196 |       <td rowspan="2">`Other_Punctuation`</td>
197 |     </tr>
198 |     <tr>
199 |       <td>`Po`</td>
200 |     </tr>
201 |     <tr>
202 |       <td>`Other_Symbol`</td>
203 |       <td rowspan="2">`Other_Symbol`</td>
204 |     </tr>
205 |     <tr>
206 |       <td>`So`</td>
207 |     </tr>
208 |     <tr>
209 |       <td>`Paragraph_Separator`</td>
210 |       <td rowspan="2">`Paragraph_Separator`</td>
211 |     </tr>
212 |     <tr>
213 |       <td>`Zp`</td>
214 |     </tr>
215 |     <tr>
216 |       <td>`Private_Use`</td>
217 |       <td rowspan="2">`Private_Use`</td>
218 |     </tr>
219 |     <tr>
220 |       <td>`Co`</td>
221 |     </tr>
222 |     <tr>
223 |       <td>`Punctuation`</td>
224 |       <td rowspan="3">`Punctuation`</td>
225 |     </tr>
226 |     <tr>
227 |       <td>`P`</td>
228 |     </tr>
229 |     <tr>
230 |       <td>`punct`</td>
231 |     </tr>
232 |     <tr>
233 |       <td>`Separator`</td>
234 |       <td rowspan="2">`Separator`</td>
235 |     </tr>
236 |     <tr>
237 |       <td>`Z`</td>
238 |     </tr>
239 |     <tr>
240 |       <td>`Space_Separator`</td>
241 |       <td rowspan="2">`Space_Separator`</td>
242 |     </tr>
243 |     <tr>
244 |       <td>`Zs`</td>
245 |     </tr>
246 |     <tr>
247 |       <td>`Spacing_Mark`</td>
248 |       <td rowspan="2">`Spacing_Mark`</td>
249 |     </tr>
250 |     <tr>
251 |       <td>`Mc`</td>
252 |     </tr>
253 |     <tr>
254 |       <td>`Surrogate`</td>
255 |       <td rowspan="2">`Surrogate`</td>
256 |     </tr>
257 |     <tr>
258 |       <td>`Cs`</td>
259 |     </tr>
260 |     <tr>
261 |       <td>`Symbol`</td>
262 |       <td rowspan="2">`Symbol`</td>
263 |     </tr>
264 |     <tr>
265 |       <td>`S`</td>
266 |     </tr>
267 |     <tr>
268 |       <td>`Titlecase_Letter`</td>
269 |       <td rowspan="2">`Titlecase_Letter`</td>
270 |     </tr>
271 |     <tr>
272 |       <td>`Lt`</td>
273 |     </tr>
274 |     <tr>
275 |       <td>`Unassigned`</td>
276 |       <td rowspan="2">`Unassigned`</td>
277 |     </tr>
278 |     <tr>
279 |       <td>`Cn`</td>
280 |     </tr>
281 |     <tr>
282 |       <td>`Uppercase_Letter`</td>
283 |       <td rowspan="2">`Uppercase_Letter`</td>
284 |     </tr>
285 |     <tr>
286 |       <td>`Lu`</td>
287 |     </tr>
288 |   </table>
289 | </emu-table>
290 | 


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
  1 | <!--#region:intro-->
  2 | # Regular Expression Pattern Modifiers for ECMAScript
  3 | 
  4 | <!--#endregion:intro-->
  5 | 
  6 | <!--#region:status-->
  7 | ## Status
  8 | 
  9 | **Stage:** 4  
 10 | **Champion:** Ron Buckton ([@rbuckton](https://github.com/rbuckton))  
 11 | 
 12 | _For detailed status of this proposal see [TODO](#todo), below._  
 13 | <!--#endregion:status-->
 14 | 
 15 | <!--#region:authors-->
 16 | ## Authors
 17 | 
 18 | * Ron Buckton ([@rbuckton](https://github.com/rbuckton))  
 19 | <!--#endregion:authors-->
 20 | 
 21 | <!--#region:motivations-->
 22 | # Motivations
 23 | 
 24 | One capability found in the majority of regular expression engines, and
 25 | commonly used by parsers, syntax highlighters, and other tools, is the ability to
 26 | control a subset of regular expression flags within a subexpression, such as:
 27 | 
 28 | - `i` &mdash; Ignore Case
 29 | - `m` &mdash; Multiline
 30 | - `s` &mdash; Single-line (a.k.a. "dot all")
 31 | - `x` &mdash; Extended mode (see https://github.com/rbuckton/proposal-regexp-x-mode)
 32 | 
 33 | Modifiers are especially helpful when regular expressions are defined in a context
 34 | where executable code cannot be evaluated, such as a JSON configuration file or 
 35 | TextMate tmLanguage grammar file.
 36 | 
 37 | As part of this proposal, we will investigate each existing (and future-proposed) RegExp flag
 38 | to determine whether they are feasible to use as modifiers.
 39 | 
 40 | <!--#endregion:motivations-->
 41 | 
 42 | <!--#region:prior-art-->
 43 | # Prior Art 
 44 | 
 45 | * [Perl](https://rbuckton.github.io/regexp-features/engines/perl.html#feature-modifiers)  
 46 | * [PCRE](https://rbuckton.github.io/regexp-features/engines/pcre.html#feature-modifiers)  
 47 | * [Boost.Regex](https://rbuckton.github.io/regexp-features/engines/boost.regex.html#feature-modifiers)  
 48 | * [.NET](https://rbuckton.github.io/regexp-features/engines/dotnet.html#feature-modifiers)  
 49 | * [Oniguruma](https://rbuckton.github.io/regexp-features/engines/oniguruma.html#feature-modifiers)  
 50 | * [Hyperscan](https://rbuckton.github.io/regexp-features/engines/hyperscan.html#feature-modifiers)  
 51 | * [ICU](https://rbuckton.github.io/regexp-features/engines/icu.html#feature-modifiers)  
 52 | * [Glib/GRegex](https://rbuckton.github.io/regexp-features/engines/glib-gregex.html#feature-modifiers)  
 53 | 
 54 | See https://rbuckton.github.io/regexp-features/features/modifiers.html for additional information.
 55 | <!--#endregion:prior-art-->
 56 | 
 57 | <!--#region:syntax-->
 58 | # Syntax
 59 | 
 60 | Modifiers allow you to change the currently active RegExp flags within a subexpression.
 61 | 
 62 | - `(?imsx-imsx:subexpression)` &mdash; Sets or unsets (using `-`) the specified RegExp flags for the subexpression.
 63 | - ~~`(?imsx-imsx)` &mdash; Sets or unsets (using `-`) the specified RegExp flags starting at the current position until the next closing `)` or the end of the pattern.~~
 64 | 
 65 | > NOTE: Certain flags cannot be modified mid-expression. These currently include `g` (global), `y` (sticky), `u` (unicode), and `d` (hasIndices).
 66 | 
 67 | > NOTE: The actual supported flags will be determined on a case-by-case basis. See [#1](https://github.com/tc39/proposal-regexp-modifiers/issues/1).
 68 | 
 69 | > NOTE: This has no conflicts with existing syntax, as ECMAScript currently produces an error for this syntax in both `u` and non-`u` modes.
 70 | 
 71 | > NOTE: The "self-bounded" form (`(?imsx-imsx:subexpression)`) advanced to Stage 2 on December 15th, 2021.
 72 | 
 73 | > NOTE: The "unbounded" form (`(?imsx-imsx)`) is no longer being considered as part of this proposal as of December 15th, 2021.
 74 | 
 75 | <!--#endregion:syntax-->
 76 | 
 77 | <!--#region:semantics-->
 78 | <!-- # Semantics -->
 79 | 
 80 | 
 81 | <!--#endregion:semantics-->
 82 | 
 83 | <!--#region:examples-->
 84 | # Examples
 85 | 
 86 | ```js
 87 | const re1 = /^[a-z](?-i:[a-z])$/i;
 88 | re1.test("ab"); // true
 89 | re1.test("Ab"); // true
 90 | re1.test("aB"); // false
 91 | 
 92 | const re2 = /^(?i:[a-z])[a-z]$/;
 93 | re2.test("ab"); // true
 94 | re2.test("Ab"); // true
 95 | re2.test("aB"); // false
 96 | ```
 97 | 
 98 | <!--#endregion:examples-->
 99 | 
100 | <!--#region:api-->
101 | <!--
102 | # API
103 | 
104 | > TODO: Provide description of High-level API.
105 | -->
106 | <!--#endregion:api-->
107 | 
108 | <!--#region:grammar-->
109 | <!-- # Grammar
110 | 
111 | ```grammarkdown
112 | ``` -->
113 | <!--#endregion:grammar-->
114 | 
115 | <!--#region:references-->
116 | <!-- # References
117 | 
118 | > TODO: Provide links to other specifications, etc.
119 | 
120 | * [Title](url)   -->
121 | <!--#endregion:references-->
122 | 
123 | # History
124 | 
125 | - October 27th, 2021 &mdash; Proposed for Stage 1 ([slides](https://1drv.ms/p/s!AjgWTO11Fk-Tkfl7c6yR-2P8T4gn0w?e=cvaUL2))
126 |   - Outcome: Advanced to Stage 1
127 | - December 15th, 2021 &mdash; Proposed for Stage 2 ([slides](https://1drv.ms/p/s!AjgWTO11Fk-Tkfs3yIyrh3hZ2k6PCQ?e=Yodx4H))
128 |   - Outcome: Advanced to Stage 2 with "self-bounded" form only ("unbounded" form did not advance).
129 |   - Stage 2 Reviewers: Richard Gibson, Waldemar Horwat
130 | - June 7th, 2022 &mdash; Proposed for Stage 3 ([slides](https://1drv.ms/p/s!AjgWTO11Fk-Tkf5daRnRsxu8BY5Nsg?e=UKVf8W))
131 |   - Outcome: [Advanced to Stage 3](https://github.com/tc39/notes/blob/31edb829db604fdb0255b21238b20898b66cee41/meetings/2022-06/jun-07.md)
132 | 
133 | <!--#region:todo-->
134 | # TODO
135 | 
136 | The following is a high-level list of tasks to progress through each stage of the [TC39 proposal process](https://tc39.github.io/process-document/):
137 | 
138 | ### Stage 1 Entrance Criteria
139 | 
140 | * [x] Identified a "[champion][Champion]" who will advance the addition.  
141 | * [x] [Prose][Prose] outlining the problem or need and the general shape of a solution.  
142 | * [x] Illustrative [examples][Examples] of usage.  
143 | * [ ] ~~High-level [API][API].~~  
144 | 
145 | ### Stage 2 Entrance Criteria
146 | 
147 | * [x] [Initial specification text][Specification].  
148 | * [ ] ~~[Transpiler support][Transpiler] (_Optional_)~~.  
149 | 
150 | ### Stage 2.7 Entrance Criteria
151 | 
152 | * [x] [Complete specification text][Specification].  
153 | * [x] Designated reviewers have [signed off][Stage3ReviewerSignOff] on the current spec text (1 of 2).  
154 | * [x] The ECMAScript editor has [signed off][Stage3EditorSignOff] on the current spec text.  
155 | 
156 | ### Stage 3 Entrance Criteria
157 | 
158 | * [x] [Test262](https://github.com/tc39/test262) acceptance tests have been written for mainline usage scenarios and [merged][Test262PullRequest].  
159 | 
160 | ### Stage 4 Entrance Criteria
161 | 
162 | * [x] Two compatible implementations which pass the acceptance tests:  
163 |   * [X] [V8][Implementation1] - Shipping in [Chrome 125](https://developer.chrome.com/release-notes/125)/Edge 125
164 |   * [x] [SpiderMonkey][Implementation2] - Shipping in Firefox 130 behind a flag, Shipping in Firefox 132b (Nightly) [unflagged](https://bugzilla.mozilla.org/show_bug.cgi?id=1913752)
165 |   * [ ] JSC  
166 |   * [ ] [Engine262](https://github.com/engine262/engine262/pull/229)  
167 | * [x] A [pull request][Ecma262PullRequest] has been sent to tc39/ecma262 with the integrated spec text.  
168 | * [ ] The ECMAScript editor has signed off on the [pull request][Ecma262PullRequest].  
169 |   * [x] [Kevin Gibbons](https://github.com/tc39/ecma262/pull/3221#pullrequestreview-1735554031)  
170 |   * [ ] [Michael Ficarra](https://github.com/tc39/ecma262/pull/3221#pullrequestreview-1784954743)  
171 | <!--#endregion:todo-->
172 | 
173 | <!-- The following links are used throughout the README: -->
174 | 
175 | [Process]: https://tc39.es/process-document/
176 | [Proposals]: https://github.com/tc39/proposals/
177 | [Grammarkdown]: http://github.com/rbuckton/grammarkdown#readme
178 | [Champion]: #status
179 | [Prose]: #motivations
180 | [Examples]: #examples
181 | [API]: #api
182 | [Specification]: https://rbuckton.github.io/proposal-regexp-modifiers
183 | 
184 | [Transpiler]: #todo
185 | [Stage3ReviewerSignOff]: #todo
186 | [Stage3EditorSignOff]: #todo
187 | [Test262PullRequest]: https://github.com/tc39/test262/pull/3960
188 | [Implementation1]: https://bugs.chromium.org/p/v8/issues/detail?id=12956
189 | [Implementation2]: https://bugzilla.mozilla.org/show_bug.cgi?id=1899813
190 | [Ecma262PullRequest]: https://github.com/tc39/ecma262/pull/3221
191 | 


--------------------------------------------------------------------------------
/table-binary-unicode-properties.html:
--------------------------------------------------------------------------------
  1 | <emu-table id="table-binary-unicode-properties">
  2 |   <emu-caption>Binary Unicode property aliases and their canonical property names</emu-caption>
  3 |   <table class="real-table unicode-property-table">
  4 |     <thead>
  5 |       <tr>
  6 |         <th>Property name and aliases</th>
  7 |         <th>Canonical property name</th>
  8 |       </tr>
  9 |     </thead>
 10 |     <tr>
 11 |       <td>`ASCII`</td>
 12 |       <td><a href="https://unicode.org/reports/tr18/#General_Category_Property">`ASCII`</a></td>
 13 |     </tr>
 14 |     <tr>
 15 |       <td>`ASCII_Hex_Digit`</td>
 16 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#ASCII_Hex_Digit">`ASCII_Hex_Digit`</a></td>
 17 |     </tr>
 18 |     <tr>
 19 |       <td>`AHex`</td>
 20 |     </tr>
 21 |     <tr>
 22 |       <td>`Alphabetic`</td>
 23 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Alphabetic">`Alphabetic`</a></td>
 24 |     </tr>
 25 |     <tr>
 26 |       <td>`Alpha`</td>
 27 |     </tr>
 28 |     <tr>
 29 |       <td>`Any`</td>
 30 |       <td><a href="https://unicode.org/reports/tr18/#General_Category_Property">`Any`</a></td>
 31 |     </tr>
 32 |     <tr>
 33 |       <td>`Assigned`</td>
 34 |       <td><a href="https://unicode.org/reports/tr18/#General_Category_Property">`Assigned`</a></td>
 35 |     </tr>
 36 |     <tr>
 37 |       <td>`Bidi_Control`</td>
 38 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Bidi_Control">`Bidi_Control`</a></td>
 39 |     </tr>
 40 |     <tr>
 41 |       <td>`Bidi_C`</td>
 42 |     </tr>
 43 |     <tr>
 44 |       <td>`Bidi_Mirrored`</td>
 45 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Bidi_Mirrored">`Bidi_Mirrored`</a></td>
 46 |     </tr>
 47 |     <tr>
 48 |       <td>`Bidi_M`</td>
 49 |     </tr>
 50 |     <tr>
 51 |       <td>`Case_Ignorable`</td>
 52 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Case_Ignorable">`Case_Ignorable`</a></td>
 53 |     </tr>
 54 |     <tr>
 55 |       <td>`CI`</td>
 56 |     </tr>
 57 |     <tr>
 58 |       <td>`Cased`</td>
 59 |       <td><a href="https://unicode.org/reports/tr44/#Cased">`Cased`</a></td>
 60 |     </tr>
 61 |     <tr>
 62 |       <td>`Changes_When_Casefolded`</td>
 63 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#CWCF">`Changes_When_Casefolded`</a></td>
 64 |     </tr>
 65 |     <tr>
 66 |       <td>`CWCF`</td>
 67 |     </tr>
 68 |     <tr>
 69 |       <td>`Changes_When_Casemapped`</td>
 70 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#CWCM">`Changes_When_Casemapped`</a></td>
 71 |     </tr>
 72 |     <tr>
 73 |       <td>`CWCM`</td>
 74 |     </tr>
 75 |     <tr>
 76 |       <td>`Changes_When_Lowercased`</td>
 77 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#CWL">`Changes_When_Lowercased`</a></td>
 78 |     </tr>
 79 |     <tr>
 80 |       <td>`CWL`</td>
 81 |     </tr>
 82 |     <tr>
 83 |       <td>`Changes_When_NFKC_Casefolded`</td>
 84 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#CWKCF">`Changes_When_NFKC_Casefolded`</a></td>
 85 |     </tr>
 86 |     <tr>
 87 |       <td>`CWKCF`</td>
 88 |     </tr>
 89 |     <tr>
 90 |       <td>`Changes_When_Titlecased`</td>
 91 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#CWT">`Changes_When_Titlecased`</a></td>
 92 |     </tr>
 93 |     <tr>
 94 |       <td>`CWT`</td>
 95 |     </tr>
 96 |     <tr>
 97 |       <td>`Changes_When_Uppercased`</td>
 98 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#CWU">`Changes_When_Uppercased`</a></td>
 99 |     </tr>
100 |     <tr>
101 |       <td>`CWU`</td>
102 |     </tr>
103 |     <tr>
104 |       <td>`Dash`</td>
105 |       <td><a href="https://unicode.org/reports/tr44/#Dash">`Dash`</a></td>
106 |     </tr>
107 |     <tr>
108 |       <td>`Default_Ignorable_Code_Point`</td>
109 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Default_Ignorable_Code_Point">`Default_Ignorable_Code_Point`</a></td>
110 |     </tr>
111 |     <tr>
112 |       <td>`DI`</td>
113 |     </tr>
114 |     <tr>
115 |       <td>`Deprecated`</td>
116 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Deprecated">`Deprecated`</a></td>
117 |     </tr>
118 |     <tr>
119 |       <td>`Dep`</td>
120 |     </tr>
121 |     <tr>
122 |       <td>`Diacritic`</td>
123 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Diacritic">`Diacritic`</a></td>
124 |     </tr>
125 |     <tr>
126 |       <td>`Dia`</td>
127 |     </tr>
128 |     <tr>
129 |       <td>`Emoji`</td>
130 |       <td><a href="https://unicode.org/reports/tr51/#Emoji_Properties">`Emoji`</a></td>
131 |     </tr>
132 |     <tr>
133 |       <td>`Emoji_Component`</td>
134 |       <td rowspan="2"><a href="https://unicode.org/reports/tr51/#Emoji_Properties">`Emoji_Component`</a></td>
135 |     </tr>
136 |     <tr>
137 |       <td>`EComp`</td>
138 |     </tr>
139 |     <tr>
140 |       <td>`Emoji_Modifier`</td>
141 |       <td rowspan="2"><a href="https://unicode.org/reports/tr51/#Emoji_Properties">`Emoji_Modifier`</a></td>
142 |     </tr>
143 |     <tr>
144 |       <td>`EMod`</td>
145 |     </tr>
146 |     <tr>
147 |       <td>`Emoji_Modifier_Base`</td>
148 |       <td rowspan="2"><a href="https://unicode.org/reports/tr51/#Emoji_Properties">`Emoji_Modifier_Base`</a></td>
149 |     </tr>
150 |     <tr>
151 |       <td>`EBase`</td>
152 |     </tr>
153 |     <tr>
154 |       <td>`Emoji_Presentation`</td>
155 |       <td rowspan="2"><a href="https://unicode.org/reports/tr51/#Emoji_Properties">`Emoji_Presentation`</a></td>
156 |     </tr>
157 |     <tr>
158 |       <td>`EPres`</td>
159 |     </tr>
160 |     <tr>
161 |       <td>`Extended_Pictographic`</td>
162 |       <td rowspan="2"><a href="https://unicode.org/reports/tr51/#Emoji_Properties">`Extended_Pictographic`</a></td>
163 |     </tr>
164 |     <tr>
165 |       <td>`ExtPict`</td>
166 |     </tr>
167 |     <tr>
168 |       <td>`Extender`</td>
169 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Extender">`Extender`</a></td>
170 |     </tr>
171 |     <tr>
172 |       <td>`Ext`</td>
173 |     </tr>
174 |     <tr>
175 |       <td>`Grapheme_Base`</td>
176 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Grapheme_Base">`Grapheme_Base`</a></td>
177 |     </tr>
178 |     <tr>
179 |       <td>`Gr_Base`</td>
180 |     </tr>
181 |     <tr>
182 |       <td>`Grapheme_Extend`</td>
183 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Grapheme_Extend">`Grapheme_Extend`</a></td>
184 |     </tr>
185 |     <tr>
186 |       <td>`Gr_Ext`</td>
187 |     </tr>
188 |     <tr>
189 |       <td>`Hex_Digit`</td>
190 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Hex_Digit">`Hex_Digit`</a></td>
191 |     </tr>
192 |     <tr>
193 |       <td>`Hex`</td>
194 |     </tr>
195 |     <tr>
196 |       <td>`IDS_Binary_Operator`</td>
197 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#IDS_Binary_Operator">`IDS_Binary_Operator`</a></td>
198 |     </tr>
199 |     <tr>
200 |       <td>`IDSB`</td>
201 |     </tr>
202 |     <tr>
203 |       <td>`IDS_Trinary_Operator`</td>
204 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#IDS_Trinary_Operator">`IDS_Trinary_Operator`</a></td>
205 |     </tr>
206 |     <tr>
207 |       <td>`IDST`</td>
208 |     </tr>
209 |     <tr>
210 |       <td>`ID_Continue`</td>
211 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#ID_Continue">`ID_Continue`</a></td>
212 |     </tr>
213 |     <tr>
214 |       <td>`IDC`</td>
215 |     </tr>
216 |     <tr>
217 |       <td>`ID_Start`</td>
218 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#ID_Start">`ID_Start`</a></td>
219 |     </tr>
220 |     <tr>
221 |       <td>`IDS`</td>
222 |     </tr>
223 |     <tr>
224 |       <td>`Ideographic`</td>
225 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Ideographic">`Ideographic`</a></td>
226 |     </tr>
227 |     <tr>
228 |       <td>`Ideo`</td>
229 |     </tr>
230 |     <tr>
231 |       <td>`Join_Control`</td>
232 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Join_Control">`Join_Control`</a></td>
233 |     </tr>
234 |     <tr>
235 |       <td>`Join_C`</td>
236 |     </tr>
237 |     <tr>
238 |       <td>`Logical_Order_Exception`</td>
239 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Logical_Order_Exception">`Logical_Order_Exception`</a></td>
240 |     </tr>
241 |     <tr>
242 |       <td>`LOE`</td>
243 |     </tr>
244 |     <tr>
245 |       <td>`Lowercase`</td>
246 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Lowercase">`Lowercase`</a></td>
247 |     </tr>
248 |     <tr>
249 |       <td>`Lower`</td>
250 |     </tr>
251 |     <tr>
252 |       <td>`Math`</td>
253 |       <td><a href="https://unicode.org/reports/tr44/#Math">`Math`</a></td>
254 |     </tr>
255 |     <tr>
256 |       <td>`Noncharacter_Code_Point`</td>
257 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Noncharacter_Code_Point">`Noncharacter_Code_Point`</a></td>
258 |     </tr>
259 |     <tr>
260 |       <td>`NChar`</td>
261 |     </tr>
262 |     <tr>
263 |       <td>`Pattern_Syntax`</td>
264 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Pattern_Syntax">`Pattern_Syntax`</a></td>
265 |     </tr>
266 |     <tr>
267 |       <td>`Pat_Syn`</td>
268 |     </tr>
269 |     <tr>
270 |       <td>`Pattern_White_Space`</td>
271 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Pattern_White_Space">`Pattern_White_Space`</a></td>
272 |     </tr>
273 |     <tr>
274 |       <td>`Pat_WS`</td>
275 |     </tr>
276 |     <tr>
277 |       <td>`Quotation_Mark`</td>
278 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Quotation_Mark">`Quotation_Mark`</a></td>
279 |     </tr>
280 |     <tr>
281 |       <td>`QMark`</td>
282 |     </tr>
283 |     <tr>
284 |       <td>`Radical`</td>
285 |       <td><a href="https://unicode.org/reports/tr44/#Radical">`Radical`</a></td>
286 |     </tr>
287 |     <tr>
288 |       <td>`Regional_Indicator`</td>
289 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Regional_Indicator">`Regional_Indicator`</a></td>
290 |     </tr>
291 |     <tr>
292 |       <td>`RI`</td>
293 |     </tr>
294 |     <tr>
295 |       <td>`Sentence_Terminal`</td>
296 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#STerm">`Sentence_Terminal`</a></td>
297 |     </tr>
298 |     <tr>
299 |       <td>`STerm`</td>
300 |     </tr>
301 |     <tr>
302 |       <td>`Soft_Dotted`</td>
303 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Soft_Dotted">`Soft_Dotted`</a></td>
304 |     </tr>
305 |     <tr>
306 |       <td>`SD`</td>
307 |     </tr>
308 |     <tr>
309 |       <td>`Terminal_Punctuation`</td>
310 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Terminal_Punctuation">`Terminal_Punctuation`</a></td>
311 |     </tr>
312 |     <tr>
313 |       <td>`Term`</td>
314 |     </tr>
315 |     <tr>
316 |       <td>`Unified_Ideograph`</td>
317 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Unified_Ideograph">`Unified_Ideograph`</a></td>
318 |     </tr>
319 |     <tr>
320 |       <td>`UIdeo`</td>
321 |     </tr>
322 |     <tr>
323 |       <td>`Uppercase`</td>
324 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Uppercase">`Uppercase`</a></td>
325 |     </tr>
326 |     <tr>
327 |       <td>`Upper`</td>
328 |     </tr>
329 |     <tr>
330 |       <td>`Variation_Selector`</td>
331 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#Variation_Selector">`Variation_Selector`</a></td>
332 |     </tr>
333 |     <tr>
334 |       <td>`VS`</td>
335 |     </tr>
336 |     <tr>
337 |       <td>`White_Space`</td>
338 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#White_Space">`White_Space`</a></td>
339 |     </tr>
340 |     <tr>
341 |       <td>`space`</td>
342 |     </tr>
343 |     <tr>
344 |       <td>`XID_Continue`</td>
345 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#XID_Continue">`XID_Continue`</a></td>
346 |     </tr>
347 |     <tr>
348 |       <td>`XIDC`</td>
349 |     </tr>
350 |     <tr>
351 |       <td>`XID_Start`</td>
352 |       <td rowspan="2"><a href="https://unicode.org/reports/tr44/#XID_Start">`XID_Start`</a></td>
353 |     </tr>
354 |     <tr>
355 |       <td>`XIDS`</td>
356 |     </tr>
357 |   </table>
358 | </emu-table>
359 | 


--------------------------------------------------------------------------------
/table-unicode-script-values.html:
--------------------------------------------------------------------------------
   1 | <emu-table id="table-unicode-script-values">
   2 |   <emu-caption>Value aliases and canonical values for the Unicode properties <a href="https://unicode.org/reports/tr24/#Script">`Script`</a> and <a href="https://unicode.org/reports/tr24/#Script_Extensions">`Script_Extensions`</a></emu-caption>
   3 |   <table class="real-table unicode-property-table">
   4 |     <thead>
   5 |       <tr>
   6 |         <th>Property value and aliases</th>
   7 |         <th>Canonical property value</th>
   8 |       </tr>
   9 |     </thead>
  10 |     <tr>
  11 |       <td>`Adlam`</td>
  12 |       <td rowspan="2">`Adlam`</td>
  13 |     </tr>
  14 |     <tr>
  15 |       <td>`Adlm`</td>
  16 |     </tr>
  17 |     <tr>
  18 |       <td>`Ahom`</td>
  19 |       <td>`Ahom`</td>
  20 |     </tr>
  21 |     <tr>
  22 |       <td>`Anatolian_Hieroglyphs`</td>
  23 |       <td rowspan="2">`Anatolian_Hieroglyphs`</td>
  24 |     </tr>
  25 |     <tr>
  26 |       <td>`Hluw`</td>
  27 |     </tr>
  28 |     <tr>
  29 |       <td>`Arabic`</td>
  30 |       <td rowspan="2">`Arabic`</td>
  31 |     </tr>
  32 |     <tr>
  33 |       <td>`Arab`</td>
  34 |     </tr>
  35 |     <tr>
  36 |       <td>`Armenian`</td>
  37 |       <td rowspan="2">`Armenian`</td>
  38 |     </tr>
  39 |     <tr>
  40 |       <td>`Armn`</td>
  41 |     </tr>
  42 |     <tr>
  43 |       <td>`Avestan`</td>
  44 |       <td rowspan="2">`Avestan`</td>
  45 |     </tr>
  46 |     <tr>
  47 |       <td>`Avst`</td>
  48 |     </tr>
  49 |     <tr>
  50 |       <td>`Balinese`</td>
  51 |       <td rowspan="2">`Balinese`</td>
  52 |     </tr>
  53 |     <tr>
  54 |       <td>`Bali`</td>
  55 |     </tr>
  56 |     <tr>
  57 |       <td>`Bamum`</td>
  58 |       <td rowspan="2">`Bamum`</td>
  59 |     </tr>
  60 |     <tr>
  61 |       <td>`Bamu`</td>
  62 |     </tr>
  63 |     <tr>
  64 |       <td>`Bassa_Vah`</td>
  65 |       <td rowspan="2">`Bassa_Vah`</td>
  66 |     </tr>
  67 |     <tr>
  68 |       <td>`Bass`</td>
  69 |     </tr>
  70 |     <tr>
  71 |       <td>`Batak`</td>
  72 |       <td rowspan="2">`Batak`</td>
  73 |     </tr>
  74 |     <tr>
  75 |       <td>`Batk`</td>
  76 |     </tr>
  77 |     <tr>
  78 |       <td>`Bengali`</td>
  79 |       <td rowspan="2">`Bengali`</td>
  80 |     </tr>
  81 |     <tr>
  82 |       <td>`Beng`</td>
  83 |     </tr>
  84 |     <tr>
  85 |       <td>`Bhaiksuki`</td>
  86 |       <td rowspan="2">`Bhaiksuki`</td>
  87 |     </tr>
  88 |     <tr>
  89 |       <td>`Bhks`</td>
  90 |     </tr>
  91 |     <tr>
  92 |       <td>`Bopomofo`</td>
  93 |       <td rowspan="2">`Bopomofo`</td>
  94 |     </tr>
  95 |     <tr>
  96 |       <td>`Bopo`</td>
  97 |     </tr>
  98 |     <tr>
  99 |       <td>`Brahmi`</td>
 100 |       <td rowspan="2">`Brahmi`</td>
 101 |     </tr>
 102 |     <tr>
 103 |       <td>`Brah`</td>
 104 |     </tr>
 105 |     <tr>
 106 |       <td>`Braille`</td>
 107 |       <td rowspan="2">`Braille`</td>
 108 |     </tr>
 109 |     <tr>
 110 |       <td>`Brai`</td>
 111 |     </tr>
 112 |     <tr>
 113 |       <td>`Buginese`</td>
 114 |       <td rowspan="2">`Buginese`</td>
 115 |     </tr>
 116 |     <tr>
 117 |       <td>`Bugi`</td>
 118 |     </tr>
 119 |     <tr>
 120 |       <td>`Buhid`</td>
 121 |       <td rowspan="2">`Buhid`</td>
 122 |     </tr>
 123 |     <tr>
 124 |       <td>`Buhd`</td>
 125 |     </tr>
 126 |     <tr>
 127 |       <td>`Canadian_Aboriginal`</td>
 128 |       <td rowspan="2">`Canadian_Aboriginal`</td>
 129 |     </tr>
 130 |     <tr>
 131 |       <td>`Cans`</td>
 132 |     </tr>
 133 |     <tr>
 134 |       <td>`Carian`</td>
 135 |       <td rowspan="2">`Carian`</td>
 136 |     </tr>
 137 |     <tr>
 138 |       <td>`Cari`</td>
 139 |     </tr>
 140 |     <tr>
 141 |       <td>`Caucasian_Albanian`</td>
 142 |       <td rowspan="2">`Caucasian_Albanian`</td>
 143 |     </tr>
 144 |     <tr>
 145 |       <td>`Aghb`</td>
 146 |     </tr>
 147 |     <tr>
 148 |       <td>`Chakma`</td>
 149 |       <td rowspan="2">`Chakma`</td>
 150 |     </tr>
 151 |     <tr>
 152 |       <td>`Cakm`</td>
 153 |     </tr>
 154 |     <tr>
 155 |       <td>`Cham`</td>
 156 |       <td>`Cham`</td>
 157 |     </tr>
 158 |     <tr>
 159 |       <td>`Chorasmian`</td>
 160 |       <td rowspan="2">`Chorasmian`</td>
 161 |     </tr>
 162 |     <tr>
 163 |       <td>`Chrs`</td>
 164 |     </tr>
 165 |     <tr>
 166 |       <td>`Cherokee`</td>
 167 |       <td rowspan="2">`Cherokee`</td>
 168 |     </tr>
 169 |     <tr>
 170 |       <td>`Cher`</td>
 171 |     </tr>
 172 |     <tr>
 173 |       <td>`Common`</td>
 174 |       <td rowspan="2">`Common`</td>
 175 |     </tr>
 176 |     <tr>
 177 |       <td>`Zyyy`</td>
 178 |     </tr>
 179 |     <tr>
 180 |       <td>`Coptic`</td>
 181 |       <td rowspan="3">`Coptic`</td>
 182 |     </tr>
 183 |     <tr>
 184 |       <td>`Copt`</td>
 185 |     </tr>
 186 |     <tr>
 187 |       <td>`Qaac`</td>
 188 |     </tr>
 189 |     <tr>
 190 |       <td>`Cuneiform`</td>
 191 |       <td rowspan="2">`Cuneiform`</td>
 192 |     </tr>
 193 |     <tr>
 194 |       <td>`Xsux`</td>
 195 |     </tr>
 196 |     <tr>
 197 |       <td>`Cypriot`</td>
 198 |       <td rowspan="2">`Cypriot`</td>
 199 |     </tr>
 200 |     <tr>
 201 |       <td>`Cprt`</td>
 202 |     </tr>
 203 |     <tr>
 204 |       <td>`Cyrillic`</td>
 205 |       <td rowspan="2">`Cyrillic`</td>
 206 |     </tr>
 207 |     <tr>
 208 |       <td>`Cyrl`</td>
 209 |     </tr>
 210 |     <tr>
 211 |       <td>`Deseret`</td>
 212 |       <td rowspan="2">`Deseret`</td>
 213 |     </tr>
 214 |     <tr>
 215 |       <td>`Dsrt`</td>
 216 |     </tr>
 217 |     <tr>
 218 |       <td>`Devanagari`</td>
 219 |       <td rowspan="2">`Devanagari`</td>
 220 |     </tr>
 221 |     <tr>
 222 |       <td>`Deva`</td>
 223 |     </tr>
 224 |     <tr>
 225 |       <td>`Dives_Akuru`</td>
 226 |       <td rowspan="2">`Dives_Akuru`</td>
 227 |     </tr>
 228 |     <tr>
 229 |       <td>`Diak`</td>
 230 |     </tr>
 231 |     <tr>
 232 |       <td>`Dogra`</td>
 233 |       <td rowspan="2">`Dogra`</td>
 234 |     </tr>
 235 |     <tr>
 236 |       <td>`Dogr`</td>
 237 |     </tr>
 238 |     <tr>
 239 |       <td>`Duployan`</td>
 240 |       <td rowspan="2">`Duployan`</td>
 241 |     </tr>
 242 |     <tr>
 243 |       <td>`Dupl`</td>
 244 |     </tr>
 245 |     <tr>
 246 |       <td>`Egyptian_Hieroglyphs`</td>
 247 |       <td rowspan="2">`Egyptian_Hieroglyphs`</td>
 248 |     </tr>
 249 |     <tr>
 250 |       <td>`Egyp`</td>
 251 |     </tr>
 252 |     <tr>
 253 |       <td>`Elbasan`</td>
 254 |       <td rowspan="2">`Elbasan`</td>
 255 |     </tr>
 256 |     <tr>
 257 |       <td>`Elba`</td>
 258 |     </tr>
 259 |     <tr>
 260 |       <td>`Elymaic`</td>
 261 |       <td rowspan="2">`Elymaic`</td>
 262 |     </tr>
 263 |     <tr>
 264 |       <td>`Elym`</td>
 265 |     </tr>
 266 |     <tr>
 267 |       <td>`Ethiopic`</td>
 268 |       <td rowspan="2">`Ethiopic`</td>
 269 |     </tr>
 270 |     <tr>
 271 |       <td>`Ethi`</td>
 272 |     </tr>
 273 |     <tr>
 274 |       <td>`Georgian`</td>
 275 |       <td rowspan="2">`Georgian`</td>
 276 |     </tr>
 277 |     <tr>
 278 |       <td>`Geor`</td>
 279 |     </tr>
 280 |     <tr>
 281 |       <td>`Glagolitic`</td>
 282 |       <td rowspan="2">`Glagolitic`</td>
 283 |     </tr>
 284 |     <tr>
 285 |       <td>`Glag`</td>
 286 |     </tr>
 287 |     <tr>
 288 |       <td>`Gothic`</td>
 289 |       <td rowspan="2">`Gothic`</td>
 290 |     </tr>
 291 |     <tr>
 292 |       <td>`Goth`</td>
 293 |     </tr>
 294 |     <tr>
 295 |       <td>`Grantha`</td>
 296 |       <td rowspan="2">`Grantha`</td>
 297 |     </tr>
 298 |     <tr>
 299 |       <td>`Gran`</td>
 300 |     </tr>
 301 |     <tr>
 302 |       <td>`Greek`</td>
 303 |       <td rowspan="2">`Greek`</td>
 304 |     </tr>
 305 |     <tr>
 306 |       <td>`Grek`</td>
 307 |     </tr>
 308 |     <tr>
 309 |       <td>`Gujarati`</td>
 310 |       <td rowspan="2">`Gujarati`</td>
 311 |     </tr>
 312 |     <tr>
 313 |       <td>`Gujr`</td>
 314 |     </tr>
 315 |     <tr>
 316 |       <td>`Gunjala_Gondi`</td>
 317 |       <td rowspan="2">`Gunjala_Gondi`</td>
 318 |     </tr>
 319 |     <tr>
 320 |       <td>`Gong`</td>
 321 |     </tr>
 322 |     <tr>
 323 |       <td>`Gurmukhi`</td>
 324 |       <td rowspan="2">`Gurmukhi`</td>
 325 |     </tr>
 326 |     <tr>
 327 |       <td>`Guru`</td>
 328 |     </tr>
 329 |     <tr>
 330 |       <td>`Han`</td>
 331 |       <td rowspan="2">`Han`</td>
 332 |     </tr>
 333 |     <tr>
 334 |       <td>`Hani`</td>
 335 |     </tr>
 336 |     <tr>
 337 |       <td>`Hangul`</td>
 338 |       <td rowspan="2">`Hangul`</td>
 339 |     </tr>
 340 |     <tr>
 341 |       <td>`Hang`</td>
 342 |     </tr>
 343 |     <tr>
 344 |       <td>`Hanifi_Rohingya`</td>
 345 |       <td rowspan="2">`Hanifi_Rohingya`</td>
 346 |     </tr>
 347 |     <tr>
 348 |       <td>`Rohg`</td>
 349 |     </tr>
 350 |     <tr>
 351 |       <td>`Hanunoo`</td>
 352 |       <td rowspan="2">`Hanunoo`</td>
 353 |     </tr>
 354 |     <tr>
 355 |       <td>`Hano`</td>
 356 |     </tr>
 357 |     <tr>
 358 |       <td>`Hatran`</td>
 359 |       <td rowspan="2">`Hatran`</td>
 360 |     </tr>
 361 |     <tr>
 362 |       <td>`Hatr`</td>
 363 |     </tr>
 364 |     <tr>
 365 |       <td>`Hebrew`</td>
 366 |       <td rowspan="2">`Hebrew`</td>
 367 |     </tr>
 368 |     <tr>
 369 |       <td>`Hebr`</td>
 370 |     </tr>
 371 |     <tr>
 372 |       <td>`Hiragana`</td>
 373 |       <td rowspan="2">`Hiragana`</td>
 374 |     </tr>
 375 |     <tr>
 376 |       <td>`Hira`</td>
 377 |     </tr>
 378 |     <tr>
 379 |       <td>`Imperial_Aramaic`</td>
 380 |       <td rowspan="2">`Imperial_Aramaic`</td>
 381 |     </tr>
 382 |     <tr>
 383 |       <td>`Armi`</td>
 384 |     </tr>
 385 |     <tr>
 386 |       <td>`Inherited`</td>
 387 |       <td rowspan="3">`Inherited`</td>
 388 |     </tr>
 389 |     <tr>
 390 |       <td>`Zinh`</td>
 391 |     </tr>
 392 |     <tr>
 393 |       <td>`Qaai`</td>
 394 |     </tr>
 395 |     <tr>
 396 |       <td>`Inscriptional_Pahlavi`</td>
 397 |       <td rowspan="2">`Inscriptional_Pahlavi`</td>
 398 |     </tr>
 399 |     <tr>
 400 |       <td>`Phli`</td>
 401 |     </tr>
 402 |     <tr>
 403 |       <td>`Inscriptional_Parthian`</td>
 404 |       <td rowspan="2">`Inscriptional_Parthian`</td>
 405 |     </tr>
 406 |     <tr>
 407 |       <td>`Prti`</td>
 408 |     </tr>
 409 |     <tr>
 410 |       <td>`Javanese`</td>
 411 |       <td rowspan="2">`Javanese`</td>
 412 |     </tr>
 413 |     <tr>
 414 |       <td>`Java`</td>
 415 |     </tr>
 416 |     <tr>
 417 |       <td>`Kaithi`</td>
 418 |       <td rowspan="2">`Kaithi`</td>
 419 |     </tr>
 420 |     <tr>
 421 |       <td>`Kthi`</td>
 422 |     </tr>
 423 |     <tr>
 424 |       <td>`Kannada`</td>
 425 |       <td rowspan="2">`Kannada`</td>
 426 |     </tr>
 427 |     <tr>
 428 |       <td>`Knda`</td>
 429 |     </tr>
 430 |     <tr>
 431 |       <td>`Katakana`</td>
 432 |       <td rowspan="2">`Katakana`</td>
 433 |     </tr>
 434 |     <tr>
 435 |       <td>`Kana`</td>
 436 |     </tr>
 437 |     <tr>
 438 |       <td>`Kayah_Li`</td>
 439 |       <td rowspan="2">`Kayah_Li`</td>
 440 |     </tr>
 441 |     <tr>
 442 |       <td>`Kali`</td>
 443 |     </tr>
 444 |     <tr>
 445 |       <td>`Kharoshthi`</td>
 446 |       <td rowspan="2">`Kharoshthi`</td>
 447 |     </tr>
 448 |     <tr>
 449 |       <td>`Khar`</td>
 450 |     </tr>
 451 |     <tr>
 452 |       <td>`Khitan_Small_Script`</td>
 453 |       <td rowspan="2">`Khitan_Small_Script`</td>
 454 |     </tr>
 455 |     <tr>
 456 |       <td>`Kits`</td>
 457 |     </tr>
 458 |     <tr>
 459 |       <td>`Khmer`</td>
 460 |       <td rowspan="2">`Khmer`</td>
 461 |     </tr>
 462 |     <tr>
 463 |       <td>`Khmr`</td>
 464 |     </tr>
 465 |     <tr>
 466 |       <td>`Khojki`</td>
 467 |       <td rowspan="2">`Khojki`</td>
 468 |     </tr>
 469 |     <tr>
 470 |       <td>`Khoj`</td>
 471 |     </tr>
 472 |     <tr>
 473 |       <td>`Khudawadi`</td>
 474 |       <td rowspan="2">`Khudawadi`</td>
 475 |     </tr>
 476 |     <tr>
 477 |       <td>`Sind`</td>
 478 |     </tr>
 479 |     <tr>
 480 |       <td>`Lao`</td>
 481 |       <td rowspan="2">`Lao`</td>
 482 |     </tr>
 483 |     <tr>
 484 |       <td>`Laoo`</td>
 485 |     </tr>
 486 |     <tr>
 487 |       <td>`Latin`</td>
 488 |       <td rowspan="2">`Latin`</td>
 489 |     </tr>
 490 |     <tr>
 491 |       <td>`Latn`</td>
 492 |     </tr>
 493 |     <tr>
 494 |       <td>`Lepcha`</td>
 495 |       <td rowspan="2">`Lepcha`</td>
 496 |     </tr>
 497 |     <tr>
 498 |       <td>`Lepc`</td>
 499 |     </tr>
 500 |     <tr>
 501 |       <td>`Limbu`</td>
 502 |       <td rowspan="2">`Limbu`</td>
 503 |     </tr>
 504 |     <tr>
 505 |       <td>`Limb`</td>
 506 |     </tr>
 507 |     <tr>
 508 |       <td>`Linear_A`</td>
 509 |       <td rowspan="2">`Linear_A`</td>
 510 |     </tr>
 511 |     <tr>
 512 |       <td>`Lina`</td>
 513 |     </tr>
 514 |     <tr>
 515 |       <td>`Linear_B`</td>
 516 |       <td rowspan="2">`Linear_B`</td>
 517 |     </tr>
 518 |     <tr>
 519 |       <td>`Linb`</td>
 520 |     </tr>
 521 |     <tr>
 522 |       <td>`Lisu`</td>
 523 |       <td>`Lisu`</td>
 524 |     </tr>
 525 |     <tr>
 526 |       <td>`Lycian`</td>
 527 |       <td rowspan="2">`Lycian`</td>
 528 |     </tr>
 529 |     <tr>
 530 |       <td>`Lyci`</td>
 531 |     </tr>
 532 |     <tr>
 533 |       <td>`Lydian`</td>
 534 |       <td rowspan="2">`Lydian`</td>
 535 |     </tr>
 536 |     <tr>
 537 |       <td>`Lydi`</td>
 538 |     </tr>
 539 |     <tr>
 540 |       <td>`Mahajani`</td>
 541 |       <td rowspan="2">`Mahajani`</td>
 542 |     </tr>
 543 |     <tr>
 544 |       <td>`Mahj`</td>
 545 |     </tr>
 546 |     <tr>
 547 |       <td>`Makasar`</td>
 548 |       <td rowspan="2">`Makasar`</td>
 549 |     </tr>
 550 |     <tr>
 551 |       <td>`Maka`</td>
 552 |     </tr>
 553 |     <tr>
 554 |       <td>`Malayalam`</td>
 555 |       <td rowspan="2">`Malayalam`</td>
 556 |     </tr>
 557 |     <tr>
 558 |       <td>`Mlym`</td>
 559 |     </tr>
 560 |     <tr>
 561 |       <td>`Mandaic`</td>
 562 |       <td rowspan="2">`Mandaic`</td>
 563 |     </tr>
 564 |     <tr>
 565 |       <td>`Mand`</td>
 566 |     </tr>
 567 |     <tr>
 568 |       <td>`Manichaean`</td>
 569 |       <td rowspan="2">`Manichaean`</td>
 570 |     </tr>
 571 |     <tr>
 572 |       <td>`Mani`</td>
 573 |     </tr>
 574 |     <tr>
 575 |       <td>`Marchen`</td>
 576 |       <td rowspan="2">`Marchen`</td>
 577 |     </tr>
 578 |     <tr>
 579 |       <td>`Marc`</td>
 580 |     </tr>
 581 |     <tr>
 582 |       <td>`Medefaidrin`</td>
 583 |       <td rowspan="2">`Medefaidrin`</td>
 584 |     </tr>
 585 |     <tr>
 586 |       <td>`Medf`</td>
 587 |     </tr>
 588 |     <tr>
 589 |       <td>`Masaram_Gondi`</td>
 590 |       <td rowspan="2">`Masaram_Gondi`</td>
 591 |     </tr>
 592 |     <tr>
 593 |       <td>`Gonm`</td>
 594 |     </tr>
 595 |     <tr>
 596 |       <td>`Meetei_Mayek`</td>
 597 |       <td rowspan="2">`Meetei_Mayek`</td>
 598 |     </tr>
 599 |     <tr>
 600 |       <td>`Mtei`</td>
 601 |     </tr>
 602 |     <tr>
 603 |       <td>`Mende_Kikakui`</td>
 604 |       <td rowspan="2">`Mende_Kikakui`</td>
 605 |     </tr>
 606 |     <tr>
 607 |       <td>`Mend`</td>
 608 |     </tr>
 609 |     <tr>
 610 |       <td>`Meroitic_Cursive`</td>
 611 |       <td rowspan="2">`Meroitic_Cursive`</td>
 612 |     </tr>
 613 |     <tr>
 614 |       <td>`Merc`</td>
 615 |     </tr>
 616 |     <tr>
 617 |       <td>`Meroitic_Hieroglyphs`</td>
 618 |       <td rowspan="2">`Meroitic_Hieroglyphs`</td>
 619 |     </tr>
 620 |     <tr>
 621 |       <td>`Mero`</td>
 622 |     </tr>
 623 |     <tr>
 624 |       <td>`Miao`</td>
 625 |       <td rowspan="2">`Miao`</td>
 626 |     </tr>
 627 |     <tr>
 628 |       <td>`Plrd`</td>
 629 |     </tr>
 630 |     <tr>
 631 |       <td>`Modi`</td>
 632 |       <td>`Modi`</td>
 633 |     </tr>
 634 |     <tr>
 635 |       <td>`Mongolian`</td>
 636 |       <td rowspan="2">`Mongolian`</td>
 637 |     </tr>
 638 |     <tr>
 639 |       <td>`Mong`</td>
 640 |     </tr>
 641 |     <tr>
 642 |       <td>`Mro`</td>
 643 |       <td rowspan="2">`Mro`</td>
 644 |     </tr>
 645 |     <tr>
 646 |       <td>`Mroo`</td>
 647 |     </tr>
 648 |     <tr>
 649 |       <td>`Multani`</td>
 650 |       <td rowspan="2">`Multani`</td>
 651 |     </tr>
 652 |     <tr>
 653 |       <td>`Mult`</td>
 654 |     </tr>
 655 |     <tr>
 656 |       <td>`Myanmar`</td>
 657 |       <td rowspan="2">`Myanmar`</td>
 658 |     </tr>
 659 |     <tr>
 660 |       <td>`Mymr`</td>
 661 |     </tr>
 662 |     <tr>
 663 |       <td>`Nabataean`</td>
 664 |       <td rowspan="2">`Nabataean`</td>
 665 |     </tr>
 666 |     <tr>
 667 |       <td>`Nbat`</td>
 668 |     </tr>
 669 |     <tr>
 670 |       <td>`Nandinagari`</td>
 671 |       <td rowspan="2">`Nandinagari`</td>
 672 |     </tr>
 673 |     <tr>
 674 |       <td>`Nand`</td>
 675 |     </tr>
 676 |     <tr>
 677 |       <td>`New_Tai_Lue`</td>
 678 |       <td rowspan="2">`New_Tai_Lue`</td>
 679 |     </tr>
 680 |     <tr>
 681 |       <td>`Talu`</td>
 682 |     </tr>
 683 |     <tr>
 684 |       <td>`Newa`</td>
 685 |       <td>`Newa`</td>
 686 |     </tr>
 687 |     <tr>
 688 |       <td>`Nko`</td>
 689 |       <td rowspan="2">`Nko`</td>
 690 |     </tr>
 691 |     <tr>
 692 |       <td>`Nkoo`</td>
 693 |     </tr>
 694 |     <tr>
 695 |       <td>`Nushu`</td>
 696 |       <td rowspan="2">`Nushu`</td>
 697 |     </tr>
 698 |     <tr>
 699 |       <td>`Nshu`</td>
 700 |     </tr>
 701 |     <tr>
 702 |       <td>`Nyiakeng_Puachue_Hmong`</td>
 703 |       <td rowspan="2">`Nyiakeng_Puachue_Hmong`</td>
 704 |     </tr>
 705 |     <tr>
 706 |       <td>`Hmnp`</td>
 707 |     </tr>
 708 |     <tr>
 709 |       <td>`Ogham`</td>
 710 |       <td rowspan="2">`Ogham`</td>
 711 |     </tr>
 712 |     <tr>
 713 |       <td>`Ogam`</td>
 714 |     </tr>
 715 |     <tr>
 716 |       <td>`Ol_Chiki`</td>
 717 |       <td rowspan="2">`Ol_Chiki`</td>
 718 |     </tr>
 719 |     <tr>
 720 |       <td>`Olck`</td>
 721 |     </tr>
 722 |     <tr>
 723 |       <td>`Old_Hungarian`</td>
 724 |       <td rowspan="2">`Old_Hungarian`</td>
 725 |     </tr>
 726 |     <tr>
 727 |       <td>`Hung`</td>
 728 |     </tr>
 729 |     <tr>
 730 |       <td>`Old_Italic`</td>
 731 |       <td rowspan="2">`Old_Italic`</td>
 732 |     </tr>
 733 |     <tr>
 734 |       <td>`Ital`</td>
 735 |     </tr>
 736 |     <tr>
 737 |       <td>`Old_North_Arabian`</td>
 738 |       <td rowspan="2">`Old_North_Arabian`</td>
 739 |     </tr>
 740 |     <tr>
 741 |       <td>`Narb`</td>
 742 |     </tr>
 743 |     <tr>
 744 |       <td>`Old_Permic`</td>
 745 |       <td rowspan="2">`Old_Permic`</td>
 746 |     </tr>
 747 |     <tr>
 748 |       <td>`Perm`</td>
 749 |     </tr>
 750 |     <tr>
 751 |       <td>`Old_Persian`</td>
 752 |       <td rowspan="2">`Old_Persian`</td>
 753 |     </tr>
 754 |     <tr>
 755 |       <td>`Xpeo`</td>
 756 |     </tr>
 757 |     <tr>
 758 |       <td>`Old_Sogdian`</td>
 759 |       <td rowspan="2">`Old_Sogdian`</td>
 760 |     </tr>
 761 |     <tr>
 762 |       <td>`Sogo`</td>
 763 |     </tr>
 764 |     <tr>
 765 |       <td>`Old_South_Arabian`</td>
 766 |       <td rowspan="2">`Old_South_Arabian`</td>
 767 |     </tr>
 768 |     <tr>
 769 |       <td>`Sarb`</td>
 770 |     </tr>
 771 |     <tr>
 772 |       <td>`Old_Turkic`</td>
 773 |       <td rowspan="2">`Old_Turkic`</td>
 774 |     </tr>
 775 |     <tr>
 776 |       <td>`Orkh`</td>
 777 |     </tr>
 778 |     <tr>
 779 |       <td>`Oriya`</td>
 780 |       <td rowspan="2">`Oriya`</td>
 781 |     </tr>
 782 |     <tr>
 783 |       <td>`Orya`</td>
 784 |     </tr>
 785 |     <tr>
 786 |       <td>`Osage`</td>
 787 |       <td rowspan="2">`Osage`</td>
 788 |     </tr>
 789 |     <tr>
 790 |       <td>`Osge`</td>
 791 |     </tr>
 792 |     <tr>
 793 |       <td>`Osmanya`</td>
 794 |       <td rowspan="2">`Osmanya`</td>
 795 |     </tr>
 796 |     <tr>
 797 |       <td>`Osma`</td>
 798 |     </tr>
 799 |     <tr>
 800 |       <td>`Pahawh_Hmong`</td>
 801 |       <td rowspan="2">`Pahawh_Hmong`</td>
 802 |     </tr>
 803 |     <tr>
 804 |       <td>`Hmng`</td>
 805 |     </tr>
 806 |     <tr>
 807 |       <td>`Palmyrene`</td>
 808 |       <td rowspan="2">`Palmyrene`</td>
 809 |     </tr>
 810 |     <tr>
 811 |       <td>`Palm`</td>
 812 |     </tr>
 813 |     <tr>
 814 |       <td>`Pau_Cin_Hau`</td>
 815 |       <td rowspan="2">`Pau_Cin_Hau`</td>
 816 |     </tr>
 817 |     <tr>
 818 |       <td>`Pauc`</td>
 819 |     </tr>
 820 |     <tr>
 821 |       <td>`Phags_Pa`</td>
 822 |       <td rowspan="2">`Phags_Pa`</td>
 823 |     </tr>
 824 |     <tr>
 825 |       <td>`Phag`</td>
 826 |     </tr>
 827 |     <tr>
 828 |       <td>`Phoenician`</td>
 829 |       <td rowspan="2">`Phoenician`</td>
 830 |     </tr>
 831 |     <tr>
 832 |       <td>`Phnx`</td>
 833 |     </tr>
 834 |     <tr>
 835 |       <td>`Psalter_Pahlavi`</td>
 836 |       <td rowspan="2">`Psalter_Pahlavi`</td>
 837 |     </tr>
 838 |     <tr>
 839 |       <td>`Phlp`</td>
 840 |     </tr>
 841 |     <tr>
 842 |       <td>`Rejang`</td>
 843 |       <td rowspan="2">`Rejang`</td>
 844 |     </tr>
 845 |     <tr>
 846 |       <td>`Rjng`</td>
 847 |     </tr>
 848 |     <tr>
 849 |       <td>`Runic`</td>
 850 |       <td rowspan="2">`Runic`</td>
 851 |     </tr>
 852 |     <tr>
 853 |       <td>`Runr`</td>
 854 |     </tr>
 855 |     <tr>
 856 |       <td>`Samaritan`</td>
 857 |       <td rowspan="2">`Samaritan`</td>
 858 |     </tr>
 859 |     <tr>
 860 |       <td>`Samr`</td>
 861 |     </tr>
 862 |     <tr>
 863 |       <td>`Saurashtra`</td>
 864 |       <td rowspan="2">`Saurashtra`</td>
 865 |     </tr>
 866 |     <tr>
 867 |       <td>`Saur`</td>
 868 |     </tr>
 869 |     <tr>
 870 |       <td>`Sharada`</td>
 871 |       <td rowspan="2">`Sharada`</td>
 872 |     </tr>
 873 |     <tr>
 874 |       <td>`Shrd`</td>
 875 |     </tr>
 876 |     <tr>
 877 |       <td>`Shavian`</td>
 878 |       <td rowspan="2">`Shavian`</td>
 879 |     </tr>
 880 |     <tr>
 881 |       <td>`Shaw`</td>
 882 |     </tr>
 883 |     <tr>
 884 |       <td>`Siddham`</td>
 885 |       <td rowspan="2">`Siddham`</td>
 886 |     </tr>
 887 |     <tr>
 888 |       <td>`Sidd`</td>
 889 |     </tr>
 890 |     <tr>
 891 |       <td>`SignWriting`</td>
 892 |       <td rowspan="2">`SignWriting`</td>
 893 |     </tr>
 894 |     <tr>
 895 |       <td>`Sgnw`</td>
 896 |     </tr>
 897 |     <tr>
 898 |       <td>`Sinhala`</td>
 899 |       <td rowspan="2">`Sinhala`</td>
 900 |     </tr>
 901 |     <tr>
 902 |       <td>`Sinh`</td>
 903 |     </tr>
 904 |     <tr>
 905 |       <td>`Sogdian`</td>
 906 |       <td rowspan="2">`Sogdian`</td>
 907 |     </tr>
 908 |     <tr>
 909 |       <td>`Sogd`</td>
 910 |     </tr>
 911 |     <tr>
 912 |       <td>`Sora_Sompeng`</td>
 913 |       <td rowspan="2">`Sora_Sompeng`</td>
 914 |     </tr>
 915 |     <tr>
 916 |       <td>`Sora`</td>
 917 |     </tr>
 918 |     <tr>
 919 |       <td>`Soyombo`</td>
 920 |       <td rowspan="2">`Soyombo`</td>
 921 |     </tr>
 922 |     <tr>
 923 |       <td>`Soyo`</td>
 924 |     </tr>
 925 |     <tr>
 926 |       <td>`Sundanese`</td>
 927 |       <td rowspan="2">`Sundanese`</td>
 928 |     </tr>
 929 |     <tr>
 930 |       <td>`Sund`</td>
 931 |     </tr>
 932 |     <tr>
 933 |       <td>`Syloti_Nagri`</td>
 934 |       <td rowspan="2">`Syloti_Nagri`</td>
 935 |     </tr>
 936 |     <tr>
 937 |       <td>`Sylo`</td>
 938 |     </tr>
 939 |     <tr>
 940 |       <td>`Syriac`</td>
 941 |       <td rowspan="2">`Syriac`</td>
 942 |     </tr>
 943 |     <tr>
 944 |       <td>`Syrc`</td>
 945 |     </tr>
 946 |     <tr>
 947 |       <td>`Tagalog`</td>
 948 |       <td rowspan="2">`Tagalog`</td>
 949 |     </tr>
 950 |     <tr>
 951 |       <td>`Tglg`</td>
 952 |     </tr>
 953 |     <tr>
 954 |       <td>`Tagbanwa`</td>
 955 |       <td rowspan="2">`Tagbanwa`</td>
 956 |     </tr>
 957 |     <tr>
 958 |       <td>`Tagb`</td>
 959 |     </tr>
 960 |     <tr>
 961 |       <td>`Tai_Le`</td>
 962 |       <td rowspan="2">`Tai_Le`</td>
 963 |     </tr>
 964 |     <tr>
 965 |       <td>`Tale`</td>
 966 |     </tr>
 967 |     <tr>
 968 |       <td>`Tai_Tham`</td>
 969 |       <td rowspan="2">`Tai_Tham`</td>
 970 |     </tr>
 971 |     <tr>
 972 |       <td>`Lana`</td>
 973 |     </tr>
 974 |     <tr>
 975 |       <td>`Tai_Viet`</td>
 976 |       <td rowspan="2">`Tai_Viet`</td>
 977 |     </tr>
 978 |     <tr>
 979 |       <td>`Tavt`</td>
 980 |     </tr>
 981 |     <tr>
 982 |       <td>`Takri`</td>
 983 |       <td rowspan="2">`Takri`</td>
 984 |     </tr>
 985 |     <tr>
 986 |       <td>`Takr`</td>
 987 |     </tr>
 988 |     <tr>
 989 |       <td>`Tamil`</td>
 990 |       <td rowspan="2">`Tamil`</td>
 991 |     </tr>
 992 |     <tr>
 993 |       <td>`Taml`</td>
 994 |     </tr>
 995 |     <tr>
 996 |       <td>`Tangut`</td>
 997 |       <td rowspan="2">`Tangut`</td>
 998 |     </tr>
 999 |     <tr>
1000 |       <td>`Tang`</td>
1001 |     </tr>
1002 |     <tr>
1003 |       <td>`Telugu`</td>
1004 |       <td rowspan="2">`Telugu`</td>
1005 |     </tr>
1006 |     <tr>
1007 |       <td>`Telu`</td>
1008 |     </tr>
1009 |     <tr>
1010 |       <td>`Thaana`</td>
1011 |       <td rowspan="2">`Thaana`</td>
1012 |     </tr>
1013 |     <tr>
1014 |       <td>`Thaa`</td>
1015 |     </tr>
1016 |     <tr>
1017 |       <td>`Thai`</td>
1018 |       <td>`Thai`</td>
1019 |     </tr>
1020 |     <tr>
1021 |       <td>`Tibetan`</td>
1022 |       <td rowspan="2">`Tibetan`</td>
1023 |     </tr>
1024 |     <tr>
1025 |       <td>`Tibt`</td>
1026 |     </tr>
1027 |     <tr>
1028 |       <td>`Tifinagh`</td>
1029 |       <td rowspan="2">`Tifinagh`</td>
1030 |     </tr>
1031 |     <tr>
1032 |       <td>`Tfng`</td>
1033 |     </tr>
1034 |     <tr>
1035 |       <td>`Tirhuta`</td>
1036 |       <td rowspan="2">`Tirhuta`</td>
1037 |     </tr>
1038 |     <tr>
1039 |       <td>`Tirh`</td>
1040 |     </tr>
1041 |     <tr>
1042 |       <td>`Ugaritic`</td>
1043 |       <td rowspan="2">`Ugaritic`</td>
1044 |     </tr>
1045 |     <tr>
1046 |       <td>`Ugar`</td>
1047 |     </tr>
1048 |     <tr>
1049 |       <td>`Vai`</td>
1050 |       <td rowspan="2">`Vai`</td>
1051 |     </tr>
1052 |     <tr>
1053 |       <td>`Vaii`</td>
1054 |     </tr>
1055 |     <tr>
1056 |       <td>`Wancho`</td>
1057 |       <td rowspan="2">`Wancho`</td>
1058 |     </tr>
1059 |     <tr>
1060 |       <td>`Wcho`</td>
1061 |     </tr>
1062 |     <tr>
1063 |       <td>`Warang_Citi`</td>
1064 |       <td rowspan="2">`Warang_Citi`</td>
1065 |     </tr>
1066 |     <tr>
1067 |       <td>`Wara`</td>
1068 |     </tr>
1069 |     <tr>
1070 |       <td>`Yezidi`</td>
1071 |       <td rowspan="2">`Yezidi`</td>
1072 |     </tr>
1073 |     <tr>
1074 |       <td>`Yezi`</td>
1075 |     </tr>
1076 |     <tr>
1077 |       <td>`Yi`</td>
1078 |       <td rowspan="2">`Yi`</td>
1079 |     </tr>
1080 |     <tr>
1081 |       <td>`Yiii`</td>
1082 |     </tr>
1083 |     <tr>
1084 |       <td>`Zanabazar_Square`</td>
1085 |       <td rowspan="2">`Zanabazar_Square`</td>
1086 |     </tr>
1087 |     <tr>
1088 |       <td>`Zanb`</td>
1089 |     </tr>
1090 |   </table>
1091 | </emu-table>
1092 | 


--------------------------------------------------------------------------------
/spec.emu:
--------------------------------------------------------------------------------
   1 | <!doctype html>
   2 | <meta charset="utf-8">
   3 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/highlight.js/8.4/styles/github.min.css">
   4 | <link rel="spec" href="es2015" />
   5 | <pre class="metadata">
   6 | title: Regular Expression Pattern Modifiers for ECMAScript
   7 | stage: 3
   8 | contributors: Ron Buckton, Ecma International
   9 | </pre>
  10 | 
  11 | <emu-biblio href="node_modules/@tc39/ecma262-biblio/biblio.json"></emu-biblio>
  12 | 
  13 | <emu-intro id="sec-intro">
  14 |   <h1>Introduction</h1>
  15 |   <p>See <a href="https://github.com/tc39/proposal-regexp-modifiers#readme">the proposal repository</a> for background material and discussion.</p>
  16 | </emu-intro>
  17 | 
  18 | <emu-clause id="sec-text-processing">
  19 |   <h1>Text Processing</h1>
  20 | 
  21 |   <emu-clause id="sec-regexp-regular-expression-objects">
  22 |     <h1>RegExp (Regular Expression) Objects</h1>
  23 |     <p>A RegExp object contains a regular expression and the associated flags.</p>
  24 |     <emu-note>
  25 |       <p>The form and functionality of regular expressions are modelled after the regular expression facility in the Perl 5 programming language.</p>
  26 |     </emu-note>
  27 | 
  28 |     <emu-clause id="sec-patterns">
  29 |       <h1>Patterns</h1>
  30 |       <p>The RegExp constructor applies the following grammar to the input pattern String. An error occurs if the grammar cannot interpret the String as an expansion of |Pattern|.</p>
  31 |       <h2>Syntax</h2>
  32 |       <emu-grammar type="definition">
  33 |         Pattern[UnicodeMode, N] ::
  34 |           Disjunction[?UnicodeMode, ?N]
  35 | 
  36 |         Disjunction[UnicodeMode, N] ::
  37 |           Alternative[?UnicodeMode, ?N]
  38 |           Alternative[?UnicodeMode, ?N] `|` Disjunction[?UnicodeMode, ?N]
  39 | 
  40 |         Alternative[UnicodeMode, N] ::
  41 |           [empty]
  42 |           Alternative[?UnicodeMode, ?N] Term[?UnicodeMode, ?N]
  43 | 
  44 |         Term[UnicodeMode, N] ::
  45 |           Assertion[?UnicodeMode, ?N]
  46 |           Atom[?UnicodeMode, ?N]
  47 |           Atom[?UnicodeMode, ?N] Quantifier
  48 | 
  49 |         Assertion[UnicodeMode, N] ::
  50 |           `^`
  51 |           `$`
  52 |           `\` `b`
  53 |           `\` `B`
  54 |           `(` `?` `=` Disjunction[?UnicodeMode, ?N] `)`
  55 |           `(` `?` `!` Disjunction[?UnicodeMode, ?N] `)`
  56 |           `(` `?` `&lt;=` Disjunction[?UnicodeMode, ?N] `)`
  57 |           `(` `?` `&lt;!` Disjunction[?UnicodeMode, ?N] `)`
  58 | 
  59 |         Quantifier ::
  60 |           QuantifierPrefix
  61 |           QuantifierPrefix `?`
  62 | 
  63 |         QuantifierPrefix ::
  64 |           `*`
  65 |           `+`
  66 |           `?`
  67 |           `{` DecimalDigits[~Sep] `}`
  68 |           `{` DecimalDigits[~Sep] `,` `}`
  69 |           `{` DecimalDigits[~Sep] `,` DecimalDigits[~Sep] `}`
  70 | 
  71 |         Atom[UnicodeMode, N] ::
  72 |           PatternCharacter
  73 |           `.`
  74 |           `\` AtomEscape[?UnicodeMode, ?N]
  75 |           CharacterClass[?UnicodeMode]
  76 |           `(` GroupSpecifier[?UnicodeMode] Disjunction[?UnicodeMode, ?N] `)`
  77 |           <del>`(` `?` `:` Disjunction[?UnicodeMode, ?N] `)`</del>
  78 |           <ins>`(` `?` RegularExpressionFlags `:` Disjunction[?UnicodeMode, ?N] `)`</ins>
  79 |           <ins>`(` `?` RegularExpressionFlags `-` RegularExpressionFlags `:` Disjunction[?UnicodeMode, ?N] `)`</ins>
  80 | 
  81 |         SyntaxCharacter :: one of
  82 |           `^` `$` `\` `.` `*` `+` `?` `(` `)` `[` `]` `{` `}` `|`
  83 | 
  84 |         PatternCharacter ::
  85 |           SourceCharacter but not SyntaxCharacter
  86 | 
  87 |         AtomEscape[UnicodeMode, N] ::
  88 |           DecimalEscape
  89 |           CharacterClassEscape[?UnicodeMode]
  90 |           CharacterEscape[?UnicodeMode]
  91 |           [+N] `k` GroupName[?UnicodeMode]
  92 | 
  93 |         CharacterEscape[UnicodeMode] ::
  94 |           ControlEscape
  95 |           `c` ControlLetter
  96 |           `0` [lookahead &notin; DecimalDigit]
  97 |           HexEscapeSequence
  98 |           RegExpUnicodeEscapeSequence[?UnicodeMode]
  99 |           IdentityEscape[?UnicodeMode]
 100 | 
 101 |         ControlEscape :: one of
 102 |           `f` `n` `r` `t` `v`
 103 | 
 104 |         ControlLetter :: one of
 105 |           `a` `b` `c` `d` `e` `f` `g` `h` `i` `j` `k` `l` `m` `n` `o` `p` `q` `r` `s` `t` `u` `v` `w` `x` `y` `z`
 106 |           `A` `B` `C` `D` `E` `F` `G` `H` `I` `J` `K` `L` `M` `N` `O` `P` `Q` `R` `S` `T` `U` `V` `W` `X` `Y` `Z`
 107 | 
 108 |         GroupSpecifier[UnicodeMode] ::
 109 |           [empty]
 110 |           `?` GroupName[?UnicodeMode]
 111 | 
 112 |         GroupName[UnicodeMode] ::
 113 |           `&lt;` RegExpIdentifierName[?UnicodeMode] `&gt;`
 114 | 
 115 |         RegExpIdentifierName[UnicodeMode] ::
 116 |           RegExpIdentifierStart[?UnicodeMode]
 117 |           RegExpIdentifierName[?UnicodeMode] RegExpIdentifierPart[?UnicodeMode]
 118 | 
 119 |         RegExpIdentifierStart[UnicodeMode] ::
 120 |           IdentifierStartChar
 121 |           `\` RegExpUnicodeEscapeSequence[+UnicodeMode]
 122 |           [~UnicodeMode] UnicodeLeadSurrogate UnicodeTrailSurrogate
 123 | 
 124 |         RegExpIdentifierPart[UnicodeMode] ::
 125 |           IdentifierPartChar
 126 |           `\` RegExpUnicodeEscapeSequence[+UnicodeMode]
 127 |           [~UnicodeMode] UnicodeLeadSurrogate UnicodeTrailSurrogate
 128 | 
 129 |         RegExpUnicodeEscapeSequence[UnicodeMode] ::
 130 |           [+UnicodeMode] `u` HexLeadSurrogate `\u` HexTrailSurrogate
 131 |           [+UnicodeMode] `u` HexLeadSurrogate
 132 |           [+UnicodeMode] `u` HexTrailSurrogate
 133 |           [+UnicodeMode] `u` HexNonSurrogate
 134 |           [~UnicodeMode] `u` Hex4Digits
 135 |           [+UnicodeMode] `u{` CodePoint `}`
 136 | 
 137 |         UnicodeLeadSurrogate ::
 138 |           &gt; any Unicode code point in the inclusive range 0xD800 to 0xDBFF
 139 | 
 140 |         UnicodeTrailSurrogate ::
 141 |           &gt; any Unicode code point in the inclusive range 0xDC00 to 0xDFFF
 142 |       </emu-grammar>
 143 |       <p>Each `\\u` |HexTrailSurrogate| for which the choice of associated `u` |HexLeadSurrogate| is ambiguous shall be associated with the nearest possible `u` |HexLeadSurrogate| that would otherwise have no corresponding `\\u` |HexTrailSurrogate|.</p>
 144 |       <emu-grammar type="definition">
 145 |         HexLeadSurrogate ::
 146 |           Hex4Digits [> but only if the MV of |Hex4Digits| is in the inclusive range 0xD800 to 0xDBFF]
 147 | 
 148 |         HexTrailSurrogate ::
 149 |           Hex4Digits [> but only if the MV of |Hex4Digits| is in the inclusive range 0xDC00 to 0xDFFF]
 150 | 
 151 |         HexNonSurrogate ::
 152 |           Hex4Digits [> but only if the MV of |Hex4Digits| is not in the inclusive range 0xD800 to 0xDFFF]
 153 | 
 154 |         IdentityEscape[UnicodeMode] ::
 155 |           [+UnicodeMode] SyntaxCharacter
 156 |           [+UnicodeMode] `/`
 157 |           [~UnicodeMode] SourceCharacter but not UnicodeIDContinue
 158 | 
 159 |         DecimalEscape ::
 160 |           NonZeroDigit DecimalDigits[~Sep]? [lookahead &notin; DecimalDigit]
 161 | 
 162 |         CharacterClassEscape[UnicodeMode] ::
 163 |           `d`
 164 |           `D`
 165 |           `s`
 166 |           `S`
 167 |           `w`
 168 |           `W`
 169 |           [+UnicodeMode] `p{` UnicodePropertyValueExpression `}`
 170 |           [+UnicodeMode] `P{` UnicodePropertyValueExpression `}`
 171 | 
 172 |         UnicodePropertyValueExpression ::
 173 |           UnicodePropertyName `=` UnicodePropertyValue
 174 |           LoneUnicodePropertyNameOrValue
 175 | 
 176 |         UnicodePropertyName ::
 177 |           UnicodePropertyNameCharacters
 178 | 
 179 |         UnicodePropertyNameCharacters ::
 180 |           UnicodePropertyNameCharacter UnicodePropertyNameCharacters?
 181 | 
 182 |         UnicodePropertyValue ::
 183 |           UnicodePropertyValueCharacters
 184 | 
 185 |         LoneUnicodePropertyNameOrValue ::
 186 |           UnicodePropertyValueCharacters
 187 | 
 188 |         UnicodePropertyValueCharacters ::
 189 |           UnicodePropertyValueCharacter UnicodePropertyValueCharacters?
 190 | 
 191 |         UnicodePropertyValueCharacter ::
 192 |           UnicodePropertyNameCharacter
 193 |           DecimalDigit
 194 | 
 195 |         UnicodePropertyNameCharacter ::
 196 |           ControlLetter
 197 |           `_`
 198 | 
 199 |         CharacterClass[UnicodeMode] ::
 200 |           `[` [lookahead != `^`] ClassRanges[?UnicodeMode] `]`
 201 |           `[` `^` ClassRanges[?UnicodeMode] `]`
 202 | 
 203 |         ClassRanges[UnicodeMode] ::
 204 |           [empty]
 205 |           NonemptyClassRanges[?UnicodeMode]
 206 | 
 207 |         NonemptyClassRanges[UnicodeMode] ::
 208 |           ClassAtom[?UnicodeMode]
 209 |           ClassAtom[?UnicodeMode] NonemptyClassRangesNoDash[?UnicodeMode]
 210 |           ClassAtom[?UnicodeMode] `-` ClassAtom[?UnicodeMode] ClassRanges[?UnicodeMode]
 211 | 
 212 |         NonemptyClassRangesNoDash[UnicodeMode] ::
 213 |           ClassAtom[?UnicodeMode]
 214 |           ClassAtomNoDash[?UnicodeMode] NonemptyClassRangesNoDash[?UnicodeMode]
 215 |           ClassAtomNoDash[?UnicodeMode] `-` ClassAtom[?UnicodeMode] ClassRanges[?UnicodeMode]
 216 | 
 217 |         ClassAtom[UnicodeMode] ::
 218 |           `-`
 219 |           ClassAtomNoDash[?UnicodeMode]
 220 | 
 221 |         ClassAtomNoDash[UnicodeMode] ::
 222 |           SourceCharacter but not one of `\` or `]` or `-`
 223 |           `\` ClassEscape[?UnicodeMode]
 224 | 
 225 |         ClassEscape[UnicodeMode] ::
 226 |           `b`
 227 |           [+UnicodeMode] `-`
 228 |           CharacterClassEscape[?UnicodeMode]
 229 |           CharacterEscape[?UnicodeMode]
 230 |       </emu-grammar>
 231 | 
 232 |       <emu-note>
 233 |         <p>A number of productions in this section are given alternative definitions in section <emu-xref href="#sec-regular-expressions-patterns"></emu-xref>.</p>
 234 |       </emu-note>
 235 |     </emu-clause>
 236 | 
 237 |     <emu-clause id="sec-pattern-semantics">
 238 |       <h1>Pattern Semantics</h1>
 239 |       <emu-clause id="sec-notation">
 240 |         <h1>Notation</h1>
 241 |         <p>The descriptions below use the following aliases:</p>
 242 |         <ul>
 243 |           <li>
 244 |             _Input_ is a List whose elements are the characters of the String being matched by the regular expression pattern. Each character is either a code unit or a code point, depending upon the kind of pattern involved. The notation _Input_[_n_] means the _n_<sup>th</sup> character of _Input_, where _n_ can range between 0 (inclusive) and _InputLength_ (exclusive).
 245 |           </li>
 246 |           <li>
 247 |             _InputLength_ is the number of characters in _Input_.
 248 |           </li>
 249 |           <li>
 250 |             _NcapturingParens_ is the total number of left-capturing parentheses (i.e. the total number of <emu-grammar>Atom :: `(` GroupSpecifier Disjunction `)`</emu-grammar> Parse Nodes) in the pattern. A left-capturing parenthesis is any `(` pattern character that is matched by the `(` terminal of the <emu-grammar>Atom :: `(` GroupSpecifier Disjunction `)`</emu-grammar> production.
 251 |           </li>
 252 |           <li>
 253 |             _DotAll_ is *true* if the RegExp object's [[OriginalFlags]] internal slot contains *"s"* and otherwise is *false*.
 254 |           </li>
 255 |           <li>
 256 |             _IgnoreCase_ is *true* if the RegExp object's [[OriginalFlags]] internal slot contains *"i"* and otherwise is *false*.
 257 |           </li>
 258 |           <li>
 259 |             _Multiline_ is *true* if the RegExp object's [[OriginalFlags]] internal slot contains *"m"* and otherwise is *false*.
 260 |           </li>
 261 |           <li>
 262 |             _Unicode_ is *true* if the RegExp object's [[OriginalFlags]] internal slot contains *"u"* and otherwise is *false*.
 263 |           </li>
 264 |           <li oldids="sec-runtime-semantics-wordcharacters-abstract-operation">
 265 |             <del>_WordCharacters_ is the mathematical set that is the union of all sixty-three characters in *"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789_"* (letters, numbers, and U+005F (LOW LINE) in the Unicode Basic Latin block) and all characters _c_ for which _c_ is not in that set but Canonicalize(_c_) is. _WordCharacters_ cannot contain more than sixty-three characters unless _Unicode_ and _IgnoreCase_ are both *true*.</del>
 266 |           </li>
 267 |         </ul>
 268 |         <p>Furthermore, the descriptions below use the following internal data structures:</p>
 269 |         <ul>
 270 |           <li>
 271 |             A <em>CharSet</em> is a mathematical set of characters. When the _Unicode_ flag is *true*, &ldquo;all characters&rdquo; means the CharSet containing all code point values; otherwise &ldquo;all characters&rdquo; means the CharSet containing all code unit values.
 272 |           </li>
 273 |           <li>
 274 |             A <em>State</em> is an ordered pair (_endIndex_, _captures_) where _endIndex_ is an integer and _captures_ is a List of _NcapturingParens_ values. States are used to represent partial match states in the regular expression matching algorithms. The _endIndex_ is one plus the index of the last input character matched so far by the pattern, while _captures_ holds the results of capturing parentheses. The _n_<sup>th</sup> element of _captures_ is either a List of characters that represents the value obtained by the _n_<sup>th</sup> set of capturing parentheses or *undefined* if the _n_<sup>th</sup> set of capturing parentheses hasn't been reached yet. Due to backtracking, many States may be in use at any time during the matching process.
 275 |           </li>
 276 |           <li>
 277 |             A <em>MatchResult</em> is either a State or the special token ~failure~ that indicates that the match failed.
 278 |           </li>
 279 |           <li>
 280 |             A <em>Continuation</em> is an Abstract Closure that takes one State argument and returns a MatchResult result. The Continuation attempts to match the remaining portion (specified by the closure's captured values) of the pattern against _Input_, starting at the intermediate state given by its State argument. If the match succeeds, the Continuation returns the final State that it reached; if the match fails, the Continuation returns ~failure~.
 281 |           </li>
 282 |           <li>
 283 |             A <em>Matcher</em> is an Abstract Closure that takes two arguments&mdash;a State and a Continuation&mdash;and returns a MatchResult result. A Matcher attempts to match a middle subpattern (specified by the closure's captured values) of the pattern against _Input_, starting at the intermediate state given by its State argument. The Continuation argument should be a closure that matches the rest of the pattern. After matching the subpattern of a pattern to obtain a new State, the Matcher then calls Continuation on that new State to test if the rest of the pattern can match as well. If it can, the Matcher returns the State returned by Continuation; if not, the Matcher may try different choices at its choice points, repeatedly calling Continuation until it either succeeds or all possibilities have been exhausted.
 284 |           </li>
 285 |         </ul>
 286 |       </emu-clause>
 287 | 
 288 |       <ins class="block">
 289 |       <emu-clause id="sec-patterns-static-semantics-early-errors">
 290 |         <h1>Static Semantics: Early Errors</h1>
 291 |         <emu-grammar>Atom :: `(` `?` RegularExpressionFlags `:` Disjunction `)`</emu-grammar>
 292 |         <ul>
 293 |           <li>It is a Syntax Error if the source text matched by |RegularExpressionFlags| contains any code point other than `i`, `m`, or `s`, or if it contains the same code point more than once.</li>
 294 |         </ul>
 295 |         <emu-grammar>Atom :: `(` `?` RegularExpressionFlags `-` RegularExpressionFlags `:` Disjunction `)`</emu-grammar>
 296 |         <ul>
 297 |           <li>It is a Syntax Error if the source text matched by the first |RegularExpressionFlags| and the source text matched by the second |RegularExpressionFlags| are both empty.</li>
 298 |           <li>It is a Syntax Error if the source text matched by the first |RegularExpressionFlags| contains any code point other than `i`, `m`, or `s`, or contains the same code point more than once.</li>
 299 |           <li>It is a Syntax Error if the source text matched by the second |RegularExpressionFlags| contains any code point other than `i`, `m`, or `s`, or contains the same code point more than once.</li>
 300 |           <li>It is a Syntax Error if any code point in the source text matched by the first |RegularExpressionFlags| is also contained in the source text matched by the second |RegularExpressionFlags|.</li>
 301 |         </ul>
 302 |       </emu-clause>
 303 | 
 304 |       <emu-clause id="sec-modifiers-records">
 305 |         <h1>Modifiers Records</h1>
 306 |         <p>A <dfn variants="Modifiers Records">Modifiers Record</dfn> is a Record value used to encapsulate information about the regular expression flags that apply to a subpattern.</p>
 307 |         <p>Modifiers Records have the fields listed in <emu-xref href="#table-modifiers-record"></emu-xref>.</p>
 308 |         <emu-table id="table-modifiers-record" caption="Modifiers Record Fields">
 309 |           <table>
 310 |             <tr>
 311 |               <th>Field Name</th>
 312 |               <th>Value</th>
 313 |               <th>Meaning</th>
 314 |             </tr>
 315 |             <tr>
 316 |               <td>[[DotAll]]</td>
 317 |               <td>a Boolean</td>
 318 |               <td>Indicates whether the *"s"* flag is currently enabled.</td>
 319 |             </tr>
 320 |             <tr>
 321 |               <td>[[IgnoreCase]]</td>
 322 |               <td>a Boolean</td>
 323 |               <td>Indicates whether the *"i"* flag is currently enabled.</td>
 324 |             </tr>
 325 |             <tr>
 326 |               <td>[[Multiline]]</td>
 327 |               <td>a Boolean</td>
 328 |               <td>Indicates whether the *"m"* flag is currently enabled.</td>
 329 |             </tr>
 330 |           </table>
 331 |         </emu-table>
 332 |       </emu-clause>
 333 |       </ins>
 334 | 
 335 |       <emu-clause id="sec-compilepattern" type="sdo" oldids="sec-pattern">
 336 |         <h1>Runtime Semantics: CompilePattern</h1>
 337 |         <dl class="header">
 338 |           <dt>description</dt>
 339 |           <dd>It returns an Abstract Closure that takes a String and a non-negative integer and returns a MatchResult.</dd>
 340 |         </dl>
 341 |         <emu-grammar>Pattern :: Disjunction</emu-grammar>
 342 |         <emu-alg>
 343 |           1. <ins>Let _modifiers_ be the Modifiers Record { [[DotAll]]: _DotAll_, [[IgnoreCase]]: _IgnoreCase_, [[Multiline]]: _Multiline_ }.</ins>
 344 |           1. Let _m_ be CompileSubpattern of |Disjunction| with argument<ins>s</ins> ~forward~<ins> and _modifiers_</ins>.
 345 |           1. Return a new Abstract Closure with parameters (_str_, _index_) that captures _m_ and performs the following steps when called:
 346 |             1. Assert: Type(_str_) is String.
 347 |             1. Assert: _index_ is a non-negative integer which is &le; the length of _str_.
 348 |             1. If _Unicode_ is *true*, let _Input_ be StringToCodePoints(_str_). Otherwise, let _Input_ be a List whose elements are the code units that are the elements of _str_. _Input_ will be used throughout the algorithms in <emu-xref href="#sec-pattern-semantics"></emu-xref>. Each element of _Input_ is considered to be a character.
 349 |             1. Let _InputLength_ be the number of characters contained in _Input_. This alias will be used throughout the algorithms in <emu-xref href="#sec-pattern-semantics"></emu-xref>.
 350 |             1. Let _listIndex_ be the index into _Input_ of the character that was obtained from element _index_ of _str_.
 351 |             1. Let _c_ be a new Continuation with parameters (_y_) that captures nothing and performs the following steps when called:
 352 |               1. Assert: _y_ is a State.
 353 |               1. Return _y_.
 354 |             1. Let _cap_ be a List of _NcapturingParens_ *undefined* values, indexed 1 through _NcapturingParens_.
 355 |             1. Let _x_ be the State (_listIndex_, _cap_).
 356 |             1. Return _m_(_x_, _c_).
 357 |         </emu-alg>
 358 |         <emu-note>
 359 |           <p>A Pattern compiles to an Abstract Closure value. RegExpBuiltinExec can then apply this procedure to a String and an offset within the String to determine whether the pattern would match starting at exactly that offset within the String, and, if it does match, what the values of the capturing parentheses would be. The algorithms in <emu-xref href="#sec-pattern-semantics"></emu-xref> are designed so that compiling a pattern may throw a *SyntaxError* exception; on the other hand, once the pattern is successfully compiled, applying the resulting Abstract Closure to find a match in a String cannot throw an exception (except for any implementation-defined exceptions that can occur anywhere such as out-of-memory).</p>
 360 |         </emu-note>
 361 |       </emu-clause>
 362 | 
 363 |       <emu-clause id="sec-compilesubpattern" type="sdo" oldids="sec-disjunction,sec-alternative,sec-term">
 364 |         <h1>
 365 |           Runtime Semantics: CompileSubpattern (
 366 |             _direction_: ~forward~ or ~backward~,
 367 |             <ins>_modifiers_: a Modifiers Record,</ins>
 368 |           ): a Matcher
 369 |         </h1>
 370 |         <dl class="header">
 371 |         </dl>
 372 |         <emu-note>
 373 |           <p>This section is amended in B.1.2.4.</p>
 374 |         </emu-note>
 375 | 
 376 |         <!-- Disjunction -->
 377 |         <emu-grammar>Disjunction :: Alternative `|` Disjunction</emu-grammar>
 378 |         <emu-alg>
 379 |           1. Let _m1_ be CompileSubpattern of |Alternative| with argument<ins>s</ins> _direction_<ins> and _modifiers_</ins>.
 380 |           1. Let _m2_ be CompileSubpattern of |Disjunction| with argument<ins>s</ins> _direction_<ins> and _modifiers_</ins>.
 381 |           1. Return a new Matcher with parameters (_x_, _c_) that captures _m1_ and _m2_ and performs the following steps when called:
 382 |             1. Assert: _x_ is a State.
 383 |             1. Assert: _c_ is a Continuation.
 384 |             1. Let _r_ be _m1_(_x_, _c_).
 385 |             1. If _r_ is not ~failure~, return _r_.
 386 |             1. Return _m2_(_x_, _c_).
 387 |         </emu-alg>
 388 |         <emu-note>
 389 |           <p>The `|` regular expression operator separates two alternatives. The pattern first tries to match the left |Alternative| (followed by the sequel of the regular expression); if it fails, it tries to match the right |Disjunction| (followed by the sequel of the regular expression). If the left |Alternative|, the right |Disjunction|, and the sequel all have choice points, all choices in the sequel are tried before moving on to the next choice in the left |Alternative|. If choices in the left |Alternative| are exhausted, the right |Disjunction| is tried instead of the left |Alternative|. Any capturing parentheses inside a portion of the pattern skipped by `|` produce *undefined* values instead of Strings. Thus, for example,</p>
 390 |           <pre><code class="javascript">/a|ab/.exec("abc")</code></pre>
 391 |           <p>returns the result *"a"* and not *"ab"*. Moreover,</p>
 392 |           <pre><code class="javascript">/((a)|(ab))((c)|(bc))/.exec("abc")</code></pre>
 393 |           <p>returns the array</p>
 394 |           <pre><code class="javascript">["abc", "a", "a", undefined, "bc", undefined, "bc"]</code></pre>
 395 |           <p>and not</p>
 396 |           <pre><code class="javascript">["abc", "ab", undefined, "ab", "c", "c", undefined]</code></pre>
 397 |           <p>The order in which the two alternatives are tried is independent of the value of _direction_.</p>
 398 |         </emu-note>
 399 | 
 400 |         <!-- Alternative -->
 401 |         <emu-grammar>Alternative :: [empty]</emu-grammar>
 402 |         <emu-alg>
 403 |           1. Return a new Matcher with parameters (_x_, _c_) that captures nothing and performs the following steps when called:
 404 |             1. Assert: _x_ is a State.
 405 |             1. Assert: _c_ is a Continuation.
 406 |             1. Return _c_(_x_).
 407 |         </emu-alg>
 408 |         <emu-grammar>Alternative :: Alternative Term</emu-grammar>
 409 |         <emu-alg>
 410 |           1. Let _m1_ be CompileSubpattern of |Alternative| with argument<ins>s</ins> _direction_<ins> and _modifiers_</ins>.
 411 |           1. Let _m2_ be CompileSubpattern of |Term| with argument<ins>s</ins> _direction_<ins> and _modifiers_</ins>.
 412 |           1. If _direction_ is ~forward~, then
 413 |             1. Let _m_ be a new Matcher with parameters (_x_, _c_) that captures _m1_ and _m2_ and performs the following steps when called:
 414 |               1. Assert: _x_ is a State.
 415 |               1. Assert: _c_ is a Continuation.
 416 |               1. Let _d_ be a new Continuation with parameters (_y_) that captures _c_ and _m2_ and performs the following steps when called:
 417 |                 1. Assert: _y_ is a State.
 418 |                 1. Return _m2_(_y_, _c_).
 419 |               1. Return _m1_(_x_, _d_).
 420 |           1. Else,
 421 |             1. Assert: _direction_ is ~backward~.
 422 |             1. Let _m_ be a new Matcher with parameters (_x_, _c_) that captures _m1_ and _m2_ and performs the following steps when called:
 423 |               1. Assert: _x_ is a State.
 424 |               1. Assert: _c_ is a Continuation.
 425 |               1. Let _d_ be a new Continuation with parameters (_y_) that captures _c_ and _m1_ and performs the following steps when called:
 426 |                 1. Assert: _y_ is a State.
 427 |                 1. Return _m1_(_y_, _c_).
 428 |               1. Return _m2_(_x_, _d_).
 429 |         </emu-alg>
 430 |         <emu-note>
 431 |           <p>Consecutive |Term|s try to simultaneously match consecutive portions of _Input_. When _direction_ is ~forward~, if the left |Alternative|, the right |Term|, and the sequel of the regular expression all have choice points, all choices in the sequel are tried before moving on to the next choice in the right |Term|, and all choices in the right |Term| are tried before moving on to the next choice in the left |Alternative|. When _direction_ is ~backward~, the evaluation order of |Alternative| and |Term| is reversed.</p>
 432 |         </emu-note>
 433 | 
 434 |         <!-- Term -->
 435 |         <emu-grammar>Term :: Assertion</emu-grammar>
 436 |         <emu-alg>
 437 |           1. Return CompileAssertion of |Assertion|<ins> with argument _modifiers_</ins>.
 438 |         </emu-alg>
 439 |         <emu-note>
 440 |           <p>The resulting Matcher is independent of _direction_.</p>
 441 |         </emu-note>
 442 |         <emu-grammar>Term :: Atom</emu-grammar>
 443 |         <emu-alg>
 444 |           1. Return CompileAtom of |Atom| with argument<ins>s</ins> _direction_<ins> and _modifiers_</ins>.
 445 |         </emu-alg>
 446 |         <emu-grammar>Term :: Atom Quantifier</emu-grammar>
 447 |         <emu-alg>
 448 |           1. Let _m_ be CompileAtom of |Atom| with argument<ins>s</ins> _direction_<ins> and _modifiers_</ins>.
 449 |           1. Let _q_ be CompileQuantifier of |Quantifier|.
 450 |           1. Assert: _q_.[[Min]] &le; _q_.[[Max]].
 451 |           1. Let _parenIndex_ be the number of left-capturing parentheses in the entire regular expression that occur to the left of this |Term|. This is the total number of <emu-grammar>Atom :: `(` GroupSpecifier Disjunction `)`</emu-grammar> Parse Nodes prior to or enclosing this |Term|.
 452 |           1. Let _parenCount_ be the number of left-capturing parentheses in |Atom|. This is the total number of <emu-grammar>Atom :: `(` GroupSpecifier Disjunction `)`</emu-grammar> Parse Nodes enclosed by |Atom|.
 453 |           1. Return a new Matcher with parameters (_x_, _c_) that captures _m_, _q_, _parenIndex_, and _parenCount_ and performs the following steps when called:
 454 |             1. Assert: _x_ is a State.
 455 |             1. Assert: _c_ is a Continuation.
 456 |             1. Return RepeatMatcher(_m_, _q_.[[Min]], _q_.[[Max]], _q_.[[Greedy]], _x_, _c_, _parenIndex_, _parenCount_).
 457 |         </emu-alg>
 458 |       </emu-clause>
 459 | 
 460 |       <emu-clause id="sec-compileassertion" type="sdo" oldids="sec-assertion">
 461 |         <h1>
 462 |           Runtime Semantics: CompileAssertion (
 463 |             <ins>_modifiers_: a Modifiers Record,</ins>
 464 |           ): a Matcher
 465 |         </h1>
 466 |         <dl class="header">
 467 |         </dl>
 468 |         <emu-note>
 469 |           <p>This section is amended in B.1.2.5.</p>
 470 |         </emu-note>
 471 |         <emu-grammar>Assertion :: `^`</emu-grammar>
 472 |         <emu-alg>
 473 |           1. Return a new Matcher with parameters (_x_, _c_) that captures <del>nothing</del><ins>_modifiers_</ins> and performs the following steps when called:
 474 |             1. Assert: _x_ is a State.
 475 |             1. Assert: _c_ is a Continuation.
 476 |             1. Let _e_ be _x_'s _endIndex_.
 477 |             1. If _e_ = 0, or if <del>_Multiline_</del><ins>_modifiers_.[[Multiline]]</ins> is *true* and the character _Input_[_e_ - 1] is one of |LineTerminator|, then
 478 |               1. Return _c_(_x_).
 479 |             1. Return ~failure~.
 480 |         </emu-alg>
 481 |         <emu-note>
 482 |           <p>Even when the `y` flag is used with a pattern, `^` always matches only at the beginning of _Input_, or (if <del>_Multiline_</del><ins>_modifiers_.[[Multiline]]</ins> is *true*) at the beginning of a line.</p>
 483 |         </emu-note>
 484 |         <emu-grammar>Assertion :: `$`</emu-grammar>
 485 |         <emu-alg>
 486 |           1. Return a new Matcher with parameters (_x_, _c_) that captures <del>nothing</del><ins>_modifiers_</ins> and performs the following steps when called:
 487 |             1. Assert: _x_ is a State.
 488 |             1. Assert: _c_ is a Continuation.
 489 |             1. Let _e_ be _x_'s _endIndex_.
 490 |             1. If _e_ = _InputLength_, or if <del>_Multiline_</del><ins>_modifiers_.[[Multiline]]</ins> is *true* and the character _Input_[_e_] is one of |LineTerminator|, then
 491 |               1. Return _c_(_x_).
 492 |             1. Return ~failure~.
 493 |         </emu-alg>
 494 |         <emu-grammar>Assertion :: `\` `b`</emu-grammar>
 495 |         <emu-alg>
 496 |           1. Return a new Matcher with parameters (_x_, _c_) that captures <del>nothing</del><ins>_modifiers_</ins> and performs the following steps when called:
 497 |             1. Assert: _x_ is a State.
 498 |             1. Assert: _c_ is a Continuation.
 499 |             1. Let _e_ be _x_'s _endIndex_.
 500 |             1. Let _a_ be IsWordChar(_e_ - 1<ins>, _modifiers_</ins>).
 501 |             1. Let _b_ be IsWordChar(_e_<ins>, _modifiers_</ins>).
 502 |             1. If _a_ is *true* and _b_ is *false*, or if _a_ is *false* and _b_ is *true*, return _c_(_x_).
 503 |             1. Return ~failure~.
 504 |         </emu-alg>
 505 |         <emu-grammar>Assertion :: `\` `B`</emu-grammar>
 506 |         <emu-alg>
 507 |           1. Return a new Matcher with parameters (_x_, _c_) that captures <del>nothing</del><ins>_modifiers_</ins> and performs the following steps when called:
 508 |             1. Assert: _x_ is a State.
 509 |             1. Assert: _c_ is a Continuation.
 510 |             1. Let _e_ be _x_'s _endIndex_.
 511 |             1. Let _a_ be IsWordChar(_e_ - 1<ins>, _modifiers_</ins>).
 512 |             1. Let _b_ be IsWordChar(_e_<ins>, _modifiers_</ins>).
 513 |             1. If _a_ is *true* and _b_ is *true*, or if _a_ is *false* and _b_ is *false*, return _c_(_x_).
 514 |             1. Return ~failure~.
 515 |         </emu-alg>
 516 |         <emu-grammar>Assertion :: `(` `?` `=` Disjunction `)`</emu-grammar>
 517 |         <emu-alg>
 518 |           1. Let _m_ be CompileSubpattern of |Disjunction| with argument<ins>s</ins> ~forward~<ins> and _modifiers_</ins>.
 519 |           1. Return a new Matcher with parameters (_x_, _c_) that captures _m_ and performs the following steps when called:
 520 |             1. Assert: _x_ is a State.
 521 |             1. Assert: _c_ is a Continuation.
 522 |             1. Let _d_ be a new Continuation with parameters (_y_) that captures nothing and performs the following steps when called:
 523 |               1. Assert: _y_ is a State.
 524 |               1. Return _y_.
 525 |             1. Let _r_ be _m_(_x_, _d_).
 526 |             1. If _r_ is ~failure~, return ~failure~.
 527 |             1. Let _y_ be _r_'s State.
 528 |             1. Let _cap_ be _y_'s _captures_ List.
 529 |             1. Let _xe_ be _x_'s _endIndex_.
 530 |             1. Let _z_ be the State (_xe_, _cap_).
 531 |             1. Return _c_(_z_).
 532 |         </emu-alg>
 533 |         <emu-grammar>Assertion :: `(` `?` `!` Disjunction `)`</emu-grammar>
 534 |         <emu-alg>
 535 |           1. Let _m_ be CompileSubpattern of |Disjunction| with argument<ins>s</ins> ~forward~<ins> and _modifiers_</ins>.
 536 |           1. Return a new Matcher with parameters (_x_, _c_) that captures _m_ and performs the following steps when called:
 537 |             1. Assert: _x_ is a State.
 538 |             1. Assert: _c_ is a Continuation.
 539 |             1. Let _d_ be a new Continuation with parameters (_y_) that captures nothing and performs the following steps when called:
 540 |               1. Assert: _y_ is a State.
 541 |               1. Return _y_.
 542 |             1. Let _r_ be _m_(_x_, _d_).
 543 |             1. If _r_ is not ~failure~, return ~failure~.
 544 |             1. Return _c_(_x_).
 545 |         </emu-alg>
 546 |         <emu-grammar>Assertion :: `(` `?` `&lt;=` Disjunction `)`</emu-grammar>
 547 |         <emu-alg>
 548 |           1. Let _m_ be CompileSubpattern of |Disjunction| with argument<ins>s</ins> ~backward~<ins> and _modifiers_</ins>.
 549 |           1. Return a new Matcher with parameters (_x_, _c_) that captures _m_ and performs the following steps when called:
 550 |             1. Assert: _x_ is a State.
 551 |             1. Assert: _c_ is a Continuation.
 552 |             1. Let _d_ be a new Continuation with parameters (_y_) that captures nothing and performs the following steps when called:
 553 |               1. Assert: _y_ is a State.
 554 |               1. Return _y_.
 555 |             1. Let _r_ be _m_(_x_, _d_).
 556 |             1. If _r_ is ~failure~, return ~failure~.
 557 |             1. Let _y_ be _r_'s State.
 558 |             1. Let _cap_ be _y_'s _captures_ List.
 559 |             1. Let _xe_ be _x_'s _endIndex_.
 560 |             1. Let _z_ be the State (_xe_, _cap_).
 561 |             1. Return _c_(_z_).
 562 |         </emu-alg>
 563 |         <emu-grammar>Assertion :: `(` `?` `&lt;!` Disjunction `)`</emu-grammar>
 564 |         <emu-alg>
 565 |           1. Let _m_ be CompileSubpattern of |Disjunction| with argument<ins>s</ins> ~backward~<ins> and _modifiers_</ins>.
 566 |           1. Return a new Matcher with parameters (_x_, _c_) that captures _m_ and performs the following steps when called:
 567 |             1. Assert: _x_ is a State.
 568 |             1. Assert: _c_ is a Continuation.
 569 |             1. Let _d_ be a new Continuation with parameters (_y_) that captures nothing and performs the following steps when called:
 570 |               1. Assert: _y_ is a State.
 571 |               1. Return _y_.
 572 |             1. Let _r_ be _m_(_x_, _d_).
 573 |             1. If _r_ is not ~failure~, return ~failure~.
 574 |             1. Return _c_(_x_).
 575 |         </emu-alg>
 576 | 
 577 |         <emu-clause id="sec-runtime-semantics-iswordchar-abstract-operation" type="abstract operation">
 578 |           <h1>
 579 |             IsWordChar (
 580 |               _e_: an integer,
 581 |               <ins>_modifiers_: a Modifiers Record,</ins>
 582 |             )
 583 |           </h1>
 584 |           <dl class="header">
 585 |           </dl>
 586 |           <emu-alg>
 587 |             1. If _e_ = -1 or _e_ is _InputLength_, return *false*.
 588 |             1. Let _c_ be the character _Input_[_e_].
 589 |             1. <ins>Let _wordCharacters_ be GetWordCharacters(_modifiers_).</ins>
 590 |             1. If _c_ is in <del>_WordCharacters_</del><ins>_wordCharacters_</ins>, return *true*.
 591 |             1. Return *false*.
 592 |           </emu-alg>
 593 |         </emu-clause>
 594 |       </emu-clause>
 595 | 
 596 |       <emu-clause id="sec-compileatom" type="sdo" oldids="sec-atom,sec-atomescape,sec-characterescape,sec-decimalescape">
 597 |         <h1>
 598 |           Runtime Semantics: CompileAtom (
 599 |             _direction_: ~forward~ or ~backward~,
 600 |             <ins>_modifiers_: a Modifiers Record,</ins>
 601 |           ): a Matcher
 602 |         </h1>
 603 |         <dl class="header">
 604 |         </dl>
 605 |         <emu-note>
 606 |           <p>This section is amended in B.1.2.6.</p>
 607 |         </emu-note>
 608 | 
 609 |         <!-- Atom -->
 610 |         <emu-grammar>Atom :: PatternCharacter</emu-grammar>
 611 |         <emu-alg>
 612 |           1. Let _ch_ be the character matched by |PatternCharacter|.
 613 |           1. Let _A_ be a one-element CharSet containing the character _ch_.
 614 |           1. Return CharacterSetMatcher(_A_, *false*, _direction_<ins>, _modifiers_</ins>).
 615 |         </emu-alg>
 616 |         <emu-grammar>Atom :: `.`</emu-grammar>
 617 |         <emu-alg>
 618 |           1. Let _A_ be the CharSet of all characters.
 619 |           1. If <del>_DotAll_</del><ins>_modifiers_.[[DotAll]]</ins> is not *true*, then
 620 |             1. Remove from _A_ all characters corresponding to a code point on the right-hand side of the |LineTerminator| production.
 621 |           1. Return CharacterSetMatcher(_A_, *false*, _direction_<ins>, _modifiers_</ins>).
 622 |         </emu-alg>
 623 |         <emu-grammar>Atom :: CharacterClass</emu-grammar>
 624 |         <emu-alg>
 625 |           1. Let _cc_ be CompileCharacterClass of |CharacterClass|.
 626 |           1. Return CharacterSetMatcher(_cc_.[[CharSet]], _cc_.[[Invert]], _direction_<ins>, _modifiers_</ins>).
 627 |         </emu-alg>
 628 |         <emu-grammar>Atom :: `(` GroupSpecifier Disjunction `)`</emu-grammar>
 629 |         <emu-alg>
 630 |           1. Let _m_ be CompileSubpattern of |Disjunction| with argument<ins>s</ins> _direction_<ins> and _modifiers_</ins>.
 631 |           1. Let _parenIndex_ be the number of left-capturing parentheses in the entire regular expression that occur to the left of this |Atom|. This is the total number of <emu-grammar>Atom :: `(` GroupSpecifier Disjunction `)`</emu-grammar> Parse Nodes prior to or enclosing this |Atom|.
 632 |           1. Return a new Matcher with parameters (_x_, _c_) that captures _direction_, _m_, and _parenIndex_ and performs the following steps when called:
 633 |             1. Assert: _x_ is a State.
 634 |             1. Assert: _c_ is a Continuation.
 635 |             1. Let _d_ be a new Continuation with parameters (_y_) that captures _x_, _c_, _direction_, and _parenIndex_ and performs the following steps when called:
 636 |               1. Assert: _y_ is a State.
 637 |               1. Let _cap_ be a copy of _y_'s _captures_ List.
 638 |               1. Let _xe_ be _x_'s _endIndex_.
 639 |               1. Let _ye_ be _y_'s _endIndex_.
 640 |               1. If _direction_ is ~forward~, then
 641 |                 1. Assert: _xe_ &le; _ye_.
 642 |                 1. Let _s_ be a List whose elements are the characters of _Input_ at indices _xe_ (inclusive) through _ye_ (exclusive).
 643 |               1. Else,
 644 |                 1. Assert: _direction_ is ~backward~.
 645 |                 1. Assert: _ye_ &le; _xe_.
 646 |                 1. Let _s_ be a List whose elements are the characters of _Input_ at indices _ye_ (inclusive) through _xe_ (exclusive).
 647 |               1. Set _cap_[_parenIndex_ + 1] to _s_.
 648 |               1. Let _z_ be the State (_ye_, _cap_).
 649 |               1. Return _c_(_z_).
 650 |             1. Return _m_(_x_, _d_).
 651 |         </emu-alg>
 652 | 
 653 |         <del class="block">
 654 |         <emu-grammar>Atom :: `(` `?` `:` Disjunction `)`</emu-grammar>
 655 |         <emu-alg>
 656 |           1. Return CompileSubpattern of |Disjunction| with argument _direction_.
 657 |         </emu-alg>
 658 |         </del>
 659 | 
 660 |         <ins class="block">
 661 |         <emu-grammar>Atom :: `(` `?` RegularExpressionFlags `:` Disjunction `)`</emu-grammar>
 662 |         <emu-alg>
 663 |           1. Let _addModifiers_ be the source text matched by |RegularExpressionFlags|.
 664 |           1. Let _removeModifiers_ be the empty String.
 665 |           1. Let _newModifiers_ be UpdateModifiers(_modifiers_, CodePointsToString(_addModifiers_), _removeModifiers_).
 666 |           1. Return CompileSubpattern of |Disjunction| with arguments _direction_ and _newModifiers_.
 667 |         </emu-alg>
 668 |         <emu-grammar>Atom :: `(` `?` RegularExpressionFlags `-` RegularExpressionFlags `:` Disjunction `)`</emu-grammar>
 669 |         <emu-alg>
 670 |           1. Let _addModifiers_ be the source text matched by the first |RegularExpressionFlags|.
 671 |           1. Let _removeModifiers_ be the source text matched by the second |RegularExpressionFlags|.
 672 |           1. Let _newModifiers_ be UpdateModifiers(_modifiers_, CodePointsToString(_addModifiers_), CodePointsToString(_removeModifiers_)).
 673 |           1. Return CompileSubpattern of |Disjunction| with arguments _direction_ and _newModifiers_.
 674 |         </emu-alg>
 675 |         </ins>
 676 | 
 677 |         <!-- AtomEscape -->
 678 |         <emu-grammar>AtomEscape :: DecimalEscape</emu-grammar>
 679 |         <emu-alg>
 680 |           1. Let _n_ be the CapturingGroupNumber of |DecimalEscape|.
 681 |           1. Assert: _n_ &le; _NcapturingParens_.
 682 |           1. Return BackreferenceMatcher(_n_, _direction_<ins>, _modifiers_</ins>).
 683 |         </emu-alg>
 684 |         <emu-note>
 685 |           <p>An escape sequence of the form `\\` followed by a non-zero decimal number _n_ matches the result of the _n_<sup>th</sup> set of capturing parentheses (<emu-xref href="#sec-notation"></emu-xref>). It is an error if the regular expression has fewer than _n_ capturing parentheses. If the regular expression has _n_ or more capturing parentheses but the _n_<sup>th</sup> one is *undefined* because it has not captured anything, then the backreference always succeeds.</p>
 686 |         </emu-note>
 687 |         <emu-grammar>AtomEscape :: CharacterEscape</emu-grammar>
 688 |         <emu-alg>
 689 |           1. Let _cv_ be the CharacterValue of |CharacterEscape|.
 690 |           1. Let _ch_ be the character whose character value is _cv_.
 691 |           1. Let _A_ be a one-element CharSet containing the character _ch_.
 692 |           1. Return CharacterSetMatcher(_A_, *false*, _direction_<ins>, _modifiers_</ins>).
 693 |         </emu-alg>
 694 |         <emu-grammar>AtomEscape :: CharacterClassEscape</emu-grammar>
 695 |         <emu-alg>
 696 |           1. Let _A_ be CompileToCharSet of |CharacterClassEscape|.
 697 |           1. Return CharacterSetMatcher(_A_, *false*, _direction_<ins>, _modifiers_</ins>).
 698 |         </emu-alg>
 699 |         <emu-grammar>AtomEscape :: `k` GroupName</emu-grammar>
 700 |         <emu-alg>
 701 |           1. Search the enclosing |Pattern| for an instance of a |GroupSpecifier| containing a |RegExpIdentifierName| which has a CapturingGroupName equal to the CapturingGroupName of the |RegExpIdentifierName| contained in |GroupName|.
 702 |           1. Assert: A unique such |GroupSpecifier| is found.
 703 |           1. Let _parenIndex_ be the number of left-capturing parentheses in the entire regular expression that occur to the left of the located |GroupSpecifier|. This is the total number of <emu-grammar>Atom :: `(` GroupSpecifier Disjunction `)`</emu-grammar> Parse Nodes prior to or enclosing the located |GroupSpecifier|, including its immediately enclosing |Atom|.
 704 |           1. Return BackreferenceMatcher(_parenIndex_, _direction_<ins>, _modifiers_</ins>).
 705 |         </emu-alg>
 706 | 
 707 |         <emu-clause id="sec-runtime-semantics-charactersetmatcher-abstract-operation" type="abstract operation">
 708 |           <h1>
 709 |             CharacterSetMatcher (
 710 |               _A_: a CharSet,
 711 |               _invert_: a Boolean,
 712 |               _direction_: ~forward~ or ~backward~,
 713 |               <ins>_modifiers_: a Modifiers Record,</ins>
 714 |             ): a Matcher
 715 |           </h1>
 716 |           <dl class="header">
 717 |           </dl>
 718 |           <emu-alg>
 719 |             1. Return a new Matcher with parameters (_x_, _c_) that captures _A_, _invert_, <del>and _direction_</del><ins>_direction_, and _modifiers_</ins> and performs the following steps when called:
 720 |               1. Assert: _x_ is a State.
 721 |               1. Assert: _c_ is a Continuation.
 722 |               1. Let _e_ be _x_'s _endIndex_.
 723 |               1. If _direction_ is ~forward~, let _f_ be _e_ + 1.
 724 |               1. Else, let _f_ be _e_ - 1.
 725 |               1. If _f_ &lt; 0 or _f_ &gt; _InputLength_, return ~failure~.
 726 |               1. Let _index_ be min(_e_, _f_).
 727 |               1. Let _ch_ be the character _Input_[_index_].
 728 |               1. Let _cc_ be Canonicalize(_ch_<ins>, _modifiers_</ins>).
 729 |               1. If there exists a member _a_ of _A_ such that Canonicalize(_a_<ins>, _modifiers_</ins>) is _cc_, let _found_ be *true*. Otherwise, let _found_ be *false*.
 730 |               1. If _invert_ is *false* and _found_ is *false*, return ~failure~.
 731 |               1. If _invert_ is *true* and _found_ is *true*, return ~failure~.
 732 |               1. Let _cap_ be _x_'s _captures_ List.
 733 |               1. Let _y_ be the State (_f_, _cap_).
 734 |               1. Return _c_(_y_).
 735 |           </emu-alg>
 736 |         </emu-clause>
 737 | 
 738 |         <emu-clause id="sec-backreference-matcher" type="abstract operation">
 739 |           <h1>
 740 |             BackreferenceMatcher (
 741 |               _n_: a positive integer,
 742 |               _direction_: ~forward~ or ~backward~,
 743 |               <ins>_modifiers_: a Modifiers Record,</ins>
 744 |             ): a Matcher
 745 |           </h1>
 746 |           <dl class="header">
 747 |           </dl>
 748 |           <emu-alg>
 749 |             1. Assert: _n_ &ge; 1.
 750 |             1. Return a new Matcher with parameters (_x_, _c_) that captures <del>_n_ and _direction_</del><ins>_n_, _direction_, and _modifiers_</ins> and performs the following steps when called:
 751 |               1. Assert: _x_ is a State.
 752 |               1. Assert: _c_ is a Continuation.
 753 |               1. Let _cap_ be _x_'s _captures_ List.
 754 |               1. Let _s_ be _cap_[_n_].
 755 |               1. If _s_ is *undefined*, return _c_(_x_).
 756 |               1. Let _e_ be _x_'s _endIndex_.
 757 |               1. Let _len_ be the number of elements in _s_.
 758 |               1. If _direction_ is ~forward~, let _f_ be _e_ + _len_.
 759 |               1. Else, let _f_ be _e_ - _len_.
 760 |               1. If _f_ &lt; 0 or _f_ &gt; _InputLength_, return ~failure~.
 761 |               1. Let _g_ be min(_e_, _f_).
 762 |               1. If there exists an integer _i_ between 0 (inclusive) and _len_ (exclusive) such that Canonicalize(_s_[_i_]<ins>, _modifiers_</ins>) is not the same character value as Canonicalize(_Input_[_g_ + _i_]<ins>, _modifiers_</ins>), return ~failure~.
 763 |               1. Let _y_ be the State (_f_, _cap_).
 764 |               1. Return _c_(_y_).
 765 |           </emu-alg>
 766 |         </emu-clause>
 767 | 
 768 |         <emu-clause id="sec-runtime-semantics-canonicalize-ch" type="abstract operation">
 769 |           <h1>
 770 |             Canonicalize (
 771 |               _ch_: a character,
 772 |               <ins>_modifiers_: a Modifiers Record,</ins>
 773 |             ): a character
 774 |           </h1>
 775 |           <dl class="header">
 776 |           </dl>
 777 |           <emu-alg>
 778 |             1. If _Unicode_ is *true* and <del>_IgnoreCase_</del><ins>_modifiers_.[[IgnoreCase]]</ins> is *true*, then
 779 |               1. If the file CaseFolding.txt of the Unicode Character Database provides a simple or common case folding mapping for _ch_, return the result of applying that mapping to _ch_.
 780 |               1. Return _ch_.
 781 |             1. If <del>_IgnoreCase_</del><ins>_modifiers_.[[IgnoreCase]]</ins> is *false*, return _ch_.
 782 |             1. Assert: _ch_ is a UTF-16 code unit.
 783 |             1. Let _cp_ be the code point whose numeric value is that of _ch_.
 784 |             1. Let _u_ be the result of toUppercase(&laquo; _cp_ &raquo;), according to the Unicode Default Case Conversion algorithm.
 785 |             1. Let _uStr_ be CodePointsToString(_u_).
 786 |             1. If _uStr_ does not consist of a single code unit, return _ch_.
 787 |             1. Let _cu_ be _uStr_'s single code unit element.
 788 |             1. If the numeric value of _ch_ &ge; 128 and the numeric value of _cu_ &lt; 128, return _ch_.
 789 |             1. Return _cu_.
 790 |           </emu-alg>
 791 |           <emu-note>
 792 |             <p>Parentheses of the form `(` |Disjunction| `)` serve both to group the components of the |Disjunction| pattern together and to save the result of the match. The result can be used either in a backreference (`\\` followed by a non-zero decimal number), referenced in a replace String, or returned as part of an array from the regular expression matching Abstract Closure. To inhibit the capturing behaviour of parentheses, use the form `(?:` |Disjunction| `)` instead.</p>
 793 |           </emu-note>
 794 |           <emu-note>
 795 |             <p>The form `(?=` |Disjunction| `)` specifies a zero-width positive lookahead. In order for it to succeed, the pattern inside |Disjunction| must match at the current position, but the current position is not advanced before matching the sequel. If |Disjunction| can match at the current position in several ways, only the first one is tried. Unlike other regular expression operators, there is no backtracking into a `(?=` form (this unusual behaviour is inherited from Perl). This only matters when the |Disjunction| contains capturing parentheses and the sequel of the pattern contains backreferences to those captures.</p>
 796 |             <p>For example,</p>
 797 |             <pre><code class="javascript">/(?=(a+))/.exec("baaabac")</code></pre>
 798 |             <p>matches the empty String immediately after the first `b` and therefore returns the array:</p>
 799 |             <pre><code class="javascript">["", "aaa"]</code></pre>
 800 |             <p>To illustrate the lack of backtracking into the lookahead, consider:</p>
 801 |             <pre><code class="javascript">/(?=(a+))a*b\1/.exec("baaabac")</code></pre>
 802 |             <p>This expression returns</p>
 803 |             <pre><code class="javascript">["aba", "a"]</code></pre>
 804 |             <p>and not:</p>
 805 |             <pre><code class="javascript">["aaaba", "a"]</code></pre>
 806 |           </emu-note>
 807 |           <emu-note>
 808 |             <p>The form `(?!` |Disjunction| `)` specifies a zero-width negative lookahead. In order for it to succeed, the pattern inside |Disjunction| must fail to match at the current position. The current position is not advanced before matching the sequel. |Disjunction| can contain capturing parentheses, but backreferences to them only make sense from within |Disjunction| itself. Backreferences to these capturing parentheses from elsewhere in the pattern always return *undefined* because the negative lookahead must fail for the pattern to succeed. For example,</p>
 809 |             <pre><code class="javascript">/(.*?)a(?!(a+)b\2c)\2(.*)/.exec("baaabaac")</code></pre>
 810 |             <p>looks for an `a` not immediately followed by some positive number n of `a`'s, a `b`, another n `a`'s (specified by the first `\\2`) and a `c`. The second `\\2` is outside the negative lookahead, so it matches against *undefined* and therefore always succeeds. The whole expression returns the array:</p>
 811 |             <pre><code class="javascript">["baaabaac", "ba", undefined, "abaac"]</code></pre>
 812 |           </emu-note>
 813 |           <emu-note>
 814 |             <p>In case-insignificant matches when _Unicode_ is *true*, all characters are implicitly case-folded using the simple mapping provided by the Unicode standard immediately before they are compared. The simple mapping always maps to a single code point, so it does not map, for example, `&szlig;` (U+00DF) to `SS`. It may however map a code point outside the Basic Latin range to a character within, for example, `&#x17f;` (U+017F) to `s`. Such characters are not mapped if _Unicode_ is *false*. This prevents Unicode code points such as U+017F and U+212A from matching regular expressions such as `/[a-z]/i`, but they will match `/[a-z]/ui`.</p>
 815 |           </emu-note>
 816 |         </emu-clause>
 817 |       </emu-clause>
 818 | 
 819 |       <emu-clause id="sec-compiletocharset" type="sdo" oldids="sec-classranges,sec-nonemptyclassranges,sec-nonemptyclassrangesnodash,sec-classatom,sec-classatomnodash,sec-classescape,sec-characterclassescape">
 820 |         <h1>Runtime Semantics: CompileToCharSet ( ): a CharSet</h1>
 821 |         <dl class="header">
 822 |         </dl>
 823 |         <emu-note>
 824 |           <p>This section is amended in <emu-xref href="#sec-compiletocharset-annexb"></emu-xref>.</p>
 825 |         </emu-note>
 826 | 
 827 |         <!-- ClassRanges -->
 828 |         <emu-grammar>ClassRanges :: [empty]</emu-grammar>
 829 |         <emu-alg>
 830 |           1. Return the empty CharSet.
 831 |         </emu-alg>
 832 | 
 833 |         <!-- NonemptyClassRanges -->
 834 |         <emu-grammar>NonemptyClassRanges :: ClassAtom NonemptyClassRangesNoDash</emu-grammar>
 835 |         <emu-alg>
 836 |           1. Let _A_ be CompileToCharSet of |ClassAtom|.
 837 |           1. Let _B_ be CompileToCharSet of |NonemptyClassRangesNoDash|.
 838 |           1. Return the union of CharSets _A_ and _B_.
 839 |         </emu-alg>
 840 |         <emu-grammar>NonemptyClassRanges :: ClassAtom `-` ClassAtom ClassRanges</emu-grammar>
 841 |         <emu-alg>
 842 |           1. Let _A_ be CompileToCharSet of the first |ClassAtom|.
 843 |           1. Let _B_ be CompileToCharSet of the second |ClassAtom|.
 844 |           1. Let _C_ be CompileToCharSet of |ClassRanges|.
 845 |           1. Let _D_ be CharacterRange(_A_, _B_).
 846 |           1. Return the union of _D_ and _C_.
 847 |         </emu-alg>
 848 | 
 849 |         <!-- NonemptyClassRangesNoDash -->
 850 |         <emu-grammar>NonemptyClassRangesNoDash :: ClassAtomNoDash NonemptyClassRangesNoDash</emu-grammar>
 851 |         <emu-alg>
 852 |           1. Let _A_ be CompileToCharSet of |ClassAtomNoDash|.
 853 |           1. Let _B_ be CompileToCharSet of |NonemptyClassRangesNoDash|.
 854 |           1. Return the union of CharSets _A_ and _B_.
 855 |         </emu-alg>
 856 |         <emu-grammar>NonemptyClassRangesNoDash :: ClassAtomNoDash `-` ClassAtom ClassRanges</emu-grammar>
 857 |         <emu-alg>
 858 |           1. Let _A_ be CompileToCharSet of |ClassAtomNoDash|.
 859 |           1. Let _B_ be CompileToCharSet of |ClassAtom|.
 860 |           1. Let _C_ be CompileToCharSet of |ClassRanges|.
 861 |           1. Let _D_ be CharacterRange(_A_, _B_).
 862 |           1. Return the union of _D_ and _C_.
 863 |         </emu-alg>
 864 |         <emu-note>
 865 |           <p>|ClassRanges| can expand into a single |ClassAtom| and/or ranges of two |ClassAtom| separated by dashes. In the latter case the |ClassRanges| includes all characters between the first |ClassAtom| and the second |ClassAtom|, inclusive; an error occurs if either |ClassAtom| does not represent a single character (for example, if one is \w) or if the first |ClassAtom|'s character value is greater than the second |ClassAtom|'s character value.</p>
 866 |         </emu-note>
 867 |         <emu-note>
 868 |           <p>Even if the pattern ignores case, the case of the two ends of a range is significant in determining which characters belong to the range. Thus, for example, the pattern `/[E-F]/i` matches only the letters `E`, `F`, `e`, and `f`, while the pattern `/[E-f]/i` matches all upper and lower-case letters in the Unicode Basic Latin block as well as the symbols `[`, `\\`, `]`, `^`, `_`, and <code>`</code>.</p>
 869 |         </emu-note>
 870 |         <emu-note>
 871 |           <p>A `-` character can be treated literally or it can denote a range. It is treated literally if it is the first or last character of |ClassRanges|, the beginning or end limit of a range specification, or immediately follows a range specification.</p>
 872 |         </emu-note>
 873 | 
 874 |         <!-- ClassAtom -->
 875 |         <emu-grammar>ClassAtom :: `-`</emu-grammar>
 876 |         <emu-alg>
 877 |           1. Return the CharSet containing the single character `-` U+002D (HYPHEN-MINUS).
 878 |         </emu-alg>
 879 | 
 880 |         <!-- ClassAtomNoDash -->
 881 |         <emu-grammar>ClassAtomNoDash :: SourceCharacter but not one of `\` or `]` or `-`</emu-grammar>
 882 |         <emu-alg>
 883 |           1. Return the CharSet containing the character matched by |SourceCharacter|.
 884 |         </emu-alg>
 885 | 
 886 |         <!-- ClassEscape -->
 887 |         <emu-grammar>
 888 |           ClassEscape :: `b`
 889 | 
 890 |           ClassEscape :: `-`
 891 | 
 892 |           ClassEscape :: CharacterEscape
 893 |         </emu-grammar>
 894 |         <emu-alg>
 895 |           1. Let _cv_ be the CharacterValue of this |ClassEscape|.
 896 |           1. Let _c_ be the character whose character value is _cv_.
 897 |           1. Return the CharSet containing the single character _c_.
 898 |         </emu-alg>
 899 |         <emu-note>
 900 |           <p>A |ClassAtom| can use any of the escape sequences that are allowed in the rest of the regular expression except for `\\b`, `\\B`, and backreferences. Inside a |CharacterClass|, `\\b` means the backspace character, while `\\B` and backreferences raise errors. Using a backreference inside a |ClassAtom| causes an error.</p>
 901 |         </emu-note>
 902 | 
 903 |         <!-- CharacterClassEscape -->
 904 |         <emu-grammar>CharacterClassEscape :: `d`</emu-grammar>
 905 |         <emu-alg>
 906 |           1. Return the ten-element CharSet containing the characters `0` through `9` inclusive.
 907 |         </emu-alg>
 908 |         <emu-grammar>CharacterClassEscape :: `D`</emu-grammar>
 909 |         <emu-alg>
 910 |           1. Return the CharSet containing all characters not in the CharSet returned by <emu-grammar>CharacterClassEscape :: `d`</emu-grammar> .
 911 |         </emu-alg>
 912 |         <emu-grammar>CharacterClassEscape :: `s`</emu-grammar>
 913 |         <emu-alg>
 914 |           1. Return the CharSet containing all characters corresponding to a code point on the right-hand side of the |WhiteSpace| or |LineTerminator| productions.
 915 |         </emu-alg>
 916 |         <emu-grammar>CharacterClassEscape :: `S`</emu-grammar>
 917 |         <emu-alg>
 918 |           1. Return the CharSet containing all characters not in the CharSet returned by <emu-grammar>CharacterClassEscape :: `s`</emu-grammar> .
 919 |         </emu-alg>
 920 |         <emu-grammar>CharacterClassEscape :: `w`</emu-grammar>
 921 |         <emu-alg>
 922 |           1. Return <del>_WordCharacters_</del><ins>GetWordCharacters(_modifiers_)</ins>.
 923 |         </emu-alg>
 924 |         <emu-grammar>CharacterClassEscape :: `W`</emu-grammar>
 925 |         <emu-alg>
 926 |           1. Return the CharSet containing all characters not in the CharSet returned by <emu-grammar>CharacterClassEscape :: `w`</emu-grammar> .
 927 |         </emu-alg>
 928 |         <emu-grammar>CharacterClassEscape :: `p{` UnicodePropertyValueExpression `}`</emu-grammar>
 929 |         <emu-alg>
 930 |           1. Return the CharSet containing all Unicode code points included in CompileToCharSet of |UnicodePropertyValueExpression|.
 931 |         </emu-alg>
 932 |         <emu-grammar>CharacterClassEscape :: `P{` UnicodePropertyValueExpression `}`</emu-grammar>
 933 |         <emu-alg>
 934 |           1. Return the CharSet containing all Unicode code points not included in CompileToCharSet of |UnicodePropertyValueExpression|.
 935 |         </emu-alg>
 936 |         <emu-grammar>UnicodePropertyValueExpression :: UnicodePropertyName `=` UnicodePropertyValue</emu-grammar>
 937 |         <emu-alg>
 938 |           1. Let _ps_ be SourceText of |UnicodePropertyName|.
 939 |           1. Let _p_ be UnicodeMatchProperty(_ps_).
 940 |           1. Assert: _p_ is a Unicode property name or property alias listed in the &ldquo;Property name and aliases&rdquo; column of <emu-xref href="#table-nonbinary-unicode-properties"></emu-xref>.
 941 |           1. Let _vs_ be SourceText of |UnicodePropertyValue|.
 942 |           1. Let _v_ be UnicodeMatchPropertyValue(_p_, _vs_).
 943 |           1. Return the CharSet containing all Unicode code points whose character database definition includes the property _p_ with value _v_.
 944 |         </emu-alg>
 945 |         <emu-grammar>UnicodePropertyValueExpression :: LoneUnicodePropertyNameOrValue</emu-grammar>
 946 |         <emu-alg>
 947 |           1. Let _s_ be SourceText of |LoneUnicodePropertyNameOrValue|.
 948 |           1. If UnicodeMatchPropertyValue(`General_Category`, _s_) is identical to a List of Unicode code points that is the name of a Unicode general category or general category alias listed in the &ldquo;Property value and aliases&rdquo; column of <emu-xref href="#table-unicode-general-category-values"></emu-xref>, then
 949 |             1. Return the CharSet containing all Unicode code points whose character database definition includes the property &ldquo;General_Category&rdquo; with value _s_.
 950 |           1. Let _p_ be UnicodeMatchProperty(_s_).
 951 |           1. Assert: _p_ is a binary Unicode property or binary property alias listed in the &ldquo;Property name and aliases&rdquo; column of <emu-xref href="#table-binary-unicode-properties"></emu-xref>.
 952 |           1. Return the CharSet containing all Unicode code points whose character database definition includes the property _p_ with value &ldquo;True&rdquo;.
 953 |         </emu-alg>
 954 |       </emu-clause>
 955 | 
 956 |       <ins class="block">
 957 |       <emu-clause id="sec-getwordcharacters" type="abstract operation">
 958 |         <h1>
 959 |           <ins>
 960 |           GetWordCharacters (
 961 |             _modifiers_: a Modifiers Record,
 962 |           ): a CharSet
 963 |           </ins>
 964 |         </h1>
 965 |         <dl class="header">
 966 |         </dl>
 967 |         <emu-alg>
 968 |           1. Let _wordCharacters_ be the mathematical set that is the union of all sixty-three characters in *"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789_"* (letters, numbers, and U+005F (LOW LINE) in the Unicode Basic Latin block) and all characters _c_ for which _c_ is not in that set but Canonicalize(_c_, _modifiers_) is.
 969 |           1. Return _wordCharacters_.
 970 |         </emu-alg>
 971 |         <emu-note>
 972 |           <p>_wordCharacters_ cannot contain more than sixty-three characters unless _Unicode_ and _modifiers_.[[IgnoreCase]] are both *true*.</p>
 973 |         </emu-note>
 974 |       </emu-clause>
 975 | 
 976 |       <emu-clause id="sec-updatemodifiers" type="abstract operation">
 977 |         <h1>
 978 |           <ins>
 979 |           UpdateModifiers (
 980 |             _modifiers_: a Modifiers Record,
 981 |             _add_: a String,
 982 |             _remove_: a String,
 983 |           ): a Modifiers Record
 984 |           </ins>
 985 |         </h1>
 986 |         <dl class="header">
 987 |         </dl>
 988 |         <emu-alg>
 989 |           1. Let _dotAll_ be _modifiers_.[[DotAll]].
 990 |           1. Let _ignoreCase_ be _modifiers_.[[IgnoreCase]].
 991 |           1. Let _multiline_ be _modifiers_.[[Multiline]].
 992 |           1. If _add_ contains *"s"*, set _dotAll_ to *true*.
 993 |           1. If _add_ contains *"i"*, set _ignoreCase_ to *true*.
 994 |           1. If _add_ contains *"m"*, set _multiline_ to *true*.
 995 |           1. If _remove_ contains *"s"*, set _dotAll_ to *false*.
 996 |           1. If _remove_ contains *"i"*, set _ignoreCase_ to *false*.
 997 |           1. If _remove_ contains *"m"*, set _multiline_ to *false*.
 998 |           1. Return the Modifiers Record { [[DotAll]]: _dotAll_, [[IgnoreCase]]: _ignoreCase_, [[Multiline]]: _multiline_ }.
 999 |         </emu-alg>
1000 |       </emu-clause>
1001 |       </ins>
1002 |     </emu-clause>
1003 |   </emu-clause>
1004 | </emu-clause>
1005 | 
1006 | <emu-annex id="sec-additional-ecmascript-features-for-web-browsers" namespace="annexB" normative>
1007 |   <h1>Additional ECMAScript Features for Web Browsers</h1>
1008 | 
1009 |   <emu-annex id="sec-additional-syntax">
1010 |     <h1>Additional Syntax</h1>
1011 | 
1012 |     <emu-annex id="sec-regular-expressions-patterns">
1013 |       <h1>Regular Expressions Patterns</h1>
1014 |       <p>The syntax of <emu-xref href="#sec-patterns"></emu-xref> is modified and extended as follows. These changes introduce ambiguities that are broken by the ordering of grammar productions and by contextual information. When parsing using the following grammar, each alternative is considered only if previous production alternatives do not match.</p>
1015 |       <p>This alternative pattern grammar and semantics only changes the syntax and semantics of BMP patterns. The following grammar extensions include productions parameterized with the [UnicodeMode] parameter. However, none of these extensions change the syntax of Unicode patterns recognized when parsing with the [UnicodeMode] parameter present on the goal symbol.</p>
1016 |       <h2>Syntax</h2>
1017 |       <emu-grammar type="definition">
1018 |         Term[UnicodeMode, N] ::
1019 |           [+UnicodeMode] Assertion[+UnicodeMode, ?N]
1020 |           [+UnicodeMode] Atom[+UnicodeMode, ?N] Quantifier
1021 |           [+UnicodeMode] Atom[+UnicodeMode, ?N]
1022 |           [~UnicodeMode] QuantifiableAssertion[?N] Quantifier
1023 |           [~UnicodeMode] Assertion[~UnicodeMode, ?N]
1024 |           [~UnicodeMode] ExtendedAtom[?N] Quantifier
1025 |           [~UnicodeMode] ExtendedAtom[?N]
1026 | 
1027 |         Assertion[UnicodeMode, N] ::
1028 |           `^`
1029 |           `$`
1030 |           `\` `b`
1031 |           `\` `B`
1032 |           [+UnicodeMode] `(` `?` `=` Disjunction[+UnicodeMode, ?N] `)`
1033 |           [+UnicodeMode] `(` `?` `!` Disjunction[+UnicodeMode, ?N] `)`
1034 |           [~UnicodeMode] QuantifiableAssertion[?N]
1035 |           `(` `?` `&lt;=` Disjunction[?UnicodeMode, ?N] `)`
1036 |           `(` `?` `&lt;!` Disjunction[?UnicodeMode, ?N] `)`
1037 | 
1038 |         QuantifiableAssertion[N] ::
1039 |           `(` `?` `=` Disjunction[~UnicodeMode, ?N] `)`
1040 |           `(` `?` `!` Disjunction[~UnicodeMode, ?N] `)`
1041 | 
1042 |         ExtendedAtom[N] ::
1043 |           `.`
1044 |           `\` AtomEscape[~UnicodeMode, ?N]
1045 |           `\` [lookahead == `c`]
1046 |           CharacterClass[~UnicodeMode]
1047 |           `(` Disjunction[~UnicodeMode, ?N] `)`
1048 |           <del>`(` `?` `:` Disjunction[~UnicodeMode, ?N] `)`</del>
1049 |           <ins>`(` `?` RegularExpressionFlags `:` Disjunction[~UnicodeMode, ?N] `)`</ins>
1050 |           <ins>`(` `?` RegularExpressionFlags `-` RegularExpressionFlags `:` Disjunction[~UnicodeMode, ?N] `)`</ins>
1051 |           InvalidBracedQuantifier
1052 |           ExtendedPatternCharacter
1053 | 
1054 |         InvalidBracedQuantifier ::
1055 |           `{` DecimalDigits[~Sep] `}`
1056 |           `{` DecimalDigits[~Sep] `,` `}`
1057 |           `{` DecimalDigits[~Sep] `,` DecimalDigits[~Sep] `}`
1058 | 
1059 |         ExtendedPatternCharacter ::
1060 |           SourceCharacter but not one of `^` `$` `\` `.` `*` `+` `?` `(` `)` `[` `|`
1061 | 
1062 |         AtomEscape[UnicodeMode, N] ::
1063 |           [+UnicodeMode] DecimalEscape
1064 |           [~UnicodeMode] DecimalEscape [> but only if the CapturingGroupNumber of |DecimalEscape| is &le; _NcapturingParens_]
1065 |           CharacterClassEscape[?UnicodeMode]
1066 |           CharacterEscape[?UnicodeMode, ?N]
1067 |           [+N] `k` GroupName[?UnicodeMode]
1068 | 
1069 |         CharacterEscape[UnicodeMode, N] ::
1070 |           ControlEscape
1071 |           `c` ControlLetter
1072 |           `0` [lookahead &notin; DecimalDigit]
1073 |           HexEscapeSequence
1074 |           RegExpUnicodeEscapeSequence[?UnicodeMode]
1075 |           [~UnicodeMode] LegacyOctalEscapeSequence
1076 |           IdentityEscape[?UnicodeMode, ?N]
1077 | 
1078 |         IdentityEscape[UnicodeMode, N] ::
1079 |           [+UnicodeMode] SyntaxCharacter
1080 |           [+UnicodeMode] `/`
1081 |           [~UnicodeMode] SourceCharacterIdentityEscape[?N]
1082 | 
1083 |         SourceCharacterIdentityEscape[N] ::
1084 |           [~N] SourceCharacter but not `c`
1085 |           [+N] SourceCharacter but not one of `c` or `k`
1086 | 
1087 |         ClassAtomNoDash[UnicodeMode, N] ::
1088 |           SourceCharacter but not one of `\` or `]` or `-`
1089 |           `\` ClassEscape[?UnicodeMode, ?N]
1090 |           `\` [lookahead == `c`]
1091 | 
1092 |         ClassEscape[UnicodeMode, N] ::
1093 |           `b`
1094 |           [+UnicodeMode] `-`
1095 |           [~UnicodeMode] `c` ClassControlLetter
1096 |           CharacterClassEscape[?UnicodeMode]
1097 |           CharacterEscape[?UnicodeMode, ?N]
1098 | 
1099 |         ClassControlLetter ::
1100 |           DecimalDigit
1101 |           `_`
1102 |       </emu-grammar>
1103 |       <emu-note>
1104 |         <p>When the same left-hand side occurs with both [+UnicodeMode] and [\~UnicodeMode] guards, it is to control the disambiguation priority.</p>
1105 |       </emu-note>
1106 |     </emu-annex>
1107 |   </emu-annex>
1108 | </emu-annex>


--------------------------------------------------------------------------------