├── .gitignore
├── .gitattributes
├── .pr-preview.json
├── .editorconfig
├── .github
│   ├── ISSUE_TEMPLATE
│   │   ├── config.yml
│   │   ├── 0-new-issue.yml
│   │   └── 1-new-feature.yml
│   └── workflows
│       └── build.yml
├── Makefile
├── README.md
├── LICENSE
└── review-drafts
    ├── 2018-07.bs
    ├── 2019-01.bs
    └── 2019-07.bs


/.gitignore:
--------------------------------------------------------------------------------
1 | /infra.spec.whatwg.org/
2 | /deploy.sh
3 | /infra.html
4 | 


--------------------------------------------------------------------------------
/.gitattributes:
--------------------------------------------------------------------------------
1 | *    text=auto
2 | *.bs diff=html linguist-language=HTML
3 | 


--------------------------------------------------------------------------------
/.pr-preview.json:
--------------------------------------------------------------------------------
 1 | {
 2 |   "src_file": "infra.bs",
 3 |   "type": "bikeshed",
 4 |   "params": {
 5 |     "force": 1,
 6 |     "md-status": "LS-PR",
 7 |     "md-Text-Macro": "PR-NUMBER {{ pull_request.number }}"
 8 |   }
 9 | }
10 | 


--------------------------------------------------------------------------------
/.editorconfig:
--------------------------------------------------------------------------------
 1 | root = true
 2 | 
 3 | [*]
 4 | end_of_line = lf
 5 | insert_final_newline = true
 6 | charset = utf-8
 7 | indent_size = 2
 8 | indent_style = space
 9 | trim_trailing_whitespace = true
10 | max_line_length = 100
11 | 
12 | [Makefile]
13 | indent_style = tab
14 | 
15 | [*.md]
16 | max_line_length = off
17 | 
18 | [*.bs]
19 | indent_size = 1
20 | 
21 | [*.py]
22 | indent_size = 4
23 | 


--------------------------------------------------------------------------------
/.github/ISSUE_TEMPLATE/config.yml:
--------------------------------------------------------------------------------
1 | blank_issues_enabled: false
2 | contact_links:
3 |   - name: Chat
4 |     url: https://whatwg.org/chat
5 |     about: Please do reach out with questions and feedback!
6 |   - name: Stack Overflow
7 |     url: https://stackoverflow.com/
8 |     about: If you're having trouble building a web page, this is not the right repository. Consider asking your question on Stack Overflow instead.
9 | 


--------------------------------------------------------------------------------
/.github/workflows/build.yml:
--------------------------------------------------------------------------------
 1 | name: Build
 2 | 
 3 | on:
 4 |   pull_request:
 5 |     branches:
 6 |     - main
 7 |   push:
 8 |     branches:
 9 |     - main
10 |   workflow_dispatch:
11 | 
12 | jobs:
13 |   build:
14 |     name: Build
15 |     runs-on: ubuntu-22.04
16 |     steps:
17 |     - uses: actions/checkout@v3
18 |       with:
19 |         fetch-depth: 2
20 |     - uses: actions/setup-python@v4
21 |       with:
22 |         python-version: "3.11"
23 |     - run: pip install bikeshed && bikeshed update
24 |     # Note: `make deploy` will do a deploy dry run on PRs.
25 |     - run: make deploy
26 |       env:
27 |         SERVER: ${{ secrets.MARQUEE_SERVER }}
28 |         SERVER_PUBLIC_KEY: ${{ secrets.MARQUEE_PUBLIC_KEY }}
29 |         SERVER_DEPLOY_KEY: ${{ secrets.MARQUEE_DEPLOY_KEY }}
30 | 


--------------------------------------------------------------------------------
/.github/ISSUE_TEMPLATE/0-new-issue.yml:
--------------------------------------------------------------------------------
 1 | name: New issue
 2 | description: File a new issue against the Infra Standard.
 3 | body:
 4 |   - type: markdown
 5 |     attributes:
 6 |       value: |
 7 |         Before filling out this form, please familiarize yourself with the [Code of Conduct](https://whatwg.org/code-of-conduct). You might also find the [FAQ](https://whatwg.org/faq) and [Working Mode](https://whatwg.org/working-mode) useful.
 8 | 
 9 |         If at any point you have questions, please reach out to us on [Chat](https://whatwg.org/chat).
10 |   - type: textarea
11 |     attributes:
12 |       label: "What is the issue with the Infra Standard?"
13 |     validations:
14 |       required: true
15 |   - type: markdown
16 |     attributes:
17 |       value: "Thank you for taking the time to improve the Infra Standard!"
18 | 


--------------------------------------------------------------------------------
/Makefile:
--------------------------------------------------------------------------------
 1 | SHELL=/bin/bash -o pipefail
 2 | .PHONY: local remote deploy
 3 | 
 4 | remote: infra.bs
 5 | 	@ (HTTP_STATUS=$$(curl https://api.csswg.org/bikeshed/ \
 6 | 	                       --output infra.html \
 7 | 	                       --write-out "%{http_code}" \
 8 | 	                       --header "Accept: text/plain, text/html" \
 9 | 	                       -F die-on=warning \
10 | 	                       -F md-Text-Macro="COMMIT-SHA LOCAL COPY" \
11 | 	                       -F file=@infra.bs) && \
12 | 	[[ "$$HTTP_STATUS" -eq "200" ]]) || ( \
13 | 		echo ""; cat infra.html; echo ""; \
14 | 		rm -f infra.html; \
15 | 		exit 22 \
16 | 	);
17 | 
18 | local: infra.bs
19 | 	bikeshed spec infra.bs infra.html --md-Text-Macro="COMMIT-SHA LOCAL-COPY"
20 | 
21 | deploy: infra.bs
22 | 	curl --remote-name --fail https://resources.whatwg.org/build/deploy.sh
23 | 	bash ./deploy.sh
24 | 


--------------------------------------------------------------------------------
/.github/ISSUE_TEMPLATE/1-new-feature.yml:
--------------------------------------------------------------------------------
 1 | name: New feature
 2 | description: Request a new feature in the Infra Standard.
 3 | labels: ["addition/proposal", "needs implementer interest"]
 4 | body:
 5 |   - type: markdown
 6 |     attributes:
 7 |       value: |
 8 |         Before filling out this form, please familiarize yourself with the [Code of Conduct](https://whatwg.org/code-of-conduct), [FAQ](https://whatwg.org/faq), and [Working Mode](https://whatwg.org/working-mode). They help with setting expectations and making sure you know what is required. The FAQ ["How should I go about proposing new features to WHATWG standards?"](https://whatwg.org/faq#adding-new-features) is especially relevant.
 9 | 
10 |         If at any point you have questions, please reach out to us on [Chat](https://whatwg.org/chat).
11 |   - type: textarea
12 |     attributes:
13 |       label: "What problem are you trying to solve?"
14 |     validations:
15 |       required: true
16 |   - type: textarea
17 |     attributes:
18 |       label: "What solutions exist today?"
19 |   - type: textarea
20 |     attributes:
21 |       label: "How would you solve it?"
22 |   - type: textarea
23 |     attributes:
24 |       label: "Anything else?"
25 |   - type: markdown
26 |     attributes:
27 |       value: "Thank you for taking the time to improve the Infra Standard!"
28 | 


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
  1 | This repository hosts the [Infra Standard](https://infra.spec.whatwg.org/).
  2 | 
  3 | ## Code of conduct
  4 | 
  5 | We are committed to providing a friendly, safe, and welcoming environment for all. Please read and respect the [Code of Conduct](https://whatwg.org/code-of-conduct).
  6 | 
  7 | ## Contribution opportunities
  8 | 
  9 | Folks notice minor and larger issues with the Infra Standard all the time and we'd love your help fixing those. Pull requests for typographical and grammar errors are also most welcome.
 10 | 
  11 | Issues labeled ["good first issue"](https://github.com/whatwg/infra/labels/good%20first%20issue) are a good place to get a taste for editing the Infra Standard. Note that we don't assign issues and there's no reason to ask for availability either; just provide a pull request.
 12 | 
 13 | If you are thinking of suggesting a new feature, read through the [FAQ](https://whatwg.org/faq) and [Working Mode](https://whatwg.org/working-mode) documents to get yourself familiarized with the process.
 14 | 
 15 | We'd be happy to help you with all of this [on Chat](https://whatwg.org/chat).
 16 | 
 17 | ## Pull requests
 18 | 
 19 | In short, change `infra.bs` and submit your patch, with a [good commit message](https://github.com/whatwg/meta/blob/main/COMMITTING.md).
 20 | 
 21 | Please add your name to the Acknowledgments section in your first pull request, even for trivial fixes. The names are sorted lexicographically.
 22 | 
 23 | To ensure your patch meets all the necessary requirements, please also see the [Contributor Guidelines](https://github.com/whatwg/meta/blob/main/CONTRIBUTING.md). Editors of the Infra Standard are expected to follow the [Maintainer Guidelines](https://github.com/whatwg/meta/blob/main/MAINTAINERS.md).
 24 | 
 25 | ## Tests
 26 | 
 27 | Tests are an essential part of the standardization process and will need to be created or adjusted as changes to the standard are made. Tests for the Infra Standard can be found in the `infra/` directory of [`web-platform-tests/wpt`](https://github.com/web-platform-tests/wpt).
 28 | 
 29 | A dashboard showing the tests running against browser engines can be seen at [wpt.fyi/results/infra](https://wpt.fyi/results/infra).
 30 | 
 31 | ## Building "locally"
 32 | 
 33 | For quick local iteration, run `make`; this will use a web service to build the standard, so that you don't have to install anything. See more in the [Contributor Guidelines](https://github.com/whatwg/meta/blob/main/CONTRIBUTING.md#building).
 34 | 
 35 | ## Formatting
 36 | 
 37 | Use a column width of 100 characters.
 38 | 
 39 | Do not use newlines inside "inline" elements, even if that means exceeding the column width requirement.
 40 | ```html
 41 | <p>The
 42 | <dfn method for=DOMTokenList lt=remove(tokens)|remove()><code>remove(<var>tokens</var>&hellip;)</code></dfn>
 43 | method, when invoked, must run these steps:
 44 | ```
 45 | is okay and
  46 | ```html
 47 | <p>The <dfn method for=DOMTokenList
 48 | lt=remove(tokens)|remove()><code>remove(<var>tokens</var>&hellip;)</code></dfn> method, when
 49 | invoked, must run these steps:
 50 | ```
 51 | is not.
 52 | 
 53 | Using newlines between "inline" element tag names and their content is also forbidden. (This actually alters the content, by adding spaces.) That is
 54 | ```html
 55 | <a>token</a>
 56 | ```
 57 | is fine and
 58 | ```html
 59 | <a>token
 60 | </a>
 61 | ```
 62 | is not.
 63 | 
 64 | An `<li>` element always has a `<p>` element inside it, unless it's a child of `<ul class=brief>`.
 65 | 
 66 | If a "block" element contains a single "block" element, do not put it on a newline.
 67 | 
 68 | Do not indent for anything except a new "block" element. For instance
 69 | ```html
 70 |  <li><p>For each <var>token</var> in <var>tokens</var>, in given order, that is not in
 71 |  <a>tokens</a>, append <var>token</var> to <a>tokens</a>.
 72 | ```
 73 | is not indented, but
 74 | ```html
 75 | <ol>
 76 |  <li>
 77 |   <p>For each <var>token</var> in <var>tokens</var>, run these substeps:
 78 | 
 79 |   <ol>
 80 |    <li><p>If <var>token</var> is the empty string, <a>throw</a> a {{SyntaxError}} exception.
 81 | ```
 82 | is.
 83 | 
 84 | End tags may be included (if done consistently) and attributes may be quoted (using double quotes), though the prevalent theme is to omit end tags and not quote attributes (unless they contain a space).
 85 | 
 86 | Place one newline between paragraphs (including list elements). Place three newlines before `<h2>`, and two newlines before other headings. This does not apply when a nested heading follows the parent heading.
 87 | ```html
 88 | <ul>
 89 |  <li><p>Do not place a newline above.
 90 | 
 91 |  <li><p>Place a newline above.
 92 | </ul>
 93 | 
 94 | <p>Place a newline above.
 95 | 
 96 | 
 97 | <h3>Place two newlines above.</h3>
 98 | 
 99 | <h4>Placing one newline is OK here.</h4>
100 | 
101 | 
102 | <h4>Place two newlines above.</h4>
103 | ```
104 | Use camel-case for variable names and "spaced" names for definitions, algorithms, etc.
105 | ```html
106 | <p>A <a for=/>request</a> has an associated
107 | <dfn export for=request id=concept-request-redirect-mode>redirect mode</dfn>,...
108 | ```
109 | ```html
110 | <p>Let <var>redirectMode</var> be <var>request</var>'s <a for=request>redirect mode</a>.
111 | ```
112 | 


--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
  1 | Copyright © WHATWG (Apple, Google, Mozilla, Microsoft).
  2 | 
  3 | This work is licensed under a Creative Commons Attribution 4.0 International
  4 | License. To the extent portions of it are incorporated into source code,
  5 | such portions in the source code are licensed under the BSD 3-Clause License instead.
  6 | 
  7 | - - - -
  8 | 
  9 | Creative Commons Attribution 4.0 International Public License
 10 | 
 11 | By exercising the Licensed Rights (defined below), You accept and agree
 12 | to be bound by the terms and conditions of this Creative Commons
 13 | Attribution 4.0 International Public License ("Public License"). To the
 14 | extent this Public License may be interpreted as a contract, You are
 15 | granted the Licensed Rights in consideration of Your acceptance of
 16 | these terms and conditions, and the Licensor grants You such rights in
 17 | consideration of benefits the Licensor receives from making the
 18 | Licensed Material available under these terms and conditions.
 19 | 
 20 | 
 21 | Section 1 -- Definitions.
 22 | 
 23 |   a. Adapted Material means material subject to Copyright and Similar
 24 |      Rights that is derived from or based upon the Licensed Material
 25 |      and in which the Licensed Material is translated, altered,
 26 |      arranged, transformed, or otherwise modified in a manner requiring
 27 |      permission under the Copyright and Similar Rights held by the
 28 |      Licensor. For purposes of this Public License, where the Licensed
 29 |      Material is a musical work, performance, or sound recording,
 30 |      Adapted Material is always produced where the Licensed Material is
 31 |      synched in timed relation with a moving image.
 32 | 
 33 |   b. Adapter's License means the license You apply to Your Copyright
 34 |      and Similar Rights in Your contributions to Adapted Material in
 35 |      accordance with the terms and conditions of this Public License.
 36 | 
 37 |   c. Copyright and Similar Rights means copyright and/or similar rights
 38 |      closely related to copyright including, without limitation,
 39 |      performance, broadcast, sound recording, and Sui Generis Database
 40 |      Rights, without regard to how the rights are labeled or
 41 |      categorized. For purposes of this Public License, the rights
 42 |      specified in Section 2(b)(1)-(2) are not Copyright and Similar
 43 |      Rights.
 44 | 
 45 |   d. Effective Technological Measures means those measures that, in the
 46 |      absence of proper authority, may not be circumvented under laws
 47 |      fulfilling obligations under Article 11 of the WIPO Copyright
 48 |      Treaty adopted on December 20, 1996, and/or similar international
 49 |      agreements.
 50 | 
 51 |   e. Exceptions and Limitations means fair use, fair dealing, and/or
 52 |      any other exception or limitation to Copyright and Similar Rights
 53 |      that applies to Your use of the Licensed Material.
 54 | 
 55 |   f. Licensed Material means the artistic or literary work, database,
 56 |      or other material to which the Licensor applied this Public
 57 |      License.
 58 | 
 59 |   g. Licensed Rights means the rights granted to You subject to the
 60 |      terms and conditions of this Public License, which are limited to
 61 |      all Copyright and Similar Rights that apply to Your use of the
 62 |      Licensed Material and that the Licensor has authority to license.
 63 | 
 64 |   h. Licensor means the individual(s) or entity(ies) granting rights
 65 |      under this Public License.
 66 | 
 67 |   i. Share means to provide material to the public by any means or
 68 |      process that requires permission under the Licensed Rights, such
 69 |      as reproduction, public display, public performance, distribution,
 70 |      dissemination, communication, or importation, and to make material
 71 |      available to the public including in ways that members of the
 72 |      public may access the material from a place and at a time
 73 |      individually chosen by them.
 74 | 
 75 |   j. Sui Generis Database Rights means rights other than copyright
 76 |      resulting from Directive 96/9/EC of the European Parliament and of
 77 |      the Council of 11 March 1996 on the legal protection of databases,
 78 |      as amended and/or succeeded, as well as other essentially
 79 |      equivalent rights anywhere in the world.
 80 | 
 81 |   k. You means the individual or entity exercising the Licensed Rights
 82 |      under this Public License. Your has a corresponding meaning.
 83 | 
 84 | 
 85 | Section 2 -- Scope.
 86 | 
 87 |   a. License grant.
 88 | 
 89 |        1. Subject to the terms and conditions of this Public License,
 90 |           the Licensor hereby grants You a worldwide, royalty-free,
 91 |           non-sublicensable, non-exclusive, irrevocable license to
 92 |           exercise the Licensed Rights in the Licensed Material to:
 93 | 
 94 |             a. reproduce and Share the Licensed Material, in whole or
 95 |                in part; and
 96 | 
 97 |             b. produce, reproduce, and Share Adapted Material.
 98 | 
 99 |        2. Exceptions and Limitations. For the avoidance of doubt, where
100 |           Exceptions and Limitations apply to Your use, this Public
101 |           License does not apply, and You do not need to comply with
102 |           its terms and conditions.
103 | 
104 |        3. Term. The term of this Public License is specified in Section
105 |           6(a).
106 | 
107 |        4. Media and formats; technical modifications allowed. The
108 |           Licensor authorizes You to exercise the Licensed Rights in
109 |           all media and formats whether now known or hereafter created,
110 |           and to make technical modifications necessary to do so. The
111 |           Licensor waives and/or agrees not to assert any right or
112 |           authority to forbid You from making technical modifications
113 |           necessary to exercise the Licensed Rights, including
114 |           technical modifications necessary to circumvent Effective
115 |           Technological Measures. For purposes of this Public License,
116 |           simply making modifications authorized by this Section 2(a)
117 |           (4) never produces Adapted Material.
118 | 
119 |        5. Downstream recipients.
120 | 
121 |             a. Offer from the Licensor -- Licensed Material. Every
122 |                recipient of the Licensed Material automatically
123 |                receives an offer from the Licensor to exercise the
124 |                Licensed Rights under the terms and conditions of this
125 |                Public License.
126 | 
127 |             b. No downstream restrictions. You may not offer or impose
128 |                any additional or different terms or conditions on, or
129 |                apply any Effective Technological Measures to, the
130 |                Licensed Material if doing so restricts exercise of the
131 |                Licensed Rights by any recipient of the Licensed
132 |                Material.
133 | 
134 |        6. No endorsement. Nothing in this Public License constitutes or
135 |           may be construed as permission to assert or imply that You
136 |           are, or that Your use of the Licensed Material is, connected
137 |           with, or sponsored, endorsed, or granted official status by,
138 |           the Licensor or others designated to receive attribution as
139 |           provided in Section 3(a)(1)(A)(i).
140 | 
141 |   b. Other rights.
142 | 
143 |        1. Moral rights, such as the right of integrity, are not
144 |           licensed under this Public License, nor are publicity,
145 |           privacy, and/or other similar personality rights; however, to
146 |           the extent possible, the Licensor waives and/or agrees not to
147 |           assert any such rights held by the Licensor to the limited
148 |           extent necessary to allow You to exercise the Licensed
149 |           Rights, but not otherwise.
150 | 
151 |        2. Patent and trademark rights are not licensed under this
152 |           Public License.
153 | 
154 |        3. To the extent possible, the Licensor waives any right to
155 |           collect royalties from You for the exercise of the Licensed
156 |           Rights, whether directly or through a collecting society
157 |           under any voluntary or waivable statutory or compulsory
158 |           licensing scheme. In all other cases the Licensor expressly
159 |           reserves any right to collect such royalties.
160 | 
161 | 
162 | Section 3 -- License Conditions.
163 | 
164 | Your exercise of the Licensed Rights is expressly made subject to the
165 | following conditions.
166 | 
167 |   a. Attribution.
168 | 
169 |        1. If You Share the Licensed Material (including in modified
170 |           form), You must:
171 | 
172 |             a. retain the following if it is supplied by the Licensor
173 |                with the Licensed Material:
174 | 
175 |                  i. identification of the creator(s) of the Licensed
176 |                     Material and any others designated to receive
177 |                     attribution, in any reasonable manner requested by
178 |                     the Licensor (including by pseudonym if
179 |                     designated);
180 | 
181 |                 ii. a copyright notice;
182 | 
183 |                iii. a notice that refers to this Public License;
184 | 
185 |                 iv. a notice that refers to the disclaimer of
186 |                     warranties;
187 | 
188 |                  v. a URI or hyperlink to the Licensed Material to the
189 |                     extent reasonably practicable;
190 | 
191 |             b. indicate if You modified the Licensed Material and
192 |                retain an indication of any previous modifications; and
193 | 
194 |             c. indicate the Licensed Material is licensed under this
195 |                Public License, and include the text of, or the URI or
196 |                hyperlink to, this Public License.
197 | 
198 |        2. You may satisfy the conditions in Section 3(a)(1) in any
199 |           reasonable manner based on the medium, means, and context in
200 |           which You Share the Licensed Material. For example, it may be
201 |           reasonable to satisfy the conditions by providing a URI or
202 |           hyperlink to a resource that includes the required
203 |           information.
204 | 
205 |        3. If requested by the Licensor, You must remove any of the
206 |           information required by Section 3(a)(1)(A) to the extent
207 |           reasonably practicable.
208 | 
209 |        4. If You Share Adapted Material You produce, the Adapter's
210 |           License You apply must not prevent recipients of the Adapted
211 |           Material from complying with this Public License.
212 | 
213 | 
214 | Section 4 -- Sui Generis Database Rights.
215 | 
216 | Where the Licensed Rights include Sui Generis Database Rights that
217 | apply to Your use of the Licensed Material:
218 | 
219 |   a. for the avoidance of doubt, Section 2(a)(1) grants You the right
220 |      to extract, reuse, reproduce, and Share all or a substantial
221 |      portion of the contents of the database;
222 | 
223 |   b. if You include all or a substantial portion of the database
224 |      contents in a database in which You have Sui Generis Database
225 |      Rights, then the database in which You have Sui Generis Database
226 |      Rights (but not its individual contents) is Adapted Material; and
227 | 
228 |   c. You must comply with the conditions in Section 3(a) if You Share
229 |      all or a substantial portion of the contents of the database.
230 | 
231 | For the avoidance of doubt, this Section 4 supplements and does not
232 | replace Your obligations under this Public License where the Licensed
233 | Rights include other Copyright and Similar Rights.
234 | 
235 | 
236 | Section 5 -- Disclaimer of Warranties and Limitation of Liability.
237 | 
238 |   a. UNLESS OTHERWISE SEPARATELY UNDERTAKEN BY THE LICENSOR, TO THE
239 |      EXTENT POSSIBLE, THE LICENSOR OFFERS THE LICENSED MATERIAL AS-IS
240 |      AND AS-AVAILABLE, AND MAKES NO REPRESENTATIONS OR WARRANTIES OF
241 |      ANY KIND CONCERNING THE LICENSED MATERIAL, WHETHER EXPRESS,
242 |      IMPLIED, STATUTORY, OR OTHER. THIS INCLUDES, WITHOUT LIMITATION,
243 |      WARRANTIES OF TITLE, MERCHANTABILITY, FITNESS FOR A PARTICULAR
244 |      PURPOSE, NON-INFRINGEMENT, ABSENCE OF LATENT OR OTHER DEFECTS,
245 |      ACCURACY, OR THE PRESENCE OR ABSENCE OF ERRORS, WHETHER OR NOT
246 |      KNOWN OR DISCOVERABLE. WHERE DISCLAIMERS OF WARRANTIES ARE NOT
247 |      ALLOWED IN FULL OR IN PART, THIS DISCLAIMER MAY NOT APPLY TO YOU.
248 | 
249 |   b. TO THE EXTENT POSSIBLE, IN NO EVENT WILL THE LICENSOR BE LIABLE
250 |      TO YOU ON ANY LEGAL THEORY (INCLUDING, WITHOUT LIMITATION,
251 |      NEGLIGENCE) OR OTHERWISE FOR ANY DIRECT, SPECIAL, INDIRECT,
252 |      INCIDENTAL, CONSEQUENTIAL, PUNITIVE, EXEMPLARY, OR OTHER LOSSES,
253 |      COSTS, EXPENSES, OR DAMAGES ARISING OUT OF THIS PUBLIC LICENSE OR
254 |      USE OF THE LICENSED MATERIAL, EVEN IF THE LICENSOR HAS BEEN
255 |      ADVISED OF THE POSSIBILITY OF SUCH LOSSES, COSTS, EXPENSES, OR
256 |      DAMAGES. WHERE A LIMITATION OF LIABILITY IS NOT ALLOWED IN FULL OR
257 |      IN PART, THIS LIMITATION MAY NOT APPLY TO YOU.
258 | 
259 |   c. The disclaimer of warranties and limitation of liability provided
260 |      above shall be interpreted in a manner that, to the extent
261 |      possible, most closely approximates an absolute disclaimer and
262 |      waiver of all liability.
263 | 
264 | 
265 | Section 6 -- Term and Termination.
266 | 
267 |   a. This Public License applies for the term of the Copyright and
268 |      Similar Rights licensed here. However, if You fail to comply with
269 |      this Public License, then Your rights under this Public License
270 |      terminate automatically.
271 | 
272 |   b. Where Your right to use the Licensed Material has terminated under
273 |      Section 6(a), it reinstates:
274 | 
275 |        1. automatically as of the date the violation is cured, provided
276 |           it is cured within 30 days of Your discovery of the
277 |           violation; or
278 | 
279 |        2. upon express reinstatement by the Licensor.
280 | 
281 |      For the avoidance of doubt, this Section 6(b) does not affect any
282 |      right the Licensor may have to seek remedies for Your violations
283 |      of this Public License.
284 | 
285 |   c. For the avoidance of doubt, the Licensor may also offer the
286 |      Licensed Material under separate terms or conditions or stop
287 |      distributing the Licensed Material at any time; however, doing so
288 |      will not terminate this Public License.
289 | 
290 |   d. Sections 1, 5, 6, 7, and 8 survive termination of this Public
291 |      License.
292 | 
293 | 
294 | Section 7 -- Other Terms and Conditions.
295 | 
296 |   a. The Licensor shall not be bound by any additional or different
297 |      terms or conditions communicated by You unless expressly agreed.
298 | 
299 |   b. Any arrangements, understandings, or agreements regarding the
300 |      Licensed Material not stated herein are separate from and
301 |      independent of the terms and conditions of this Public License.
302 | 
303 | 
304 | Section 8 -- Interpretation.
305 | 
306 |   a. For the avoidance of doubt, this Public License does not, and
307 |      shall not be interpreted to, reduce, limit, restrict, or impose
308 |      conditions on any use of the Licensed Material that could lawfully
309 |      be made without permission under this Public License.
310 | 
311 |   b. To the extent possible, if any provision of this Public License is
312 |      deemed unenforceable, it shall be automatically reformed to the
313 |      minimum extent necessary to make it enforceable. If the provision
314 |      cannot be reformed, it shall be severed from this Public License
315 |      without affecting the enforceability of the remaining terms and
316 |      conditions.
317 | 
318 |   c. No term or condition of this Public License will be waived and no
319 |      failure to comply consented to unless expressly agreed to by the
320 |      Licensor.
321 | 
322 |   d. Nothing in this Public License constitutes or may be interpreted
323 |      as a limitation upon, or waiver of, any privileges and immunities
324 |      that apply to the Licensor or You, including from the legal
325 |      processes of any jurisdiction or authority.
326 | 
327 | - - - -
328 | 
329 | BSD 3-Clause License
330 | 
331 | Redistribution and use in source and binary forms, with or without
332 | modification, are permitted provided that the following conditions are met:
333 | 
334 | 1. Redistributions of source code must retain the above copyright notice, this
335 |    list of conditions and the following disclaimer.
336 | 
337 | 2. Redistributions in binary form must reproduce the above copyright notice,
338 |    this list of conditions and the following disclaimer in the documentation
339 |    and/or other materials provided with the distribution.
340 | 
341 | 3. Neither the name of the copyright holder nor the names of its
342 |    contributors may be used to endorse or promote products derived from
343 |    this software without specific prior written permission.
344 | 
345 | THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
346 | AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
347 | IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
348 | DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
349 | FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
350 | DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
351 | SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
352 | CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
353 | OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
354 | OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
355 | 
356 | - - - -
357 | 


--------------------------------------------------------------------------------
/review-drafts/2018-07.bs:
--------------------------------------------------------------------------------
   1 | <pre class='metadata'>
   2 | Group: WHATWG
   3 | Date: 2018-07-23
   4 | H1: Infra
   5 | Shortname: infra
   6 | Text Macro: TWITTER infrastandard
   7 | Abstract: The Infra Standard aims to define the fundamental concepts upon which standards are built.
   8 | Translation: ja https://triple-underscore.github.io/infra-ja.html
   9 | </pre>
  10 | 
  11 | <pre class="anchors">
  12 | urlPrefix: https://tc39.github.io/ecma262/; spec: ECMA-262;
  13 |     type: dfn
  14 |         text: %JSONParse%; url: sec-json.parse
  15 |         text: List; url: sec-list-and-record-specification-type
  16 |         text: The String Type; url: sec-ecmascript-language-types-string-type
  17 |     type: abstract-op; text: Call; url: sec-call
  18 | </pre>
  19 | 
  20 | 
  21 | <h2 id=goals class=no-num>Goals</h2>
  22 | 
  23 | <ul>
  24 |  <li><p>Deduplicate boilerplate in standards.
  25 | 
  26 |  <li><p>Align standards on conventions, terminology, and data structures.
  27 | 
  28 |  <li><p>Be a place for concepts used by multiple standards without a good home.
  29 | 
  30 |  <li><p>Help write clear and readable algorithmic prose by clarifying otherwise ambiguous concepts.
  31 | </ul>
  32 | 
  33 | <p>Suggestions for more goals welcome.</p>
  34 | 
  35 | 
  36 | <h2 id=usage>Usage</h2>
  37 | 
  38 | <p>To make use of the Infra Standard in a document titled <var>X</var>, use
  39 | <samp><var>X</var> depends on the Infra Standard</samp>. Additionally, cross-referencing terminology
  40 | is encouraged to avoid ambiguity.
  41 | 
  42 | <p>Specification authors are also encouraged to add their specification to the
  43 | <a href=https://github.com/whatwg/infra/wiki/Dependent-specs>list of dependent specifications</a> in
  44 | order to help the editors ensure that any future breaking changes to the Infra Standard are
  45 | correctly reflected by any such dependencies.
  46 | 
  47 | 
  48 | <h2 id=conventions>Conventions</h2>
  49 | 
  50 | <h3 id=conformance>Conformance</h3>
  51 | 
  52 | <p>All assertions, diagrams, examples, and notes are non-normative, as are all sections explicitly
  53 | marked non-normative. Everything else is normative.
  54 | 
  55 | <p>The keywords "MUST", "MUST NOT", "REQUIRED", "SHALL", "SHALL NOT", "SHOULD", "SHOULD NOT",
  56 | "RECOMMENDED", "NOT RECOMMENDED", "MAY", and "OPTIONAL" are to be interpreted as described in
  57 | RFC 2119. [[!RFC2119]]
  58 | 
  59 | <p>These keywords have equivalent meaning when written in lowercase and cannot appear in
  60 | non-normative content.
  61 | 
  62 | <p class=note>This is a <a>willful violation</a> of RFC 8174, motivated by legibility and a desire
  63 | to preserve long-standing practice in many non-IETF-published pre-RFC 8174 documents. [[RFC8174]]
  64 | 
  65 | <p>All of the above is applicable to both this standard and any document that uses this standard.
  66 | Documents using this standard are encouraged to limit themselves to "must", "must not", "should",
  67 | and "may", and to use these in their lowercase form as that is generally considered to be more
  68 | readable.
  69 | 
  70 | <p>For non-normative content "strongly encouraged", "strongly discouraged", "encouraged",
  71 | "discouraged", "can", "cannot", "could", "could not", "might", and "might not" can be used instead.
  72 | 
  73 | 
  74 | <h3 id=other-specs>Compliance with other specifications</h3>
  75 | 
  76 | <p>In general, specifications interact with and rely on a wide variety of other specifications. In
  77 | certain circumstances, unfortunately, conflicting needs require a specification to violate the
  78 | requirements of other specifications. When this occurs, a document using the Infra Standard should
  79 | denote such transgressions as a <dfn export>willful violation</dfn>, and note the reason for that
  80 | violation.
  81 | 
  82 | <p class=example id=example-willful-violation>The previous section, [[#conformance]], documents a
  83 | <a>willful violation</a> of RFC 8174 committed by the Infra Standard.
  84 | 
  85 | 
  86 | <h3 id=terminology>Terminology</h3>
  87 | 
  88 | <p>The word "or", in cases where both inclusive "or" and exclusive "or" are possible (e.g., "if
  89 | either width or height is zero"), means an inclusive "or" (implying "or both"), unless it is called
  90 | out as being exclusive (with "but not both").
  91 | 
  92 | 
  93 | <h2 id=algorithms>Algorithms</h2>
  94 | 
  95 | <p>Algorithms, and requirements phrased in the imperative as part of algorithms (such as "strip any
  96 | leading spaces" or "return false") are to be interpreted with the meaning of the keyword (e.g.,
  97 | "must") used in introducing the algorithm or step. If no such keyword is used, must is implied.
  98 | 
  99 | <div class=example id=example-algorithms>
 100 |  <p>For example, were the spec to say:</p>
 101 | 
 102 |  <blockquote>
 103 |   <p class=allow-2119>To eat an orange, the user must:
 104 | 
 105 |   <ol class=brief>
 106 |    <li>Peel the orange.
 107 |    <li>Separate each slice of the orange.
 108 |    <li>Eat the orange slices.
 109 |   </ol>
 110 |  </blockquote>
 111 | 
 112 |  <p>it would be equivalent to the following:</p>
 113 | 
 114 |  <blockquote>
 115 |   <p>To eat an orange:
 116 | 
 117 |   <ol class=brief>
 118 |    <li class=allow-2119>The user must peel the orange.
 119 |    <li class=allow-2119>The user must separate each slice of the orange.
 120 |    <li class=allow-2119>The user must eat the orange slices.
 121 |   </ol>
 122 |  </blockquote>
 123 | 
 124 |  <p class=allow-2119>Here the key word is "must".</p>
 125 | 
 126 |  <p class=allow-2119>Modifying the above example, if the algorithm was introduced only with "To eat
 127 |  an orange:", it would still have the same meaning, as "must" is implied.
 128 | </div>
 129 | 
 130 | <p>Conformance requirements phrased as algorithms or specific steps may be implemented in any
 131 | manner, so long as the end result is equivalent. (In particular, the algorithms are intended to be
 132 | easy to follow, and not intended to be performant.)
 133 | 
 134 | <p class=note>Performance is tricky to get correct as it is influenced by user perception, computer
 135 | architectures, and different types of input that can change over time in how common they are. For
 136 | instance, a JavaScript engine likely has many different code paths for what is standardized as a
 137 | single algorithm, in order to optimize for speed or memory consumption. Standardizing all those code
 138 | paths would be an insurmountable task and not productive as they would not stand the test of time
 139 | as well as the single algorithm would. Therefore performance is best left as a field to compete
 140 | over.
 141 | 
 142 | 
 143 | <h3 id=variables>Variables</h3>
 144 | 
 145 | <p>A variable is declared with "let" and changed with "set".
 146 | 
 147 | <p class=example id=example-variable>Let |list| be a new <a>list</a>.</p>
 148 | 
 149 | <div class=example id=example-variable-null>
 150 |  <ol>
 151 |   <li><p>Let |value| be null.
 152 | 
 153 |   <li><p>If |input| is a <a>string</a>, then set |value| to |input|.
 154 | 
 155 |   <li><p>Otherwise, set |value| to |input|, <a>UTF-8 decoded</a>.
 156 | 
 157 |   <li><p><a>Assert</a>: |value| is a <a>string</a>.
 158 |  </ol>
 159 | </div>
 160 | 
 161 | <p class=example id=example-variable-ternary>Let <var ignore>activationTarget</var> be
 162 | <var ignore>target</var>, if <var ignore>isActivationEvent</var> is true and
 163 | <var ignore>target</var> has activation behavior, and null otherwise.
 164 | 
 165 | <p>Variables must not be used before they are declared. Variables are
 166 | <a href=https://en.wikipedia.org/wiki/Scope_(computer_science)#Block_scope>block scoped</a>.
 167 | Variables must not be declared more than once per algorithm.
 168 | 
 169 | 
 170 | <h3 id=algorithm-control-flow>Control flow</h3>
 171 | 
 172 | <p>The control flow of algorithms is such that a requirement to "return" or "throw" terminates the
 173 | algorithm the statement was in. "Return" will hand the given value, if any, to its caller. "Throw"
 174 | will make the caller automatically rethrow the given value, if any, and thereby terminate the
 175 | caller's algorithm. Using prose the caller has the ability to "catch" the exception and perform
 176 | another action.
 177 | 
 178 | 
 179 | <h3 id=algorithm-conditional-abort>Conditional abort</h3>
 180 | 
 181 | <p>Sometimes it is useful to stop performing a series of steps once a condition becomes true.
 182 | 
 183 | <p>To do this, state that a given series of steps will <dfn export>abort when</dfn> a specific
 184 | <var>condition</var> is reached. This indicates that the specified steps must be evaluated, not
 185 | as-written, but by additionally inserting a step before each of them that evaluates
 186 | <var>condition</var>, and if <var>condition</var> evaluates to true, skips the remaining steps.
 187 | 
 188 | <p>In such algorithms, the subsequent step can be annotated to run <dfn export>if aborted</dfn>, in
 189 | which case it must run if any of the preceding steps were skipped due to the <var>condition</var>
 190 | of the preceding <a>abort when</a> step evaluating to true.
 191 | 
 192 | <div class=example id=example-conditional-abort>
 193 |  <p>The following algorithm
 194 | 
 195 |  <ol>
 196 |   <li><p>Let |result| be an empty <a>list</a>.
 197 | 
 198 |   <li>
 199 |    <p>Run these steps, but <a>abort when</a> the user clicks the "Cancel" button:
 200 | 
 201 |    <ol>
 202 |     <li><p>Compute the first million digits of <var>π</var>, and <a for=list>append</a> the result
 203 |     to |result|.
 204 | 
 205 |     <li><p>Compute the first million digits of |e|, and <a for=list>append</a> the result to
 206 |     |result|.
 207 | 
 208 |     <li><p>Compute the first million digits of <var>φ</var>, and <a for=list>append</a> the result
 209 |     to |result|.
 210 |    </ol>
 211 |   </li>
 212 | 
 213 |   <li><p><a>If aborted</a>, <a for=list>append</a> "<code>Didn't finish!</code>" to |result|.
 214 |  </ol>
 215 | 
 216 |  <p>is equivalent to the more verbose formulation</p>
 217 | 
 218 |  <ol>
 219 |   <li><p>Let |result| be an empty <a>list</a>.
 220 | 
 221 |   <li>
 222 |    <p>If the user has not clicked the "Cancel" button, then:
 223 | 
 224 |    <ol>
 225 |     <li><p>Compute the first million digits of <var>π</var>, and <a for=list>append</a> the result
 226 |     to |result|.
 227 | 
 228 |     <li>
 229 |      <p>If the user has not clicked the "Cancel" button, then:
 230 | 
 231 |      <ol>
 232 |       <li><p>Compute the first million digits of |e|, and <a for=list>append</a> the result to
 233 |       |result|.
 234 | 
 235 |       <li><p>If the user has not clicked the "Cancel" button, then compute the first million digits
 236 |       of <var>φ</var>, and <a for=list>append</a> the result to |result|.
 237 |      </ol>
 238 |    </ol>
 239 | 
 240 |   <li><p>If the user clicked the "Cancel" button, then <a for=list>append</a>
 241 |   "<code>Didn't finish!</code>" to |result|.
 242 |  </ol>
 243 | </div>
 244 | 
 245 | <p class=note>Whenever this construct is used, implementations are allowed to evaluate
 246 | <var>condition</var> during the specified steps rather than before and after each step, as long as
 247 | the end result is indistinguishable. For instance, as long as |result| in the above example is not
 248 | mutated during a compute operation, the user agent could stop the computation.
 249 | 
 250 | 
 251 | <h3 id=algorithm-iteration>Iteration</h3>
 252 | 
 253 | <p>There's a variety of ways to repeat a set of steps until a condition is reached.
 254 | 
 255 | <p class=note>The Infra Standard is not (yet) exhaustive on this; please file an issue if you need
 256 | something.
 257 | 
 258 | <dl>
 259 |  <dt>For each
 260 |  <dd><p>As defined <a for=list lt="for each">for lists</a> (and derivatives) and
 261 |  <a for=map lt="for each">maps</a>.
 262 | 
 263 |  <dt><dfn export for=iteration lt=while>While</dfn>
 264 |  <dd>
 265 |   <p>An instruction to repeat a set of steps as long as a condition is met.
 266 | 
 267 |   <div class=example id=example-while>
 268 |    <p>While |condition| is "<code>met</code>":
 269 | 
 270 |    <ol>
 271 |     <li><p>&hellip;
 272 |    </ol>
 273 |   </div>
 274 | </dl>
 275 | 
 276 | <p>An iteration's flow can be controlled via requirements to
 277 | <dfn export for=iteration>continue</dfn> or <dfn export for=iteration>break</dfn>.
 278 | <a for=iteration>Continue</a> will skip over any remaining steps in an iteration, proceeding to the
 279 | next item. If no further items remain, the iteration will stop. <a for=iteration>Break</a> will skip
 280 | over any remaining steps in an iteration, and skip over any remaining items as well, stopping the
 281 | iteration.
 282 | 
 283 | <div class=example id=example-break-continue>
 284 |  <p>Let |example| be the <a>list</a> « 1, 2, 3, 4 ». The following prose would perform |operation|
 285 |  upon 1, then 2, then 3, then 4:
 286 | 
 287 |  <ol>
 288 |   <li>
 289 |    <p><a for=list>For each</a> |item| of |example|:
 290 |    <ol>
 291 |     <li>Perform |operation| on |item|.
 292 |    </ol>
 293 |   </li>
 294 |  </ol>
 295 | 
 296 |  <p>The following prose would perform |operation| upon 1, then 2, then 4. 3 would be skipped.
 297 | 
 298 |  <ol>
 299 |   <li>
 300 |    <p><a for=list>For each</a> |item| of |example|:
 301 |    <ol>
 302 |     <li>If |item| is 3, then <a for=iteration>continue</a>.
 303 |     <li>Perform |operation| on |item|.
 304 |    </ol>
 305 |   </li>
 306 |  </ol>
 307 | 
 308 |  <p>The following prose would perform |operation| upon 1, then 2. 3 and 4 would be skipped.
 309 | 
 310 |  <ol>
 311 |   <li>
 312 |    <p><a for=list>For each</a> |item| of |example|:
 313 |    <ol>
 314 |     <li>If |item| is 3, then <a for=iteration>break</a>.
 315 |     <li>Perform |operation| on |item|.
 316 |    </ol>
 317 |   </li>
 318 |  </ol>
 319 | </div>
 320 | 
 321 | 
 322 | <h3 id=assertions>Assertions</h3>
 323 | 
 324 | <p>To improve readability, it can sometimes help to add assertions to algorithms, stating
 325 | invariants. To do this, write "<dfn export>Assert</dfn>:", followed by a statement that must be
 326 | true. If the statement ends up being false that indicates an issue with the document using the Infra
 327 | Standard that should be reported and addressed.
 328 | 
 329 | <p class=note>Since the statement can only ever be true, it has no implications for implementations.
 330 | 
 331 | <div class=example id=example-assert>
 332 |  <ol>
 333 |   <li><p>Let |x| be "<code>Aperture Science</code>".
 334 |   <li><p><a>Assert</a>: |x| is "<code>Aperture Science</code>".
 335 |  </ol>
 336 | </div>
 337 | 
 338 | <h2 id=primitive-data-types>Primitive data types</h2>
 339 | 
 340 | <h3 id=nulls>Nulls</h3>
 341 | 
 342 | <p>The value null is used to indicate the lack of a value. It can be used interchangeably with the
 343 | JavaScript <b>null</b> value. [[!ECMA-262]]
 344 | 
 345 | <p class=example id=example-null>Let <var ignore>element</var> be null.
 346 | 
 347 | <p class=example id=example-null-return>If <var>input</var> is the empty string, then return null.
 348 | 
 349 | 
 350 | <h3 id=booleans>Booleans</h3>
 351 | 
 352 | <p>A <dfn export>boolean</dfn> is either true or false.
 353 | 
 354 | <p class=example id=example-boolean>Let <var ignore>elementSeen</var> be false.
 355 | 
 356 | 
 357 | <h3 id=bytes>Bytes</h3>
 358 | 
 359 | <p>A <dfn export>byte</dfn> is a sequence of eight bits, represented as a double-digit hexadecimal
 360 | number in the range 0x00 to 0xFF, inclusive.
 361 | 
 362 | <p>An <dfn export>ASCII byte</dfn> is a <a>byte</a> in the range 0x00 (NUL) to 0x7F (DEL),
 363 | inclusive. As illustrated, an <a>ASCII byte</a>, excluding 0x28 and 0x29, may be followed by the
 364 | representation outlined in the <a href=https://tools.ietf.org/html/rfc20#section-2>Standard Code</a>
 365 | section of <cite>ASCII format for Network Interchange</cite>, between parentheses. [[!RFC20]]
 366 | 
 367 | <p>0x28 may be followed by "(left parenthesis)" and 0x29 by "(right parenthesis)".
 368 | 
 369 | <p class=example id=example-byte-notation>0x49 (I) when <a>UTF-8 decoded</a> becomes the
 370 | <a>code point</a> U+0049 (I).
 371 | 
 372 | 
 373 | <h3 id=byte-sequences>Byte sequences</h3>
 374 | 
 375 | <p>A <dfn export>byte sequence</dfn> is a sequence of <a>bytes</a>, represented as a space-separated
 376 | sequence of bytes. Byte sequences with bytes in the range 0x20 (SP) to 0x7E (~), inclusive, can
 377 | alternately be written as a string, but using backticks instead of quotation marks, to avoid
 378 | confusion with an actual <a>string</a>.
 379 | 
 380 | <div class=example id=example-byte-sequence-notation>
 381 |  <p>0x48 0x49 can also be represented as `<code>HI</code>`.
 382 | 
 383 |  <p>Headers, such as `<code>Content-Type</code>`, are <a>byte sequences</a>.
 384 | </div>
 385 | 
 386 | <p class=note>To get a <a>byte sequence</a> out of a <a>string</a>, using <a>UTF-8 encode</a> from
 387 | the Encoding Standard is encouraged. In rare circumstances <a>isomorphic encode</a> might be needed.
 388 | [[ENCODING]]
 389 | 
 390 | <p>A <a>byte sequence</a>'s <dfn export for="byte sequence">length</dfn> is the number of
 391 | <a>bytes</a> it contains.
 392 | 
 393 | <p>To <dfn export>byte-lowercase</dfn> a <a>byte sequence</a>, increase each <a>byte</a> it
 394 | contains, in the range 0x41 (A) to 0x5A (Z), inclusive, by 0x20.
 395 | 
 396 | <p>To <dfn export>byte-uppercase</dfn> a <a>byte sequence</a>, decrease each <a>byte</a> it
 397 | contains, in the range 0x61 (a) to 0x7A (z), inclusive, by 0x20.
 398 | 
 399 | <p>A <a>byte sequence</a> <var>A</var> is a <dfn export>byte-case-insensitive</dfn> match for a
 400 | <a>byte sequence</a> <var>B</var>, if the <a>byte-lowercase</a> of <var>A</var> is the
 401 | <a>byte-lowercase</a> of <var>B</var>.
 402 | 
 403 | <p>To <dfn export>isomorphic decode</dfn> a <a>byte sequence</a> <var>input</var>, return a
 404 | <a>string</a> whose <a for=string>length</a> is equal to <var>input</var>'s
 405 | <a for="byte sequence">length</a> and whose <a>code points</a> have the same values as
 406 | <var>input</var>'s <a>bytes</a>, in the same order.
 407 | 
 408 | 
 409 | <h3 id=code-points>Code points</h3>
 410 | 
 411 | <p>A <dfn export lt="code point|character">code point</dfn> is a Unicode code point and is
 412 | represented as a four-to-six digit hexadecimal number, typically prefixed with "U+".
 413 | 
 414 | <p>A <a>code point</a> may be followed by its name, by its rendered form between parentheses when it
 415 | is not U+0028 or U+0029, or by both. Documents using the Infra Standard are encouraged to follow
 416 | <a>code points</a> by their name when they cannot be rendered or are U+0028 or U+0029, and their
 417 | rendered form between parentheses otherwise, for legibility.
 418 | 
 419 | <p>A <a>code point</a>'s name is defined in the Unicode Standard and represented in
 420 | <a>ASCII uppercase</a>. [[!UNICODE]]
 421 | 
 422 | <div class=example id=example-code-point-notation>
 423 |  <p>The <a>code point</a> rendered as 🤔 is represented as U+1F914.
 424 | 
 425 |  <p>When referring to that <a>code point</a>, we might say "U+1F914 (🤔)", to provide extra context.
 426 |  Documents are allowed to use "U+1F914 THINKING FACE (🤔)" as well, though this is somewhat verbose.
 427 | </div>
 428 | 
 429 | <p class=example id=example-code-point-notation-hard-to-render><a>Code points</a> that are difficult
 430 | to render unambiguously, such as U+000A, can be referred to as "U+000A LF". U+0029 can be referred
 431 | to as "U+0029 RIGHT PARENTHESIS", because even though it renders, this avoids unmatched parentheses.
 432 | 
 433 | <p><a>Code points</a> are sometimes referred to as <a>characters</a> and in certain contexts are
 434 | prefixed with "0x" rather than "U+".
 435 | 
 436 | <p>A <dfn export>surrogate</dfn> is a <a>code point</a> that is in the range U+D800 to U+DFFF,
 437 | inclusive.
 438 | 
 439 | <p>A <dfn export>scalar value</dfn> is a <a>code point</a> that is not a <a>surrogate</a>.
 440 | 
 441 | <p>A <dfn export>noncharacter</dfn> is a <a>code point</a> that is in the range U+FDD0 to U+FDEF,
 442 | inclusive, or U+FFFE, U+FFFF, U+1FFFE, U+1FFFF, U+2FFFE, U+2FFFF, U+3FFFE, U+3FFFF, U+4FFFE,
 443 | U+4FFFF, U+5FFFE, U+5FFFF, U+6FFFE, U+6FFFF, U+7FFFE, U+7FFFF, U+8FFFE, U+8FFFF, U+9FFFE, U+9FFFF,
 444 | U+AFFFE, U+AFFFF, U+BFFFE, U+BFFFF, U+CFFFE, U+CFFFF, U+DFFFE, U+DFFFF, U+EFFFE, U+EFFFF, U+FFFFE,
 445 | U+FFFFF, U+10FFFE, or U+10FFFF.
 446 | 
 447 | <p>An <dfn export>ASCII code point</dfn> is a <a>code point</a> in the range U+0000 NULL to
 448 | U+007F DELETE, inclusive.
 449 | 
 450 | <p>An <dfn export lt="ASCII tab or newline|ASCII tabs or newlines">ASCII tab or newline</dfn> is
 451 | U+0009 TAB, U+000A LF, or U+000D CR.
 452 | 
 453 | <p><dfn export>ASCII whitespace</dfn> is U+0009 TAB, U+000A LF, U+000C FF, U+000D CR, or U+0020
 454 | SPACE.
 455 | 
 456 | <p class=note>"Whitespace" is a mass noun.
 457 | 
 458 | <p>A <dfn export>C0 control</dfn> is a <a>code point</a> in the range U+0000 NULL to
 459 | U+001F INFORMATION SEPARATOR ONE, inclusive.
 460 | 
 461 | <p>A <dfn export lt="C0 control or space|C0 controls or spaces">C0 control or space</dfn> is a
 462 | <a>C0 control</a> or U+0020 SPACE.
 463 | 
 464 | <p>A <dfn export>control</dfn> is a <a>C0 control</a> or a <a>code point</a> in the range
 465 | U+007F DELETE to U+009F APPLICATION PROGRAM COMMAND, inclusive.
 466 | 
 467 | <p>An <dfn export>ASCII digit</dfn> is a <a>code point</a> in the range U+0030 (0) to U+0039 (9),
 468 | inclusive.
 469 | 
 470 | <p>An <dfn export>ASCII upper hex digit</dfn> is an <a>ASCII digit</a> or a <a>code point</a> in the
 471 | range U+0041 (A) to U+0046 (F), inclusive.
 472 | 
 473 | <p>An <dfn export>ASCII lower hex digit</dfn> is an <a>ASCII digit</a> or a <a>code point</a> in the
 474 | range U+0061 (a) to U+0066 (f), inclusive.
 475 | 
 476 | <p>An <dfn export>ASCII hex digit</dfn> is an <a>ASCII upper hex digit</a> or
 477 | <a>ASCII lower hex digit</a>.
 478 | 
 479 | <p>An <dfn export>ASCII upper alpha</dfn> is a <a>code point</a> in the range U+0041 (A) to
 480 | U+005A (Z), inclusive.
 481 | 
 482 | <p>An <dfn export>ASCII lower alpha</dfn> is a <a>code point</a> in the range U+0061 (a) to
 483 | U+007A (z), inclusive.
 484 | 
 485 | <p>An <dfn export>ASCII alpha</dfn> is an <a>ASCII upper alpha</a> or <a>ASCII lower alpha</a>.
 486 | 
 487 | <p>An <dfn export>ASCII alphanumeric</dfn> is an <a>ASCII digit</a> or <a>ASCII alpha</a>.
 488 | 
 489 | 
 490 | <h3 id=strings>Strings</h3>
 491 | 
 492 | <p>A <dfn export>JavaScript string</dfn> is a sequence of unsigned 16-bit integers, also known as
 493 | <dfn export lt="code unit">code units</dfn>.
 494 | 
 495 | <p class=note>This is different from how the Unicode Standard defines "code unit". In particular it
 496 | refers exclusively to how the Unicode Standard defines it for Unicode 16-bit strings. [[UNICODE]]
 497 | 
 498 | <p>A <a>JavaScript string</a>'s <dfn export for="JavaScript string">length</dfn> is the number of
 499 | <a>code units</a> it contains.
 500 | 
 501 | <p>A <a>JavaScript string</a> can also be interpreted as containing <a>code points</a>, per the
 502 | conversion defined in <a>The String Type</a> section of the JavaScript specification. [[!ECMA-262]]
 503 | 
 504 | <p class=note>This conversion process converts surrogate pairs into their corresponding
 505 | <a>scalar value</a> and maps isolated surrogates to their corresponding <a>code point</a>, leaving
 506 | them effectively as-is.
 507 | 
 508 | <p class=example id=example-javascript-string-in-code-points>A <a>JavaScript string</a> consisting
 509 | of the <a>code units</a> 0xD83D, 0xDCA9, and 0xD800, when interpreted as containing
 510 | <a>code points</a>, would consist of the <a>code points</a> U+1F4A9 and U+D800.
 511 | 
 512 | <p>A <dfn export>scalar value string</dfn> is a sequence of <a>scalar values</a>.
 513 | 
 514 | <p class=note>A <a>scalar value string</a> is useful for any kind of I/O or other kind of operation
 515 | where <a>UTF-8 encode</a> comes into play.
 516 | <!-- It's also useful if you can imagine the subsystem to be implemented in Rust -->
 517 | 
 518 | <p><dfn export lt=string>String</dfn> can be used to refer to either a <a>JavaScript string</a> or
 519 | <a>scalar value string</a>, when it is clear from the context which is meant or when the distinction
 520 | is immaterial. <a>Strings</a> are denoted by double quotes and monospace font.
 521 | 
 522 | <p class=example id=example-string-notation>"<code>Hello, world!</code>" is a string.
 523 | 
 524 | <p>A <a>string</a>'s <dfn export for=string>length</dfn> is the number of <a>code points</a> it
 525 | contains.
 526 | 
 527 | <p>To <dfn export for="JavaScript string">convert</dfn> a <a>JavaScript string</a> into a
 528 | <a>scalar value string</a>, replace any <a>surrogates</a> with U+FFFD.
 529 | <!-- Obviates need for https://heycam.github.io/webidl/#dfn-obtain-unicode -->
 530 | 
 531 | <p class=note>The replaced surrogates are always isolated surrogates, since the process of
 532 | interpreting the JavaScript string as containing <a>code points</a> will have converted surrogate
 533 | pairs into <a>scalar values</a>.
 534 | 
 535 | <p>A <a>scalar value string</a> can always be used as a <a>JavaScript string</a> implicitly since
 536 | it is a subset. The reverse is only possible if the <a>JavaScript string</a> is known to not contain
 537 | <a>surrogates</a>; otherwise a <a for="JavaScript string" lt=convert>conversion</a> must be
 538 | performed.
 539 | 
 540 | <p class=note>An implementation likely has to perform explicit conversion, depending on how it
 541 | actually ends up representing <a lt="JavaScript string">JavaScript</a> and
 542 | <a>scalar value strings</a>. It is even fairly typical for implementations to have multiple
 543 | implementations of just <a>JavaScript strings</a> for performance and memory reasons.
 544 | 
 545 | <hr>
 546 | 
 547 | <p>To <dfn export>isomorphic encode</dfn> a <a>string</a> <var>input</var>, run these steps:</p>
 548 | 
 549 | <ol>
 550 |  <li><p><a>Assert</a>: <var>input</var> contains no <a>code points</a> greater than U+00FF.
 551 | 
 552 |  <li><p>Return a <a>byte sequence</a> whose <a for="byte sequence">length</a> is equal to
 553 |  <var>input</var>'s <a for=string>length</a> and whose <a>bytes</a> have the same values as
 554 |  <var>input</var>'s <a>code points</a>, in the same order.
 555 | </ol>
 556 | 
 557 | <hr>
 558 | 
 559 | <p>An <dfn export>ASCII string</dfn> is a <a>string</a> whose <a>code points</a> are all
 560 | <a>ASCII code points</a>.
 561 | 
 562 | <p>To <dfn export>ASCII lowercase</dfn> a <a>string</a>, replace all <a>ASCII upper alphas</a> in
 563 | the <a>string</a> with their corresponding <a>code point</a> in <a>ASCII lower alpha</a>.
 564 | 
 565 | <p>To <dfn export>ASCII uppercase</dfn> a <a>string</a>, replace all <a>ASCII lower alphas</a> in
 566 | the <a>string</a> with their corresponding <a>code point</a> in <a>ASCII upper alpha</a>.
 567 | 
 568 | <p>A <a>string</a> <var>A</var> is an <dfn export>ASCII case-insensitive</dfn> match for a
 569 | <a>string</a> <var>B</var>, if the <a>ASCII lowercase</a> of <var>A</var> is the
 570 | <a>ASCII lowercase</a> of <var>B</var>.
 571 | <!-- TODO: define string equals? -->
 572 | 
 573 | <hr>
 574 | 
 575 | <p>To <dfn export>strip newlines</dfn> from a <a>string</a>, remove any U+000A LF and U+000D CR
 576 | <a>code points</a> from the <a>string</a>.
 577 | 
 578 | <p>To <dfn export>strip leading and trailing ASCII whitespace</dfn> from a <a>string</a>, remove all
 579 | <a>ASCII whitespace</a> that is at the start or the end of the <a>string</a>.
 580 | 
 581 | <p>To <dfn export>strip and collapse ASCII whitespace</dfn> in a <a>string</a>, replace any sequence
 582 | of one or more consecutive <a>code points</a> that are <a>ASCII whitespace</a> in the <a>string</a>
 583 | with a single U+0020 SPACE <a>code point</a>, and then remove any leading and trailing
 584 | <a>ASCII whitespace</a> from that string.
 585 | 
 586 | <hr>
 587 | 
 588 | <p>To <dfn export lt="collect a sequence of code points|collecting a sequence of code
 589 | points">collect a sequence of <a>code points</a></dfn> meeting a condition <var>condition</var> from
 590 | a <a>string</a> <var>input</var>, given a <dfn export for="string">position variable</dfn>
 591 | <var>position</var> tracking the position of the calling algorithm within <var>input</var>:</p>
 592 | 
 593 | <ol>
 594 |  <li><p>Let <var>result</var> be the empty <a>string</a>.
 595 | 
 596 |  <li>
 597 |   <p>While <var>position</var> doesn't point past the end of <var>input</var> and the
 598 |   <a>code point</a> at <var>position</var> within <var>input</var> meets the condition
 599 |   <var>condition</var>:
 600 | 
 601 |   <ol>
 602 |    <li><p>Append that <a>code point</a> to the end of <var>result</var>.
 603 | 
 604 |    <li><p>Advance <var>position</var> by 1.
 605 |   </ol>
 606 |  </li>
 607 | 
 608 |  <li><p>Return <var>result</var>.
 609 | </ol>
 610 | 
 611 | <p class=note>In addition to returning the collected <a>code points</a>, this algorithm updates the
 612 | <a>position variable</a> in the calling algorithm.
 613 | 
 614 | <p>To <dfn export>skip ASCII whitespace</dfn> within a <a>string</a> <var>input</var> given a
 615 | <a>position variable</a> <var>position</var>, <a>collect a sequence of code points</a> that are
 616 | <a>ASCII whitespace</a> from <var>input</var> given <var>position</var>. The collected
 617 | <a>code points</a> are not used, but <var>position</var> is still updated.
 618 | 
 619 | <hr>
 620 | 
 621 | <p>To <dfn export lt="strictly split|strictly split a string">strictly split a <a>string</a></dfn>
 622 | <var>input</var> on a particular delimiter <a>code point</a> <var>delimiter</var>:</p>
 623 | 
 624 | <ol>
 625 |  <li><p>Let <var>position</var> be a <a>position variable</a> for <var>input</var>, initially
 626 |  pointing at the start of <var>input</var>.
 627 | 
 628 |  <li><p>Let <var>tokens</var> be a <a>list</a> of <a>strings</a>, initially empty.
 629 | 
 630 |  <li><p>Let <var>token</var> be the result of <a>collecting a sequence of code points</a> that are
 631 |  not equal to <var>delimiter</var> from <var>input</var>, given <var>position</var>.
 632 | 
 633 |  <li><p><a for="list">Append</a> <var>token</var> to <var>tokens</var>.
 634 | 
 635 |  <li>
 636 |   <p>While <var>position</var> is not past the end of <var>input</var>:
 637 | 
 638 |   <ol>
 639 |    <li><p>Advance <var>position</var> to the next <a>code point</a> in <var>input</var>. (This
 640 |    skips past the delimiter.)
 641 | 
 642 |    <li><p>Let <var>token</var> be the result of <a>collecting a sequence of code points</a> that are
 643 |    not equal to <var>delimiter</var> from <var>input</var>, given <var>position</var>.
 644 | 
 645 |    <li><p><a for="list">Append</a> <var>token</var> to <var>tokens</var>.
 646 |   </ol>
 647 |  </li>
 648 | 
 649 |  <li><p>Return <var>tokens</var>.
 650 | </ol>
 651 | 
 652 | <p class=note>This algorithm is a "strict" split, as opposed to the commonly-used variants
 653 | <a lt="split on ASCII whitespace">for ASCII whitespace</a> and
 654 | <a lt="split on commas">for commas</a> below, which are both more lenient in various ways involving
 655 | interspersed <a>ASCII whitespace</a>.
 656 | 
 657 | <p>To <dfn export lt="split on ASCII whitespace|split a string on ASCII whitespace">split a
 658 | <a>string</a> <var>input</var> on ASCII whitespace</dfn>:
 659 | 
 660 | <ol>
 661 |  <li><p>Let <var>position</var> be a <a>position variable</a> for <var>input</var>, initially
 662 |  pointing at the start of <var>input</var>.
 663 | 
 664 |  <li><p>Let <var>tokens</var> be a <a>list</a> of <a>strings</a>, initially empty.
 665 | 
 666 |  <li><p><a>Skip ASCII whitespace</a> within <var>input</var> given <var>position</var>.
 667 | 
 668 |  <li>
 669 |   <p>While <var>position</var> is not past the end of <var>input</var>:
 670 | 
 671 |   <ol>
 672 |    <li><p>Let <var>token</var> be the result of <a>collecting a sequence of code points</a> that are
 673 |    not <a>ASCII whitespace</a> from <var>input</var>, given <var>position</var>.
 674 | 
 675 |    <li><p><a for="list">Append</a> <var>token</var> to <var>tokens</var>.
 676 | 
 677 |    <li><p><a>Skip ASCII whitespace</a> within <var>input</var> given <var>position</var>.
 678 |   </ol>
 679 |  </li>
 680 | 
 681 |  <li><p>Return <var>tokens</var>.
 682 | </ol>
 683 | 
 684 | <p>To <dfn export lt="split on commas|split a string on commas">split a <a>string</a>
 685 | <var>input</var> on commas</dfn>:
 686 | 
 687 | <ol>
 688 |  <li><p>Let <var>position</var> be a <a>position variable</a> for <var>input</var>, initially
 689 |  pointing at the start of <var>input</var>.
 690 | 
 691 |  <li><p>Let <var>tokens</var> be a <a>list</a> of <a>strings</a>, initially empty.
 692 | 
 693 |  <li>
 694 |   <p>While <var>position</var> is not past the end of <var>input</var>:
 695 | 
 696 |   <ol>
 697 |    <li>
 698 |     <p>Let <var>token</var> be the result of <a>collecting a sequence of code points</a> that are
 699 |     not U+002C (,) from <var>input</var>, given <var>position</var>.
 700 | 
 701 |     <p class=note><var>token</var> might be the empty string.
 702 |    </li>
 703 | 
 704 |    <li><p><a>Strip leading and trailing ASCII whitespace</a> from <var>token</var>.
 705 | 
 706 |    <li><p><a for="list">Append</a> <var>token</var> to <var>tokens</var>.
 707 | 
 708 |    <li>
 709 |     <p>If <var>position</var> is not past the end of <var>input</var>, then:
 710 | 
 711 |     <ol>
 712 |      <li><p><a>Assert</a>: the <a>code point</a> at <var>position</var> within <var>input</var> is
 713 |      U+002C (,).
 714 | 
 715 |      <li><p>Advance <var>position</var> by 1.
 716 |     </ol>
 717 |    </li>
 718 |   </ol>
 719 |  </li>
 720 | 
 721 |  <li><p>Return <var>tokens</var>.
 722 | </ol>
 723 | 
 724 | <p>To <dfn export for=string lt=concatenate|concatenation>concatenate</dfn> a <a for=/>list</a> of
 725 | <a for=/>strings</a> <var>list</var>, using an optional separator string <var>separator</var>, run
 726 | these steps:
 727 | 
 728 | <ol>
 729 |  <li><p>If <var>list</var> <a for=list>is empty</a>, then return the empty string.
 730 | 
 731 |  <li><p>If <var>separator</var> is not given, then set <var>separator</var> to the empty string.
 732 | 
 733 |  <li><p>Return a <a for=/>string</a> whose contents are <var>list</var>'s <a for=list>items</a>, in
 734 |  order, separated from each other by <var>separator</var>.
 735 | </ol>
 736 | 
 737 | <p class=example id=example-string-concatenate>To serialize a set <var>set</var>, return the
 738 | <a for=string>concatenation</a> of <var>set</var> using U+0020 SPACE.
 739 | 
 740 | 
 741 | <h2 id=data-structures>Data structures</h2>
 742 | 
 743 | <p>Conventionally, specifications have operated on a variety of vague specification-level data
 744 | structures, based on shared understanding of their semantics. This generally works well, but can
 745 | lead to ambiguities around edge cases, such as iteration order or what happens when you
 746 | <a for=set>append</a> an <a for=set>item</a> to an <a>ordered set</a> that the set already
 747 | <a for=set>contains</a>. It has also led to a variety of divergent notation and phrasing, especially
 748 | around more complex data structures such as <a lt="ordered map">maps</a>.
 749 | 
 750 | <p>This standard provides a small set of common data structures, along with notation and phrasing
 751 | for working with them, in order to create common ground.
 752 | 
 753 | 
 754 | <h3 id=lists>Lists</h3>
 755 | 
 756 | <p>A <dfn export>list</dfn> is a specification type consisting of a finite ordered sequence of
 757 | <dfn export for=list,stack,queue,set lt=item>items</dfn>.
 758 | 
 759 | <p>For notational convenience, a literal syntax can be used to express <a>lists</a>, by surrounding
 760 | the list by « » characters and separating its <a for=list>items</a> with a comma. An indexing syntax
 761 | can be used by providing a zero-based index into a list inside square brackets. The index cannot be
 762 | out-of-bounds, except when used with <a for=list>exists</a>.
 763 | 
 764 | <p class=example id=example-list-notation>Let |example| be the <a>list</a> « "<code>a</code>",
 765 | "<code>b</code>", "<code>c</code>", "<code>a</code>" ». Then |example|[1] is the <a>string</a>
 766 | "<code>b</code>".
 767 | 
 768 | <hr>
 769 | 
 770 | <p>To <dfn export for=list>append</dfn> to a <a>list</a> that is not an <a>ordered set</a> is to
 771 | add the given <a for=list>item</a> to the end of the list.
 772 | 
 773 | <p>To <dfn export for=list>prepend</dfn> to a <a>list</a> that is not an <a>ordered set</a> is to
 774 | add the given <a for=list>item</a> to the beginning of the list.
 775 | 
 776 | <p>To <dfn export for=list>replace</dfn> within a <a>list</a> that is not an <a>ordered set</a> is
 777 | to replace all items from the list that match a given condition with the given <a for=list>item</a>,
 778 | or do nothing if none do.
 779 | 
 780 | <p class=note>The above definitions are modified when the <a>list</a> is an <a>ordered set</a>; see
 781 | below for <a for=set lt=append>ordered set append</a>, <a for=set>prepend</a>, and
 782 | <a for=set>replace</a>.
 783 | 
 784 | <p>To <dfn export for=list,set>insert</dfn> an <a for=list>item</a> into a <a>list</a> before an
 785 | index is to add the given item to the list between the given index &minus; 1 and the given index. If
 786 | the given index is 0, then <a for=list>prepend</a> the given item to the list.
 787 | 
 788 | <p>To <dfn export for=list,set>remove</dfn> zero or more <a for=list>items</a> from a <a>list</a> is
 789 | to remove all items from the list that match a given condition, or do nothing if none do.
 790 | 
 791 | <div class=example id=example-list-remove>
 792 |  <p><a for=list>Removing</a> |x| from the <a>list</a> « |x|, |y|, |z|, |x| » is to remove all
 793 |  items from the list that are equal to |x|. The list now is equivalent to « |y|, |z| ».
 794 | 
 795 |  <p><a for=list>Removing</a> all items that start with the <a>string</a> "<code>a</code>" from the
 796 |  <a>list</a> « "<code>a</code>", "<code>b</code>", "<code>ab</code>", "<code>ba</code>" » is to
 797 |  remove the items "<code>a</code>" and "<code>ab</code>". The list is now equivalent to «
 798 |  "<code>b</code>", "<code>ba</code>" ».
 799 | </div>
 800 | 
 801 | <p>To <dfn export for=list,stack,queue,set>empty</dfn> a <a>list</a> is to <a for=list>remove</a>
 802 | all of its <a for=list>items</a>.
 803 | 
 804 | <p>A <a>list</a> <dfn export for=list,stack,queue,set lt=contain|exist>contains</dfn> an
 805 | <a for=list>item</a> if it appears in the list. We can also denote this by saying that, for a
 806 | <a>list</a> |list| and an index |index|, "|list|[|index|] <a for=list>exists</a>".
 807 | 
 808 | <p>A <a>list</a>'s <dfn export for=list,stack,queue,set>size</dfn> is the number of
 809 | <a for=list>items</a> the list <a for=list>contains</a>.
 810 | 
 811 | <p>A <a>list</a> <dfn export for=list,stack,queue,set lt="is empty|is not empty">is empty</dfn> if
 812 | its <a for=list>size</a> is zero.
 813 | 
 814 | <p>To <dfn export for=list,set lt="iterate|for each">iterate</dfn> over a <a>list</a>, performing a
 815 | set of steps on each <a for=list>item</a> in order, use phrasing of the form
 816 | "<a for=list>For each</a> |item| of <var ignore>list</var>", and then operate on |item| in the
 817 | subsequent prose.
 818 | 
 819 | <p>To <dfn export for=list,stack,queue,set>clone</dfn> a <a>list</a> |list| is to create a new
 820 | <a>list</a> |clone|, of the same designation, and, <a for=list>for each</a> |item| of |list|,
 821 | <a for=list>append</a> |item| to |clone|, so that |clone| <a for=list>contains</a> the same
 822 | <a for=list>items</a>, in the same order as |list|.
 823 | 
 824 | Note: This is a "shallow clone", as the <a for=list>items</a> themselves are not cloned in any way.
 825 | 
 826 | <p class=example id=example-list-clone>Let |original| be the <a>ordered set</a> «
 827 | "<code>a</code>", "<code>b</code>", "<code>c</code>" ». <a for=set>Cloning</a> |original| creates
 828 | a new <a>ordered set</a> |clone|, so that <a for=set>replacing</a> "<code>a</code>" with
 829 | "<code>foo</code>" in |clone| gives « "<code>foo</code>", "<code>b</code>", "<code>c</code>" »,
 830 | while |original|[0] is still the <a>string</a> "<code>a</code>".
 831 | 
 832 | <hr>
 833 | 
 834 | <p>The <a>list</a> type originates from the JavaScript specification (where it is capitalized, as
 835 | <a spec=ecma-262>List</a>); we repeat some elements of its definition here for ease of reference,
 836 | and provide an expanded vocabulary for manipulating <a>lists</a>. Whenever JavaScript expects a
 837 | <a spec=ecma-262>List</a>, a <a>list</a> as defined here can be used; they are the same type.
 838 | [[!ECMA-262]]
 839 | 
 840 | <h4 id=stacks>Stacks</h4>
 841 | 
 842 | <p>Some <a>lists</a> are designated as <dfn export lt=stack>stacks</dfn>. A stack is a <a>list</a>,
 843 | but conventionally, the following operations are used to operate on it, instead of using
 844 | <a for=list>append</a>, <a for=list>prepend</a>, or <a for=list>remove</a>.
 845 | 
 846 | <p>To <dfn export for=stack>push</dfn> onto a <a>stack</a> is to <a for=list>append</a> to it.
 847 | 
 848 | <p>To <dfn export for=stack>pop</dfn> from a <a>stack</a> is to <a for=list>remove</a> its last
 849 | <a for=stack>item</a> and return it, if the <a>stack</a> <a for=stack>is not empty</a>, or to return
 850 | nothing otherwise.
 851 | 
 852 | <p>Although <a>stacks</a> are <a>lists</a>, <a for=list>for each</a> must not be used with them;
 853 | instead, a combination of <a>while</a> and <a for=stack>pop</a> is more appropriate.
 854 | 
 855 | <h4 id=queues>Queues</h4>
 856 | 
 857 | <p>Some <a>lists</a> are designated as <dfn export lt=queue>queues</dfn>. A queue is a <a>list</a>,
 858 | but conventionally, the following operations are used to operate on it, instead of using
 859 | <a for=list>append</a>, <a for=list>prepend</a>, or <a for=list>remove</a>.
 860 | 
 861 | <p>To <dfn export for=queue>enqueue</dfn> in a <a>queue</a> is to <a for=list>append</a> to it.
 862 | 
 863 | <p>To <dfn export for=queue>dequeue</dfn> from a <a>queue</a> is to <a for=list>remove</a> its first
 864 | <a for=queue>item</a> and return it, if the <a>queue</a> <a for=queue>is not empty</a>, or to return
 865 | nothing otherwise.
 866 | 
 867 | <p>Although <a>queues</a> are <a>lists</a>, <a for=list>for each</a> must not be used with them;
 868 | instead, a combination of <a>while</a> and <a for=queue>dequeue</a> is more appropriate.
 869 | 
 870 | <h4 id=sets>Sets</h4>
 871 | 
 872 | <p>Some <a>lists</a> are designated as <dfn export lt="ordered set|set">ordered sets</dfn>. An
 873 | ordered set is a <a>list</a> with the additional semantic that it must not contain the same
 874 | <a for=set>item</a> twice.
 875 | 
 876 | <p class=note>Almost all cases on the web platform require an <em>ordered</em> set, instead of an
 877 | unordered one, since interoperability requires that any developer-exposed enumeration of the set's
 878 | contents be consistent between browsers. In those cases where order is not important, we still use
 879 | ordered sets; implementations can optimize based on the fact that the order is not observable.
 880 | 
 881 | <p>To <dfn export for=set>append</dfn> to an <a>ordered set</a> is to do nothing if the set already
 882 | <a for=list>contains</a> the given <a for=set>item</a>, or to perform the normal <a>list</a>
 883 | <a for=list>append</a> operation otherwise.
 884 | 
 885 | <p>To <dfn export for=set>prepend</dfn> to an <a>ordered set</a> is to do nothing if the set already
 886 | <a for=list>contains</a> the given <a for=set>item</a>, or to perform the normal <a>list</a>
 887 | <a for=list>prepend</a> operation otherwise.
 888 | 
 889 | <p>To <dfn export for=set lt=replace|replacing>replace</dfn> within an <a>ordered set</a>
 890 | <var>set</var>, given <var>item</var> and <var>replacement</var>: if <var>set</var>
 891 | <a for=set>contains</a> <var>item</var> or <var>replacement</var>, then replace the first instance
 892 | of either with <var>replacement</var> and <a for=set>remove</a> all other instances.
 893 | 
 894 | <p class=example id=example-set-replace><a for="set">Replacing</a> "a" with "c" within the
 895 | <a>ordered set</a> « "a", "b", "c" » gives « "c", "b" ». Within « "c", "b", "a" » it gives
 896 | « "c", "b" » as well.
 897 | 
 898 | <p>An <a>ordered set</a> |set| is a <dfn export for=set>subset</dfn> of another <a>ordered set</a>
 899 | |superset| (and conversely, |superset| is a <dfn export for=set>superset</dfn> of |set|) if,
 900 | <a for=list>for each</a> |item| of |set|, |superset| <a for=set>contains</a> |item|.
 901 | 
 902 | <p class=note>This implies that an <a>ordered set</a> is both a <a for=set>subset</a> and a
 903 | <a for=set>superset</a> of itself.
 904 | 
 905 | <p>The <dfn export for=set>intersection</dfn> of <a>ordered sets</a> |A| and |B| is the result
 906 | of creating a new <a>ordered set</a> |set| and, <a for=list>for each</a> |item| of |A|, if |B|
 907 | <a for=set>contains</a> |item|, <a for=set>appending</a> |item| to |set|.
 908 | 
 909 | <p>The <dfn export for=set>union</dfn> of <a>ordered sets</a> |A| and |B| is the result of
 910 | <a for=list>cloning</a> |A| as |set| and, <a for=list>for each</a> |item| of |B|,
 911 | <a for=set>appending</a> |item| to |set|.
 912 | 
 913 | <hr>
 914 | 
 915 | <p><dfn export lt="the range">The range</dfn> <var>n</var> to <var>m</var>, inclusive, creates a new
 916 | <a>ordered set</a> containing all of the integers from <var>n</var> up to and including <var>m</var>
 917 | in consecutively increasing order, as long as <var>m</var> is greater than or equal to
 918 | <var>n</var>.
 919 | 
 920 | <p class=example id=example-the-range><a for=set>For each</a> <var>n</var> of <a>the range</a> 1 to
 921 | 4, inclusive, &hellip;
 922 | 
 923 | 
 924 | <h3 id=maps>Maps</h3>
 925 | 
 926 | <p>An <dfn export lt="ordered map|map">ordered map</dfn>, or sometimes just "map", is a
 927 | specification type consisting of a finite ordered sequence of
 928 | <dfn for=map export>key</dfn>/<dfn for=map export>value</dfn> pairs, with no key appearing twice.
 929 | Each key/value pair is called an <dfn for=map export>entry</dfn>.
 930 | 
 931 | <p class=note>As with <a>ordered sets</a>, by default we assume that maps need to be ordered for
 932 | interoperability among implementations.
 933 | 
 934 | <p>A literal syntax can be used to express <a>ordered maps</a>, by surrounding the ordered map with
 935 | «[ ]» characters, denoting each of its <a for=map>entries</a> as |key| → |value|, and separating its
 936 | entries with a comma. An indexing syntax can be used to look up and set <a for=map>values</a> by
 937 | providing a <a for=map>key</a> inside square brackets.
 938 | 
 939 | <p class=example id=example-map-notation>Let |example| be the <a>ordered map</a> «[
 940 | "<code>a</code>" → `<code>x</code>`, "<code>b</code>" → `<code>y</code>` ]». Then
 941 | |example|["<code>a</code>"] is the <a>byte sequence</a> `<code>x</code>`.
 942 | 
 943 | <hr>
 944 | 
 945 | <p>To <dfn export for=map lt="get|get the value">get the value of an entry</dfn> in an
 946 | <a>ordered map</a> given a <a for=map>key</a> is to retrieve the <a for=map>value</a> of any
 947 | existing <a for=map>entry</a> if the map <a for=map>contains</a> an entry with the given key, or
 948 | to return nothing otherwise. We can also use the indexing syntax explained above.
 949 | 
 950 | <p>To <dfn export for=map lt="set|set the value">set the value of an entry</dfn> in an
 951 | <a>ordered map</a> to a given <a for=map>value</a> is to update the value of any existing
 952 | <a for=map>entry</a> if the map <a for=map>contains</a> an entry with the given <a for=map>key</a>,
 953 | or if none such exists, to add a new entry with the given key/value to the end of the map. We can
 954 | also denote this by saying, for an <a>ordered map</a> |map|, key |key|, and value |value|,
 955 | "<a for=map>set</a> |map|[|key|] to |value|".
 956 | 
 957 | <p>To <dfn export for=map lt=remove>remove an entry</dfn> from an <a>ordered map</a> is to remove
 958 | all <a for=map>entries</a> from the map that match a given condition, or do nothing if none do. If
 959 | the condition is having a certain <a for=map>key</a>, then we can also denote this by saying, for
 960 | an <a>ordered map</a> |map| and key |key|, "<a for=map>remove</a> |map|[|key|]".
 961 | 
 962 | <p>An <a>ordered map</a> <dfn export for=map lt=exist|contain id=map-exists>contains an
 963 | <a for=map>entry</a> with a given key</dfn> if there exists an entry with that <a for=map>key</a>.
 964 | We can also denote this by saying that, for an <a>ordered map</a> |map| and key |key|, "|map|[|key|]
 965 | <a for=map>exists</a>".
 966 | 
 967 | <p>To <dfn export for=map lt="getting the keys|get the keys">get the keys</dfn> of an
 968 | <a>ordered map</a>, return a new <a>ordered set</a> whose <a for=set>items</a> are each of the
 969 | <a for=map>keys</a> in the map's <a for=map>entries</a>.
 970 | 
 971 | <p>To <dfn export for=map lt="getting the values|get the values">get the values</dfn> of an
 972 | <a>ordered map</a>, return a new <a>list</a> whose <a for=list>items</a> are each of the
 973 | <a for=map>values</a> in the map's <a for=map>entries</a>.
 974 | 
 975 | <p>An <a>ordered map</a>'s <dfn export for=map>size</dfn> is the <a for=set>size</a> of the result
 976 | of running <a for=map>get the keys</a> on the map.
 977 | 
 978 | <p>An <a>ordered map</a> <dfn export for=map lt="is empty|is not empty">is empty</dfn> if its
 979 | <a for=map>size</a> is zero.
 980 | 
 981 | <p>To <dfn export for=map lt="iterate|for each">iterate</dfn> over an <a>ordered map</a>, performing
 982 | a set of steps on each <a for=map>entry</a> in order, use phrasing of the form
 983 | "<a for=map>For each</a> |key| → |value| of |map|", and then operate on |key| and |value| in the
 984 | subsequent prose.
 985 | 
 986 | 
 987 | <h3 id=structs>Structs</h3>
 988 | 
 989 | <p>A <dfn export>struct</dfn> is a specification type consisting of a finite set of
 990 | <dfn export for=struct,tuple,pair lt=item>items</dfn>, each of which has a unique and immutable
 991 | <dfn export for=struct,tuple,pair>name</dfn>.
 992 | 
 993 | <hr>
 994 | 
 995 | <p><a>Structs</a> with a defined order are also known as <dfn export lt=tuple>tuples</dfn>. For
 996 | notational convenience, a literal syntax can be used to express <a>tuples</a>, by surrounding the
 997 | tuple with parentheses and separating its <a for=tuple>items</a> with a comma. To use this notation,
 998 | the <a for=tuple>names</a> need to be clear from context. This can be done by preceding the first
 999 | instance with the name given to the <a>tuple</a>.
1000 | 
1001 | <div class=example id=example-tuple>
1002 |  <!-- If https://github.com/tabatkins/bikeshed/issues/960 gets fixed we can show how to use <dfn>
1003 |  and <a> on these -->
1004 |  <p>A status is an example <a>tuple</a> consisting of a code (a three-digit number) and text (a byte
1005 |  sequence).
1006 | 
1007 |  <p>A nonsense algorithm that manipulates status tuples for the purpose of demonstrating their
1008 |  usage is then:</p>
1009 | 
1010 |  <ol>
1011 |   <li>Let |statusInstance| be the status (200, `<code>OK</code>`).
1012 |   <li>Set |statusInstance| to (301, `<code>FOO BAR</code>`).
1013 |   <li>If |statusInstance|'s code is 404, then &hellip;
1014 |  </ol>
1015 | </div>
1016 | 
1017 | <p class=note>It is intentional that not all <a>structs</a> are <a>tuples</a>. Documents using the
1018 | Infra Standard might need the flexibility to add new <a for=struct>names</a> to their struct
1019 | without breaking literal syntax used by their dependencies. In that case a tuple is not appropriate.
1020 | 
1021 | <hr>
1022 | 
1023 | <p><a>Tuples</a> with two <a for=tuple>items</a> are also known as <dfn export lt=pair>pairs</dfn>.
1024 | For <a>pairs</a>, a slightly shorter literal syntax can be used, separating the two
1025 | <a for=pair>items</a> with a / character.
1026 | 
1027 | <p class=example id=example-pair>Another way of expressing our |statusInstance| tuple above would be
1028 | as 200/`<code>OK</code>`.
1029 | 
1030 | 
1031 | <h2 id=json>JSON</h2>
1032 | 
1033 | <p>To <dfn export>parse JSON from bytes</dfn> given <var>bytes</var>, run these steps:
1034 | 
1035 | <ol>
1036 |  <li><p>Let <var>jsonText</var> be the result of running <a>UTF-8 decode</a> on <var>bytes</var>.
1037 |  [[!ENCODING]]
1038 | 
1039 |  <li>
1040 |   <p>Return ? <a abstract-op>Call</a>(<a>%JSONParse%</a>, undefined, « <var>jsonText</var> »).
1041 |   [[!ECMA-262]]
1042 | 
1043 |   <p class=note>The conventions used in this step are those of the JavaScript specification.
1044 | </ol>
1045 | 
1046 | 
1047 | <h2 id=forgiving-base64>Forgiving base64</h2>
1048 | 
1049 | <p>To <dfn export>forgiving-base64 encode</dfn> given a <a>byte sequence</a> <var>data</var>, apply
1050 | the base64 algorithm defined in section 4 of RFC 4648 to <var>data</var> and return the result.
1051 | [[!RFC4648]]
1052 | 
1053 | <p class="note no-backref">This is named <a>forgiving-base64 encode</a> for symmetry with
1054 | <a>forgiving-base64 decode</a>, which is different from the RFC as it defines error handling for
1055 | certain inputs.
1056 | 
1057 | <p>To <dfn export>forgiving-base64 decode</dfn> given a string <var>data</var>, run these steps:</p>
1058 | 
1059 | <ol>
1060 |  <li><p>Remove all <a>ASCII whitespace</a> from <var>data</var>.
1061 |  <!-- https://lists.w3.org/Archives/Public/public-whatwg-archive/2011May/0207.html -->
1062 | 
1063 |  <li>
1064 |   <p>If <var>data</var>'s <a for=string>length</a> divides by 4 leaving no remainder, then:
1065 | 
1066 |   <ol>
1067 |    <li><p>If <var>data</var> ends with one or two U+003D (=) <a>code points</a>, then remove them
1068 |    from <var>data</var>.
1069 |   </ol>
1070 | 
1071 |  <li><p>If <var>data</var>'s <a for=string>length</a> divides by 4 leaving a remainder of 1, then
1072 |  return failure.
1073 | 
1074 |  <li>
1075 |   <p>If <var>data</var> contains a <a>code point</a> that is not one of
1076 | 
1077 |   <ul class="brief">
1078 |    <li>U+002B (+)
1079 |    <li>U+002F (/)
1080 |    <li><a>ASCII alphanumeric</a>
1081 |   </ul>
1082 | 
1083 |   <p>then return failure.
1084 | 
1085 |  <li><p>Let <var>output</var> be an empty <a>byte sequence</a>.
1086 | 
1087 |  <li><p>Let <var>buffer</var> be an empty buffer that can have bits appended to it.
1088 | 
1089 |  <li><p>Let <var>position</var> be a <a>position variable</a> for <var>data</var>, initially
1090 |  pointing at the start of <var>data</var>.
1091 | 
1092 |  <li>
1093 |   <p>While <var>position</var> does not point past the end of <var>data</var>:
1094 | 
1095 |   <ol>
1096 |    <li><p>Find the <a>code point</a> pointed to by <var>position</var> in the second column of
1097 |    Table 1: The Base 64 Alphabet of RFC 4648. Let <var>n</var> be the number given in the first cell
1098 |    of the same row. [[!RFC4648]]
1099 | 
1100 |    <li><p>Append the six bits corresponding to <var>n</var>, most significant bit first, to
1101 |    <var>buffer</var>.
1102 | 
1103 |    <li><p>If <var>buffer</var> has accumulated 24 bits, interpret them as three 8-bit big-endian
1104 |    numbers. Append three bytes with values equal to those numbers to <var>output</var>, in the same
1105 |    order, and then empty <var>buffer</var>.
1106 | 
1107 |    <li><p>Advance <var>position</var> by 1.
1108 |   </ol>
1109 | 
1110 |  <li>
1111 |   <p>If <var>buffer</var> is not empty, it contains either 12 or 18 bits. If it contains 12 bits,
1112 |   then discard the last four and interpret the remaining eight as an 8-bit big-endian number. If it
1113 |   contains 18 bits, then discard the last two and interpret the remaining 16 as two 8-bit big-endian
1114 |   numbers. Append the one or two bytes with values equal to those one or two numbers to
1115 |   <var>output</var>, in the same order.</p>
1116 | 
1117 |   <p class="note">The discarded bits mean that, for instance, "<code>YQ</code>" and
1118 |   "<code>YR</code>" both return `<code>a</code>`.
1119 | 
1120 |  <li><p>Return <var>output</var>.
1121 | </ol>
1122 | 
1123 | 
1124 | <h2 id=namespaces>Namespaces</h2>
1125 | 
1126 | <p>The <dfn export>HTML namespace</dfn> is "<code>http://www.w3.org/1999/xhtml</code>".
1127 | 
1128 | <p>The <dfn export>MathML namespace</dfn> is "<code>http://www.w3.org/1998/Math/MathML</code>".
1129 | 
1130 | <p>The <dfn export>SVG namespace</dfn> is "<code>http://www.w3.org/2000/svg</code>".
1131 | 
1132 | <p>The <dfn export>XLink namespace</dfn> is "<code>http://www.w3.org/1999/xlink</code>".
1133 | 
1134 | <p>The <dfn export>XML namespace</dfn> is "<code>http://www.w3.org/XML/1998/namespace</code>".
1135 | 
1136 | <p>The <dfn export>XMLNS namespace</dfn> is "<code>http://www.w3.org/2000/xmlns/</code>".
1137 | 
1138 | 
1139 | <h2 class=no-num id=acknowledgments>Acknowledgments</h2>
1140 | 
1141 | <p>Many thanks to
1142 | Addison Phillips,
1143 | Aryeh Gregor,
1144 | Chris Rebert,
1145 | Daniel Ehrenberg,
1146 | Dominic Farolino,
1147 | Jake Archibald,
1148 | Jungkee Song,
1149 | Leonid Vasilyev,
1150 | Malika Aubakirova,
1151 | Michael™ Smith,
1152 | Mike West,
1153 | Ms2ger,
1154 | Philip Jägenstedt,
1155 | Rashaun "Snuggs" Stovall,
1156 | Sergey Shekyan,
1157 | Simon Pieters,
1158 | Tab Atkins,
1159 | Tobie Langel,
1160 | triple-underscore,
1161 | and Xue Fuqiao
1162 | for being awesome!
1163 | 
1164 | <p>This standard is written by <a lang=nl href=https://annevankesteren.nl/>Anne van Kesteren</a>
1165 | (<a href=https://www.mozilla.org/>Mozilla</a>,
1166 | <a href=mailto:annevk@annevk.nl>annevk@annevk.nl</a>) and
1167 | <a href=https://domenic.me/>Domenic Denicola</a> (<a href=https://www.google.com/>Google</a>,
1168 | <a href=mailto:d@domenic.me>d@domenic.me</a>).
1169 | 


--------------------------------------------------------------------------------
/review-drafts/2019-01.bs:
--------------------------------------------------------------------------------
   1 | <pre class='metadata'>
   2 | Group: WHATWG
   3 | Date: 2019-01-23
   4 | H1: Infra
   5 | Shortname: infra
   6 | Text Macro: TWITTER infrastandard
   7 | Abstract: The Infra Standard aims to define the fundamental concepts upon which standards are built.
   8 | Translation: ja https://triple-underscore.github.io/infra-ja.html
   9 | </pre>
  10 | 
  11 | <pre class="anchors">
  12 | urlPrefix: https://tc39.github.io/ecma262/; spec: ECMA-262;
  13 |     type: dfn
  14 |         text: %JSONParse%; url: sec-json.parse
  15 |         text: %JSONStringify%; url: #sec-json.stringify
  16 |         text: List; url: sec-list-and-record-specification-type
  17 |         text: The String Type; url: sec-ecmascript-language-types-string-type
  18 |     type: abstract-op; text: Call; url: sec-call
  19 | </pre>
  20 | 
  21 | 
  22 | <h2 id=goals class=no-num>Goals</h2>
  23 | 
  24 | <ul>
  25 |  <li><p>Deduplicate boilerplate in standards.
  26 | 
  27 |  <li><p>Align standards on conventions, terminology, and data structures.
  28 | 
  29 |  <li><p>Be a place for concepts used by multiple standards without a good home.
  30 | 
  31 |  <li><p>Help write clear and readable algorithmic prose by clarifying otherwise ambiguous concepts.
  32 | </ul>
  33 | 
  34 | <p>Suggestions for more goals are welcome.</p>
  35 | 
  36 | 
  37 | <h2 id=usage>Usage</h2>
  38 | 
  39 | <p>To make use of the Infra Standard in a document titled <var>X</var>, use
  40 | <samp><var>X</var> depends on the Infra Standard</samp>. Additionally, cross-referencing terminology
  41 | is encouraged to avoid ambiguity.
  42 | 
  43 | <p>Specification authors are also encouraged to add their specification to the
  44 | <a href=https://github.com/whatwg/infra/wiki/Dependent-specs>list of dependent specifications</a> in
  45 | order to help the editors ensure that any future breaking changes to the Infra Standard are
  46 | correctly reflected by any such dependencies.
  47 | 
  48 | 
  49 | <h2 id=conventions>Conventions</h2>
  50 | 
  51 | <h3 id=conformance>Conformance</h3>
  52 | 
  53 | <p>All assertions, diagrams, examples, and notes are non-normative, as are all sections explicitly
  54 | marked non-normative. Everything else is normative.
  55 | 
  56 | <p>The keywords "MUST", "MUST NOT", "REQUIRED", "SHALL", "SHALL NOT", "SHOULD", "SHOULD NOT",
  57 | "RECOMMENDED", "NOT RECOMMENDED", "MAY", and "OPTIONAL" are to be interpreted as described in
  58 | RFC 2119. [[!RFC2119]]
  59 | 
  60 | <p>These keywords have equivalent meaning when written in lowercase and cannot appear in
  61 | non-normative content.
  62 | 
  63 | <p class=note>This is a <a>willful violation</a> of RFC 8174, motivated by legibility and a desire
  64 | to preserve long-standing practice in many non-IETF-published pre-RFC 8174 documents. [[RFC8174]]
  65 | 
  66 | <p>All of the above is applicable to both this standard and any document that uses this standard.
  67 | Documents using this standard are encouraged to limit themselves to "must", "must not", "should",
  68 | and "may", and to use these in their lowercase form as that is generally considered to be more
  69 | readable.
  70 | 
  71 | <p>For non-normative content "strongly encouraged", "strongly discouraged", "encouraged",
  72 | "discouraged", "can", "cannot", "could", "could not", "might", and "might not" can be used instead.
  73 | 
  74 | 
  75 | <h3 id=other-specs>Compliance with other specifications</h3>
  76 | 
  77 | <p>In general, specifications interact with and rely on a wide variety of other specifications. In
  78 | certain circumstances, unfortunately, conflicting needs require a specification to violate the
  79 | requirements of other specifications. When this occurs, a document using the Infra Standard should
  80 | denote such transgressions as a <dfn export>willful violation</dfn>, and note the reason for that
  81 | violation.
  82 | 
  83 | <p class=example id=example-willful-violation>The previous section, [[#conformance]], documents a
  84 | <a>willful violation</a> of RFC 8174 committed by the Infra Standard.
  85 | 
  86 | 
  87 | <h3 id=terminology>Terminology</h3>
  88 | 
  89 | <p>The word "or", in cases where both inclusive "or" and exclusive "or" are possible (e.g., "if
  90 | either width or height is zero"), means an inclusive "or" (implying "or both"), unless it is called
  91 | out as being exclusive (with "but not both").
  92 | 
  93 | 
  94 | <h2 id=algorithms>Algorithms</h2>
  95 | 
  96 | <p>Algorithms, and requirements phrased in the imperative as part of algorithms (such as "strip any
  97 | leading spaces" or "return false") are to be interpreted with the meaning of the keyword (e.g.,
  98 | "must") used in introducing the algorithm or step. If no such keyword is used, must is implied.
  99 | 
 100 | <div class=example id=example-algorithms>
 101 |  <p>For example, were the spec to say:</p>
 102 | 
 103 |  <blockquote>
 104 |   <p class=allow-2119>To eat an orange, the user must:
 105 | 
 106 |   <ol class=brief>
 107 |    <li>Peel the orange.
 108 |    <li>Separate each slice of the orange.
 109 |    <li>Eat the orange slices.
 110 |   </ol>
 111 |  </blockquote>
 112 | 
 113 |  <p>it would be equivalent to the following:</p>
 114 | 
 115 |  <blockquote>
 116 |   <p>To eat an orange:
 117 | 
 118 |   <ol class=brief>
 119 |    <li class=allow-2119>The user must peel the orange.
 120 |    <li class=allow-2119>The user must separate each slice of the orange.
 121 |    <li class=allow-2119>The user must eat the orange slices.
 122 |   </ol>
 123 |  </blockquote>
 124 | 
 125 |  <p class=allow-2119>Here the key word is "must".</p>
 126 | 
 127 |  <p class=allow-2119>Modifying the above example, if the algorithm was introduced only with "To eat
 128 |  an orange:", it would still have the same meaning, as "must" is implied.
 129 | </div>
 130 | 
 131 | <p>Conformance requirements phrased as algorithms or specific steps may be implemented in any
 132 | manner, so long as the end result is equivalent. (In particular, the algorithms are intended to be
 133 | easy to follow, and not intended to be performant.)
 134 | 
 135 | <p class=note>Performance is tricky to get correct as it is influenced by user perception, computer
 136 | architectures, and different types of input that can change over time in how common they are. For
 137 | instance, a JavaScript engine likely has many different code paths for what is standardized as a
 138 | single algorithm, in order to optimize for speed or memory consumption. Standardizing all those code
 139 | paths would be an insurmountable task and not productive as they would not stand the test of time
 140 | as well as the single algorithm would. Therefore performance is best left as a field to compete
 141 | over.
 142 | 
 143 | 
 144 | <h3 id=variables>Variables</h3>
 145 | 
 146 | <p>A variable is declared with "let" and changed with "set".
 147 | 
 148 | <p class=example id=example-variable>Let |list| be a new <a>list</a>.</p>
 149 | 
 150 | <div class=example id=example-variable-null>
 151 |  <ol>
 152 |   <li><p>Let |value| be null.
 153 | 
 154 |   <li><p>If |input| is a <a>string</a>, then set |value| to |input|.
 155 | 
 156 |   <li><p>Otherwise, set |value| to |input|, <a>UTF-8 decoded</a>.
 157 | 
 158 |   <li><p><a>Assert</a>: |value| is a <a>string</a>.
 159 |  </ol>
 160 | </div>
 161 | 
 162 | <p class=example id=example-variable-ternary>Let <var ignore>activationTarget</var> be
 163 | <var ignore>target</var>, if <var ignore>isActivationEvent</var> is true and
 164 | <var ignore>target</var> has activation behavior, and null otherwise.
 165 | 
 166 | <p>Variables must not be used before they are declared. Variables are
 167 | <a href=https://en.wikipedia.org/wiki/Scope_(computer_science)#Block_scope>block scoped</a>.
 168 | Variables must not be declared more than once per algorithm.
 169 | 
 170 | 
 171 | <h3 id=algorithm-control-flow>Control flow</h3>
 172 | 
 173 | <p>The control flow of algorithms is such that a requirement to "return" or "throw" terminates the
 174 | algorithm the statement was in. "Return" will hand the given value, if any, to its caller. "Throw"
 175 | will make the caller automatically rethrow the given value, if any, and thereby terminate the
 176 | caller's algorithm. Using prose the caller has the ability to "catch" the exception and perform
 177 | another action.
 178 | 
 179 | 
 180 | <h3 id=algorithm-conditional-abort>Conditional abort</h3>
 181 | 
 182 | <p>Sometimes it is useful to stop performing a series of steps once a condition becomes true.
 183 | 
 184 | <p>To do this, state that a given series of steps will <dfn export>abort when</dfn> a specific
 185 | <var>condition</var> is reached. This indicates that the specified steps must be evaluated, not
 186 | as-written, but by additionally inserting a step before each of them that evaluates
 187 | <var>condition</var>, and if <var>condition</var> evaluates to true, skips the remaining steps.
 188 | 
 189 | <p>In such algorithms, the subsequent step can be annotated to run <dfn export>if aborted</dfn>, in
 190 | which case it must run if any of the preceding steps were skipped due to the <var>condition</var>
 191 | of the preceding <a>abort when</a> step evaluating to true.
 192 | 
 193 | <div class=example id=example-conditional-abort>
 194 |  <p>The following algorithm
 195 | 
 196 |  <ol>
 197 |   <li><p>Let |result| be an empty <a>list</a>.
 198 | 
 199 |   <li>
 200 |    <p>Run these steps, but <a>abort when</a> the user clicks the "Cancel" button:
 201 | 
 202 |    <ol>
 203 |     <li><p>Compute the first million digits of <var>π</var>, and <a for=list>append</a> the result
 204 |     to |result|.
 205 | 
 206 |     <li><p>Compute the first million digits of |e|, and <a for=list>append</a> the result to
 207 |     |result|.
 208 | 
 209 |     <li><p>Compute the first million digits of <var>φ</var>, and <a for=list>append</a> the result
 210 |     to |result|.
 211 |    </ol>
 212 |   </li>
 213 | 
 214 |   <li><p><a>If aborted</a>, <a for=list>append</a> "<code>Didn't finish!</code>" to |result|.
 215 |  </ol>
 216 | 
 217 |  <p>is equivalent to the more verbose formulation</p>
 218 | 
 219 |  <ol>
 220 |   <li><p>Let |result| be an empty <a>list</a>.
 221 | 
 222 |   <li>
 223 |    <p>If the user has not clicked the "Cancel" button, then:
 224 | 
 225 |    <ol>
 226 |     <li><p>Compute the first million digits of <var>π</var>, and <a for=list>append</a> the result
 227 |     to |result|.
 228 | 
 229 |     <li>
 230 |      <p>If the user has not clicked the "Cancel" button, then:
 231 | 
 232 |      <ol>
 233 |       <li><p>Compute the first million digits of |e|, and <a for=list>append</a> the result to
 234 |       |result|.
 235 | 
 236 |       <li><p>If the user has not clicked the "Cancel" button, then compute the first million digits
 237 |       of <var>φ</var>, and <a for=list>append</a> the result to |result|.
 238 |      </ol>
 239 |    </ol>
 240 | 
 241 |   <li><p>If the user clicked the "Cancel" button, then <a for=list>append</a>
 242 |   "<code>Didn't finish!</code>" to |result|.
 243 |  </ol>
 244 | </div>
 245 | 
 246 | <p class=note>Whenever this construct is used, implementations are allowed to evaluate
 247 | <var>condition</var> during the specified steps rather than before and after each step, as long as
 248 | the end result is indistinguishable. For instance, as long as |result| in the above example is not
 249 | mutated during a compute operation, the user agent could stop the computation.
 250 | 
 251 | 
 252 | <h3 id=algorithm-iteration>Iteration</h3>
 253 | 
 254 | <p>There's a variety of ways to repeat a set of steps until a condition is reached.
 255 | 
 256 | <p class=note>The Infra Standard is not (yet) exhaustive on this; please file an issue if you need
 257 | something.
 258 | 
 259 | <dl>
 260 |  <dt>For each
 261 |  <dd><p>As defined <a for=list lt="for each">for lists</a> (and derivatives) and
 262 |  <a for=map lt="for each">maps</a>.
 263 | 
 264 |  <dt><dfn export for=iteration lt=while>While</dfn>
 265 |  <dd>
 266 |   <p>An instruction to repeat a set of steps as long as a condition is met.
 267 | 
 268 |   <div class=example id=example-while>
 269 |    <p>While |condition| is "<code>met</code>":
 270 | 
 271 |    <ol>
 272 |     <li><p>&hellip;
 273 |    </ol>
 274 |   </div>
 275 | </dl>
 276 | 
 277 | <p>An iteration's flow can be controlled via requirements to
 278 | <dfn export for=iteration>continue</dfn> or <dfn export for=iteration>break</dfn>.
 279 | <a for=iteration>Continue</a> will skip over any remaining steps in an iteration, proceeding to the
 280 | next item. If no further items remain, the iteration will stop. <a for=iteration>Break</a> will skip
 281 | over any remaining steps in an iteration, and skip over any remaining items as well, stopping the
 282 | iteration.
 283 | 
 284 | <div class=example id=example-break-continue>
 285 |  <p>Let |example| be the <a>list</a> « 1, 2, 3, 4 ». The following prose would perform |operation|
 286 |  upon 1, then 2, then 3, then 4:
 287 | 
 288 |  <ol>
 289 |   <li>
 290 |    <p><a for=list>For each</a> |item| of |example|:
 291 |    <ol>
 292 |     <li>Perform |operation| on |item|.
 293 |    </ol>
 294 |   </li>
 295 |  </ol>
 296 | 
 297 |  <p>The following prose would perform |operation| upon 1, then 2, then 4. 3 would be skipped.
 298 | 
 299 |  <ol>
 300 |   <li>
 301 |    <p><a for=list>For each</a> |item| of |example|:
 302 |    <ol>
 303 |     <li>If |item| is 3, then <a for=iteration>continue</a>.
 304 |     <li>Perform |operation| on |item|.
 305 |    </ol>
 306 |   </li>
 307 |  </ol>
 308 | 
 309 |  <p>The following prose would perform |operation| upon 1, then 2. 3 and 4 would be skipped.
 310 | 
 311 |  <ol>
 312 |   <li>
 313 |    <p><a for=list>For each</a> |item| of |example|:
 314 |    <ol>
 315 |     <li>If |item| is 3, then <a for=iteration>break</a>.
 316 |     <li>Perform |operation| on |item|.
 317 |    </ol>
 318 |   </li>
 319 |  </ol>
 320 | </div>
 321 | 
 322 | 
 323 | <h3 id=assertions>Assertions</h3>
 324 | 
 325 | <p>To improve readability, it can sometimes help to add assertions to algorithms, stating
 326 | invariants. To do this, write "<dfn export>Assert</dfn>:", followed by a statement that must be
 327 | true. If the statement ends up being false that indicates an issue with the document using the Infra
 328 | Standard that should be reported and addressed.
 329 | 
 330 | <p class=note>Since the statement can only ever be true, it has no implications for implementations.
 331 | 
 332 | <div class=example id=example-assert>
 333 |  <ol>
 334 |   <li><p>Let |x| be "<code>Aperture Science</code>".
 335 |   <li><p><a>Assert</a>: |x| is "<code>Aperture Science</code>".
 336 |  </ol>
 337 | </div>
 338 | 
 339 | <h2 id=primitive-data-types>Primitive data types</h2>
 340 | 
 341 | <h3 id=nulls>Nulls</h3>
 342 | 
 343 | <p>The value null is used to indicate the lack of a value. It can be used interchangeably with the
 344 | JavaScript <b>null</b> value. [[!ECMA-262]]
 345 | 
 346 | <p class=example id=example-null>Let <var ignore>element</var> be null.
 347 | 
 348 | <p class=example id=example-null-return>If <var>input</var> is the empty string, then return null.
 349 | 
 350 | 
 351 | <h3 id=booleans>Booleans</h3>
 352 | 
 353 | <p>A <dfn export>boolean</dfn> is either true or false.
 354 | 
 355 | <p class=example id=example-boolean>Let <var ignore>elementSeen</var> be false.
 356 | 
 357 | 
 358 | <h3 id=bytes>Bytes</h3>
 359 | 
 360 | <p>A <dfn export>byte</dfn> is a sequence of eight bits, represented as a double-digit hexadecimal
 361 | number in the range 0x00 to 0xFF, inclusive.
 362 | 
 363 | <p>An <dfn export>ASCII byte</dfn> is a <a>byte</a> in the range 0x00 (NUL) to 0x7F (DEL),
 364 | inclusive. As illustrated, an <a>ASCII byte</a>, excluding 0x28 and 0x29, may be followed by the
 365 | representation outlined in the <a href=https://tools.ietf.org/html/rfc20#section-2>Standard Code</a>
 366 | section of <cite>ASCII format for Network Interchange</cite>, between parentheses. [[!RFC20]]
 367 | 
 368 | <p>0x28 may be followed by "(left parenthesis)" and 0x29 by "(right parenthesis)".
 369 | 
 370 | <p class=example id=example-byte-notation>0x49 (I) when <a>UTF-8 decoded</a> becomes the
 371 | <a>code point</a> U+0049 (I).
 372 | 
 373 | 
 374 | <h3 id=byte-sequences>Byte sequences</h3>
 375 | 
 376 | <p>A <dfn export>byte sequence</dfn> is a sequence of <a>bytes</a>, represented as a space-separated
 377 | sequence of bytes. Byte sequences with bytes in the range 0x20 (SP) to 0x7E (~), inclusive, can
 378 | alternately be written as a string, but using backticks instead of quotation marks, to avoid
 379 | confusion with an actual <a>string</a>.
 380 | 
 381 | <div class=example id=example-byte-sequence-notation>
 382 |  <p>0x48 0x49 can also be represented as `<code>HI</code>`.
 383 | 
 384 |  <p>Headers, such as `<code>Content-Type</code>`, are <a>byte sequences</a>.
 385 | </div>
 386 | 
 387 | <p class=note>To get a <a>byte sequence</a> out of a <a>string</a>, using <a>UTF-8 encode</a> from
 388 | the Encoding Standard is encouraged. In rare circumstances <a>isomorphic encode</a> might be needed.
 389 | [[ENCODING]]
 390 | 
 391 | <p>A <a>byte sequence</a>'s <dfn export for="byte sequence">length</dfn> is the number of
 392 | <a>bytes</a> it contains.
 393 | 
 394 | <p>To <dfn export>byte-lowercase</dfn> a <a>byte sequence</a>, increase each <a>byte</a> it
 395 | contains, in the range 0x41 (A) to 0x5A (Z), inclusive, by 0x20.
 396 | 
 397 | <p>To <dfn export>byte-uppercase</dfn> a <a>byte sequence</a>, decrease each <a>byte</a> it
 398 | contains, in the range 0x61 (a) to 0x7A (z), inclusive, by 0x20.
 399 | 
 400 | <p>A <a>byte sequence</a> <var>A</var> is a <dfn export>byte-case-insensitive</dfn> match for a
 401 | <a>byte sequence</a> <var>B</var>, if the <a>byte-lowercase</a> of <var>A</var> is the
 402 | <a>byte-lowercase</a> of <var>B</var>.
 403 | 
 404 | <p>To <dfn export>isomorphic decode</dfn> a <a>byte sequence</a> <var>input</var>, return a
 405 | <a>string</a> whose <a for=string>length</a> is equal to <var>input</var>'s
 406 | <a for="byte sequence">length</a> and whose <a>code points</a> have the same values as
 407 | <var>input</var>'s <a>bytes</a>, in the same order.
 408 | 
 409 | 
 410 | <h3 id=code-points>Code points</h3>
 411 | 
 412 | <p>A <dfn export lt="code point|character">code point</dfn> is a Unicode code point and is
 413 | represented as a four-to-six digit hexadecimal number, typically prefixed with "U+".
 414 | 
 415 | <p>A <a>code point</a> may be followed by its name, by its rendered form between parentheses when it
 416 | is not U+0028 or U+0029, or by both. Documents using the Infra Standard are encouraged to follow
 417 | <a>code points</a> by their name when they cannot be rendered or are U+0028 or U+0029, and their
 418 | rendered form between parentheses otherwise, for legibility.
 419 | 
 420 | <p>A <a>code point</a>'s name is defined in the Unicode Standard and represented in
 421 | <a>ASCII uppercase</a>. [[!UNICODE]]
 422 | 
 423 | <div class=example id=example-code-point-notation>
 424 |  <p>The <a>code point</a> rendered as 🤔 is represented as U+1F914.
 425 | 
 426 |  <p>When referring to that <a>code point</a>, we might say "U+1F914 (🤔)", to provide extra context.
 427 |  Documents are allowed to use "U+1F914 THINKING FACE (🤔)" as well, though this is somewhat verbose.
 428 | </div>
 429 | 
 430 | <p class=example id=example-code-point-notation-hard-to-render><a>Code points</a> that are difficult
 431 | to render unambiguously, such as U+000A, can be referred to as "U+000A LF". U+0029 can be referred
 432 | to as "U+0029 RIGHT PARENTHESIS", because even though it renders, this avoids unmatched parentheses.
 433 | 
 434 | <p><a>Code points</a> are sometimes referred to as <a>characters</a> and in certain contexts are
 435 | prefixed with "0x" rather than "U+".
 436 | 
 437 | <p>A <dfn export>surrogate</dfn> is a <a>code point</a> that is in the range U+D800 to U+DFFF,
 438 | inclusive.
 439 | 
 440 | <p>A <dfn export>scalar value</dfn> is a <a>code point</a> that is not a <a>surrogate</a>.
 441 | 
 442 | <p>A <dfn export>noncharacter</dfn> is a <a>code point</a> that is in the range U+FDD0 to U+FDEF,
 443 | inclusive, or U+FFFE, U+FFFF, U+1FFFE, U+1FFFF, U+2FFFE, U+2FFFF, U+3FFFE, U+3FFFF, U+4FFFE,
 444 | U+4FFFF, U+5FFFE, U+5FFFF, U+6FFFE, U+6FFFF, U+7FFFE, U+7FFFF, U+8FFFE, U+8FFFF, U+9FFFE, U+9FFFF,
 445 | U+AFFFE, U+AFFFF, U+BFFFE, U+BFFFF, U+CFFFE, U+CFFFF, U+DFFFE, U+DFFFF, U+EFFFE, U+EFFFF, U+FFFFE,
 446 | U+FFFFF, U+10FFFE, or U+10FFFF.
 447 | 
 448 | <p>An <dfn export>ASCII code point</dfn> is a <a>code point</a> in the range U+0000 NULL to
 449 | U+007F DELETE, inclusive.
 450 | 
 451 | <p>An <dfn export lt="ASCII tab or newline|ASCII tabs or newlines">ASCII tab or newline</dfn> is
 452 | U+0009 TAB, U+000A LF, or U+000D CR.
 453 | 
 454 | <p><dfn export>ASCII whitespace</dfn> is U+0009 TAB, U+000A LF, U+000C FF, U+000D CR, or U+0020
 455 | SPACE.
 456 | 
 457 | <p class=note>"Whitespace" is a mass noun.
 458 | 
 459 | <p>A <dfn export>C0 control</dfn> is a <a>code point</a> in the range U+0000 NULL to
 460 | U+001F INFORMATION SEPARATOR ONE, inclusive.
 461 | 
 462 | <p>A <dfn export lt="C0 control or space|C0 controls or spaces">C0 control or space</dfn> is a
 463 | <a>C0 control</a> or U+0020 SPACE.
 464 | 
 465 | <p>A <dfn export>control</dfn> is a <a>C0 control</a> or a <a>code point</a> in the range
 466 | U+007F DELETE to U+009F APPLICATION PROGRAM COMMAND, inclusive.
 467 | 
 468 | <p>An <dfn export>ASCII digit</dfn> is a <a>code point</a> in the range U+0030 (0) to U+0039 (9),
 469 | inclusive.
 470 | 
 471 | <p>An <dfn export>ASCII upper hex digit</dfn> is an <a>ASCII digit</a> or a <a>code point</a> in the
 472 | range U+0041 (A) to U+0046 (F), inclusive.
 473 | 
 474 | <p>An <dfn export>ASCII lower hex digit</dfn> is an <a>ASCII digit</a> or a <a>code point</a> in the
 475 | range U+0061 (a) to U+0066 (f), inclusive.
 476 | 
 477 | <p>An <dfn export>ASCII hex digit</dfn> is an <a>ASCII upper hex digit</a> or
 478 | <a>ASCII lower hex digit</a>.
 479 | 
 480 | <p>An <dfn export>ASCII upper alpha</dfn> is a <a>code point</a> in the range U+0041 (A) to
 481 | U+005A (Z), inclusive.
 482 | 
 483 | <p>An <dfn export>ASCII lower alpha</dfn> is a <a>code point</a> in the range U+0061 (a) to
 484 | U+007A (z), inclusive.
 485 | 
 486 | <p>An <dfn export>ASCII alpha</dfn> is an <a>ASCII upper alpha</a> or <a>ASCII lower alpha</a>.
 487 | 
 488 | <p>An <dfn export>ASCII alphanumeric</dfn> is an <a>ASCII digit</a> or <a>ASCII alpha</a>.
 489 | 
 490 | 
 491 | <h3 id=strings>Strings</h3>
 492 | 
 493 | <p>A <dfn export>JavaScript string</dfn> is a sequence of unsigned 16-bit integers, also known as
 494 | <dfn export lt="code unit">code units</dfn>.
 495 | 
 496 | <p class=note>This is different from how the Unicode Standard defines "code unit". In particular it
 497 | refers exclusively to how the Unicode Standard defines it for Unicode 16-bit strings. [[UNICODE]]
 498 | 
 499 | <p>A <a>JavaScript string</a>'s <dfn export for="JavaScript string">length</dfn> is the number of
 500 | <a>code units</a> it contains.
 501 | 
 502 | <p>A <a>JavaScript string</a> can also be interpreted as containing <a>code points</a>, per the
 503 | conversion defined in <a>The String Type</a> section of the JavaScript specification. [[!ECMA-262]]
 504 | 
 505 | <p class=note>This conversion process converts surrogate pairs into their corresponding
 506 | <a>scalar value</a> and maps isolated surrogates to their corresponding <a>code point</a>, leaving
 507 | them effectively as-is.
 508 | 
 509 | <p class=example id=example-javascript-string-in-code-points>A <a>JavaScript string</a> consisting
 510 | of the <a>code units</a> 0xD83D, 0xDCA9, and 0xD800, when interpreted as containing
 511 | <a>code points</a>, would consist of the <a>code points</a> U+1F4A9 and U+D800.
 512 | 
 513 | <p>A <dfn export>scalar value string</dfn> is a sequence of <a>scalar values</a>.
 514 | 
 515 | <p class=note>A <a>scalar value string</a> is useful for any kind of I/O or other kind of operation
 516 | where <a>UTF-8 encode</a> comes into play.
 517 | <!-- It's also useful if you can imagine the subsystem to be implemented in Rust -->
 518 | 
 519 | <p><dfn export lt=string>String</dfn> can be used to refer to either a <a>JavaScript string</a> or
 520 | <a>scalar value string</a>, when it is clear from the context which is meant or when the distinction
 521 | is immaterial. <a>Strings</a> are denoted by double quotes and monospace font.
 522 | 
 523 | <p class=example id=example-string-notation>"<code>Hello, world!</code>" is a string.
 524 | 
 525 | <p>A <a>string</a>'s <dfn export for=string>length</dfn> is the number of <a>code points</a> it
 526 | contains.
 527 | 
 528 | <p>To <dfn export for="JavaScript string">convert</dfn> a <a>JavaScript string</a> into a
 529 | <a>scalar value string</a>, replace any <a>surrogates</a> with U+FFFD.
 530 | <!-- Obviates need for https://heycam.github.io/webidl/#dfn-obtain-unicode -->
 531 | 
 532 | <p class=note>The replaced surrogates are always isolated surrogates, since the process of
 533 | interpreting the JavaScript string as containing <a>code points</a> will have converted surrogate
 534 | pairs into <a>scalar values</a>.
 535 | 
 536 | <p>A <a>scalar value string</a> can always be used as a <a>JavaScript string</a> implicitly since it
 537 | is a subset. The reverse is only possible if the <a>JavaScript string</a> is known to not contain
 538 | <a>surrogates</a>; otherwise a <a for="JavaScript string" lt=convert>conversion</a> must be
 539 | performed.
 540 | 
 541 | <p class=note>An implementation likely has to perform explicit conversion, depending on how it
 542 | actually ends up representing <a lt="JavaScript string">JavaScript</a> and
 543 | <a>scalar value strings</a>. It is even fairly typical for implementations to have multiple
 544 | implementations of just <a>JavaScript strings</a> for performance and memory reasons.
 545 | 
 546 | <hr>
 547 | 
 548 | <p>To <dfn export>isomorphic encode</dfn> a <a>string</a> <var>input</var>, run these steps:</p>
 549 | 
 550 | <ol>
 551 |  <li><p><a>Assert</a>: <var>input</var> contains no <a>code points</a> greater than U+00FF.
 552 | 
 553 |  <li><p>Return a <a>byte sequence</a> whose <a for="byte sequence">length</a> is equal to
 554 |  <var>input</var>'s <a for=string>length</a> and whose <a>bytes</a> have the same values as
 555 |  <var>input</var>'s <a>code points</a>, in the same order.
 556 | </ol>
 557 | 
 558 | <hr>
 559 | 
 560 | <p>An <dfn export>ASCII string</dfn> is a <a>string</a> whose <a>code points</a> are all
 561 | <a>ASCII code points</a>.
 562 | 
 563 | <p>To <dfn export>ASCII lowercase</dfn> a <a>string</a>, replace all <a>ASCII upper alphas</a> in
 564 | the <a>string</a> with their corresponding <a>code point</a> in <a>ASCII lower alpha</a>.
 565 | 
 566 | <p>To <dfn export>ASCII uppercase</dfn> a <a>string</a>, replace all <a>ASCII lower alphas</a> in
 567 | the <a>string</a> with their corresponding <a>code point</a> in <a>ASCII upper alpha</a>.
 568 | 
 569 | <p>A <a>string</a> <var>A</var> is an <dfn export>ASCII case-insensitive</dfn> match for a
 570 | <a>string</a> <var>B</var>, if the <a>ASCII lowercase</a> of <var>A</var> is the
 571 | <a>ASCII lowercase</a> of <var>B</var>.
 572 | <!-- TODO: define string equals? -->
 573 | 
 574 | <p>To <dfn export>ASCII encode</dfn> a <a>string</a> <var>input</var>, run these steps:
 575 | 
 576 | <ol>
 577 |  <li><p><a>Assert</a>: <var>input</var> is an <a>ASCII string</a>.
 578 | 
 579 |  <p class=note>Note: This precondition ensures that <a>isomorphic encode</a> and
 580 |  <a>UTF-8 encode</a> return the same <a>byte sequence</a> for this input.
 581 | 
 582 |  <li><p>Return the <a>isomorphic encoding</a> of <var>input</var>.
 583 | </ol>
 584 | 
 585 | <p>To <dfn export>ASCII decode</dfn> a <a>byte sequence</a> <var>input</var>, run these steps:
 586 | 
 587 | <ol>
 588 |  <li><p><a>Assert</a>: All bytes in <var>input</var> are <a>ASCII bytes</a>.
 589 | 
 590 |  <p class=note>Note: This precondition ensures that <a>isomorphic decode</a> and
 591 |  <a>UTF-8 decode</a> return the same <a>string</a> for this input.
 592 | 
 593 |  <li><p>Return the <a>isomorphic decoding</a> of <var>input</var>.
 594 | </ol>
 595 | 
 596 | 
 597 | <hr>
 598 | 
 599 | <p>To <dfn export>strip newlines</dfn> from a <a>string</a>, remove any U+000A LF and U+000D CR
 600 | <a>code points</a> from the <a>string</a>.
 601 | 
 602 | <p>To <dfn export>normalize newlines</dfn> in a <a>string</a>, replace every U+000D CR U+000A LF
 603 | <a>code point</a> pair with a single U+000A LF <a>code point</a>, and then replace every remaining
 604 | U+000D CR <a>code point</a> with a U+000A LF <a>code point</a>.
 605 | 
 606 | <p>To <dfn export>strip leading and trailing ASCII whitespace</dfn> from a <a>string</a>, remove all
 607 | <a>ASCII whitespace</a> that is at the start or the end of the <a>string</a>.
 608 | 
 609 | <p>To <dfn export>strip and collapse ASCII whitespace</dfn> in a <a>string</a>, replace any sequence
 610 | of one or more consecutive <a>code points</a> that are <a>ASCII whitespace</a> in the <a>string</a>
 611 | with a single U+0020 SPACE <a>code point</a>, and then remove any leading and trailing
 612 | <a>ASCII whitespace</a> from that string.
 613 | 
 614 | <hr>
 615 | 
 616 | <p>To <dfn export lt="collect a sequence of code points|collecting a sequence of code
 617 | points">collect a sequence of <a>code points</a></dfn> meeting a condition <var>condition</var> from
 618 | a <a>string</a> <var>input</var>, given a <dfn export for="string">position variable</dfn>
 619 | <var>position</var> tracking the position of the calling algorithm within <var>input</var>:</p>
 620 | 
 621 | <ol>
 622 |  <li><p>Let <var>result</var> be the empty <a>string</a>.
 623 | 
 624 |  <li>
 625 |   <p>While <var>position</var> doesn't point past the end of <var>input</var> and the
 626 |   <a>code point</a> at <var>position</var> within <var>input</var> meets the condition
 627 |   <var>condition</var>:
 628 | 
 629 |   <ol>
 630 |    <li><p>Append that <a>code point</a> to the end of <var>result</var>.
 631 | 
 632 |    <li><p>Advance <var>position</var> by 1.
 633 |   </ol>
 634 |  </li>
 635 | 
 636 |  <li><p>Return <var>result</var>.
 637 | </ol>
 638 | 
 639 | <p class=note>In addition to returning the collected <a>code points</a>, this algorithm updates the
 640 | <a>position variable</a> in the calling algorithm.
 641 | 
 642 | <p>To <dfn export>skip ASCII whitespace</dfn> within a <a>string</a> <var>input</var> given a
 643 | <a>position variable</a> <var>position</var>, <a>collect a sequence of code points</a> that are
 644 | <a>ASCII whitespace</a> from <var>input</var> given <var>position</var>. The collected
 645 | <a>code points</a> are not used, but <var>position</var> is still updated.
 646 | 
 647 | <hr>
 648 | 
 649 | <p>To <dfn export lt="strictly split|strictly split a string">strictly split a <a>string</a></dfn>
 650 | <var>input</var> on a particular delimiter <a>code point</a> <var>delimiter</var>:</p>
 651 | 
 652 | <ol>
 653 |  <li><p>Let <var>position</var> be a <a>position variable</a> for <var>input</var>, initially
 654 |  pointing at the start of <var>input</var>.
 655 | 
 656 |  <li><p>Let <var>tokens</var> be a <a>list</a> of <a>strings</a>, initially empty.
 657 | 
 658 |  <li><p>Let <var>token</var> be the result of <a>collecting a sequence of code points</a> that are
 659 |  not equal to <var>delimiter</var> from <var>input</var>, given <var>position</var>.
 660 | 
 661 |  <li><p><a for="list">Append</a> <var>token</var> to <var>tokens</var>.
 662 | 
 663 |  <li>
 664 |   <p>While <var>position</var> is not past the end of <var>input</var>:
 665 | 
 666 |   <ol>
 667 |    <li><p><a>Assert</a>: the <a>code point</a> at <var>position</var> within <var>input</var> is
 668 |    <var>delimiter</var>.
 669 | 
 670 |    <li><p>Advance <var>position</var> by 1.
 671 | 
 672 |    <li><p>Let <var>token</var> be the result of <a>collecting a sequence of code points</a> that are
 673 |    not equal to <var>delimiter</var> from <var>input</var>, given <var>position</var>.
 674 | 
 675 |    <li><p><a for="list">Append</a> <var>token</var> to <var>tokens</var>.
 676 |   </ol>
 677 |  </li>
 678 | 
 679 |  <li><p>Return <var>tokens</var>.
 680 | </ol>
 681 | 
 682 | <p class=note>This algorithm is a "strict" split, as opposed to the commonly-used variants
 683 | <a lt="split on ASCII whitespace">for ASCII whitespace</a> and
 684 | <a lt="split on commas">for commas</a> below, which are both more lenient in various ways involving
 685 | interspersed <a>ASCII whitespace</a>.
 686 | 
 687 | <p>To <dfn export lt="split on ASCII whitespace|split a string on ASCII whitespace">split a
 688 | <a>string</a> <var>input</var> on ASCII whitespace</dfn>:
 689 | 
 690 | <ol>
 691 |  <li><p>Let <var>position</var> be a <a>position variable</a> for <var>input</var>, initially
 692 |  pointing at the start of <var>input</var>.
 693 | 
 694 |  <li><p>Let <var>tokens</var> be a <a>list</a> of <a>strings</a>, initially empty.
 695 | 
 696 |  <li><p><a>Skip ASCII whitespace</a> within <var>input</var> given <var>position</var>.
 697 | 
 698 |  <li>
 699 |   <p>While <var>position</var> is not past the end of <var>input</var>:
 700 | 
 701 |   <ol>
 702 |    <li><p>Let <var>token</var> be the result of <a>collecting a sequence of code points</a> that are
 703 |    not <a>ASCII whitespace</a> from <var>input</var>, given <var>position</var>.
 704 | 
 705 |    <li><p><a for="list">Append</a> <var>token</var> to <var>tokens</var>.
 706 | 
 707 |    <li><p><a>Skip ASCII whitespace</a> within <var>input</var> given <var>position</var>.
 708 |   </ol>
 709 |  </li>
 710 | 
 711 |  <li><p>Return <var>tokens</var>.
 712 | </ol>
 713 | 
 714 | <p>To <dfn export lt="split on commas|split a string on commas">split a <a>string</a>
 715 | <var>input</var> on commas</dfn>:
 716 | 
 717 | <ol>
 718 |  <li><p>Let <var>position</var> be a <a>position variable</a> for <var>input</var>, initially
 719 |  pointing at the start of <var>input</var>.
 720 | 
 721 |  <li><p>Let <var>tokens</var> be a <a>list</a> of <a>strings</a>, initially empty.
 722 | 
 723 |  <li>
 724 |   <p>While <var>position</var> is not past the end of <var>input</var>:
 725 | 
 726 |   <ol>
 727 |    <li>
 728 |     <p>Let <var>token</var> be the result of <a>collecting a sequence of code points</a> that are
 729 |     not U+002C (,) from <var>input</var>, given <var>position</var>.
 730 | 
 731 |     <p class=note><var>token</var> might be the empty string.
 732 |    </li>
 733 | 
 734 |    <li><p><a>Strip leading and trailing ASCII whitespace</a> from <var>token</var>.
 735 | 
 736 |    <li><p><a for="list">Append</a> <var>token</var> to <var>tokens</var>.
 737 | 
 738 |    <li>
 739 |     <p>If <var>position</var> is not past the end of <var>input</var>, then:
 740 | 
 741 |     <ol>
 742 |      <li><p><a>Assert</a>: the <a>code point</a> at <var>position</var> within <var>input</var> is
 743 |      U+002C (,).
 744 | 
 745 |      <li><p>Advance <var>position</var> by 1.
 746 |     </ol>
 747 |    </li>
 748 |   </ol>
 749 |  </li>
 750 | 
 751 |  <li><p>Return <var>tokens</var>.
 752 | </ol>
 753 | 
 754 | <p>To <dfn export for=string lt=concatenate|concatenation>concatenate</dfn> a <a for=/>list</a> of
 755 | <a for=/>strings</a> <var>list</var>, using an optional separator string <var>separator</var>, run
 756 | these steps:
 757 | 
 758 | <ol>
 759 |  <li><p>If <var>list</var> <a for=list>is empty</a>, then return the empty string.
 760 | 
 761 |  <li><p>If <var>separator</var> is not given, then set <var>separator</var> to the empty string.
 762 | 
 763 |  <li><p>Return a <a for=/>string</a> whose contents are <var>list</var>'s <a for=list>items</a>, in
 764 |  order, separated from each other by <var>separator</var>.
 765 | </ol>
 766 | 
 767 | <p class=example id=example-string-concatenate>To serialize a set <var>set</var>, return the
 768 | <a for=string>concatenation</a> of <var>set</var> using U+0020 SPACE.
 769 | 
 770 | 
 771 | <h2 id=data-structures>Data structures</h2>
 772 | 
 773 | <p>Conventionally, specifications have operated on a variety of vague specification-level data
 774 | structures, based on shared understanding of their semantics. This generally works well, but can
 775 | lead to ambiguities around edge cases, such as iteration order or what happens when you
 776 | <a for=set>append</a> an <a for=set>item</a> to an <a>ordered set</a> that the set already
 777 | <a for=set>contains</a>. It has also led to a variety of divergent notation and phrasing, especially
 778 | around more complex data structures such as <a lt="ordered map">maps</a>.
 779 | 
 780 | <p>This standard provides a small set of common data structures, along with notation and phrasing
 781 | for working with them, in order to create common ground.
 782 | 
 783 | 
 784 | <h3 id=lists>Lists</h3>
 785 | 
 786 | <p>A <dfn export>list</dfn> is a specification type consisting of a finite ordered sequence of
 787 | <dfn export for=list,stack,queue,set lt=item>items</dfn>.
 788 | 
 789 | <p>For notational convenience, a literal syntax can be used to express <a>lists</a>, by surrounding
 790 | the list by « » characters and separating its <a for=list>items</a> with a comma. An indexing syntax
 791 | can be used by providing a zero-based index into a list inside square brackets. The index cannot be
 792 | out-of-bounds, except when used with <a for=list>exists</a>.
 793 | 
 794 | <p class=example id=example-list-notation>Let |example| be the <a>list</a> « "<code>a</code>",
 795 | "<code>b</code>", "<code>c</code>", "<code>a</code>" ». Then |example|[1] is the <a>string</a>
 796 | "<code>b</code>".
 797 | 
 798 | <hr>
 799 | 
 800 | <p>To <dfn export for=list>append</dfn> to a <a>list</a> that is not an <a>ordered set</a> is to
 801 | add the given <a for=list>item</a> to the end of the list.
 802 | 
 803 | <p>To <dfn export for=list>prepend</dfn> to a <a>list</a> that is not an <a>ordered set</a> is to
 804 | add the given <a for=list>item</a> to the beginning of the list.
 805 | 
 806 | <p>To <dfn export for=list>replace</dfn> within a <a>list</a> that is not an <a>ordered set</a> is
 807 | to replace all items from the list that match a given condition with the given <a for=list>item</a>,
 808 | or do nothing if none do.
 809 | 
 810 | <p class=note>The above definitions are modified when the <a>list</a> is an <a>ordered set</a>; see
 811 | below for <a for=set lt=append>ordered set append</a>, <a for=set>prepend</a>, and
 812 | <a for=set>replace</a>.
 813 | 
 814 | <p>To <dfn export for=list,set>insert</dfn> an <a for=list>item</a> into a <a>list</a> before an
 815 | index is to add the given item to the list between the given index &minus; 1 and the given index. If
 816 | the given index is 0, then <a for=list>prepend</a> the given item to the list.
 817 | 
 818 | <p>To <dfn export for=list,set>remove</dfn> zero or more <a for=list>items</a> from a <a>list</a> is
 819 | to remove all items from the list that match a given condition, or do nothing if none do.
 820 | 
 821 | <div class=example id=example-list-remove>
 822 |  <p><a for=list>Removing</a> |x| from the <a>list</a> « |x|, |y|, |z|, |x| » is to remove all
 823 |  items from the list that are equal to |x|. The list now is equivalent to « |y|, |z| ».
 824 | 
 825 |  <p><a for=list>Removing</a> all items that start with the <a>string</a> "<code>a</code>" from the
 826 |  <a>list</a> « "<code>a</code>", "<code>b</code>", "<code>ab</code>", "<code>ba</code>" » is to
 827 |  remove the items "<code>a</code>" and "<code>ab</code>". The list is now equivalent to «
 828 |  "<code>b</code>", "<code>ba</code>" ».
 829 | </div>
 830 | 
 831 | <p>To <dfn export for=list,stack,queue,set>empty</dfn> a <a>list</a> is to <a for=list>remove</a>
 832 | all of its <a for=list>items</a>.
 833 | 
 834 | <p>A <a>list</a> <dfn export for=list,stack,queue,set lt=contain|exist>contains</dfn> an
 835 | <a for=list>item</a> if it appears in the list. We can also denote this by saying that, for a
 836 | <a>list</a> |list| and an index |index|, "|list|[|index|] <a for=list>exists</a>".
 837 | 
 838 | <p>A <a>list</a>'s <dfn export for=list,stack,queue,set>size</dfn> is the number of
 839 | <a for=list>items</a> the list <a for=list>contains</a>.
 840 | 
 841 | <p>A <a>list</a> <dfn export for=list,stack,queue,set lt="is empty|is not empty">is empty</dfn> if
 842 | its <a for=list>size</a> is zero.
 843 | 
 844 | <p>To <dfn export for=list,set lt="iterate|for each">iterate</dfn> over a <a>list</a>, performing a
 845 | set of steps on each <a for=list>item</a> in order, use phrasing of the form
 846 | "<a for=list>For each</a> |item| of <var ignore>list</var>", and then operate on |item| in the
 847 | subsequent prose.
 848 | 
 849 | <p>To <dfn export for=list,stack,queue,set>clone</dfn> a <a>list</a> |list| is to create a new
 850 | <a>list</a> |clone|, of the same designation, and, <a for=list>for each</a> |item| of |list|,
 851 | <a for=list>append</a> |item| to |clone|, so that |clone| <a for=list>contains</a> the same
 852 | <a for=list>items</a>, in the same order as |list|.
 853 | 
 854 | Note: This is a "shallow clone", as the <a for=list>items</a> themselves are not cloned in any way.
 855 | 
 856 | <p class=example id=example-list-clone>Let |original| be the <a>ordered set</a> «
 857 | "<code>a</code>", "<code>b</code>", "<code>c</code>" ». <a for=set>Cloning</a> |original| creates
 858 | a new <a>ordered set</a> |clone|, so that <a for=set>replacing</a> "<code>a</code>" with
 859 | "<code>foo</code>" in |clone| gives « "<code>foo</code>", "<code>b</code>", "<code>c</code>" »,
 860 | while |original|[0] is still the <a>string</a> "<code>a</code>".
 861 | 
 862 | <hr>
 863 | 
 864 | <p>The <a>list</a> type originates from the JavaScript specification (where it is capitalized, as
 865 | <a spec=ecma-262>List</a>); we repeat some elements of its definition here for ease of reference,
 866 | and provide an expanded vocabulary for manipulating <a>lists</a>. Whenever JavaScript expects a
 867 | <a spec=ecma-262>List</a>, a <a>list</a> as defined here can be used; they are the same type.
 868 | [[!ECMA-262]]
 869 | 
 870 | <h4 id=stacks>Stacks</h4>
 871 | 
 872 | <p>Some <a>lists</a> are designated as <dfn export lt=stack>stacks</dfn>. A stack is a <a>list</a>,
 873 | but conventionally, the following operations are used to operate on it, instead of using
 874 | <a for=list>append</a>, <a for=list>prepend</a>, or <a for=list>remove</a>.
 875 | 
 876 | <p>To <dfn export for=stack>push</dfn> onto a <a>stack</a> is to <a for=list>append</a> to it.
 877 | 
 878 | <p>To <dfn export for=stack>pop</dfn> from a <a>stack</a> is to <a for=list>remove</a> its last
 879 | <a for=stack>item</a> and return it, if the <a>stack</a> <a for=stack>is not empty</a>, or to return
 880 | nothing otherwise.
 881 | 
 882 | <p>Although <a>stacks</a> are <a>lists</a>, <a for=list>for each</a> must not be used with them;
 883 | instead, a combination of <a>while</a> and <a for=stack>pop</a> is more appropriate.
 884 | 
 885 | <h4 id=queues>Queues</h4>
 886 | 
 887 | <p>Some <a>lists</a> are designated as <dfn export lt=queue>queues</dfn>. A queue is a <a>list</a>,
 888 | but conventionally, the following operations are used to operate on it, instead of using
 889 | <a for=list>append</a>, <a for=list>prepend</a>, or <a for=list>remove</a>.
 890 | 
 891 | <p>To <dfn export for=queue>enqueue</dfn> in a <a>queue</a> is to <a for=list>append</a> to it.
 892 | 
 893 | <p>To <dfn export for=queue>dequeue</dfn> from a <a>queue</a> is to <a for=list>remove</a> its first
 894 | <a for=queue>item</a> and return it, if the <a>queue</a> <a for=queue>is not empty</a>, or to return
 895 | nothing otherwise.
 896 | 
 897 | <p>Although <a>queues</a> are <a>lists</a>, <a for=list>for each</a> must not be used with them;
 898 | instead, a combination of <a>while</a> and <a for=queue>dequeue</a> is more appropriate.
 899 | 
 900 | <h4 id=sets>Sets</h4>
 901 | 
 902 | <p>Some <a>lists</a> are designated as <dfn export lt="ordered set|set">ordered sets</dfn>. An
 903 | ordered set is a <a>list</a> with the additional semantic that it must not contain the same
 904 | <a for=set>item</a> twice.
 905 | 
 906 | <p class=note>Almost all cases on the web platform require an <em>ordered</em> set, instead of an
 907 | unordered one, since interoperability requires that any developer-exposed enumeration of the set's
 908 | contents be consistent between browsers. In those cases where order is not important, we still use
 909 | ordered sets; implementations can optimize based on the fact that the order is not observable.
 910 | 
 911 | <p>To <dfn export for=set>append</dfn> to an <a>ordered set</a> is to do nothing if the set already
 912 | <a for=list>contains</a> the given <a for=set>item</a>, or to perform the normal <a>list</a>
 913 | <a for=list>append</a> operation otherwise.
 914 | 
 915 | <p>To <dfn export for=set>prepend</dfn> to an <a>ordered set</a> is to do nothing if the set already
 916 | <a for=list>contains</a> the given <a for=set>item</a>, or to perform the normal <a>list</a>
 917 | <a for=list>prepend</a> operation otherwise.
 918 | 
 919 | <p>To <dfn export for=set lt=replace|replacing>replace</dfn> within an <a>ordered set</a>
 920 | <var>set</var>, given <var>item</var> and <var>replacement</var>: if <var>set</var>
 921 | <a for=set>contains</a> <var>item</var> or <var>replacement</var>, then replace the first instance
 922 | of either with <var>replacement</var> and <a for=set>remove</a> all other instances.
 923 | 
 924 | <p class=example id=example-set-replace><a for="set">Replacing</a> "a" with "c" within the
 925 | <a>ordered set</a> « "a", "b", "c" » gives « "c", "b" ». Within « "c", "b", "a" » it gives
 926 | « "c", "b" » as well.
 927 | 
 928 | <p>An <a>ordered set</a> |set| is a <dfn export for=set>subset</dfn> of another <a>ordered set</a>
 929 | |superset| (and conversely, |superset| is a <dfn export for=set>superset</dfn> of |set|) if,
 930 | <a for=list>for each</a> |item| of |set|, |superset| <a for=set>contains</a> |item|.
 931 | 
 932 | <p class=note>This implies that an <a>ordered set</a> is both a <a for=set>subset</a> and a
 933 | <a for=set>superset</a> of itself.
 934 | 
 935 | <p>The <dfn export for=set>intersection</dfn> of <a>ordered sets</a> |A| and |B| is the result
 936 | of creating a new <a>ordered set</a> |set| and, <a for=list>for each</a> |item| of |A|, if |B|
 937 | <a for=set>contains</a> |item|, <a for=set>appending</a> |item| to |set|.
 938 | 
 939 | <p>The <dfn export for=set>union</dfn> of <a>ordered sets</a> |A| and |B| is the result of
 940 | <a for=list>cloning</a> |A| as |set| and, <a for=list>for each</a> |item| of |B|,
 941 | <a for=set>appending</a> |item| to |set|.
 942 | 
 943 | <hr>
 944 | 
 945 | <p><dfn export lt="the range">The range</dfn> <var>n</var> to <var>m</var>, inclusive, creates a new
 946 | <a>ordered set</a> containing all of the integers from <var>n</var> up to and including <var>m</var>
 947 | in consecutively increasing order, as long as <var>m</var> is greater than or equal to <var>n</var>.
 948 | 
 949 | <p class=example id=example-the-range><a for=set>For each</a> <var>n</var> of <a>the range</a> 1 to
 950 | 4, inclusive, &hellip;
 951 | 
 952 | 
 953 | <h3 id=maps>Maps</h3>
 954 | 
 955 | <p>An <dfn export lt="ordered map|map">ordered map</dfn>, or sometimes just "map", is a
 956 | specification type consisting of a finite ordered sequence of
 957 | <dfn for=map export>key</dfn>/<dfn for=map export>value</dfn> pairs, with no key appearing twice.
 958 | Each key/value pair is called an <dfn for=map export>entry</dfn>.
 959 | 
 960 | <p class=note>As with <a>ordered sets</a>, by default we assume that maps need to be ordered for
 961 | interoperability among implementations.
 962 | 
 963 | <p>A literal syntax can be used to express <a>ordered maps</a>, by surrounding the ordered map with
 964 | «[ ]» characters, denoting each of its <a for=map>entries</a> as |key| → |value|, and separating its
 965 | entries with a comma. An indexing syntax can be used to look up and set <a for=map>values</a> by
 966 | providing a <a for=map>key</a> inside square brackets.
 967 | 
 968 | <p class=example id=example-map-notation>Let |example| be the <a>ordered map</a> «[
 969 | "<code>a</code>" → `<code>x</code>`, "<code>b</code>" → `<code>y</code>` ]». Then
 970 | |example|["<code>a</code>"] is the <a>byte sequence</a> `<code>x</code>`.
 971 | 
 972 | <hr>
 973 | 
 974 | <p>To <dfn export for=map lt="get|get the value">get the value of an entry</dfn> in an
 975 | <a>ordered map</a> given a <a for=map>key</a> is to retrieve the <a for=map>value</a> of any
 976 | existing <a for=map>entry</a> if the map <a for=map>contains</a> an entry with the given key, or
 977 | to return nothing otherwise. We can also use the indexing syntax explained above.
 978 | 
 979 | <p>To <dfn export for=map lt="set|set the value">set the value of an entry</dfn> in an
 980 | <a>ordered map</a> to a given <a for=map>value</a> is to update the value of any existing
 981 | <a for=map>entry</a> if the map <a for=map>contains</a> an entry with the given <a for=map>key</a>,
 982 | or if none such exists, to add a new entry with the given key/value to the end of the map. We can
 983 | also denote this by saying, for an <a>ordered map</a> |map|, key |key|, and value |value|,
 984 | "<a for=map>set</a> |map|[|key|] to |value|".
 985 | 
 986 | <p>To <dfn export for=map lt=remove>remove an entry</dfn> from an <a>ordered map</a> is to remove
 987 | all <a for=map>entries</a> from the map that match a given condition, or do nothing if none do. If
 988 | the condition is having a certain <a for=map>key</a>, then we can also denote this by saying, for
 989 | an <a>ordered map</a> |map| and key |key|, "<a for=map>remove</a> |map|[|key|]".
 990 | 
 991 | <p>An <a>ordered map</a> <dfn export for=map lt=exist|contain id=map-exists>contains an
 992 | <a for=map>entry</a> with a given key</dfn> if there exists an entry with that <a for=map>key</a>.
 993 | We can also denote this by saying that, for an <a>ordered map</a> |map| and key |key|, "|map|[|key|]
 994 | <a for=map>exists</a>".
 995 | 
 996 | <p>To <dfn export for=map lt="getting the keys|get the keys">get the keys</dfn> of an
 997 | <a>ordered map</a>, return a new <a>ordered set</a> whose <a for=set>items</a> are each of the
 998 | <a for=map>keys</a> in the map's <a for=map>entries</a>.
 999 | 
1000 | <p>To <dfn export for=map lt="getting the values|get the values">get the values</dfn> of an
1001 | <a>ordered map</a>, return a new <a>list</a> whose <a for=list>items</a> are each of the
1002 | <a for=map>values</a> in the map's <a for=map>entries</a>.
1003 | 
1004 | <p>An <a>ordered map</a>'s <dfn export for=map>size</dfn> is the <a for=set>size</a> of the result
1005 | of running <a for=map>get the keys</a> on the map.
1006 | 
1007 | <p>An <a>ordered map</a> <dfn export for=map lt="is empty|is not empty">is empty</dfn> if its
1008 | <a for=map>size</a> is zero.
1009 | 
1010 | <p>To <dfn export for=map lt="iterate|for each">iterate</dfn> over an <a>ordered map</a>, performing
1011 | a set of steps on each <a for=map>entry</a> in order, use phrasing of the form
1012 | "<a for=map>For each</a> |key| → |value| of |map|", and then operate on |key| and |value| in the
1013 | subsequent prose.
1014 | 
1015 | 
1016 | <h3 id=structs>Structs</h3>
1017 | 
1018 | <p>A <dfn export>struct</dfn> is a specification type consisting of a finite set of
1019 | <dfn export for=struct,tuple,pair lt=item>items</dfn>, each of which has a unique and immutable
1020 | <dfn export for=struct,tuple,pair>name</dfn>.
1021 | 
1022 | <hr>
1023 | 
1024 | <p><a>Structs</a> with a defined order are also known as <dfn export lt=tuple>tuples</dfn>. For
1025 | notational convenience, a literal syntax can be used to express <a>tuples</a>, by surrounding the
1026 | tuple with parentheses and separating its <a for=tuple>items</a> with a comma. To use this notation,
1027 | the <a for=tuple>names</a> need to be clear from context. This can be done by preceding the first
1028 | instance with the name given to the <a>tuple</a>.
1029 | 
1030 | <div class=example id=example-tuple>
1031 |  <!-- If https://github.com/tabatkins/bikeshed/issues/960 gets fixed we can show how to use <dfn>
1032 |  and <a> on these -->
1033 |  <p>A status is an example <a>tuple</a> consisting of a code (a three-digit number) and text (a byte
1034 |  sequence).
1035 | 
1036 |  <p>A nonsense algorithm that manipulates status tuples for the purpose of demonstrating their
1037 |  usage is then:</p>
1038 | 
1039 |  <ol>
1040 |   <li>Let |statusInstance| be the status (200, `<code>OK</code>`).
1041 |   <li>Set |statusInstance| to (301, `<code>FOO BAR</code>`).
1042 |   <li>If |statusInstance|'s code is 404, then &hellip;
1043 |  </ol>
1044 | </div>
1045 | 
1046 | <p class=note>It is intentional that not all <a>structs</a> are <a>tuples</a>. Documents using the
1047 | Infra Standard might need the flexibility to add new <a for=struct>names</a> to their struct
1048 | without breaking literal syntax used by their dependencies. In that case a tuple is not appropriate.
1049 | 
1050 | <hr>
1051 | 
1052 | <p><a>Tuples</a> with two <a for=tuple>items</a> are also known as <dfn export lt=pair>pairs</dfn>.
1053 | For <a>pairs</a>, a slightly shorter literal syntax can be used, separating the two
1054 | <a for=pair>items</a> with a / character.
1055 | 
1056 | <p class=example id=example-pair>Another way of expressing our |statusInstance| tuple above would be
1057 | as 200/`<code>OK</code>`.
1058 | 
1059 | 
1060 | <h2 id=json>JSON</h2>
1061 | 
1062 | <p>To <dfn export>parse JSON from bytes</dfn> given <var>bytes</var>, run these steps:
1063 | 
1064 | <ol>
1065 |  <li><p>Let <var>jsonText</var> be the result of running <a>UTF-8 decode</a> on <var>bytes</var>.
1066 |  [[!ENCODING]]
1067 | 
1068 |  <li>
1069 |   <p>Return ? <a abstract-op>Call</a>(<a>%JSONParse%</a>, undefined, « <var>jsonText</var> »).
1070 |   [[!ECMA-262]]
1071 | 
1072 |   <p class=note>The conventions used in this step are those of the JavaScript specification.
1073 | 
1074 | </ol>
1075 | 
1076 | <p>To <dfn export>serialize JSON to bytes</dfn> a given JavaScript value <var>value</var>, run these
1077 | steps:
1078 | 
1079 | <ol>
1080 |  <li>
1081 |   <p>Let <var>jsonString</var> be the result of
1082 |   ? <a abstract-op>Call</a>(<a>%JSONStringify%</a>, undefined, « <var>value</var> »).
1083 |   [[!ECMA-262]]
1084 |   <p class=note>The conventions used in this step are those of the JavaScript specification.
1085 |     Also, since no additional arguments are passed to <a>%JSONStringify%</a>, the resulting string
1086 |     will have no whitespace inserted.
1087 | 
1088 |  <li><p>Return the result of running <a>UTF-8 encode</a> on <var>jsonString</var>. [[!ENCODING]]
1089 | </ol>
1090 | 
1091 | 
1092 | <h2 id=forgiving-base64>Forgiving base64</h2>
1093 | 
1094 | <p>To <dfn export>forgiving-base64 encode</dfn> given a <a>byte sequence</a> <var>data</var>, apply
1095 | the base64 algorithm defined in section 4 of RFC 4648 to <var>data</var> and return the result.
1096 | [[!RFC4648]]
1097 | 
1098 | <p class="note no-backref">This is named <a>forgiving-base64 encode</a> for symmetry with
1099 | <a>forgiving-base64 decode</a>, which is different from the RFC as it defines error handling for
1100 | certain inputs.
1101 | 
1102 | <p>To <dfn export>forgiving-base64 decode</dfn> given a string <var>data</var>, run these steps:</p>
1103 | 
1104 | <ol>
1105 |  <li><p>Remove all <a>ASCII whitespace</a> from <var>data</var>.
1106 |  <!-- https://lists.w3.org/Archives/Public/public-whatwg-archive/2011May/0207.html -->
1107 | 
1108 |  <li>
1109 |   <p>If <var>data</var>'s <a for=string>length</a> divides by 4 leaving no remainder, then:
1110 | 
1111 |   <ol>
1112 |    <li><p>If <var>data</var> ends with one or two U+003D (=) <a>code points</a>, then remove them
1113 |    from <var>data</var>.
1114 |   </ol>
1115 | 
1116 |  <li><p>If <var>data</var>'s <a for=string>length</a> divides by 4 leaving a remainder of 1, then
1117 |  return failure.
1118 | 
1119 |  <li>
1120 |   <p>If <var>data</var> contains a <a>code point</a> that is not one of
1121 | 
1122 |   <ul class="brief">
1123 |    <li>U+002B (+)
1124 |    <li>U+002F (/)
1125 |    <li><a>ASCII alphanumeric</a>
1126 |   </ul>
1127 | 
1128 |   <p>then return failure.
1129 | 
1130 |  <li><p>Let <var>output</var> be an empty <a>byte sequence</a>.
1131 | 
1132 |  <li><p>Let <var>buffer</var> be an empty buffer that can have bits appended to it.
1133 | 
1134 |  <li><p>Let <var>position</var> be a <a>position variable</a> for <var>data</var>, initially
1135 |  pointing at the start of <var>data</var>.
1136 | 
1137 |  <li>
1138 |   <p>While <var>position</var> does not point past the end of <var>data</var>:
1139 | 
1140 |   <ol>
1141 |    <li><p>Find the <a>code point</a> pointed to by <var>position</var> in the second column of
1142 |    Table 1: The Base 64 Alphabet of RFC 4648. Let <var>n</var> be the number given in the first cell
1143 |    of the same row. [[!RFC4648]]
1144 | 
1145 |    <li><p>Append the six bits corresponding to <var>n</var>, most significant bit first, to
1146 |    <var>buffer</var>.
1147 | 
1148 |    <li><p>If <var>buffer</var> has accumulated 24 bits, interpret them as three 8-bit big-endian
1149 |    numbers. Append three bytes with values equal to those numbers to <var>output</var>, in the same
1150 |    order, and then empty <var>buffer</var>.
1151 | 
1152 |    <li><p>Advance <var>position</var> by 1.
1153 |   </ol>
1154 | 
1155 |  <li>
1156 |   <p>If <var>buffer</var> is not empty, it contains either 12 or 18 bits. If it contains 12 bits,
1157 |   then discard the last four and interpret the remaining eight as an 8-bit big-endian number. If it
1158 |   contains 18 bits, then discard the last two and interpret the remaining 16 as two 8-bit big-endian
1159 |   numbers. Append the one or two bytes with values equal to those one or two numbers to
1160 |   <var>output</var>, in the same order.</p>
1161 | 
1162 |   <p class="note">The discarded bits mean that, for instance, "<code>YQ</code>" and
1163 |   "<code>YR</code>" both return `<code>a</code>`.
1164 | 
1165 |  <li><p>Return <var>output</var>.
1166 | </ol>
1167 | 
1168 | 
1169 | <h2 id=namespaces>Namespaces</h2>
1170 | 
1171 | <p>The <dfn export>HTML namespace</dfn> is "<code>http://www.w3.org/1999/xhtml</code>".
1172 | 
1173 | <p>The <dfn export>MathML namespace</dfn> is "<code>http://www.w3.org/1998/Math/MathML</code>".
1174 | 
1175 | <p>The <dfn export>SVG namespace</dfn> is "<code>http://www.w3.org/2000/svg</code>".
1176 | 
1177 | <p>The <dfn export>XLink namespace</dfn> is "<code>http://www.w3.org/1999/xlink</code>".
1178 | 
1179 | <p>The <dfn export>XML namespace</dfn> is "<code>http://www.w3.org/XML/1998/namespace</code>".
1180 | 
1181 | <p>The <dfn export>XMLNS namespace</dfn> is "<code>http://www.w3.org/2000/xmlns/</code>".
1182 | 
1183 | 
1184 | <h2 class=no-num id=acknowledgments>Acknowledgments</h2>
1185 | 
1186 | <p>Many thanks to
1187 | Addison Phillips,
1188 | Aryeh Gregor,
1189 | Chris Rebert,
1190 | Daniel Ehrenberg,
1191 | Dominic Farolino,
1192 | Jake Archibald,
1193 | Jeff Hodges,
1194 | Jungkee Song,
1195 | Leonid Vasilyev,
1196 | Malika Aubakirova,
1197 | Michael™ Smith,
1198 | Mike West,
1199 | Ms2ger,
1200 | Philip Jägenstedt,
1201 | Rashaun "Snuggs" Stovall,
1202 | Sergey Shekyan,
1203 | Simon Pieters,
1204 | Tab Atkins,
1205 | Tobie Langel,
1206 | triple-underscore,
1207 | and Xue Fuqiao
1208 | for being awesome!
1209 | 
1210 | <p>This standard is written by <a lang=nl href=https://annevankesteren.nl/>Anne van Kesteren</a>
1211 | (<a href=https://www.mozilla.org/>Mozilla</a>,
1212 | <a href=mailto:annevk@annevk.nl>annevk@annevk.nl</a>) and
1213 | <a href=https://domenic.me/>Domenic Denicola</a> (<a href=https://www.google.com/>Google</a>,
1214 | <a href=mailto:d@domenic.me>d@domenic.me</a>).
1215 | 


--------------------------------------------------------------------------------
/review-drafts/2019-07.bs:
--------------------------------------------------------------------------------
   1 | <pre class='metadata'>
   2 | Group: WHATWG
   3 | Date: 2019-07-16
   4 | H1: Infra
   5 | Shortname: infra
   6 | Text Macro: TWITTER infrastandard
   7 | Abstract: The Infra Standard aims to define the fundamental concepts upon which standards are built.
   8 | Translation: ja https://triple-underscore.github.io/infra-ja.html
   9 | </pre>
  10 | 
  11 | <pre class="anchors">
  12 | urlPrefix: https://tc39.github.io/ecma262/#; spec: ECMA-262;
  13 |     type: dfn
  14 |         text: %JSONParse%; url: sec-json.parse
  15 |         text: %JSONStringify%; url: sec-json.stringify
  16 |         text: List; url: sec-list-and-record-specification-type
  17 |         text: The String Type; url: sec-ecmascript-language-types-string-type
  18 |         text: realm; url: realm
  19 |     type: method; for: Array; text: sort(); url: sec-array.prototype.sort
  20 |     type: abstract-op;
  21 |         text: Call; url: sec-call
  22 |         text: Get; url: sec-get-o-p
  23 |         text: IsArray; url: sec-isarray
  24 |         text: ToLength; url: sec-tolength
  25 |         text: ToString; url: sec-tostring
  26 |         text: Type; url: sec-ecmascript-data-types-and-values
  27 | </pre>
  28 | 
  29 | 
  30 | <h2 id=goals class=no-num>Goals</h2>
  31 | 
  32 | <ul>
  33 |  <li><p>Deduplicate boilerplate in standards.
  34 | 
  35 |  <li><p>Align standards on conventions, terminology, and data structures.
  36 | 
  37 |  <li><p>Be a place for concepts used by multiple standards without a good home.
  38 | 
  39 |  <li><p>Help write clear and readable algorithmic prose by clarifying otherwise ambiguous concepts.
  40 | </ul>
  41 | 
  42 | <p>Suggestions for more goals are welcome.</p>
  43 | 
  44 | 
  45 | <h2 id=usage>Usage</h2>
  46 | 
  47 | <p>To make use of the Infra Standard in a document titled <var>X</var>, use
  48 | <samp><var>X</var> depends on the Infra Standard</samp>. Additionally, cross-referencing terminology
  49 | is encouraged to avoid ambiguity.
  50 | 
  51 | <p>Specification authors are also encouraged to add their specification to the
  52 | <a href=https://github.com/whatwg/infra/wiki/Dependent-specs>list of dependent specifications</a> in
  53 | order to help the editors ensure that any future breaking changes to the Infra Standard are
  54 | correctly reflected by any such dependencies.
  55 | 
  56 | 
  57 | <h2 id=conventions>Conventions</h2>
  58 | 
  59 | <h3 id=conformance>Conformance</h3>
  60 | 
  61 | <p>All assertions, diagrams, examples, and notes are non-normative, as are all sections explicitly
  62 | marked non-normative. Everything else is normative.
  63 | 
  64 | <p>The keywords "MUST", "MUST NOT", "REQUIRED", "SHALL", "SHALL NOT", "SHOULD", "SHOULD NOT",
  65 | "RECOMMENDED", "NOT RECOMMENDED", "MAY", and "OPTIONAL" are to be interpreted as described in
  66 | RFC 2119. [[!RFC2119]]
  67 | 
  68 | <p>These keywords have equivalent meaning when written in lowercase and cannot appear in
  69 | non-normative content.
  70 | 
  71 | <p class=note>This is a <a>willful violation</a> of RFC 8174, motivated by legibility and a desire
  72 | to preserve long-standing practice in many non-IETF-published pre-RFC 8174 documents. [[RFC8174]]
  73 | 
  74 | <p>All of the above is applicable to both this standard and any document that uses this standard.
  75 | Documents using this standard are encouraged to limit themselves to "must", "must not", "should",
  76 | and "may", and to use these in their lowercase form as that is generally considered to be more
  77 | readable.
  78 | 
  79 | <p>For non-normative content "strongly encouraged", "strongly discouraged", "encouraged",
  80 | "discouraged", "can", "cannot", "could", "could not", "might", and "might not" can be used instead.
  81 | 
  82 | 
  83 | <h3 id=other-specs>Compliance with other specifications</h3>
  84 | 
  85 | <p>In general, specifications interact with and rely on a wide variety of other specifications. In
  86 | certain circumstances, unfortunately, conflicting needs require a specification to violate the
  87 | requirements of other specifications. When this occurs, a document using the Infra Standard should
  88 | denote such transgressions as a <dfn export>willful violation</dfn>, and note the reason for that
  89 | violation.
  90 | 
  91 | <p class=example id=example-willful-violation>The previous section, [[#conformance]], documents a
  92 | <a>willful violation</a> of RFC 8174 committed by the Infra Standard.
  93 | 
  94 | 
  95 | <h3 id=terminology>Terminology</h3>
  96 | 
  97 | <p>The word "or", in cases where both inclusive "or" and exclusive "or" are possible (e.g., "if
  98 | either width or height is zero"), means an inclusive "or" (implying "or both"), unless it is called
  99 | out as being exclusive (with "but not both").
 100 | 
 101 | 
 102 | <h2 id=algorithms>Algorithms</h2>
 103 | 
 104 | <p>Algorithms, and requirements phrased in the imperative as part of algorithms (such as "strip any
 105 | leading spaces" or "return false") are to be interpreted with the meaning of the keyword (e.g.,
 106 | "must") used in introducing the algorithm or step. If no such keyword is used, must is implied.
 107 | 
 108 | <div class=example id=example-algorithms>
 109 |  <p>For example, were the spec to say:</p>
 110 | 
 111 |  <blockquote>
 112 |   <p class=allow-2119>To eat an orange, the user must:
 113 | 
 114 |   <ol class=brief>
 115 |    <li>Peel the orange.
 116 |    <li>Separate each slice of the orange.
 117 |    <li>Eat the orange slices.
 118 |   </ol>
 119 |  </blockquote>
 120 | 
 121 |  <p>it would be equivalent to the following:</p>
 122 | 
 123 |  <blockquote>
 124 |   <p>To eat an orange:
 125 | 
 126 |   <ol class=brief>
 127 |    <li class=allow-2119>The user must peel the orange.
 128 |    <li class=allow-2119>The user must separate each slice of the orange.
 129 |    <li class=allow-2119>The user must eat the orange slices.
 130 |   </ol>
 131 |  </blockquote>
 132 | 
 133 |  <p class=allow-2119>Here the key word is "must".</p>
 134 | 
 135 |  <p class=allow-2119>Modifying the above example, if the algorithm was introduced only with "To eat
 136 |  an orange:", it would still have the same meaning, as "must" is implied.
 137 | </div>
 138 | 
 139 | <p>Conformance requirements phrased as algorithms or specific steps may be implemented in any
 140 | manner, so long as the end result is equivalent. (In particular, the algorithms are intended to be
 141 | easy to follow, and not intended to be performant.)
 142 | 
 143 | <p class=note>Performance is tricky to get correct as it is influenced by user perception, computer
 144 | architectures, and different types of input that can change over time in how common they are. For
 145 | instance, a JavaScript engine likely has many different code paths for what is standardized as a
 146 | single algorithm, in order to optimize for speed or memory consumption. Standardizing all those code
 147 | paths would be an insurmountable task and not productive as they would not stand the test of time
 148 | as well as the single algorithm would. Therefore performance is best left as a field to compete
 149 | over.
 150 | 
 151 | 
 152 | <h3 id=variables>Variables</h3>
 153 | 
 154 | <p>A variable is declared with "let" and changed with "set".
 155 | 
 156 | <p class=example id=example-variable>Let |list| be a new <a>list</a>.</p>
 157 | 
 158 | <div class=example id=example-variable-null>
 159 |  <ol>
 160 |   <li><p>Let |value| be null.
 161 | 
 162 |   <li><p>If |input| is a <a>string</a>, then set |value| to |input|.
 163 | 
 164 |   <li><p>Otherwise, set |value| to |input|, <a>UTF-8 decoded</a>.
 165 | 
 166 |   <li><p><a>Assert</a>: |value| is a <a>string</a>.
 167 |  </ol>
 168 | </div>
 169 | 
 170 | <p class=example id=example-variable-ternary>Let <var ignore>activationTarget</var> be
 171 | <var ignore>target</var> if <var ignore>isActivationEvent</var> is true and target has activation
 172 | behavior; otherwise null.
 173 | 
 174 | <p>Variables must not be used before they are declared. Variables are
 175 | <a href=https://en.wikipedia.org/wiki/Scope_(computer_science)#Block_scope>block scoped</a>.
 176 | Variables must not be declared more than once per algorithm.
 177 | 
 178 | 
 179 | <h3 id=algorithm-control-flow>Control flow</h3>
 180 | 
 181 | <p>The control flow of algorithms is such that a requirement to "return" or "throw" terminates the
 182 | algorithm the statement was in. "Return" will hand the given value, if any, to its caller. "Throw"
 183 | will make the caller automatically rethrow the given value, if any, and thereby terminate the
 184 | caller's algorithm. Using prose, the caller has the ability to "catch" the exception and perform
 185 | another action.
 186 | 
 187 | 
 188 | <h3 id=algorithm-conditional-abort>Conditional abort</h3>
 189 | 
 190 | <p>Sometimes it is useful to stop performing a series of steps once a condition becomes true.
 191 | 
 192 | <p>To do this, state that a given series of steps will <dfn export>abort when</dfn> a specific
 193 | <var>condition</var> is reached. This indicates that the specified steps must be evaluated, not
 194 | as-written, but by additionally inserting a step before each of them that evaluates
 195 | <var>condition</var>, and if <var>condition</var> evaluates to true, skips the remaining steps.
 196 | 
 197 | <p>In such algorithms, the subsequent step can be annotated to run <dfn export>if aborted</dfn>, in
 198 | which case it must run if any of the preceding steps were skipped due to the <var>condition</var>
 199 | of the preceding <a>abort when</a> step evaluating to true.
 200 | 
 201 | <div class=example id=example-conditional-abort>
 202 |  <p>The following algorithm
 203 | 
 204 |  <ol>
 205 |   <li><p>Let |result| be an empty <a>list</a>.
 206 | 
 207 |   <li>
 208 |    <p>Run these steps, but <a>abort when</a> the user clicks the "Cancel" button:
 209 | 
 210 |    <ol>
 211 |     <li><p>Compute the first million digits of <var>π</var>, and <a for=list>append</a> the result
 212 |     to |result|.
 213 | 
 214 |     <li><p>Compute the first million digits of |e|, and <a for=list>append</a> the result to
 215 |     |result|.
 216 | 
 217 |     <li><p>Compute the first million digits of <var>φ</var>, and <a for=list>append</a> the result
 218 |     to |result|.
 219 |    </ol>
 220 |   </li>
 221 | 
 222 |   <li><p><a>If aborted</a>, <a for=list>append</a> "<code>Didn't finish!</code>" to |result|.
 223 |  </ol>
 224 | 
 225 |  <p>is equivalent to the more verbose formulation</p>
 226 | 
 227 |  <ol>
 228 |   <li><p>Let |result| be an empty <a>list</a>.
 229 | 
 230 |   <li>
 231 |    <p>If the user has not clicked the "Cancel" button, then:
 232 | 
 233 |    <ol>
 234 |     <li><p>Compute the first million digits of <var>π</var>, and <a for=list>append</a> the result
 235 |     to |result|.
 236 | 
 237 |     <li>
 238 |      <p>If the user has not clicked the "Cancel" button, then:
 239 | 
 240 |      <ol>
 241 |       <li><p>Compute the first million digits of |e|, and <a for=list>append</a> the result to
 242 |       |result|.
 243 | 
 244 |       <li><p>If the user has not clicked the "Cancel" button, then compute the first million digits
 245 |       of <var>φ</var>, and <a for=list>append</a> the result to |result|.
 246 |      </ol>
 247 |    </ol>
 248 | 
 249 |   <li><p>If the user clicked the "Cancel" button, then <a for=list>append</a>
 250 |   "<code>Didn't finish!</code>" to |result|.
 251 |  </ol>
 252 | </div>
 253 | 
 254 | <p class=note>Whenever this construct is used, implementations are allowed to evaluate
 255 | <var>condition</var> during the specified steps rather than before and after each step, as long as
 256 | the end result is indistinguishable. For instance, as long as |result| in the above example is not
 257 | mutated during a compute operation, the user agent could stop the computation.
 258 | 
 259 | 
 260 | <h3 id=algorithm-iteration>Iteration</h3>
 261 | 
 262 | <p>There's a variety of ways to repeat a set of steps until a condition is reached.
 263 | 
 264 | <p class=note>The Infra Standard is not (yet) exhaustive on this; please file an issue if you need
 265 | something.
 266 | 
 267 | <dl>
 268 |  <dt>For each
 269 |  <dd><p>As defined <a for=list lt="for each">for lists</a> (and derivatives) and
 270 |  <a for=map lt="for each">maps</a>.
 271 | 
 272 |  <dt><dfn export for=iteration lt=while>While</dfn>
 273 |  <dd>
 274 |   <p>An instruction to repeat a set of steps as long as a condition is met.
 275 | 
 276 |   <div class=example id=example-while>
 277 |    <p>While |condition| is "<code>met</code>":
 278 | 
 279 |    <ol>
 280 |     <li><p>&hellip;
 281 |    </ol>
 282 |   </div>
 283 | </dl>
 284 | 
 285 | <p>An iteration's flow can be controlled via requirements to
 286 | <dfn export for=iteration>continue</dfn> or <dfn export for=iteration>break</dfn>.
 287 | <a for=iteration>Continue</a> will skip over any remaining steps in an iteration, proceeding to the
 288 | next item. If no further items remain, the iteration will stop. <a for=iteration>Break</a> will skip
 289 | over any remaining steps in an iteration, and skip over any remaining items as well, stopping the
 290 | iteration.
 291 | 
 292 | <div class=example id=example-break-continue>
 293 |  <p>Let |example| be the <a>list</a> « 1, 2, 3, 4 ». The following prose would perform |operation|
 294 |  upon 1, then 2, then 3, then 4:
 295 | 
 296 |  <ol>
 297 |   <li>
 298 |    <p><a for=list>For each</a> |item| of |example|:
 299 |    <ol>
 300 |     <li>Perform |operation| on |item|.
 301 |    </ol>
 302 |   </li>
 303 |  </ol>
 304 | 
 305 |  <p>The following prose would perform |operation| upon 1, then 2, then 4. 3 would be skipped.
 306 | 
 307 |  <ol>
 308 |   <li>
 309 |    <p><a for=list>For each</a> |item| of |example|:
 310 |    <ol>
 311 |     <li>If |item| is 3, then <a for=iteration>continue</a>.
 312 |     <li>Perform |operation| on |item|.
 313 |    </ol>
 314 |   </li>
 315 |  </ol>
 316 | 
 317 |  <p>The following prose would perform |operation| upon 1, then 2. 3 and 4 would be skipped.
 318 | 
 319 |  <ol>
 320 |   <li>
 321 |    <p><a for=list>For each</a> |item| of |example|:
 322 |    <ol>
 323 |     <li>If |item| is 3, then <a for=iteration>break</a>.
 324 |     <li>Perform |operation| on |item|.
 325 |    </ol>
 326 |   </li>
 327 |  </ol>
 328 | </div>
 329 | 
 330 | 
 331 | <h3 id=assertions>Assertions</h3>
 332 | 
 333 | <p>To improve readability, it can sometimes help to add assertions to algorithms, stating
 334 | invariants. To do this, write "<dfn export>Assert</dfn>:", followed by a statement that must be
 335 | true. If the statement ends up being false that indicates an issue with the document using the Infra
 336 | Standard that should be reported and addressed.
 337 | 
 338 | <p class=note>Since the statement can only ever be true, it has no implications for implementations.
 339 | 
 340 | <div class=example id=example-assert>
 341 |  <ol>
 342 |   <li><p>Let |x| be "<code>Aperture Science</code>".
 343 |   <li><p><a>Assert</a>: |x| is "<code>Aperture Science</code>".
 344 | </div>
 345 | 
 346 | 
 347 | <h2 id=primitive-data-types>Primitive data types</h2>
 348 | 
 349 | <h3 id=nulls>Nulls</h3>
 350 | 
 351 | <p>The value null is used to indicate the lack of a value. It can be used interchangeably with the
 352 | JavaScript <b>null</b> value. [[!ECMA-262]]
 353 | 
 354 | <p class=example id=example-null>Let <var ignore>element</var> be null.
 355 | 
 356 | <p class=example id=example-null-return>If <var>input</var> is the empty string, then return null.
 357 | 
 358 | 
 359 | <h3 id=booleans>Booleans</h3>
 360 | 
 361 | <p>A <dfn export>boolean</dfn> is either true or false.
 362 | 
 363 | <p class=example id=example-boolean>Let <var ignore>elementSeen</var> be false.
 364 | 
 365 | 
 366 | <h3 id=bytes>Bytes</h3>
 367 | 
 368 | <p>A <dfn export>byte</dfn> is a sequence of eight bits, represented as a double-digit hexadecimal
 369 | number in the range 0x00 to 0xFF, inclusive.
 370 | 
 371 | <p>An <dfn export>ASCII byte</dfn> is a <a>byte</a> in the range 0x00 (NUL) to 0x7F (DEL),
 372 | inclusive. As illustrated, an <a>ASCII byte</a>, excluding 0x28 and 0x29, may be followed by the
 373 | representation outlined in the <a href=https://tools.ietf.org/html/rfc20#section-2>Standard Code</a>
 374 | section of <cite>ASCII format for Network Interchange</cite>, between parentheses. [[!RFC20]]
 375 | 
 376 | <p>0x28 may be followed by "(left parenthesis)" and 0x29 by "(right parenthesis)".
 377 | 
 378 | <p class=example id=example-byte-notation>0x49 (I) when <a>UTF-8 decoded</a> becomes the
 379 | <a>code point</a> U+0049 (I).
 380 | 
 381 | 
 382 | <h3 id=byte-sequences>Byte sequences</h3>
 383 | 
 384 | <p>A <dfn export>byte sequence</dfn> is a sequence of <a>bytes</a>, represented as a space-separated
 385 | sequence of bytes. Byte sequences with bytes in the range 0x20 (SP) to 0x7E (~), inclusive, can
 386 | alternately be written as a string, but using backticks instead of quotation marks, to avoid
 387 | confusion with an actual <a>string</a>.
 388 | 
 389 | <div class=example id=example-byte-sequence-notation>
 390 |  <p>0x48 0x49 can also be represented as `<code>HI</code>`.
 391 | 
 392 |  <p>Headers, such as `<code>Content-Type</code>`, are <a>byte sequences</a>.
 393 | </div>
 394 | 
 395 | <p class=note>To get a <a>byte sequence</a> out of a <a>string</a>, using <a>UTF-8 encode</a> from
 396 | the Encoding Standard is encouraged. In rare circumstances <a>isomorphic encode</a> might be needed.
 397 | [[ENCODING]]
 398 | 
 399 | <p>A <a>byte sequence</a>'s <dfn export for="byte sequence">length</dfn> is the number of
 400 | <a>bytes</a> it contains.
 401 | 
 402 | <p>To <dfn export>byte-lowercase</dfn> a <a>byte sequence</a>, increase each <a>byte</a> it
 403 | contains, in the range 0x41 (A) to 0x5A (Z), inclusive, by 0x20.
 404 | 
 405 | <p>To <dfn export>byte-uppercase</dfn> a <a>byte sequence</a>, decrease each <a>byte</a> it
 406 | contains, in the range 0x61 (a) to 0x7A (z), inclusive, by 0x20.
 407 | 
 408 | <p>A <a>byte sequence</a> <var>A</var> is a <dfn export>byte-case-insensitive</dfn> match for a
 409 | <a>byte sequence</a> <var>B</var>, if the <a>byte-lowercase</a> of <var>A</var> is the
 410 | <a>byte-lowercase</a> of <var>B</var>.
 411 | 
 412 | <hr>
 413 | 
 414 | <p>A <a>byte sequence</a> <var>a</var> <dfn export for="byte sequence">starts with</dfn> a
 415 | <a>byte sequence</a> <var>b</var> if the following steps return true:
 416 | 
 417 | <ol>
 418 |  <li><p>Let <var>i</var> be 0.
 419 | 
 420 |  <li>
 421 |   <p><a>While</a> true:
 422 | 
 423 |   <ol>
 424 |    <li><p>Let <var>aByte</var> be the <var>i</var>th <a>byte</a> of <var>a</var> if <var>i</var> is
 425 |    less than <var>a</var>'s <a for="byte sequence">length</a>; otherwise null.
 426 | 
 427 |    <li><p>Let <var>bByte</var> be the <var>i</var>th <a>byte</a> of <var>b</var> if <var>i</var> is
 428 |    less than <var>b</var>'s <a for="byte sequence">length</a>; otherwise null.
 429 | 
 430 |    <li><p>If <var>bByte</var> is null, then return true.
 431 | 
 432 |    <li><p>Return false if <var>aByte</var> is not <var>bByte</var>.
 433 | 
 434 |    <li><p>Set <var>i</var> to <var>i</var> + 1.
 435 |   </ol>
 436 |  </li>
 437 | </ol>
 438 | 
 439 | <p>A <a>byte sequence</a> <var>a</var> is <dfn export>byte less than</dfn> a <a>byte sequence</a>
 440 | <var>b</var> if the following steps return true:
 441 | 
 442 | <ol>
 443 |  <li><p>If <var>a</var> <a for="byte sequence">starts with</a> <var>b</var>, then return false.
 444 | 
 445 |  <li><p>If <var>b</var> <a for="byte sequence">starts with</a> <var>a</var>, then return true.
 446 | 
 447 |  <li><p>Let <var>n</var> be the smallest index such that the <var>n</var>th <a>byte</a> of
 448 |  <var>a</var> is different from the <var>n</var>th byte of <var>b</var>. (There has to be such an
 449 |  index, since neither byte sequence starts with the other.)
 450 | 
 451 |  <li><p>If the <var>n</var>th byte of <var>a</var> is less than the <var>n</var>th byte of
 452 |  <var>b</var>, then return true.
 453 | 
 454 |  <li><p>Return false.
 455 | </ol>
 456 | 
 457 | <hr>
 458 | 
 459 | <p>To <dfn export>isomorphic decode</dfn> a <a>byte sequence</a> <var>input</var>, return a
 460 | <a>string</a> whose <a for=string>length</a> is equal to <var>input</var>'s
 461 | <a for="byte sequence">length</a> and whose <a>code points</a> have the same values as
 462 | <var>input</var>'s <a>bytes</a>, in the same order.
 463 | 
 464 | 
 465 | <h3 id=code-points>Code points</h3>
 466 | 
 467 | <p>A <dfn export lt="code point|character">code point</dfn> is a Unicode code point and is
 468 | represented as a four-to-six digit hexadecimal number, typically prefixed with "U+".
 469 | 
 470 | <p>A <a>code point</a> may be followed by its name, by its rendered form between parentheses when it
 471 | is not U+0028 or U+0029, or by both. Documents using the Infra Standard are encouraged to follow
 472 | <a>code points</a> by their name when they cannot be rendered or are U+0028 or U+0029; otherwise,
 473 | follow them by their rendered form between parentheses, for legibility.
 474 | 
 475 | <p>A <a>code point</a>'s name is defined in the Unicode Standard and represented in
 476 | <a>ASCII uppercase</a>. [[!UNICODE]]
 477 | 
 478 | <div class=example id=example-code-point-notation>
 479 |  <p>The <a>code point</a> rendered as 🤔 is represented as U+1F914.
 480 | 
 481 |  <p>When referring to that <a>code point</a>, we might say "U+1F914 (🤔)", to provide extra context.
 482 |  Documents are allowed to use "U+1F914 THINKING FACE (🤔)" as well, though this is somewhat verbose.
 483 | </div>
 484 | 
 485 | <p class=example id=example-code-point-notation-hard-to-render><a>Code points</a> that are difficult
 486 | to render unambiguously, such as U+000A, can be referred to as "U+000A LF". U+0029 can be referred
 487 | to as "U+0029 RIGHT PARENTHESIS", because even though it renders, this avoids unmatched parentheses.
 488 | 
 489 | <p><a>Code points</a> are sometimes referred to as <a>characters</a> and in certain contexts are
 490 | prefixed with "0x" rather than "U+".
 491 | 
 492 | <p>A <dfn export>surrogate</dfn> is a <a>code point</a> that is in the range U+D800 to U+DFFF,
 493 | inclusive.
 494 | 
 495 | <p>A <dfn export>scalar value</dfn> is a <a>code point</a> that is not a <a>surrogate</a>.
 496 | 
 497 | <p>A <dfn export>noncharacter</dfn> is a <a>code point</a> that is in the range U+FDD0 to U+FDEF,
 498 | inclusive, or U+FFFE, U+FFFF, U+1FFFE, U+1FFFF, U+2FFFE, U+2FFFF, U+3FFFE, U+3FFFF, U+4FFFE,
 499 | U+4FFFF, U+5FFFE, U+5FFFF, U+6FFFE, U+6FFFF, U+7FFFE, U+7FFFF, U+8FFFE, U+8FFFF, U+9FFFE, U+9FFFF,
 500 | U+AFFFE, U+AFFFF, U+BFFFE, U+BFFFF, U+CFFFE, U+CFFFF, U+DFFFE, U+DFFFF, U+EFFFE, U+EFFFF, U+FFFFE,
 501 | U+FFFFF, U+10FFFE, or U+10FFFF.
 502 | 
 503 | <p>An <dfn export>ASCII code point</dfn> is a <a>code point</a> in the range U+0000 NULL to
 504 | U+007F DELETE, inclusive.
 505 | 
 506 | <p>An <dfn export lt="ASCII tab or newline|ASCII tabs or newlines">ASCII tab or newline</dfn> is
 507 | U+0009 TAB, U+000A LF, or U+000D CR.
 508 | 
 509 | <p><dfn export>ASCII whitespace</dfn> is U+0009 TAB, U+000A LF, U+000C FF, U+000D CR, or U+0020
 510 | SPACE.
 511 | 
 512 | <p class=note>"Whitespace" is a mass noun.
 513 | 
 514 | <p>A <dfn export>C0 control</dfn> is a <a>code point</a> in the range U+0000 NULL to
 515 | U+001F INFORMATION SEPARATOR ONE, inclusive.
 516 | 
 517 | <p>A <dfn export lt="C0 control or space|C0 controls or spaces">C0 control or space</dfn> is a
 518 | <a>C0 control</a> or U+0020 SPACE.
 519 | 
 520 | <p>A <dfn export>control</dfn> is a <a>C0 control</a> or a <a>code point</a> in the range
 521 | U+007F DELETE to U+009F APPLICATION PROGRAM COMMAND, inclusive.
 522 | 
 523 | <p>An <dfn export>ASCII digit</dfn> is a <a>code point</a> in the range U+0030 (0) to U+0039 (9),
 524 | inclusive.
 525 | 
 526 | <p>An <dfn export>ASCII upper hex digit</dfn> is an <a>ASCII digit</a> or a <a>code point</a> in the
 527 | range U+0041 (A) to U+0046 (F), inclusive.
 528 | 
 529 | <p>An <dfn export>ASCII lower hex digit</dfn> is an <a>ASCII digit</a> or a <a>code point</a> in the
 530 | range U+0061 (a) to U+0066 (f), inclusive.
 531 | 
 532 | <p>An <dfn export>ASCII hex digit</dfn> is an <a>ASCII upper hex digit</a> or
 533 | <a>ASCII lower hex digit</a>.
 534 | 
 535 | <p>An <dfn export>ASCII upper alpha</dfn> is a <a>code point</a> in the range U+0041 (A) to
 536 | U+005A (Z), inclusive.
 537 | 
 538 | <p>An <dfn export>ASCII lower alpha</dfn> is a <a>code point</a> in the range U+0061 (a) to
 539 | U+007A (z), inclusive.
 540 | 
 541 | <p>An <dfn export>ASCII alpha</dfn> is an <a>ASCII upper alpha</a> or <a>ASCII lower alpha</a>.
 542 | 
 543 | <p>An <dfn export>ASCII alphanumeric</dfn> is an <a>ASCII digit</a> or <a>ASCII alpha</a>.
 544 | 
 545 | 
 546 | <h3 id=strings>Strings</h3>
 547 | 
 548 | <p>A <dfn export>JavaScript string</dfn> is a sequence of unsigned 16-bit integers, also known as
 549 | <dfn export lt="code unit">code units</dfn>.
 550 | 
 551 | <p class=note>This is different from how the Unicode Standard defines "code unit". In particular it
 552 | refers exclusively to how the Unicode Standard defines it for Unicode 16-bit strings. [[UNICODE]]
 553 | 
 554 | <p>A <a>JavaScript string</a>'s <dfn export for="JavaScript string">length</dfn> is the number of
 555 | <a>code units</a> it contains.
 556 | 
 557 | <p>A <a>JavaScript string</a> can also be interpreted as containing <a>code points</a>, per the
 558 | conversion defined in <a>The String Type</a> section of the JavaScript specification. [[!ECMA-262]]
 559 | 
 560 | <p class=note>This conversion process converts surrogate pairs into their corresponding
 561 | <a>scalar value</a> and maps isolated surrogates to their corresponding <a>code point</a>, leaving
 562 | them effectively as-is.
 563 | 
 564 | <p class=example id=example-javascript-string-in-code-points>A <a>JavaScript string</a> consisting
 565 | of the <a>code units</a> 0xD83D, 0xDCA9, and 0xD800, when interpreted as containing
 566 | <a>code points</a>, would consist of the <a>code points</a> U+1F4A9 and U+D800.
 567 | 
 568 | <p>A <dfn export>scalar value string</dfn> is a sequence of <a>scalar values</a>.
 569 | 
 570 | <p class=note>A <a>scalar value string</a> is useful for any kind of I/O or other kind of operation
 571 | where <a>UTF-8 encode</a> comes into play.
 572 | <!-- It's also useful if you can imagine the subsystem to be implemented in Rust -->
 573 | 
 574 | <p><dfn export lt=string>String</dfn> can be used to refer to either a <a>JavaScript string</a> or
 575 | <a>scalar value string</a>, when it is clear from the context which is meant or when the distinction
 576 | is immaterial. <a>Strings</a> are denoted by double quotes and monospace font.
 577 | 
 578 | <p class=example id=example-string-notation>"<code>Hello, world!</code>" is a string.
 579 | 
 580 | <p>A <a>string</a>'s <dfn export for=string>length</dfn> is the number of <a>code points</a> it
 581 | contains.
 582 | 
 583 | <p>To <dfn export for="JavaScript string">convert</dfn> a <a>JavaScript string</a> into a
 584 | <a>scalar value string</a>, replace any <a>surrogates</a> with U+FFFD.
 585 | <!-- Obviates need for https://heycam.github.io/webidl/#dfn-obtain-unicode -->
 586 | 
 587 | <p class=note>The replaced surrogates are always isolated surrogates, since the process of
 588 | interpreting the JavaScript string as containing <a>code points</a> will have converted surrogate
 589 | pairs into <a>scalar values</a>.
 590 | 
 591 | <p>A <a>scalar value string</a> can always be used as a <a>JavaScript string</a> implicitly since it
 592 | is a subset. The reverse is only possible if the <a>JavaScript string</a> is known to not contain
 593 | <a>surrogates</a>; otherwise a <a for="JavaScript string" lt=convert>conversion</a> must be
 594 | performed.
 595 | 
 596 | <p class=note>An implementation likely has to perform explicit conversion, depending on how it
 597 | actually ends up representing <a lt="JavaScript string">JavaScript</a> and
 598 | <a>scalar value strings</a>. It is even fairly typical for implementations to have multiple
 599 | implementations of just <a>JavaScript strings</a> for performance and memory reasons.
 600 | 
 601 | <hr>
 602 | 
 603 | <p>A <a>string</a> <var>a</var> is a
 604 | <dfn export lt="code unit prefix|starts with">code unit prefix</dfn> of a <a>string</a> <var>b</var>
 605 | if the following steps return true:
 606 | 
 607 | <ol>
 608 |  <li><p>Let <var>i</var> be 0.
 609 | 
 610 |  <li>
 611 |   <p><a>While</a> true:
 612 | 
 613 |   <ol>
 614 |    <li><p>Let <var>aCodeUnit</var> be the <var>i</var>th <a>code unit</a> of <var>a</var> if
 615 |    <var>i</var> is less than <var>a</var>'s <a for=string>length</a>; otherwise null.
 616 | 
 617 |    <li><p>Let <var>bCodeUnit</var> be the <var>i</var>th <a>code unit</a> of <var>b</var> if
 618 |    <var>i</var> is less than <var>b</var>'s <a for=string>length</a>; otherwise null.
 619 | 
 620 |    <li><p>If <var>aCodeUnit</var> is null, then return true.
 621 | 
 622 |    <li><p>Return false if <var>aCodeUnit</var> is different from <var>bCodeUnit</var>.
 623 | 
 624 |    <li><p>Set <var>i</var> to <var>i</var> + 1.
 625 |   </ol>
 626 |  </li>
 627 | </ol>
 628 | 
 629 | <p>When it is clear from context that <a>code units</a> are in play, e.g., because one of the
 630 | strings is a literal containing only characters that are in the range U+0020 SPACE to U+007E (~),
 631 | "<var>a</var> starts with <var>b</var>" can be used as a synonym for "<var>b</var> is a
 632 | <a>code unit prefix</a> of <var>a</var>".
 633 | 
 634 | <p class=example id=code-unit-prefix-example>With unknown values, it is good to be explicit:
 635 | <var ignore>targetString</var> is a <a>code unit prefix</a> of <var>userInput</var>. But with a
 636 | literal, we can use plainer language: <var>userInput</var> starts with "<code>!</code>".
 637 | 
 638 | <p>A <a>string</a> <var>a</var> is <dfn export>code unit less than</dfn> a <a>string</a>
 639 | <var>b</var> if the following steps return true:
 640 | 
 641 | <ol>
 642 |  <li><p>If <var>b</var> is a <a>code unit prefix</a> of <var>a</var>, then return false.
 643 | 
 644 |  <li><p>If <var>a</var> is a <a>code unit prefix</a> of <var>b</var>, then return true.
 645 | 
 646 |  <li><p>Let <var>n</var> be the smallest index such that the <var>n</var>th <a>code unit</a> of
 647 |  <var>a</var> is different from the <var>n</var>th code unit of <var>b</var>. (There has to be such
 648 |  an index, since neither string is a prefix of the other.)
 649 | 
 650 |  <li><p>If the <var>n</var>th code unit of <var>a</var> is less than the <var>n</var>th code unit of
 651 |  <var>b</var>, then return true.
 652 | 
 653 |  <li><p>Return false.
 654 | </ol>
 655 | 
 656 | <p class="note">This matches the ordering used by JavaScript's <code>&lt;</code> operator, and its
 657 | {{Array/sort()}} method on an array of strings. This ordering compares the 16-bit code units in each
 658 | string, producing a highly efficient, consistent, and deterministic sort order. The resulting
 659 | ordering will not match any particular alphabet or lexicographic order, particularly for
 660 | <a>code points</a> represented by a surrogate pair. [[!ECMA-262]]
 661 | 
 662 | <hr>
 663 | 
 664 | <p>To <dfn export>isomorphic encode</dfn> a <a>string</a> <var>input</var>, run these steps:</p>
 665 | 
 666 | <ol>
 667 |  <li><p><a>Assert</a>: <var>input</var> contains no <a>code points</a> greater than U+00FF.
 668 | 
 669 |  <li><p>Return a <a>byte sequence</a> whose <a for="byte sequence">length</a> is equal to
 670 |  <var>input</var>'s <a for=string>length</a> and whose <a>bytes</a> have the same values as
 671 |  <var>input</var>'s <a>code points</a>, in the same order.
 672 | </ol>
 673 | 
 674 | <hr>
 675 | 
 676 | <p>An <dfn export>ASCII string</dfn> is a <a>string</a> whose <a>code points</a> are all
 677 | <a>ASCII code points</a>.
 678 | 
 679 | <p>To <dfn export>ASCII lowercase</dfn> a <a>string</a>, replace all <a>ASCII upper alphas</a> in
 680 | the <a>string</a> with their corresponding <a>code point</a> in <a>ASCII lower alpha</a>.
 681 | 
 682 | <p>To <dfn export>ASCII uppercase</dfn> a <a>string</a>, replace all <a>ASCII lower alphas</a> in
 683 | the <a>string</a> with their corresponding <a>code point</a> in <a>ASCII upper alpha</a>.
 684 | 
 685 | <p>A <a>string</a> <var>A</var> is an <dfn export>ASCII case-insensitive</dfn> match for a
 686 | <a>string</a> <var>B</var>, if the <a>ASCII lowercase</a> of <var>A</var> is the
 687 | <a>ASCII lowercase</a> of <var>B</var>.
 688 | <!-- TODO: define string equals? -->
 689 | 
 690 | <p>To <dfn export>ASCII encode</dfn> a <a>string</a> <var>input</var>, run these steps:
 691 | 
 692 | <ol>
 693 |  <li><p><a>Assert</a>: <var>input</var> is an <a>ASCII string</a>.
 694 | 
 695 |  <p class=note>Note: This precondition ensures that <a>isomorphic encode</a> and
 696 |  <a>UTF-8 encode</a> return the same <a>byte sequence</a> for this input.
 697 | 
 698 |  <li><p>Return the <a>isomorphic encoding</a> of <var>input</var>.
 699 | </ol>
 700 | 
 701 | <p>To <dfn export>ASCII decode</dfn> a <a>byte sequence</a> <var>input</var>, run these steps:
 702 | 
 703 | <ol>
 704 |  <li><p><a>Assert</a>: All bytes in <var>input</var> are <a>ASCII bytes</a>.
 705 | 
 706 |  <p class=note>Note: This precondition ensures that <a>isomorphic decode</a> and
 707 |  <a>UTF-8 decode</a> return the same <a>string</a> for this input.
 708 | 
 709 |  <li><p>Return the <a>isomorphic decoding</a> of <var>input</var>.
 710 | </ol>
 711 | 
 712 | 
 713 | <hr>
 714 | 
 715 | <p>To <dfn export>strip newlines</dfn> from a <a>string</a>, remove any U+000A LF and U+000D CR
 716 | <a>code points</a> from the <a>string</a>.
 717 | 
 718 | <p>To <dfn export>normalize newlines</dfn> in a <a>string</a>, replace every U+000D CR U+000A LF
 719 | <a>code point</a> pair with a single U+000A LF <a>code point</a>, and then replace every remaining
 720 | U+000D CR <a>code point</a> with a U+000A LF <a>code point</a>.
 721 | 
 722 | <p>To <dfn export>strip leading and trailing ASCII whitespace</dfn> from a <a>string</a>, remove all
 723 | <a>ASCII whitespace</a> that is at the start or the end of the <a>string</a>.
 724 | 
 725 | <p>To <dfn export>strip and collapse ASCII whitespace</dfn> in a <a>string</a>, replace any sequence
 726 | of one or more consecutive <a>code points</a> that are <a>ASCII whitespace</a> in the <a>string</a>
 727 | with a single U+0020 SPACE <a>code point</a>, and then remove any leading and trailing
 728 | <a>ASCII whitespace</a> from that string.
 729 | 
 730 | <hr>
 731 | 
 732 | <p>To <dfn export lt="collect a sequence of code points|collecting a sequence of code
 733 | points">collect a sequence of <a>code points</a></dfn> meeting a condition <var>condition</var> from
 734 | a <a>string</a> <var>input</var>, given a <dfn export for="string">position variable</dfn>
 735 | <var>position</var> tracking the position of the calling algorithm within <var>input</var>:</p>
 736 | 
 737 | <ol>
 738 |  <li><p>Let <var>result</var> be the empty <a>string</a>.
 739 | 
 740 |  <li>
 741 |   <p>While <var>position</var> doesn't point past the end of <var>input</var> and the
 742 |   <a>code point</a> at <var>position</var> within <var>input</var> meets the condition
 743 |   <var>condition</var>:
 744 | 
 745 |   <ol>
 746 |    <li><p>Append that <a>code point</a> to the end of <var>result</var>.
 747 | 
 748 |    <li><p>Advance <var>position</var> by 1.
 749 |   </ol>
 750 |  </li>
 751 | 
 752 |  <li><p>Return <var>result</var>.
 753 | </ol>
 754 | 
 755 | <p class=note>In addition to returning the collected <a>code points</a>, this algorithm updates the
 756 | <a>position variable</a> in the calling algorithm.
 757 | 
 758 | <p>To <dfn export>skip ASCII whitespace</dfn> within a <a>string</a> <var>input</var> given a
 759 | <a>position variable</a> <var>position</var>, <a>collect a sequence of code points</a> that are
 760 | <a>ASCII whitespace</a> from <var>input</var> given <var>position</var>. The collected
 761 | <a>code points</a> are not used, but <var>position</var> is still updated.
 762 | 
 763 | <hr>
 764 | 
 765 | <p>To <dfn export lt="strictly split|strictly split a string">strictly split a <a>string</a></dfn>
 766 | <var>input</var> on a particular delimiter <a>code point</a> <var>delimiter</var>:</p>
 767 | 
 768 | <ol>
 769 |  <li><p>Let <var>position</var> be a <a>position variable</a> for <var>input</var>, initially
 770 |  pointing at the start of <var>input</var>.
 771 | 
 772 |  <li><p>Let <var>tokens</var> be a <a>list</a> of <a>strings</a>, initially empty.
 773 | 
 774 |  <li><p>Let <var>token</var> be the result of <a>collecting a sequence of code points</a> that are
 775 |  not equal to <var>delimiter</var> from <var>input</var>, given <var>position</var>.
 776 | 
 777 |  <li><p><a for="list">Append</a> <var>token</var> to <var>tokens</var>.
 778 | 
 779 |  <li>
 780 |   <p>While <var>position</var> is not past the end of <var>input</var>:
 781 | 
 782 |   <ol>
 783 |    <li><p><a>Assert</a>: the <a>code point</a> at <var>position</var> within <var>input</var> is
 784 |    <var>delimiter</var>.
 785 | 
 786 |    <li><p>Advance <var>position</var> by 1.
 787 | 
 788 |    <li><p>Let <var>token</var> be the result of <a>collecting a sequence of code points</a> that are
 789 |    not equal to <var>delimiter</var> from <var>input</var>, given <var>position</var>.
 790 | 
 791 |    <li><p><a for="list">Append</a> <var>token</var> to <var>tokens</var>.
 792 |   </ol>
 793 |  </li>
 794 | 
 795 |  <li><p>Return <var>tokens</var>.
 796 | </ol>
 797 | 
 798 | <p class=note>This algorithm is a "strict" split, as opposed to the commonly-used variants
 799 | <a lt="split on ASCII whitespace">for ASCII whitespace</a> and
 800 | <a lt="split on commas">for commas</a> below, which are both more lenient in various ways involving
 801 | interspersed <a>ASCII whitespace</a>.
 802 | 
 803 | <p>To <dfn export lt="split on ASCII whitespace|split a string on ASCII whitespace">split a
 804 | <a>string</a> <var>input</var> on ASCII whitespace</dfn>:
 805 | 
 806 | <ol>
 807 |  <li><p>Let <var>position</var> be a <a>position variable</a> for <var>input</var>, initially
 808 |  pointing at the start of <var>input</var>.
 809 | 
 810 |  <li><p>Let <var>tokens</var> be a <a>list</a> of <a>strings</a>, initially empty.
 811 | 
 812 |  <li><p><a>Skip ASCII whitespace</a> within <var>input</var> given <var>position</var>.
 813 | 
 814 |  <li>
 815 |   <p>While <var>position</var> is not past the end of <var>input</var>:
 816 | 
 817 |   <ol>
 818 |    <li><p>Let <var>token</var> be the result of <a>collecting a sequence of code points</a> that are
 819 |    not <a>ASCII whitespace</a> from <var>input</var>, given <var>position</var>.
 820 | 
 821 |    <li><p><a for="list">Append</a> <var>token</var> to <var>tokens</var>.
 822 | 
 823 |    <li><p><a>Skip ASCII whitespace</a> within <var>input</var> given <var>position</var>.
 824 |   </ol>
 825 |  </li>
 826 | 
 827 |  <li><p>Return <var>tokens</var>.
 828 | </ol>
 829 | 
 830 | <p>To <dfn export lt="split on commas|split a string on commas">split a <a>string</a>
 831 | <var>input</var> on commas</dfn>:
 832 | 
 833 | <ol>
 834 |  <li><p>Let <var>position</var> be a <a>position variable</a> for <var>input</var>, initially
 835 |  pointing at the start of <var>input</var>.
 836 | 
 837 |  <li><p>Let <var>tokens</var> be a <a>list</a> of <a>strings</a>, initially empty.
 838 | 
 839 |  <li>
 840 |   <p>While <var>position</var> is not past the end of <var>input</var>:
 841 | 
 842 |   <ol>
 843 |    <li>
 844 |     <p>Let <var>token</var> be the result of <a>collecting a sequence of code points</a> that are
 845 |     not U+002C (,) from <var>input</var>, given <var>position</var>.
 846 | 
 847 |     <p class=note><var>token</var> might be the empty string.
 848 |    </li>
 849 | 
 850 |    <li><p><a>Strip leading and trailing ASCII whitespace</a> from <var>token</var>.
 851 | 
 852 |    <li><p><a for="list">Append</a> <var>token</var> to <var>tokens</var>.
 853 | 
 854 |    <li>
 855 |     <p>If <var>position</var> is not past the end of <var>input</var>, then:
 856 | 
 857 |     <ol>
 858 |      <li><p><a>Assert</a>: the <a>code point</a> at <var>position</var> within <var>input</var> is
 859 |      U+002C (,).
 860 | 
 861 |      <li><p>Advance <var>position</var> by 1.
 862 |     </ol>
 863 |    </li>
 864 |   </ol>
 865 |  </li>
 866 | 
 867 |  <li><p>Return <var>tokens</var>.
 868 | </ol>
 869 | 
 870 | <p>To <dfn export for=string lt=concatenate|concatenation>concatenate</dfn> a <a for=/>list</a> of
 871 | <a for=/>strings</a> <var>list</var>, using an optional separator string <var>separator</var>, run
 872 | these steps:
 873 | 
 874 | <ol>
 875 |  <li><p>If <var>list</var> <a for=list>is empty</a>, then return the empty string.
 876 | 
 877 |  <li><p>If <var>separator</var> is not given, then set <var>separator</var> to the empty string.
 878 | 
 879 |  <li><p>Return a <a for=/>string</a> whose contents are <var>list</var>'s <a for=list>items</a>, in
 880 |  order, separated from each other by <var>separator</var>.
 881 | </ol>
 882 | 
 883 | <p class=example id=example-string-concatenate>To serialize a set <var>set</var>, return the
 884 | <a for=string>concatenation</a> of <var>set</var> using U+0020 SPACE.
 885 | 
 886 | 
 887 | <h2 id=data-structures>Data structures</h2>
 888 | 
 889 | <p>Conventionally, specifications have operated on a variety of vague specification-level data
 890 | structures, based on shared understanding of their semantics. This generally works well, but can
 891 | lead to ambiguities around edge cases, such as iteration order or what happens when you
 892 | <a for=set>append</a> an <a for=set>item</a> to an <a>ordered set</a> that the set already
 893 | <a for=set>contains</a>. It has also led to a variety of divergent notation and phrasing, especially
 894 | around more complex data structures such as <a lt="ordered map">maps</a>.
 895 | 
 896 | <p>This standard provides a small set of common data structures, along with notation and phrasing
 897 | for working with them, in order to create common ground.
 898 | 
 899 | 
 900 | <h3 id=lists>Lists</h3>
 901 | 
 902 | <p>A <dfn export>list</dfn> is a specification type consisting of a finite ordered sequence of
 903 | <dfn export for=list,stack,queue,set lt=item>items</dfn>.
 904 | 
 905 | <p>For notational convenience, a literal syntax can be used to express <a>lists</a>, by surrounding
 906 | the list by « » characters and separating its <a for=list>items</a> with a comma. An indexing syntax
 907 | can be used by providing a zero-based index into a list inside square brackets. The index cannot be
 908 | out-of-bounds, except when used with <a for=list>exists</a>.
 909 | 
 910 | <p class=example id=example-list-notation>Let |example| be the <a>list</a> « "<code>a</code>",
 911 | "<code>b</code>", "<code>c</code>", "<code>a</code>" ». Then |example|[1] is the <a>string</a>
 912 | "<code>b</code>".
 913 | 
 914 | <hr>
 915 | 
 916 | <p>To <dfn export for=list>append</dfn> to a <a>list</a> that is not an <a>ordered set</a> is to
 917 | add the given <a for=list>item</a> to the end of the list.
 918 | 
 919 | <p>To <dfn export for=list>extend</dfn> a <a>list</a> |A| with a <a>list</a> |B|,
 920 | <a for=list>for each</a> |item| of |B|, <a for=list>append</a> |item| to |A|.
 921 | 
 922 | <div class=example id=example-list-extend>
 923 |  <ol>
 924 |   <li><p>Let |ghostbusters| be « "<code>Erin Gilbert</code>", "<code>Abby Yates</code>" ».
 925 | 
 926 |   <li><p><a for=list>Extend</a> |ghostbusters| with « "<code>Jillian Holtzmann</code>",
 927 |   "<code>Patty Tolan</code>" ».
 928 | 
 929 |   <li><p><a>Assert</a>: |ghostbusters|'s <a for=list>size</a> is 4.
 930 | 
 931 |   <li><p><a>Assert</a>: |ghostbusters|[2] is "<code>Jillian Holtzmann</code>".
 932 |  </ol>
 933 | </div>
 934 | 
 935 | <p>To <dfn export for=list>prepend</dfn> to a <a>list</a> that is not an <a>ordered set</a> is to
 936 | add the given <a for=list>item</a> to the beginning of the list.
 937 | 
 938 | <p>To <dfn export for=list>replace</dfn> within a <a>list</a> that is not an <a>ordered set</a> is
 939 | to replace all items from the list that match a given condition with the given <a for=list>item</a>,
 940 | or do nothing if none do.
 941 | 
 942 | <p class=note>The above definitions are modified when the <a>list</a> is an <a>ordered set</a>; see
 943 | below for <a for=set lt=append>ordered set append</a>, <a for=set>prepend</a>, and
 944 | <a for=set>replace</a>.
 945 | 
 946 | <p>To <dfn export for=list,set>insert</dfn> an <a for=list>item</a> into a <a>list</a> before an
 947 | index is to add the given item to the list between the given index &minus; 1 and the given index. If
 948 | the given index is 0, then <a for=list>prepend</a> the given item to the list.
 949 | 
 950 | <p>To <dfn export for=list,set>remove</dfn> zero or more <a for=list>items</a> from a <a>list</a> is
 951 | to remove all items from the list that match a given condition, or do nothing if none do.
 952 | 
 953 | <div class=example id=example-list-remove>
 954 |  <p><a for=list>Removing</a> |x| from the <a>list</a> « |x|, |y|, |z|, |x| » is to remove all
 955 |  items from the list that are equal to |x|. The list is now equivalent to « |y|, |z| ».
 956 | 
 957 |  <p><a for=list>Removing</a> all items that start with the <a>string</a> "<code>a</code>" from the
 958 |  <a>list</a> « "<code>a</code>", "<code>b</code>", "<code>ab</code>", "<code>ba</code>" » is to
 959 |  remove the items "<code>a</code>" and "<code>ab</code>". The list is now equivalent to «
 960 |  "<code>b</code>", "<code>ba</code>" ».
 961 | </div>
 962 | 
 963 | <p>To <dfn export for=list,stack,queue,set>empty</dfn> a <a>list</a> is to <a for=list>remove</a>
 964 | all of its <a for=list>items</a>.
 965 | 
 966 | <p>A <a>list</a> <dfn export for=list,stack,queue,set lt=contain|exist>contains</dfn> an
 967 | <a for=list>item</a> if it appears in the list. We can also denote this by saying that, for a
 968 | <a>list</a> |list| and an index |index|, "|list|[|index|] <a for=list>exists</a>".
 969 | 
 970 | <p>A <a>list</a>'s <dfn export for=list,stack,queue,set>size</dfn> is the number of
 971 | <a for=list>items</a> the list <a for=list>contains</a>.
 972 | 
 973 | <p>A <a>list</a> <dfn export for=list,stack,queue,set lt="is empty|is not empty">is empty</dfn> if
 974 | its <a for=list>size</a> is zero.
 975 | 
 976 | <p>To <dfn export for=list,set lt="iterate|for each">iterate</dfn> over a <a>list</a>, performing a
 977 | set of steps on each <a for=list>item</a> in order, use phrasing of the form
 978 | "<a for=list>For each</a> |item| of <var ignore>list</var>", and then operate on |item| in the
 979 | subsequent prose.
 980 | 
 981 | <p>To <dfn export for=list,stack,queue,set>clone</dfn> a <a>list</a> |list| is to create a new
 982 | <a>list</a> |clone|, of the same designation, and, <a for=list>for each</a> |item| of |list|,
 983 | <a for=list>append</a> |item| to |clone|, so that |clone| <a for=list>contains</a> the same
 984 | <a for=list>items</a>, in the same order as |list|.
 985 | 
 986 | Note: This is a "shallow clone", as the <a for=list>items</a> themselves are not cloned in any way.
 987 | 
 988 | <p class=example id=example-list-clone>Let |original| be the <a>ordered set</a> «
 989 | "<code>a</code>", "<code>b</code>", "<code>c</code>" ». <a for=set>Cloning</a> |original| creates
 990 | a new <a>ordered set</a> |clone|, so that <a for=set>replacing</a> "<code>a</code>" with
 991 | "<code>foo</code>" in |clone| gives « "<code>foo</code>", "<code>b</code>", "<code>c</code>" »,
 992 | while |original|[0] is still the <a>string</a> "<code>a</code>".
 993 | 
 994 | <p>To <dfn export for=list,stack,queue,set lt="sort in ascending order|sorting in ascending order|sort|sorting">sort in ascending order</dfn>
 995 | a <a>list</a> |list|, with a less than algorithm |lessThanAlgo|, is to create a new <a>list</a>
 996 | |sorted|, containing the same <a for=list>items</a> as |list| but sorted so that according to
 997 | |lessThanAlgo|, each item is less than the one following it, if any. For items that sort the same
 998 | (i.e., for which |lessThanAlgo| returns false for both comparisons), their relative order in
 999 | |sorted| must be the same as it was in |list|.
1000 | 
1001 | <p>To <dfn export for=list,stack,queue,set lt="sort in descending order|sorting in descending order">sort in descending order</dfn>
1002 | a <a>list</a> |list|, with a less than algorithm |lessThanAlgo|, is to create a new <a>list</a>
1003 | |sorted|, containing the same <a for=list>items</a> as |list| but sorted so that according to
1004 | |lessThanAlgo|, each item is less than the one preceding it, if any. For items that sort the same
1005 | (i.e., for which |lessThanAlgo| returns false for both comparisons), their relative order in
1006 | |sorted| must be the same as it was in |list|.
1007 | 
1008 | <p class=example id=example-list-sort>Let |original| be the <a>list</a> « (200, "<code>OK</code>"),
1009 | (404, "<code>Not Found</code>"), (null, "<code>OK</code>") ». <a for=list>Sorting</a> |original| in
1010 | ascending order, with |a| being less than |b| if |a|'s second <a for=struct>item</a> is
1011 | <a>code unit less than</a> |b|'s second <a for=struct>item</a>, gives the result « (404,
1012 | "<code>Not Found</code>"), (200, "<code>OK</code>"), (null, "<code>OK</code>") ».</p>
1013 | 
1014 | <hr>
1015 | 
1016 | <p>The <a>list</a> type originates from the JavaScript specification (where it is capitalized, as
1017 | <a spec=ecma-262>List</a>); we repeat some elements of its definition here for ease of reference,
1018 | and provide an expanded vocabulary for manipulating <a>lists</a>. Whenever JavaScript expects a
1019 | <a spec=ecma-262>List</a>, a <a>list</a> as defined here can be used; they are the same type.
1020 | [[!ECMA-262]]
1021 | 
1022 | <h4 id=stacks>Stacks</h4>
1023 | 
1024 | <p>Some <a>lists</a> are designated as <dfn export lt=stack>stacks</dfn>. A stack is a <a>list</a>,
1025 | but conventionally, the following operations are used to operate on it, instead of using
1026 | <a for=list>append</a>, <a for=list>prepend</a>, or <a for=list>remove</a>.
1027 | 
1028 | <p>To <dfn export for=stack>push</dfn> onto a <a>stack</a> is to <a for=list>append</a> to it.
1029 | 
1030 | <p>To <dfn export for=stack>pop</dfn> from a <a>stack</a>: if the <a>stack</a>
1031 | <a for=stack>is not empty</a>, then <a for=list>remove</a> its last <a for=stack>item</a> and return
1032 | it; otherwise, return nothing.
1033 | 
1034 | <p>Although <a>stacks</a> are <a>lists</a>, <a for=list>for each</a> must not be used with them;
1035 | instead, a combination of <a>while</a> and <a for=stack>pop</a> is more appropriate.
1036 | 
1037 | <h4 id=queues>Queues</h4>
1038 | 
1039 | <p>Some <a>lists</a> are designated as <dfn export lt=queue>queues</dfn>. A queue is a <a>list</a>,
1040 | but conventionally, the following operations are used to operate on it, instead of using
1041 | <a for=list>append</a>, <a for=list>prepend</a>, or <a for=list>remove</a>.
1042 | 
1043 | <p>To <dfn export for=queue>enqueue</dfn> in a <a>queue</a> is to <a for=list>append</a> to it.
1044 | 
1045 | <p>To <dfn export for=queue>dequeue</dfn> from a <a>queue</a>: if the <a>queue</a>
1046 | <a for=queue>is not empty</a>, then <a for=list>remove</a> its first <a for=queue>item</a> and
1047 | return it; otherwise, return nothing.
1048 | 
1049 | <p>Although <a>queues</a> are <a>lists</a>, <a for=list>for each</a> must not be used with them;
1050 | instead, a combination of <a>while</a> and <a for=queue>dequeue</a> is more appropriate.
1051 | 
1052 | <h4 id=sets>Sets</h4>
1053 | 
1054 | <p>Some <a>lists</a> are designated as <dfn export lt="ordered set|set">ordered sets</dfn>. An
1055 | ordered set is a <a>list</a> with the additional semantic that it must not contain the same
1056 | <a for=set>item</a> twice.
1057 | 
1058 | <p class=note>Almost all cases on the web platform require an <em>ordered</em> set, instead of an
1059 | unordered one, since interoperability requires that any developer-exposed enumeration of the set's
1060 | contents be consistent between browsers. In those cases where order is not important, we still use
1061 | ordered sets; implementations can optimize based on the fact that the order is not observable.
1062 | 
1063 | <p>To <dfn export for=set>append</dfn> to an <a>ordered set</a>: if the set <a for=list>contains</a>
1064 | the given <a for=set>item</a>, then do nothing; otherwise, perform the normal <a>list</a>
1065 | <a for=list>append</a> operation.
1066 | 
1067 | <p>To <dfn export for=set>prepend</dfn> to an <a>ordered set</a>: if the set
1068 | <a for=list>contains</a> the given <a for=set>item</a>, then do nothing; otherwise, perform the
1069 | normal <a>list</a> <a for=list>prepend</a> operation.
1070 | 
1071 | <p>To <dfn export for=set lt=replace|replacing>replace</dfn> within an <a>ordered set</a>
1072 | <var>set</var>, given <var>item</var> and <var>replacement</var>: if <var>set</var>
1073 | <a for=set>contains</a> <var>item</var> or <var>replacement</var>, then replace the first instance
1074 | of either with <var>replacement</var> and <a for=set>remove</a> all other instances.
1075 | 
1076 | <p class=example id=example-set-replace><a for="set">Replacing</a> "a" with "c" within the
1077 | <a>ordered set</a> « "a", "b", "c" » gives « "c", "b" ». Within « "c", "b", "a" » it gives
1078 | « "c", "b" » as well.
1079 | 
1080 | <p>An <a>ordered set</a> |set| is a <dfn export for=set>subset</dfn> of another <a>ordered set</a>
1081 | |superset| (and conversely, |superset| is a <dfn export for=set>superset</dfn> of |set|) if,
1082 | <a for=list>for each</a> |item| of |set|, |superset| <a for=set>contains</a> |item|.
1083 | 
1084 | <p class=note>This implies that an <a>ordered set</a> is both a <a for=set>subset</a> and a
1085 | <a for=set>superset</a> of itself.
1086 | 
1087 | <p>The <dfn export for=set>intersection</dfn> of <a>ordered sets</a> |A| and |B| is the result
1088 | of creating a new <a>ordered set</a> |set| and, <a for=list>for each</a> |item| of |A|, if |B|
1089 | <a for=set>contains</a> |item|, <a for=set>appending</a> |item| to |set|.
1090 | 
1091 | <p>The <dfn export for=set>union</dfn> of <a>ordered sets</a> |A| and |B| is the result of
1092 | <a for=list>cloning</a> |A| as |set| and, <a for=list>for each</a> |item| of |B|,
1093 | <a for=set>appending</a> |item| to |set|.
1094 | 
1095 | <hr>
1096 | 
1097 | <p><dfn export lt="the range">The range</dfn> <var>n</var> to <var>m</var>, inclusive, creates a new
1098 | <a>ordered set</a> containing all of the integers from <var>n</var> up to and including <var>m</var>
1099 | in consecutively increasing order, as long as <var>m</var> is greater than or equal to <var>n</var>.
1100 | 
1101 | <p class=example id=example-the-range><a for=set>For each</a> <var>n</var> of <a>the range</a> 1 to
1102 | 4, inclusive, &hellip;
1103 | 
1104 | 
1105 | <h3 id=maps>Maps</h3>
1106 | 
1107 | <p>An <dfn export lt="ordered map|map">ordered map</dfn>, or sometimes just "map", is a
1108 | specification type consisting of a finite ordered sequence of
1109 | <dfn for=map export>key</dfn>/<dfn for=map export>value</dfn> pairs, with no key appearing twice.
1110 | Each key/value pair is called an <dfn for=map export>entry</dfn>.
1111 | 
1112 | <p class=note>As with <a>ordered sets</a>, by default we assume that maps need to be ordered for
1113 | interoperability among implementations.
1114 | 
1115 | <p>A literal syntax can be used to express <a>ordered maps</a>, by surrounding the ordered map with
1116 | «[ ]» characters, denoting each of its <a for=map>entries</a> as |key| → |value|, and separating its
1117 | entries with a comma. An indexing syntax can be used to look up and set <a for=map>values</a> by
1118 | providing a <a for=map>key</a> inside square brackets. The index cannot be out-of-bounds, except
1119 | when used with <a for=map>exists</a>.
1120 | 
1121 | <p class=example id=example-map-notation>Let |example| be the <a>ordered map</a> «[
1122 | "<code>a</code>" → `<code>x</code>`, "<code>b</code>" → `<code>y</code>` ]». Then
1123 | |example|["<code>a</code>"] is the <a>byte sequence</a> `<code>x</code>`.
1124 | 
1125 | <hr>
1126 | 
1127 | <p>To <dfn export for=map lt="get|get the value">get the value of an entry</dfn> in an
1128 | <a>ordered map</a> given a <a for=map>key</a>, return the <a for=map>value</a> of the
1129 | <a for=map>entry</a> whose <a for=map>key</a> is the given key. We can also use the indexing syntax
1130 | explained above.
1131 | 
1132 | <p>To <dfn export for=map lt="set|set the value">set the value of an entry</dfn> in an
1133 | <a>ordered map</a> to a given <a for=map>value</a> is to update the value of any existing
1134 | <a for=map>entry</a> if the map <a for=map>contains</a> an entry with the given <a for=map>key</a>,
1135 | or if none such exists, to add a new entry with the given key/value to the end of the map. We can
1136 | also denote this by saying, for an <a>ordered map</a> |map|, key |key|, and value |value|,
1137 | "<a for=map>set</a> |map|[|key|] to |value|".
1138 | 
1139 | <p>To <dfn export for=map lt=remove>remove an entry</dfn> from an <a>ordered map</a> is to remove
1140 | all <a for=map>entries</a> from the map that match a given condition, or do nothing if none do. If
1141 | the condition is having a certain <a for=map>key</a>, then we can also denote this by saying, for
1142 | an <a>ordered map</a> |map| and key |key|, "<a for=map>remove</a> |map|[|key|]".
1143 | 
1144 | <p>An <a>ordered map</a> <dfn export for=map lt=exist|contain id=map-exists>contains an
1145 | <a for=map>entry</a> with a given key</dfn> if there exists an entry with that <a for=map>key</a>.
1146 | We can also denote this by saying that, for an <a>ordered map</a> |map| and key |key|, "|map|[|key|]
1147 | <a for=map>exists</a>".
1148 | 
1149 | <p>To <dfn export for=map lt="getting the keys|get the keys">get the keys</dfn> of an
1150 | <a>ordered map</a>, return a new <a>ordered set</a> whose <a for=set>items</a> are each of the
1151 | <a for=map>keys</a> in the map's <a for=map>entries</a>.
1152 | 
1153 | <p>To <dfn export for=map lt="getting the values|get the values">get the values</dfn> of an
1154 | <a>ordered map</a>, return a new <a>list</a> whose <a for=list>items</a> are each of the
1155 | <a for=map>values</a> in the map's <a for=map>entries</a>.
1156 | 
1157 | <p>An <a>ordered map</a>'s <dfn export for=map>size</dfn> is the <a for=set>size</a> of the result
1158 | of running <a for=map>get the keys</a> on the map.
1159 | 
1160 | <p>An <a>ordered map</a> <dfn export for=map lt="is empty|is not empty">is empty</dfn> if its
1161 | <a for=map>size</a> is zero.
1162 | 
1163 | <p>To <dfn export for=map lt="iterate|for each">iterate</dfn> over an <a>ordered map</a>, performing
1164 | a set of steps on each <a for=map>entry</a> in order, use phrasing of the form
1165 | "<a for=map>For each</a> |key| → |value| of |map|", and then operate on |key| and |value| in the
1166 | subsequent prose.
1167 | 
1168 | <p>To <dfn export for=map lt="sort in ascending order|sorting in ascending order|sort|sorting">sort in ascending order</dfn>
1169 | a <a>map</a> |map|, with a less than algorithm |lessThanAlgo|, is to create a new <a>map</a>
1170 | |sorted|, containing the same <a for=map>entries</a> as |map| but sorted so that according to
1171 | |lessThanAlgo|, each entry is less than the one following it, if any. For entries that sort the same
1172 | (i.e., for which |lessThanAlgo| returns false for both comparisons), their relative order in
1173 | |sorted| must be the same as it was in |map|.
1174 | 
1175 | <p>To <dfn export for=map lt="sort in descending order|sorting in descending order">sort in descending order</dfn>
1176 | a <a>map</a> |map|, with a less than algorithm |lessThanAlgo|, is to create a new <a>map</a>
1177 | |sorted|, containing the same <a for=map>entries</a> as |map| but sorted so that according to
1178 | |lessThanAlgo|, each entry is less than the one preceding it, if any. For entries that sort the same
1179 | (i.e., for which |lessThanAlgo| returns false for both comparisons), their relative order in
1180 | |sorted| must be the same as it was in |map|.
1181 | 
1182 | 
1183 | <h3 id=structs>Structs</h3>
1184 | 
1185 | <p>A <dfn export>struct</dfn> is a specification type consisting of a finite set of
1186 | <dfn export for=struct,tuple,pair lt=item>items</dfn>, each of which has a unique and immutable
1187 | <dfn export for=struct,tuple,pair>name</dfn>.
1188 | 
1189 | <hr>
1190 | 
1191 | <p><a>Structs</a> with a defined order are also known as <dfn export lt=tuple>tuples</dfn>. For
1192 | notational convenience, a literal syntax can be used to express <a>tuples</a>, by surrounding the
1193 | tuple with parentheses and separating its <a for=tuple>items</a> with a comma. To use this notation,
1194 | the <a for=tuple>names</a> need to be clear from context. This can be done by preceding the first
1195 | instance with the name given to the <a>tuple</a>.
1196 | 
1197 | <div class=example id=example-tuple>
1198 |  <!-- If https://github.com/tabatkins/bikeshed/issues/960 gets fixed we can show how to use <dfn>
1199 |  and <a> on these -->
1200 |  <p>A status is an example <a>tuple</a> consisting of a code (a three-digit number) and text (a byte
1201 |  sequence).
1202 | 
1203 |  <p>A nonsense algorithm that manipulates status tuples for the purpose of demonstrating their
1204 |  usage is then:</p>
1205 | 
1206 |  <ol>
1207 |   <li>Let |statusInstance| be the status (200, `<code>OK</code>`).
1208 |   <li>Set |statusInstance| to (301, `<code>FOO BAR</code>`).
1209 |   <li>If |statusInstance|'s code is 404, then &hellip;
1210 |  </ol>
1211 | </div>
1212 | 
1213 | <p class=note>It is intentional that not all <a>structs</a> are <a>tuples</a>. Documents using the
1214 | Infra Standard might need the flexibility to add new <a for=struct>names</a> to their struct
1215 | without breaking literal syntax used by their dependencies. In that case a tuple is not appropriate.
1216 | 
1217 | <hr>
1218 | 
1219 | <p><a>Tuples</a> with two <a for=tuple>items</a> are also known as <dfn export lt=pair>pairs</dfn>.
1220 | For <a>pairs</a>, a slightly shorter literal syntax can be used, separating the two
1221 | <a for=pair>items</a> with a / character.
1222 | 
1223 | <p class=example id=example-pair>Another way of expressing our |statusInstance| tuple above would be
1224 | as 200/`<code>OK</code>`.
1225 | 
1226 | 
1227 | <h2 id=json>JSON</h2>
1228 | 
1229 | <p class=note>The conventions used in the algorithms in this section are those of the JavaScript
1230 | specification. [[!ECMA-262]]
1231 | 
1232 | <p>To <dfn export>parse JSON from bytes</dfn> given <var>bytes</var>, run these steps:
1233 | 
1234 | <ol>
1235 |  <li><p>Let <var>jsonText</var> be the result of running <a>UTF-8 decode</a> on <var>bytes</var>.
1236 |  [[!ENCODING]]
1237 | 
1238 |  <li><p>Return ? <a abstract-op>Call</a>(<a>%JSONParse%</a>, undefined, « <var>jsonText</var> »).
1239 | </ol>
1240 | 
1241 | <p>To <dfn export>serialize JSON to bytes</dfn> given a JavaScript value <var>value</var>, run these
1242 | steps:
1243 | 
1244 | <ol>
1245 |  <li>
1246 |   <p>Let <var>jsonString</var> be
1247 |   ? <a abstract-op>Call</a>(<a>%JSONStringify%</a>, undefined, « <var>value</var> »).
1248 | 
1249 |   <p class=note>Since no additional arguments are passed to <a>%JSONStringify%</a>, the resulting
1250 |   string will have no whitespace inserted.
1251 | 
1252 |  <li><p>Return the result of running <a>UTF-8 encode</a> on <var>jsonString</var>. [[!ENCODING]]
1253 | </ol>
1254 | 
1255 | <hr>
1256 | 
1257 | <p>The above two operations operate on JavaScript values directly; in particular, this means that
1258 | the involved objects or arrays are tied to a particular <a lt="realm">JavaScript realm</a>. In
1259 | standards, it is often more convenient to parse JSON into realm-independent <a>maps</a>,
1260 | <a>lists</a>, <a>strings</a>, <a>booleans</a>, numbers, and nulls.
1261 | 
1262 | <p>To <dfn export>parse JSON into Infra values</dfn>, given a <a>string</a> <var>jsonText</var>:
1263 | 
1264 | <ol>
1265 |  <li><p>Let |jsValue| be ? [$Call$](<a>%JSONParse%</a>, undefined, « |jsonText| »).
1266 | 
1267 |  <li><p>Return the result of [=converting a JSON-derived JavaScript value to an Infra value=], given
1268 |  |jsValue|.
1269 | </ol>
1270 | 
1271 | <p>To <dfn lt="convert a JSON-derived JavaScript value to an Infra value|converting a JSON-derived JavaScript value to an Infra value">convert a JSON-derived JavaScript value to an Infra value</dfn>,
1272 | given a JavaScript value <var>jsValue</var>:
1273 | 
1274 | <ol>
1275 |  <li><p>If [$Type$](|jsValue|) is Null, Boolean, String, or Number, then return |jsValue|.
1276 | 
1277 |  <li>
1278 |   <p>If [$IsArray$](|jsValue|) is true, then:
1279 | 
1280 |    <ol>
1281 |     <li><p>Let |result| be an empty [=list=].
1282 | 
1283 |     <li><p>Let |length| be ! [$ToLength$](! [$Get$](|jsValue|, "<code>length</code>")).
1284 | 
1285 |     <li>
1286 |       <p>[=list/For each=] |index| of [=the range=] 0 to |length| &minus; 1, inclusive:
1287 | 
1288 |       <ol>
1289 |        <li><p>Let |indexName| be ! [$ToString$](|index|).
1290 | 
1291 |        <li><p>Let |jsValueAtIndex| be ! [$Get$](|jsValue|, |indexName|).
1292 | 
1293 |        <li><p>Let |infraValueAtIndex| be the result of [=converting a JSON-derived JavaScript value to an Infra value=],
1294 |        given |jsValueAtIndex|.
1295 | 
1296 |        <li><p>[=list/Append=] |infraValueAtIndex| to |result|.
1297 |       </ol>
1298 |     </li>
1299 | 
1300 |     <li><p>Return |result|.
1301 |    </ol>
1302 |  </li>
1303 | 
1304 |  <li><p>Let |result| be an empty [=ordered map=].
1305 | 
1306 |  <li>
1307 |   <p>[=list/For each=] |key| of ! |jsValue|.\[[OwnPropertyKeys]]():
1308 | 
1309 |    <ol>
1310 |     <li><p>Let |jsValueAtKey| be ! [$Get$](|jsValue|, |key|).
1311 | 
1312 |     <li><p>Let |infraValueAtKey| be the result of [=converting a JSON-derived JavaScript value to an Infra value=],
1313 |     given |jsValueAtKey|.
1314 | 
1315 |     <li><p>[=map/Set=] |result|[|key|] to |infraValueAtKey|.
1316 |    </ol>
1317 |  </li>
1318 | 
1319 |  <li><p>Return |result|.
1320 | </ol>
1321 | 
1322 | 
1323 | <h2 id=forgiving-base64>Forgiving base64</h2>
1324 | 
1325 | <p>To <dfn export>forgiving-base64 encode</dfn> given a <a>byte sequence</a> <var>data</var>, apply
1326 | the base64 algorithm defined in section 4 of RFC 4648 to <var>data</var> and return the result.
1327 | [[!RFC4648]]
1328 | 
1329 | <p class="note no-backref">This is named <a>forgiving-base64 encode</a> for symmetry with
1330 | <a>forgiving-base64 decode</a>, which is different from the RFC as it defines error handling for
1331 | certain inputs.
1332 | 
1333 | <p>To <dfn export>forgiving-base64 decode</dfn> given a string <var>data</var>, run these steps:</p>
1334 | 
1335 | <ol>
1336 |  <li><p>Remove all <a>ASCII whitespace</a> from <var>data</var>.
1337 |  <!-- https://lists.w3.org/Archives/Public/public-whatwg-archive/2011May/0207.html -->
1338 | 
1339 |  <li>
1340 |   <p>If <var>data</var>'s <a for=string>length</a> divides by 4 leaving no remainder, then:
1341 | 
1342 |   <ol>
1343 |    <li><p>If <var>data</var> ends with one or two U+003D (=) <a>code points</a>, then remove them
1344 |    from <var>data</var>.
1345 |   </ol>
1346 | 
1347 |  <li><p>If <var>data</var>'s <a for=string>length</a> divides by 4 leaving a remainder of 1, then
1348 |  return failure.
1349 | 
1350 |  <li>
1351 |   <p>If <var>data</var> contains a <a>code point</a> that is not one of
1352 | 
1353 |   <ul class="brief">
1354 |    <li>U+002B (+)
1355 |    <li>U+002F (/)
1356 |    <li><a>ASCII alphanumeric</a>
1357 |   </ul>
1358 | 
1359 |   <p>then return failure.
1360 | 
1361 |  <li><p>Let <var>output</var> be an empty <a>byte sequence</a>.
1362 | 
1363 |  <li><p>Let <var>buffer</var> be an empty buffer that can have bits appended to it.
1364 | 
1365 |  <li><p>Let <var>position</var> be a <a>position variable</a> for <var>data</var>, initially
1366 |  pointing at the start of <var>data</var>.
1367 | 
1368 |  <li>
1369 |   <p>While <var>position</var> does not point past the end of <var>data</var>:
1370 | 
1371 |   <ol>
1372 |    <li><p>Find the <a>code point</a> pointed to by <var>position</var> in the second column of
1373 |    Table 1: The Base 64 Alphabet of RFC 4648. Let <var>n</var> be the number given in the first cell
1374 |    of the same row. [[!RFC4648]]
1375 | 
1376 |    <li><p>Append the six bits corresponding to <var>n</var>, most significant bit first, to
1377 |    <var>buffer</var>.
1378 | 
1379 |    <li><p>If <var>buffer</var> has accumulated 24 bits, interpret them as three 8-bit big-endian
1380 |    numbers. Append three bytes with values equal to those numbers to <var>output</var>, in the same
1381 |    order, and then empty <var>buffer</var>.
1382 | 
1383 |    <li><p>Advance <var>position</var> by 1.
1384 |   </ol>
1385 | 
1386 |  <li>
1387 |   <p>If <var>buffer</var> is not empty, it contains either 12 or 18 bits. If it contains 12 bits,
1388 |   then discard the last four and interpret the remaining eight as an 8-bit big-endian number. If it
1389 |   contains 18 bits, then discard the last two and interpret the remaining 16 as two 8-bit big-endian
1390 |   numbers. Append the one or two bytes with values equal to those one or two numbers to
1391 |   <var>output</var>, in the same order.</p>
1392 | 
1393 |   <p class="note">The discarded bits mean that, for instance, "<code>YQ</code>" and
1394 |   "<code>YR</code>" both return `<code>a</code>`.
1395 | 
1396 |  <li><p>Return <var>output</var>.
1397 | </ol>
1398 | 
1399 | 
1400 | <h2 id=namespaces>Namespaces</h2>
1401 | 
1402 | <p>The <dfn export>HTML namespace</dfn> is "<code>http://www.w3.org/1999/xhtml</code>".
1403 | 
1404 | <p>The <dfn export>MathML namespace</dfn> is "<code>http://www.w3.org/1998/Math/MathML</code>".
1405 | 
1406 | <p>The <dfn export>SVG namespace</dfn> is "<code>http://www.w3.org/2000/svg</code>".
1407 | 
1408 | <p>The <dfn export>XLink namespace</dfn> is "<code>http://www.w3.org/1999/xlink</code>".
1409 | 
1410 | <p>The <dfn export>XML namespace</dfn> is "<code>http://www.w3.org/XML/1998/namespace</code>".
1411 | 
1412 | <p>The <dfn export>XMLNS namespace</dfn> is "<code>http://www.w3.org/2000/xmlns/</code>".
1413 | 
1414 | 
1415 | <h2 class=no-num id=acknowledgments>Acknowledgments</h2>
1416 | 
1417 | <p>Many thanks to
1418 | Addison Phillips,
1419 | Aryeh Gregor,
1420 | Chris Rebert,
1421 | Daniel Ehrenberg,
1422 | Dominic Farolino,
1423 | Jake Archibald,
1424 | Jeff Hodges,
1425 | Jungkee Song,
1426 | Leonid Vasilyev,
1427 | Maciej Stachowiak,
1428 | Malika Aubakirova,
1429 | Michael™ Smith,
1430 | Mike West,
1431 | Ms2ger,
1432 | Pavel "Al Arz" Kurochkin,
1433 | Philip Jägenstedt,
1434 | Rashaun "Snuggs" Stovall,
1435 | Sergey Shekyan,
1436 | Simon Pieters,
1437 | Tab Atkins,
1438 | Tobie Langel,
1439 | triple-underscore,
1440 | and Xue Fuqiao
1441 | for being awesome!
1442 | 
1443 | <p>This standard is written by <a lang=nl href=https://annevankesteren.nl/>Anne van Kesteren</a>
1444 | (<a href=https://www.mozilla.org/>Mozilla</a>,
1445 | <a href=mailto:annevk@annevk.nl>annevk@annevk.nl</a>) and
1446 | <a href=https://domenic.me/>Domenic Denicola</a> (<a href=https://www.google.com/>Google</a>,
1447 | <a href=mailto:d@domenic.me>d@domenic.me</a>).
1448 | 


--------------------------------------------------------------------------------