├── .clang-format
├── .editorconfig
├── .github
    ├── FUNDING.yml
    ├── ISSUE_TEMPLATE
    │   ├── 1-bug-report.yml
    │   ├── 2-feature-request.yml
    │   └── config.yml
    ├── dependabot.yml
    └── workflows
    │   ├── alpine.yml
    │   ├── cifuzz.yml
    │   ├── codeql.yml
    │   ├── dependency-review.yml
    │   ├── documentation.yml
    │   ├── emscripten.yml
    │   ├── lint_and_format_check.yml
    │   ├── macos_install.yml
    │   ├── pkg.yml
    │   ├── release-script-tests.yml
    │   ├── release_create.yml
    │   ├── release_prepare.yml
    │   ├── scorecard.yml
    │   ├── ubuntu-release.yml
    │   ├── ubuntu-s390x.yml
    │   ├── ubuntu-sanitized.yml
    │   ├── ubuntu-undef.yml
    │   ├── ubuntu.yml
    │   ├── ubuntu_install.yml
    │   ├── ubuntu_pedantic.yml
    │   ├── visual_studio.yml
    │   ├── visual_studio_clang.yml
    │   └── wpt-updater.yml
├── .gitignore
├── .python-version
├── CMakeLists.txt
├── LICENSE-APACHE
├── LICENSE-MIT
├── README.md
├── SECURITY.md
├── ada.pc.in
├── benchmarks
    ├── CMakeLists.txt
    ├── bbc_bench.cpp
    ├── bench.cpp
    ├── bench_search_params.cpp
    ├── benchmark_header.h
    ├── benchmark_template.cpp
    ├── competitors
    │   └── servo-url
    │   │   ├── Cargo.lock
    │   │   ├── Cargo.toml
    │   │   ├── README.md
    │   │   ├── cbindgen.toml
    │   │   ├── lib.rs
    │   │   └── servo_url.h
    ├── model_bench.cpp
    ├── percent_encode.cpp
    ├── performancecounters
    │   ├── apple_arm_events.h
    │   ├── event_counter.h
    │   └── linux-perf-events.h
    ├── urlpattern.cpp
    └── wpt_bench.cpp
├── cmake
    ├── CPM.cmake
    ├── JoinPaths.cmake
    ├── ada-config.cmake.in
    ├── ada-flags.cmake
    ├── add-cpp-test.cmake
    └── codecoverage.cmake
├── docs
    ├── RELEASE.md
    ├── cli.md
    └── doxygen
    │   ├── footer.html
    │   └── header.html
├── doxygen
├── fuzz
    ├── ada_c.c
    ├── ada_c.options
    ├── build.sh
    ├── can_parse.cc
    ├── idna.cc
    ├── parse.cc
    ├── parse.options
    ├── url.dict
    ├── url_pattern.cc
    ├── url_pattern.options
    └── url_search_params.cc
├── include
    ├── ada.h
    ├── ada
    │   ├── ada_idna.h
    │   ├── ada_version.h
    │   ├── character_sets-inl.h
    │   ├── character_sets.h
    │   ├── checkers-inl.h
    │   ├── checkers.h
    │   ├── common_defs.h
    │   ├── encoding_type.h
    │   ├── errors.h
    │   ├── expected.h
    │   ├── helpers.h
    │   ├── implementation-inl.h
    │   ├── implementation.h
    │   ├── log.h
    │   ├── parser-inl.h
    │   ├── parser.h
    │   ├── scheme-inl.h
    │   ├── scheme.h
    │   ├── serializers.h
    │   ├── state.h
    │   ├── unicode-inl.h
    │   ├── unicode.h
    │   ├── url-inl.h
    │   ├── url.h
    │   ├── url_aggregator-inl.h
    │   ├── url_aggregator.h
    │   ├── url_base-inl.h
    │   ├── url_base.h
    │   ├── url_components-inl.h
    │   ├── url_components.h
    │   ├── url_pattern-inl.h
    │   ├── url_pattern.h
    │   ├── url_pattern_helpers-inl.h
    │   ├── url_pattern_helpers.h
    │   ├── url_pattern_init.h
    │   ├── url_pattern_regex.h
    │   ├── url_search_params-inl.h
    │   └── url_search_params.h
    └── ada_c.h
├── pyproject.toml
├── singleheader
    ├── CMakeLists.txt
    ├── README.md
    ├── amalgamate.py
    ├── demo.c
    └── demo.cpp
├── src
    ├── CMakeLists.txt
    ├── ada.cpp
    ├── ada_c.cpp
    ├── ada_idna.cpp
    ├── checkers.cpp
    ├── helpers.cpp
    ├── implementation.cpp
    ├── parser.cpp
    ├── serializers.cpp
    ├── unicode.cpp
    ├── url.cpp
    ├── url_aggregator.cpp
    ├── url_components.cpp
    ├── url_pattern.cpp
    ├── url_pattern_helpers.cpp
    └── url_pattern_regex.cpp
├── tests
    ├── CMakeLists.txt
    ├── ada_c.cpp
    ├── basic_fuzzer.cpp
    ├── basic_tests.cpp
    ├── from_file_tests.cpp
    ├── installation
    │   └── CMakeLists.txt
    ├── url_components.cpp
    ├── url_search_params.cpp
    ├── wasm
    │   ├── CMakeLists.txt
    │   ├── test.js.in
    │   └── wasm.cpp
    ├── wpt
    │   ├── CMakeLists.txt
    │   ├── IdnaTestV2-removed.json
    │   ├── IdnaTestV2.json
    │   ├── ada_extra_setters_tests.json
    │   ├── ada_extra_urltestdata.json
    │   ├── ada_long_urltestdata.json
    │   ├── percent-encoding.json
    │   ├── setters_tests.json
    │   ├── toascii.json
    │   ├── urlpattern-compare-test-data.json
    │   ├── urlpatterntestdata.json
    │   ├── urltestdata-javascript-only.json
    │   ├── urltestdata.json
    │   └── verifydnslength_tests.json
    ├── wpt_url_tests.cpp
    └── wpt_urlpattern_tests.cpp
└── tools
    ├── CMakeLists.txt
    ├── cli
        ├── CMakeLists.txt
        ├── adaparse.cpp
        ├── benchmark_adaparse.sh
        ├── benchmark_write_to_file.sh
        └── line_iterator.h
    ├── prepare-doxygen.sh
    ├── release
        ├── __init__.py
        ├── create_release.py
        ├── lib
        │   ├── __init__.py
        │   ├── release.py
        │   ├── tests
        │   │   ├── __init__.py
        │   │   ├── samples
        │   │   │   ├── ada_version_h.txt
        │   │   │   ├── ada_version_h_expected.txt
        │   │   │   ├── cmakelists.txt
        │   │   │   ├── cmakelists_expected.txt
        │   │   │   ├── doxygen.txt
        │   │   │   └── doxygen_expected.txt
        │   │   ├── test_release.py
        │   │   └── test_update_versions.py
        │   └── versions.py
        ├── requirements.txt
        └── update_versions.py
    ├── run-clangcldocker.sh
    └── update-wpt.sh


/.clang-format:
--------------------------------------------------------------------------------
1 | BasedOnStyle: Google
2 | SortIncludes: Never
3 | 


--------------------------------------------------------------------------------
/.editorconfig:
--------------------------------------------------------------------------------
1 | root = true
2 | 
3 | [*]
4 | end_of_line = lf
5 | insert_final_newline = true
6 | indent_size = 2
7 | indent_style = space
8 | 


--------------------------------------------------------------------------------
/.github/FUNDING.yml:
--------------------------------------------------------------------------------
1 | github: [anonrig, lemire]
2 | 


--------------------------------------------------------------------------------
/.github/ISSUE_TEMPLATE/1-bug-report.yml:
--------------------------------------------------------------------------------
 1 | name: 🐛 Bug report
 2 | description: Create a report to help us improve
 3 | body:
 4 |   - type: markdown
 5 |     attributes:
 6 |       value: |
 7 |         Thank you for reporting an issue.
 8 | 
 9 |         Please fill in as much of the following form as you're able.
10 |   - type: input
11 |     attributes:
12 |       label: Version
13 |       description: Which Ada version are you referring to?
14 |   - type: input
15 |     attributes:
16 |       label: Platform
17 |       description: |
18 |         UNIX: output of `uname -a`
19 |         Windows: output of `"$([Environment]::OSVersion.VersionString) $(('x86', 'x64')[[Environment]::Is64BitOperatingSystem])"` in PowerShell console
20 |   - type: textarea
21 |     attributes:
22 |       label: What steps will reproduce the bug?
23 |       description: Enter details about your bug, preferably a simple code snippet that can be run directly without installing third-party dependencies.
24 |   - type: textarea
25 |     attributes:
26 |       label: How often does it reproduce? Is there a required condition?
27 |   - type: textarea
28 |     attributes:
29 |       label: What is the expected behavior?
30 |       description: If possible please provide textual output instead of screenshots.
31 |   - type: textarea
32 |     attributes:
33 |       label: What do you see instead?
34 |       description: If possible please provide textual output instead of screenshots.
35 |     validations:
36 |       required: true
37 |   - type: textarea
38 |     attributes:
39 |       label: Additional information
40 |       description: Tell us anything else you think we should know.
41 | 


--------------------------------------------------------------------------------
/.github/ISSUE_TEMPLATE/2-feature-request.yml:
--------------------------------------------------------------------------------
 1 | name: 🚀 Feature request
 2 | description: Suggest an idea for this project
 3 | labels: [feature request]
 4 | body:
 5 |   - type: markdown
 6 |     attributes:
 7 |       value: |
 8 |         Thank you for suggesting an idea to make Ada better.
 9 | 
10 |         Please fill in as much of the following form as you're able.
11 |   - type: textarea
12 |     attributes:
13 |       label: What is the problem this feature will solve?
14 |     validations:
15 |       required: true
16 |   - type: textarea
17 |     attributes:
18 |       label: What is the feature you are proposing to solve the problem?
19 |     validations:
20 |       required: true
21 |   - type: textarea
22 |     attributes:
23 |       label: What alternatives have you considered?
24 | 


--------------------------------------------------------------------------------
/.github/ISSUE_TEMPLATE/config.yml:
--------------------------------------------------------------------------------
1 | blank_issues_enabled: true
2 | contact_links:
3 |   - name: Looking for documentation?
4 |     url: https://ada-url.github.io/ada
5 |     about: Please navigate to our documentation website.
6 | 


--------------------------------------------------------------------------------
/.github/dependabot.yml:
--------------------------------------------------------------------------------
 1 | # Set update schedule for GitHub Actions
 2 | 
 3 | version: 2
 4 | updates:
 5 |   - package-ecosystem: github-actions
 6 |     directory: /
 7 |     schedule:
 8 |       interval: monthly
 9 | 
10 |   - package-ecosystem: cargo
11 |     directory: /benchmarks/competitors/servo-url
12 |     schedule:
13 |       interval: monthly
14 | 
15 |   - package-ecosystem: pip
16 |     directory: /tools/release
17 |     schedule:
18 |       interval: monthly
19 | 


--------------------------------------------------------------------------------
/.github/workflows/alpine.yml:
--------------------------------------------------------------------------------
 1 | name: Alpine Linux
 2 | 
 3 | on:
 4 |   pull_request:
 5 |     types: [opened, synchronize, reopened, ready_for_review]
 6 |     paths-ignore:
 7 |       - '**.md'
 8 |       - 'docs/**'
 9 |   push:
10 |     branches:
11 |       - main
12 |     paths-ignore:
13 |       - '**.md'
14 |       - 'docs/**'
15 | 
16 | permissions:
17 |   contents: read
18 | 
19 | concurrency:
20 |   group: ${{ github.workflow }}-${{ github.ref }}
21 |   cancel-in-progress: true
22 | 
23 | jobs:
24 |   ubuntu-build:
25 |     runs-on: ubuntu-latest
26 |     steps:
27 |       - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
28 |       - name: start docker
29 |         run: |
30 |           docker run -w /src -dit --name alpine -v $PWD:/src alpine:latest
31 |           echo 'docker exec alpine "$@";' > ./alpine.sh
32 |           chmod +x ./alpine.sh
33 |       - name: install packages
34 |         run: |
35 |           ./alpine.sh apk update
36 |           ./alpine.sh apk add build-base cmake g++ linux-headers git bash icu-dev
37 |       - name: cmake
38 |         run: |
39 |           ./alpine.sh cmake -D ADA_TESTING=ON -DADA_BENCHMARKS=ON -B build_for_alpine
40 |       - name: build
41 |         run: |
42 |           ./alpine.sh cmake --build build_for_alpine
43 |       - name: test
44 |         run: |
45 |           ./alpine.sh bash -c "cd build_for_alpine && ctest  ."
46 | 


--------------------------------------------------------------------------------
/.github/workflows/cifuzz.yml:
--------------------------------------------------------------------------------
 1 | name: CIFuzz
 2 | 
 3 | on:
 4 |   pull_request:
 5 |     branches:
 6 |       - main
 7 | 
 8 | concurrency:
 9 |   group: ${{ github.workflow }}-${{ github.ref }}
10 |   cancel-in-progress: true
11 | 
12 | permissions: read-all
13 | 
14 | jobs:
15 |   Fuzzing:
16 |     runs-on: ubuntu-latest
17 |     strategy:
18 |       fail-fast: false
19 |       matrix:
20 |         sanitizer: [address, undefined, memory]
21 |     steps:
22 |       - name: Build Fuzzers (${{ matrix.sanitizer }})
23 |         id: build
24 |         uses: google/oss-fuzz/infra/cifuzz/actions/build_fuzzers@master
25 |         with:
26 |          oss-fuzz-project-name: 'ada-url'
27 |          language: c++
28 |          sanitizer: ${{ matrix.sanitizer }}
29 |       - name: Run Fuzzers (${{ matrix.sanitizer }})
30 |         uses: google/oss-fuzz/infra/cifuzz/actions/run_fuzzers@master
31 |         with:
32 |          oss-fuzz-project-name: 'ada-url'
33 |          language: c++
34 |          fuzz-seconds: 600
35 |          sanitizer: ${{ matrix.sanitizer }}
36 |       - name: Upload Crash
37 |         uses: actions/upload-artifact@ea165f8d65b6e75b540449e92b4886f43607fa02 # v4.6.2
38 |         if: steps.build.outcome == 'success'
39 |         with:
40 |           name: ${{ matrix.sanitizer }}-artifacts
41 |           path: ./out/artifacts
42 | 


--------------------------------------------------------------------------------
/.github/workflows/codeql.yml:
--------------------------------------------------------------------------------
 1 | name: "CodeQL"
 2 | 
 3 | on:
 4 |   schedule:
 5 |     - cron: '0 0 * * 1'
 6 | 
 7 | permissions:
 8 |   contents: read
 9 |   security-events: write
10 |   pull-requests: read
11 |   actions: read
12 | 
13 | jobs:
14 |   analyze:
15 |     name: Analyze
16 | 
17 |     runs-on: ubuntu-latest
18 | 
19 |     permissions:
20 |       actions: read
21 |       contents: read
22 |       security-events: write
23 | 
24 |     strategy:
25 |       fail-fast: false
26 |       matrix:
27 |         language: [ 'cpp', 'python' ]
28 | 
29 |     steps:
30 |       - name: Checkout repository
31 |         uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
32 | 
33 |       # Initializes the CodeQL tools for scanning.
34 |       - name: Initialize CodeQL
35 |         uses: github/codeql-action/init@ff0a06e83cb2de871e5a09832bc6a81e7276941f # v3.28.18
36 |         with:
37 |           languages: ${{ matrix.language }}
38 | 
39 |       # Autobuild attempts to build any compiled languages  (C/C++, C#, Go, or Java).
40 |       # If this step fails, then you should remove it and run the build manually (see below)
41 |       - name: Autobuild
42 |         uses: github/codeql-action/autobuild@ff0a06e83cb2de871e5a09832bc6a81e7276941f # v3.28.18
43 | 
44 |       - name: Perform CodeQL Analysis
45 |         uses: github/codeql-action/analyze@ff0a06e83cb2de871e5a09832bc6a81e7276941f # v3.28.18
46 |         with:
47 |           category: "/language:${{matrix.language}}"
48 | 


--------------------------------------------------------------------------------
/.github/workflows/dependency-review.yml:
--------------------------------------------------------------------------------
 1 | name: 'Dependency Review'
 2 | 
 3 | on: [pull_request]
 4 | 
 5 | permissions:
 6 |   contents: read
 7 | 
 8 | jobs:
 9 |   dependency-review:
10 |     runs-on: ubuntu-latest
11 |     steps:
12 |       - name: 'Checkout Repository'
13 |         uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
14 |       - name: 'Dependency Review'
15 |         uses: actions/dependency-review-action@da24556b548a50705dd671f47852072ea4c105d9 # v4.7.1
16 | 


--------------------------------------------------------------------------------
/.github/workflows/documentation.yml:
--------------------------------------------------------------------------------
 1 | name: Doxygen GitHub Pages
 2 | 
 3 | on:
 4 |   release:
 5 |     types: [created]
 6 |   # Allows you to run this workflow manually from the Actions tab
 7 |   workflow_dispatch:
 8 | 
 9 | concurrency:
10 |   group: ${{ github.workflow }}-${{ github.ref }}
11 |   cancel-in-progress: true
12 | 
13 | permissions:
14 |   contents: read
15 | 
16 | jobs:
17 |   deploy:
18 |     permissions:
19 |       contents: write
20 |       pages: write
21 |       id-token: write
22 |     runs-on: ubuntu-latest
23 |     steps:
24 |       - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
25 |       - name: Install theme
26 |         run: ./tools/prepare-doxygen.sh
27 |       - uses: mattnotmitt/doxygen-action@ded75d963c260fd8489801611a5079d149ebcc07 # edge
28 |         with:
29 |           doxyfile-path: './doxygen'
30 |       - name: Deploy to GitHub Pages
31 |         uses: peaceiris/actions-gh-pages@4f9cc6602d3f66b9c108549d475ec49e8ef4d45e # v4.0.0
32 |         with:
33 |           github_token: ${{ secrets.GITHUB_TOKEN }}
34 |           publish_dir: docs/html
35 | 


--------------------------------------------------------------------------------
/.github/workflows/emscripten.yml:
--------------------------------------------------------------------------------
 1 | name: emscripten
 2 | 
 3 | on:
 4 |   pull_request:
 5 |     types: [opened, synchronize, reopened, ready_for_review]
 6 |     paths-ignore:
 7 |       - '**.md'
 8 |       - 'docs/**'
 9 |   push:
10 |     branches:
11 |       - main
12 |     paths-ignore:
13 |       - '**.md'
14 |       - 'docs/**'
15 | 
16 | permissions:
17 |   contents: read
18 | 
19 | concurrency:
20 |   group: ${{ github.workflow }}-${{ github.ref }}
21 |   cancel-in-progress: true
22 | 
23 | jobs:
24 |   build:
25 |     runs-on: ubuntu-latest
26 |     steps:
27 |       - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
28 |       - uses: actions/setup-node@49933ea5288caeca8642d1e84afbd3f7d6820020 # v4.4.0
29 |       - uses: mymindstorm/setup-emsdk@6ab9eb1bda2574c4ddb79809fc9247783eaf9021 # v14
30 |       - name: Verify
31 |         run: emcc -v
32 |       - name: Checkout
33 |         uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
34 |       - name: Configure
35 |         run: emcmake cmake -B buildwasm -D ADA_TESTING=ON -D ADA_TOOLS=OFF
36 |       - name: Build
37 |         run: cmake --build buildwasm
38 |       - name: Test
39 |         run: ctest --test-dir buildwasm
40 | 


--------------------------------------------------------------------------------
/.github/workflows/lint_and_format_check.yml:
--------------------------------------------------------------------------------
 1 | name: Lint and format
 2 | 
 3 | on:
 4 |   pull_request:
 5 |     types: [opened, synchronize, reopened, ready_for_review]
 6 |     paths-ignore:
 7 |       - '**.md'
 8 |       - 'docs/**'
 9 |   push:
10 |     branches:
11 |       - main
12 |     paths-ignore:
13 |       - '**.md'
14 |       - 'docs/**'
15 | 
16 | permissions:
17 |   contents: read
18 | 
19 | concurrency:
20 |   group: ${{ github.workflow }}-${{ github.ref }}
21 |   cancel-in-progress: true
22 | 
23 | jobs:
24 |   lint-and-format:
25 |     runs-on: ubuntu-latest
26 |     steps:
27 |       - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
28 | 
29 |       - name: Run clang-format
30 |         uses: jidicula/clang-format-action@4726374d1aa3c6aecf132e5197e498979588ebc8 # v4.15.0
31 |         with:
32 |           clang-format-version: '17'
33 |           fallback-style: 'Google'
34 | 
35 |       - uses: chartboost/ruff-action@e18ae971ccee1b2d7bbef113930f00c670b78da4 # v1.0.0
36 |         name: Lint with Ruff
37 |         with:
38 |           version: 0.6.0
39 | 


--------------------------------------------------------------------------------
/.github/workflows/macos_install.yml:
--------------------------------------------------------------------------------
 1 | name: macOS (Installation)
 2 | 
 3 | on:
 4 |   pull_request:
 5 |     types: [opened, synchronize, reopened, ready_for_review]
 6 |     paths-ignore:
 7 |       - '**.md'
 8 |       - 'docs/**'
 9 |   push:
10 |     branches:
11 |       - main
12 |     paths-ignore:
13 |       - '**.md'
14 |       - 'docs/**'
15 | 
16 | permissions:
17 |   contents: read
18 | 
19 | concurrency:
20 |   group: ${{ github.workflow }}-${{ github.ref }}
21 |   cancel-in-progress: true
22 | 
23 | jobs:
24 |   macos-build:
25 |     strategy:
26 |       fail-fast: false
27 |       matrix:
28 |         shared: [OFF]
29 |         runs-on: [macos-13, macos-14, macos-15]
30 |     runs-on: ${{matrix.runs-on}}
31 |     steps:
32 |       - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
33 |       - name: Prepare
34 |         run: cmake -D ADA_TESTING=ON -DBUILD_SHARED_LIBS=${{matrix.shared}} -DCMAKE_INSTALL_PREFIX:PATH=destination -B build
35 |       - name: Build
36 |         run: cmake --build build -j=3
37 |       - name: Install
38 |         run: cmake --install build
39 |       - name: Prepare test package
40 |         run: cmake -DCMAKE_INSTALL_PREFIX:PATH=../../destination -S tests/installation -B buildbabyada
41 |       - name: Build test package
42 |         run: cmake --build buildbabyada
43 |       - name: Run example
44 |         run: ./buildbabyada/main
45 | 


--------------------------------------------------------------------------------
/.github/workflows/pkg.yml:
--------------------------------------------------------------------------------
 1 | name: Debian pkg-config
 2 | 
 3 | on: [push, pull_request]
 4 | 
 5 | permissions:
 6 |   contents: read
 7 | 
 8 | jobs:
 9 |   pkg-config:
10 |     runs-on: ubuntu-latest
11 |     container:
12 |       image: debian:12
13 | 
14 |     steps:
15 |     - uses: actions/checkout@v4
16 | 
17 |     - name: Install dependencies
18 |       run: |
19 |         apt -y update
20 |         apt -y --no-install-recommends install g++ cmake make pkg-config
21 | 
22 |     - name: Build and install
23 |       run: |
24 |         cmake -B build
25 |         cmake --build build
26 |         cmake --install build
27 | 
28 |     - name: Test pkg-config
29 |       run: pkg-config --cflags --libs ada
30 | 


--------------------------------------------------------------------------------
/.github/workflows/release-script-tests.yml:
--------------------------------------------------------------------------------
 1 | name: Release Script Tests
 2 | 
 3 | on:
 4 |   # workflow_call is used to indicate that a workflow can be called by another workflow.
 5 |   workflow_call:
 6 |   pull_request:
 7 |     types: [opened, synchronize, reopened, ready_for_review]
 8 |     paths-ignore:
 9 |       - '**.md'
10 |       - 'docs/**'
11 |   push:
12 |     branches:
13 |       - main
14 |     paths-ignore:
15 |       - '**.md'
16 |       - 'docs/**'
17 | 
18 | permissions:
19 |   contents: read
20 | 
21 | jobs:
22 |   release-script-test:
23 |     runs-on: ubuntu-latest
24 |     defaults:
25 |       run:
26 |         working-directory: ./tools/release
27 | 
28 |     steps:
29 |       - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
30 | 
31 |       - name: Prepare Python
32 |         uses: actions/setup-python@a26af69be951a213d495a4c3e4e4022e16d87065 # v5.6.0
33 |         with:
34 |           cache: 'pip' # caching pip dependencies
35 | 
36 |       - name: Install dependencies
37 |         run: pip install -r requirements.txt
38 | 
39 |       - name: Run tests
40 |         run: pytest -v
41 | 


--------------------------------------------------------------------------------
/.github/workflows/release_create.yml:
--------------------------------------------------------------------------------
 1 | name: Release Create
 2 | 
 3 | on:
 4 |   pull_request:
 5 |     types: [closed]
 6 | 
 7 | env:
 8 |   GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
 9 | 
10 | jobs:
11 |   check-release-conditions:
12 |     runs-on: ubuntu-latest
13 |     if: |
14 |       github.event.pull_request.merged == true &&
15 |       github.event.pull_request.base.ref == 'main' &&
16 |       startsWith(github.event.pull_request.head.ref, 'release/v') &&
17 |       startsWith(github.event.pull_request.user.login, 'github-actions')
18 | 
19 |     steps:
20 |       - name: Check release conditions
21 |         run: |
22 |           echo "All conditions have been met!"
23 | 
24 |   release-script-test:
25 |     needs: check-release-conditions
26 |     uses: ./.github/workflows/release-script-tests.yml
27 | 
28 |   create-release:
29 |     permissions:
30 |       contents: write
31 |     needs: release-script-test
32 |     runs-on: ubuntu-latest
33 |     if: ${{ needs.release-script-test.result == 'success' }}
34 | 
35 |     env:
36 |       NEXT_RELEASE_TAG: ${{ github.event.pull_request.head.ref }}
37 |     steps:
38 |       - name: Checkout
39 |         uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
40 | 
41 |       - name: Prepare Python
42 |         uses: actions/setup-python@a26af69be951a213d495a4c3e4e4022e16d87065 # v5.6.0
43 |         with:
44 |           cache: 'pip' # caching pip dependencies
45 | 
46 |       - name: Install dependencies
47 |         run: pip install -r ./tools/release/requirements.txt
48 | 
49 |       - name: Extract Tag from branch name
50 |         run: |
51 |           NEXT_RELEASE_TAG=$(echo $NEXT_RELEASE_TAG | sed 's/^release\///')
52 |           echo "NEXT_RELEASE_TAG=${NEXT_RELEASE_TAG}" >> $GITHUB_ENV
53 | 
54 |       - name: Target release Tag
55 |         run: echo "New tag $NEXT_RELEASE_TAG"
56 | 
57 |       - name: Amalgamation
58 |         run: ./singleheader/amalgamate.py
59 | 
60 |       - name: "Create release"
61 |         run: ./tools/release/create_release.py
62 | 


--------------------------------------------------------------------------------
/.github/workflows/release_prepare.yml:
--------------------------------------------------------------------------------
 1 | name: Release Prepare
 2 | 
 3 | on:
 4 |   workflow_dispatch:
 5 |     inputs:
 6 |       tag:
 7 |         type: string
 8 |         required: true
 9 |         description: "Tag for the next release. Ex.: v5.0.0"
10 | 
11 | env:
12 |   NEXT_RELEASE_TAG: ${{ github.event.inputs.tag }}
13 |   GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
14 | 
15 | jobs:
16 |   release-script-test:
17 |     uses: ./.github/workflows/release-script-tests.yml
18 | 
19 |   prepare-release-and-pull-request:
20 |     permissions:
21 |       contents: write
22 |       pull-requests: write
23 |     needs: release-script-test
24 |     runs-on: ubuntu-22.04-arm
25 |     if: ${{ needs.release-script-test.result == 'success' }}
26 |     env:
27 |       CXX: clang++-14
28 |     steps:
29 |       - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
30 | 
31 |       - name: Prepare Python
32 |         uses: actions/setup-python@a26af69be951a213d495a4c3e4e4022e16d87065 # v5.6.0
33 |         with:
34 |           cache: 'pip' # caching pip dependencies
35 | 
36 |       - name: Install dependencies
37 |         run: pip install -r ./tools/release/requirements.txt
38 | 
39 |       - name: Update source code versions
40 |         run: ./tools/release/update_versions.py
41 | 
42 |       - name: Ada Build
43 |         run: cmake -B build && cmake --build build
44 |       - name: Ada Test
45 |         run: ctest --output-on-failure --test-dir build
46 | 
47 |       - name: Create PR with code updates for new release
48 |         uses: peter-evans/create-pull-request@f3a21bf3404eae73a97f65817ab35f351a1a63fe #v5.0.0
49 |         with:
50 |           commit-message: "chore: release ${{ env.NEXT_RELEASE_TAG }}"
51 |           branch: "release/${{ env.NEXT_RELEASE_TAG }}"
52 |           title: "chore: release ${{ env.NEXT_RELEASE_TAG }}"
53 |           token: ${{ env.GITHUB_TOKEN }}
54 |           body: |
55 |             This PR updates the source code version to ${{ env.NEXT_RELEASE_TAG }}
56 |           delete-branch: true
57 |           reviewers: "lemire,anonrig"
58 | 


--------------------------------------------------------------------------------
/.github/workflows/scorecard.yml:
--------------------------------------------------------------------------------
 1 | # This workflow uses actions that are not certified by GitHub. They are provided
 2 | # by a third-party and are governed by separate terms of service, privacy
 3 | # policy, and support documentation.
 4 | 
 5 | name: Scorecard supply-chain security
 6 | on:
 7 |   # For Branch-Protection check. Only the default branch is supported. See
 8 |   # https://github.com/ossf/scorecard/blob/main/docs/checks.md#branch-protection
 9 |   branch_protection_rule:
10 |   # To guarantee Maintained check is occasionally updated. See
11 |   # https://github.com/ossf/scorecard/blob/main/docs/checks.md#maintained
12 |   schedule:
13 |     - cron: '0 0 * * 1'
14 | 
15 | # Declare default permissions as read only.
16 | permissions: read-all
17 | 
18 | jobs:
19 |   analysis:
20 |     name: Scorecard analysis
21 |     runs-on: ubuntu-latest
22 |     permissions:
23 |       # Needed to upload the results to code-scanning dashboard.
24 |       security-events: write
25 |       # Needed to publish results and get a badge (see publish_results below).
26 |       id-token: write
27 |       # Uncomment the permissions below if installing in a private repository.
28 |       # contents: read
29 |       # actions: read
30 | 
31 |     steps:
32 |       - name: "Checkout code"
33 |         uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
34 |         with:
35 |           persist-credentials: false
36 | 
37 |       - name: "Run analysis"
38 |         uses: ossf/scorecard-action@05b42c624433fc40578a4040d5cf5e36ddca8cde # v2.4.2
39 |         with:
40 |           results_file: results.sarif
41 |           results_format: sarif
42 |           # (Optional) "write" PAT token. Uncomment the `repo_token` line below if:
43 |           # - you want to enable the Branch-Protection check on a *public* repository, or
44 |           # - you are installing Scorecard on a *private* repository
45 |           # To create the PAT, follow the steps in https://github.com/ossf/scorecard-action#authentication-with-fine-grained-pat-optional.
46 |           # repo_token: ${{ secrets.SCORECARD_TOKEN }}
47 | 
48 |           # Public repositories:
49 |           #   - Publish results to OpenSSF REST API for easy access by consumers
50 |           #   - Allows the repository to include the Scorecard badge.
51 |           #   - See https://github.com/ossf/scorecard-action#publishing-results.
52 |           # For private repositories:
53 |           #   - `publish_results` will always be set to `false`, regardless
54 |           #     of the value entered here.
55 |           publish_results: true
56 | 
57 |       # Upload the results as artifacts (optional). Commenting out will disable uploads of run results in SARIF
58 |       # format to the repository Actions tab.
59 |       - name: "Upload artifact"
60 |         uses: actions/upload-artifact@ea165f8d65b6e75b540449e92b4886f43607fa02 # v4.6.2
61 |         with:
62 |           name: SARIF file
63 |           path: results.sarif
64 |           retention-days: 5
65 | 
66 |       # Upload the results to GitHub's code scanning dashboard.
67 |       - name: "Upload to code-scanning"
68 |         uses: github/codeql-action/upload-sarif@ff0a06e83cb2de871e5a09832bc6a81e7276941f # v3.28.18
69 |         with:
70 |           sarif_file: results.sarif
71 | 


--------------------------------------------------------------------------------
/.github/workflows/ubuntu-release.yml:
--------------------------------------------------------------------------------
 1 | name: Ubuntu 22.04 (Release build)
 2 | 
 3 | on:
 4 |   pull_request:
 5 |     types: [opened, synchronize, reopened, ready_for_review]
 6 |     paths-ignore:
 7 |       - '**.md'
 8 |       - 'docs/**'
 9 |   push:
10 |     branches:
11 |       - main
12 |     paths-ignore:
13 |       - '**.md'
14 |       - 'docs/**'
15 | 
16 | permissions:
17 |   contents: read
18 | 
19 | concurrency:
20 |   group: ${{ github.workflow }}-${{ github.ref }}
21 |   cancel-in-progress: true
22 | 
23 | jobs:
24 |   ubuntu-release-build:
25 |     runs-on: ubuntu-22.04
26 |     strategy:
27 |       matrix:
28 |         cxx: [g++-12, clang++-14]
29 |     steps:
30 |       - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
31 |       - name: Setup Ninja
32 |         run: sudo apt-get install ninja-build
33 |       - name: Prepare
34 |         run: cmake -DBUILD_TESTING=OFF -DCMAKE_BUILD_TYPE=Release -G Ninja -B build
35 |         env:
36 |           CXX: ${{matrix.cxx}}
37 |       - name: Build
38 |         run: cmake --build build -j=4
39 |       - name: Test
40 |         run: ctest --output-on-failure --test-dir build
41 | 


--------------------------------------------------------------------------------
/.github/workflows/ubuntu-s390x.yml:
--------------------------------------------------------------------------------
 1 | name: Ubuntu s390x (GCC 12)
 2 | 
 3 | on:
 4 |   pull_request:
 5 |     types: [opened, synchronize, reopened, ready_for_review]
 6 |     paths-ignore:
 7 |       - '**.md'
 8 |       - 'docs/**'
 9 |   push:
10 |     branches:
11 |       - main
12 |     paths-ignore:
13 |       - '**.md'
14 |       - 'docs/**'
15 | 
16 | permissions:
17 |   contents: read
18 | 
19 | concurrency:
20 |   group: ${{ github.workflow }}-${{ github.ref }}
21 |   cancel-in-progress: true
22 | 
23 | jobs:
24 |   build:
25 |     runs-on: ubuntu-latest
26 |     steps:
27 |       - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
28 |       - uses: uraimo/run-on-arch-action@d94c13912ea685de38fccc1109385b83fd79427d # v3.0.1
29 |         name: Test
30 |         id: runcmd
31 |         with:
32 |           arch: s390x
33 |           distro: ubuntu_latest
34 |           githubToken: ${{ github.token }}
35 |           install: |
36 |             apt-get update -q -y
37 |             apt-get install -y cmake make g++-12 gcc-12 git ninja-build
38 |           run: |
39 |             CC=gcc-12 CXX=g++-12 cmake -D ADA_TESTING=ON -DCMAKE_BUILD_TYPE=Release -G Ninja -B build
40 |             rm -r -f dependencies
41 |             CC=gcc-12 CXX=g++-12 cmake --build build -j=4
42 |             ctest --output-on-failure --test-dir build
43 | 


--------------------------------------------------------------------------------
/.github/workflows/ubuntu-sanitized.yml:
--------------------------------------------------------------------------------
 1 | name: Ubuntu 22.04 (GCC 12 SANITIZED)
 2 | 
 3 | on:
 4 |   pull_request:
 5 |     types: [opened, synchronize, reopened, ready_for_review]
 6 |     paths-ignore:
 7 |       - '**.md'
 8 |       - 'docs/**'
 9 |   push:
10 |     branches:
11 |       - main
12 |     paths-ignore:
13 |       - '**.md'
14 |       - 'docs/**'
15 | 
16 | permissions:
17 |   contents: read
18 | 
19 | concurrency:
20 |   group: ${{ github.workflow }}-${{ github.ref }}
21 |   cancel-in-progress: true
22 | 
23 | jobs:
24 |   ubuntu-build:
25 |     runs-on: ubuntu-22.04
26 |     strategy:
27 |       matrix:
28 |         shared: [ON, OFF]
29 |     steps:
30 |       - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
31 |       - name: Setup Ninja
32 |         run: sudo apt-get install ninja-build
33 |       - name: Prepare
34 |         run: cmake -D ADA_TESTING=ON -DADA_SANITIZE=ON -DADA_DEVELOPMENT_CHECKS=ON -DBUILD_SHARED_LIBS=${{matrix.shared}} -G Ninja -B build
35 |         env:
36 |           CXX: g++-12
37 |       - name: Build
38 |         run: cmake --build build -j=4
39 |       - name: Test
40 |         run: ctest --output-on-failure --test-dir build
41 | 


--------------------------------------------------------------------------------
/.github/workflows/ubuntu-undef.yml:
--------------------------------------------------------------------------------
 1 | name: Ubuntu 22.04 (GCC 12 SANITIZE UNDEFINED)
 2 | 
 3 | on:
 4 |   pull_request:
 5 |     types: [opened, synchronize, reopened, ready_for_review]
 6 |     paths-ignore:
 7 |       - '**.md'
 8 |       - 'docs/**'
 9 |   push:
10 |     branches:
11 |       - main
12 |     paths-ignore:
13 |       - '**.md'
14 |       - 'docs/**'
15 | 
16 | permissions:
17 |   contents: read
18 | 
19 | concurrency:
20 |   group: ${{ github.workflow }}-${{ github.ref }}
21 |   cancel-in-progress: true
22 | 
23 | jobs:
24 |   ubuntu-build:
25 |     runs-on: ubuntu-22.04
26 |     strategy:
27 |       matrix:
28 |         shared: [ON, OFF]
29 |     steps:
30 |       - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
31 |       - name: Setup Ninja
32 |         run: sudo apt-get install ninja-build
33 |       - name: Prepare
34 |         run: cmake -D ADA_TESTING=ON -D ADA_SANITIZE_UNDEFINED=ON -DADA_DEVELOPMENT_CHECKS=ON -DBUILD_SHARED_LIBS=${{matrix.shared}} -G Ninja -B build
35 |         env:
36 |           CXX: g++-12
37 |       - name: Build
38 |         run: cmake --build build -j=4
39 |       - name: Test
40 |         run: ctest --output-on-failure --test-dir build
41 | 


--------------------------------------------------------------------------------
/.github/workflows/ubuntu.yml:
--------------------------------------------------------------------------------
 1 | name: Ubuntu 22.04
 2 | 
 3 | on:
 4 |   pull_request:
 5 |     types: [opened, synchronize, reopened, ready_for_review]
 6 |     paths-ignore:
 7 |       - '**.md'
 8 |       - 'docs/**'
 9 |   push:
10 |     branches:
11 |       - main
12 |     paths-ignore:
13 |       - '**.md'
14 |       - 'docs/**'
15 | 
16 | permissions:
17 |   contents: read
18 | 
19 | concurrency:
20 |   group: ${{ github.workflow }}-${{ github.ref }}
21 |   cancel-in-progress: true
22 | 
23 | jobs:
24 |   ubuntu-build:
25 |     strategy:
26 |       fail-fast: false
27 |       matrix:
28 |         shared: [ON, OFF]
29 |         cxx: [g++-12, clang++-15]
30 |         runs-on: [ubuntu-22.04, ubuntu-22.04-arm]
31 |     runs-on: ${{matrix.runs-on}}
32 |     steps:
33 |       - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
34 |       - name: Setup Ninja
35 |         run: sudo apt-get install ninja-build
36 |       - name: Prepare
37 |         run: cmake -D ADA_TESTING=ON -D ADA_BENCHMARKS=ON -DBUILD_SHARED_LIBS=${{matrix.shared}} -G Ninja -B build
38 |         env:
39 |           CXX: ${{matrix.cxx}}
40 |       - name: Build
41 |         run: cmake --build build -j=4
42 |       - name: Test
43 |         run: ctest --output-on-failure --test-dir build
44 |       - name: Run default benchmark
45 |         run: cd build && benchmarks/bench
46 | 


--------------------------------------------------------------------------------
/.github/workflows/ubuntu_install.yml:
--------------------------------------------------------------------------------
 1 | name: Ubuntu 24.04 (Installation)
 2 | 
 3 | on:
 4 |   pull_request:
 5 |     types: [opened, synchronize, reopened, ready_for_review]
 6 |     paths-ignore:
 7 |       - '**.md'
 8 |       - 'docs/**'
 9 |   push:
10 |     branches:
11 |       - main
12 |     paths-ignore:
13 |       - '**.md'
14 |       - 'docs/**'
15 | 
16 | permissions:
17 |   contents: read
18 | 
19 | concurrency:
20 |   group: ${{ github.workflow }}-${{ github.ref }}
21 |   cancel-in-progress: true
22 | 
23 | jobs:
24 |   ubuntu-build:
25 |     runs-on: ubuntu-24.04
26 |     strategy:
27 |       matrix:
28 |         shared: [ON, OFF]
29 |         cxx: [g++-12, clang++]
30 |     steps:
31 |       - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
32 |       - name: Setup Ninja
33 |         run: sudo apt-get install ninja-build
34 |       - name: Prepare
35 |         run: cmake -D ADA_TESTING=ON -G Ninja -DBUILD_SHARED_LIBS=${{matrix.shared}} -DCMAKE_INSTALL_PREFIX:PATH=destination -B build
36 |         env:
37 |           CXX: ${{matrix.cxx}}
38 |       - name: Build
39 |         run: cmake --build build -j=4
40 |       - name: Install
41 |         run: cmake --install build
42 |       - name: Prepare test package
43 |         run: cmake -DCMAKE_INSTALL_PREFIX:PATH=../../destination -S tests/installation -B buildbabyada
44 |       - name: Build test package
45 |         run: cmake --build buildbabyada
46 |       - name: Run example
47 |         run: ./buildbabyada/main
48 | 


--------------------------------------------------------------------------------
/.github/workflows/ubuntu_pedantic.yml:
--------------------------------------------------------------------------------
 1 | name: Ubuntu 22.04 (GCC 12) Fails On Compiler Warnings
 2 | 
 3 | on:
 4 |   pull_request:
 5 |     types: [opened, synchronize, reopened, ready_for_review]
 6 |     paths-ignore:
 7 |       - '**.md'
 8 |       - 'docs/**'
 9 |   push:
10 |     branches:
11 |       - main
12 |     paths-ignore:
13 |       - '**.md'
14 |       - 'docs/**'
15 | 
16 | permissions:
17 |   contents: read
18 | 
19 | concurrency:
20 |   group: ${{ github.workflow }}-${{ github.ref }}
21 |   cancel-in-progress: true
22 | 
23 | jobs:
24 |   ubuntu-build:
25 |     runs-on: ubuntu-22.04
26 |     strategy:
27 |       matrix:
28 |         shared: [ON, OFF]
29 |     steps:
30 |       - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
31 |       - name: Setup Ninja
32 |         run: sudo apt-get install ninja-build
33 |       - name: Prepare
34 |         run: cmake -D ADA_TESTING=ON -DBUILD_SHARED_LIBS=${{matrix.shared}} -G Ninja -B build
35 |         env:
36 |           CXX: g++-12
37 |           CXXFLAGS: -Werror -Wextra -Wno-unused-parameter -Wimplicit-fallthrough
38 |       - name: Build
39 |         run: cmake --build build -j=4
40 |       - name: Test
41 |         run: ctest --output-on-failure --test-dir build
42 | 


--------------------------------------------------------------------------------
/.github/workflows/visual_studio.yml:
--------------------------------------------------------------------------------
 1 | name: VS17-CI
 2 | 
 3 | on:
 4 |   pull_request:
 5 |     types: [opened, synchronize, reopened, ready_for_review]
 6 |     paths-ignore:
 7 |       - '**.md'
 8 |       - 'docs/**'
 9 |   push:
10 |     branches:
11 |       - main
12 |     paths-ignore:
13 |       - '**.md'
14 |       - 'docs/**'
15 | 
16 | permissions:
17 |   contents: read
18 | 
19 | concurrency:
20 |   group: ${{ github.workflow }}-${{ github.ref }}
21 |   cancel-in-progress: true
22 | 
23 | jobs:
24 |   ci:
25 |     name: windows-vs17
26 |     runs-on: windows-2025
27 |     strategy:
28 |       fail-fast: false
29 |       matrix:
30 |         include:
31 |           - {gen: Visual Studio 17 2022, arch: x64, devchecks: OFF, shared: OFF, config: Release}
32 |           - {gen: Visual Studio 17 2022, arch: x64, devchecks: ON, shared: OFF, config: Debug}
33 |           - {gen: Visual Studio 17 2022, arch: x64, devchecks: ON, shared: ON, config: Debug}
34 |           - {gen: Visual Studio 17 2022, arch: Win32, devchecks: ON, shared: OFF, config: Debug}
35 |           - {gen: Visual Studio 17 2022, arch: Win32, devchecks: ON, shared: ON, config: Debug}
36 |     steps:
37 |     - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
38 |     - name: Configure
39 |       run: |
40 |         cmake -D ADA_TESTING=ON -DADA_DEVELOPMENT_CHECKS="${{matrix.devchecks}}" -G "${{matrix.gen}}" -A ${{matrix.arch}} -DBUILD_SHARED_LIBS=${{matrix.shared}} -B build
41 |     - name: Build
42 |       run: cmake --build build --config "${{matrix.config}}" --verbose
43 |     - name: Run tests
44 |       working-directory: build
45 |       run: ctest -C "${{matrix.config}}" --output-on-failure
46 | 


--------------------------------------------------------------------------------
/.github/workflows/visual_studio_clang.yml:
--------------------------------------------------------------------------------
 1 | name: VS17-clang-CI
 2 | 
 3 | on:
 4 |   pull_request:
 5 |     types: [opened, synchronize, reopened, ready_for_review]
 6 |     paths-ignore:
 7 |       - '**.md'
 8 |       - 'docs/**'
 9 |   push:
10 |     branches:
11 |       - main
12 |     paths-ignore:
13 |       - '**.md'
14 |       - 'docs/**'
15 | 
16 | permissions:
17 |   contents: read
18 | 
19 | concurrency:
20 |   group: ${{ github.workflow }}-${{ github.ref }}
21 |   cancel-in-progress: true
22 | 
23 | jobs:
24 |   ci:
25 |     name: windows-vs17
26 |     runs-on: windows-2025
27 |     strategy:
28 |       fail-fast: false
29 |       matrix:
30 |         include:
31 |           - {gen: Visual Studio 17 2022, arch: x64, devchecks: ON}
32 |     steps:
33 |     - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
34 |     - name: Configure
35 |       run: |
36 |         cmake -D ADA_TESTING=ON -DADA_DEVELOPMENT_CHECKS="${{matrix.devchecks}}" -G "${{matrix.gen}}" -A ${{matrix.arch}} -T ClangCL -B build
37 |     - name: Build Debug
38 |       run: cmake --build build --config Debug --verbose
39 |     - name: Run Debug tests
40 |       working-directory: build
41 |       run: ctest -C Debug  --output-on-failure
42 |     - name: Build Release
43 |       run: cmake --build build --config Release --verbose
44 |     - name: Run Release tests
45 |       working-directory: build
46 |       run: ctest -C Release  --output-on-failure
47 | 


--------------------------------------------------------------------------------
/.github/workflows/wpt-updater.yml:
--------------------------------------------------------------------------------
 1 | name: Update WPT
 2 | 
 3 | on:
 4 |   schedule:
 5 |     - cron: '0 0 * * *'
 6 | 
 7 | env:
 8 |   GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
 9 | 
10 | concurrency:
11 |   group: wpt-updater
12 |   cancel-in-progress: true
13 | 
14 | permissions:
15 |   contents: read
16 | 
17 | jobs:
18 |   issue:
19 |     runs-on: ubuntu-latest
20 |     permissions:
21 |       contents: write
22 |       pull-requests: write
23 |     strategy:
24 |       fail-fast: false
25 |       matrix:
26 |         module: [url, urlpattern]
27 |     steps:
28 |       - uses: actions/checkout@11bd71901bbe5b1630ceea73d27597364c9af683 # v4.2.2
29 |       - name: Fetch tests
30 |         run: tools/update-wpt.sh ${{matrix.module}}
31 |       - name: Open pull request
32 |         uses: peter-evans/create-pull-request@6d6857d36972b65feb161a90e484f2984215f83e # v6.0.5
33 |         with:
34 |           token: ${{secrets.GH_PAT}}
35 |           commit-message: "test: update web platform tests"
36 |           branch: automatic-update-wpt-${{matrix.module}}
37 |           title: Update web platform tests (${{matrix.module}})
38 |           body: |
39 |             This is an automated pull request for updating the WPT.
40 | 
41 |             - [Web Platform Tests](https://github.com/web-platform-tests/wpt/tree/master/${{matrix.module}})
42 |             - [Commit History](https://github.com/web-platform-tests/wpt/commits/master/${{matrix.module}}/resources)
43 | 
44 |             cc @anonrig @lemire
45 |           team-reviewers: core
46 |           delete-branch: true
47 | 


--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
 1 | # common build directory
 2 | build
 3 | *-build-*
 4 | 
 5 | # Python cache
 6 | __pycache__
 7 | venv
 8 | 
 9 | cmake-build-debug
10 | 
11 | .cache
12 | docs/html
13 | docs/theme
14 | 
15 | # Generated using only the GitHub workflow
16 | benchmark_result.json
17 | 
18 | singleheader/ada.h
19 | singleheader/ada_c.h
20 | singleheader/ada.cpp
21 | singleheader/singleheader.zip
22 | 
23 | benchmarks/competitors/servo-url/debug
24 | benchmarks/competitors/servo-url/target
25 | 
26 | # ignore VS Code
27 | .vscode/
28 | .idea
29 | 
30 | # bazel output
31 | bazel-*
32 | 


--------------------------------------------------------------------------------
/.python-version:
--------------------------------------------------------------------------------
1 | 3.12
2 | 


--------------------------------------------------------------------------------
/LICENSE-MIT:
--------------------------------------------------------------------------------
 1 | Copyright 2023 Yagiz Nizipli and Daniel Lemire
 2 | 
 3 | Permission is hereby granted, free of charge, to any person obtaining a copy of
 4 | this software and associated documentation files (the "Software"), to deal in
 5 | the Software without restriction, including without limitation the rights to
 6 | use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of
 7 | the Software, and to permit persons to whom the Software is furnished to do so,
 8 | subject to the following conditions:
 9 | 
10 | The above copyright notice and this permission notice shall be included in all
11 | copies or substantial portions of the Software.
12 | 
13 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
14 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS
15 | FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR
16 | COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER
17 | IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
18 | CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
19 | 


--------------------------------------------------------------------------------
/SECURITY.md:
--------------------------------------------------------------------------------
1 | # Security Policy
2 | 
3 | ## Reporting a Vulnerability
4 | 
5 | Please use the following contact information for reporting a vulnerability:
6 | 
7 | - [Daniel Lemire](https://github.com/lemire) - daniel@lemire.me
8 | - [Yagiz Nizipli](https://github.com/anonrig) - yagiz@nizipli.com
9 | 


--------------------------------------------------------------------------------
/ada.pc.in:
--------------------------------------------------------------------------------
 1 | prefix=@CMAKE_INSTALL_PREFIX@
 2 | includedir=@PKGCONFIG_INCLUDEDIR@
 3 | libdir=@PKGCONFIG_LIBDIR@
 4 | 
 5 | Name: @PROJECT_NAME@
 6 | Description: @PROJECT_DESCRIPTION@
 7 | URL: @PROJECT_HOMEPAGE_URL@
 8 | Version: @PROJECT_VERSION@
 9 | Cflags: -I${includedir} @PKGCONFIG_CFLAGS@
10 | Libs: -L${libdir} -l@PROJECT_NAME@
11 | @PKGCONFIG_LIBS_PRIVATE@
12 | 


--------------------------------------------------------------------------------
/benchmarks/bbc_bench.cpp:
--------------------------------------------------------------------------------
 1 | #include "benchmark_header.h"
 2 | 
 3 | /**
 4 |  * Realistic URL examples collected from the BBC homepage.
 5 |  */
 6 | std::string url_examples[] = {
 7 |     "https://static.files.bbci.co.uk/orbit/737a4ee2bed596eb65afc4d2ce9af568/js/"
 8 |     "polyfills.js",
 9 |     "https://static.files.bbci.co.uk/orbit/737a4ee2bed596eb65afc4d2ce9af568/"
10 |     "css/orbit-v5-ltr.min.css",
11 |     "https://static.files.bbci.co.uk/orbit/737a4ee2bed596eb65afc4d2ce9af568/js/"
12 |     "require.min.js",
13 |     "https://static.files.bbci.co.uk/fonts/reith/2.512/BBCReithSans_W_Rg.woff2",
14 |     "https://nav.files.bbci.co.uk/searchbox/c8bfe8595e453f2b9483fda4074e9d15/"
15 |     "css/box.css",
16 |     "https://static.files.bbci.co.uk/cookies/d3bb303e79f041fec95388e04f84e716/"
17 |     "cookie-banner/cookie-library.bundle.js",
18 |     "https://static.files.bbci.co.uk/account/id-cta/597/style/id-cta.css",
19 |     "https://gn-web-assets.api.bbc.com/wwhp/"
20 |     "20220908-1153-091014d07889c842a7bdc06e00fa711c9e04f049/responsive/css/"
21 |     "old-ie.min.css",
22 |     "https://gn-web-assets.api.bbc.com/wwhp/"
23 |     "20220908-1153-091014d07889c842a7bdc06e00fa711c9e04f049/modules/vendor/"
24 |     "bower/modernizr/modernizr.js"};
25 | 
26 | void init_data(const char* v = nullptr) {}  // no-op: `v` is ignored
27 | 
28 | // Combined length, in bytes, of all the strings in url_examples; computed
29 | // once during static initialization.
30 | double url_examples_bytes = []() -> double {
31 |   size_t total{0};
32 |   for (const std::string& example : url_examples) total += example.size();
33 |   return double(total);
34 | }();
35 | 
36 | #include "benchmark_template.cpp"
37 | 


--------------------------------------------------------------------------------
/benchmarks/bench.cpp:
--------------------------------------------------------------------------------
 1 | #include "benchmark_header.h"
 2 | 
 3 | /**
 4 |  * Realistic URL examples collected on the actual web.
 5 |  */
 6 | std::string url_examples_default[] = {
 7 |     "https://www.google.com/"
 8 |     "webhp?hl=en&amp;ictx=2&amp;sa=X&amp;ved=0ahUKEwil_"
 9 |     "oSxzJj8AhVtEFkFHTHnCGQQPQgI",
10 |     "https://support.google.com/websearch/"
11 |     "?p=ws_results_help&amp;hl=en-CA&amp;fg=1",
12 |     "https://en.wikipedia.org/wiki/Dog#Roles_with_humans",
13 |     "https://www.tiktok.com/@aguyandagolden/video/7133277734310038830",
14 |     "https://business.twitter.com/en/help/troubleshooting/"
15 |     "how-twitter-ads-work.html?ref=web-twc-ao-gbl-adsinfo&utm_source=twc&utm_"
16 |     "medium=web&utm_campaign=ao&utm_content=adsinfo",
17 |     "https://images-na.ssl-images-amazon.com/images/I/"
18 |     "41Gc3C8UysL.css?AUIClients/AmazonGatewayAuiAssets",
19 |     "https://www.reddit.com/?after=t3_zvz1ze",
20 |     "https://www.reddit.com/login/?dest=https%3A%2F%2Fwww.reddit.com%2F",
21 |     "postgresql://other:9818274x1!!@localhost:5432/"
22 |     "otherdb?connect_timeout=10&application_name=myapp",
23 |     "http://192.168.1.1",             // ipv4
24 |     "http://[2606:4700:4700::1111]",  // ipv6
25 | };
26 | 
27 | std::vector<std::string> url_examples;
28 | 
29 | // Starts at 0 because url_examples is still empty when this initializer
30 | // runs; init_data() stores the real total once the URLs are loaded.
31 | double url_examples_bytes = []() -> double {
32 |   size_t total{0};
33 |   for (const std::string& example : url_examples) total += example.size();
34 |   return double(total);
35 | }();
36 | 
37 | #ifdef ADA_URL_FILE
38 | const char* default_file = ADA_URL_FILE;
39 | #else
40 | const char* default_file = nullptr;
41 | #endif
42 | 
43 | /**
44 |  * Fills `url_examples` and refreshes `url_examples_bytes`.
45 |  *
46 |  * @param input path of a file with one URL per line; when it is nullptr or
47 |  *        the file does not exist, `url_examples_default` is used instead.
48 |  * @return the number of entries in `url_examples` afterwards.
49 |  */
50 | size_t init_data(const char* input = default_file) {
51 |   if (input != nullptr && file_exists(input)) {
52 |     std::cout << "Loading " << input << std::endl;
53 |     url_examples = split_string(read_file(input));
54 |   } else {
55 |     if (input != nullptr) {
56 |       // Keep a separator between the message and the path.
57 |       std::cout << "File not found: " << input << std::endl;
58 |     }
59 |     // Fall back to the built-in list (appended to the current contents).
60 |     for (const std::string& s : url_examples_default) {
61 |       url_examples.emplace_back(s);
62 |     }
63 |   }
64 |   // Total size in bytes of the loaded URLs.
65 |   size_t bytes{0};
66 |   for (const std::string& url_string : url_examples) {
67 |     bytes += url_string.size();
68 |   }
69 |   url_examples_bytes = double(bytes);
70 |   return url_examples.size();
71 | }
72 | #include "benchmark_template.cpp"
73 | 


--------------------------------------------------------------------------------
/benchmarks/benchmark_header.h:
--------------------------------------------------------------------------------
 1 | #include <iostream>
 2 | #include <memory>
 3 | #include <cstdlib>
 4 | #include <sstream>
 5 | #include <fstream>
 6 | #include <filesystem>
 7 | 
 8 | #if ADA_VARIOUS_COMPETITION_ENABLED
 9 | #include <uriparser/Uri.h>
10 | #include <EdUrlParser.h>
11 | #include <http_parser.h>
12 | #endif
13 | #if ADA_url_whatwg_ENABLED
14 | #include <upa/url.h>
15 | #endif
16 | 
17 | #include "ada.h"
18 | #include "performancecounters/event_counter.h"
19 | event_collector collector;
20 | size_t N = 1000;
21 | 
22 | #include <benchmark/benchmark.h>
23 | 
24 | /**
25 |  * Reports whether `filename` refers to an existing filesystem entry.
26 |  *
27 |  * @param filename path to probe (converted to std::filesystem::path).
28 |  * @return true if std::filesystem::exists() finds the entry.
29 |  */
30 | bool file_exists(const char* filename) {
31 |   return std::filesystem::exists(filename);
32 | }
33 | 
34 | std::string read_file(std::string filename) {  // slurp file, 4 KiB at a time
35 |   constexpr size_t chunk_size = 4096;
36 |   std::ifstream input(filename.c_str());
37 |   input.exceptions(std::ios_base::badbit);  // throw only on hard I/O errors
38 |   std::string contents;
39 |   std::string chunk(chunk_size, '\0');
40 |   do {  // a short (final) read still contributes its gcount() bytes
41 |     input.read(&chunk[0], chunk_size);
42 |     contents.append(chunk, 0, size_t(input.gcount()));
43 |   } while (input);
44 |   return contents;
45 | }
46 | 
47 | /**
48 |  * Splits `str` on '\n' and returns every non-empty line with leading and
49 |  * trailing whitespace removed.
50 |  */
51 | std::vector<std::string> split_string(const std::string& str) {
52 |   // std::isspace is undefined for negative char values (e.g. UTF-8 bytes when
53 |   // char is signed), so classify characters through unsigned char.
54 |   auto blank = [](unsigned char c) { return std::isspace(c) != 0; };
55 |   std::vector<std::string> result;
56 |   std::stringstream ss{str};
57 |   for (std::string line; std::getline(ss, line, '\n');) {
58 |     std::string_view view = line;
59 |     // Some parsers like boost/url refuse URLs with surrounding whitespace.
60 |     while (!view.empty() && blank(view.back())) view.remove_suffix(1);
61 |     while (!view.empty() && blank(view.front())) view.remove_prefix(1);
62 |     if (!view.empty()) result.emplace_back(view);
63 |   }
64 |   return result;
65 | }
66 | 


--------------------------------------------------------------------------------
/benchmarks/competitors/servo-url/Cargo.toml:
--------------------------------------------------------------------------------
 1 | [package]
 2 | name = "servo-url"
 3 | version = "0.1.0"
 4 | edition = "2021"
 5 | 
 6 | [lib]
 7 | path = "lib.rs"
 8 | crate-type = ["cdylib"]
 9 | 
10 | [dependencies]
11 | url = "2.5.4"
12 | libc = "0.2"
13 | 
14 | [profile.release]
15 | opt-level = 3
16 | debug = false
17 | lto = true
18 | 


--------------------------------------------------------------------------------
/benchmarks/competitors/servo-url/README.md:
--------------------------------------------------------------------------------
 1 | ## Servo URL FFI
 2 | 
 3 | This folder includes FFI bindings for servo/url.
 4 | 
 5 | ### Links
 6 | 
 7 | - https://github.com/eqrion/cbindgen/blob/master/docs.md
 8 | - https://gist.github.com/zbraniecki/b251714d77ffebbc73c03447f2b2c69f
 9 | - https://github.com/Michael-F-Bryan/rust-ffi-guide/blob/master/book/setting_up.md
10 | 
11 | ### Building
12 | 
13 | - Generating cbindgen output
14 |   - Install dependencies with `brew install cbindgen`
15 |   - Generate with `cbindgen --config cbindgen.toml --crate servo-url --output servo_url.h`
16 | - Building
17 |   - Run with `cargo build --release`
18 | 


--------------------------------------------------------------------------------
/benchmarks/competitors/servo-url/cbindgen.toml:
--------------------------------------------------------------------------------
 1 | autogen_warning = "/* Warning, this file is autogenerated by cbindgen. Don't modify this manually. */"
 2 | include_version = true
 3 | braces = "SameLine"
 4 | line_length = 100
 5 | tab_width = 2
 6 | language = "C++"
 7 | namespaces = ["servo_url"]
 8 | include_guard = "servo_url_ffi_h"
 9 | 
10 | [parse]
11 | parse_deps = true
12 | include = ["url"]
13 | 


--------------------------------------------------------------------------------
/benchmarks/competitors/servo-url/lib.rs:
--------------------------------------------------------------------------------
 1 | use url::Url;
 2 | use std::slice;
 3 | use libc::{c_char, size_t};
 4 | 
 5 | extern crate url;
 6 | extern crate libc;
 7 | 
 8 | #[unsafe(no_mangle)]
 9 | pub extern "C" fn parse_url(raw_input: *const c_char, raw_input_length: size_t) -> *mut Url {
10 |   let input = unsafe { std::str::from_utf8_unchecked(slice::from_raw_parts(raw_input as *const u8, raw_input_length)) };
11 |   // NOTE(review): the input is not validated; `raw_input` must point to
12 |   // `raw_input_length` readable bytes of valid UTF-8, otherwise this is UB.
13 |   // Url::parse(input).unwrap() would panic on an invalid URL, so instead we
14 |   // return a heap-allocated Url on success (to be released with free_url)
15 |   // and a null pointer when parsing fails.
16 |   match Url::parse(input) {
17 |     Ok(result) => Box::into_raw(Box::new(result)),
18 |     Err(_) => std::ptr::null_mut(),
19 |   }
20 | }
21 | 
22 | #[unsafe(no_mangle)]
23 | pub extern "C" fn parse_url_to_href(raw_input: *const c_char, raw_input_length: size_t) -> *const c_char {
24 |   let input = unsafe { std::str::from_utf8_unchecked(slice::from_raw_parts(raw_input as *const u8, raw_input_length)) }; // unchecked: caller must pass valid UTF-8
25 |   match Url::parse(input) {
26 |     Ok(result) => std::ffi::CString::new(result.as_str()).unwrap().into_raw(), // ownership moves to the caller; release with free_string
27 |     Err(_) => std::ptr::null_mut(), // parse failure is reported as null
28 |   }
29 | }
30 | 
31 | #[unsafe(no_mangle)]
32 | pub extern "C" fn free_url(raw: *mut Url) {
33 |   // A null pointer (what parse_url returns on failure) is ignored.
34 |   if !raw.is_null() {
35 |     // Rebuild the Box created by parse_url so that dropping it frees the Url.
36 |     unsafe { drop(Box::from_raw(raw)) }
37 |   }
38 | }
39 | 
40 | #[unsafe(no_mangle)]
41 | pub unsafe extern "C" fn free_string(ptr: *const c_char) {
42 |   // Null (parse_url_to_href's failure value) must not reach CString::from_raw.
43 |   if !ptr.is_null() { drop(unsafe { std::ffi::CString::from_raw(ptr as *mut _) }); }
44 | }
45 | 


--------------------------------------------------------------------------------
/benchmarks/competitors/servo-url/servo_url.h:
--------------------------------------------------------------------------------
 1 | #ifndef servo_url_ffi_h
 2 | #define servo_url_ffi_h
 3 | 
 4 | /* This file was modified manually. */
 5 | 
 6 | #include <cstdarg>
 7 | #include <cstdint>
 8 | #include <cstdlib>
 9 | #include <ostream>
10 | #include <new>
11 | 
12 | namespace servo_url {
13 | 
14 | /// A parsed URL record.
15 | struct Url;
16 | 
17 | extern "C" {
18 | 
19 | Url *parse_url(const char *raw_input, size_t raw_input_length);
20 | 
21 | void free_url(Url *raw);
22 | 
23 | const char *parse_url_to_href(const char *raw_input, size_t raw_input_length);
24 | 
25 | void free_string(const char *);
26 | }  // extern "C"
27 | 
28 | }  // namespace servo_url
29 | 
30 | #endif  // servo_url_ffi_h
31 | 


--------------------------------------------------------------------------------
/benchmarks/performancecounters/event_counter.h:
--------------------------------------------------------------------------------
  1 | #ifndef __EVENT_COUNTER_H
  2 | #define __EVENT_COUNTER_H
  3 | 
  4 | #include <cctype>
  5 | #ifndef _MSC_VER
  6 | #include <dirent.h>
  7 | #endif
  8 | #include <cinttypes>
  9 | 
 10 | #include <cstring>
 11 | 
 12 | #include <chrono>
 13 | #include <vector>
 14 | 
 15 | #include "linux-perf-events.h"
 16 | #ifdef __linux__
 17 | #include <libgen.h>
 18 | #endif
 19 | 
 20 | #if __APPLE__ && __aarch64__
 21 | #include "apple_arm_events.h"
 22 | #endif
 23 | 
 24 | // One measurement: elapsed wall-clock time plus raw counter values.
 25 | // Copy and move operations are the implicitly generated ones.
 26 | struct event_count {
 27 |   std::chrono::duration<double> elapsed;
 28 |   std::vector<unsigned long long> event_counts;
 29 |   // Starts with zero elapsed time and five zeroed counter slots.
 30 |   event_count() : elapsed(0), event_counts{0, 0, 0, 0, 0} {}
 31 |   // The vector is taken by reference so that it is copied only once.
 32 |   event_count(const std::chrono::duration<double> _elapsed,
 33 |               const std::vector<unsigned long long>& _event_counts)
 34 |       : elapsed(_elapsed), event_counts(_event_counts) {}
 35 |   // The types of counters (so we can read the getter more easily). The values
 36 |   // are indices into event_counts; index 3 has no named entry here.
 37 |   enum event_counter_types {
 38 |     CPU_CYCLES,
 39 |     INSTRUCTIONS,
 40 |     BRANCH_MISSES = 2,
 41 |     BRANCH = 4
 42 |   };
 43 |   // Elapsed time expressed in seconds.
 44 |   double elapsed_sec() const {
 45 |     return std::chrono::duration<double>(elapsed).count();
 46 |   }
 47 |   // Elapsed time expressed in nanoseconds.
 48 |   double elapsed_ns() const {
 49 |     return std::chrono::duration<double, std::nano>(elapsed).count();
 50 |   }
 51 |   // Counter getters: each reads the slot named by event_counter_types.
 52 |   double cycles() const {
 53 |     return static_cast<double>(event_counts[CPU_CYCLES]);
 54 |   }
 55 |   double instructions() const {
 56 |     return static_cast<double>(event_counts[INSTRUCTIONS]);
 57 |   }
 58 |   double branches() const { return static_cast<double>(event_counts[BRANCH]); }
 59 |   double branch_misses() const {
 60 |     return static_cast<double>(event_counts[BRANCH_MISSES]);
 61 |   }
 62 |   // Adds elapsed times and the first five counter slots of both operands;
 63 |   // both operands must therefore hold at least five slots.
 64 |   event_count operator+(const event_count& other) const {
 65 |     return event_count(elapsed + other.elapsed,
 66 |                        {
 67 |                            event_counts[0] + other.event_counts[0],
 68 |                            event_counts[1] + other.event_counts[1],
 69 |                            event_counts[2] + other.event_counts[2],
 70 |                            event_counts[3] + other.event_counts[3],
 71 |                            event_counts[4] + other.event_counts[4],
 72 |                        });
 73 |   }
 74 |   void operator+=(const event_count& other) { *this = *this + other; }
 75 | };
 76 | 
 77 | struct event_aggregate {  // running total/best/worst over a series of event_count samples
 78 |   bool has_events = false;  // never written inside this struct
 79 |   int iterations = 0;  // number of samples folded in so far
 80 |   event_count total{};  // sum of all samples
 81 |   event_count best{};  // sample with the smallest elapsed time
 82 |   event_count worst{};  // sample with the largest elapsed time
 83 | 
 84 |   event_aggregate() = default;
 85 | 
 86 |   void operator<<(const event_count& other) {  // fold one sample into the aggregate
 87 |     if (iterations == 0 || other.elapsed < best.elapsed) {  // first sample always wins
 88 |       best = other;
 89 |     }
 90 |     if (iterations == 0 || other.elapsed > worst.elapsed) {  // first sample always wins
 91 |       worst = other;
 92 |     }
 93 |     iterations++;
 94 |     total += other;
 95 |   }
 96 | 
 97 |   double elapsed_sec() const { return total.elapsed_sec() / iterations; }  // mean per sample
 98 |   double elapsed_ns() const { return total.elapsed_ns() / iterations; }  // mean per sample
 99 |   double cycles() const { return total.cycles() / iterations; }  // mean per sample
100 |   double instructions() const { return total.instructions() / iterations; }  // NOTE(review): all four divide by zero while iterations == 0
101 | };
102 | 
103 | struct event_collector {  // times a region and, where supported, reads hardware counters
104 |   event_count count{};  // reused result object; end() returns a reference to it
105 |   std::chrono::time_point<std::chrono::steady_clock> start_clock{};  // set by start()
106 | 
107 | #if defined(__linux__)
108 |   LinuxEvents<PERF_TYPE_HARDWARE> linux_events;
109 |   event_collector()
110 |       : linux_events(std::vector<int>{
111 |             PERF_COUNT_HW_CPU_CYCLES,    // reported in event_counts[0]
112 |             PERF_COUNT_HW_INSTRUCTIONS,  // reported in event_counts[1]
113 |         }) {}
114 |   bool has_events() { return linux_events.is_working(); }
115 | #elif __APPLE__ && __aarch64__
116 |   AppleEvents apple_events;  // declared in apple_arm_events.h
117 |   performance_counters diff;  // start() snapshot, then end-minus-start after end()
118 |   event_collector() : diff(0) { apple_events.setup_performance_counters(); }
119 |   bool has_events() { return apple_events.setup_performance_counters(); }
120 | #else
121 |   event_collector() {}  // no counter backend: only elapsed time is measured
122 |   bool has_events() { return false; }
123 | #endif
124 | 
125 |   inline void start() {  // begin a measurement; the clock is read last
126 | #if defined(__linux__)  // same macro as the member declaration above (was __linux)
127 |     linux_events.start();
128 | #elif __APPLE__ && __aarch64__
129 |     if (has_events()) {
130 |       diff = apple_events.get_counters();
131 |     }
132 | #endif
133 |     start_clock = std::chrono::steady_clock::now();
134 |   }
135 |   inline event_count& end() {  // finish a measurement; the clock is read first
136 |     const auto end_clock = std::chrono::steady_clock::now();
137 | #if defined(__linux__)  // same macro as the member declaration above (was __linux)
138 |     linux_events.end(count.event_counts);
139 | #elif __APPLE__ && __aarch64__
140 |     if (has_events()) {
141 |       performance_counters end = apple_events.get_counters();
142 |       diff = end - diff;
143 |     }
144 |     count.event_counts[0] = diff.cycles;
145 |     count.event_counts[1] = diff.instructions;
146 |     count.event_counts[2] = diff.missed_branches;
147 |     count.event_counts[3] = 0;  // slot 3 is always zero on this backend
148 |     count.event_counts[4] = diff.branches;
149 | #endif
150 |     count.elapsed = end_clock - start_clock;
151 |     return count;  // reference to the member; overwritten by the next end()
152 |   }
153 | };
154 | 
155 | #endif
156 | 


--------------------------------------------------------------------------------
/benchmarks/performancecounters/linux-perf-events.h:
--------------------------------------------------------------------------------
  1 | #pragma once
  2 | #ifdef __linux__
  3 | 
  4 | #include <asm/unistd.h>        // for __NR_perf_event_open
  5 | #include <linux/perf_event.h>  // for perf event constants
  6 | #include <sys/ioctl.h>         // for ioctl
  7 | #include <unistd.h>            // for syscall
  8 | 
  9 | #include <cerrno>   // for errno
 10 | #include <cstring>  // for memset
 11 | #include <stdexcept>
 12 | 
 13 | #include <iostream>
 14 | #include <vector>
 15 | 
 16 | template <int TYPE = PERF_TYPE_HARDWARE>
 17 | class LinuxEvents {  // wrapper around a group of perf_event_open counters
 18 |   int fd;  // group-leader descriptor; -1 (never 0, a valid fd) means "none"
 19 |   bool working;  // cleared by report_error() on any failure
 20 |   perf_event_attr attribs{};
 21 |   size_t num_events{};
 22 |   std::vector<uint64_t> temp_result_vec{};  // raw buffer filled by read()
 23 |   std::vector<uint64_t> ids{};  // ids from PERF_EVENT_IOC_ID, in config order
 24 | 
 25 |  public:
 26 |   explicit LinuxEvents(std::vector<int> config_vec) : fd(-1), working(true) {
 27 |     memset(&attribs, 0, sizeof(attribs));
 28 |     attribs.type = TYPE;
 29 |     attribs.size = sizeof(attribs);
 30 |     attribs.disabled = 1;  // counting starts only when start() enables the group
 31 |     attribs.exclude_kernel = 1;
 32 |     attribs.exclude_hv = 1;
 33 | 
 34 |     attribs.sample_period = 0;
 35 |     attribs.read_format = PERF_FORMAT_GROUP | PERF_FORMAT_ID;
 36 |     const int pid = 0;   // the current process
 37 |     const int cpu = -1;  // all CPUs
 38 |     const unsigned long flags = 0;
 39 | 
 40 |     int group = -1;  // no group
 41 |     num_events = config_vec.size();
 42 |     ids.resize(config_vec.size());
 43 |     uint32_t i = 0;
 44 |     for (auto config : config_vec) {
 45 |       attribs.config = config;
 46 |       int _fd = static_cast<int>(  // NOTE(review): only the leader is stored; later fds are never closed
 47 |           syscall(__NR_perf_event_open, &attribs, pid, cpu, group, flags));
 48 |       if (_fd == -1) {
 49 |         report_error("perf_event_open");
 50 |       }
 51 |       ioctl(_fd, PERF_EVENT_IOC_ID, &ids[i++]);  // result unchecked; also runs when _fd == -1
 52 |       if (group == -1) {  // still true after a failed open, so the next event may lead
 53 |         group = _fd;
 54 |         fd = _fd;
 55 |       }
 56 |     }
 57 | 
 58 |     temp_result_vec.resize(num_events * 2 + 1);  // slot 0, then a (value, id) pair per event
 59 |   }
 60 | 
 61 |   ~LinuxEvents() {  // NOTE(review): class is copyable, so a copy would close fd twice
 62 |     if (fd != -1) {
 63 |       close(fd);
 64 |     }
 65 |   }
 66 | 
 67 |   inline void start() {  // reset, then enable, every counter in the group
 68 |     if (fd != -1) {
 69 |       if (ioctl(fd, PERF_EVENT_IOC_RESET, PERF_IOC_FLAG_GROUP) == -1) {
 70 |         report_error("ioctl(PERF_EVENT_IOC_RESET)");
 71 |       }
 72 | 
 73 |       if (ioctl(fd, PERF_EVENT_IOC_ENABLE, PERF_IOC_FLAG_GROUP) == -1) {
 74 |         report_error("ioctl(PERF_EVENT_IOC_ENABLE)");
 75 |       }
 76 |     }
 77 |   }
 78 | 
 79 |   inline void end(std::vector<unsigned long long> &results) {  // results needs >= num_events slots
 80 |     if (fd != -1) {
 81 |       if (ioctl(fd, PERF_EVENT_IOC_DISABLE, PERF_IOC_FLAG_GROUP) == -1) {
 82 |         report_error("ioctl(PERF_EVENT_IOC_DISABLE)");
 83 |       }
 84 | 
 85 |       if (read(fd, temp_result_vec.data(), temp_result_vec.size() * 8) == -1) {  // 8 == sizeof(uint64_t)
 86 |         report_error("read");
 87 |       }
 88 |     }
 89 |     // our actual results are in slots 1,3,5, ... of this structure
 90 |     for (uint32_t i = 1; i < temp_result_vec.size(); i += 2) {
 91 |       results[i / 2] = temp_result_vec[i];  // copied even when nothing was read above
 92 |     }
 93 |     for (uint32_t i = 2; i < temp_result_vec.size(); i += 2) {  // even slots hold the ids
 94 |       if (ids[i / 2 - 1] != temp_result_vec[i]) {
 95 |         report_error("event mismatch");
 96 |       }
 97 |     }
 98 |   }
 99 | 
100 |   bool is_working() { return working; }  // false once any step has failed
101 | 
102 |  private:
103 |   void report_error(const std::string &) { working = false; }  // message is discarded
104 | };
105 | #endif


--------------------------------------------------------------------------------
/cmake/JoinPaths.cmake:
--------------------------------------------------------------------------------
 1 | function(join_paths joined_path first_path_segment)  # result is stored in the variable named by joined_path
 2 |   set(result "${first_path_segment}")
 3 |   foreach(segment IN LISTS ARGN)
 4 |     if("${segment}" STREQUAL "")
 5 |       # empty segments contribute nothing
 6 |     elseif(IS_ABSOLUTE "${segment}")
 7 |       set(result "${segment}")  # an absolute segment discards everything before it
 8 |     else()
 9 |       set(result "${result}/${segment}")
10 |     endif()
11 |   endforeach()
12 |   set(${joined_path} "${result}" PARENT_SCOPE)
13 | endfunction()
14 | 


--------------------------------------------------------------------------------
/cmake/ada-config.cmake.in:
--------------------------------------------------------------------------------
1 | include("${CMAKE_CURRENT_LIST_DIR}/ada_targets.cmake")
2 | 


--------------------------------------------------------------------------------
/cmake/ada-flags.cmake:
--------------------------------------------------------------------------------
 1 | option(ADA_LOGGING "verbose output (useful for debugging)" OFF)
 2 | option(ADA_DEVELOPMENT_CHECKS "development checks (useful for debugging)" OFF)
 3 | option(ADA_SANITIZE "Sanitize addresses" OFF)
 4 | if(CMAKE_CXX_COMPILER_ID STREQUAL "GNU")  # the option below is only declared for GCC
 5 |   option(ADA_SANITIZE_BOUNDS_STRICT "Sanitize bounds (strict): only for GCC" OFF)
 6 | endif()
 7 | option(ADA_SANITIZE_UNDEFINED "Sanitize undefined behaviour" OFF)
 8 | if(ADA_SANITIZE)
 9 |   message(STATUS "Address sanitizer enabled.")
10 | endif()
11 | if(ADA_SANITIZE_WITHOUT_LEAKS)  # NOTE(review): no option() declares this in this file; presumably set with -D
12 |   message(STATUS "Address sanitizer (but not leak) enabled.")
13 | endif()
14 | if(ADA_SANITIZE_UNDEFINED)
15 |   message(STATUS "Undefined sanitizer enabled.")
16 | endif()
17 | option(ADA_COVERAGE "Compute coverage" OFF)
18 | option(ADA_TOOLS "Build cli tools (adaparse)" OFF)
19 | option(ADA_BENCHMARKS "Build benchmarks" OFF)
20 | option(ADA_TESTING "Build tests" OFF)
21 | option(ADA_USE_UNSAFE_STD_REGEX_PROVIDER "Enable unsafe regex provider that uses std::regex" OFF)
22 | option(ADA_INCLUDE_URL_PATTERN "Include URL pattern implementation" ON)
23 | 
24 | if (ADA_COVERAGE)
25 |     message(STATUS "You want to compute coverage. We assume that you have installed gcovr.")
26 |     if (NOT CMAKE_BUILD_TYPE)  # coverage builds default to Debug
27 |         set(CMAKE_BUILD_TYPE Debug CACHE STRING "Choose the type of build." FORCE)
28 |     endif()
29 |     #######################
30 |     # You need to install gcovr. Under macOS, you may do so with brew.
31 |     # brew install gcovr
32 |     # Then build...
33 |     # cmake -D ADA_COVERAGE=ON -B buildcoverage
34 |     # cmake --build buildcoverage
35 |     # cmake --build buildcoverage --target ada_coverage
36 |     #
37 |     # open buildcoverage/ada_coverage/index.html
38 |     #####################
39 |     include(${PROJECT_SOURCE_DIR}/cmake/codecoverage.cmake)
40 |     APPEND_COVERAGE_COMPILER_FLAGS()
41 |     setup_target_for_coverage_gcovr_html(NAME ada_coverage EXECUTABLE ctest EXCLUDE "${PROJECT_SOURCE_DIR}/dependencies/*" "${PROJECT_SOURCE_DIR}/tools/*"  "${PROJECT_SOURCE_DIR}/singleheader/*" ${PROJECT_SOURCE_DIR}/include/ada/common_defs.h)
42 | endif()
43 | 
44 | if (NOT CMAKE_BUILD_TYPE)  # reached only when neither the user nor the coverage branch chose a type
45 |   if(ADA_SANITIZE OR ADA_SANITIZE_WITHOUT_LEAKS OR ADA_SANITIZE_BOUNDS_STRICT OR ADA_SANITIZE_UNDEFINED)
46 |     message(STATUS "No build type selected, default to Debug because you have sanitizers.")
47 |     set(CMAKE_BUILD_TYPE Debug CACHE STRING "Choose the type of build." FORCE)
48 |   else()
49 |     message(STATUS "No build type selected, default to Release")
50 |     set(CMAKE_BUILD_TYPE Release CACHE STRING "Choose the type of build." FORCE)
51 |   endif()
52 | endif()
53 | 
54 | set(CMAKE_MODULE_PATH "${CMAKE_CURRENT_SOURCE_DIR}/tools/cmake")  # replaces any earlier value of CMAKE_MODULE_PATH
55 | set(CMAKE_EXPORT_COMPILE_COMMANDS ON)
56 | 
57 | set(CMAKE_CXX_STANDARD 20)
58 | set(CMAKE_CXX_STANDARD_REQUIRED ON)
59 | set(CMAKE_CXX_EXTENSIONS OFF)
60 | 
61 | find_program(CCACHE_FOUND ccache)
62 | if(CCACHE_FOUND)
63 |   message(STATUS "Ccache found using it as compiler launcher.")
64 |   set(CMAKE_C_COMPILER_LAUNCHER ccache)  # the bare name is used, not the path stored in CCACHE_FOUND
65 |   set(CMAKE_CXX_COMPILER_LAUNCHER ccache)
66 | endif(CCACHE_FOUND)
67 | 


--------------------------------------------------------------------------------
/cmake/add-cpp-test.cmake:
--------------------------------------------------------------------------------
 1 | # Helper so we don't have to repeat ourselves so much
 2 | # Usage: add_cpp_test(testname [COMPILE_ONLY] [LIBRARY] [WILL_FAIL] [SOURCES a.cpp b.cpp ...] [LABELS acceptance per_implementation ...] [DEPENDENCY_OF group ...])
 3 | # SOURCES defaults to testname.cpp if not specified.
 4 | function(add_cpp_test TEST_NAME)
 5 |   # Parse arguments
 6 |   cmake_parse_arguments(PARSE_ARGV 1 ARGS "COMPILE_ONLY;LIBRARY;WILL_FAIL" "" "SOURCES;LABELS;DEPENDENCY_OF")
 7 |   if (NOT ARGS_SOURCES)
 8 |     list(APPEND ARGS_SOURCES ${TEST_NAME}.cpp)
 9 |   endif()
10 |   if (ARGS_COMPILE_ONLY)
11 |     list(APPEND ARGS_LABELS compile_only)  # append to the list itself, not to a variable named by its contents
12 |   endif()
13 |   if(ADA_SANITIZE)  # the sanitizer options below are added at directory scope on every call
14 |     add_compile_options(-fsanitize=address -fno-omit-frame-pointer -fno-sanitize-recover=all)
15 |     add_compile_definitions(ASAN_OPTIONS=detect_leaks=1)
16 |   endif()
17 |   if(ADA_SANITIZE_WITHOUT_LEAKS)
18 |     add_compile_options(-fsanitize=address -fno-omit-frame-pointer -fno-sanitize-recover=all)
19 |   endif()
20 |   if(ADA_SANITIZE_BOUNDS_STRICT)
21 |     add_compile_options(-fsanitize=bounds-strict -fno-sanitize-recover=all)
22 |     add_link_options(-fsanitize=bounds-strict)
23 |   endif()
24 |   if(ADA_SANITIZE_UNDEFINED)
25 |     add_compile_options(-fsanitize=undefined -fno-sanitize-recover=all)
26 |     add_link_options(-fsanitize=undefined)
27 |   endif()
28 |   # Add the compile target
29 |   if (ARGS_LIBRARY)
30 |     add_library(${TEST_NAME} STATIC ${ARGS_SOURCES})
31 |   else(ARGS_LIBRARY)
32 |     add_executable(${TEST_NAME} ${ARGS_SOURCES})
33 |   endif(ARGS_LIBRARY)
34 | 
35 |   # Add test
36 |   if (ARGS_COMPILE_ONLY OR ARGS_LIBRARY)  # the "test" is building the target; it is never run
37 |     add_test(
38 |       NAME ${TEST_NAME}
39 |       COMMAND ${CMAKE_COMMAND} --build . --target ${TEST_NAME} --config $<CONFIGURATION>
40 |       WORKING_DIRECTORY ${PROJECT_BINARY_DIR}
41 |     )
42 |     set_target_properties(${TEST_NAME} PROPERTIES EXCLUDE_FROM_ALL TRUE EXCLUDE_FROM_DEFAULT_BUILD TRUE)
43 |   else()
44 |     add_test(${TEST_NAME} ${TEST_NAME})
45 | 
46 |     # Add to <label>_tests make targets
47 |     foreach(label ${ARGS_LABELS})
48 |       list(APPEND ARGS_DEPENDENCY_OF ${label})
49 |     endforeach(label ${ARGS_LABELS})
50 |   endif()
51 | 
52 |   # Add to test labels
53 |   if (ARGS_LABELS)
54 |     set_property(TEST ${TEST_NAME} APPEND PROPERTY LABELS ${ARGS_LABELS})
55 |   endif()
56 | 
57 |   # Add as a dependency of given targets
58 |   foreach(dependency_of ${ARGS_DEPENDENCY_OF})
59 |     if (NOT TARGET ${dependency_of}_tests)
60 |       add_custom_target(${dependency_of}_tests)
61 |       add_dependencies(all_tests ${dependency_of}_tests)  # assumes an all_tests target is defined elsewhere
62 |     endif(NOT TARGET ${dependency_of}_tests)
63 |     add_dependencies(${dependency_of}_tests ${TEST_NAME})
64 |   endforeach(dependency_of ${ARGS_DEPENDENCY_OF})
65 | 
66 |   # If it will fail, mark the test as such
67 |   if (ARGS_WILL_FAIL)
68 |     set_property(TEST ${TEST_NAME} PROPERTY WILL_FAIL TRUE)
69 |   endif()
70 | endfunction()


--------------------------------------------------------------------------------
/docs/RELEASE.md:
--------------------------------------------------------------------------------
 1 | # Release Document
 2 | 
 3 | ## Preparation
 4 | 
 5 | In order to release a new version of Ada, please update the
 6 | following documents:
 7 | 
 8 | - [CMakeLists.txt](../CMakeLists.txt)
 9 | - [Doxygen](../doxygen)
10 | - [ada_version.h](../include/ada/ada_version.h)
11 | 
12 | ## Release
13 | 
14 | - Run amalgation script using `./singleheader/amalgamate.py`
15 | - Create a Github release with following format: `v1.0.0`
16 | - Upload the following documents to the release
17 |   - `./singleheader/ada.h`
18 |   - `./singleheader/ada.cpp`
19 |   - `./singleheader/singleheader.zip`
20 | 


--------------------------------------------------------------------------------
/docs/doxygen/footer.html:
--------------------------------------------------------------------------------
1 | <!-- HTML footer for doxygen 1.9.6-->
2 | <!-- start footer part -->
3 | <!--BEGIN GENERATE_TREEVIEW-->
4 | <div id="nav-path"><!-- id is needed for treeview function! --></div>
5 | <!--END GENERATE_TREEVIEW-->
6 | </body>
7 | </html>
8 | 


--------------------------------------------------------------------------------
/docs/doxygen/header.html:
--------------------------------------------------------------------------------
 1 | <!-- HTML header for doxygen 1.9.6-->
 2 | <!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "https://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
 3 | <html xmlns="http://www.w3.org/1999/xhtml" lang="$langISO">
 4 | <head>
 5 | <meta http-equiv="Content-Type" content="text/xhtml;charset=UTF-8"/>
 6 | <meta http-equiv="X-UA-Compatible" content="IE=11"/>
 7 | <meta name="generator" content="Doxygen $doxygenversion"/>
 8 | <meta name="viewport" content="width=device-width, initial-scale=1"/>
 9 | <!--BEGIN PROJECT_NAME--><title>$projectname: $title</title><!--END PROJECT_NAME-->
10 | <!--BEGIN !PROJECT_NAME--><title>$title</title><!--END !PROJECT_NAME-->
11 | <link href="$relpath^tabs.css" rel="stylesheet" type="text/css"/>
12 | <!--BEGIN DISABLE_INDEX-->
13 |   <!--BEGIN FULL_SIDEBAR-->
14 | <script type="text/javascript">var page_layout=1;</script>
15 |   <!--END FULL_SIDEBAR-->
16 | <!--END DISABLE_INDEX-->
17 | <script type="text/javascript" src="$relpath^jquery.js"></script>
18 | <script type="text/javascript" src="$relpath^dynsections.js"></script>
19 | <script type="text/javascript" src="$relpath^doxygen-awesome-darkmode-toggle.js"></script>
20 | <script type="text/javascript" src="$relpath^doxygen-awesome-fragment-copy-button.js"></script>
21 | <script type="text/javascript" src="$relpath^doxygen-awesome-paragraph-link.js"></script>
22 | <script type="text/javascript" src="$relpath^doxygen-awesome-interactive-toc.js"></script>
23 | <script type="text/javascript">
24 |   DoxygenAwesomeDarkModeToggle.init()
25 |   DoxygenAwesomeFragmentCopyButton.init()
26 |   DoxygenAwesomeParagraphLink.init()
27 |   DoxygenAwesomeInteractiveToc.init()
28 | </script>
29 | $treeview
30 | $search
31 | $mathjax
32 | $darkmode
33 | <link href="$relpath^$stylesheet" rel="stylesheet" type="text/css" />
34 | $extrastylesheet
35 | </head>
36 | <body>
37 | <!--BEGIN DISABLE_INDEX-->
38 |   <!--BEGIN FULL_SIDEBAR-->
39 | <div id="side-nav" class="ui-resizable side-nav-resizable"><!-- do not remove this div, it is closed by doxygen! -->
40 |   <!--END FULL_SIDEBAR-->
41 | <!--END DISABLE_INDEX-->
42 | 
43 | <div id="top"><!-- do not remove this div, it is closed by doxygen! -->
44 | 
45 | <!--BEGIN TITLEAREA-->
46 | <div id="titlearea">
47 | <table cellspacing="0" cellpadding="0">
48 |  <tbody>
49 |  <tr id="projectrow">
50 |   <!--BEGIN PROJECT_LOGO-->
51 |   <td id="projectlogo"><img alt="Logo" src="$relpath^$projectlogo"/></td>
52 |   <!--END PROJECT_LOGO-->
53 |   <!--BEGIN PROJECT_NAME-->
54 |   <td id="projectalign">
55 |    <div id="projectname">$projectname<!--BEGIN PROJECT_NUMBER--><span id="projectnumber">&#160;$projectnumber</span><!--END PROJECT_NUMBER-->
56 |    </div>
57 |    <!--BEGIN PROJECT_BRIEF--><div id="projectbrief">$projectbrief</div><!--END PROJECT_BRIEF-->
58 |   </td>
59 |   <!--END PROJECT_NAME-->
60 |   <!--BEGIN !PROJECT_NAME-->
61 |    <!--BEGIN PROJECT_BRIEF-->
62 |     <td>
63 |     <div id="projectbrief">$projectbrief</div>
64 |     </td>
65 |    <!--END PROJECT_BRIEF-->
66 |   <!--END !PROJECT_NAME-->
67 |   <!--BEGIN DISABLE_INDEX-->
68 |    <!--BEGIN SEARCHENGINE-->
69 |      <!--BEGIN !FULL_SIDEBAR-->
70 |     <td>$searchbox</td>
71 |      <!--END !FULL_SIDEBAR-->
72 |    <!--END SEARCHENGINE-->
73 |   <!--END DISABLE_INDEX-->
74 |  </tr>
75 |   <!--BEGIN SEARCHENGINE-->
76 |    <!--BEGIN FULL_SIDEBAR-->
77 |    <tr><td colspan="2">$searchbox</td></tr>
78 |    <!--END FULL_SIDEBAR-->
79 |   <!--END SEARCHENGINE-->
80 |  </tbody>
81 | </table>
82 | </div>
83 | <!--END TITLEAREA-->
84 | <!-- end header part -->
85 | 


--------------------------------------------------------------------------------
/fuzz/ada_c.c:
--------------------------------------------------------------------------------
 1 | #include "ada_c.h"
 2 | 
 3 | #include <stdbool.h>
 4 | #include <stdio.h>
 5 | #include <stdlib.h>
 6 | #include <string.h>
 7 | 
 8 | int LLVMFuzzerTestOneInput(const uint8_t* data, size_t size) {
 9 |   /**
10 |    * ada_c: parse the raw input, then feed the same bytes to every setter.
11 |    */
12 |   ada_url out = ada_parse((char*)data, size);
13 |   bool is_valid = ada_is_valid(out);
14 | 
15 |   if (is_valid) {
16 |     ada_set_href(out, (char*)data, size); /* setter results are ignored */
17 |     ada_set_host(out, (char*)data, size);
18 |     ada_set_hostname(out, (char*)data, size);
19 |     ada_set_protocol(out, (char*)data, size);
20 |     ada_set_username(out, (char*)data, size);
21 |     ada_set_password(out, (char*)data, size);
22 |     ada_set_port(out, (char*)data, size);
23 |     ada_set_pathname(out, (char*)data, size);
24 |     ada_set_search(out, (char*)data, size);
25 |     ada_set_hash(out, (char*)data, size);
26 | 
27 |     ada_get_hash(out); /* getter results are discarded as well */
28 |     ada_get_host(out);
29 |     ada_get_host_type(out);
30 |     ada_get_hostname(out);
31 |     ada_get_href(out);
32 |     ada_owned_string out_get_origin = ada_get_origin(out); /* released below */
33 |     ada_get_pathname(out);
34 |     ada_get_username(out);
35 |     ada_get_password(out);
36 |     ada_get_protocol(out);
37 |     ada_get_port(out);
38 |     ada_get_search(out);
39 |     ada_get_scheme_type(out);
40 | 
41 |     ada_has_credentials(out);
42 |     ada_has_empty_hostname(out);
43 |     ada_has_hostname(out);
44 |     ada_has_non_empty_username(out);
45 |     ada_has_non_empty_password(out);
46 |     ada_has_port(out);
47 |     ada_has_password(out);
48 |     ada_has_hash(out);
49 |     ada_has_search(out);
50 | 
51 |     ada_get_components(out);
52 | 
53 |     ada_clear_port(out);
54 |     ada_clear_hash(out);
55 |     ada_clear_search(out);
56 | 
57 |     ada_free_owned_string(out_get_origin);
58 |   }
59 | 
60 |   bool can_parse_result = ada_can_parse((char*)data, size); /* value is never read */
61 | 
62 |   ada_free(out); /* called whether or not the parse was valid */
63 | 
64 |   return 0;
65 | }
66 | 


--------------------------------------------------------------------------------
/fuzz/ada_c.options:
--------------------------------------------------------------------------------
1 | [libfuzzer]
2 | dict = url.dict
3 | max_len = 1024
4 | 


--------------------------------------------------------------------------------
/fuzz/build.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/bash
 2 | # Builds every fuzz target. Expects SRC, OUT, CC, CXX, CFLAGS, CXXFLAGS and LIB_FUZZING_ENGINE in the environment.
 3 | cd "$SRC/ada-url" || exit 1
 4 | 
 5 | mkdir -p build
 6 | AMALGAMATE_OUTPUT_PATH=./build/singleheader python3 singleheader/amalgamate.py
 7 | 
 8 | $CXX $CFLAGS $CXXFLAGS \
 9 |      -std=c++20 \
10 |      -I build/singleheader \
11 |      -c fuzz/parse.cc -o parse.o
12 | 
13 | $CXX $CFLAGS $CXXFLAGS $LIB_FUZZING_ENGINE parse.o \
14 |      -o "$OUT/parse"
15 | 
16 | $CXX $CFLAGS $CXXFLAGS \
17 |      -std=c++20 \
18 |      -I build/singleheader \
19 |      -c fuzz/can_parse.cc -o can_parse.o
20 | 
21 | $CXX $CFLAGS $CXXFLAGS $LIB_FUZZING_ENGINE can_parse.o \
22 |      -o "$OUT/can_parse"
23 | 
24 | $CXX $CFLAGS $CXXFLAGS \
25 |      -std=c++20 \
26 |      -I build/singleheader \
27 |      -c fuzz/idna.cc -o idna.o
28 | 
29 | $CXX $CFLAGS $CXXFLAGS $LIB_FUZZING_ENGINE idna.o \
30 |      -o "$OUT/idna"
31 | 
32 | $CXX $CFLAGS $CXXFLAGS \
33 |      -std=c++20 \
34 |      -I build/singleheader \
35 |      -c fuzz/url_search_params.cc -o url_search_params.o
36 | 
37 | $CXX $CFLAGS $CXXFLAGS $LIB_FUZZING_ENGINE url_search_params.o \
38 |      -o "$OUT/url_search_params"
39 | 
40 | # IMPORTANT
41 | #
42 | # We use std_regex_provider for testing purposes.
43 | # It is not encouraged or recommended to be used within production
44 | # environments due to security problems.
45 | #
46 | # Please do not enable it on production systems!
47 | #
48 | $CXX -DADA_USE_UNSAFE_STD_REGEX_PROVIDER=1 \
49 |      $CFLAGS $CXXFLAGS \
50 |      -std=c++20 \
51 |      -I build/singleheader \
52 |      -c fuzz/url_pattern.cc -o url_pattern.o
53 | 
54 | $CXX -DADA_USE_UNSAFE_STD_REGEX_PROVIDER=1 \
55 |      $CFLAGS $CXXFLAGS $LIB_FUZZING_ENGINE \
56 |      url_pattern.o \
57 |      -o "$OUT/url_pattern"
58 | 
59 | $CXX $CFLAGS $CXXFLAGS \
60 |      -std=c++20 \
61 |      -I build/singleheader \
62 |      -c build/singleheader/ada.cpp -o ada.o
63 | 
64 | $CC $CFLAGS $CXXFLAGS \
65 |      -I build/singleheader \
66 |      -c fuzz/ada_c.c -o ada_c.o
67 | 
68 | $CXX $CFLAGS $CXXFLAGS $LIB_FUZZING_ENGINE ./ada.o ada_c.o \
69 |      -o "$OUT/ada_c"
70 | 
71 | cp "$SRC"/ada-url/fuzz/*.dict "$SRC"/ada-url/fuzz/*.options "$OUT/"
72 | 


--------------------------------------------------------------------------------
/fuzz/can_parse.cc:
--------------------------------------------------------------------------------
 1 | #include <fuzzer/FuzzedDataProvider.h>
 2 | 
 3 | #include <memory>
 4 | #include <string>
 5 | 
 6 | #include "ada.cpp"
 7 | #include "ada.h"
 8 | 
 9 | extern "C" int LLVMFuzzerTestOneInput(const uint8_t *data, size_t size) {
10 |   FuzzedDataProvider fdp(data, size);
11 |   std::string source = fdp.ConsumeRandomLengthString(256);  // candidate URL
12 |   std::string base_source = fdp.ConsumeRandomLengthString(256);  // candidate base URL
13 | 
14 |   /**
15 |    * ada::can_parse, first without a base and then with one; results are ignored.
16 |    */
17 |   auto base_source_view =
18 |       std::string_view(base_source.data(), base_source.length());
19 |   ada::can_parse(source);
20 |   ada::can_parse(source, &base_source_view);
21 | 
22 |   return 0;
23 | }
24 | 


--------------------------------------------------------------------------------
/fuzz/idna.cc:
--------------------------------------------------------------------------------
 1 | #include <fuzzer/FuzzedDataProvider.h>
 2 | 
 3 | #include <memory>
 4 | #include <string>
 5 | 
 6 | #include "ada.cpp"
 7 | #include "ada.h"
 8 | 
 9 | extern "C" int LLVMFuzzerTestOneInput(const uint8_t *data, size_t size) {
10 |   FuzzedDataProvider fdp(data, size);
11 |   std::string source = fdp.ConsumeRandomLengthString(256);  // the only input consumed
12 | 
13 |   /**
14 |    * ada::idna: both conversions get the same string; results are ignored.
15 |    */
16 |   ada::idna::to_ascii(source);
17 |   ada::idna::to_unicode(source);
18 | 
19 |   return 0;
20 | }
21 | 


--------------------------------------------------------------------------------
/fuzz/parse.options:
--------------------------------------------------------------------------------
1 | [libfuzzer]
2 | dict = url.dict
3 | max_len = 1024
4 | 


--------------------------------------------------------------------------------
/fuzz/url.dict:
--------------------------------------------------------------------------------
 1 | # Protocols
 2 | "ftp:"
 3 | "file:///"
 4 | "file:"
 5 | "http:"
 6 | "https:"
 7 | "ws:"
 8 | "wss:"
 9 | 
10 | # Suffixes
11 | ".com"
12 | 
13 | # Full URLs
14 | "https://www.ada-url.com"
15 | 
16 | # Encoded characters
17 | "%2f"
18 | "%40"
19 | "%26"
20 | 
21 | # Misc
22 | "://"
23 | "//"
24 | "\\"
25 | "../"
26 | ";type=a"
27 | "xn--"
28 | 


--------------------------------------------------------------------------------
/fuzz/url_pattern.cc:
--------------------------------------------------------------------------------
 1 | #include <fuzzer/FuzzedDataProvider.h>
 2 | 
 3 | #include <memory>
 4 | #include <string>
 5 | 
 6 | #include "ada.cpp"
 7 | #include "ada.h"
 8 | 
 9 | using regex_provider = ada::url_pattern_regex::std_regex_provider;
10 | 
11 | std::string bytesToAlphanumeric(const std::string& source) {  // maps every byte to one of [a-zA-Z0-9]
12 |   static const char alphanumeric[] =
13 |       "abcdefghijklmnopqrstuvwxyz"
14 |       "ABCDEFGHIJKLMNOPQRSTUVWXYZ"
15 |       "0123456789";
16 | 
17 |   std::string result;
18 |   result.reserve(source.size());  // output has exactly one character per input byte
19 | 
20 |   for (char byte : source) {
21 |     int index = static_cast<unsigned char>(byte) % (sizeof(alphanumeric) - 1);  // -1 skips the trailing NUL
22 |     result.push_back(alphanumeric[index]);
23 |   }
24 | 
25 |   return result;
26 | }
27 | 
28 | void exercise_result(auto result) {  // taken by value; calls each accessor and discards the result
29 |   (void)result.get_protocol();
30 |   (void)result.get_username();
31 |   (void)result.get_password();
32 |   (void)result.get_hostname();
33 |   (void)result.get_port();
34 |   (void)result.get_pathname();
35 |   (void)result.get_search();
36 |   (void)result.get_hash();
37 |   (void)result.ignore_case();
38 |   (void)result.has_regexp_groups();
39 | }
40 | 
41 | extern "C" int LLVMFuzzerTestOneInput(const uint8_t* data, size_t size) {
42 |   FuzzedDataProvider fdp(data, size);
43 |   // We do not want to trigger arbitrary regex matching, so fuzz bytes are reduced to alphanumerics.
44 |   std::string source_1 =
45 |       "/" + bytesToAlphanumeric(fdp.ConsumeRandomLengthString(50)) + "/" +
46 |       bytesToAlphanumeric(fdp.ConsumeRandomLengthString(50));
47 |   std::string base_source_1 =
48 |       "/" + bytesToAlphanumeric(fdp.ConsumeRandomLengthString(50)) + "/" +
49 |       bytesToAlphanumeric(fdp.ConsumeRandomLengthString(50));
50 | 
51 |   std::string source_2 = "https://ada-url.com/*";  // fixed pair, independent of the fuzz input
52 |   std::string base_source_2 = "https://ada-url.com";
53 | 
54 |   std::array<std::pair<std::string, std::string>, 2> sources = {{  // NOTE(review): <array> is not included directly here
55 |       {source_1, base_source_1},
56 |       {source_2, base_source_2},
57 |   }};
58 | 
59 |   for (const auto& [source, base_source] : sources) {
60 |     // Without base or options
61 |     auto result =
62 |         ada::parse_url_pattern<regex_provider>(source, nullptr, nullptr);
63 |     if (result) exercise_result(*result);
64 | 
65 |     // Testing with base_url
66 |     std::string_view base_source_view(base_source.data(), base_source.length());
67 |     auto result_with_base = ada::parse_url_pattern<regex_provider>(
68 |         source, &base_source_view, nullptr);
69 |     if (result_with_base) exercise_result(*result_with_base);
70 | 
71 |     // Testing with base_url and options
72 |     ada::url_pattern_options options{.ignore_case = fdp.ConsumeBool()};  // one bool consumed per pair
73 |     auto result_with_base_and_options = ada::parse_url_pattern<regex_provider>(
74 |         source, &base_source_view, &options);
75 |     if (result_with_base_and_options)
76 |       exercise_result(*result_with_base_and_options);
77 | 
78 |     // Testing with url_pattern_init and base url; every component gets the same source string.
79 |     ada::url_pattern_init init{.protocol = source,
80 |                                .username = source,
81 |                                .password = source,
82 |                                .hostname = source,
83 |                                .port = source,
84 |                                .pathname = source,
85 |                                .search = source,
86 |                                .hash = source};
87 |     auto result_with_init = ada::parse_url_pattern<regex_provider>(
88 |         init, &base_source_view, nullptr);
89 |     if (result_with_init) exercise_result(*result_with_init);
90 |   }
91 | 
92 |   return 0;
93 | }
94 | 


--------------------------------------------------------------------------------
/fuzz/url_pattern.options:
--------------------------------------------------------------------------------
1 | [libfuzzer]
2 | dict = url.dict
3 | max_len = 100
4 | rss_limit_mb = 16000
5 | timeout = 60
6 | 


--------------------------------------------------------------------------------
/fuzz/url_search_params.cc:
--------------------------------------------------------------------------------
 1 | #include <fuzzer/FuzzedDataProvider.h>
 2 | 
 3 | #include <memory>
 4 | #include <string>
 5 | 
 6 | #include "ada.cpp"
 7 | #include "ada.h"
 8 | 
 9 | extern "C" int LLVMFuzzerTestOneInput(const uint8_t *data, size_t size) {
10 |   FuzzedDataProvider fdp(data, size);
11 |   std::string source = fdp.ConsumeRandomLengthString(256);
12 |   std::string base_source = fdp.ConsumeRandomLengthString(256);
13 | 
14 |   /**
15 |    * ada::url_search_params
16 |    */
17 | 
18 |   auto base_source_view =
19 |       std::string_view(base_source.data(), base_source.length());
20 |   auto initialized = ada::url_search_params(base_source_view);  // constructed from input; not used afterwards
21 | 
22 |   auto search_params = ada::url_search_params();  // starts empty; mutated below
23 |   search_params.append(source, base_source);
24 |   search_params.set(source, base_source);
25 |   search_params.to_string();  // result discarded
26 |   if (!search_params.has(base_source)) {
27 |     search_params.append(base_source, source);
28 |   }
29 |   search_params.remove(source);
30 |   search_params.remove(source, base_source);
31 |   if (search_params.has(base_source, source)) {
32 |     search_params.remove(base_source);
33 |     search_params.remove(base_source, source);
34 |   }
35 | 
36 |   auto keys = search_params.get_keys();
37 |   while (keys.has_next()) {  // drain the iterator; items are discarded
38 |     keys.next();
39 |   }
40 | 
41 |   auto values = search_params.get_values();
42 |   while (values.has_next()) {  // drain the iterator; items are discarded
43 |     values.next();
44 |   }
45 | 
46 |   auto entries = search_params.get_entries();
47 |   while (entries.has_next()) {  // drain the iterator; items are discarded
48 |     entries.next();
49 |   }
50 | 
51 |   // This is testing a private method used only for the C API.
52 |   std::string resetted_value = fdp.ConsumeRandomLengthString(256);
53 |   search_params.reset(resetted_value);
54 | 
55 |   return 0;
56 | }
57 | 


--------------------------------------------------------------------------------
/include/ada.h:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * @file ada.h
 3 |  * @brief Includes all definitions for Ada.
 4 |  */
 5 | #ifndef ADA_H
 6 | #define ADA_H
 7 | 
 8 | #include "ada/ada_idna.h"
 9 | #include "ada/character_sets.h"
10 | #include "ada/character_sets-inl.h"
11 | #include "ada/checkers-inl.h"
12 | #include "ada/common_defs.h"
13 | #include "ada/log.h"
14 | #include "ada/encoding_type.h"
15 | #include "ada/helpers.h"
16 | #include "ada/parser.h"
17 | #include "ada/parser-inl.h"
18 | #include "ada/scheme.h"
19 | #include "ada/scheme-inl.h"
20 | #include "ada/serializers.h"
21 | #include "ada/state.h"
22 | #include "ada/unicode.h"
23 | #include "ada/url_base.h"
24 | #include "ada/url_base-inl.h"
25 | #include "ada/url-inl.h"
26 | #include "ada/url_components.h"
27 | #include "ada/url_components-inl.h"
28 | #include "ada/url_aggregator.h"
29 | #include "ada/url_aggregator-inl.h"
30 | #include "ada/url_search_params.h"
31 | #include "ada/url_search_params-inl.h"
32 | 
33 | #include "ada/url_pattern.h"
34 | #include "ada/url_pattern-inl.h"
35 | #include "ada/url_pattern_helpers.h"
36 | #include "ada/url_pattern_helpers-inl.h"
37 | #include "ada/url_pattern_regex.h"
38 | 
39 | // Public API
40 | #include "ada/ada_version.h"
41 | #include "ada/implementation.h"
42 | #include "ada/implementation-inl.h"
43 | 
44 | #endif  // ADA_H
45 | 


--------------------------------------------------------------------------------
/include/ada/ada_idna.h:
--------------------------------------------------------------------------------
  1 | /* auto-generated on 2025-03-08 13:17:11 -0500. Do not edit! */
  2 | /* begin file include/idna.h */
  3 | #ifndef ADA_IDNA_H
  4 | #define ADA_IDNA_H
  5 | 
  6 | /* begin file include/ada/idna/unicode_transcoding.h */
  7 | #ifndef ADA_IDNA_UNICODE_TRANSCODING_H
  8 | #define ADA_IDNA_UNICODE_TRANSCODING_H
  9 | 
 10 | #include <string>
 11 | #include <string_view>
 12 | 
 13 | namespace ada::idna {
 14 | 
 15 | size_t utf8_to_utf32(const char* buf, size_t len, char32_t* utf32_output);
 16 | 
 17 | size_t utf8_length_from_utf32(const char32_t* buf, size_t len);
 18 | 
 19 | size_t utf32_length_from_utf8(const char* buf, size_t len);
 20 | 
 21 | size_t utf32_to_utf8(const char32_t* buf, size_t len, char* utf8_output);
 22 | 
 23 | }  // namespace ada::idna
 24 | 
 25 | #endif  // ADA_IDNA_UNICODE_TRANSCODING_H
 26 | /* end file include/ada/idna/unicode_transcoding.h */
 27 | /* begin file include/ada/idna/mapping.h */
 28 | #ifndef ADA_IDNA_MAPPING_H
 29 | #define ADA_IDNA_MAPPING_H
 30 | 
 31 | #include <string>
 32 | #include <string_view>
 33 | 
 34 | namespace ada::idna {
 35 | 
 36 | // If the input is ascii, then the mapping is just -> lower case.
 37 | void ascii_map(char* input, size_t length);
 38 | // Map the characters according to IDNA, returning the empty string on error.
 39 | std::u32string map(std::u32string_view input);
 40 | 
 41 | }  // namespace ada::idna
 42 | 
 43 | #endif
 44 | /* end file include/ada/idna/mapping.h */
 45 | /* begin file include/ada/idna/normalization.h */
 46 | #ifndef ADA_IDNA_NORMALIZATION_H
 47 | #define ADA_IDNA_NORMALIZATION_H
 48 | 
 49 | #include <string>
 50 | #include <string_view>
 51 | 
 52 | namespace ada::idna {
 53 | 
 54 | // Normalize the characters according to IDNA (Unicode Normalization Form C).
 55 | void normalize(std::u32string& input);
 56 | 
 57 | }  // namespace ada::idna
 58 | #endif
 59 | /* end file include/ada/idna/normalization.h */
 60 | /* begin file include/ada/idna/punycode.h */
 61 | #ifndef ADA_IDNA_PUNYCODE_H
 62 | #define ADA_IDNA_PUNYCODE_H
 63 | 
 64 | #include <string>
 65 | #include <string_view>
 66 | 
 67 | namespace ada::idna {
 68 | 
 69 | bool punycode_to_utf32(std::string_view input, std::u32string& out);
 70 | bool verify_punycode(std::string_view input);
 71 | bool utf32_to_punycode(std::u32string_view input, std::string& out);
 72 | 
 73 | }  // namespace ada::idna
 74 | 
 75 | #endif  // ADA_IDNA_PUNYCODE_H
 76 | /* end file include/ada/idna/punycode.h */
 77 | /* begin file include/ada/idna/validity.h */
 78 | #ifndef ADA_IDNA_VALIDITY_H
 79 | #define ADA_IDNA_VALIDITY_H
 80 | 
 81 | #include <string>
 82 | #include <string_view>
 83 | 
 84 | namespace ada::idna {
 85 | 
 86 | /**
 87 |  * @see https://www.unicode.org/reports/tr46/#Validity_Criteria
 88 |  */
 89 | bool is_label_valid(std::u32string_view label);
 90 | 
 91 | }  // namespace ada::idna
 92 | 
 93 | #endif  // ADA_IDNA_VALIDITY_H
 94 | /* end file include/ada/idna/validity.h */
 95 | /* begin file include/ada/idna/to_ascii.h */
 96 | #ifndef ADA_IDNA_TO_ASCII_H
 97 | #define ADA_IDNA_TO_ASCII_H
 98 | 
 99 | #include <string>
100 | #include <string_view>
101 | 
102 | namespace ada::idna {
103 | 
104 | // Converts a domain (e.g., www.google.com) possibly containing international
105 | // characters to an ascii domain (with punycode). It will not do percent
106 | // decoding: percent decoding should be done prior to calling this function. We
107 | // do not remove tabs and spaces, they should have been removed prior to calling
108 | // this function. We also do not trim control characters. We also assume that
109 | // the input is not empty. We return "" on error.
110 | //
111 | //
112 | // This function may accept or even produce invalid domains.
113 | std::string to_ascii(std::string_view ut8_string);
114 | 
115 | // Returns true if the string contains a forbidden code point according to the
116 | // WHATWG URL specification:
117 | // https://url.spec.whatwg.org/#forbidden-domain-code-point
118 | bool contains_forbidden_domain_code_point(std::string_view ascii_string);
119 | 
120 | bool constexpr is_ascii(std::u32string_view view);
121 | bool constexpr is_ascii(std::string_view view);
122 | 
123 | }  // namespace ada::idna
124 | 
125 | #endif  // ADA_IDNA_TO_ASCII_H
126 | /* end file include/ada/idna/to_ascii.h */
127 | /* begin file include/ada/idna/to_unicode.h */
128 | 
129 | #ifndef ADA_IDNA_TO_UNICODE_H
130 | #define ADA_IDNA_TO_UNICODE_H
131 | 
132 | #include <string_view>
133 | 
134 | namespace ada::idna {
135 | 
136 | std::string to_unicode(std::string_view input);
137 | 
138 | }  // namespace ada::idna
139 | 
140 | #endif  // ADA_IDNA_TO_UNICODE_H
141 | /* end file include/ada/idna/to_unicode.h */
142 | /* begin file include/ada/idna/identifier.h */
143 | #ifndef ADA_IDNA_IDENTIFIER_H
144 | #define ADA_IDNA_IDENTIFIER_H
145 | 
146 | #include <string>
147 | #include <string_view>
148 | 
149 | namespace ada::idna {
150 | 
151 | // Verify if it is valid name code point given a Unicode code point and a
152 | // boolean first: If first is true return the result of checking if code point
153 | // is contained in the IdentifierStart set of code points. Otherwise return the
154 | // result of checking if code point is contained in the IdentifierPart set of
155 | // code points. Returns false if the input is empty or the code point is not
156 | // valid. There is minimal Unicode error handling: the input should be valid
157 | // UTF-8. https://urlpattern.spec.whatwg.org/#is-a-valid-name-code-point
158 | bool valid_name_code_point(char32_t code_point, bool first);
159 | 
160 | }  // namespace ada::idna
161 | 
162 | #endif
163 | /* end file include/ada/idna/identifier.h */
164 | 
165 | #endif
166 | /* end file include/idna.h */
167 | 


--------------------------------------------------------------------------------
/include/ada/ada_version.h:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * @file ada_version.h
 3 |  * @brief Definitions for Ada's version number.
 4 |  */
 5 | #ifndef ADA_ADA_VERSION_H
 6 | #define ADA_ADA_VERSION_H
 7 | 
 8 | #define ADA_VERSION "3.2.4"
 9 | 
10 | namespace ada {
11 | 
12 | enum {
13 |   ADA_VERSION_MAJOR = 3,
14 |   ADA_VERSION_MINOR = 2,
15 |   ADA_VERSION_REVISION = 4,
16 | };
17 | 
18 | }  // namespace ada
19 | 
20 | #endif  // ADA_ADA_VERSION_H
21 | 


--------------------------------------------------------------------------------
/include/ada/character_sets.h:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * @file character_sets.h
 3 |  * @brief Declaration of the character sets used by unicode functions.
 4 |  * @author Node.js
 5 |  * @see https://github.com/nodejs/node/blob/main/src/node_url_tables.cc
 6 |  */
 7 | #ifndef ADA_CHARACTER_SETS_H
 8 | #define ADA_CHARACTER_SETS_H
 9 | 
10 | #include "ada/common_defs.h"
11 | #include <cstdint>
12 | 
13 | /**
14 |  * These functions are not part of our public API and may
15 |  * change at any time.
16 |  * @private
17 |  * @namespace ada::character_sets
18 |  * @brief Includes the definitions for unicode character sets.
19 |  */
20 | namespace ada::character_sets {
21 | ada_really_inline constexpr bool bit_at(const uint8_t a[], uint8_t i);
22 | }  // namespace ada::character_sets
23 | 
24 | #endif  // ADA_CHARACTER_SETS_H
25 | 


--------------------------------------------------------------------------------
/include/ada/checkers-inl.h:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * @file checkers-inl.h
 3 |  * @brief Definitions for URL specific checkers used within Ada.
 4 |  */
 5 | #ifndef ADA_CHECKERS_INL_H
 6 | #define ADA_CHECKERS_INL_H
 7 | 
 8 | #include <bit>
 9 | #include <string_view>
10 | 
11 | namespace ada::checkers {
12 | 
13 | // Checks for a leading "0x"/"0X"; the caller guarantees input.size() >= 2.
14 | constexpr bool has_hex_prefix_unsafe(std::string_view input) {
15 |   // This is actually efficient code, see has_hex_prefix for the assembly.
16 |   constexpr uint16_t word0x = 0x7830;  // 'x' (high byte), '0' (low byte)
17 |   // Built with shifts, so input[1] is the high byte on every byte order.
18 |   uint16_t two_first_bytes =
19 |       static_cast<uint16_t>(input[0]) |
20 |       static_cast<uint16_t>((static_cast<uint16_t>(input[1]) << 8));
21 |   // Set the ASCII case bit of the second character so 'X' folds to 'x'.
22 |   two_first_bytes |= 0x2000;
23 |   return two_first_bytes == word0x;
24 | }
25 | 
26 | // Bounds-checked variant: false for inputs shorter than two characters.
27 | constexpr bool has_hex_prefix(std::string_view input) {
28 |   return input.size() >= 2 && has_hex_prefix_unsafe(input);
29 | }
30 | 
31 | constexpr bool is_digit(char x) noexcept { return (x >= '0') & (x <= '9'); }
32 | 
33 | // Sets bit 0x20, which maps an ASCII upper-case letter to lower case.
34 | constexpr char to_lower(char x) noexcept { return (x | 0x20); }
35 | 
36 | constexpr bool is_alpha(char x) noexcept {
37 |   return (to_lower(x) >= 'a') && (to_lower(x) <= 'z');
38 | }
39 | 
40 | constexpr bool is_windows_drive_letter(std::string_view input) noexcept {
41 |   return input.size() >= 2 &&
42 |          (is_alpha(input[0]) && ((input[1] == ':') || (input[1] == '|'))) &&
43 |          ((input.size() == 2) || (input[2] == '/' || input[2] == '\\' ||
44 |                                   input[2] == '?' || input[2] == '#'));
45 | }
46 | 
47 | constexpr bool is_normalized_windows_drive_letter(
48 |     std::string_view input) noexcept {
49 |   return input.size() >= 2 && (is_alpha(input[0]) && (input[1] == ':'));
50 | }
51 | 
52 | }  // namespace ada::checkers
53 | 
54 | #endif  // ADA_CHECKERS_INL_H
55 | 


--------------------------------------------------------------------------------
/include/ada/checkers.h:
--------------------------------------------------------------------------------
  1 | /**
  2 |  * @file checkers.h
  3 |  * @brief Declarations for URL specific checkers used within Ada.
  4 |  */
  5 | #ifndef ADA_CHECKERS_H
  6 | #define ADA_CHECKERS_H
  7 | 
  8 | #include "ada/common_defs.h"
  9 | 
 10 | #include <cstring>
 11 | #include <string_view>
 12 | 
 13 | /**
 14 |  * These functions are not part of our public API and may
 15 |  * change at any time.
 16 |  * @private
 17 |  * @namespace ada::checkers
 18 |  * @brief Includes the definitions for validation functions
 19 |  */
 20 | namespace ada::checkers {
 21 | 
 22 | /**
 23 |  * @private
 24 |  * Assuming that x is an ASCII letter, this function returns the lower case
 25 |  * equivalent.
 26 |  * @details More likely to be inlined by the compiler and constexpr.
 27 |  */
 28 | constexpr char to_lower(char x) noexcept;
 29 | 
 30 | /**
 31 |  * @private
 32 |  * Returns true if the character is an ASCII letter. Equivalent to std::isalpha
 33 |  * but more likely to be inlined by the compiler.
 34 |  *
 35 |  * @attention std::isalpha is not constexpr generally.
 36 |  */
 37 | constexpr bool is_alpha(char x) noexcept;
 38 | 
 39 | /**
 40 |  * @private
 41 |  * Check whether a string starts with 0x or 0X. The function is only
 42 |  * safe if input.size() >=2.
 43 |  *
 44 |  * @see has_hex_prefix
 45 |  */
 46 | constexpr bool has_hex_prefix_unsafe(std::string_view input);
 47 | /**
 48 |  * @private
 49 |  * Check whether a string starts with 0x or 0X.
 50 |  */
 51 | constexpr bool has_hex_prefix(std::string_view input);
 52 | 
 53 | /**
 54 |  * @private
 55 |  * Check whether x is an ASCII digit. More likely to be inlined than
 56 |  * std::isdigit.
 57 |  */
 58 | constexpr bool is_digit(char x) noexcept;
 59 | 
 60 | /**
 61 |  * @private
 62 |  * @details A string starts with a Windows drive letter if all of the following
 63 |  * are true:
 64 |  *
 65 |  *   - its length is greater than or equal to 2
 66 |  *   - its first two code points are a Windows drive letter
 67 |  *   - its length is 2 or its third code point is U+002F (/), U+005C (\), U+003F
 68 |  * (?), or U+0023 (#).
 69 |  *
 70 |  * https://url.spec.whatwg.org/#start-with-a-windows-drive-letter
 71 |  */
 72 | inline constexpr bool is_windows_drive_letter(std::string_view input) noexcept;
 73 | 
 74 | /**
 75 |  * @private
 76 |  * @details A normalized Windows drive letter is a Windows drive letter of which
 77 |  * the second code point is U+003A (:).
 78 |  */
 79 | inline constexpr bool is_normalized_windows_drive_letter(
 80 |     std::string_view input) noexcept;
 81 | 
 82 | /**
 83 |  * @private
 84 |  * Returns true if an input is an ipv4 address. It is assumed that the string
 85 |  * does not contain uppercase ASCII characters (the input should have been
 86 |  * lowercased before calling this function) and is not empty.
 87 |  */
 88 | ada_really_inline constexpr bool is_ipv4(std::string_view view) noexcept;
 89 | 
 90 | /**
 91 |  * @private
 92 |  * Returns a bitset. If the first bit is set, then at least one character needs
 93 |  * percent encoding. If the second bit is set, a \\ is found. If the third bit
 94 |  * is set then we have a dot. If the fourth bit is set, then we have a percent
 95 |  * character.
 96 |  */
 97 | ada_really_inline constexpr uint8_t path_signature(
 98 |     std::string_view input) noexcept;
 99 | 
100 | /**
101 |  * @private
102 |  * Returns true if the lengths of the domain name and of its labels conform
103 |  * to the specifications. The domain must be at most 255 octets long (253
104 |  * characters not including the last 2 which are the empty label reserved at the
105 |  * end). When the empty label is included (a dot at the end), the domain name
106 |  * can have 254 characters. The length of a label must be at least 1 and at most
107 |  * 63 characters.
108 |  * @see section 3.1. of https://www.rfc-editor.org/rfc/rfc1034
109 |  * @see https://www.unicode.org/reports/tr46/#ToASCII
110 |  */
111 | ada_really_inline constexpr bool verify_dns_length(
112 |     std::string_view input) noexcept;
113 | 
114 | }  // namespace ada::checkers
115 | 
116 | #endif  // ADA_CHECKERS_H
117 | 


--------------------------------------------------------------------------------
/include/ada/encoding_type.h:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * @file encoding_type.h
 3 |  * @brief Definition for supported encoding types.
 4 |  */
 5 | #ifndef ADA_ENCODING_TYPE_H
 6 | #define ADA_ENCODING_TYPE_H
 7 | 
 8 | #include "ada/common_defs.h"
 9 | #include <string>
10 | 
11 | namespace ada {
12 | 
13 | /**
14 |  * This specification defines three encodings with the same names as encoding
15 |  * schemes defined in the Unicode standard: UTF-8, UTF-16LE, and UTF-16BE.
16 |  *
17 |  * @see https://encoding.spec.whatwg.org/#encodings
18 |  */
19 | enum class encoding_type {
20 |   UTF8,
21 |   UTF_16LE,
22 |   UTF_16BE,
23 | };
24 | 
25 | /**
26 |  * Convert an encoding_type to a string.
27 |  */
28 | ada_warn_unused std::string to_string(encoding_type type);
29 | 
30 | }  // namespace ada
31 | 
32 | #endif  // ADA_ENCODING_TYPE_H
33 | 


--------------------------------------------------------------------------------
/include/ada/errors.h:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * @file errors.h
 3 |  * @brief Definitions for the errors.
 4 |  */
 5 | #ifndef ADA_ERRORS_H
 6 | #define ADA_ERRORS_H
 7 | 
 8 | #include <cstdint>
 9 | namespace ada {
10 | enum class errors : uint8_t { type_error };
11 | }  // namespace ada
12 | #endif  // ADA_ERRORS_H


--------------------------------------------------------------------------------
/include/ada/implementation-inl.h:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * @file implementation-inl.h
 3 |  */
 4 | #ifndef ADA_IMPLEMENTATION_INL_H
 5 | #define ADA_IMPLEMENTATION_INL_H
 6 | 
 7 | #include "ada/url_pattern_regex.h"
 8 | 
 9 | #include "ada/expected.h"
10 | #include "ada/implementation.h"
11 | 
12 | #include <variant>
13 | #include <string_view>
14 | 
15 | namespace ada {
16 | 
17 | #if ADA_INCLUDE_URL_PATTERN
18 | template <url_pattern_regex::regex_concept regex_provider>
19 | ada_warn_unused tl::expected<url_pattern<regex_provider>, errors>
20 | parse_url_pattern(std::variant<std::string_view, url_pattern_init>&& input,
21 |                   const std::string_view* base_url,
22 |                   const url_pattern_options* options) {
23 |   return parser::parse_url_pattern_impl<regex_provider>(std::move(input),
24 |                                                         base_url, options);
25 | }
26 | #endif  // ADA_INCLUDE_URL_PATTERN
27 | 
28 | }  // namespace ada
29 | 
30 | #endif  // ADA_IMPLEMENTATION_INL_H
31 | 


--------------------------------------------------------------------------------
/include/ada/implementation.h:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * @file implementation.h
 3 |  * @brief Definitions for user facing functions for parsing a URL and its
 4 |  * components.
 5 |  */
 6 | #ifndef ADA_IMPLEMENTATION_H
 7 | #define ADA_IMPLEMENTATION_H
 8 | 
 9 | #include <string>
10 | #include <string_view>
11 | #include <optional>
12 | 
13 | #include "ada/url.h"
14 | #include "ada/common_defs.h"
15 | #include "ada/errors.h"
16 | #include "ada/url_pattern_init.h"
17 | 
18 | namespace ada {
19 | 
20 | template <class result_type = ada::url_aggregator>
21 | using result = tl::expected<result_type, ada::errors>;
22 | 
23 | /**
24 |  * The URL parser takes a scalar value string input and an optional base URL
25 |  * (null by default). The parser assumes the input is a valid ASCII
26 |  * or UTF-8 string.
27 |  *
28 |  * @param input the string input to analyze (must be valid ASCII or UTF-8)
29 |  * @param base_url the optional URL input to use as a base url.
30 |  * @return a parsed URL.
31 |  */
32 | template <class result_type = ada::url_aggregator>
33 | ada_warn_unused ada::result<result_type> parse(
34 |     std::string_view input, const result_type* base_url = nullptr);
35 | 
36 | extern template ada::result<url> parse<url>(std::string_view input,
37 |                                             const url* base_url);
38 | extern template ada::result<url_aggregator> parse<url_aggregator>(
39 |     std::string_view input, const url_aggregator* base_url);
40 | 
41 | /**
42 |  * Verifies whether the URL strings can be parsed. The function assumes
43 |  * that the inputs are valid ASCII or UTF-8 strings.
44 |  * @see https://url.spec.whatwg.org/#dom-url-canparse
45 |  * @return If URL can be parsed or not.
46 |  */
47 | bool can_parse(std::string_view input,
48 |                const std::string_view* base_input = nullptr);
49 | 
50 | #if ADA_INCLUDE_URL_PATTERN
51 | /**
52 |  * Implementation of the URL pattern parsing algorithm.
53 |  * @see https://urlpattern.spec.whatwg.org
54 |  *
55 |  * @param input valid UTF-8 string or URLPatternInit struct
56 |  * @param base_url an optional valid UTF-8 string
57 |  * @param options an optional url_pattern_options struct
58 |  * @return url_pattern instance
59 |  */
60 | template <url_pattern_regex::regex_concept regex_provider>
61 | ada_warn_unused tl::expected<url_pattern<regex_provider>, errors>
62 | parse_url_pattern(std::variant<std::string_view, url_pattern_init>&& input,
63 |                   const std::string_view* base_url = nullptr,
64 |                   const url_pattern_options* options = nullptr);
65 | #endif  // ADA_INCLUDE_URL_PATTERN
66 | 
67 | /**
68 |  * Computes a href string from a file path. The function assumes
69 |  * that the input is a valid ASCII or UTF-8 string.
70 |  * @return a href string (starts with file://)
71 |  */
72 | std::string href_from_file(std::string_view path);
73 | }  // namespace ada
74 | 
75 | #endif  // ADA_IMPLEMENTATION_H
76 | 


--------------------------------------------------------------------------------
/include/ada/log.h:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * @file log.h
 3 |  * @brief Includes the definitions for logging.
 4 |  * @private Excluded from docs through the doxygen file.
 5 |  */
 6 | #ifndef ADA_LOG_H
 7 | #define ADA_LOG_H
 8 | #include "ada/common_defs.h"
 9 | 
10 | // To enable logging, set ADA_LOGGING to 1:
11 | #ifndef ADA_LOGGING
12 | #define ADA_LOGGING 0
13 | #endif
14 | 
15 | #if ADA_LOGGING
16 | #include <iostream>
17 | #endif  // ADA_LOGGING
18 | 
19 | namespace ada {
20 | 
21 | /**
22 |  * Streams "ADA_LOG: " and then each argument to std::cout when ADA_LOGGING is
23 |  * non-zero; otherwise the body is empty. For zero overhead, use ada_log.
24 |  * @private
25 |  */
26 | template <typename... Args>
27 | constexpr ada_really_inline void log([[maybe_unused]] Args... args) {
28 | #if ADA_LOGGING
29 |   ((std::cout << "ADA_LOG: ") << ... << args) << std::endl;
30 | #endif  // ADA_LOGGING
31 | }
32 | }  // namespace ada
33 | 
34 | #if ADA_LOGGING
35 | #ifndef ada_log
36 | #define ada_log(...)       \
37 |   do {                     \
38 |     ada::log(__VA_ARGS__); \
39 |   } while (0)
40 | #endif  // ada_log
41 | #else
42 | #define ada_log(...)
43 | #endif  // ADA_LOGGING
44 | 
45 | #endif  // ADA_LOG_H
46 | 


--------------------------------------------------------------------------------
/include/ada/parser.h:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * @file parser.h
 3 |  * @brief Definitions for the parser.
 4 |  */
 5 | #ifndef ADA_PARSER_H
 6 | #define ADA_PARSER_H
 7 | 
 8 | #include <string_view>
 9 | #include <variant>
10 | 
11 | #include "ada/expected.h"
12 | 
13 | #include "ada/url_pattern_regex.h"
14 | #include "ada/url_pattern_init.h"
15 | 
16 | /**
17 |  * @private
18 |  */
19 | namespace ada {
20 | struct url_aggregator;
21 | struct url;
22 | #if ADA_INCLUDE_URL_PATTERN
23 | template <url_pattern_regex::regex_concept regex_provider>
24 | class url_pattern;
25 | struct url_pattern_options;
26 | #endif  // ADA_INCLUDE_URL_PATTERN
27 | enum class errors : uint8_t;
28 | }  // namespace ada
29 | 
30 | /**
31 |  * @namespace ada::parser
32 |  * @brief Includes the definitions for supported parsers
33 |  */
34 | namespace ada::parser {
35 | /**
36 |  * Parses a url. The parameter user_input is the input to be parsed:
37 |  * it should be a valid UTF-8 string. The parameter base_url is an optional
38 |  * parameter that can be used to resolve relative URLs. If the base_url is
39 |  * provided, the user_input is resolved against the base_url.
40 |  */
41 | template <typename result_type = url_aggregator>
42 | result_type parse_url(std::string_view user_input,
43 |                       const result_type* base_url = nullptr);
44 | 
45 | extern template url_aggregator parse_url<url_aggregator>(
46 |     std::string_view user_input, const url_aggregator* base_url);
47 | extern template url parse_url<url>(std::string_view user_input,
48 |                                    const url* base_url);
49 | 
50 | template <typename result_type = url_aggregator, bool store_values = true>
51 | result_type parse_url_impl(std::string_view user_input,
52 |                            const result_type* base_url = nullptr);
53 | 
54 | extern template url_aggregator parse_url_impl<url_aggregator>(
55 |     std::string_view user_input, const url_aggregator* base_url);
56 | extern template url parse_url_impl<url>(std::string_view user_input,
57 |                                         const url* base_url);
58 | 
59 | #if ADA_INCLUDE_URL_PATTERN
60 | template <url_pattern_regex::regex_concept regex_provider>
61 | tl::expected<url_pattern<regex_provider>, errors> parse_url_pattern_impl(
62 |     std::variant<std::string_view, url_pattern_init>&& input,
63 |     const std::string_view* base_url, const url_pattern_options* options);
64 | #endif  // ADA_INCLUDE_URL_PATTERN
65 | 
66 | }  // namespace ada::parser
67 | 
68 | #endif  // ADA_PARSER_H
69 | 


--------------------------------------------------------------------------------
/include/ada/scheme-inl.h:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * @file scheme-inl.h
 3 |  * @brief Definitions for the URL scheme.
 4 |  */
 5 | #ifndef ADA_SCHEME_INL_H
 6 | #define ADA_SCHEME_INL_H
 7 | 
 8 | #include "ada/scheme.h"
 9 | 
10 | namespace ada::scheme {
11 | 
12 | /**
13 |  * @namespace ada::scheme::details
14 |  * @brief Includes the definitions for scheme specific entities
15 |  */
16 | namespace details {
17 | // Indexed by the hash computed in is_special, get_special_port and
18 | // get_scheme_type. Spaces, if present, are removed from URL.
19 | constexpr std::string_view is_special_list[] = {"http", " ",   "https", "ws",
20 |                                                 "ftp",  "wss", "file",  " "};
21 | // Port for the scheme stored at the same index of is_special_list.
22 | constexpr uint16_t special_ports[] = {80, 0, 443, 80, 21, 443, 0, 0};
23 | }  // namespace details
24 | 
25 | /****
26 |  * @private
27 |  * In is_special, get_scheme_type, and get_special_port, we
28 |  * use a standard hashing technique to find the index of the scheme in
29 |  * the is_special_list. The hashing technique is based on the size of
30 |  * the scheme and the first character of the scheme. It ensures that we
31 |  * do at most one string comparison per call. If the protocol is
32 |  * predictable (e.g., it is always "http"), we can get a better average
33 |  * performance by using a simpler approach where we loop and compare
34 |  * scheme with all possible protocols starting with the most likely
35 |  * protocol. Doing multiple comparisons may have a poor worst case
36 |  * performance, however. In this instance, we choose a potentially
37 |  * slightly lower best-case performance for a better worst-case
38 |  * performance. We can revisit this choice at any time.
39 |  *
40 |  * Reference:
41 |  * Schmidt, Douglas C. "Gperf: A perfect hash function generator."
42 |  * More C++ gems 17 (2000).
43 |  *
44 |  * Reference: https://en.wikipedia.org/wiki/Perfect_hash_function
45 |  *
46 |  * Reference: https://github.com/ada-url/ada/issues/617
47 |  ****/
48 | 
49 | ada_really_inline constexpr bool is_special(std::string_view scheme) {
50 |   if (scheme.empty()) return false;
51 |   // The (length, first character) hash yields the only slot worth checking.
52 |   const auto slot = (2 * scheme.size() + (unsigned)(scheme[0])) & 7;
53 |   const std::string_view candidate = details::is_special_list[slot];
54 |   // Test the first character before comparing the rest of the string.
55 |   return candidate[0] == scheme[0] && candidate.substr(1) == scheme.substr(1);
56 | }
57 | constexpr uint16_t get_special_port(std::string_view scheme) noexcept {
58 |   // Port 0 is reported for an empty scheme and whenever the lookup misses.
59 |   if (scheme.empty()) return 0;
60 |   // The (length, first character) hash selects the one table slot to check.
61 |   const auto slot = (2 * scheme.size() + (unsigned)(scheme[0])) & 7;
62 |   const std::string_view candidate = details::is_special_list[slot];
63 |   // Cheap first-character test, then the remainder of the string.
64 |   const bool first_matches = candidate[0] == scheme[0];
65 |   const bool is_match =
66 |       first_matches && (candidate.substr(1) == scheme.substr(1));
67 |   return is_match ? details::special_ports[slot] : uint16_t{0};
68 | }
69 | constexpr uint16_t get_special_port(ada::scheme::type type) noexcept {
70 |   return details::special_ports[static_cast<int>(type)];  // enum is the index
71 | }
72 | constexpr ada::scheme::type get_scheme_type(std::string_view scheme) noexcept {
73 |   // An empty scheme cannot be hashed on its first character.
74 |   if (scheme.empty()) return ada::scheme::NOT_SPECIAL;
75 |   const auto slot = (2 * scheme.size() + (unsigned)(scheme[0])) & 7;
76 |   const std::string_view candidate = details::is_special_list[slot];
77 |   // Reject on the first character, then on the rest of the string.
78 |   if (candidate[0] != scheme[0] || candidate.substr(1) != scheme.substr(1)) {
79 |     return ada::scheme::NOT_SPECIAL;
80 |   }
81 |   // On a match, the slot number doubles as the enumerator value.
82 |   return ada::scheme::type(slot);
83 | }
84 | 
85 | }  // namespace ada::scheme
86 | 
87 | #endif  // ADA_SCHEME_INL_H
88 | 


--------------------------------------------------------------------------------
/include/ada/scheme.h:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * @file scheme.h
 3 |  * @brief Declarations for the URL scheme.
 4 |  */
 5 | #ifndef ADA_SCHEME_H
 6 | #define ADA_SCHEME_H
 7 | 
 8 | #include "ada/common_defs.h"
 9 | 
10 | #include <string>
11 | 
12 | /**
13 |  * @namespace ada::scheme
14 |  * @brief Includes the scheme declarations
15 |  */
16 | namespace ada::scheme {
17 | 
18 | /**
19 |  * Type of the scheme as an enum. Comparing integers is faster than comparing
20 |  * strings, which is why schemes are not represented by their names.
21 |  * The underlying type is fixed to an 8-bit integer (up to 256 values), so the
22 |  * representation does not depend on the compiler; this may help integration
23 |  * with other systems if the value is exposed.
24 |  * The numeric values matter: scheme-inl.h converts between these enumerators
25 |  * and positions in its lookup tables (see get_scheme_type and
26 |  * get_special_port), so they must stay in sync with those tables.
27 |  */
28 | enum type : uint8_t {
29 |   HTTP = 0,
30 |   NOT_SPECIAL = 1,
31 |   HTTPS = 2,
32 |   WS = 3,
33 |   FTP = 4,
34 |   WSS = 5,
35 |   FILE = 6
36 | };
37 | 
38 | /**
39 |  * A special scheme is an ASCII string that is listed in the first column of the
40 |  * following table. The default port for a special scheme is listed in the
41 |  * second column on the same row. The default port for any other ASCII string is
42 |  * null.
43 |  *
44 |  * @see https://url.spec.whatwg.org/#url-miscellaneous
45 |  * @param scheme
46 |  * @return If scheme is a special scheme
47 |  */
48 | ada_really_inline constexpr bool is_special(std::string_view scheme);
49 | 
50 | /**
51 |  * A special scheme is an ASCII string that is listed in the first column of the
52 |  * following table. The default port for a special scheme is listed in the
53 |  * second column on the same row. The default port for any other ASCII string is
54 |  * null.
55 |  *
56 |  * @see https://url.spec.whatwg.org/#url-miscellaneous
57 |  * @param scheme
58 |  * @return The special port
59 |  */
60 | constexpr uint16_t get_special_port(std::string_view scheme) noexcept;
61 | 
62 | /**
63 |  * Returns the port number of a special scheme.
64 |  * @see https://url.spec.whatwg.org/#special-scheme
65 |  */
66 | constexpr uint16_t get_special_port(ada::scheme::type type) noexcept;
67 | /**
68 |  * Returns the scheme of an input, or NOT_SPECIAL if it's not a special scheme
69 |  * defined by the spec.
70 |  */
71 | constexpr ada::scheme::type get_scheme_type(std::string_view scheme) noexcept;
72 | 
73 | }  // namespace ada::scheme
74 | 
75 | #endif  // ADA_SCHEME_H
76 | 


--------------------------------------------------------------------------------
/include/ada/serializers.h:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * @file serializers.h
 3 |  * @brief Definitions for the URL serializers.
 4 |  */
 5 | #ifndef ADA_SERIALIZERS_H
 6 | #define ADA_SERIALIZERS_H
 7 | 
 8 | #include "ada/common_defs.h"
 9 | 
10 | #include <array>
11 | #include <string>
12 | 
13 | /**
14 |  * @namespace ada::serializers
15 |  * @brief Includes the definitions for URL serializers
16 |  */
17 | namespace ada::serializers {
18 | 
19 | /**
20 |  * Finds and returns the longest sequence of 0 values in an ipv6 input.
21 |  */
22 | void find_longest_sequence_of_ipv6_pieces(
23 |     const std::array<uint16_t, 8>& address, size_t& compress,
24 |     size_t& compress_length) noexcept;
25 | 
26 | /**
27 |  * Serializes an ipv6 address.
28 |  * @details An IPv6 address is a 128-bit unsigned integer that identifies a
29 |  * network address.
30 |  * @see https://url.spec.whatwg.org/#concept-ipv6-serializer
31 |  */
32 | std::string ipv6(const std::array<uint16_t, 8>& address) noexcept;
33 | 
34 | /**
35 |  * Serializes an ipv4 address.
36 |  * @details An IPv4 address is a 32-bit unsigned integer that identifies a
37 |  * network address.
38 |  * @see https://url.spec.whatwg.org/#concept-ipv4-serializer
39 |  */
40 | std::string ipv4(uint64_t address) noexcept;
41 | 
42 | }  // namespace ada::serializers
43 | 
44 | #endif  // ADA_SERIALIZERS_H
45 | 


--------------------------------------------------------------------------------
/include/ada/state.h:
--------------------------------------------------------------------------------
  1 | /**
  2 |  * @file state.h
  3 |  * @brief Definitions for the states of the URL state machine.
  4 |  */
  5 | #ifndef ADA_STATE_H
  6 | #define ADA_STATE_H
  7 | 
  8 | #include "ada/common_defs.h"
  9 | 
 10 | #include <string>
 11 | 
 12 | namespace ada {
 13 | 
 14 | /**
 15 |  * @see https://url.spec.whatwg.org/#url-parsing
 16 |  */
 17 | enum class state {
 18 |   /**
 19 |    * @see https://url.spec.whatwg.org/#authority-state
 20 |    */
 21 |   AUTHORITY,
 22 | 
 23 |   /**
 24 |    * @see https://url.spec.whatwg.org/#scheme-start-state
 25 |    */
 26 |   SCHEME_START,
 27 | 
 28 |   /**
 29 |    * @see https://url.spec.whatwg.org/#scheme-state
 30 |    */
 31 |   SCHEME,
 32 | 
 33 |   /**
 34 |    * @see https://url.spec.whatwg.org/#host-state
 35 |    */
 36 |   HOST,
 37 | 
 38 |   /**
 39 |    * @see https://url.spec.whatwg.org/#no-scheme-state
 40 |    */
 41 |   NO_SCHEME,
 42 | 
 43 |   /**
 44 |    * @see https://url.spec.whatwg.org/#fragment-state
 45 |    */
 46 |   FRAGMENT,
 47 | 
 48 |   /**
 49 |    * @see https://url.spec.whatwg.org/#relative-state
 50 |    */
 51 |   RELATIVE_SCHEME,
 52 | 
 53 |   /**
 54 |    * @see https://url.spec.whatwg.org/#relative-slash-state
 55 |    */
 56 |   RELATIVE_SLASH,
 57 | 
 58 |   /**
 59 |    * @see https://url.spec.whatwg.org/#file-state
 60 |    */
 61 |   FILE,
 62 | 
 63 |   /**
 64 |    * @see https://url.spec.whatwg.org/#file-host-state
 65 |    */
 66 |   FILE_HOST,
 67 | 
 68 |   /**
 69 |    * @see https://url.spec.whatwg.org/#file-slash-state
 70 |    */
 71 |   FILE_SLASH,
 72 | 
 73 |   /**
 74 |    * @see https://url.spec.whatwg.org/#path-or-authority-state
 75 |    */
 76 |   PATH_OR_AUTHORITY,
 77 | 
 78 |   /**
 79 |    * @see https://url.spec.whatwg.org/#special-authority-ignore-slashes-state
 80 |    */
 81 |   SPECIAL_AUTHORITY_IGNORE_SLASHES,
 82 | 
 83 |   /**
 84 |    * @see https://url.spec.whatwg.org/#special-authority-slashes-state
 85 |    */
 86 |   SPECIAL_AUTHORITY_SLASHES,
 87 | 
 88 |   /**
 89 |    * @see https://url.spec.whatwg.org/#special-relative-or-authority-state
 90 |    */
 91 |   SPECIAL_RELATIVE_OR_AUTHORITY,
 92 | 
 93 |   /**
 94 |    * @see https://url.spec.whatwg.org/#query-state
 95 |    */
 96 |   QUERY,
 97 | 
 98 |   /**
 99 |    * @see https://url.spec.whatwg.org/#path-state
100 |    */
101 |   PATH,
102 | 
103 |   /**
104 |    * @see https://url.spec.whatwg.org/#path-start-state
105 |    */
106 |   PATH_START,
107 | 
108 |   /**
109 |    * @see https://url.spec.whatwg.org/#cannot-be-a-base-url-path-state
110 |    */
111 |   OPAQUE_PATH,
112 | 
113 |   /**
114 |    * @see https://url.spec.whatwg.org/#port-state
115 |    */
116 |   PORT,
117 | };
118 | 
119 | /**
120 |  * Stringify a URL state machine state.
121 |  */
122 | ada_warn_unused std::string to_string(ada::state s);
123 | 
124 | }  // namespace ada
125 | 
126 | #endif  // ADA_STATE_H
127 | 


--------------------------------------------------------------------------------
/include/ada/unicode-inl.h:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * @file unicode-inl.h
 3 |  * @brief Definitions for unicode operations.
 4 |  */
 5 | #ifndef ADA_UNICODE_INL_H
 6 | #define ADA_UNICODE_INL_H
 7 | #include "ada/unicode.h"
 8 | #include "ada/character_sets.h"
 9 | 
10 | /**
11 |  * Unicode operations. These functions are not part of our public API and may
12 |  * change at any time.
13 |  *
14 |  * @private
15 |  * @namespace ada::unicode
16 |  * @brief Includes the declarations for unicode operations
17 |  */
18 | namespace ada::unicode {
19 | ada_really_inline size_t percent_encode_index(const std::string_view input,
20 |                                               const uint8_t character_set[]) {
21 |   // Returns the offset of the first byte of `input` for which
22 |   // character_sets::bit_at(character_set, byte) holds, else input.size().
23 |   const size_t length = input.size();
24 |   const char* const bytes = input.data();
25 |   size_t pos = 0;
26 |   // Whole blocks of 8: the fixed-size copy entices the compiler to process
27 |   // 8 characters unconditionally.
28 |   while (pos + 8 <= length) {
29 |     unsigned char block[8];
30 |     std::memcpy(&block, bytes + pos, 8);
31 |     for (size_t k = 0; k != 8; ++k) {
32 |       if (character_sets::bit_at(character_set, block[k])) {
33 |         return pos + k;
34 |       }
35 |     }
36 |     pos += 8;
37 |   }
38 | 
39 |   // Tail: fewer than 8 bytes are left.
40 |   while (pos < length) {
41 |     if (character_sets::bit_at(character_set, bytes[pos])) {
42 |       return pos;
43 |     }
44 |     ++pos;
45 |   }
46 |   return length;
47 | }
48 | }  // namespace ada::unicode
49 | 
50 | #endif  // ADA_UNICODE_INL_H
51 | 


--------------------------------------------------------------------------------
/include/ada/url_base-inl.h:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * @file url_base-inl.h
 3 |  * @brief Inline functions for url base
 4 |  */
 5 | #ifndef ADA_URL_BASE_INL_H
 6 | #define ADA_URL_BASE_INL_H
 7 | 
 8 | #include "ada/scheme.h"
 9 | #include "ada/checkers.h"
10 | #include "ada/url.h"
11 | 
12 | #include <string>
13 | #if ADA_REGULAR_VISUAL_STUDIO
14 | #include <intrin.h>
15 | #endif  // ADA_REGULAR_VISUAL_STUDIO
16 | 
17 | namespace ada {
18 | 
19 | [[nodiscard]] ada_really_inline constexpr bool url_base::is_special()
20 |     const noexcept {
21 |   return type != ada::scheme::NOT_SPECIAL;
22 | }
23 | 
24 | [[nodiscard]] inline uint16_t url_base::get_special_port() const noexcept {
25 |   return ada::scheme::get_special_port(type);
26 | }
27 | 
28 | [[nodiscard]] ada_really_inline uint16_t
29 | url_base::scheme_default_port() const noexcept {
30 |   return scheme::get_special_port(type);
31 | }
32 | 
33 | }  // namespace ada
34 | 
35 | #endif  // ADA_URL_BASE_INL_H
36 | 


--------------------------------------------------------------------------------
/include/ada/url_base.h:
--------------------------------------------------------------------------------
  1 | /**
  2 |  * @file url_base.h
  3 |  * @brief Declaration for the basic URL definitions
  4 |  */
  5 | #ifndef ADA_URL_BASE_H
  6 | #define ADA_URL_BASE_H
  7 | 
  8 | #include "ada/common_defs.h"
  9 | #include "ada/scheme.h"
 10 | 
 11 | #include <string>
 12 | #include <string_view>
 13 | 
 14 | namespace ada {
 15 | 
 16 | /**
 17 |  * Type of URL host as an enum.
 18 |  */
 19 | enum url_host_type : uint8_t {
 20 |   /**
 21 |    * Represents common URLs such as "https://www.google.com"
 22 |    */
 23 |   DEFAULT = 0,
 24 |   /**
 25 |    * Represents ipv4 addresses such as "http://127.0.0.1"
 26 |    */
 27 |   IPV4 = 1,
 28 |   /**
 29 |    * Represents ipv6 addresses such as
 30 |    * "http://[2001:db8:3333:4444:5555:6666:7777:8888]"
 31 |    */
 32 |   IPV6 = 2,
 33 | };
 34 | 
 35 | /**
 36 |  * @brief Base class of URL implementations
 37 |  *
 38 |  * @details A url_base contains a few attributes: is_valid, has_opaque_path and
 39 |  * type. All non-trivial implementation details are in derived classes such as
 40 |  * ada::url and ada::url_aggregator.
 41 |  *
 42 |  * It is an abstract class that cannot be instantiated directly.
 43 |  */
 44 | struct url_base {
 45 |   virtual ~url_base() = default;
 46 | 
 47 |   /**
 48 |    * Used for returning the validity from the result of the URL parser.
 49 |    */
 50 |   bool is_valid{true};
 51 | 
 52 |   /**
 53 |    * A URL has an opaque path if its path is a string.
 54 |    */
 55 |   bool has_opaque_path{false};
 56 | 
 57 |   /**
 58 |    * URL hosts type
 59 |    */
 60 |   url_host_type host_type = url_host_type::DEFAULT;
 61 | 
 62 |   /**
 63 |    * @private
 64 |    */
 65 |   ada::scheme::type type{ada::scheme::type::NOT_SPECIAL};
 66 | 
 67 |   /**
 68 |    * A URL is special if its scheme is a special scheme. A URL is not special if
 69 |    * its scheme is not a special scheme.
 70 |    */
 71 |   [[nodiscard]] ada_really_inline constexpr bool is_special() const noexcept;
 72 | 
 73 |   /**
 74 |    * The origin getter steps are to return the serialization of this's URL's
 75 |    * origin. [HTML]
 76 |    * @return a newly allocated string.
 77 |    * @see https://url.spec.whatwg.org/#concept-url-origin
 78 |    */
 79 |   [[nodiscard]] virtual std::string get_origin() const noexcept = 0;
 80 | 
 81 |   /**
 82 |    * Returns true if this URL has a valid domain as per RFC 1034 and
 83 |    * corresponding specifications. Among other things, it requires
 84 |    * that the domain string has fewer than 255 octets.
 85 |    */
 86 |   [[nodiscard]] virtual bool has_valid_domain() const noexcept = 0;
 87 | 
 88 |   /**
 89 |    * @private
 90 |    *
 91 |    * Return the 'special port' if the URL is special and not 'file'.
 92 |    * Returns 0 otherwise.
 93 |    */
 94 |   [[nodiscard]] inline uint16_t get_special_port() const noexcept;
 95 | 
 96 |   /**
 97 |    * @private
 98 |    *
 99 |    * Get the default port if the url's scheme has one, returns 0 otherwise.
100 |    */
101 |   [[nodiscard]] ada_really_inline uint16_t scheme_default_port() const noexcept;
102 | 
103 |   /**
104 |    * @private
105 |    *
106 |    * Parse a port (16-bit decimal digit) from the provided input.
107 |    * We assume that the input does not contain spaces or tabs
108 |    * within the ASCII digits.
109 |    * It returns how many bytes were consumed when a number is successfully
110 |    * parsed.
111 |    * @return On failure, it returns zero.
112 |    * @see https://url.spec.whatwg.org/#host-parsing
113 |    */
114 |   virtual size_t parse_port(std::string_view view,
115 |                             bool check_trailing_content) noexcept = 0;
116 | 
117 |   virtual ada_really_inline size_t parse_port(std::string_view view) noexcept {
118 |     return this->parse_port(view, false);
119 |   }
120 | 
121 |   /**
122 |    * Returns a JSON string representation of this URL.
123 |    */
124 |   [[nodiscard]] virtual std::string to_string() const = 0;
125 | 
126 |   /** @private */
127 |   virtual inline void clear_pathname() = 0;
128 | 
129 |   /** @private */
130 |   virtual inline void clear_search() = 0;
131 | 
132 |   /** @private */
133 |   [[nodiscard]] virtual inline bool has_hash() const noexcept = 0;
134 | 
135 |   /** @private */
136 |   [[nodiscard]] virtual inline bool has_search() const noexcept = 0;
137 | 
138 | };  // url_base
139 | 
140 | }  // namespace ada
141 | 
142 | #endif
143 | 


--------------------------------------------------------------------------------
/include/ada/url_components-inl.h:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * @file url_components-inl.h
 3 |  * @brief Inline functions for the URL Components
 4 |  */
 5 | #ifndef ADA_URL_COMPONENTS_INL_H
 6 | #define ADA_URL_COMPONENTS_INL_H
 7 | 
 8 | #include "ada/url_components.h"
 9 | 
10 | namespace ada {
11 | 
12 | [[nodiscard]] constexpr bool url_components::check_offset_consistency()
13 |     const noexcept {
14 |   /**
15 |    * https://user:pass@example.com:1234/foo/bar?baz#quux
16 |    *       |     |    |          | ^^^^|       |   |
17 |    *       |     |    |          | |   |       |   `----- hash_start
18 |    *       |     |    |          | |   |       `--------- search_start
19 |    *       |     |    |          | |   `----------------- pathname_start
20 |    *       |     |    |          | `--------------------- port
21 |    *       |     |    |          `----------------------- host_end
22 |    *       |     |    `---------------------------------- host_start
23 |    *       |     `--------------------------------------- username_end
24 |    *       `--------------------------------------------- protocol_end
25 |    */
26 |   // Offsets must appear in non-decreasing order; equal neighbours are
27 |   // accepted and host_end is not examined, so the check could be stricter.
28 |   constexpr uint32_t none = url_components::omitted;
29 | 
30 |   // protocol_end is mandatory.
31 |   if (protocol_end == none) {
32 |     return false;
33 |   }
34 | 
35 |   // username_end is mandatory and may not precede protocol_end.
36 |   if (username_end == none || username_end < protocol_end) {
37 |     return false;
38 |   }
39 | 
40 |   // host_start is mandatory and may not precede username_end.
41 |   if (host_start == none || host_start < username_end) {
42 |     return false;
43 |   }
44 | 
45 |   // `floor` is the smallest offset the next component may start at.
46 |   uint32_t floor = host_start;
47 | 
48 |   if (port != none) {
49 |     // A present port must fit in 16 bits.
50 |     if (port > 0xffff) {
51 |       return false;
52 |     }
53 |     // Port span: digit count plus one (presumably for the ':' separator).
54 |     const uint32_t port_span = helpers::fast_digit_count(port) + 1;
55 |     const uint32_t past_port = floor + port_span;
56 |     // Unsigned wrap-around means the offsets cannot be consistent.
57 |     if (past_port < floor) {
58 |       return false;
59 |     }
60 |     floor = past_port;
61 |   }
62 | 
63 |   // pathname_start is mandatory and may not precede what came before it.
64 |   if (pathname_start == none || pathname_start < floor) {
65 |     return false;
66 |   }
67 |   floor = pathname_start;
68 | 
69 |   // search_start and hash_start are optional, but ordered when present.
70 |   if (search_start != none) {
71 |     if (search_start < floor) {
72 |       return false;
73 |     }
74 |     floor = search_start;
75 |   }
76 |   if (hash_start != none && hash_start < floor) {
77 |     return false;
78 |   }
79 | 
80 |   return true;
81 | }
82 | 
83 | }  // namespace ada
84 | #endif
85 | 


--------------------------------------------------------------------------------
/include/ada/url_components.h:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * @file url_components.h
 3 |  * @brief Declaration for the URL Components
 4 |  */
 5 | #ifndef ADA_URL_COMPONENTS_H
 6 | #define ADA_URL_COMPONENTS_H
 7 | 
 8 | namespace ada {
 9 | 
10 | /**
11 |  * @brief URL Component representations using offsets.
12 |  *
13 |  * @details We design the url_components struct so that it is as small
14 |  * and simple as possible. This version uses 32 bytes.
15 |  *
16 |  * This struct is used to extract components from a single 'href'.
17 |  */
18 | struct url_components {
19 |   constexpr static uint32_t omitted = uint32_t(-1);
20 | 
21 |   url_components() = default;
22 |   url_components(const url_components &u) = default;
23 |   url_components(url_components &&u) noexcept = default;
24 |   url_components &operator=(url_components &&u) noexcept = default;
25 |   url_components &operator=(const url_components &u) = default;
26 |   ~url_components() = default;
27 | 
28 |   /*
29 |    * By using 32-bit integers, we implicitly assume that the URL string
30 |    * cannot exceed 4 GB.
31 |    *
32 |    * https://user:pass@example.com:1234/foo/bar?baz#quux
33 |    *       |     |    |          | ^^^^|       |   |
34 |    *       |     |    |          | |   |       |   `----- hash_start
35 |    *       |     |    |          | |   |       `--------- search_start
36 |    *       |     |    |          | |   `----------------- pathname_start
37 |    *       |     |    |          | `--------------------- port
38 |    *       |     |    |          `----------------------- host_end
39 |    *       |     |    `---------------------------------- host_start
40 |    *       |     `--------------------------------------- username_end
41 |    *       `--------------------------------------------- protocol_end
42 |    */
43 |   uint32_t protocol_end{0};
44 |   /**
45 |    * Username end is not `omitted` by default to make username and password
46 |    * getters less costly to implement.
47 |    */
48 |   uint32_t username_end{0};
49 |   uint32_t host_start{0};
50 |   uint32_t host_end{0};
51 |   uint32_t port{omitted};
52 |   uint32_t pathname_start{0};
53 |   uint32_t search_start{omitted};
54 |   uint32_t hash_start{omitted};
55 | 
56 |   /**
57 |    * Check the following conditions:
58 |    * protocol_end <= username_end <= ... <= hash_start,
59 |    * except when a value is omitted. It also computes
60 |    * a lower bound on the possible string length that may match these
61 |    * offsets.
62 |    * @return true if the offset values are
63 |    *  consistent with a possible URL string
64 |    */
65 |   [[nodiscard]] constexpr bool check_offset_consistency() const noexcept;
66 | 
67 |   /**
68 |    * Converts a url_components to JSON stringified version.
69 |    */
70 |   [[nodiscard]] std::string to_string() const;
71 | 
72 | };  // struct url_components
73 | }  // namespace ada
74 | #endif
75 | 


--------------------------------------------------------------------------------
/include/ada/url_pattern_init.h:
--------------------------------------------------------------------------------
  1 | /**
  2 |  * @file url_pattern_init.h
  3 |  * @brief Declaration for the url_pattern_init implementation.
  4 |  */
  5 | #ifndef ADA_URL_PATTERN_INIT_H
  6 | #define ADA_URL_PATTERN_INIT_H
  7 | 
  8 | #include "ada/expected.h"
  9 | #include "ada/errors.h"
 10 | 
 11 | #include <string_view>
 12 | #include <string>
 13 | #include <optional>
 14 | 
 15 | #if ADA_TESTING
 16 | #include <iostream>
 17 | #endif  // ADA_TESTING
 18 | 
 19 | #if ADA_INCLUDE_URL_PATTERN
 20 | namespace ada {
 21 | 
22 | // Important: C++20 allows us to use concept rather than `using` or `typedef`
 23 | // and allows functions with second argument, which is optional (using either
 24 | // std::nullopt or a parameter with default value)
 25 | template <typename F>
 26 | concept url_pattern_encoding_callback = requires(F f, std::string_view sv) {
 27 |   { f(sv) } -> std::same_as<tl::expected<std::string, errors>>;
 28 | };
 29 | 
 30 | // A structure providing matching patterns for individual components
 31 | // of a URL. When a URLPattern is created, or when a URLPattern is
 32 | // used to match or test against a URL, the input can be given as
 33 | // either a string or a URLPatternInit struct. If a string is given,
 34 | // it will be parsed to create a URLPatternInit. The URLPatternInit
 35 | // API is defined as part of the URLPattern specification.
 36 | // All provided strings must be valid UTF-8.
 37 | struct url_pattern_init {
 38 |   enum class process_type : uint8_t {
 39 |     url,
 40 |     pattern,
 41 |   };
 42 | 
 43 |   // All strings must be valid UTF-8.
 44 |   // @see https://urlpattern.spec.whatwg.org/#process-a-urlpatterninit
 45 |   static tl::expected<url_pattern_init, errors> process(
 46 |       const url_pattern_init& init, process_type type,
 47 |       std::optional<std::string_view> protocol = std::nullopt,
 48 |       std::optional<std::string_view> username = std::nullopt,
 49 |       std::optional<std::string_view> password = std::nullopt,
 50 |       std::optional<std::string_view> hostname = std::nullopt,
 51 |       std::optional<std::string_view> port = std::nullopt,
 52 |       std::optional<std::string_view> pathname = std::nullopt,
 53 |       std::optional<std::string_view> search = std::nullopt,
 54 |       std::optional<std::string_view> hash = std::nullopt);
 55 | 
 56 |   // @see https://urlpattern.spec.whatwg.org/#process-protocol-for-init
 57 |   static tl::expected<std::string, errors> process_protocol(
 58 |       std::string_view value, process_type type);
 59 | 
 60 |   // @see https://urlpattern.spec.whatwg.org/#process-username-for-init
 61 |   static tl::expected<std::string, errors> process_username(
 62 |       std::string_view value, process_type type);
 63 | 
 64 |   // @see https://urlpattern.spec.whatwg.org/#process-password-for-init
 65 |   static tl::expected<std::string, errors> process_password(
 66 |       std::string_view value, process_type type);
 67 | 
 68 |   // @see https://urlpattern.spec.whatwg.org/#process-hostname-for-init
 69 |   static tl::expected<std::string, errors> process_hostname(
 70 |       std::string_view value, process_type type);
 71 | 
 72 |   // @see https://urlpattern.spec.whatwg.org/#process-port-for-init
 73 |   static tl::expected<std::string, errors> process_port(
 74 |       std::string_view port, std::string_view protocol, process_type type);
 75 | 
 76 |   // @see https://urlpattern.spec.whatwg.org/#process-pathname-for-init
 77 |   static tl::expected<std::string, errors> process_pathname(
 78 |       std::string_view value, std::string_view protocol, process_type type);
 79 | 
 80 |   // @see https://urlpattern.spec.whatwg.org/#process-search-for-init
 81 |   static tl::expected<std::string, errors> process_search(
 82 |       std::string_view value, process_type type);
 83 | 
 84 |   // @see https://urlpattern.spec.whatwg.org/#process-hash-for-init
 85 |   static tl::expected<std::string, errors> process_hash(std::string_view value,
 86 |                                                         process_type type);
 87 | 
 88 | #if ADA_TESTING
 89 |   friend void PrintTo(const url_pattern_init& init, std::ostream* os) {
 90 |     *os << "protocol: '" << init.protocol.value_or("undefined") << "', ";
 91 |     *os << "username: '" << init.username.value_or("undefined") << "', ";
 92 |     *os << "password: '" << init.password.value_or("undefined") << "', ";
 93 |     *os << "hostname: '" << init.hostname.value_or("undefined") << "', ";
 94 |     *os << "port: '" << init.port.value_or("undefined") << "', ";
 95 |     *os << "pathname: '" << init.pathname.value_or("undefined") << "', ";
 96 |     *os << "search: '" << init.search.value_or("undefined") << "', ";
 97 |     *os << "hash: '" << init.hash.value_or("undefined") << "', ";
 98 |     *os << "base_url: '" << init.base_url.value_or("undefined") << "', ";
 99 |   }
100 | #endif  // ADA_TESTING
101 | 
102 |   bool operator==(const url_pattern_init&) const;
103 |   // If present, must be valid UTF-8.
104 |   std::optional<std::string> protocol{};
105 |   // If present, must be valid UTF-8.
106 |   std::optional<std::string> username{};
107 |   // If present, must be valid UTF-8.
108 |   std::optional<std::string> password{};
109 |   // If present, must be valid UTF-8.
110 |   std::optional<std::string> hostname{};
111 |   // If present, must be valid UTF-8.
112 |   std::optional<std::string> port{};
113 |   // If present, must be valid UTF-8.
114 |   std::optional<std::string> pathname{};
115 |   // If present, must be valid UTF-8.
116 |   std::optional<std::string> search{};
117 |   // If present, must be valid UTF-8.
118 |   std::optional<std::string> hash{};
119 |   // If present, must be valid UTF-8.
120 |   std::optional<std::string> base_url{};
121 | };
122 | }  // namespace ada
123 | #endif  // ADA_INCLUDE_URL_PATTERN
124 | #endif  // ADA_URL_PATTERN_INIT_H
125 | 


--------------------------------------------------------------------------------
/include/ada/url_pattern_regex.h:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * @file url_pattern_regex.h
 3 |  * @brief Declaration for the URL Pattern regex provider
 4 |  */
 5 | #ifndef ADA_URL_PATTERN_REGEX_H
 6 | #define ADA_URL_PATTERN_REGEX_H
 7 | 
 8 | #include <string>
 9 | #include <string_view>
10 | 
11 | #ifdef ADA_USE_UNSAFE_STD_REGEX_PROVIDER
12 | #include <regex>
13 | #endif  // ADA_USE_UNSAFE_STD_REGEX_PROVIDER
14 | 
15 | #if ADA_INCLUDE_URL_PATTERN
16 | namespace ada::url_pattern_regex {
17 | 
18 | template <typename T>
19 | concept regex_concept = requires(T t, std::string_view pattern,
20 |                                  bool ignore_case, std::string_view input) {
21 |   // Ensure the class has a type alias 'regex_type'
22 |   typename T::regex_type;
23 | 
24 |   // Function to create a regex instance
25 |   {
26 |     T::create_instance(pattern, ignore_case)
27 |   } -> std::same_as<std::optional<typename T::regex_type>>;
28 | 
29 |   // Function to perform regex search
30 |   {
31 |     T::regex_search(input, std::declval<typename T::regex_type&>())
32 |   } -> std::same_as<std::optional<std::vector<std::optional<std::string>>>>;
33 | 
34 |   // Function to match regex pattern
35 |   {
36 |     T::regex_match(input, std::declval<typename T::regex_type&>())
37 |   } -> std::same_as<bool>;
38 | 
39 |   // Copy constructor
40 |   { T(std::declval<const T&>()) } -> std::same_as<T>;
41 | 
42 |   // Move constructor
43 |   { T(std::declval<T&&>()) } -> std::same_as<T>;
44 | };
45 | 
46 | #ifdef ADA_USE_UNSAFE_STD_REGEX_PROVIDER
47 | class std_regex_provider final {
48 |  public:
49 |   std_regex_provider() = default;
50 |   using regex_type = std::regex;
51 |   static std::optional<regex_type> create_instance(std::string_view pattern,
52 |                                                    bool ignore_case);
53 |   static std::optional<std::vector<std::optional<std::string>>> regex_search(
54 |       std::string_view input, const regex_type& pattern);
55 |   static bool regex_match(std::string_view input, const regex_type& pattern);
56 | };
57 | #endif  // ADA_USE_UNSAFE_STD_REGEX_PROVIDER
58 | 
59 | }  // namespace ada::url_pattern_regex
60 | #endif  // ADA_INCLUDE_URL_PATTERN
61 | #endif  // ADA_URL_PATTERN_REGEX_H
62 | 


--------------------------------------------------------------------------------
/pyproject.toml:
--------------------------------------------------------------------------------
 1 | [project]
 2 | name = "ada-url"
 3 | requires-python = ">=3.12"
 4 | 
 5 | [tool.ruff]
 6 | line-length = 120
 7 | target-version = "py312"
 8 | 
 9 | [tool.ruff.format]
10 | quote-style = "single"
11 | indent-style = "space"
12 | docstring-code-format = true
13 | 
14 | [tool.ruff.lint]
15 | select = [
16 |   "C90",    # McCabe cyclomatic complexity
17 |   "E",      # pycodestyle
18 |   "F",      # Pyflakes
19 |   "ICN",    # flake8-import-conventions
20 |   "INT",    # flake8-gettext
21 |   "PLC",    # Pylint conventions
22 |   "PLE",    # Pylint errors
23 |   "PLR09",  # Pylint refactoring: max-args, max-branches, max returns, max-statements
24 |   "PYI",    # flake8-pyi
25 |   "RSE",    # flake8-raise
26 |   "RUF",    # Ruff-specific rules
27 |   "T10",    # flake8-debugger
28 |   "TCH",    # flake8-type-checking
29 |   "TID",    # flake8-tidy-imports
30 |   "W",      # pycodestyle
31 |   "YTT",    # flake8-2020
32 |   "ANN"     # flake8-annotations
33 | ]
34 | ignore = [
35 |   "E722",   # Do not use bare `except`
36 |   "ANN101", # Missing type annotation for self in method
37 |   "TID252", # Prefer absolute imports over relative imports from parent modules
38 | ]
39 | 


--------------------------------------------------------------------------------
/singleheader/CMakeLists.txt:
--------------------------------------------------------------------------------
 1 | #
 2 | # Amalgamation
 3 | #
 4 | set(SINGLEHEADER_FILES
 5 |   ${CMAKE_CURRENT_BINARY_DIR}/ada.cpp
 6 |   ${CMAKE_CURRENT_BINARY_DIR}/ada.h
 7 |   ${CMAKE_CURRENT_BINARY_DIR}/ada_c.h
 8 |   ${CMAKE_CURRENT_BINARY_DIR}/demo.cpp
 9 |   ${CMAKE_CURRENT_BINARY_DIR}/demo.c
10 |   ${CMAKE_CURRENT_BINARY_DIR}/README.md
11 | )
12 | set_source_files_properties(${SINGLEHEADER_FILES} PROPERTIES GENERATED TRUE)
13 | 
14 | # In theory, this is unneeded, because the tests module does the same test:
15 | find_package (Python3 COMPONENTS Interpreter)
16 | 
17 | if (Python3_Interpreter_FOUND)
18 |   MESSAGE( STATUS "Python found, we are going to amalgamate.py." )
19 | 
20 |   add_custom_command(
21 |     OUTPUT ${SINGLEHEADER_FILES}
22 |     COMMAND ${CMAKE_COMMAND} -E env
23 |       AMALGAMATE_SOURCE_PATH=${PROJECT_SOURCE_DIR}/src
24 |       AMALGAMATE_INPUT_PATH=${PROJECT_SOURCE_DIR}/include
25 |       AMALGAMATE_OUTPUT_PATH=${CMAKE_CURRENT_BINARY_DIR}
26 |       ${Python3_EXECUTABLE} ${CMAKE_CURRENT_SOURCE_DIR}/amalgamate.py
27 |       #
28 |       # This is the best way I could find to make amalgamation trigger whenever source files or
29 |       # header files change: since the "ada" library has to get rebuilt when that happens, we
30 |       # take a dependency on the generated library file (even though we're not using it). Depending
31 |       # on ada-source doesn't do the trick because DEPENDS here can only depend on an
32 |       # *artifact*--it won't scan source and include files the way a concrete library or executable
33 |       # will.
34 |       #
35 |       # It sucks that we have to build the actual library to make it happen, but it's better than
36 |       # nothing!
37 |       #
38 |       DEPENDS amalgamate.py ada
39 |   )
40 |   add_custom_target(ada-singleheader-files DEPENDS ${SINGLEHEADER_FILES})
41 | 
42 |   #
43 |   # Include this if you intend to #include "ada.cpp" in your own .cpp files.
44 |   #
45 |   add_library(ada-singleheader-include-source INTERFACE)
46 |   target_include_directories(ada-singleheader-include-source INTERFACE $<BUILD_INTERFACE:${CMAKE_CURRENT_BINARY_DIR}>)
47 |   add_dependencies(ada-singleheader-include-source ada-singleheader-files)
48 | 
49 |   add_library(ada-singleheader-source INTERFACE)
50 |   target_sources(ada-singleheader-source INTERFACE $<BUILD_INTERFACE:${CMAKE_CURRENT_BINARY_DIR}/ada.cpp>)
51 |   target_link_libraries(ada-singleheader-source INTERFACE ada-singleheader-include-source)
52 |   if (ADA_TESTING OR ADA_BUILD_SINGLE_HEADER_LIB)
53 |     add_library(ada-singleheader-lib STATIC $<BUILD_INTERFACE:${CMAKE_CURRENT_BINARY_DIR}/ada.cpp>)
54 |   endif(ADA_TESTING OR ADA_BUILD_SINGLE_HEADER_LIB)
55 | 
56 |   if (ADA_TESTING)
57 |     add_executable(demo $<BUILD_INTERFACE:${CMAKE_CURRENT_BINARY_DIR}/demo.cpp>)
58 |     target_link_libraries(demo ada-singleheader-include-source)
59 | 
60 |     add_executable(demo_no_url_pattern $<BUILD_INTERFACE:${CMAKE_CURRENT_BINARY_DIR}/demo.cpp>)
61 |     target_link_libraries(demo_no_url_pattern ada-singleheader-include-source)
62 |     target_compile_definitions(demo_no_url_pattern PRIVATE ADA_INCLUDE_URL_PATTERN=0)
63 | 
64 |     add_test(demo_no_url_pattern demo_no_url_pattern)
65 | 
66 |     add_executable(cdemo $<BUILD_INTERFACE:${CMAKE_CURRENT_BINARY_DIR}/demo.c>)
67 |     target_link_libraries(cdemo ada-singleheader-lib)
68 |     add_test(cdemo cdemo)
69 |   endif()
70 | else()
71 |   MESSAGE( STATUS "Python not found, we are unable to test amalgamate.py." )
72 | endif()
73 | 


--------------------------------------------------------------------------------
/singleheader/README.md:
--------------------------------------------------------------------------------
 1 | ## Amalgamation demo
 2 | 
 3 | While in the ada main directory, using Python 3, type:
 4 | 
 5 | ```
 6 | python singleheader/amalgamate.py
 7 | ```
 8 | 
 9 | This will create two new files (ada.h and ada.cpp), by default in the `singleheader` directory.
10 | 
11 | You can then compile the demo file from that directory as follows:
12 | 
13 | ```
14 | c++ -std=c++20 -c demo.cpp
15 | ```
16 | 
17 | It will produce a binary file (e.g., demo.o) which contains ada.cpp.
18 | 
19 | ```
20 | c++ -std=c++20 -o demo demo.cpp
21 | ./demo
22 | ```
23 | 
24 | You may build and link using CMake (--target demo), because CMake can configure all the necessary flags.
25 | 
26 | 
27 | ### C Demo
28 | 
29 | You may also build a C executable.
30 | 
31 | ```
32 | c++ -c ada.cpp -std=c++20
33 | cc -c demo.c
34 | c++ demo.o ada.o -o cdemo
35 | ./cdemo
36 | ```
37 | 


--------------------------------------------------------------------------------
/singleheader/amalgamate.py:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env python3
  2 | #
  3 | # Creates the amalgamated source files.
  4 | #
  5 | 
  6 | import zipfile
  7 | import sys
  8 | import os.path
  9 | import subprocess
 10 | import os
 11 | import re
 12 | import shutil
 13 | import datetime
 14 | from typing import TextIO
 15 | 
 16 | if sys.version_info[0] < 3:
 17 |     sys.stdout.write('Sorry, requires Python 3.x or better\n')
 18 |     sys.exit(1)
 19 | 
 20 | SCRIPT_PATH = os.path.dirname(os.path.abspath(sys.argv[0]))
 21 | PROJECT_PATH = os.path.dirname(SCRIPT_PATH)
 22 | print(f'SCRIPT_PATH={SCRIPT_PATH} PROJECT_PATH={PROJECT_PATH}')
 23 | 
 24 | AMALGAMATE_SOURCE_PATH = os.environ.get('AMALGAMATE_SOURCE_PATH') or os.path.join(PROJECT_PATH, 'src')
 25 | AMALGAMATE_INCLUDE_PATH = os.environ.get('AMALGAMATE_INCLUDE_PATH') or os.path.join(PROJECT_PATH, 'include')
 26 | AMALGAMATE_OUTPUT_PATH = os.environ.get('AMALGAMATE_OUTPUT_PATH') or os.path.join(SCRIPT_PATH)
 27 | 
 28 | # this list excludes the "src/generic headers"
 29 | ALL_C_FILES = ['ada.cpp']
 30 | 
 31 | # order matters
 32 | ALL_C_HEADERS = ['ada.h']
 33 | 
 34 | found_includes = []
 35 | 
 36 | def doinclude(fid: TextIO, file: str, line: str, origin: str) -> None:
 37 |     p = os.path.join(AMALGAMATE_INCLUDE_PATH, file)
 38 |     pi = os.path.join(AMALGAMATE_SOURCE_PATH, file)
 39 | 
 40 |     if os.path.exists(p):
 41 |         if file not in found_includes:
 42 |             found_includes.append(file)
 43 |             dofile(fid, AMALGAMATE_INCLUDE_PATH, file)
 44 |     elif os.path.exists(pi):
 45 |         if file not in found_includes:
 46 |             found_includes.append(file)
 47 |             dofile(fid, AMALGAMATE_SOURCE_PATH, file)
 48 |     else:
 49 |         # If we don't recognize it, just emit the #include
 50 |         print('unrecognized:', file, ' from ', line, ' in ', origin)
 51 |         print(line, file=fid)
 52 | 
 53 | 
 54 | def dofile(fid: TextIO, prepath: str, filename: str) -> None:
 55 |     file = os.path.join(prepath, filename)
 56 |     RELFILE = os.path.relpath(file, PROJECT_PATH)
 57 |     # Last lines are always ignored. Files should end by an empty lines.
 58 |     print(f'/* begin file {RELFILE} */', file=fid)
 59 |     includepattern = re.compile('\\s*#\\s*include "(.*)"')
 60 |     with open(file, 'r') as fid2:
 61 |         for line in fid2:
 62 |             line = line.rstrip('\n')
 63 |             s = includepattern.search(line)
 64 |             if s:
 65 |                 includedfile = s.group(1)
 66 |                 if includedfile == 'ada.h' and filename == 'ada.cpp':
 67 |                     print(line, file=fid)
 68 |                     continue
 69 | 
 70 |                 if includedfile.startswith('../'):
 71 |                     includedfile = includedfile[2:]
 72 |                 # we explicitly include ada headers, one time each
 73 |                 doinclude(fid, includedfile, line, filename)
 74 |             else:
 75 |                 print(line, file=fid)
 76 |     print(f'/* end file {RELFILE} */', file=fid)
 77 | 
 78 | 
 79 | # Get the generation date from git, so the output is reproducible.
 80 | # The %ci specifier gives the unambiguous ISO 8601 format, and
 81 | # does not change with locale and timezone at time of generation.
 82 | # Forcing it to be UTC is difficult, because it needs to be portable
 83 | # between gnu date and busybox date.
 84 | try:
 85 |     timestamp = (
 86 |         subprocess.run(['git', 'show', '-s', '--format=%ci', 'HEAD'], stdout=subprocess.PIPE)
 87 |         .stdout.decode('utf-8')
 88 |         .strip()
 89 |     )
 90 | except Exception:
 91 |     print('git not found, timestamp based on current time')
 92 |     timestamp = str(datetime.datetime.now())
 93 | print(f'timestamp is {timestamp}')
 94 | 
 95 | os.makedirs(AMALGAMATE_OUTPUT_PATH, exist_ok=True)
 96 | AMAL_H = os.path.join(AMALGAMATE_OUTPUT_PATH, 'ada.h')
 97 | AMAL_C = os.path.join(AMALGAMATE_OUTPUT_PATH, 'ada.cpp')
 98 | DEMOCPP = os.path.join(AMALGAMATE_OUTPUT_PATH, 'cpp')
 99 | README = os.path.join(AMALGAMATE_OUTPUT_PATH, 'README.md')
100 | 
101 | print(f'Creating {AMAL_H}')
102 | amal_h = open(AMAL_H, mode='w', encoding='utf8')
103 | print(f'/* auto-generated on {timestamp}. Do not edit! */', file=amal_h)
104 | for h in ALL_C_HEADERS:
105 |     doinclude(amal_h, h, f'ERROR {h} not found', h)
106 | 
107 | amal_h.close()
108 | print(f'Creating {AMAL_C}')
109 | amal_c = open(AMAL_C, mode='w', encoding='utf8')
110 | print(f'/* auto-generated on {timestamp}. Do not edit! */', file=amal_c)
111 | for c in ALL_C_FILES:
112 |     doinclude(amal_c, c, f'ERROR {c} not found', c)
113 | 
114 | amal_c.close()
115 | 
116 | # copy the README and DEMOCPP
117 | if SCRIPT_PATH != AMALGAMATE_OUTPUT_PATH:
118 |     shutil.copy2(os.path.join(SCRIPT_PATH, 'demo.cpp'), AMALGAMATE_OUTPUT_PATH)
119 |     shutil.copy2(os.path.join(SCRIPT_PATH, 'demo.c'), AMALGAMATE_OUTPUT_PATH)
120 |     shutil.copy2(os.path.join(SCRIPT_PATH, 'README.md'), AMALGAMATE_OUTPUT_PATH)
121 | 
122 | shutil.copy2(os.path.join(AMALGAMATE_INCLUDE_PATH, 'ada_c.h'), AMALGAMATE_OUTPUT_PATH)
123 | 
124 | zf = zipfile.ZipFile(os.path.join(AMALGAMATE_OUTPUT_PATH, 'singleheader.zip'), 'w', zipfile.ZIP_DEFLATED)
125 | zf.write(os.path.join(AMALGAMATE_OUTPUT_PATH, 'ada.cpp'), 'ada.cpp')
126 | zf.write(os.path.join(AMALGAMATE_OUTPUT_PATH, 'ada.h'), 'ada.h')
127 | zf.write(os.path.join(AMALGAMATE_INCLUDE_PATH, 'ada_c.h'), 'ada_c.h')
128 | 
129 | 
130 | print('Done with all files generation.')
131 | 
132 | print(f'Files have been written to directory: {AMALGAMATE_OUTPUT_PATH}/')
133 | print('Done with all files generation.')
134 | 


--------------------------------------------------------------------------------
/singleheader/demo.c:
--------------------------------------------------------------------------------
 1 | #include "ada_c.h"
 2 | #include <stdio.h>
 3 | #include <stdlib.h>
 4 | #include <stdbool.h>
 5 | #include <string.h>
 6 | 
 7 | static void ada_print(ada_string string) {
 8 |   printf("%.*s\n", (int)string.length, string.data);
 9 | }
10 | 
11 | int main(void) {
12 |   const char* input =
13 |       "https://username:password@www.google.com:8080/"
14 |       "pathname?query=true#hash-exists";
15 |   ada_url url = ada_parse(input, strlen(input));
16 |   if (!ada_is_valid(url)) {
17 |     puts("failure");
18 |     ada_free(url);  // release the handle on the failure path as well
19 |     return EXIT_FAILURE;
20 |   }
21 |   // prints https://username:password@www.google.com:8080/pathname?query=true#hash-exists
22 |   ada_print(ada_get_href(url));
23 |   ada_print(ada_get_protocol(url));  // prints https:
24 |   ada_print(ada_get_username(url));  // prints username
25 |   ada_set_href(url, "https://www.yagiz.co", strlen("https://www.yagiz.co"));
26 |   if (!ada_is_valid(url)) {
27 |     puts("failure");
28 |     ada_free(url);
29 |     return EXIT_FAILURE;
30 |   }
31 |   ada_set_hash(url, "new-hash", strlen("new-hash"));
32 |   ada_set_hostname(url, "new-host", strlen("new-host"));
33 |   ada_set_host(url, "changed-host:9090", strlen("changed-host:9090"));
34 |   ada_set_pathname(url, "new-pathname", strlen("new-pathname"));
35 |   ada_set_search(url, "new-search", strlen("new-search"));
36 |   ada_set_protocol(url, "wss", 3);
37 |   // will print wss://changed-host:9090/new-pathname?new-search#new-hash
38 |   ada_print(ada_get_href(url));
39 |   ada_free(url);
40 |   return EXIT_SUCCESS;
41 | }
42 | 


--------------------------------------------------------------------------------
/singleheader/demo.cpp:
--------------------------------------------------------------------------------
 1 | #include "ada.cpp"
 2 | #include "ada.h"
 3 | #include <iostream>
 4 | 
 5 | int main(int, char *[]) {
 6 |   auto parsed = ada::parse<ada::url>("https://www.google.com");
 7 |   if (parsed) {  // a valid URL: switch its protocol and print two parts
 8 |     parsed->set_protocol("http");
 9 |     std::cout << parsed->get_protocol() << std::endl;
10 |     std::cout << parsed->get_host() << std::endl;
11 |     return EXIT_SUCCESS;
12 |   }
13 |   std::cout << "failure" << std::endl;
14 |   return EXIT_FAILURE;
15 | }
16 | 


--------------------------------------------------------------------------------
/src/CMakeLists.txt:
--------------------------------------------------------------------------------
 1 | 
 2 | message(STATUS "Compiler ID : " ${CMAKE_CXX_COMPILER_ID})
 3 | message(STATUS "CMAKE_BUILD_TYPE : " ${CMAKE_BUILD_TYPE})
 4 | 
 5 | add_library(ada-include-source INTERFACE)
 6 | target_include_directories(ada-include-source INTERFACE $<BUILD_INTERFACE:${CMAKE_CURRENT_SOURCE_DIR}>)
 7 | add_library(ada-source INTERFACE)  # consumers compile ada.cpp as one of their own sources
 8 | target_sources(ada-source INTERFACE $<BUILD_INTERFACE:${CMAKE_CURRENT_SOURCE_DIR}/ada.cpp>)
 9 | target_link_libraries(ada-source INTERFACE ada-include-source)
10 | add_library(ada ada.cpp)
11 | target_compile_features(ada PUBLIC cxx_std_20)
12 | target_include_directories(ada PRIVATE $<BUILD_INTERFACE:${CMAKE_CURRENT_SOURCE_DIR}> )
13 | target_include_directories(ada PUBLIC "$<BUILD_INTERFACE:${PROJECT_SOURCE_DIR}/include>")
14 | 
15 | if(MSVC)
16 |   if("${MSVC_TOOLSET_VERSION}" STREQUAL "140")
17 |     target_compile_options(ada INTERFACE /W0 /sdl)
18 |     set(ADA_LEGACY_VISUAL_STUDIO TRUE)
19 |   else()
20 |     target_compile_options(ada PRIVATE /WX /W3 /sdl /w34714) # https://docs.microsoft.com/en-us/cpp/error-messages/compiler-warnings/compiler-warning-level-4-c4714?view=vs-2019
21 |   endif()
22 | else(MSVC)
23 |   if(NOT WIN32)
24 |     target_compile_options(ada INTERFACE -fPIC)
25 |   endif()
26 |   message(STATUS "Assuming GCC-like compiler.")
27 |   target_compile_options(ada PRIVATE -Wall -Wextra -Weffc++)
28 |   if(CMAKE_CXX_COMPILER_ID STREQUAL "GNU")
29 |     target_compile_options(ada PRIVATE -Wsuggest-override)
30 |   endif()
31 |   if((CMAKE_CXX_COMPILER_ID STREQUAL "Clang") OR (CMAKE_CXX_COMPILER_ID STREQUAL "AppleClang"))
32 |     target_compile_options(ada PRIVATE -Winconsistent-missing-override)
33 |   endif()
34 |   target_compile_options(ada PRIVATE -Wfatal-errors -Wsign-compare -Wshadow -Wwrite-strings -Wpointer-arith -Winit-self -Wconversion -Wno-sign-conversion)
35 | endif(MSVC)
36 | 
37 | # workaround for GNU GCC poor AVX load/store code generation
38 | if ((CMAKE_CXX_COMPILER_ID STREQUAL "GNU") AND (CMAKE_SYSTEM_PROCESSOR MATCHES "^(i.86|x86(_64)?)$"))
39 |   target_compile_options(ada PRIVATE -mno-avx256-split-unaligned-load -mno-avx256-split-unaligned-store)
40 | endif()
41 | if(ADA_DEVELOPMENT_CHECKS)
42 |   target_compile_definitions(ada PUBLIC ADA_DEVELOPMENT_CHECKS=1)
43 | endif()
44 | 
45 | if(ADA_SANITIZE)
46 |   target_compile_options(ada PUBLIC -fsanitize=address  -fno-omit-frame-pointer -fno-sanitize-recover=all)
47 |   target_compile_definitions(ada PUBLIC ASAN_OPTIONS=detect_leaks=1)
48 |   target_link_libraries(ada PUBLIC -fsanitize=address  -fno-omit-frame-pointer -fno-sanitize-recover=all)
49 | endif()
50 | if(ADA_SANITIZE_WITHOUT_LEAKS)
51 |   target_compile_options(ada PUBLIC -fsanitize=address  -fno-omit-frame-pointer -fno-sanitize-recover=all)
52 |   target_link_libraries(ada PUBLIC -fsanitize=address  -fno-omit-frame-pointer -fno-sanitize-recover=all)
53 | endif()
54 | 
55 | if(ADA_LOGGING)
56 |   target_compile_definitions(ada PRIVATE ADA_LOGGING=1)
57 | endif()
58 | 
59 | if(ADA_TESTING)
60 |   target_compile_definitions(ada PRIVATE ADA_TESTING=1)
61 | endif()
62 | 
63 | if(ADA_INCLUDE_URL_PATTERN)
64 |   target_compile_definitions(ada PRIVATE ADA_INCLUDE_URL_PATTERN=1)
65 | else()
66 |   target_compile_definitions(ada PRIVATE ADA_INCLUDE_URL_PATTERN=0)
67 | endif()
68 | 


--------------------------------------------------------------------------------
/src/ada.cpp:
--------------------------------------------------------------------------------
 1 | #include "ada.h"
 2 | #include "checkers.cpp"
 3 | #include "unicode.cpp"
 4 | #include "serializers.cpp"
 5 | #include "implementation.cpp"
 6 | #include "helpers.cpp"
 7 | #include "url.cpp"
 8 | #include "parser.cpp"
 9 | #include "url_components.cpp"
10 | #include "url_aggregator.cpp"
11 | 
12 | #if ADA_INCLUDE_URL_PATTERN
13 | #include "url_pattern.cpp"
14 | #include "url_pattern_helpers.cpp"
15 | #include "url_pattern_regex.cpp"
16 | #endif  // ADA_INCLUDE_URL_PATTERN
17 | 
18 | #include "ada_c.cpp"
19 | 


--------------------------------------------------------------------------------
/src/checkers.cpp:
--------------------------------------------------------------------------------
  1 | #include "ada/checkers-inl.h"
  2 | #include "ada/checkers.h"
  3 | #include "ada/unicode-inl.h"
  4 | #include "ada/common_defs.h"
  5 | 
  6 | #include <algorithm>
  7 | #include <array>
  8 | #include <string_view>
  9 | 
 10 | namespace ada::checkers {
 11 | 
 12 | ada_really_inline constexpr bool is_ipv4(std::string_view view) noexcept {
 13 |   // Assumes the string is not empty and has no upper case ASCII characters.
 14 |   //
 15 |   // Optimization. To be considered as a possible ipv4, the string must end
 16 |   // with a digit, a lowercase hex letter (a-f) or 'x'.
 17 |   // Most of the time, this will be false so this simple check will save a lot
 18 |   // of effort.
 19 |   // If the address ends with a dot, we need to prune it (special case).
 20 |   if (view.ends_with('.')) {
 21 |     view.remove_suffix(1);
 22 |     if (view.empty()) {
 23 |       return false;
 24 |     }
 25 |   }
 26 |   char last_char = view.back();
 27 |   bool possible_ipv4 = (last_char >= '0' && last_char <= '9') ||
 28 |                        (last_char >= 'a' && last_char <= 'f') ||
 29 |                        last_char == 'x';
 30 |   if (!possible_ipv4) {
 31 |     return false;
 32 |   }
 33 |   // Keep only what follows the last dot; without a dot the whole view is kept.
 34 |   size_t last_dot = view.rfind('.');
 35 |   if (last_dot != std::string_view::npos) {
 36 |     // We have at least one dot.
 37 |     view = view.substr(last_dot + 1);
 38 |   }
 39 |   /** Optimization opportunity: we have basically identified the last number of
 40 |      the ipv4 if we return true here. We might as well parse it and have at
 41 |      least one number parsed when we get to parse_ipv4. */
 42 |   if (std::ranges::all_of(view, ada::checkers::is_digit)) {
 43 |     return true;
 44 |   }
 45 |   // It could be hex (0x), but not if there is a single character.
 46 |   if (view.size() == 1) {
 47 |     return false;
 48 |   }
 49 |   // It must start with 0x.
 50 |   if (!view.starts_with("0x")) {
 51 |     return false;
 52 |   }
 53 |   // We must allow "0x".
 54 |   if (view.size() == 2) {
 55 |     return true;
 56 |   }
 57 |   // We have 0x followed by some characters, we need to check that they are
 58 |   // hexadecimals.
 59 |   view.remove_prefix(2);
 60 |   return std::ranges::all_of(view, ada::unicode::is_lowercase_hex);
 61 | }
 62 | 
 63 | // Lookup table for path_signature: 1 marks bytes that need percent
 64 | // encoding, 2 marks '\' (0x5c), 4 marks '.' (0x2e) and 8 marks '%' (0x25).
 65 | static constexpr std::array<uint8_t, 256> path_signature_table =
 66 |     []() consteval {
 67 |       std::array<uint8_t, 256> result{};
 68 |       for (size_t i = 0; i < 256; i++) {
 69 |         if (i <= 0x20 || i == 0x22 || i == 0x23 || i == 0x3c || i == 0x3e ||
 70 |             i == 0x3f || i == 0x60 || i == 0x7b || i == 0x7d || i > 0x7e) {
 71 |           result[i] = 1;
 72 |         } else if (i == 0x25) {
 73 |           result[i] = 8;
 74 |         } else if (i == 0x2e) {
 75 |           result[i] = 4;
 76 |         } else if (i == 0x5c) {
 77 |           result[i] = 2;
 78 |         } else {
 79 |           result[i] = 0;
 80 |         }
 81 |       }
 82 |       return result;
 83 |     }();
 84 | 
 85 | ada_really_inline constexpr uint8_t path_signature(
 86 |     std::string_view input) noexcept {
 87 |   // Returns the bitwise OR of path_signature_table over every byte of input.
 88 |   // The value 1 in that table covers the path percent-encode set: the C0
 89 |   // controls, bytes greater than 0x7E (~), U+0020 SPACE, U+0022 ("),
 90 |   // U+0023 (#), U+003C (<), U+003E (>), U+003F (?), U+0060 (`), U+007B ({)
 91 |   // and U+007D (}).
 92 |   size_t i = 0;
 93 |   uint8_t accumulator{};
 94 |   for (; i + 7 < input.size(); i += 8) {  // eight bytes per iteration
 95 |     accumulator |= uint8_t(path_signature_table[uint8_t(input[i])] |
 96 |                            path_signature_table[uint8_t(input[i + 1])] |
 97 |                            path_signature_table[uint8_t(input[i + 2])] |
 98 |                            path_signature_table[uint8_t(input[i + 3])] |
 99 |                            path_signature_table[uint8_t(input[i + 4])] |
100 |                            path_signature_table[uint8_t(input[i + 5])] |
101 |                            path_signature_table[uint8_t(input[i + 6])] |
102 |                            path_signature_table[uint8_t(input[i + 7])]);
103 |   }
104 |   for (; i < input.size(); i++) {  // the remaining (fewer than eight) bytes
105 |     accumulator |= uint8_t(path_signature_table[uint8_t(input[i])]);
106 |   }
107 |   return accumulator;
108 | }
109 | 
110 | ada_really_inline constexpr bool verify_dns_length(
111 |     std::string_view input) noexcept {
112 |   // An empty name is rejected up front: calling back() on it is undefined.
113 |   if (input.empty()) return false;
114 |   // At most 253 characters, plus one more when the name ends with a dot.
115 |   const size_t max_size = (input.back() == '.') ? 254 : 253;
116 |   if (input.size() > max_size) return false;
117 | 
118 |   size_t start = 0;
119 |   while (start < input.size()) {
120 |     auto dot_location = input.find('.', start);
121 |     // If not found, the label runs to the end of the input.
122 |     if (dot_location == std::string_view::npos) dot_location = input.size();
123 |     // Every label must have between 1 and 63 characters.
124 |     auto label_size = dot_location - start;
125 |     if (label_size > 63 || label_size == 0) return false;
126 | 
127 |     start = dot_location + 1;
128 |   }
129 |   return true;
130 | }
131 | }  // namespace ada::checkers
132 | 


--------------------------------------------------------------------------------
/src/implementation.cpp:
--------------------------------------------------------------------------------
 1 | #include "ada/implementation-inl.h"
 2 | 
 3 | #include <string_view>
 4 | 
 5 | #include "ada/common_defs.h"
 6 | #include "ada/parser.h"
 7 | #include "ada/url.h"
 8 | #include "ada/url_aggregator.h"
 9 | 
10 | namespace ada {
11 | 
12 | template <class result_type>
13 | ada_warn_unused tl::expected<result_type, errors> parse(
14 |     std::string_view input, const result_type* base_url) {
15 |   // An invalid parse is surfaced to the caller as errors::type_error.
16 |   result_type parsed =
17 |       ada::parser::parse_url_impl<result_type, true>(input, base_url);
18 |   if (parsed.is_valid) return parsed;
19 | 
20 |   return tl::unexpected(errors::type_error);
21 | }
22 | 
23 | template ada::result<url> parse<url>(std::string_view input,
24 |                                      const url* base_url = nullptr);
25 | template ada::result<url_aggregator> parse<url_aggregator>(
26 |     std::string_view input, const url_aggregator* base_url = nullptr);
27 | 
28 | std::string href_from_file(std::string_view input) {
29 |   // Builds the href directly, which is much faster than constructing a URL.
30 |   std::string stripped;
31 |   std::string_view cleaned = input;
32 |   if (unicode::has_tabs_or_newline(input)) {
33 |     // Work on a copy that went through remove_ascii_tab_or_newline.
34 |     stripped = input;
35 |     helpers::remove_ascii_tab_or_newline(stripped);
36 |     cleaned = stripped;
37 |   }
38 |   std::string path;
39 |   if (cleaned.empty()) {
40 |     path = "/";
41 |   } else {
42 |     // One leading '/' or '\' is skipped before the path is parsed.
43 |     const bool has_leading_separator =
44 |         (cleaned[0] == '/') || (cleaned[0] == '\\');
45 |     helpers::parse_prepared_path(cleaned.substr(has_leading_separator ? 1 : 0),
46 |                                  ada::scheme::type::FILE, path);
47 |   }
48 |   return "file://" + path;
49 | }
50 | 
51 | bool can_parse(std::string_view input, const std::string_view* base_input) {
52 |   // Without a base, the input is parsed on its own.
53 |   if (base_input == nullptr) {
54 |     const ada::url_aggregator standalone =
55 |         ada::parser::parse_url_impl<ada::url_aggregator, false>(input,
56 |                                                                 nullptr);
57 |     return standalone.is_valid;
58 |   }
59 |   // An invalid base means the answer is false, whatever the input contains.
60 |   ada::url_aggregator base =
61 |       ada::parser::parse_url_impl<ada::url_aggregator, false>(*base_input,
62 |                                                               nullptr);
63 |   if (!base.is_valid) return false;
64 | 
65 |   const ada::url_aggregator resolved =
66 |       ada::parser::parse_url_impl<ada::url_aggregator, false>(input, &base);
67 |   return resolved.is_valid;
68 | }
69 | 
70 | ada_warn_unused std::string to_string(ada::encoding_type type) {  // name of the encoding
71 |   switch (type) {
72 |     case ada::encoding_type::UTF8:
73 |       return "UTF-8";
74 |     case ada::encoding_type::UTF_16LE:
75 |       return "UTF-16LE";
76 |     case ada::encoding_type::UTF_16BE:
77 |       return "UTF-16BE";
78 |     default:  // NOTE(review): presumably no other value can occur; confirm
79 |       unreachable();
80 |   }
81 | }
82 | 
83 | }  // namespace ada
84 | 


--------------------------------------------------------------------------------
/src/serializers.cpp:
--------------------------------------------------------------------------------
 1 | #include <array>
 2 | #include <charconv>
 3 | #include <string>
 4 | 
 5 | namespace ada::serializers {
 6 | 
 7 | void find_longest_sequence_of_ipv6_pieces(
 8 |     const std::array<uint16_t, 8>& address, size_t& compress,
 9 |     size_t& compress_length) noexcept {
10 |   for (size_t i = 0; i < 8; i++) {
11 |     if (address[i] == 0) {  // start of a run of zero pieces
12 |       size_t next = i + 1;
13 |       while (next != 8 && address[next] == 0) ++next;  // first index past the run
14 |       const size_t count = next - i;
15 |       if (compress_length < count) {  // strictly longer: the earliest longest run wins
16 |         compress_length = count;
17 |         compress = i;
18 |         if (next == 8) break;
19 |         i = next;  // address[next] is non-zero here, so the loop may step over it
20 |       }
21 |     }
22 |   }
23 | }
24 | 
25 | std::string ipv6(const std::array<uint16_t, 8>& address) noexcept {
26 |   size_t compress_length = 0;  // The length of a long sequence of zeros.
27 |   size_t compress = 0;         // The start of a long sequence of zeros.
28 |   find_longest_sequence_of_ipv6_pieces(address, compress, compress_length);
29 | 
30 |   if (compress_length <= 1) {
31 |     // Nothing to compress: 8 is never a piece index tested below, so the "::"
32 |     // branch is skipped. Optimization opportunity: a faster path could return here.
33 |     compress = compress_length = 8;
34 |   }
35 | 
36 |   std::string output(4 * 8 + 7 + 2, '\0');  // 8 pieces of up to 4 hex digits, 7 ':' and 2 brackets
37 |   size_t piece_index = 0;
38 |   char* point = output.data();
39 |   char* point_end = output.data() + output.size();
40 |   *point++ = '[';
41 |   while (true) {
42 |     if (piece_index == compress) {
43 |       *point++ = ':';
44 |       // If we skip a value initially, we need to write '::', otherwise
45 |       // a single ':' will do since it follows a previous ':'.
46 |       if (piece_index == 0) {
47 |         *point++ = ':';
48 |       }
49 |       piece_index += compress_length;
50 |       if (piece_index == 8) {
51 |         break;
52 |       }
53 |     }
54 |     point = std::to_chars(point, point_end, address[piece_index], 16).ptr;
55 |     piece_index++;
56 |     if (piece_index == 8) {
57 |       break;
58 |     }
59 |     *point++ = ':';
60 |   }
61 |   *point++ = ']';
62 |   output.resize(point - output.data());
63 |   return output;
64 | }
65 | 
66 | std::string ipv4(const uint64_t address) noexcept {
67 |   // 15 characters hold the longest dotted quad ("255.255.255.255").
68 |   std::string output(15, '\0');
69 |   char* cursor = output.data();
70 |   char* const limit = cursor + output.size();
71 |   for (int shift = 24; shift >= 0; shift -= 8) {
72 |     if (shift != 24) *cursor++ = '.';
73 |     cursor = std::to_chars(cursor, limit, uint8_t(address >> shift)).ptr;
74 |   }
75 |   output.resize(cursor - output.data());
76 |   return output;
77 | }
78 | 
79 | }  // namespace ada::serializers
80 | 


--------------------------------------------------------------------------------
/src/url_components.cpp:
--------------------------------------------------------------------------------
 1 | #include "ada/helpers.h"
 2 | #include "ada/url_components-inl.h"
 3 | 
 4 | #include <string>
 5 | 
 6 | namespace ada {
 7 | 
 8 | [[nodiscard]] std::string url_components::to_string() const {
 9 |   std::string answer;
10 |   auto back = std::back_insert_iterator(answer);
11 |   answer.append("{\n");
12 |   // Every offset is written as a quoted decimal string, one member per line.
13 |   answer.append("\t\"protocol_end\":\"");
14 |   helpers::encode_json(std::to_string(protocol_end), back);
15 |   answer.append("\",\n");
16 | 
17 |   answer.append("\t\"username_end\":\"");
18 |   helpers::encode_json(std::to_string(username_end), back);
19 |   answer.append("\",\n");
20 | 
21 |   answer.append("\t\"host_start\":\"");
22 |   helpers::encode_json(std::to_string(host_start), back);
23 |   answer.append("\",\n");
24 | 
25 |   answer.append("\t\"host_end\":\"");
26 |   helpers::encode_json(std::to_string(host_end), back);
27 |   answer.append("\",\n");
28 | 
29 |   answer.append("\t\"port\":\"");
30 |   helpers::encode_json(std::to_string(port), back);
31 |   answer.append("\",\n");
32 | 
33 |   answer.append("\t\"pathname_start\":\"");
34 |   helpers::encode_json(std::to_string(pathname_start), back);
35 |   answer.append("\",\n");
36 | 
37 |   answer.append("\t\"search_start\":\"");
38 |   helpers::encode_json(std::to_string(search_start), back);
39 |   answer.append("\",\n");
40 | 
41 |   answer.append("\t\"hash_start\":\"");
42 |   helpers::encode_json(std::to_string(hash_start), back);
43 |   answer.append("\"");
44 |   // No comma after the last member: JSON does not allow a trailing comma.
45 |   answer.append("\n}");
46 |   return answer;
47 | }
48 | 
49 | }  // namespace ada
50 | 


--------------------------------------------------------------------------------
/src/url_pattern_regex.cpp:
--------------------------------------------------------------------------------
 1 | #if ADA_INCLUDE_URL_PATTERN
 2 | 
 3 | #include "ada/url_pattern_regex.h"
 4 | 
 5 | namespace ada::url_pattern_regex {
 6 | 
 7 | #ifdef ADA_USE_UNSAFE_STD_REGEX_PROVIDER
 8 | std::optional<std::regex> std_regex_provider::create_instance(
 9 |     std::string_view pattern, bool ignore_case) {
10 |   // Original note: set flags to "vi" if options's ignore case is true,
11 |   // otherwise to "v". With std::regex that is expressed as the ECMAScript
12 |   // grammar, plus icase when ignore_case is true.
13 |   auto flags = ignore_case
14 |                    ? std::regex::icase | std::regex_constants::ECMAScript
15 |                    : std::regex_constants::ECMAScript;
16 |   try {
17 |     return std::regex(pattern.data(), pattern.size(), flags);
18 |   } catch (const std::regex_error& e) {
19 |     (void)e;  // NOTE(review): presumably avoids an unused warning when ada_log is a no-op
20 |     ada_log("std_regex_provider::create_instance failed:", e.what());
21 |     return std::nullopt;
22 |   }
23 | }
24 | 
25 | std::optional<std::vector<std::optional<std::string>>>
26 | std_regex_provider::regex_search(std::string_view input,
27 |                                  const std::regex& pattern) {
28 |   std::string input_str(input);  // std::smatch works on a std::string
29 |   std::smatch match_result;
30 |   if (!std::regex_search(input_str, match_result, pattern,
31 |                          std::regex_constants::match_any)) {
32 |     return std::nullopt;
33 |   }
34 |   std::vector<std::optional<std::string>> matches;
35 |   // If input is empty, let's assume the result will be empty as well.
36 |   if (input.empty() || match_result.empty()) {
37 |     return matches;
38 |   }
39 |   // Entry 0 is the whole match and is skipped. A group that did not match is
40 |   // stored as std::nullopt so that later groups keep their position.
41 |   matches.reserve(match_result.size());
42 |   for (size_t i = 1; i < match_result.size(); ++i) {
43 |     const auto& entry = match_result[i];
44 |     matches.emplace_back(entry.matched ? std::optional<std::string>(entry.str())
45 |                                        : std::nullopt);
46 |   }
47 |   return matches;
48 | }
49 | 
50 | bool std_regex_provider::regex_match(std::string_view input,
51 |                                      const std::regex& pattern) {
52 |   return std::regex_match(input.data(), input.data() + input.size(), pattern);
53 | }
54 | 
55 | #endif  // ADA_USE_UNSAFE_STD_REGEX_PROVIDER
56 | 
57 | }  // namespace ada::url_pattern_regex
58 | 
59 | #endif  // ADA_INCLUDE_URL_PATTERN
60 | 


--------------------------------------------------------------------------------
/tests/CMakeLists.txt:
--------------------------------------------------------------------------------
  1 | # Source files should be just ASCII.
  2 | # NOTE(review): in the find expression "-a" binds tighter than "-o", so the
  3 | # -type f -exec part appears to apply only to '*.cpp'; confirm the intent.
  4 | find_program(FIND find)
  5 | find_program(FILE file)
  6 | find_program(GREP grep)
  7 | if(FIND AND FILE AND GREP)
  8 |   add_test(
  9 |       NAME just_ascii
 10 |       COMMAND sh -c "\
 11 | ${FIND} include src tests tools benchmarks  -name '*.h' -o -name '*.txt' -o -name '*.cpp' -type f -exec ${FILE} '{}' \; | ${GREP} -qv ASCII || exit 0  && exit 1"
 12 |       WORKING_DIRECTORY "${PROJECT_SOURCE_DIR}"
 13 |   )
 14 | endif()
 15 | 
 16 | add_subdirectory(wpt)
 17 | 
 18 | set(ADA_TEST_INCLUDE_DIR ${CMAKE_CURRENT_SOURCE_DIR}/../)
 19 | if(MSVC)
 20 |   add_compile_options("/Zi" "/EHsc" "/GR")
 21 |   add_compile_options("$<$<C_COMPILER_ID:MSVC>:/utf-8>")
 22 |   add_compile_options("$<$<CXX_COMPILER_ID:MSVC>:/utf-8>")
 23 | endif()
 24 | 
 25 | if(ADA_LOGGING)
 26 |   add_compile_definitions(ADA_LOGGING=1)
 27 | endif()
 28 | 
 29 | if(ADA_INCLUDE_URL_PATTERN)
 30 |   add_compile_definitions(ADA_INCLUDE_URL_PATTERN=1)
 31 | else()
 32 |   add_compile_definitions(ADA_INCLUDE_URL_PATTERN=0)
 33 | endif()
 34 | 
 35 | if(ADA_TESTING)
 36 |   add_compile_definitions(ADA_TESTING=1)
 37 | endif()
 38 | 
 39 | include(${PROJECT_SOURCE_DIR}/cmake/add-cpp-test.cmake)
 40 | link_libraries(ada)
 41 | 
 42 | add_cpp_test(basic_fuzzer)
 43 | 
 44 | if(MSVC AND BUILD_SHARED_LIBS)
 45 |   # Copy the ada dll into the directory
 46 |   add_custom_command(TARGET basic_fuzzer PRE_BUILD        # Adds a pre-build event
 47 |     COMMAND ${CMAKE_COMMAND} -E copy_if_different  # which executes "cmake -E copy_if_different..."
 48 |         "$<TARGET_FILE:ada>"      # <--this is in-file
 49 |         "$<TARGET_FILE_DIR:basic_fuzzer>")                 # <--this is out-file path
 50 | endif()
 51 | 
 52 | if(MSVC AND BUILD_SHARED_LIBS)
 53 |   message(STATUS "For some tests we use Google Test and it fails when building a DLL.")
 54 |   message(STATUS "Thus the tests are disabled. Sorry.")
 55 | else()
 56 |   include(GoogleTest)
 57 |   add_executable(wpt_url_tests wpt_url_tests.cpp)
 58 |   if(ADA_INCLUDE_URL_PATTERN)
 59 |   add_executable(wpt_urlpattern_tests wpt_urlpattern_tests.cpp)
 60 |   endif()
 61 |   add_executable(url_components url_components.cpp)
 62 |   add_executable(basic_tests basic_tests.cpp)
 63 |   add_executable(from_file_tests from_file_tests.cpp)
 64 |   add_executable(ada_c ada_c.cpp)
 65 |   add_executable(url_search_params url_search_params.cpp)
 66 | 
 67 |   target_link_libraries(wpt_url_tests PRIVATE simdjson GTest::gtest_main)
 68 |   if(ADA_INCLUDE_URL_PATTERN)
 69 |   target_link_libraries(wpt_urlpattern_tests PRIVATE simdjson GTest::gtest_main)
 70 |   endif()
 71 |   target_link_libraries(url_components PRIVATE simdjson GTest::gtest_main)
 72 |   target_link_libraries(basic_tests PRIVATE simdjson GTest::gtest_main)
 73 |   target_link_libraries(from_file_tests PRIVATE simdjson GTest::gtest_main)
 74 |   target_link_libraries(ada_c PRIVATE simdjson GTest::gtest_main)
 75 |   target_link_libraries(url_search_params PRIVATE simdjson GTest::gtest_main)
 76 | 
 77 |   gtest_discover_tests(wpt_url_tests PROPERTIES TEST_DISCOVERY_TIMEOUT 600)
 78 |   if(ADA_INCLUDE_URL_PATTERN)
 79 |   gtest_discover_tests(wpt_urlpattern_tests PROPERTIES TEST_DISCOVERY_TIMEOUT 600)
 80 |   endif()
 81 |   gtest_discover_tests(url_components PROPERTIES TEST_DISCOVERY_TIMEOUT 600)
 82 |   gtest_discover_tests(basic_tests PROPERTIES TEST_DISCOVERY_TIMEOUT 600)
 83 |   gtest_discover_tests(from_file_tests PROPERTIES TEST_DISCOVERY_TIMEOUT 600)
 84 |   gtest_discover_tests(ada_c PROPERTIES TEST_DISCOVERY_TIMEOUT 600)
 85 |   gtest_discover_tests(url_search_params PROPERTIES TEST_DISCOVERY_TIMEOUT 600)
 86 | 
 87 |   # GCC releases older than 9 keep std::filesystem in the separate stdc++fs
 88 |   # library. wpt_urlpattern_tests is only created when ADA_INCLUDE_URL_PATTERN
 89 |   # is ON, so each target is checked for existence before it is referenced.
 90 |   if("${CMAKE_CXX_COMPILER_ID}" STREQUAL "GNU" AND CMAKE_CXX_COMPILER_VERSION VERSION_LESS 9)
 91 |     foreach(fs_target wpt_url_tests wpt_urlpattern_tests url_components url_search_params)
 92 |       if(TARGET ${fs_target})
 93 |         target_link_libraries(${fs_target} PUBLIC stdc++fs)
 94 |       endif()
 95 |     endforeach()
 96 |   endif()
 97 |   # Define _CRT_SECURE_NO_WARNINGS for the test programs on MSVC and MinGW.
 98 |   if(MSVC OR MINGW)
 99 |     foreach(crt_target wpt_url_tests wpt_urlpattern_tests url_components basic_fuzzer from_file_tests basic_tests url_search_params)
100 |       if(TARGET ${crt_target})
101 |         target_compile_definitions(${crt_target} PRIVATE _CRT_SECURE_NO_WARNINGS)
102 |       endif()
103 |     endforeach()
104 |   endif()
105 | 
106 | endif()
107 | 


--------------------------------------------------------------------------------
/tests/from_file_tests.cpp:
--------------------------------------------------------------------------------
 1 | #include "ada.h"
 2 | #include <cstdlib>
 3 | #include <iostream>
 4 | #include "gtest/gtest.h"
 5 | 
 6 | std::string long_way(std::string path) {
 7 |   auto file_url = ada::parse<ada::url>("file://");  // start from a bare file URL
 8 |   file_url->set_pathname(path);  // then assign the path through the setter
 9 |   return file_url->get_href();
10 | }
11 | 
12 | TEST(from_file_tests, basics) {  // href_from_file must agree with long_way
13 |   for (const std::string path :
14 |        {"", "fsfds", "C:\\\\blabala\\fdfds\\back.txt", "/home/user/txt.txt",
15 |         "/%2e.bar", "/foo/%2e%2", "/foo/..bar", "foo\t%91"}) {
16 |     ASSERT_EQ(long_way(path), ada::href_from_file(path)) << "path: " << path;
17 |   }
18 | }
19 | 


--------------------------------------------------------------------------------
/tests/installation/CMakeLists.txt:
--------------------------------------------------------------------------------
 1 | cmake_minimum_required(VERSION 3.15)
 2 | 
 3 | project(test_ada_install VERSION 0.1.0 LANGUAGES CXX)
 4 | 
 5 | set(CMAKE_CXX_STANDARD 20)
 6 | set(CMAKE_CXX_STANDARD_REQUIRED ON)
 7 | 
 8 | find_package(ada REQUIRED)
 9 | 
10 | # Example program (provide your own if you like); <cstdlib> is included because it returns EXIT_SUCCESS.
11 | file(WRITE main.cpp "
12 | #include \"ada.h\"
13 | #include <cstdlib>
14 | #include <iostream>
15 | int main(int , char *[]) {
16 |   ada::result<ada::url_aggregator> url = ada::parse<ada::url_aggregator>(\"https://www.google.com\");
17 |   url->set_protocol(\"http\");
18 |   std::cout << url->get_protocol() << std::endl;
19 |   std::cout << url->get_host() << std::endl;
20 |   return EXIT_SUCCESS;
21 | }")
22 | 
23 | add_executable(main main.cpp)
24 | target_link_libraries(main PUBLIC ada::ada)
25 | 


--------------------------------------------------------------------------------
/tests/wasm/CMakeLists.txt:
--------------------------------------------------------------------------------
 1 | link_libraries(ada)
 2 | # Node.js build of the WebAssembly module, compiled from wasm.cpp.
 3 | add_executable(wasm-node wasm.cpp)
 4 | set_property(TARGET wasm-node PROPERTY LINK_FLAGS "-Os -s ENVIRONMENT=node -s EXPORT_NAME=loadWASM -s MODULARIZE=1 --bind")
 5 | # Expand the CMake variables used by the test driver template.
 6 | configure_file(test.js.in test.js)
 7 | # The test is registered only when a Node.js interpreter is found.
 8 | find_program(NODEJS_BINARY NAMES node nodejs)
 9 | if(NODEJS_BINARY)
10 |   add_test(NAME wasmtest
11 |            COMMAND "${NODEJS_BINARY}" "${CMAKE_CURRENT_BINARY_DIR}/test.js")
12 | endif()
13 | 
14 | 


--------------------------------------------------------------------------------
/tests/wasm/test.js.in:
--------------------------------------------------------------------------------
 1 | const assert = require('node:assert');
 2 | const test = require('node:test');
 3 | const wasm = require('${CMAKE_CURRENT_BINARY_DIR}/wasm-node');
 4 | 
 5 | function toJS(obj) {
 6 |   const result = {};
 7 |   for (const key of Object.keys(obj.__proto__)) {
 8 |        result[key] = typeof obj[key] === "object" ? toJS(obj[key]) : obj[key];
 9 |   }
10 |   return result;
11 | }
12 | 
13 | const expected = {
14 |   "result": "success",
15 |   "href": "https://google.com/?q=Yagiz#Nizipli",
16 |   "type": 2,
17 |   "components": {
18 |     "protocol_end": 6,
19 |     "username_end": 8,
20 |     "host_start": 8,
21 |     "host_end": 18,
22 |     "port": 4294967295,
23 |     "pathname_start": 18,
24 |     "search_start": 19,
25 |     "hash_start": 27
26 |   }
27 | };
28 | 
29 | test('wasm', async () => {
30 |   const { parse } = await wasm();
31 |   assert.deepStrictEqual(toJS(parse('https://google.com/?q=Yagiz#Nizipli')), expected);
32 | });
33 | 
34 | 


--------------------------------------------------------------------------------
/tests/wasm/wasm.cpp:
--------------------------------------------------------------------------------
 1 | #include "ada.h"
 2 | #include <emscripten/emscripten.h>
 3 | #include <emscripten/bind.h>
 4 | 
 5 | using namespace emscripten;
 6 | 
 7 | struct parse_result {
 8 |   std::string result;  // "success" or "fail", as set by parse()
 9 |   std::string href;    // assigned by parse() on success only
10 |   uint32_t type = 0;   // zero by default so a failed parse never exposes an indeterminate value
11 |   ada::url_components components;  // assigned by parse() on success only
12 | };
13 | 
14 | parse_result parse(const std::string &input) {
15 |   // Parse into the url_aggregator representation. `result` always reports
16 |   // the outcome; the remaining fields are assigned only on success.
17 |   auto parsed = ada::parse<ada::url_aggregator>(input);
18 |   parse_result outcome;
19 |   outcome.result = parsed.has_value() ? "success" : "fail";
20 |   if (parsed.has_value()) {
21 |     outcome.href = std::string(parsed->get_href());
22 |     outcome.type = parsed->type;
23 |     outcome.components = parsed->get_components();
24 |   }
25 |   return outcome;
26 | }
27 | 
28 | EMSCRIPTEN_BINDINGS(url_components) {  // embind registrations for this module
29 |   class_<parse_result>("Result")  // parse_result is registered under the name "Result"
30 |       .property("result", &parse_result::result)
31 |       .property("href", &parse_result::href)
32 |       .property("type", &parse_result::type)
33 |       .property("components", &parse_result::components);
34 |   class_<ada::url_components>("URLComponents")  // registered under the name "URLComponents"
35 |       .property("protocol_end", &ada::url_components::protocol_end)
36 |       .property("username_end", &ada::url_components::username_end)
37 |       .property("host_start", &ada::url_components::host_start)
38 |       .property("host_end", &ada::url_components::host_end)
39 |       .property("port", &ada::url_components::port)
40 |       .property("pathname_start", &ada::url_components::pathname_start)
41 |       .property("search_start", &ada::url_components::search_start)
42 |       .property("hash_start", &ada::url_components::hash_start);
43 | 
44 |   function("parse", &parse);  // the free function parse() is registered as "parse"
45 | }


--------------------------------------------------------------------------------
/tests/wpt/CMakeLists.txt:
--------------------------------------------------------------------------------
1 | # Copy every JSON file found below this directory to the same relative path in the build tree.
2 | file(GLOB_RECURSE wpt_files RELATIVE ${CMAKE_CURRENT_SOURCE_DIR} *.json)
3 | foreach(json_fixture IN LISTS wpt_files)
4 |   configure_file(${json_fixture} ${json_fixture} COPYONLY)
5 | endforeach()
6 | 


--------------------------------------------------------------------------------
/tests/wpt/IdnaTestV2-removed.json:
--------------------------------------------------------------------------------
  1 | [
  2 |   "This is generated with the help from ../tools/IdnaTestV2-compare.py.",
  3 |   "These tests are from an older IdnaTestV2 and thus the comment line may no longer be accurate.",
  4 |   {
  5 |     "comment": "P1; V6; V3 (ignored)",
  6 |     "input": "-\udb40\ude56\ua867\uff0e\udb40\ude82\ud8dc\udd83\ud83c\udd09",
  7 |     "output": null
  8 |   },
  9 |   {
 10 |     "comment": "P1; V5; V6",
 11 |     "input": "\ud83c\udd04\uff0e\u1cdc\u2488\u00df",
 12 |     "output": null
 13 |   },
 14 |   {
 15 |     "comment": "P1; V5; V6",
 16 |     "input": "\ud83c\udd04\uff0e\u1cdc\u2488SS",
 17 |     "output": null
 18 |   },
 19 |   {
 20 |     "comment": "P1; V5; V6",
 21 |     "input": "\ud83c\udd04\uff0e\u1cdc\u2488ss",
 22 |     "output": null
 23 |   },
 24 |   {
 25 |     "comment": "P1; V5; V6",
 26 |     "input": "\ud83c\udd04\uff0e\u1cdc\u2488Ss",
 27 |     "output": null
 28 |   },
 29 |   {
 30 |     "comment": "C2; P1; V6",
 31 |     "input": "\u0756\u3002\u3164\u200d\u03c2",
 32 |     "output": null
 33 |   },
 34 |   {
 35 |     "comment": "C2; P1; V6",
 36 |     "input": "\u0756\u3002\u1160\u200d\u03c2",
 37 |     "output": null
 38 |   },
 39 |   {
 40 |     "comment": "C2; P1; V6",
 41 |     "input": "\u0756\u3002\u1160\u200d\u03a3",
 42 |     "output": null
 43 |   },
 44 |   {
 45 |     "comment": "C2; P1; V6",
 46 |     "input": "\u0756\u3002\u1160\u200d\u03c3",
 47 |     "output": null
 48 |   },
 49 |   {
 50 |     "comment": "C2; P1; V6",
 51 |     "input": "\u0756\u3002\u3164\u200d\u03a3",
 52 |     "output": null
 53 |   },
 54 |   {
 55 |     "comment": "C2; P1; V6",
 56 |     "input": "\u0756\u3002\u3164\u200d\u03c3",
 57 |     "output": null
 58 |   },
 59 |   {
 60 |     "comment": "P1; V6",
 61 |     "input": "\ud83c\udd07\u4f10\ufe12.\ud831\ude5a\ua8c4",
 62 |     "output": null
 63 |   },
 64 |   {
 65 |     "comment": "P1; V5; V6",
 66 |     "input": "\ud802\ude3f.\ud83c\udd06\u2014",
 67 |     "output": null
 68 |   },
 69 |   {
 70 |     "comment": "C2; P1; V5; V6",
 71 |     "input": "\u1c32\ud83c\udd08\u2f9b\u05a6\uff0e\u200d\uda7e\udd64\u07fd",
 72 |     "output": null
 73 |   },
 74 |   {
 75 |     "comment": "C2; P1; V5; V6",
 76 |     "input": "\ud83e\udc9f\ud83c\udd08\u200d\ua84e\uff61\u0f84",
 77 |     "output": null
 78 |   },
 79 |   {
 80 |     "comment": "P1; V6",
 81 |     "input": "\udaa5\udeaa\uff61\ud83c\udd02",
 82 |     "output": null
 83 |   },
 84 |   {
 85 |     "comment": "C2; P1; V6",
 86 |     "input": "\u186f\u2689\u59f6\ud83c\udd09\uff0e\u06f7\u200d\ud83c\udfaa\u200d",
 87 |     "output": null
 88 |   },
 89 |   {
 90 |     "comment": "C1; P1; V5; V6",
 91 |     "input": "\ua67d\u200c\ud87e\uddf5\ud83c\udd06\uff61\u200c\ud804\udc42\u1b01",
 92 |     "output": null
 93 |   },
 94 |   {
 95 |     "comment": "C1; P1; V5; V6",
 96 |     "input": "\ua67d\u200c\u9723\ud83c\udd06\uff61\u200c\ud804\udc42\u1b01",
 97 |     "output": null
 98 |   },
 99 |   {
100 |     "comment": "C1; P1; V5; V6; V3 (ignored)",
101 |     "input": "-\u1897\u200c\ud83c\udd04.\ud805\udf22",
102 |     "output": null
103 |   }
104 | ]
105 | 


--------------------------------------------------------------------------------
/tests/wpt/ada_extra_setters_tests.json:
--------------------------------------------------------------------------------
  1 | {
  2 |   "comment": [
  3 |     "#Additional tests designed by the ada team."
  4 |   ],
  5 |   "href": [
  6 |     {
  7 |       "comment": "Update with pathname, fragment and search state filled",
  8 |       "href": "https://yagiz.co",
  9 |       "new_value": "https://google.com/url?search=true#fragment",
 10 |       "expected": {
 11 |         "href": "https://google.com/url?search=true#fragment"
 12 |       }
 13 |     },
 14 |     {
 15 |       "comment": "Update with authority state filled",
 16 |       "href": "https://yagiz.co",
 17 |       "new_value": "https://username:password@localhost:5432/my-db",
 18 |       "expected": {
 19 |         "href": "https://username:password@localhost:5432/my-db"
 20 |       }
 21 |     },
 22 |     {
 23 |       "comment": "Removes leading and trailing control characters",
 24 |       "href": "https://yagiz.co",
 25 |       "new_value": "\u0000http://www.google.com\u0000",
 26 |       "expected": {
 27 |         "href": "http://www.google.com/"
 28 |       }
 29 |     }
 30 |   ],
 31 |   "port": [
 32 |     {
 33 |       "comment": "Should not update on leading control characters",
 34 |       "href": "https://yagiz.co:443",
 35 |       "new_value": "\u000080\u0000",
 36 |       "expected": {
 37 |         "port": ""
 38 |       }
 39 |     },
 40 |     {
 41 |       "comment": "Leading u0009 on special scheme",
 42 |       "href": "https://yagiz.co:443",
 43 |       "new_value": "\u00098080",
 44 |       "expected": {
 45 |         "port": "8080"
 46 |       }
 47 |     },
 48 |     {
 49 |       "comment": "Leading u0009 on non-special scheme",
 50 |       "href": "wpt++://yagiz.co:443",
 51 |       "new_value": "\u00098080",
 52 |       "expected": {
 53 |         "port": "8080"
 54 |       }
 55 |     },
 56 |     {
 57 |       "comment": "Trailing control characters",
 58 |       "href": "https://yagiz.co:443",
 59 |       "new_value": "8080\u0000",
 60 |       "expected": {
 61 |         "port": "8080"
 62 |       }
 63 |     },
 64 |     {
 65 |       "href": "https://yagiz.co",
 66 |       "new_value": "\u000044\u00093\u0000",
 67 |       "expected": {
 68 |         "port": ""
 69 |       }
 70 |     },
 71 |     {
 72 |       "href": "https://yagiz.co:443",
 73 |       "new_value": "\u0000\u0009\u0000",
 74 |       "expected": {
 75 |         "port": ""
 76 |       }
 77 |     },
 78 |     {
 79 |       "comment": "Should remove port on invalid input",
 80 |       "href": "https://www.google.com:443",
 81 |       "new_value": "99999",
 82 |       "expected": {
 83 |         "port": ""
 84 |       }
 85 |     },
 86 |     {
 87 |       "comment": "Should revert back to original on invalid input",
 88 |       "href": "https://www.google.com:4343",
 89 |       "new_value": "yagiz",
 90 |       "expected": {
 91 |         "port": "4343"
 92 |       }
 93 |     },
 94 |     {
 95 |       "comment": "Should use all ascii prefixed characters as port",
 96 |       "href": "https://www.google.com:4343",
 97 |       "new_value": "4yagiz",
 98 |       "expected": {
 99 |         "port": "4"
100 |       }
101 |     }
102 |   ],
103 |   "hash": [
104 |     {
105 |       "comment": "Should not trim leading and trailing control characters",
106 |       "href": "https://domain.com",
107 |       "new_value": "\u0000hello\u0000",
108 |       "expected": {
109 |         "hash": "#%00hello%00"
110 |       }
111 |     }
112 |   ],
113 |   "pathname": [
114 |     {
115 |       "comment": "Used by Node.js by node::url::FromFilePath",
116 |       "href": "file://",
117 |       "new_value": "/Users/yagiz/Developer/node/test/fixtures/loop.%25.js",
118 |       "expected": {
119 |         "pathname": "/Users/yagiz/Developer/node/test/fixtures/loop.%25.js"
120 |       }
121 |     }
122 |   ],
123 |   "search": [
124 |     {
125 |       "comment": "Remove non-existent param removes ? from URL",
126 |       "href": "data:space    ?test",
127 |       "new_value": "",
128 |       "expected": {
129 |         "search": "",
130 |         "pathname": "space   %20"
131 |       }
132 |     }
133 |   ]
134 | }
135 | 


--------------------------------------------------------------------------------
/tests/wpt/ada_long_urltestdata.json:
--------------------------------------------------------------------------------
 1 | [
 2 |   "# Windows' codebase will not allow this case for now.",
 3 |   "# Host",
 4 |   {
 5 |     "input": "http://ğığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığığı.com",
 6 |     "base": "about:blank",
 7 |     "href": "http://xn--teaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa78hbabbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbb.com/",
 8 |     "origin": "http://xn--teaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa78hbabbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbb.com",
 9 |     "protocol": "http:",
10 |     "username": "",
11 |     "password": "",
12 |     "host": "xn--teaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa78hbabbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbb.com",
13 |     "hostname": "xn--teaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa78hbabbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbbb.com",
14 |     "port": "",
15 |     "pathname": "/",
16 |     "search": "",
17 |     "hash": ""
18 |   }
19 | ]
20 | 


--------------------------------------------------------------------------------
/tests/wpt/percent-encoding.json:
--------------------------------------------------------------------------------
 1 | [
 2 |   "Tests for percent-encoding.",
 3 |   {
 4 |     "input": "\u2020",
 5 |     "output": {
 6 |       "big5": "%26%238224%3B",
 7 |       "euc-kr": "%A2%D3",
 8 |       "utf-8": "%E2%80%A0",
 9 |       "windows-1252": "%86"
10 |     }
11 |   },
12 |   "This uses a trailing A to prevent the URL parser from trimming the C0 control.",
13 |   {
14 |     "input": "\u000EA",
15 |     "output": {
16 |       "big5": "%0EA",
17 |       "iso-2022-jp": "%26%2365533%3BA",
18 |       "utf-8": "%0EA"
19 |     }
20 |   },
21 |   {
22 |     "input": "\u203E\u005C",
23 |     "output": {
24 |       "iso-2022-jp": "%1B(J~%1B(B\\",
25 |       "utf-8": "%E2%80%BE\\"
26 |     }
27 |   },
28 |   {
29 |     "input": "\uE5E5",
30 |     "output": {
31 |       "gb18030": "%26%2358853%3B",
32 |       "utf-8": "%EE%97%A5"
33 |     }
34 |   },
35 |   {
36 |     "input": "\u2212",
37 |     "output": {
38 |       "shift_jis": "%81|",
39 |       "utf-8": "%E2%88%92"
40 |     }
41 |   },
42 |   {
43 |     "input": "á|",
44 |     "output": {
45 |       "utf-8": "%C3%A1|"
46 |     }
47 |   }
48 | ]
49 | 


--------------------------------------------------------------------------------
/tests/wpt/urlpattern-compare-test-data.json:
--------------------------------------------------------------------------------
  1 | [
  2 |   {
  3 |     "component": "pathname",
  4 |     "left": { "pathname": "/foo/a" },
  5 |     "right": { "pathname": "/foo/b" },
  6 |     "expected": -1
  7 |   },
  8 |   {
  9 |     "component": "pathname",
 10 |     "left": { "pathname": "/foo/b" },
 11 |     "right": { "pathname": "/foo/bar" },
 12 |     "expected": -1
 13 |   },
 14 |   {
 15 |     "component": "pathname",
 16 |     "left": { "pathname": "/foo/bar" },
 17 |     "right": { "pathname": "/foo/:bar" },
 18 |     "expected": 1
 19 |   },
 20 |   {
 21 |     "component": "pathname",
 22 |     "left": { "pathname": "/foo/" },
 23 |     "right": { "pathname": "/foo/:bar" },
 24 |     "expected": 1
 25 |   },
 26 |   {
 27 |     "component": "pathname",
 28 |     "left": { "pathname": "/foo/:bar" },
 29 |     "right": { "pathname": "/foo/*" },
 30 |     "expected": 1
 31 |   },
 32 |   {
 33 |     "component": "pathname",
 34 |     "left": { "pathname": "/foo/{bar}" },
 35 |     "right": { "pathname": "/foo/(bar)" },
 36 |     "expected": 1
 37 |   },
 38 |   {
 39 |     "component": "pathname",
 40 |     "left": { "pathname": "/foo/{bar}" },
 41 |     "right": { "pathname": "/foo/{bar}+" },
 42 |     "expected": 1
 43 |   },
 44 |   {
 45 |     "component": "pathname",
 46 |     "left": { "pathname": "/foo/{bar}+" },
 47 |     "right": { "pathname": "/foo/{bar}?" },
 48 |     "expected": 1
 49 |   },
 50 |   {
 51 |     "component": "pathname",
 52 |     "left": { "pathname": "/foo/{bar}?" },
 53 |     "right": { "pathname": "/foo/{bar}*" },
 54 |     "expected": 1
 55 |   },
 56 |   {
 57 |     "component": "pathname",
 58 |     "left": { "pathname": "/foo/(123)" },
 59 |     "right": { "pathname": "/foo/(12)" },
 60 |     "expected": 1
 61 |   },
 62 |   {
 63 |     "component": "pathname",
 64 |     "left": { "pathname": "/foo/:b" },
 65 |     "right": { "pathname": "/foo/:a" },
 66 |     "expected": 0
 67 |   },
 68 |   {
 69 |     "component": "pathname",
 70 |     "left": { "pathname": "*/foo" },
 71 |     "right": { "pathname": "*" },
 72 |     "expected": 1
 73 |   },
 74 |   {
 75 |     "component": "port",
 76 |     "left": { "port": "9" },
 77 |     "right": { "port": "100" },
 78 |     "expected": 1
 79 |   },
 80 |   {
 81 |     "component": "pathname",
 82 |     "left": { "pathname": "foo/:bar?/baz" },
 83 |     "right": { "pathname": "foo/{:bar}?/baz" },
 84 |     "expected": -1
 85 |   },
 86 |   {
 87 |     "component": "pathname",
 88 |     "left": { "pathname": "foo/:bar?/baz" },
 89 |     "right": { "pathname": "foo{/:bar}?/baz" },
 90 |     "expected": 0
 91 |   },
 92 |   {
 93 |     "component": "pathname",
 94 |     "left": { "pathname": "foo/:bar?/baz" },
 95 |     "right": { "pathname": "fo{o/:bar}?/baz" },
 96 |     "expected": 1
 97 |   },
 98 |   {
 99 |     "component": "pathname",
100 |     "left": { "pathname": "foo/:bar?/baz" },
101 |     "right": { "pathname": "foo{/:bar/}?baz" },
102 |     "expected": -1
103 |   },
104 |   {
105 |     "component": "pathname",
106 |     "left": "https://a.example.com/b?a",
107 |     "right": "https://b.example.com/a?b",
108 |     "expected": 1
109 |   },
110 |   {
111 |     "component": "pathname",
112 |     "left": { "pathname": "/foo/{bar}/baz" },
113 |     "right": { "pathname": "/foo/bar/baz" },
114 |     "expected": 0
115 |   },
116 |   {
117 |     "component": "protocol",
118 |     "left": { "protocol": "a" },
119 |     "right": { "protocol": "b" },
120 |     "expected": -1
121 |   },
122 |   {
123 |     "component": "username",
124 |     "left": { "username": "a" },
125 |     "right": { "username": "b" },
126 |     "expected": -1
127 |   },
128 |   {
129 |     "component": "password",
130 |     "left": { "password": "a" },
131 |     "right": { "password": "b" },
132 |     "expected": -1
133 |   },
134 |   {
135 |     "component": "hostname",
136 |     "left": { "hostname": "a" },
137 |     "right": { "hostname": "b" },
138 |     "expected": -1
139 |   },
140 |   {
141 |     "component": "search",
142 |     "left": { "search": "a" },
143 |     "right": { "search": "b" },
144 |     "expected": -1
145 |   },
146 |   {
147 |     "component": "hash",
148 |     "left": { "hash": "a" },
149 |     "right": { "hash": "b" },
150 |     "expected": -1
151 |   }
152 | ]
153 | 


--------------------------------------------------------------------------------
/tests/wpt/urltestdata-javascript-only.json:
--------------------------------------------------------------------------------
 1 | [
 2 |     "See ../README.md for a description of the format.",
 3 |     {
 4 |         "input": "http://example.com/\uD800\uD801\uDFFE\uDFFF\uFDD0\uFDCF\uFDEF\uFDF0\uFFFE\uFFFF?\uD800\uD801\uDFFE\uDFFF\uFDD0\uFDCF\uFDEF\uFDF0\uFFFE\uFFFF",
 5 |         "base": null,
 6 |         "href": "http://example.com/%EF%BF%BD%F0%90%9F%BE%EF%BF%BD%EF%B7%90%EF%B7%8F%EF%B7%AF%EF%B7%B0%EF%BF%BE%EF%BF%BF?%EF%BF%BD%F0%90%9F%BE%EF%BF%BD%EF%B7%90%EF%B7%8F%EF%B7%AF%EF%B7%B0%EF%BF%BE%EF%BF%BF",
 7 |         "origin": "http://example.com",
 8 |         "protocol": "http:",
 9 |         "username": "",
10 |         "password": "",
11 |         "host": "example.com",
12 |         "hostname": "example.com",
13 |         "port": "",
14 |         "pathname": "/%EF%BF%BD%F0%90%9F%BE%EF%BF%BD%EF%B7%90%EF%B7%8F%EF%B7%AF%EF%B7%B0%EF%BF%BE%EF%BF%BF",
15 |         "search": "?%EF%BF%BD%F0%90%9F%BE%EF%BF%BD%EF%B7%90%EF%B7%8F%EF%B7%AF%EF%B7%B0%EF%BF%BE%EF%BF%BF",
16 |         "hash": ""
17 |     }
18 | ]
19 | 


--------------------------------------------------------------------------------
/tests/wpt/verifydnslength_tests.json:
--------------------------------------------------------------------------------
 1 | [
 2 |   "Tests for the verify_dns_length function. See the section 2.3.4 of https://www.ietf.org/rfc/rfc1035.txt .",
 3 |   {
 4 |     "message": "A domain label must be a minimum of 1 character and a maximum of 63 characters. 1",
 5 |     "input": "http://lorenlorenlorenlorenlorenlorenlorenlorenlorenlorenlorenlorenlore.com",
 6 |     "failure": true
 7 |   },
 8 |   {
 9 |     "message": "A domain label must be a minimum of 1 character and a maximum of 63 characters. 2",
10 |     "input": "http://br.lorenlorenlorenlorenlorenlorenlorenlorenlorenlorenlorenlorenlore.org/",
11 |     "failure": true
12 |   },
13 |   {
14 |     "message": "A domain label must be a minimum of 1 character and a maximum of 63 characters. 3",
15 |     "input": "http://exampleexampleexampleexampleexampleexampleexampleexampleexampleexample.lorenlorenlorenlorenlorenlorenlorenlorenlorenlorenlorenlorenlore.org.br/",
16 |     "failure": true
17 |   },
18 |   {
19 |     "message": "A domain label must be a minimum of 1 character and a maximum of 63 characters. 4",
20 |     "input": "http://br.exampleexampleexampleexampleexampleexampleexampleexampleexampleexample.lorenlorenlorenlorenlorenlorenlorenlorenlorenlorenlorenlorenlore",
21 |     "failure": true
22 |   },
23 |   {
24 |     "message": "A domain label must be a minimum of 1 character and a maximum of 63 characters. 4",
25 |     "input": "http://example..com.br",
26 |     "failure": true
27 |   },
28 |   {
29 |     "message": "A domain label must be a minimum of 1 character and a maximum of 63 characters. 4",
30 |     "input": "http://example.com.br..",
31 |     "failure": true
32 |   },
33 |   {
34 |     "message": "A domain label must be a minimum of 1 character and a maximum of 63 characters. 4",
35 |     "input": "http://example.com.br....",
36 |     "failure": true
37 |   },
38 |   {
39 |     "message": "A domain label must be a minimum of 1 character and a maximum of 63 characters. 4",
40 |     "input": "http://.example.com.br",
41 |     "failure": true
42 |   },
43 |   {
44 |     "message": "A domain label must be a minimum of 1 character and a maximum of 63 characters. 4",
45 |     "input": "http://example.com..br",
46 |     "failure": true
47 |   },
48 |   {
49 |     "message": "A domain name must be a maximum of 253 characters (or 254 if there is a dot at the end). 1",
50 |     "input": "http://example.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br",
51 |     "failure": true
52 |   },
53 |   {
54 |     "message": "A domain name must be a maximum of 253 characters (or 254 if there is a dot at the end). 4",
55 |     "input": "http://example.com.",
56 |     "failure": false
57 |   },
58 |   {
59 |     "message": "A domain name must be a maximum of 253 characters (or 254 if there is a dot at the end). 2",
60 |     "input": "http://example.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.comm.br.",
61 |     "failure": false
62 |   },
63 |   {
64 |     "message": "A domain name must be a maximum of 253 characters (or 254 if there is a dot at the end). 3",
65 |     "input": "http://example.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.comm.br",
66 |     "failure": false
67 |   },
68 |   {
69 |     "message": "A domain name must be a maximum of 253 characters (or 254 if there is a dot at the end). 3",
70 |     "input": "http://example.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.com.br.comm.br.",
71 |     "failure": false
72 |   },
73 |   {
74 |     "message": "A domain name must be a maximum of 253 characters (or 254 if there is a dot at the end). 6",
75 |     "input": "http://aaaaaaaaaaaaaaaaaaaaaaaa.aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa.aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa.aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa.aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa.aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa.aaaaaaaaaaaaaaaaaaaa.com",
76 |     "failure": false
77 |   },
78 |   {
79 |     "message": "A domain name must be a maximum of 253 characters (or 254 if there is a dot at the end). 6",
80 |     "input": "http://example.com.",
81 |     "failure": false
82 |   },
83 |   {
84 |     "message": "A domain name must be a maximum of 253 characters (or 254 if there is a dot at the end). 6",
85 |     "input": "http://example.com./",
86 |     "failure": false
87 |   }
88 | ]
89 | 


--------------------------------------------------------------------------------
/tools/CMakeLists.txt:
--------------------------------------------------------------------------------
1 | add_subdirectory(cli)


--------------------------------------------------------------------------------
/tools/cli/CMakeLists.txt:
--------------------------------------------------------------------------------
 1 | add_executable(adaparse adaparse.cpp line_iterator.h)
 2 | target_link_libraries(adaparse PRIVATE ada)
 3 | target_include_directories(adaparse PUBLIC "$<BUILD_INTERFACE:${PROJECT_SOURCE_DIR}/include>")
 4 | 
 5 | 
 6 | if(CMAKE_CXX_COMPILER_ID STREQUAL "AppleClang")
 7 |   # AppleClang means an Apple platform: ask the linker to strip dead code
 8 |   # and enable LTO to reduce the size of the final binary.
 9 |   # -flto is passed to both the compile step and the link step.
10 |   message(STATUS "Apple platform detected, using dead_strip and LTO")
11 |   target_compile_options(adaparse PRIVATE "-flto")
12 |   target_link_options(adaparse PRIVATE "-Wl,-dead_strip" "-flto")
13 | endif()
14 | 
15 | if((CMAKE_CXX_COMPILER_ID STREQUAL "GNU") OR (CMAKE_CXX_COMPILER_ID STREQUAL "Clang"))
16 |   execute_process(COMMAND ${CMAKE_CXX_COMPILER} -print-libgcc-file-name OUTPUT_VARIABLE ADA_GCC_LIB)
17 |   get_filename_component(ADA_GCC_DIR "${ADA_GCC_LIB}" DIRECTORY)
18 |   message(STATUS "looking for static C++ library in " ${ADA_GCC_DIR})
19 |   find_library(LIBSTDCPP libstdc++.a PATHS "${ADA_GCC_DIR}")
20 |   if(LIBSTDCPP)
21 |     # static linking for speed
22 |     message(STATUS "libstdc++.a found")
23 |     target_link_options(adaparse PRIVATE "-static-libstdc++")
24 |   else()
25 |     message(STATUS "libstdc++.a not found")
26 |   endif()
27 |   # GNU/upstream Clang can also target macOS, whose linker rejects --gc-sections; drop unused sections elsewhere only.
28 |   if(NOT APPLE)
29 |     target_link_options(adaparse PRIVATE "-Wl,--gc-sections")
30 |   endif()
31 | endif()
32 | 
33 | if(MSVC AND BUILD_SHARED_LIBS)
34 |   # Copy the ada dll into the directory
35 |   add_custom_command(TARGET adaparse POST_BUILD        # Adds a post-build event
36 |     COMMAND ${CMAKE_COMMAND} -E copy_if_different  # which executes "cmake -E copy_if_different..."
37 |         "$<TARGET_FILE:ada>"      # <--this is in-file
38 |         "$<TARGET_FILE_DIR:adaparse>")                 # <--this is out-file path
39 | endif()
40 | CPMAddPackage("gh:fmtlib/fmt#11.0.2")
41 | CPMAddPackage(
42 |   GITHUB_REPOSITORY jarro2783/cxxopts
43 |   VERSION 3.2.0
44 |   OPTIONS "CXXOPTS_BUILD_EXAMPLES NO" "CXXOPTS_BUILD_TESTS NO" "CXXOPTS_ENABLE_INSTALL YES"
45 | )
46 | target_link_libraries(adaparse PRIVATE cxxopts::cxxopts fmt::fmt)
47 | 
48 | if(MSVC OR MINGW)
49 |   target_compile_definitions(adaparse PRIVATE _CRT_SECURE_NO_WARNINGS _CRT_NONSTDC_NO_DEPRECATE)
50 | endif()
51 | 
52 | install(
53 |    TARGETS
54 |     adaparse
55 |    ARCHIVE DESTINATION ${CMAKE_INSTALL_LIBDIR}
56 |    LIBRARY DESTINATION ${CMAKE_INSTALL_LIBDIR}
57 |    RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR}
58 | )
59 | 


--------------------------------------------------------------------------------
/tools/cli/benchmark_adaparse.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/bash
 2 | 
 3 | echo "Benchmarking piping function"
 4 | 
 5 | # Set the number of trials
 6 | num_trials=50
 7 | 
 8 | if [ -f "linux_files.txt" ]; then
 9 |     echo "linux_files.txt exists."
10 | else 
11 |     echo "downloading linux_files.txt."
12 |     curl https://raw.githubusercontent.com/ada-url/url-various-datasets/main/files/linux_files.txt -O
13 | fi
14 | 
15 | if [ -f "wikipedia_100k.txt" ]; then
16 |     echo "wikipedia_100k.txt exists."
17 | else 
18 |     echo "downloading wikipedia_100k.txt."
19 |     curl https://raw.githubusercontent.com/ada-url/url-various-datasets/main/wikipedia/wikipedia_100k.txt -O
20 | fi
21 | 
22 | if [ -f "top100.txt" ]; then
23 |     echo "top100.txt exists."
24 | else 
25 |     echo "downloading top100.txt."
26 |     curl https://raw.githubusercontent.com/ada-url/url-various-datasets/main/top100/top100.txt -O
27 | fi
28 | 
29 | # File list to benchmark against
30 | files=("top100.txt" "linux_files.txt" "wikipedia_100k.txt" )
31 | 
32 | # Run the programs for the specified number of trials
33 | for file in "${files[@]}"; do
34 |   echo "Benchmarking $file"
35 | 
36 |   # Variables to store the sum of the Gb/s values for each program
37 |   sum_fastpipespeed=0
38 | 
39 |   for i in $(seq 1 $num_trials); do
40 |       result_fastspeed=$(cat $file | ../../build/tools/adaparse --benchmark 2>&1 | tail -1 | grep -oP '\d+(\.\d+)?') 
41 |       sum_fastpipespeed=$(echo "$sum_fastpipespeed + $result_fastspeed" | bc)
42 |   done
43 | 
44 |   # Compute the averages
45 |   avg_fastpipespeed=$(echo "scale=7; $sum_fastpipespeed / $num_trials" | bc)
46 | 
47 |   # Display the results
48 |   echo "------------------------------"
49 |   echo "Finished benchmarking $file"
50 |   echo "Number of trials: $num_trials"
51 |   echo "Average Gb/s for fastpipespeed: $avg_fastpipespeed"
52 | 
53 |   echo "----------------------------"
54 | 
55 | 
56 | 
57 |   echo ""
58 | done
59 | 


--------------------------------------------------------------------------------
/tools/cli/benchmark_write_to_file.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/bash
 2 | 
 3 | echo "Benchmarking writing to file from pipe."
 4 | 
 5 | # Set the number of trials
 6 | num_trials=50
 7 | 
 8 | if [ -f "linux_files.txt" ]; then
 9 |     echo "linux_files.txt exists."
10 | else 
11 |     echo "downloading linux_files.txt."
12 |     curl https://raw.githubusercontent.com/ada-url/url-various-datasets/main/files/linux_files.txt -O
13 | fi
14 | 
15 | if [ -f "wikipedia_100k.txt" ]; then
16 |     echo "wikipedia_100k.txt exists."
17 | else 
18 |     echo "downloading wikipedia_100k.txt."
19 |     curl https://raw.githubusercontent.com/ada-url/url-various-datasets/main/wikipedia/wikipedia_100k.txt -O
20 | fi
21 | 
22 | if [ -f "top100.txt" ]; then
23 |     echo "top100.txt exists."
24 | else 
25 |     echo "downloading top100.txt."
26 |     curl https://raw.githubusercontent.com/ada-url/url-various-datasets/main/top100/top100.txt -O
27 | fi
28 | 
29 | # File list to benchmark against
30 | files=("top100.txt" "linux_files.txt" "wikipedia_100k.txt" )
31 | 
32 | # Run the programs for the specified number of trials
33 | for file in "${files[@]}"; do
34 |   echo "Benchmarking $file"
35 | 
36 |   # Variables to store the sum of the Gb/s values for each program
37 |   sum_fastpipespeed=0
38 | 
39 |   for i in $(seq 1 $num_trials); do
40 |       result_fastspeed=$(cat $file | ../../build/tools/adaparse --benchmark --output test_write_speeds.txt 2>&1 | tail -1 | grep -oP '\d+(\.\d+)?') 
41 |       sum_fastpipespeed=$(echo "$sum_fastpipespeed + $result_fastspeed" | bc)
42 |   done
43 | 
44 |   # Compute the averages
45 |   avg_fastpipespeed=$(echo "scale=7; $sum_fastpipespeed / $num_trials" | bc)
46 | 
47 |   # Display the results
48 |   echo "------------------------------"
49 |   echo "Finished benchmarking $file"
50 |   echo "Number of trials: $num_trials"
51 |   echo "Average Gb/s for fastpipespeed: $avg_fastpipespeed"
52 | 
53 |   echo "----------------------------"
54 | 
55 | 
56 | 
57 |   echo ""
58 | done
59 | 


--------------------------------------------------------------------------------
/tools/cli/line_iterator.h:
--------------------------------------------------------------------------------
 1 | #ifndef LINE_ITERATOR_H
 2 | #define LINE_ITERATOR_H
 3 | 
 4 | #include <string_view>
 5 | 
 6 | struct line_iterator {
 7 |   std::string_view all_text{};
 8 |   size_t next_end_of_line{0};
 9 |   line_iterator(const char *_buffer, size_t _len) : all_text(_buffer, _len) {}
10 | 
11 |   inline bool find_another_complete_line() noexcept {
12 |     next_end_of_line = all_text.find('\n');
13 |     return next_end_of_line != std::string_view::npos;
14 |   }
15 | 
16 |   inline operator bool() const noexcept {
17 |     return next_end_of_line != std::string_view::npos;
18 |   }
19 | 
20 |   inline std::string_view grab_line() noexcept {
21 |     auto line = all_text.substr(0, next_end_of_line);  // advance to next EOL
22 |     // remove anything prior to said EOL
23 |     all_text.remove_prefix(next_end_of_line + 1);
24 |     return line;
25 |   }
26 | 
27 |   inline size_t tail() const noexcept { return all_text.size(); }
28 | };
29 | 
30 | #endif


--------------------------------------------------------------------------------
/tools/prepare-doxygen.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/sh
 2 | set -e
 3 | 
 4 | PACKAGE_URL="https://github.com/jothepro/doxygen-awesome-css.git"
 5 | PACKAGE_VERSION="v2.3.3"
 6 | 
 7 | BASE_DIR=$(pwd)
 8 | THEME_DIR="$BASE_DIR/docs/theme"
 9 | WORKSPACE=$(mktemp -d 2> /dev/null || mktemp -d -t 'tmp')
10 | 
11 | cleanup () {
12 |   EXIT_CODE=$?
13 |   [ -d "$WORKSPACE" ] && rm -rf "$WORKSPACE"
14 |   exit $EXIT_CODE
15 | }
16 | 
17 | trap cleanup INT TERM EXIT
18 | 
19 | cd "$WORKSPACE"
20 | git clone --depth=1 --branch "$PACKAGE_VERSION" "$PACKAGE_URL" theme
21 | rm -rf "$THEME_DIR"
22 | mv "$WORKSPACE/theme" "$THEME_DIR"
23 | 


--------------------------------------------------------------------------------
/tools/release/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ada-url/ada/667c3cd123992949f8b2ce2455fb555d69b77c7e/tools/release/__init__.py


--------------------------------------------------------------------------------
/tools/release/create_release.py:
--------------------------------------------------------------------------------
 1 | #!/usr/bin/env python3
 2 | 
 3 | from os import environ, path
 4 | from github import Github
 5 | from lib.release import create_release
 6 | 
 7 | WORK_DIR = path.dirname(path.abspath(__file__)).replace('/tools/release', '')
 8 | 
 9 | NEXT_TAG = environ.get('NEXT_RELEASE_TAG', None)
10 | REPO_NAME = environ.get('GITHUB_REPOSITORY', None)
11 | TOKEN = environ.get('GITHUB_TOKEN', None)
12 | if not NEXT_TAG or not REPO_NAME or not TOKEN:
13 |     raise Exception('Bad environment variables. Invalid GITHUB_REPOSITORY, GITHUB_TOKEN or NEXT_RELEASE_TAG')
14 | 
15 | g = Github(TOKEN)
16 | repository = g.get_repo(REPO_NAME)
17 | 
18 | release = create_release(repository, NEXT_TAG)
19 | release.upload_asset('singleheader/ada.cpp')
20 | release.upload_asset('singleheader/ada.h')
21 | release.upload_asset('singleheader/ada_c.h')
22 | release.upload_asset('singleheader/singleheader.zip')
23 | 


--------------------------------------------------------------------------------
/tools/release/lib/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ada-url/ada/667c3cd123992949f8b2ce2455fb555d69b77c7e/tools/release/lib/__init__.py


--------------------------------------------------------------------------------
/tools/release/lib/release.py:
--------------------------------------------------------------------------------
 1 | #!/usr/bin/env python3
 2 | 
 3 | import re
 4 | from github import Repository, GitRelease
 5 | 
 6 | 
 7 | def is_valid_tag(tag: str) -> bool:
 8 |     tag_regex = r'^v\d+\.\d+\.\d+$'
 9 |     return bool(re.match(tag_regex, tag))
10 | 
11 | 
def create_release(repository: Repository, tag: str) -> GitRelease:
    """Publish a release named after ``tag`` on ``repository``.

    The release is neither a draft nor a pre-release, and release notes are
    generated automatically.

    Raises:
        Exception: if ``tag`` is rejected by ``is_valid_tag``, or if the
            ``create_git_release`` call fails (the original error is chained).
    """
    tag_ok = is_valid_tag(tag)
    if not tag_ok:
        raise Exception(f'Invalid tag: {tag}')

    release_options = {
        'tag': tag,
        'name': tag,
        'draft': False,
        'prerelease': False,
        'generate_release_notes': True,
    }
    try:
        published = repository.create_git_release(**release_options)
    except Exception as exp:
        raise Exception(f'create_release: Error creating release/tag {tag}: {exp!s}') from exp
    return published
22 | 


--------------------------------------------------------------------------------
/tools/release/lib/tests/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ada-url/ada/667c3cd123992949f8b2ce2455fb555d69b77c7e/tools/release/lib/tests/__init__.py


--------------------------------------------------------------------------------
/tools/release/lib/tests/samples/ada_version_h.txt:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * @file ada_version.h
 3 |  * @brief Definitions for Ada's version number.
 4 |  */
 5 | #ifndef ADA_ADA_VERSION_H
 6 | #define ADA_ADA_VERSION_H
 7 | 
 8 | #define ADA_VERSION "1.0.0"
 9 | 
10 | namespace ada {
11 | 
12 | enum {
13 |   ADA_VERSION_MAJOR = 1,
14 |   ADA_VERSION_MINOR = 0,
15 |   ADA_VERSION_REVISION = 0,
16 | };
17 | 
18 | }  // namespace ada
19 | 
20 | #endif  // ADA_ADA_VERSION_H
21 | 


--------------------------------------------------------------------------------
/tools/release/lib/tests/samples/ada_version_h_expected.txt:
--------------------------------------------------------------------------------
 1 | /**
 2 |  * @file ada_version.h
 3 |  * @brief Definitions for Ada's version number.
 4 |  */
 5 | #ifndef ADA_ADA_VERSION_H
 6 | #define ADA_ADA_VERSION_H
 7 | 
 8 | #define ADA_VERSION "2.0.0"
 9 | 
10 | namespace ada {
11 | 
12 | enum {
13 |   ADA_VERSION_MAJOR = 2,
14 |   ADA_VERSION_MINOR = 0,
15 |   ADA_VERSION_REVISION = 0,
16 | };
17 | 
18 | }  // namespace ada
19 | 
20 | #endif  // ADA_ADA_VERSION_H
21 | 


--------------------------------------------------------------------------------
/tools/release/lib/tests/samples/cmakelists.txt:
--------------------------------------------------------------------------------
 1 | cmake_minimum_required(VERSION 3.16)
 2 | 
 3 | project(ada
 4 |   DESCRIPTION "Fast spec-compliant URL parser"
 5 |   LANGUAGES C CXX
 6 |   VERSION 1.0.0
 7 | )
 8 | 
 9 | set(ADA_LIB_VERSION "1.0.0" CACHE STRING "ada library version")
10 | set(ADA_LIB_SOVERSION "1" CACHE STRING "ada library soversion")
11 | 


--------------------------------------------------------------------------------
/tools/release/lib/tests/samples/cmakelists_expected.txt:
--------------------------------------------------------------------------------
 1 | cmake_minimum_required(VERSION 3.16)
 2 | 
 3 | project(ada
 4 |   DESCRIPTION "Fast spec-compliant URL parser"
 5 |   LANGUAGES C CXX
 6 |   VERSION 2.0.0
 7 | )
 8 | 
 9 | set(ADA_LIB_VERSION "2.0.0" CACHE STRING "ada library version")
10 | set(ADA_LIB_SOVERSION "2" CACHE STRING "ada library soversion")
11 | 


--------------------------------------------------------------------------------
/tools/release/lib/tests/samples/doxygen.txt:
--------------------------------------------------------------------------------
 1 | # Doxyfile 1.9.6
 2 | 
 3 | # This file describes the settings to be used by the documentation system
 4 | # doxygen (www.doxygen.org) for a project.
 5 | #
 6 | # All text after a double hash (##) is considered a comment and is placed in
 7 | # front of the TAG it is preceding.
 8 | #
 9 | # All text after a single hash (#) is considered a comment and will be ignored.
10 | # The format is:
11 | # TAG = value [value, ...]
12 | # For lists, items can also be appended using:
13 | # TAG += value [value, ...]
14 | # Values that contain spaces should be placed between quotes (\" \").
15 | #
16 | # Note:
17 | #
18 | # Use doxygen to compare the used configuration file with the template
19 | # configuration file:
20 | # doxygen -x [configFile]
21 | # Use doxygen to compare the used configuration file with the template
22 | # configuration file without replacing the environment variables or CMake type
23 | # replacement variables:
24 | # doxygen -x_noenv [configFile]
25 | 
26 | #---------------------------------------------------------------------------
27 | # Project related configuration options
28 | #---------------------------------------------------------------------------
29 | 
30 | # This tag specifies the encoding used for all characters in the configuration
31 | # file that follow. The default is UTF-8 which is also the encoding used for all
32 | # text before the first occurrence of this tag. Doxygen uses libiconv (or the
33 | # iconv built into libc) for the transcoding. See
34 | # https://www.gnu.org/software/libiconv/ for the list of possible encodings.
35 | # The default value is: UTF-8.
36 | 
37 | DOXYFILE_ENCODING      = UTF-8
38 | 
39 | # The PROJECT_NAME tag is a single word (or a sequence of words surrounded by
40 | # double-quotes, unless you are using Doxywizard) that should identify the
41 | # project for which the documentation is generated. This name is used in the
42 | # title of most generated pages and in a few other places.
43 | # The default value is: My Project.
44 | 
45 | PROJECT_NAME           = "Ada"
46 | 
47 | # The PROJECT_NUMBER tag can be used to enter a project or revision number. This
48 | # could be handy for archiving the generated documentation or if some version
49 | # control system is used.
50 | 
51 | PROJECT_NUMBER         = "2.0.0"
52 | 
53 | # Using the PROJECT_BRIEF tag one can provide an optional one line description
54 | # for a project that appears at the top of each page and should give viewer a
55 | # quick idea about the purpose of the project. Keep the description short.
56 | 
57 | PROJECT_BRIEF          = "Spec-compliant URL parser"
58 | 
59 | # With the PROJECT_LOGO tag one can specify a logo or an icon that is included
60 | # in the documentation. The maximum height of the logo should not exceed 55
61 | # pixels and the maximum width should not exceed 200 pixels. Doxygen will copy
62 | # the logo to the output directory.
63 | 
64 | PROJECT_LOGO           =
65 | 
66 | # The OUTPUT_DIRECTORY tag is used to specify the (relative or absolute) path
67 | # into which the generated documentation will be written. If a relative path is
68 | # entered, it will be relative to the location where doxygen was started. If
69 | # left blank the current directory will be used.
70 | 
71 | OUTPUT_DIRECTORY       = "docs"
72 | 
73 | # If the CREATE_SUBDIRS tag is set to YES then doxygen will create up to 4096
74 | # sub-directories (in 2 levels) under the output directory of each output format
75 | # and will distribute the generated files over these directories. Enabling this
76 | # option can be useful when feeding doxygen a huge amount of source files, where
77 | # putting all generated files in the same directory would otherwise causes
78 | # performance problems for the file system. Adapt CREATE_SUBDIRS_LEVEL to
79 | # control the number of sub-directories.
80 | # The default value is: NO.
81 | 
82 | CREATE_SUBDIRS         = YES
83 | 


--------------------------------------------------------------------------------
/tools/release/lib/tests/samples/doxygen_expected.txt:
--------------------------------------------------------------------------------
 1 | # Doxyfile 1.9.6
 2 | 
 3 | # This file describes the settings to be used by the documentation system
 4 | # doxygen (www.doxygen.org) for a project.
 5 | #
 6 | # All text after a double hash (##) is considered a comment and is placed in
 7 | # front of the TAG it is preceding.
 8 | #
 9 | # All text after a single hash (#) is considered a comment and will be ignored.
10 | # The format is:
11 | # TAG = value [value, ...]
12 | # For lists, items can also be appended using:
13 | # TAG += value [value, ...]
14 | # Values that contain spaces should be placed between quotes (\" \").
15 | #
16 | # Note:
17 | #
18 | # Use doxygen to compare the used configuration file with the template
19 | # configuration file:
20 | # doxygen -x [configFile]
21 | # Use doxygen to compare the used configuration file with the template
22 | # configuration file without replacing the environment variables or CMake type
23 | # replacement variables:
24 | # doxygen -x_noenv [configFile]
25 | 
26 | #---------------------------------------------------------------------------
27 | # Project related configuration options
28 | #---------------------------------------------------------------------------
29 | 
30 | # This tag specifies the encoding used for all characters in the configuration
31 | # file that follow. The default is UTF-8 which is also the encoding used for all
32 | # text before the first occurrence of this tag. Doxygen uses libiconv (or the
33 | # iconv built into libc) for the transcoding. See
34 | # https://www.gnu.org/software/libiconv/ for the list of possible encodings.
35 | # The default value is: UTF-8.
36 | 
37 | DOXYFILE_ENCODING      = UTF-8
38 | 
39 | # The PROJECT_NAME tag is a single word (or a sequence of words surrounded by
40 | # double-quotes, unless you are using Doxywizard) that should identify the
41 | # project for which the documentation is generated. This name is used in the
42 | # title of most generated pages and in a few other places.
43 | # The default value is: My Project.
44 | 
45 | PROJECT_NAME           = "Ada"
46 | 
47 | # The PROJECT_NUMBER tag can be used to enter a project or revision number. This
48 | # could be handy for archiving the generated documentation or if some version
49 | # control system is used.
50 | 
51 | PROJECT_NUMBER         = "2.0.0"
52 | 
53 | # Using the PROJECT_BRIEF tag one can provide an optional one line description
54 | # for a project that appears at the top of each page and should give viewer a
55 | # quick idea about the purpose of the project. Keep the description short.
56 | 
57 | PROJECT_BRIEF          = "Spec-compliant URL parser"
58 | 
59 | # With the PROJECT_LOGO tag one can specify a logo or an icon that is included
60 | # in the documentation. The maximum height of the logo should not exceed 55
61 | # pixels and the maximum width should not exceed 200 pixels. Doxygen will copy
62 | # the logo to the output directory.
63 | 
64 | PROJECT_LOGO           =
65 | 
66 | # The OUTPUT_DIRECTORY tag is used to specify the (relative or absolute) path
67 | # into which the generated documentation will be written. If a relative path is
68 | # entered, it will be relative to the location where doxygen was started. If
69 | # left blank the current directory will be used.
70 | 
71 | OUTPUT_DIRECTORY       = "docs"
72 | 
73 | # If the CREATE_SUBDIRS tag is set to YES then doxygen will create up to 4096
74 | # sub-directories (in 2 levels) under the output directory of each output format
75 | # and will distribute the generated files over these directories. Enabling this
76 | # option can be useful when feeding doxygen a huge amount of source files, where
77 | # putting all generated files in the same directory would otherwise causes
78 | # performance problems for the file system. Adapt CREATE_SUBDIRS_LEVEL to
79 | # control the number of sub-directories.
80 | # The default value is: NO.
81 | 
82 | CREATE_SUBDIRS         = YES
83 | 


--------------------------------------------------------------------------------
/tools/release/lib/tests/test_update_versions.py:
--------------------------------------------------------------------------------
 1 | from .. import versions
 2 | import os
 3 | 
 4 | 
 5 | def test_update_cmakelists_version() -> None:
 6 |     current_dir = os.path.dirname(os.path.abspath(__file__))
 7 |     sample_path = f'{current_dir}/samples/cmakelists.txt'
 8 |     sample_expected_path = f'{current_dir}/samples/cmakelists_expected.txt'
 9 | 
10 |     versions.update_cmakelists_version('2.0.0', sample_path)
11 | 
12 |     with open(sample_path, 'r') as cmake:
13 |         given = cmake.read()
14 | 
15 |     with open(sample_expected_path, 'r') as cmake_expected:
16 |         expected = cmake_expected.read()
17 | 
18 |     assert given == expected
19 |     versions.update_cmakelists_version('1.0.0', sample_path)  # cleanup
20 | 
21 | 
def test_update_ada_version_h() -> None:
    """Bumping the version-header sample to 2.0.0 must match the expected sample.

    The sample is rewritten in place, so it is reset to 1.0.0 in a ``finally``
    block: a failing assertion must not leave the fixture modified for later
    runs.
    """
    current_dir = os.path.dirname(os.path.abspath(__file__))
    sample_path = f'{current_dir}/samples/ada_version_h.txt'
    sample_expected_path = f'{current_dir}/samples/ada_version_h_expected.txt'

    versions.update_ada_version_h('2.0.0', sample_path)
    try:
        with open(sample_path, 'r') as ada_version_h:
            given = ada_version_h.read()

        with open(sample_expected_path, 'r') as ada_version_h_expected:
            expected = ada_version_h_expected.read()

        assert given == expected
    finally:
        versions.update_ada_version_h('1.0.0', sample_path)  # cleanup
37 | 
38 | 
def test_update_doxygen_version() -> None:
    """``update_doxygen_version`` must rewrite PROJECT_NUMBER in the sample.

    The sample is first moved to 1.0.0 so that the test does not depend on the
    version the fixture happens to contain, then bumped to 2.0.0 and compared
    with the expected sample. The fixture's original content is restored
    verbatim afterwards, whether or not the assertions pass.
    """
    current_dir = os.path.dirname(os.path.abspath(__file__))
    sample_path = f'{current_dir}/samples/doxygen.txt'
    sample_expected_path = f'{current_dir}/samples/doxygen_expected.txt'

    # newline='' keeps line endings untouched so the restore is exact.
    with open(sample_path, 'r', newline='') as doxygen:
        original = doxygen.read()

    with open(sample_expected_path, 'r') as doxygen_expected:
        expected = doxygen_expected.read()

    try:
        versions.update_doxygen_version('1.0.0', sample_path)
        with open(sample_path, 'r') as doxygen:
            downgraded = doxygen.read()
        assert downgraded != expected

        versions.update_doxygen_version('2.0.0', sample_path)
        with open(sample_path, 'r') as doxygen:
            given = doxygen.read()
        assert given == expected
    finally:
        with open(sample_path, 'w', newline='') as doxygen:  # cleanup
            doxygen.write(original)
54 | 


--------------------------------------------------------------------------------
/tools/release/lib/versions.py:
--------------------------------------------------------------------------------
 1 | #!/usr/bin/env python3
 2 | 
 3 | import fileinput
 4 | import re
 5 | 
 6 | 
 7 | def update_cmakelists_version(new_version: str, file_path: str) -> None:
 8 |     inside_project = False
 9 |     with fileinput.FileInput(file_path, inplace=True) as cmakelists:
10 |         for line in cmakelists:
11 |             if 'set(ADA_LIB_VERSION' in line:
12 |                 line = re.sub(r'[0-9]+\.[0-9]+\.[0-9]+', new_version, line)
13 |             elif 'set(ADA_LIB_SOVERSION' in line:
14 |                 line = re.sub(r'[0-9]+', new_version.split('.')[0], line)
15 | 
16 |             elif 'project(' in line:
17 |                 inside_project = True
18 |             elif inside_project:
19 |                 if 'VERSION' in line:
20 |                     line = re.sub(r'[0-9]+\.[0-9]+\.[0-9]+', new_version, line)
21 |                     inside_project = False
22 |             print(line, end='')
23 | 
24 | 
def update_ada_version_h(new_version: str, file_path: str) -> None:
    """Rewrite the version numbers of an ``ada_version.h`` style header in place.

    The ``#define ADA_VERSION`` line is replaced with one carrying
    ``new_version``. After the first ``enum {`` line, the numbers on the lines
    starting with ``ADA_VERSION_MAJOR``, ``ADA_VERSION_MINOR`` and
    ``ADA_VERSION_REVISION`` are replaced with the first, second and third
    component of ``new_version``.

    Args:
        new_version: dotted version string with at least three components,
            e.g. ``'2.0.0'``.
        file_path: path of the header to rewrite.

    Raises:
        ValueError: if ``new_version`` has fewer than three components. This
            is checked before the file is opened: failing in the middle of an
            in-place rewrite would leave the header truncated.
    """
    new_version_list = new_version.split('.')
    if len(new_version_list) < 3:
        raise ValueError(
            f'Version must have at least three components (major.minor.revision): {new_version!r}'
        )

    # With inplace=True, everything printed inside the loop becomes the new
    # content of the file.
    with fileinput.FileInput(file_path, inplace=True) as ada_version_h:
        inside_enum = False
        for line in ada_version_h:
            if '#define ADA_VERSION' in line:
                line = f'#define ADA_VERSION "{new_version}"\n'

            elif 'enum {' in line:
                inside_enum = True
            elif inside_enum:
                if line.strip().startswith('ADA_VERSION_MAJOR'):
                    line = re.sub(r'\d+', new_version_list[0], line)
                elif line.strip().startswith('ADA_VERSION_MINOR'):
                    line = re.sub(r'\d+', new_version_list[1], line)
                elif line.strip().startswith('ADA_VERSION_REVISION'):
                    line = re.sub(r'\d+', new_version_list[2], line)

            print(line, end='')
44 | 
45 | 
def update_doxygen_version(new_version: str, file_path: str) -> None:
    """Rewrite the ``PROJECT_NUMBER`` setting of a Doxygen config file in place.

    Every line whose first token is ``PROJECT_NUMBER`` followed by ``=`` is
    replaced with ``PROJECT_NUMBER         = "<new_version>"``. Any amount of
    whitespace is accepted around the ``=``, so the setting is still found
    when the file uses a different column alignment.

    Args:
        new_version: version string to store, e.g. ``'2.0.0'``.
        file_path: path of the Doxygen configuration file to rewrite.
    """
    # With inplace=True, everything printed inside the loop becomes the new
    # content of the file.
    with fileinput.FileInput(file_path, inplace=True) as doxygen:
        for line in doxygen:
            if re.match(r'\s*PROJECT_NUMBER\s*=', line):
                line = f'PROJECT_NUMBER         = "{new_version}"\n'

            print(line, end='')
53 | 


--------------------------------------------------------------------------------
/tools/release/requirements.txt:
--------------------------------------------------------------------------------
1 | PyGithub==2.6.1
2 | pytest==8.3.5
3 | 


--------------------------------------------------------------------------------
/tools/release/update_versions.py:
--------------------------------------------------------------------------------
 1 | #!/usr/bin/env python3
 2 | 
 3 | import os
 4 | import lib.versions as update_versions
 5 | from lib.release import is_valid_tag
 6 | 
 7 | WORK_DIR = os.path.dirname(os.path.abspath(__file__)).replace('/tools/release', '')
 8 | 
 9 | ADA_VERSION_H = f'{WORK_DIR}/include/ada/ada_version.h'
10 | DOXYGEN = f'{WORK_DIR}/doxygen'
11 | CMAKE_LISTS = f'{WORK_DIR}/CMakeLists.txt'
12 | 
13 | NEXT_TAG = os.environ['NEXT_RELEASE_TAG']
14 | if not NEXT_TAG or not is_valid_tag(NEXT_TAG):
15 |     raise Exception(f'Bad environment variables. Invalid NEXT_RELEASE_TAG {NEXT_TAG}.')
16 | 
17 | NEXT_TAG = NEXT_TAG[1:]  # from v1.0.0 to 1.0.0
18 | 
19 | update_versions.update_ada_version_h(NEXT_TAG, ADA_VERSION_H)
20 | update_versions.update_doxygen_version(NEXT_TAG, DOXYGEN)
21 | update_versions.update_cmakelists_version(NEXT_TAG, CMAKE_LISTS)
22 | 


--------------------------------------------------------------------------------
/tools/run-clangcldocker.sh:
--------------------------------------------------------------------------------
 1 | #!/usr/bin/env bash
 2 | set -e
 3 | COMMAND=$*
 4 | SCRIPTPATH="$( cd "$(dirname "$0")" ; pwd -P )"
 5 | MAINSOURCE=$SCRIPTPATH/..
 6 | ALL_ADA_FILES=$(cd $MAINSOURCE && git ls-tree --full-tree --name-only -r HEAD | grep -e ".*\.\(c\|h\|cc\|cpp\|hh\)\$")
 7 | 
 8 | if clang-format-17 --version  2>/dev/null | grep -qF 'version 17.'; then
 9 |   cd $MAINSOURCE; clang-format-17 --style=file --verbose -i "$@" $ALL_ADA_FILES
10 |   exit 0
11 | elif clang-format --version  2>/dev/null | grep -qF 'version 17.'; then
12 |   cd $MAINSOURCE; clang-format --style=file --verbose -i "$@" $ALL_ADA_FILES
13 |   exit 0
14 | fi
15 | echo "Trying to use docker"
16 | command -v docker >/dev/null 2>&1 || { echo >&2 "Please install docker. E.g., go to https://www.docker.com/products/docker-desktop Type 'docker' to diagnose the problem."; exit 1; }
17 | docker info >/dev/null 2>&1 || { echo >&2 "Docker server is not running? type 'docker info'."; exit 1; }
18 | 
19 | if [ -t 0 ]; then DOCKER_ARGS=-it; fi
20 | docker pull kszonek/clang-format-17
21 | 
22 | docker run --rm $DOCKER_ARGS -v "$MAINSOURCE":"$MAINSOURCE":Z  -w "$MAINSOURCE" -u "$(id -u $USER):$(id -g $USER)" kszonek/clang-format-17 --style=file --verbose -i "$@" $ALL_ADA_FILES
23 | 


--------------------------------------------------------------------------------
/tools/update-wpt.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/sh
 2 | set -e
 3 | 
 4 | TARGET_MODULE=$1
 5 | BASE_DIR=$(pwd)
 6 | WPT_DIR="$BASE_DIR/tests/wpt"
 7 | 
 8 | if [ "$#" -ne 1 ]; then
 9 |     echo "Usage: $0 <target_module>"
10 |     exit 1
11 | fi
12 | 
13 | WORKSPACE=$(mktemp -d 2> /dev/null || mktemp -d -t 'tmp')
14 | 
15 | cleanup () {
16 |   EXIT_CODE=$?
17 |   [ -d "$WORKSPACE" ] && rm -rf "$WORKSPACE"
18 |   exit $EXIT_CODE
19 | }
20 | 
21 | trap cleanup INT TERM EXIT
22 | 
23 | cd "$WORKSPACE"
24 | git clone \
25 |   --no-checkout \
26 |   --depth=1 \
27 |   --filter=blob:none \
28 |   --sparse \
29 |   https://github.com/web-platform-tests/wpt.git wpt
30 | cd wpt
31 | # Conditionally sparse-checkout based on TARGET_MODULE
32 | if [ "$TARGET_MODULE" = "url" ]; then
33 |   git sparse-checkout add "url/resources"
34 | elif [ "$TARGET_MODULE" = "urlpattern" ]; then
35 |   git sparse-checkout add "urlpattern/resources"
36 | else
37 |   echo "Invalid target module: $TARGET_MODULE. Must be 'url' or 'urlpattern'."
38 |   exit 1
39 | fi
40 | 
41 | git checkout
42 | 
43 | # Copy the appropriate resources based on the target module
44 | if [ "$TARGET_MODULE" = "url" ]; then
45 |   cp url/resources/*.json "$WPT_DIR"
46 | elif [ "$TARGET_MODULE" = "urlpattern" ]; then
47 |   cp urlpattern/resources/*.json "$WPT_DIR"
48 | fi
49 | 


--------------------------------------------------------------------------------