├── .github └── FUNDING.yml ├── .gitignore ├── CITATION.cff ├── CODE_OF_CONDUCT.md ├── LICENSE ├── README.md ├── assets ├── images │ ├── logo │ │ ├── opendrivelab.jpeg │ │ └── tubingen.jpeg │ ├── page │ │ ├── front_page.png │ │ ├── front_page_dark.png │ │ ├── galaxy.jpeg │ │ └── video_front_page.png │ ├── repo │ │ ├── drivelm_teaser.jpg │ │ ├── drivelm_timeline.jpg │ │ ├── drivelm_timeline_v2.jpg │ │ ├── drivelm_timeline_v3.jpg │ │ ├── paper_data.jpg │ │ ├── paper_data_comp.png │ │ ├── paper_model_pipeline.jpg │ │ ├── paper_qualitative.jpg │ │ ├── paper_teaser.jpg │ │ ├── point_1.png │ │ ├── point_2.png │ │ ├── point_3.png │ │ ├── title.jpg │ │ └── title_v2.jpg │ └── svg │ │ ├── 404.svg │ │ ├── dialog.svg │ │ ├── divider.svg │ │ ├── faq.svg │ │ ├── featured-light.svg │ │ ├── featured.svg │ │ ├── graphic-1.svg │ │ ├── graphic-2.svg │ │ ├── master-card-1.svg │ │ ├── pattern-lg-light.svg │ │ ├── pattern-lg.svg │ │ ├── pattern.svg │ │ ├── pin-light.svg │ │ ├── pin.svg │ │ ├── quotes.svg │ │ ├── shadow.svg │ │ └── visa-1.svg └── video │ ├── DriveLM.mp4 │ └── graph.mp4 ├── challenge ├── README.md ├── __init__.py ├── convert2llama.py ├── convert_data.py ├── data │ └── train_sample.json ├── evaluation.py ├── extract_data.py ├── gpt_eval.py ├── llama_adapter_v2_multimodal7b │ ├── README.md │ ├── data │ │ ├── dataset.py │ │ └── nuscenes │ │ │ └── samples │ │ │ ├── CAM_BACK │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_BACK__1537291002287558.jpg │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_BACK__1537291005187558.jpg │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_BACK__1537291010637558.jpg │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_BACK__1537291013637558.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_BACK__1533280036187525.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_BACK__1533280039187525.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_BACK__1533280042637525.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_BACK__1533280045137525.jpg │ │ │ └── n015-2018-08-03-15-00-36+0800__CAM_BACK__1533280048187525.jpg │ │ │ ├── CAM_BACK_LEFT │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_BACK_LEFT__1537291002297405.jpg │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_BACK_LEFT__1537291005197405.jpg │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_BACK_LEFT__1537291010647405.jpg │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_BACK_LEFT__1537291013647405.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_BACK_LEFT__1533280036197423.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_BACK_LEFT__1533280039197423.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_BACK_LEFT__1533280042647423.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_BACK_LEFT__1533280045147423.jpg │ │ │ └── n015-2018-08-03-15-00-36+0800__CAM_BACK_LEFT__1533280048197442.jpg │ │ │ ├── CAM_BACK_RIGHT │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_BACK_RIGHT__1537291002278113.jpg │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_BACK_RIGHT__1537291005178113.jpg │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_BACK_RIGHT__1537291010628113.jpg │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_BACK_RIGHT__1537291013628113.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_BACK_RIGHT__1533280036177893.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_BACK_RIGHT__1533280039177893.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_BACK_RIGHT__1533280042627893.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_BACK_RIGHT__1533280045127893.jpg │ │ │ └── n015-2018-08-03-15-00-36+0800__CAM_BACK_RIGHT__1533280048177893.jpg │ │ │ ├── CAM_FRONT │ │ │ ├── 
n008-2018-09-18-13-10-39-0400__CAM_FRONT__1537291002262404.jpg │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_FRONT__1537291005162404.jpg │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_FRONT__1537291010612404.jpg │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_FRONT__1537291013612404.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_FRONT__1533280036162460.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_FRONT__1533280039162460.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_FRONT__1533280042612460.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_FRONT__1533280045112460.jpg │ │ │ └── n015-2018-08-03-15-00-36+0800__CAM_FRONT__1533280048162460.jpg │ │ │ ├── CAM_FRONT_LEFT │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_FRONT_LEFT__1537291002254799.jpg │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_FRONT_LEFT__1537291005154799.jpg │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_FRONT_LEFT__1537291010604799.jpg │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_FRONT_LEFT__1537291013604799.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_FRONT_LEFT__1533280036154844.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_FRONT_LEFT__1533280039154844.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_FRONT_LEFT__1533280042604844.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_FRONT_LEFT__1533280045104844.jpg │ │ │ └── n015-2018-08-03-15-00-36+0800__CAM_FRONT_LEFT__1533280048154844.jpg │ │ │ └── CAM_FRONT_RIGHT │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_FRONT_RIGHT__1537291002270482.jpg │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_FRONT_RIGHT__1537291005170482.jpg │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_FRONT_RIGHT__1537291010620482.jpg │ │ │ ├── n008-2018-09-18-13-10-39-0400__CAM_FRONT_RIGHT__1537291013620482.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_FRONT_RIGHT__1533280036170339.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_FRONT_RIGHT__1533280039170339.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_FRONT_RIGHT__1533280042620339.jpg │ │ │ ├── n015-2018-08-03-15-00-36+0800__CAM_FRONT_RIGHT__1533280045120339.jpg │ │ │ └── n015-2018-08-03-15-00-36+0800__CAM_FRONT_RIGHT__1533280048170339.jpg │ ├── demo.py │ ├── docs │ │ ├── eval.md │ │ └── train.md │ ├── engine_finetune.py │ ├── engine_pretrain.py │ ├── exps │ │ ├── finetune.sh │ │ └── pretrain.sh │ ├── finetune_data_config.yaml │ ├── gradio_app.py │ ├── llama │ │ ├── __init__.py │ │ ├── llama.py │ │ ├── llama_adapter.py │ │ ├── tokenizer.py │ │ └── utils.py │ ├── main_finetune.py │ ├── main_pretrain.py │ ├── requirements.txt │ └── util │ │ ├── evaluate_mme.py │ │ ├── extract_adapter_from_checkpoint.py │ │ ├── lr_sched.py │ │ └── misc.py ├── output.json ├── prepare_submission.py ├── submission.json ├── test.json ├── test_eval.json └── test_llama.json ├── docs ├── data_details.md ├── data_prep_nus.md └── gvqa.md ├── environment.yml ├── index.html └── sample.html /.github/FUNDING.yml: -------------------------------------------------------------------------------- 1 | # These are supported funding model platforms 2 | 3 | github: [OpenDriveLab] # Replace with up to 4 GitHub Sponsors-enabled usernames e.g., [user1, user2] 4 | patreon: # Replace with a single Patreon username 5 | open_collective: # Replace with a single Open Collective username 6 | ko_fi: # Replace with a single Ko-fi username 7 | tidelift: # Replace with a single Tidelift platform-name/package-name e.g., npm/babel 8 | community_bridge: # Replace with a single Community Bridge project-name e.g., cloud-foundry 9 | liberapay: # Replace with a single Liberapay username 10 | issuehunt: # Replace 
with a single IssueHunt username 11 | otechie: # Replace with a single Otechie username 12 | lfx_crowdfunding: # Replace with a single LFX Crowdfunding project-name e.g., cloud-foundry 13 | custom: # Replace with up to 4 custom sponsorship URLs e.g., ['link1', 'link2'] 14 | -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- 1 | # Byte-compiled / optimized / DLL files 2 | __pycache__/ 3 | *.py[cod] 4 | *$py.class 5 | 6 | # C extensions 7 | *.so 8 | 9 | # Distribution / packaging 10 | .Python 11 | build/ 12 | develop-eggs/ 13 | dist/ 14 | downloads/ 15 | eggs/ 16 | .eggs/ 17 | lib/ 18 | lib64/ 19 | parts/ 20 | sdist/ 21 | var/ 22 | wheels/ 23 | share/python-wheels/ 24 | *.egg-info/ 25 | .installed.cfg 26 | *.egg 27 | MANIFEST 28 | 29 | # PyInstaller 30 | # Usually these files are written by a python script from a template 31 | # before PyInstaller builds the exe, so as to inject date/other infos into it. 32 | *.manifest 33 | *.spec 34 | 35 | # Installer logs 36 | pip-log.txt 37 | pip-delete-this-directory.txt 38 | 39 | # Unit test / coverage reports 40 | htmlcov/ 41 | .tox/ 42 | .nox/ 43 | .coverage 44 | .coverage.* 45 | .cache 46 | nosetests.xml 47 | coverage.xml 48 | *.cover 49 | *.py,cover 50 | .hypothesis/ 51 | .pytest_cache/ 52 | cover/ 53 | 54 | # Translations 55 | *.mo 56 | *.pot 57 | 58 | # Django stuff: 59 | *.log 60 | local_settings.py 61 | db.sqlite3 62 | db.sqlite3-journal 63 | 64 | # Flask stuff: 65 | instance/ 66 | .webassets-cache 67 | 68 | # Scrapy stuff: 69 | .scrapy 70 | 71 | # Sphinx documentation 72 | docs/_build/ 73 | 74 | # PyBuilder 75 | .pybuilder/ 76 | target/ 77 | 78 | # Jupyter Notebook 79 | .ipynb_checkpoints 80 | 81 | # IPython 82 | profile_default/ 83 | ipython_config.py 84 | 85 | # pyenv 86 | # For a library or package, you might want to ignore these files since the code is 87 | # intended to run in multiple environments; otherwise, check them in: 88 | # .python-version 89 | 90 | # pipenv 91 | # According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control. 92 | # However, in case of collaboration, if having platform-specific dependencies or dependencies 93 | # having no cross-platform support, pipenv may install dependencies that don't work, or not 94 | # install all needed dependencies. 95 | #Pipfile.lock 96 | 97 | # poetry 98 | # Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control. 99 | # This is especially recommended for binary packages to ensure reproducibility, and is more 100 | # commonly ignored for libraries. 101 | # https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control 102 | #poetry.lock 103 | 104 | # pdm 105 | # Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control. 106 | #pdm.lock 107 | # pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it 108 | # in version control. 109 | # https://pdm.fming.dev/#use-with-ide 110 | .pdm.toml 111 | 112 | # PEP 582; used by e.g. 
github.com/David-OConnor/pyflow and github.com/pdm-project/pdm 113 | __pypackages__/ 114 | 115 | # Celery stuff 116 | celerybeat-schedule 117 | celerybeat.pid 118 | 119 | # SageMath parsed files 120 | *.sage.py 121 | 122 | # Environments 123 | .env 124 | .venv 125 | env/ 126 | venv/ 127 | ENV/ 128 | env.bak/ 129 | venv.bak/ 130 | 131 | # Spyder project settings 132 | .spyderproject 133 | .spyproject 134 | 135 | # Rope project settings 136 | .ropeproject 137 | 138 | # mkdocs documentation 139 | /site 140 | 141 | # mypy 142 | .mypy_cache/ 143 | .dmypy.json 144 | dmypy.json 145 | 146 | # Pyre type checker 147 | .pyre/ 148 | 149 | # pytype static type analyzer 150 | .pytype/ 151 | 152 | # Cython debug symbols 153 | cython_debug/ 154 | 155 | # PyCharm 156 | # JetBrains specific template is maintained in a separate JetBrains.gitignore that can 157 | # be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore 158 | # and can be added to the global gitignore or merged into this file. For a more nuclear 159 | # option (not recommended) you can uncomment the following to ignore the entire idea folder. 160 | #.idea/ 161 | .DS_Store 162 | -------------------------------------------------------------------------------- /CITATION.cff: -------------------------------------------------------------------------------- 1 | cff-version: 1.2.0 2 | message: "If you use this software, please cite it as below." 3 | authors: 4 | - name: "DriveLM Contributors" 5 | title: "Drive on Language" 6 | date-released: 2023-08-25 7 | url: "https://github.com/OpenDriveLab/DriveLM/" 8 | license: Apache-2.0 -------------------------------------------------------------------------------- /CODE_OF_CONDUCT.md: -------------------------------------------------------------------------------- 1 | # Contributor Covenant Code of Conduct 2 | 3 | ## Our Pledge 4 | 5 | We as members, contributors, and leaders pledge to make participation in our 6 | community a harassment-free experience for everyone, regardless of age, body 7 | size, visible or invisible disability, ethnicity, sex characteristics, gender 8 | identity and expression, level of experience, education, socio-economic status, 9 | nationality, personal appearance, race, religion, or sexual identity 10 | and orientation. 11 | 12 | We pledge to act and interact in ways that contribute to an open, welcoming, 13 | diverse, inclusive, and healthy community. 
14 | 15 | ## Our Standards 16 | 17 | Examples of behavior that contributes to a positive environment for our 18 | community include: 19 | 20 | * Demonstrating empathy and kindness toward other people 21 | * Being respectful of differing opinions, viewpoints, and experiences 22 | * Giving and gracefully accepting constructive feedback 23 | * Accepting responsibility and apologizing to those affected by our mistakes, 24 | and learning from the experience 25 | * Focusing on what is best not just for us as individuals, but for the 26 | overall community 27 | 28 | Examples of unacceptable behavior include: 29 | 30 | * The use of sexualized language or imagery, and sexual attention or 31 | advances of any kind 32 | * Trolling, insulting or derogatory comments, and personal or political attacks 33 | * Public or private harassment 34 | * Publishing others' private information, such as a physical or email 35 | address, without their explicit permission 36 | * Other conduct which could reasonably be considered inappropriate in a 37 | professional setting 38 | 39 | ## Enforcement Responsibilities 40 | 41 | Community leaders are responsible for clarifying and enforcing our standards of 42 | acceptable behavior and will take appropriate and fair corrective action in 43 | response to any behavior that they deem inappropriate, threatening, offensive, 44 | or harmful. 45 | 46 | Community leaders have the right and responsibility to remove, edit, or reject 47 | comments, commits, code, wiki edits, issues, and other contributions that are 48 | not aligned to this Code of Conduct, and will communicate reasons for moderation 49 | decisions when appropriate. 50 | 51 | ## Scope 52 | 53 | This Code of Conduct applies within all community spaces, and also applies when 54 | an individual is officially representing the community in public spaces. 55 | Examples of representing our community include using an official e-mail address, 56 | posting via an official social media account, or acting as an appointed 57 | representative at an online or offline event. 58 | 59 | ## Enforcement 60 | 61 | Instances of abusive, harassing, or otherwise unacceptable behavior may be 62 | reported to the community leaders responsible for enforcement at contact@opendrivelab.com 63 | 64 | All complaints will be reviewed and investigated promptly and fairly. 65 | 66 | All community leaders are obligated to respect the privacy and security of the 67 | reporter of any incident. 68 | 69 | ## Enforcement Guidelines 70 | 71 | Community leaders will follow these Community Impact Guidelines in determining 72 | the consequences for any action they deem in violation of this Code of Conduct: 73 | 74 | ### 1. Correction 75 | 76 | **Community Impact**: Use of inappropriate language or other behavior deemed 77 | unprofessional or unwelcome in the community. 78 | 79 | **Consequence**: A private, written warning from community leaders, providing 80 | clarity around the nature of the violation and an explanation of why the 81 | behavior was inappropriate. A public apology may be requested. 82 | 83 | ### 2. Warning 84 | 85 | **Community Impact**: A violation through a single incident or series 86 | of actions. 87 | 88 | **Consequence**: A warning with consequences for continued behavior. No 89 | interaction with the people involved, including unsolicited interaction with 90 | those enforcing the Code of Conduct, for a specified period of time. 
This 91 | includes avoiding interactions in community spaces as well as external channels 92 | like social media. Violating these terms may lead to a temporary or 93 | permanent ban. 94 | 95 | ### 3. Temporary Ban 96 | 97 | **Community Impact**: A serious violation of community standards, including 98 | sustained inappropriate behavior. 99 | 100 | **Consequence**: A temporary ban from any sort of interaction or public 101 | communication with the community for a specified period of time. No public or 102 | private interaction with the people involved, including unsolicited interaction 103 | with those enforcing the Code of Conduct, is allowed during this period. 104 | Violating these terms may lead to a permanent ban. 105 | 106 | ### 4. Permanent Ban 107 | 108 | **Community Impact**: Demonstrating a pattern of violation of community 109 | standards, including sustained inappropriate behavior, harassment of an 110 | individual, or aggression toward or disparagement of classes of individuals. 111 | 112 | **Consequence**: A permanent ban from any sort of public interaction within 113 | the community. 114 | 115 | ## Attribution 116 | 117 | This Code of Conduct is adapted from the [Contributor Covenant][homepage], 118 | version 2.0, available at 119 | https://www.contributor-covenant.org/version/2/0/code_of_conduct.html. 120 | 121 | Community Impact Guidelines were inspired by [Mozilla's code of conduct 122 | enforcement ladder](https://github.com/mozilla/diversity). 123 | 124 | [homepage]: https://www.contributor-covenant.org 125 | 126 | For answers to common questions about this code of conduct, see the FAQ at 127 | https://www.contributor-covenant.org/faq. Translations are available at 128 | https://www.contributor-covenant.org/translations. -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | Apache License 2 | Version 2.0, January 2004 3 | http://www.apache.org/licenses/ 4 | 5 | TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION 6 | 7 | 1. Definitions. 8 | 9 | "License" shall mean the terms and conditions for use, reproduction, 10 | and distribution as defined by Sections 1 through 9 of this document. 11 | 12 | "Licensor" shall mean the copyright owner or entity authorized by 13 | the copyright owner that is granting the License. 14 | 15 | "Legal Entity" shall mean the union of the acting entity and all 16 | other entities that control, are controlled by, or are under common 17 | control with that entity. For the purposes of this definition, 18 | "control" means (i) the power, direct or indirect, to cause the 19 | direction or management of such entity, whether by contract or 20 | otherwise, or (ii) ownership of fifty percent (50%) or more of the 21 | outstanding shares, or (iii) beneficial ownership of such entity. 22 | 23 | "You" (or "Your") shall mean an individual or Legal Entity 24 | exercising permissions granted by this License. 25 | 26 | "Source" form shall mean the preferred form for making modifications, 27 | including but not limited to software source code, documentation 28 | source, and configuration files. 29 | 30 | "Object" form shall mean any form resulting from mechanical 31 | transformation or translation of a Source form, including but 32 | not limited to compiled object code, generated documentation, 33 | and conversions to other media types. 
34 | 35 | "Work" shall mean the work of authorship, whether in Source or 36 | Object form, made available under the License, as indicated by a 37 | copyright notice that is included in or attached to the work 38 | (an example is provided in the Appendix below). 39 | 40 | "Derivative Works" shall mean any work, whether in Source or Object 41 | form, that is based on (or derived from) the Work and for which the 42 | editorial revisions, annotations, elaborations, or other modifications 43 | represent, as a whole, an original work of authorship. For the purposes 44 | of this License, Derivative Works shall not include works that remain 45 | separable from, or merely link (or bind by name) to the interfaces of, 46 | the Work and Derivative Works thereof. 47 | 48 | "Contribution" shall mean any work of authorship, including 49 | the original version of the Work and any modifications or additions 50 | to that Work or Derivative Works thereof, that is intentionally 51 | submitted to Licensor for inclusion in the Work by the copyright owner 52 | or by an individual or Legal Entity authorized to submit on behalf of 53 | the copyright owner. For the purposes of this definition, "submitted" 54 | means any form of electronic, verbal, or written communication sent 55 | to the Licensor or its representatives, including but not limited to 56 | communication on electronic mailing lists, source code control systems, 57 | and issue tracking systems that are managed by, or on behalf of, the 58 | Licensor for the purpose of discussing and improving the Work, but 59 | excluding communication that is conspicuously marked or otherwise 60 | designated in writing by the copyright owner as "Not a Contribution." 61 | 62 | "Contributor" shall mean Licensor and any individual or Legal Entity 63 | on behalf of whom a Contribution has been received by Licensor and 64 | subsequently incorporated within the Work. 65 | 66 | 2. Grant of Copyright License. Subject to the terms and conditions of 67 | this License, each Contributor hereby grants to You a perpetual, 68 | worldwide, non-exclusive, no-charge, royalty-free, irrevocable 69 | copyright license to reproduce, prepare Derivative Works of, 70 | publicly display, publicly perform, sublicense, and distribute the 71 | Work and such Derivative Works in Source or Object form. 72 | 73 | 3. Grant of Patent License. Subject to the terms and conditions of 74 | this License, each Contributor hereby grants to You a perpetual, 75 | worldwide, non-exclusive, no-charge, royalty-free, irrevocable 76 | (except as stated in this section) patent license to make, have made, 77 | use, offer to sell, sell, import, and otherwise transfer the Work, 78 | where such license applies only to those patent claims licensable 79 | by such Contributor that are necessarily infringed by their 80 | Contribution(s) alone or by combination of their Contribution(s) 81 | with the Work to which such Contribution(s) was submitted. If You 82 | institute patent litigation against any entity (including a 83 | cross-claim or counterclaim in a lawsuit) alleging that the Work 84 | or a Contribution incorporated within the Work constitutes direct 85 | or contributory patent infringement, then any patent licenses 86 | granted to You under this License for that Work shall terminate 87 | as of the date such litigation is filed. 88 | 89 | 4. Redistribution. 
You may reproduce and distribute copies of the 90 | Work or Derivative Works thereof in any medium, with or without 91 | modifications, and in Source or Object form, provided that You 92 | meet the following conditions: 93 | 94 | (a) You must give any other recipients of the Work or 95 | Derivative Works a copy of this License; and 96 | 97 | (b) You must cause any modified files to carry prominent notices 98 | stating that You changed the files; and 99 | 100 | (c) You must retain, in the Source form of any Derivative Works 101 | that You distribute, all copyright, patent, trademark, and 102 | attribution notices from the Source form of the Work, 103 | excluding those notices that do not pertain to any part of 104 | the Derivative Works; and 105 | 106 | (d) If the Work includes a "NOTICE" text file as part of its 107 | distribution, then any Derivative Works that You distribute must 108 | include a readable copy of the attribution notices contained 109 | within such NOTICE file, excluding those notices that do not 110 | pertain to any part of the Derivative Works, in at least one 111 | of the following places: within a NOTICE text file distributed 112 | as part of the Derivative Works; within the Source form or 113 | documentation, if provided along with the Derivative Works; or, 114 | within a display generated by the Derivative Works, if and 115 | wherever such third-party notices normally appear. The contents 116 | of the NOTICE file are for informational purposes only and 117 | do not modify the License. You may add Your own attribution 118 | notices within Derivative Works that You distribute, alongside 119 | or as an addendum to the NOTICE text from the Work, provided 120 | that such additional attribution notices cannot be construed 121 | as modifying the License. 122 | 123 | You may add Your own copyright statement to Your modifications and 124 | may provide additional or different license terms and conditions 125 | for use, reproduction, or distribution of Your modifications, or 126 | for any such Derivative Works as a whole, provided Your use, 127 | reproduction, and distribution of the Work otherwise complies with 128 | the conditions stated in this License. 129 | 130 | 5. Submission of Contributions. Unless You explicitly state otherwise, 131 | any Contribution intentionally submitted for inclusion in the Work 132 | by You to the Licensor shall be under the terms and conditions of 133 | this License, without any additional terms or conditions. 134 | Notwithstanding the above, nothing herein shall supersede or modify 135 | the terms of any separate license agreement you may have executed 136 | with Licensor regarding such Contributions. 137 | 138 | 6. Trademarks. This License does not grant permission to use the trade 139 | names, trademarks, service marks, or product names of the Licensor, 140 | except as required for reasonable and customary use in describing the 141 | origin of the Work and reproducing the content of the NOTICE file. 142 | 143 | 7. Disclaimer of Warranty. Unless required by applicable law or 144 | agreed to in writing, Licensor provides the Work (and each 145 | Contributor provides its Contributions) on an "AS IS" BASIS, 146 | WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or 147 | implied, including, without limitation, any warranties or conditions 148 | of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A 149 | PARTICULAR PURPOSE. 
You are solely responsible for determining the 150 | appropriateness of using or redistributing the Work and assume any 151 | risks associated with Your exercise of permissions under this License. 152 | 153 | 8. Limitation of Liability. In no event and under no legal theory, 154 | whether in tort (including negligence), contract, or otherwise, 155 | unless required by applicable law (such as deliberate and grossly 156 | negligent acts) or agreed to in writing, shall any Contributor be 157 | liable to You for damages, including any direct, indirect, special, 158 | incidental, or consequential damages of any character arising as a 159 | result of this License or out of the use or inability to use the 160 | Work (including but not limited to damages for loss of goodwill, 161 | work stoppage, computer failure or malfunction, or any and all 162 | other commercial damages or losses), even if such Contributor 163 | has been advised of the possibility of such damages. 164 | 165 | 9. Accepting Warranty or Additional Liability. While redistributing 166 | the Work or Derivative Works thereof, You may choose to offer, 167 | and charge a fee for, acceptance of support, warranty, indemnity, 168 | or other liability obligations and/or rights consistent with this 169 | License. However, in accepting such obligations, You may act only 170 | on Your own behalf and on Your sole responsibility, not on behalf 171 | of any other Contributor, and only if You agree to indemnify, 172 | defend, and hold each Contributor harmless for any liability 173 | incurred by, or claims asserted against, such Contributor by reason 174 | of your accepting any such warranty or additional liability. 175 | 176 | END OF TERMS AND CONDITIONS 177 | 178 | APPENDIX: How to apply the Apache License to your work. 179 | 180 | To apply the Apache License to your work, attach the following 181 | boilerplate notice, with the fields enclosed by brackets "[]" 182 | replaced with your own identifying information. (Don't include 183 | the brackets!) The text should be enclosed in the appropriate 184 | comment syntax for the file format. We also recommend that a 185 | file or class name and description of purpose be included on the 186 | same "printed page" as the copyright notice for easier 187 | identification within third-party archives. 188 | 189 | Copyright [yyyy] [name of copyright owner] 190 | 191 | Licensed under the Apache License, Version 2.0 (the "License"); 192 | you may not use this file except in compliance with the License. 193 | You may obtain a copy of the License at 194 | 195 | http://www.apache.org/licenses/LICENSE-2.0 196 | 197 | Unless required by applicable law or agreed to in writing, software 198 | distributed under the License is distributed on an "AS IS" BASIS, 199 | WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 200 | See the License for the specific language governing permissions and 201 | limitations under the License. 
202 | -------------------------------------------------------------------------------- /assets/images/logo/opendrivelab.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/assets/images/logo/opendrivelab.jpeg -------------------------------------------------------------------------------- /assets/images/logo/tubingen.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/assets/images/logo/tubingen.jpeg -------------------------------------------------------------------------------- /assets/images/page/front_page.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/assets/images/page/front_page.png -------------------------------------------------------------------------------- /assets/images/page/front_page_dark.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/assets/images/page/front_page_dark.png -------------------------------------------------------------------------------- /assets/images/page/galaxy.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/assets/images/page/galaxy.jpeg -------------------------------------------------------------------------------- /assets/images/page/video_front_page.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/assets/images/page/video_front_page.png -------------------------------------------------------------------------------- /assets/images/repo/drivelm_teaser.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/assets/images/repo/drivelm_teaser.jpg -------------------------------------------------------------------------------- /assets/images/repo/drivelm_timeline.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/assets/images/repo/drivelm_timeline.jpg -------------------------------------------------------------------------------- /assets/images/repo/drivelm_timeline_v2.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/assets/images/repo/drivelm_timeline_v2.jpg -------------------------------------------------------------------------------- /assets/images/repo/drivelm_timeline_v3.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/assets/images/repo/drivelm_timeline_v3.jpg -------------------------------------------------------------------------------- /assets/images/repo/paper_data.jpg: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/assets/images/repo/paper_data.jpg -------------------------------------------------------------------------------- /assets/images/repo/paper_data_comp.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/assets/images/repo/paper_data_comp.png -------------------------------------------------------------------------------- /assets/images/repo/paper_model_pipeline.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/assets/images/repo/paper_model_pipeline.jpg -------------------------------------------------------------------------------- /assets/images/repo/paper_qualitative.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/assets/images/repo/paper_qualitative.jpg -------------------------------------------------------------------------------- /assets/images/repo/paper_teaser.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/assets/images/repo/paper_teaser.jpg -------------------------------------------------------------------------------- /assets/images/repo/point_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/assets/images/repo/point_1.png -------------------------------------------------------------------------------- /assets/images/repo/point_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/assets/images/repo/point_2.png -------------------------------------------------------------------------------- /assets/images/repo/point_3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/assets/images/repo/point_3.png -------------------------------------------------------------------------------- /assets/images/repo/title.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/assets/images/repo/title.jpg -------------------------------------------------------------------------------- /assets/images/repo/title_v2.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/assets/images/repo/title_v2.jpg -------------------------------------------------------------------------------- /assets/images/svg/404.svg: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | -------------------------------------------------------------------------------- /assets/images/svg/dialog.svg: 
-------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | -------------------------------------------------------------------------------- /assets/images/svg/divider.svg: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 | 11 | -------------------------------------------------------------------------------- /assets/images/svg/faq.svg: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | -------------------------------------------------------------------------------- /assets/images/svg/featured-light.svg: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 | 11 | 12 | 13 | 14 | 15 | 16 | 17 | 18 | 19 | 20 | 21 | 22 | 23 | 24 | 25 | 26 | 27 | 28 | 29 | 30 | -------------------------------------------------------------------------------- /assets/images/svg/featured.svg: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 | 11 | 12 | 13 | 14 | 15 | 16 | 17 | 18 | 19 | 20 | 21 | 22 | 23 | 24 | 25 | 26 | 27 | 28 | 29 | 30 | -------------------------------------------------------------------------------- /assets/images/svg/graphic-1.svg: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 | 11 | 12 | 13 | 14 | 15 | 16 | 17 | 18 | 19 | 20 | 21 | 22 | 23 | -------------------------------------------------------------------------------- /assets/images/svg/graphic-2.svg: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 | 11 | 12 | 13 | 14 | 15 | 16 | 17 | 18 | 19 | 20 | 21 | 22 | 23 | -------------------------------------------------------------------------------- /assets/images/svg/master-card-1.svg: -------------------------------------------------------------------------------- 1 | mastercard-color -------------------------------------------------------------------------------- /assets/images/svg/pattern-lg-light.svg: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 | 11 | 12 | 13 | 14 | 15 | 16 | 17 | 18 | -------------------------------------------------------------------------------- /assets/images/svg/pattern-lg.svg: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 | 11 | 12 | 13 | 14 | 15 | 16 | 17 | 18 | -------------------------------------------------------------------------------- /assets/images/svg/pattern.svg: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 | 11 | 12 | 13 | 14 | 15 | -------------------------------------------------------------------------------- /assets/images/svg/pin-light.svg: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | -------------------------------------------------------------------------------- /assets/images/svg/pin.svg: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | -------------------------------------------------------------------------------- /assets/images/svg/quotes.svg: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 
-------------------------------------------------------------------------------- /assets/images/svg/shadow.svg: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 | 11 | 12 | 13 | -------------------------------------------------------------------------------- /assets/images/svg/visa-1.svg: -------------------------------------------------------------------------------- 1 | visa-color -------------------------------------------------------------------------------- /assets/video/DriveLM.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/assets/video/DriveLM.mp4 -------------------------------------------------------------------------------- /assets/video/graph.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/assets/video/graph.mp4 -------------------------------------------------------------------------------- /challenge/__init__.py: -------------------------------------------------------------------------------- 1 | from .gpt_eval import GPTEvaluation -------------------------------------------------------------------------------- /challenge/convert2llama.py: -------------------------------------------------------------------------------- 1 | import numpy as np 2 | import json 3 | 4 | 5 | def convert2llama(root, dst): 6 | with open(root, 'r') as f: 7 | test_file = json.load(f) 8 | 9 | output = [] 10 | for scene_id in test_file.keys(): 11 | scene_data = test_file[scene_id]['key_frames'] 12 | 13 | for frame_id in scene_data.keys(): 14 | image_paths = scene_data[frame_id]['image_paths'] 15 | image_paths = [image_paths[key].replace("..", "data") for key in image_paths.keys()] 16 | 17 | frame_data_qa = scene_data[frame_id]['QA'] 18 | QA_pairs = frame_data_qa["perception"] + frame_data_qa["prediction"] + frame_data_qa["planning"] + frame_data_qa["behavior"] 19 | 20 | for idx, qa in enumerate(QA_pairs): 21 | question = qa['Q'] 22 | answer = qa['A'] 23 | output.append( 24 | { 25 | "id": scene_id + "_" + frame_id + "_" + str(idx), 26 | "image": image_paths, 27 | "conversations": [ 28 | { 29 | "from": "human", 30 | "value": "\n" + question 31 | }, 32 | { 33 | "from": "gpt", 34 | "value": answer 35 | }, 36 | ] 37 | } 38 | ) 39 | 40 | with open(dst, 'w') as f: 41 | json.dump(output, f, indent=4) 42 | 43 | 44 | if __name__ == '__main__': 45 | root = "test_eval.json" 46 | dst = "test_llama.json" 47 | convert2llama(root, dst) 48 | -------------------------------------------------------------------------------- /challenge/convert_data.py: -------------------------------------------------------------------------------- 1 | import numpy as np 2 | import json 3 | import random 4 | 5 | 6 | def rule_based1(question, answer): 7 | rule = ["Going ahead.", "Turn right.", "Turn left.", "Stopped.", "Back up.", "Reverse parking.", "Drive backward."] 8 | rule.remove(answer) 9 | choices = random.sample(rule, 3) 10 | choices.append(answer) 11 | random.shuffle(choices) 12 | idx = choices.index(answer) 13 | question += f" Please select the correct answer from the following options: A. {choices[0]} B. {choices[1]} C. {choices[2]} D. 
{choices[3]}" 14 | mapping = {0: "A", 1: "B", 2: "C", 3: "D"} 15 | return {"Q": question, "A": mapping[idx]} 16 | 17 | def rule_based2(question, answer): 18 | rule = ['The ego vehicle is slightly steering to the left. The ego vehicle is driving very fast.', 'The ego vehicle is steering to the left. The ego vehicle is driving with normal speed.', 'The ego vehicle is steering to the left. The ego vehicle is driving fast.', 'The ego vehicle is slightly steering to the right. The ego vehicle is driving fast.', 'The ego vehicle is going straight. The ego vehicle is driving slowly.', 'The ego vehicle is going straight. The ego vehicle is driving with normal speed.', 'The ego vehicle is slightly steering to the left. The ego vehicle is driving with normal speed.', 'The ego vehicle is slightly steering to the left. The ego vehicle is driving slowly.', 'The ego vehicle is slightly steering to the right. The ego vehicle is driving slowly.', 'The ego vehicle is slightly steering to the right. The ego vehicle is driving very fast.', 'The ego vehicle is steering to the right. The ego vehicle is driving fast.', 'The ego vehicle is steering to the right. The ego vehicle is driving very fast.', 'The ego vehicle is slightly steering to the left. The ego vehicle is driving fast.', 'The ego vehicle is steering to the left. The ego vehicle is driving very fast.', 'The ego vehicle is going straight. The ego vehicle is not moving.', 'The ego vehicle is slightly steering to the right. The ego vehicle is driving with normal speed.', 'The ego vehicle is steering to the right. The ego vehicle is driving slowly.', 'The ego vehicle is steering to the right. The ego vehicle is driving with normal speed.', 'The ego vehicle is going straight. The ego vehicle is driving very fast.', 'The ego vehicle is going straight. The ego vehicle is driving fast.', 'The ego vehicle is steering to the left. The ego vehicle is driving slowly.'] 19 | rule.remove(answer) 20 | choices = random.sample(rule, 3) 21 | choices.append(answer) 22 | random.shuffle(choices) 23 | idx = choices.index(answer) 24 | question += f" Please select the correct answer from the following options: A. {choices[0]} B. {choices[1]} C. {choices[2]} D. 
{choices[3]}" 25 | mapping = {0: "A", 1: "B", 2: "C", 3: "D"} 26 | return {"Q": question, "A": mapping[idx]} 27 | 28 | 29 | def loop_test(root, dst): 30 | with open(root, 'r') as f: 31 | test_file = json.load(f) 32 | 33 | for scene_id in test_file.keys(): 34 | scene_data = test_file[scene_id]['key_frames'] 35 | 36 | for frame_id in scene_data.keys(): 37 | # frame_data_infos = scene_data[frame_id]['key_object_infos'] 38 | frame_data_qa = scene_data[frame_id]['QA'] 39 | image_paths = scene_data[frame_id]['image_paths'] 40 | 41 | test_file[scene_id]['key_frames'][frame_id] = dict() 42 | # test_file[scene_id]['key_frames'][frame_id]['key_object_infos'] = frame_data_infos 43 | test_file[scene_id]['key_frames'][frame_id]['QA'] = dict() 44 | test_file[scene_id]['key_frames'][frame_id]['QA']['perception'] = [] 45 | # add all prediction and planning 46 | test_file[scene_id]['key_frames'][frame_id]['QA']['prediction'] = frame_data_qa["prediction"] 47 | test_file[scene_id]['key_frames'][frame_id]['QA']['planning'] = frame_data_qa["planning"] 48 | 49 | test_file[scene_id]['key_frames'][frame_id]['QA']['behavior'] = [] 50 | test_file[scene_id]['key_frames'][frame_id]['image_paths'] = image_paths 51 | 52 | for qa in frame_data_qa["perception"]: 53 | question = qa['Q'] 54 | answer = qa['A'] 55 | if "What is the moving status of object".lower() in question.lower(): 56 | qa.update(rule_based1(question, answer)) 57 | test_file[scene_id]['key_frames'][frame_id]['QA']['perception'].append(qa) 58 | else: 59 | test_file[scene_id]['key_frames'][frame_id]['QA']['perception'].append(qa) 60 | 61 | for qa in frame_data_qa["behavior"]: 62 | question = qa['Q'] 63 | answer = qa['A'] 64 | qa.update(rule_based2(question, answer)) 65 | test_file[scene_id]['key_frames'][frame_id]['QA']['behavior'].append(qa) 66 | 67 | with open(dst, 'w') as f: 68 | json.dump(test_file, f, indent=4) 69 | 70 | 71 | 72 | if __name__ == '__main__': 73 | root = "test.json" 74 | dst = "test_eval.json" 75 | loop_test(root, dst) 76 | -------------------------------------------------------------------------------- /challenge/evaluation.py: -------------------------------------------------------------------------------- 1 | import re 2 | import argparse 3 | import json 4 | import numpy as np 5 | import torch.nn as nn 6 | import language_evaluation 7 | from multiprocessing import Pool 8 | 9 | import sys 10 | sys.path.append(".") 11 | from gpt_eval import GPTEvaluation 12 | 13 | 14 | class evaluation_suit(): 15 | def __init__(self): 16 | self.language_eval = language_evaluation.CocoEvaluator(coco_types=["BLEU", "ROUGE_L", "CIDEr"]) 17 | self.chatgpt_eval = GPTEvaluation() 18 | self.GPT = [] 19 | self.accuracy = {"answer": [], "GT": []} 20 | self.language = {"answer": [], "GT": []} 21 | self.match = {"match": {"answer": [], "GT": []}, "GPT": []} 22 | 23 | def eval_acc(self): 24 | scores = [] 25 | for i in range(len(self.accuracy["answer"])): 26 | answer = self.accuracy["answer"][i] 27 | GT = self.accuracy["GT"][i] 28 | if answer == GT: 29 | scores.append(1.0) 30 | else: 31 | scores.append(0.0) 32 | 33 | scores = sum(scores) / len(scores) 34 | return scores 35 | 36 | def eval_chatGPT(self, data): 37 | with Pool(32) as p: # Change the number based on your CPU cores 38 | scores = p.map(self.chatgpt_eval.forward, data) 39 | 40 | scores = list(map(float, scores)) 41 | scores = sum(scores) / len(scores) 42 | return scores 43 | 44 | def eval_language(self): 45 | """ 46 | return the dict evaluation results 47 | """ 48 | answer = self.language["answer"] 49 | GT 
= self.language["GT"] 50 | results_gen = self.language_eval.run_evaluation(answer, GT) 51 | results_gen_dict = { 52 | f"val/{k}": v for k, v in results_gen.items() 53 | } 54 | return results_gen_dict 55 | 56 | def eval_match(self): 57 | outs1 = [] 58 | for i in range(len(self.match["match"]["answer"])): 59 | answer = self.match["match"]["answer"][i] 60 | GT = self.match["match"]["GT"][i] 61 | _, F1_score = self.match_result(answer, GT) 62 | outs1.append(F1_score * 100) 63 | 64 | outs1 = sum(outs1) / len(outs1) 65 | outs2 = self.eval_chatGPT(self.match["GPT"]) 66 | scores = (outs1 + outs2) / 2.0 67 | return scores 68 | 69 | def eval_graph(self, question): 70 | # check if answer in self.graph 71 | question_nums = re.findall(r'\d+\.\d+', question) 72 | question_nums = np.array([list(map(float, x.split()))[0] for x in question_nums]).reshape(-1, 2) 73 | question_nums = [list(i) for i in question_nums] 74 | for q in question_nums: 75 | if q not in self.graph: 76 | return False 77 | return True 78 | 79 | def match_result(self, answer, GT): 80 | """ 81 | answer: [[1.,2.], [2., 3.]] 82 | GT: [[1., 2.], [2., 3.]] 83 | """ 84 | answer_nums = re.findall(r'\d+\.\d+', answer) 85 | GT_nums = re.findall(r'\d+\.\d+', GT) 86 | # transform string into float 87 | if len(answer_nums) % 2 != 0: 88 | answer_nums = answer_nums[:-1] 89 | answer_nums = np.array([list(map(float, x.split()))[0] for x in answer_nums]).reshape(-1, 2) 90 | GT_nums = np.array([list(map(float, x.split()))[0] for x in GT_nums]).reshape(-1, 2) 91 | length = len(GT_nums) 92 | 93 | matched_out = [] 94 | true_positives = 0 95 | false_positives = 0 96 | false_negatives = 0 97 | for pred in answer_nums: 98 | closest_distance = float('inf') 99 | closest_gt = None 100 | closest_id = None 101 | for i, gt in enumerate(GT_nums): 102 | distance = np.sum(np.abs(pred - gt)) 103 | if distance < closest_distance: 104 | closest_distance = distance 105 | closest_gt = gt 106 | closest_id = i 107 | 108 | if closest_distance < 16: 109 | true_positives += 1 110 | matched_out.append(closest_gt) 111 | GT_nums = np.delete(GT_nums, closest_id, axis=0) 112 | else: 113 | false_positives += 1 114 | 115 | false_negatives = length - true_positives 116 | precision = true_positives / (true_positives + false_positives + 1e-8) 117 | recall = true_positives / (true_positives + false_negatives + 1e-8) 118 | F1 = 2 * precision * recall / (precision + recall + 1e-8) 119 | 120 | return matched_out, F1 121 | 122 | def set_graph(self, answer, GT): 123 | self.graph, _ = self.match_result(answer, GT) 124 | self.graph = [list(i) for i in self.graph] 125 | 126 | def forward(self, tag, answer, GT): 127 | if 0 in tag: 128 | self.accuracy["answer"].append(answer) 129 | self.accuracy["GT"].append(GT) 130 | if 1 in tag: 131 | self.GPT.append((answer, GT)) 132 | if 2 in tag: 133 | self.language["GT"].append(GT) 134 | self.language["answer"].append(answer) 135 | if 3 in tag: 136 | self.match["match"]["GT"].append(GT) 137 | self.match["match"]["answer"].append(answer) 138 | self.match["GPT"].append((answer, GT)) 139 | 140 | 141 | def evaluation(self): 142 | print("evaluation start!") 143 | scores = {} 144 | scores["accuracy"] = self.eval_acc() 145 | scores["chatgpt"] = self.eval_chatGPT(self.GPT) 146 | scores["language"] = self.eval_language() 147 | scores["match"] = self.eval_match() 148 | 149 | return scores 150 | 151 | if __name__ == '__main__': 152 | # get args 153 | parser = argparse.ArgumentParser(description='Evaluation') 154 | parser.add_argument('--root_path1', type=str, 
default="./llama-adapter-DriveLM.json", help='path to prediction file') 155 | parser.add_argument('--root_path2', type=str, default="./test_v1.json", help='path to test file') 156 | args = parser.parse_args() 157 | 158 | with open(args.root_path1, 'r') as f :#, \ 159 | pred_file = json.load(f) 160 | pred_file = {pred_file[i]["id"]: pred_file[i] for i in range(len(pred_file))} 161 | 162 | with open(args.root_path2, 'r') as f: 163 | test_file = json.load(f) 164 | 165 | evaluation = evaluation_suit() 166 | for scene_id in test_file.keys(): 167 | scene_data = test_file[scene_id]['key_frames'] 168 | 169 | for frame_id in scene_data.keys(): 170 | frame_data_qa = scene_data[frame_id]['QA'] 171 | first_flag = True 172 | 173 | for i, qa in enumerate(frame_data_qa["perception"] + frame_data_qa["prediction"] + frame_data_qa["planning"] + frame_data_qa["behavior"]): 174 | question = qa['Q'] 175 | GT = qa['A'] 176 | tag = qa['tag'] 177 | idx = scene_id + "_" + frame_id + "_" + str(i) 178 | predict = pred_file[idx]["answer"] 179 | # assert pred_file[idx]["gt_answer"] == GT, print(pred_file[idx]["gt_answer"], GT) 180 | if first_flag: 181 | first_flag = False 182 | evaluation.set_graph(predict, GT) 183 | evaluation.forward(tag, predict, GT) 184 | else: 185 | if evaluation.eval_graph(question): 186 | res = evaluation.forward(tag, predict, GT) 187 | 188 | output = evaluation.evaluation() 189 | print("accuracy score: ", output["accuracy"]) 190 | print("chatgpt score: ", output["chatgpt"]) 191 | print("match score: ", output["match"]) 192 | print("language score: ", output["language"]) 193 | 194 | # Normalize to 0-1 and combine the scores: chatgpt, language, match, accuracy 195 | scores = [] 196 | weights = [0.4, 0.2, 0.2, 0.2] 197 | 198 | # chatGPT 199 | score = output["chatgpt"] / 100. 200 | scores.append(score) 201 | 202 | # language 203 | score = 0 204 | for idx, key in enumerate(output["language"].keys()): 205 | if idx < 4: 206 | score += output["language"][key] / 4. / 3. 207 | elif idx == 4: 208 | score += output["language"][key] / 3. 209 | else: 210 | score += output["language"][key] / 10. / 3. 211 | 212 | scores.append(score) 213 | 214 | # match 215 | score = output["match"] / 100. 
216 | scores.append(score) 217 | 218 | # accuracy 219 | score = output["accuracy"] 220 | scores.append(score) 221 | 222 | final_score = sum([x * y for x, y in zip(scores, weights)]) 223 | print("final score: ", final_score) 224 | 225 | 226 | -------------------------------------------------------------------------------- /challenge/extract_data.py: -------------------------------------------------------------------------------- 1 | import json 2 | import os 3 | import re 4 | 5 | 6 | def extract_data(root_path, save_path): 7 | 8 | with open(root_path, 'r') as f :#, \ 9 | train_file = json.load(f) 10 | 11 | test_data=dict() 12 | 13 | # TODO: convert the data into test data, containing the importance, multiple choice questions, graph questions 14 | for scene_id in train_file.keys(): 15 | scene_data = train_file[scene_id]['key_frames'] 16 | 17 | # for test file 18 | test_data[scene_id] = dict() 19 | test_data[scene_id]['key_frames'] = dict() 20 | 21 | for frame_id in scene_data.keys(): 22 | frame_data_infos = scene_data[frame_id]['key_object_infos'] 23 | frame_data_qa = scene_data[frame_id]['QA'] 24 | image_paths = scene_data[frame_id]['image_paths'] 25 | 26 | # for test file 27 | test_data[scene_id]['key_frames'][frame_id] = dict() 28 | # test_data[scene_id]['key_frames'][frame_id]['key_object_infos'] = frame_data_infos 29 | test_data[scene_id]['key_frames'][frame_id]['QA'] = dict() 30 | test_data[scene_id]['key_frames'][frame_id]['image_paths'] = image_paths 31 | test_data[scene_id]['key_frames'][frame_id]['QA']['perception'] = [] 32 | test_data[scene_id]['key_frames'][frame_id]['QA']['prediction'] = [] 33 | test_data[scene_id]['key_frames'][frame_id]['QA']['planning'] = [] 34 | test_data[scene_id]['key_frames'][frame_id]['QA']['behavior'] = [] 35 | 36 | # get the classes of the important objects 37 | classes = [] 38 | for obj_id in frame_data_infos.keys(): 39 | obj_data = frame_data_infos[obj_id] 40 | classes.append(obj_data['Visual_description'].split('.')[0]) 41 | print(classes) 42 | 43 | # get the location of the important objects 44 | locations = [] 45 | for obj_id in frame_data_infos.keys(): 46 | locations.append(obj_id) 47 | print(locations) 48 | 49 | # get the questions and answers of the perception 50 | perception = frame_data_qa["perception"] 51 | prediction = frame_data_qa["prediction"] 52 | planning = frame_data_qa["planning"] 53 | behavior = frame_data_qa["behavior"] 54 | 55 | for qa in perception: 56 | question = qa['Q'] 57 | answer = qa['A'] 58 | 59 | # according to the classes to select the corresponding question 60 | flag = 1 61 | for cl in classes: 62 | if cl.lower() not in answer.lower(): 63 | flag = 0 64 | if flag == 1: 65 | qa['tag'] = [2] 66 | test_data[scene_id]['key_frames'][frame_id]['QA']['perception'].append(qa) 67 | break 68 | 69 | # get the multiple choice questions and answers 70 | for qa in perception: 71 | question = qa['Q'] 72 | answer = qa['A'] 73 | if "What is the moving status of object".lower() in question.lower(): 74 | qa['tag'] = [0] 75 | test_data[scene_id]['key_frames'][frame_id]['QA']['perception'].append(qa) 76 | break 77 | 78 | # get the graph questions and answers 79 | for qa in prediction: 80 | question = qa['Q'] 81 | answer = qa['A'] 82 | 83 | # according to the location to select the corresponding question 84 | flag = 1 85 | for loc in locations: 86 | if loc.lower() not in answer.lower(): 87 | flag = 0 88 | if flag == 1: 89 | qa['tag'] = [3] 90 | test_data[scene_id]['key_frames'][frame_id]['QA']['prediction'].append(qa) 91 | break 92 | 93 | # 
get the yes or no questions and answers 94 | for qa in prediction: 95 | question = qa['Q'] 96 | answer = qa['A'] 97 | if "yes" in answer.lower() or "no" in answer.lower(): 98 | qa['tag'] = [0] 99 | test_data[scene_id]['key_frames'][frame_id]['QA']['prediction'].append(qa) 100 | break 101 | 102 | # get the three questions from the planning "safe actions", "collision", "" 103 | actions_question_added = False 104 | collision_question_added = False 105 | safe_actions_question_added = False 106 | for qa in planning: 107 | question = qa['Q'] 108 | answer = qa['A'] 109 | if "What actions could the ego vehicle take".lower() in question.lower() and not actions_question_added: 110 | qa['tag'] = [1] 111 | test_data[scene_id]['key_frames'][frame_id]['QA']['planning'].append(qa) 112 | actions_question_added = True 113 | if "lead to a collision" in question.lower() and not collision_question_added: 114 | qa['tag'] = [1] 115 | test_data[scene_id]['key_frames'][frame_id]['QA']['planning'].append(qa) 116 | collision_question_added = True 117 | if "safe actions" in question.lower() and not safe_actions_question_added: 118 | qa['tag'] = [1] 119 | test_data[scene_id]['key_frames'][frame_id]['QA']['planning'].append(qa) 120 | safe_actions_question_added = True 121 | 122 | # Check if all question types have been added and exit the loop 123 | if actions_question_added and collision_question_added and safe_actions_question_added: 124 | break 125 | 126 | for qa in behavior: 127 | question = qa['Q'] 128 | answer = qa['A'] 129 | qa['tag'] = [0] 130 | test_data[scene_id]['key_frames'][frame_id]['QA']['behavior'].append(qa) 131 | 132 | with open(save_path, 'w') as f: 133 | json.dump(test_data, f, indent=4) 134 | 135 | if __name__ == "__main__": 136 | # extract the data from the training json file 137 | root_path = "data/train_sample.json" 138 | save_path = "test.json" 139 | extract_data(root_path, save_path) 140 | 141 | 142 | -------------------------------------------------------------------------------- /challenge/gpt_eval.py: -------------------------------------------------------------------------------- 1 | import pickle 2 | import pdb 3 | import numpy as np 4 | import torch 5 | import json 6 | import argparse 7 | from multiprocessing import Pool 8 | from openai import OpenAI 9 | 10 | 11 | class GPTEvaluation: 12 | def __init__(self): 13 | self.client = OpenAI(api_key="you need to use your own openai key for evaluation on your local machine") 14 | 15 | def call_chatgpt(self, chatgpt_messages, max_tokens=40, model="gpt-3.5-turbo"): 16 | response = self.client.chat.completions.create( 17 | model=model, messages=chatgpt_messages, temperature=0.6, max_tokens=max_tokens 18 | ) 19 | reply = response.choices[0].message.content 20 | total_tokens = response.usage.total_tokens 21 | return reply, total_tokens 22 | 23 | def prepare_chatgpt_message(self, prompt): 24 | system_message = "an evaluator who rates my answer based on the correct answer" 25 | messages = [{"role": "system", "content": system_message}] 26 | messages.append({"role": "user", "content": "{}".format(prompt)}) 27 | 28 | return messages 29 | 30 | def forward(self, data): 31 | answer, GT = data 32 | prompts = "Rate my answer based on the correct answer out of 100, with higher scores indicating that the answer is closer to the correct answer, and you should be accurate to single digits like 62, 78, 41,etc. 
Output the number only" 33 | prompts = prompts + "This is the correct answer: " + GT + "This is my answer: " + answer 34 | 35 | output = "" 36 | messages = self.prepare_chatgpt_message(prompts) 37 | reply, total_tokens = self.call_chatgpt(messages, max_tokens=3000) 38 | 39 | output += reply 40 | output += "\n\n" 41 | 42 | output = output[:-2] 43 | 44 | return output 45 | 46 | 47 | if __name__ == "__main__": 48 | data = [ 49 | ("The ego vehicle should notice the bus next, as it is the third object in the image. The bus is stopped at the intersection, and the ego vehicle should be cautious when approaching the intersection to ensure it does not collide with the bus.", "Firstly, notice . The object is a traffic sign, so the ego vehicle should continue at the same speed. Secondly, notice . The object is a traffic sign, so the ego vehicle should accelerate and continue ahead. Thirdly, notice . The object is stationary, so the ego vehicle should continue ahead at the same speed."), 50 | # Add more data here 51 | ] 52 | 53 | eval = GPTEvaluation() 54 | 55 | with Pool(5) as p: # Change the number based on your CPU cores 56 | scores = p.map(eval.forward, data) 57 | 58 | print(scores) 59 | -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/README.md: -------------------------------------------------------------------------------- 1 | # LLaMA-Adapter-V2 Multi-modal 2 | 3 | ## News 4 | * [Oct 11, 2023] Release LLaMA-Adapter V2.1 and evaluation on MME. 5 | * [July 5, 2023] Release pre-traininig and fine-tuning codes. 6 | * [May 26, 2023] Initial release. 7 | 8 | 9 | ## Setup 10 | 11 | * setup up a new conda env and install necessary packages. 12 | ```bash 13 | conda create -n llama_adapter_v2 python=3.8 -y 14 | pip install -r requirements.txt 15 | ``` 16 | 17 | * Obtain the LLaMA backbone weights using [this form](https://forms.gle/jk851eBVbX1m5TAv5). Please note that checkpoints from unofficial sources (e.g., BitTorrent) may contain malicious code and should be used with care. Organize the downloaded file in the following structure 18 | ``` 19 | /path/to/llama_model_weights 20 | ├── 7B 21 | │   ├── checklist.chk 22 | │   ├── consolidated.00.pth 23 | │   └── params.json 24 | └── tokenizer.model 25 | ``` 26 | 27 | ## Inference 28 | 29 | Here is a simple inference script for LLaMA-Adapter V2. The pre-trained model will be downloaded directly from [Github Release](https://github.com/OpenGVLab/LLaMA-Adapter/releases/tag/v.2.0.0). 30 | 31 | ```python 32 | import cv2 33 | import llama 34 | import torch 35 | from PIL import Image 36 | 37 | device = "cuda" if torch.cuda.is_available() else "cpu" 38 | 39 | llama_dir = "/path/to/LLaMA/" 40 | 41 | # choose from BIAS-7B, LORA-BIAS-7B, LORA-BIAS-7B-v21 42 | model, preprocess = llama.load("BIAS-7B", llama_dir, llama_type="7B", device=device) 43 | model.eval() 44 | 45 | prompt = llama.format_prompt("Please introduce this painting.") 46 | img = Image.fromarray(cv2.imread("../docs/logo_v1.png")) 47 | img = preprocess(img).unsqueeze(0).to(device) 48 | 49 | result = model.generate(img, [prompt])[0] 50 | 51 | print(result) 52 | ``` 53 | 54 | The output will look like the following: 55 | ``` 56 | The painting features a cute white lama, or llama, standing on a wooden floor. The llama is holding a variety of tools and accessories, such as a paintbrush, a pencil, a ruler, a pair of scissors, and a paint can. The llama is dressed in a suit, which adds a touch of sophistication to the scene. 
The painting is a creative and whimsical representation of a person or animal holding various tools and accessories, making it an interesting and unique piece of art. 57 | ``` 58 | 59 | ## Evaluation 60 | Check [eval.md](./docs/eval.md) for details. 61 | 62 | ## Online demo 63 | 64 | We provide an online demo at [OpenGVLab](http://llama-adapter.opengvlab.com). 65 | 66 | You can also start it locally with: 67 | ```bash 68 | python gradio_app.py 69 | ``` 70 | 71 | ## Models 72 | 73 | You can check our models by running: 74 | ```python 75 | import llama 76 | print(llama.available_models()) 77 | ``` 78 | 79 | We currently provide `BIAS-7B`, which fine-tunes the `bias` and `norm` parameters of LLaMA, and `LORA-BIAS-7B`, which fine-tunes the `bias`, `norm` and `lora` parameters. We will include more pretrained models in the future, such as the LoRA fine-tuning model `LORA-7B` and the partial-tuning model `PARTIAL-7B`. 80 | 81 | ## Pre-training & Fine-tuning 82 | See [train.md](docs/train.md) for details. 83 | -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/dataset.py: -------------------------------------------------------------------------------- 1 | import torch 2 | import yaml 3 | from torch.utils.data import Dataset 4 | from PIL import Image 5 | import json 6 | import llama.utils 7 | from llama import Tokenizer 8 | import copy 9 | import torchvision.transforms as transforms 10 | import pandas as pd 11 | import random 12 | import cv2 13 | import re 14 | 15 | try: 16 | from torchvision.transforms import InterpolationMode 17 | BICUBIC = InterpolationMode.BICUBIC 18 | except ImportError: 19 | BICUBIC = Image.BICUBIC 20 | 21 | 22 | PROMPT_DICT = { 23 | "prompt_input": ( 24 | "Below is an instruction that describes a task, paired with an input that provides further context. " 25 | "Write a response that appropriately completes the request.\n\n" 26 | "### Instruction:\n{instruction}\n\n### Input:\n{input}\n\n### Response:" 27 | ), 28 | "prompt_no_input": ( 29 | "Below is an instruction that describes a task. 
" 30 | "Write a response that appropriately completes the request.\n\n" 31 | "### Instruction:\n{instruction}\n\n### Response:" 32 | ), 33 | } 34 | 35 | # create data 36 | transform_train = transforms.Compose([ 37 | transforms.Resize( 38 | (224, 224), interpolation=InterpolationMode.BICUBIC 39 | ), # 3 is bicubic 40 | transforms.ToTensor(), 41 | transforms.Normalize(mean=[0.48145466, 0.4578275, 0.40821073], std=[0.26862954, 0.26130258, 0.27577711])]) 42 | 43 | class FinetuneDataset(Dataset): 44 | def __init__(self, config_path, transform, max_words=30, tokenizer_path=None): 45 | print(f"read dataset config from {config_path}") 46 | with open(config_path, 'r') as f: 47 | self.config = yaml.load(f, Loader=yaml.FullLoader) 48 | print("DATASET CONFIG:") 49 | print(self.config) 50 | ann = [] 51 | for meta_path in self.config['META']: 52 | meta_l = json.load(open(meta_path)) 53 | print(f"{meta_path}: len {len(meta_l)}") 54 | ann += meta_l 55 | self.ann = ann 56 | print(f"total length: {len(self)}") 57 | self.transform = transform 58 | self.max_words = max_words 59 | self.tokenizer = Tokenizer(model_path=tokenizer_path) 60 | 61 | def __len__(self): 62 | return len(self.ann) 63 | 64 | def __getitem__(self, index): 65 | data_item = self.ann[index] 66 | if 'image' in data_item.keys(): 67 | filename = data_item['image'] 68 | question = data_item['conversations'][0]['value'] 69 | answer = data_item['conversations'][1]['value'] 70 | if isinstance(filename, list): 71 | image_all = [] 72 | for img_path in filename: 73 | image = cv2.imread(img_path) 74 | image = Image.fromarray(image) 75 | image = self.transform(image) 76 | image_all.append(image) 77 | image = torch.stack(image_all) 78 | else: 79 | image = cv2.imread(filename) 80 | image = Image.fromarray(image) 81 | image = self.transform(image) 82 | format_instruction = question 83 | format_input = None 84 | else: 85 | image = torch.zeros(3, 224, 224) 86 | format_instruction = data_item['instruction'], 87 | format_input = data_item['input'] 88 | answer = data_item['output'] 89 | input1 = llama.utils.format_prompt(format_instruction, format_input) 90 | input2 = input1 + answer 91 | input1 = torch.tensor(self.tokenizer.encode(input1, bos=True, eos=False), dtype=torch.int64) 92 | input2 = torch.tensor(self.tokenizer.encode(input2, bos=True, eos=True), dtype=torch.int64) 93 | padding = self.max_words - input2.shape[0] 94 | if padding > 0: 95 | input2 = torch.cat((input2, torch.zeros(padding, dtype=torch.int64) - 1)) 96 | elif padding < 0: 97 | input2 = input2[:self.max_words] 98 | labels = copy.deepcopy(input2) 99 | labels[:len(input1)] = -1 100 | input2_mask = input2.ge(0) 101 | label_mask = labels.ge(0) 102 | input2[~input2_mask] = 0 103 | labels[~label_mask] = 0 104 | input2_mask = input2_mask.float() 105 | label_mask = label_mask.float() 106 | return input2, labels, input2_mask, image 107 | 108 | 109 | class PretrainDataset(Dataset): 110 | def __init__(self, config_path, transform, max_words=30, tokenizer_path=None): 111 | print(f"read dataset config from {config_path}") 112 | with open(config_path, 'r') as f: 113 | self.config = yaml.load(f, Loader=yaml.FullLoader) 114 | print("DATASET CONFIG:") 115 | print(self.config) 116 | images, captions = [], [] 117 | for meta_path in self.config['META']: 118 | images_this_meta, captions_this_meta = [], [] 119 | for chunk in pd.read_csv(meta_path, sep='\t', lineterminator='\n', chunksize=10 ** 6): 120 | images_this_meta.extend(chunk['url'].tolist()) 121 | captions_this_meta.extend(chunk['caption'].tolist()) 122 | 
print(f"{meta_path}: len {len(images_this_meta)}") 123 | images.extend(images_this_meta) 124 | captions.extend(captions_this_meta) 125 | 126 | self.data_list = [] 127 | for x, y in zip(images, captions): 128 | self.data_list.append({'url': x, 'caption': y}) 129 | print(f"total length: {len(self)}") 130 | self.transform = transform 131 | self.max_words = max_words 132 | self.tokenizer = Tokenizer(model_path=tokenizer_path) 133 | 134 | def __len__(self): 135 | return len(self.data_list) 136 | 137 | def __getitem__(self, index): 138 | sample = self.data_list[index] 139 | image_path, caption = sample['url'], sample['caption'] 140 | if isinstance(caption, list): 141 | caption = random.choice(caption) 142 | caption = str(caption) 143 | 144 | image = cv2.imread(image_path) 145 | image = Image.fromarray(image) 146 | image = self.transform(image) 147 | 148 | format_instruction = "Generate caption of this image" 149 | input1 = llama.utils.format_prompt(format_instruction, None) 150 | input2 = input1 + caption 151 | 152 | input1 = torch.tensor(self.tokenizer.encode(input1, bos=True, eos=False), dtype=torch.int64) 153 | input2 = torch.tensor(self.tokenizer.encode(input2, bos=True, eos=True), dtype=torch.int64) 154 | padding = self.max_words - input2.shape[0] 155 | if padding > 0: 156 | input2 = torch.cat((input2, torch.zeros(padding, dtype=torch.int64) - 1)) 157 | elif padding < 0: 158 | input2 = input2[:self.max_words] 159 | labels = copy.deepcopy(input2) 160 | labels[:len(input1)] = -1 161 | input2_mask = input2.ge(0) 162 | label_mask = labels.ge(0) 163 | input2[~input2_mask] = 0 164 | labels[~label_mask] = 0 165 | input2_mask = input2_mask.float() 166 | label_mask = label_mask.float() 167 | return input2, labels, input2_mask, image 168 | -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK/n008-2018-09-18-13-10-39-0400__CAM_BACK__1537291002287558.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK/n008-2018-09-18-13-10-39-0400__CAM_BACK__1537291002287558.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK/n008-2018-09-18-13-10-39-0400__CAM_BACK__1537291005187558.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK/n008-2018-09-18-13-10-39-0400__CAM_BACK__1537291005187558.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK/n008-2018-09-18-13-10-39-0400__CAM_BACK__1537291010637558.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK/n008-2018-09-18-13-10-39-0400__CAM_BACK__1537291010637558.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK/n008-2018-09-18-13-10-39-0400__CAM_BACK__1537291013637558.jpg: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK/n008-2018-09-18-13-10-39-0400__CAM_BACK__1537291013637558.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK/n015-2018-08-03-15-00-36+0800__CAM_BACK__1533280036187525.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK/n015-2018-08-03-15-00-36+0800__CAM_BACK__1533280036187525.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK/n015-2018-08-03-15-00-36+0800__CAM_BACK__1533280039187525.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK/n015-2018-08-03-15-00-36+0800__CAM_BACK__1533280039187525.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK/n015-2018-08-03-15-00-36+0800__CAM_BACK__1533280042637525.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK/n015-2018-08-03-15-00-36+0800__CAM_BACK__1533280042637525.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK/n015-2018-08-03-15-00-36+0800__CAM_BACK__1533280045137525.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK/n015-2018-08-03-15-00-36+0800__CAM_BACK__1533280045137525.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK/n015-2018-08-03-15-00-36+0800__CAM_BACK__1533280048187525.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK/n015-2018-08-03-15-00-36+0800__CAM_BACK__1533280048187525.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_LEFT/n008-2018-09-18-13-10-39-0400__CAM_BACK_LEFT__1537291002297405.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_LEFT/n008-2018-09-18-13-10-39-0400__CAM_BACK_LEFT__1537291002297405.jpg 
-------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_LEFT/n008-2018-09-18-13-10-39-0400__CAM_BACK_LEFT__1537291005197405.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_LEFT/n008-2018-09-18-13-10-39-0400__CAM_BACK_LEFT__1537291005197405.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_LEFT/n008-2018-09-18-13-10-39-0400__CAM_BACK_LEFT__1537291010647405.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_LEFT/n008-2018-09-18-13-10-39-0400__CAM_BACK_LEFT__1537291010647405.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_LEFT/n008-2018-09-18-13-10-39-0400__CAM_BACK_LEFT__1537291013647405.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_LEFT/n008-2018-09-18-13-10-39-0400__CAM_BACK_LEFT__1537291013647405.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_LEFT/n015-2018-08-03-15-00-36+0800__CAM_BACK_LEFT__1533280036197423.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_LEFT/n015-2018-08-03-15-00-36+0800__CAM_BACK_LEFT__1533280036197423.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_LEFT/n015-2018-08-03-15-00-36+0800__CAM_BACK_LEFT__1533280039197423.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_LEFT/n015-2018-08-03-15-00-36+0800__CAM_BACK_LEFT__1533280039197423.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_LEFT/n015-2018-08-03-15-00-36+0800__CAM_BACK_LEFT__1533280042647423.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_LEFT/n015-2018-08-03-15-00-36+0800__CAM_BACK_LEFT__1533280042647423.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_LEFT/n015-2018-08-03-15-00-36+0800__CAM_BACK_LEFT__1533280045147423.jpg: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_LEFT/n015-2018-08-03-15-00-36+0800__CAM_BACK_LEFT__1533280045147423.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_LEFT/n015-2018-08-03-15-00-36+0800__CAM_BACK_LEFT__1533280048197442.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_LEFT/n015-2018-08-03-15-00-36+0800__CAM_BACK_LEFT__1533280048197442.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_RIGHT/n008-2018-09-18-13-10-39-0400__CAM_BACK_RIGHT__1537291002278113.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_RIGHT/n008-2018-09-18-13-10-39-0400__CAM_BACK_RIGHT__1537291002278113.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_RIGHT/n008-2018-09-18-13-10-39-0400__CAM_BACK_RIGHT__1537291005178113.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_RIGHT/n008-2018-09-18-13-10-39-0400__CAM_BACK_RIGHT__1537291005178113.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_RIGHT/n008-2018-09-18-13-10-39-0400__CAM_BACK_RIGHT__1537291010628113.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_RIGHT/n008-2018-09-18-13-10-39-0400__CAM_BACK_RIGHT__1537291010628113.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_RIGHT/n008-2018-09-18-13-10-39-0400__CAM_BACK_RIGHT__1537291013628113.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_RIGHT/n008-2018-09-18-13-10-39-0400__CAM_BACK_RIGHT__1537291013628113.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_RIGHT/n015-2018-08-03-15-00-36+0800__CAM_BACK_RIGHT__1533280036177893.jpg: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_RIGHT/n015-2018-08-03-15-00-36+0800__CAM_BACK_RIGHT__1533280036177893.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_RIGHT/n015-2018-08-03-15-00-36+0800__CAM_BACK_RIGHT__1533280039177893.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_RIGHT/n015-2018-08-03-15-00-36+0800__CAM_BACK_RIGHT__1533280039177893.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_RIGHT/n015-2018-08-03-15-00-36+0800__CAM_BACK_RIGHT__1533280042627893.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_RIGHT/n015-2018-08-03-15-00-36+0800__CAM_BACK_RIGHT__1533280042627893.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_RIGHT/n015-2018-08-03-15-00-36+0800__CAM_BACK_RIGHT__1533280045127893.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_RIGHT/n015-2018-08-03-15-00-36+0800__CAM_BACK_RIGHT__1533280045127893.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_RIGHT/n015-2018-08-03-15-00-36+0800__CAM_BACK_RIGHT__1533280048177893.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_BACK_RIGHT/n015-2018-08-03-15-00-36+0800__CAM_BACK_RIGHT__1533280048177893.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT/n008-2018-09-18-13-10-39-0400__CAM_FRONT__1537291002262404.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT/n008-2018-09-18-13-10-39-0400__CAM_FRONT__1537291002262404.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT/n008-2018-09-18-13-10-39-0400__CAM_FRONT__1537291005162404.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT/n008-2018-09-18-13-10-39-0400__CAM_FRONT__1537291005162404.jpg 
-------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT/n008-2018-09-18-13-10-39-0400__CAM_FRONT__1537291010612404.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT/n008-2018-09-18-13-10-39-0400__CAM_FRONT__1537291010612404.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT/n008-2018-09-18-13-10-39-0400__CAM_FRONT__1537291013612404.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT/n008-2018-09-18-13-10-39-0400__CAM_FRONT__1537291013612404.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT/n015-2018-08-03-15-00-36+0800__CAM_FRONT__1533280036162460.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT/n015-2018-08-03-15-00-36+0800__CAM_FRONT__1533280036162460.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT/n015-2018-08-03-15-00-36+0800__CAM_FRONT__1533280039162460.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT/n015-2018-08-03-15-00-36+0800__CAM_FRONT__1533280039162460.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT/n015-2018-08-03-15-00-36+0800__CAM_FRONT__1533280042612460.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT/n015-2018-08-03-15-00-36+0800__CAM_FRONT__1533280042612460.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT/n015-2018-08-03-15-00-36+0800__CAM_FRONT__1533280045112460.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT/n015-2018-08-03-15-00-36+0800__CAM_FRONT__1533280045112460.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT/n015-2018-08-03-15-00-36+0800__CAM_FRONT__1533280048162460.jpg: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT/n015-2018-08-03-15-00-36+0800__CAM_FRONT__1533280048162460.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_LEFT/n008-2018-09-18-13-10-39-0400__CAM_FRONT_LEFT__1537291002254799.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_LEFT/n008-2018-09-18-13-10-39-0400__CAM_FRONT_LEFT__1537291002254799.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_LEFT/n008-2018-09-18-13-10-39-0400__CAM_FRONT_LEFT__1537291005154799.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_LEFT/n008-2018-09-18-13-10-39-0400__CAM_FRONT_LEFT__1537291005154799.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_LEFT/n008-2018-09-18-13-10-39-0400__CAM_FRONT_LEFT__1537291010604799.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_LEFT/n008-2018-09-18-13-10-39-0400__CAM_FRONT_LEFT__1537291010604799.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_LEFT/n008-2018-09-18-13-10-39-0400__CAM_FRONT_LEFT__1537291013604799.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_LEFT/n008-2018-09-18-13-10-39-0400__CAM_FRONT_LEFT__1537291013604799.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_LEFT/n015-2018-08-03-15-00-36+0800__CAM_FRONT_LEFT__1533280036154844.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_LEFT/n015-2018-08-03-15-00-36+0800__CAM_FRONT_LEFT__1533280036154844.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_LEFT/n015-2018-08-03-15-00-36+0800__CAM_FRONT_LEFT__1533280039154844.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_LEFT/n015-2018-08-03-15-00-36+0800__CAM_FRONT_LEFT__1533280039154844.jpg 
-------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_LEFT/n015-2018-08-03-15-00-36+0800__CAM_FRONT_LEFT__1533280042604844.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_LEFT/n015-2018-08-03-15-00-36+0800__CAM_FRONT_LEFT__1533280042604844.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_LEFT/n015-2018-08-03-15-00-36+0800__CAM_FRONT_LEFT__1533280045104844.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_LEFT/n015-2018-08-03-15-00-36+0800__CAM_FRONT_LEFT__1533280045104844.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_LEFT/n015-2018-08-03-15-00-36+0800__CAM_FRONT_LEFT__1533280048154844.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_LEFT/n015-2018-08-03-15-00-36+0800__CAM_FRONT_LEFT__1533280048154844.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_RIGHT/n008-2018-09-18-13-10-39-0400__CAM_FRONT_RIGHT__1537291002270482.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_RIGHT/n008-2018-09-18-13-10-39-0400__CAM_FRONT_RIGHT__1537291002270482.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_RIGHT/n008-2018-09-18-13-10-39-0400__CAM_FRONT_RIGHT__1537291005170482.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_RIGHT/n008-2018-09-18-13-10-39-0400__CAM_FRONT_RIGHT__1537291005170482.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_RIGHT/n008-2018-09-18-13-10-39-0400__CAM_FRONT_RIGHT__1537291010620482.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_RIGHT/n008-2018-09-18-13-10-39-0400__CAM_FRONT_RIGHT__1537291010620482.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_RIGHT/n008-2018-09-18-13-10-39-0400__CAM_FRONT_RIGHT__1537291013620482.jpg: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_RIGHT/n008-2018-09-18-13-10-39-0400__CAM_FRONT_RIGHT__1537291013620482.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_RIGHT/n015-2018-08-03-15-00-36+0800__CAM_FRONT_RIGHT__1533280036170339.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_RIGHT/n015-2018-08-03-15-00-36+0800__CAM_FRONT_RIGHT__1533280036170339.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_RIGHT/n015-2018-08-03-15-00-36+0800__CAM_FRONT_RIGHT__1533280039170339.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_RIGHT/n015-2018-08-03-15-00-36+0800__CAM_FRONT_RIGHT__1533280039170339.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_RIGHT/n015-2018-08-03-15-00-36+0800__CAM_FRONT_RIGHT__1533280042620339.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_RIGHT/n015-2018-08-03-15-00-36+0800__CAM_FRONT_RIGHT__1533280042620339.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_RIGHT/n015-2018-08-03-15-00-36+0800__CAM_FRONT_RIGHT__1533280045120339.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_RIGHT/n015-2018-08-03-15-00-36+0800__CAM_FRONT_RIGHT__1533280045120339.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_RIGHT/n015-2018-08-03-15-00-36+0800__CAM_FRONT_RIGHT__1533280048170339.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenDriveLab/DriveLM/0e8dff72eaf13c42b508289a34ea758782089e8c/challenge/llama_adapter_v2_multimodal7b/data/nuscenes/samples/CAM_FRONT_RIGHT/n015-2018-08-03-15-00-36+0800__CAM_FRONT_RIGHT__1533280048170339.jpg -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/demo.py: -------------------------------------------------------------------------------- 1 | import cv2 2 | import llama 3 | import torch 4 | from PIL import Image 5 | from tqdm import tqdm 6 | import json 7 | import argparse 8 | import torchvision.transforms as transforms 9 | from torch.utils.data import Dataset, DataLoader 10 | from 
threading import Thread 11 | import math 12 | 13 | try: 14 | from torchvision.transforms import InterpolationMode 15 | BICUBIC = InterpolationMode.BICUBIC 16 | except ImportError: 17 | BICUBIC = Image.BICUBIC 18 | 19 | class LLamaDataset(Dataset): 20 | def __init__(self, data, transform=None): 21 | self.data = data 22 | self.transform = transform 23 | 24 | def __len__(self): 25 | return len(self.data) 26 | 27 | def __getitem__(self, idx): 28 | data_item = self.data[idx] 29 | filename = data_item['image'] 30 | ids = data_item['id'] 31 | question = data_item['conversations'][0]['value'] 32 | answer = data_item['conversations'][1]['value'] 33 | 34 | prompt = llama.format_prompt(question) 35 | 36 | if isinstance(filename, list): 37 | image_all = [] 38 | for img_path in filename: 39 | image = cv2.imread(img_path) 40 | image = Image.fromarray(image) 41 | if self.transform: 42 | image = self.transform(image) 43 | image_all.append(image) 44 | image = torch.stack(image_all, dim=0) 45 | else: 46 | image = cv2.imread(filename) 47 | image = Image.fromarray(image) 48 | if self.transform: 49 | image = self.transform(image) 50 | 51 | return image, prompt, ids, question, answer 52 | 53 | def worker(rank, gpu_id, args, data_dict): 54 | torch.cuda.set_device(gpu_id) 55 | device = torch.device("cuda") 56 | llama_dir = args.llama_dir 57 | 58 | model, preprocess = llama.load(args.checkpoint, llama_dir, llama_type="7B", device=device) 59 | model.eval() 60 | 61 | transform_train = transforms.Compose([ 62 | transforms.Resize((224, 224), interpolation=BICUBIC), 63 | transforms.ToTensor(), 64 | transforms.Normalize(mean=[0.48145466, 0.4578275, 0.40821073], std=[0.26862954, 0.26130258, 0.27577711])]) 65 | 66 | with open(args.data, 'r') as f: 67 | data_all = json.load(f) 68 | 69 | num_processes = args.num_processes 70 | data_per_process = math.ceil(len(data_all) / num_processes) 71 | start_idx = rank * data_per_process 72 | end_idx = min((rank + 1) * data_per_process, len(data_all)) 73 | data_to_process = data_all[start_idx:end_idx] 74 | 75 | dataset = LLamaDataset(data_to_process, transform=transform_train) 76 | dataloader = DataLoader(dataset, batch_size=args.batch_size, shuffle=False, num_workers=8) 77 | 78 | for batch in tqdm(dataloader): 79 | images, prompts, ids, questions, gt_answers = batch 80 | images = images.to(device) 81 | results = model.generate(images, prompts, temperature=0.2, top_p=0.1) 82 | 83 | for i, result in enumerate(results): 84 | print(f"Thread {rank}: Result - {result}") 85 | data_dict.append({'id': ids[i], 'question': questions[i], 'answer': result}) 86 | 87 | print(f"Thread {rank} finished") 88 | 89 | # add args 90 | parser = argparse.ArgumentParser(description='LLAMA Adapter') 91 | parser.add_argument('--llama_dir', type=str, default="/path/to/llama_model_weights", help='path to llama model weights') 92 | parser.add_argument('--checkpoint', type=str, default="/path/to/pre-trained/checkpoint.pth", help='path to pre-trained checkpoint') 93 | parser.add_argument('--data', type=str, default="../test_llama.json", help='path to test data') 94 | parser.add_argument('--output', type=str, default="../output.json", help='path to output file') 95 | parser.add_argument('--batch_size', type=int, default=8, help='batch size for parallel processing') 96 | parser.add_argument('--num_processes', type=int, default=8, help='number of gpus to use') 97 | args = parser.parse_args() 98 | 99 | if __name__ == '__main__': 100 | num_gpus = args.num_processes 101 | print(f"Using {num_gpus} GPUs") 102 | 103 | 
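# Each thread started below runs worker(), which pins itself to one GPU and
# processes an equal slice of the test set: with N samples and P workers,
# worker r handles indices [r * ceil(N / P), min((r + 1) * ceil(N / P), N)).
# For example (illustrative numbers), with 803 samples and 8 workers, workers
# 0-6 each get 101 samples and worker 7 gets the remaining 96.
# Appending results to the shared `data_dict` list from several threads is
# effectively safe in CPython, since list.append is performed under the GIL.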
data_dict = [] 104 | threads = [] 105 | for rank in range(num_gpus): 106 | t = Thread(target=worker, args=(rank, rank, args, data_dict)) 107 | t.start() 108 | threads.append(t) 109 | 110 | for t in threads: 111 | t.join() 112 | 113 | with open(args.output, "w") as f: 114 | json.dump(data_dict, f, indent=4) 115 | -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/docs/eval.md: -------------------------------------------------------------------------------- 1 | # Evaluation on MME Benchmark 2 | 3 | [MME](https://github.com/BradyFU/Awesome-Multimodal-Large-Language-Models/tree/Evaluation) is a comprehensive evaluation benchmark for multimodal large language models. It measures both perception and cognition abilities on a total of 14 subtasks, including existence, count, position, color, poster, celebrity, scene, landmark, artwork, OCR, commonsense reasoning, numerical calculation, text translation, and code reasoning. 4 | 5 | ## Setup & Evaluation 6 | 7 | 1. Download MME datasets and `eval_tool` from the [MME repo](https://github.com/bradyfu/awesome-multimodal-large-language-models#our-mllm-works), and put them under `MME_Benchmark_release_version`. Now the folder structure will be: 8 | ``` 9 | MME_Benchmark_release_version 10 | ├── artwork 11 | ├── celebrity 12 | ├── code_reasoning 13 | ├── color 14 | ├── commonsense_reasoning 15 | ├── count 16 | ├── eval_tool 17 | │ ├── calculation.py 18 | │ ├── LaVIN 19 | │ └── Your_Results 20 | ├── existence 21 | ├── landmark 22 | ├── numerical_calculation 23 | ├── OCR 24 | ├── position 25 | ├── posters 26 | ├── scene 27 | └── text_translation 28 | ``` 29 | 2. Generate MME results using: `python util/evaluate_mme.py --pretrained_path [MODEL_PATH] --llama_path [LLAMA_DIR] --output_path [RESULT_FILE_PATH]` 30 | 3. Evaluate LLaMA-Adapter V2.1 with MME's eval_tool: `python MME_Benchmark_release_version/eval_tool/calculation.py --results_dir [RESULT_FILE_PATH]` 31 | 32 | ## Results 33 | 34 | > For comparisons with other works, please check [MME Leaderboard](https://github.com/BradyFU/Awesome-Multimodal-Large-Language-Models/tree/Evaluation). 35 | 36 | * **LLaMA-Adapter V2.1** 37 | 38 | ``` 39 | =========== Perception =========== 40 | total score: 1326.0875953396435 41 | 42 | existence score: 185.0 43 | count score: 133.33333333333331 44 | position score: 56.666666666666664 45 | color score: 118.33333333333334 46 | posters score: 147.9591836734694 47 | celebrity score: 134.70588235294116 48 | scene score: 156.25 49 | landmark score: 167.8391959798995 50 | artwork score: 123.5 51 | OCR score: 102.5 52 | 53 | 54 | =========== Cognition =========== 55 | total score: 356.42857142857144 56 | 57 | commonsense_reasoning score: 106.42857142857144 58 | numerical_calculation score: 47.5 59 | text_translation score: 112.5 60 | code_reasoning score: 90.0 61 | 62 | ``` 63 | -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/docs/train.md: -------------------------------------------------------------------------------- 1 | The training process of LLaMA-Adapter V2 consists of the pre-training and fine-tuning phases. 2 | 3 | ## Pre-training 4 | 5 | ### Data 6 | 7 | * We use multiple datasets with **image-text pairs** for pre-training. The texts are English-only. 
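As a hedged illustration (not part of the original instructions), a meta file in the layout described in the next bullet can be assembled with pandas; the `url`/`caption` column names and the tab separator are assumptions taken from the provided `PretrainDataset`, which reads the file back with `pd.read_csv(..., sep='\t')`:

```python
import pandas as pd

# Hypothetical image/caption pairs -- replace with your own data source.
records = [
    {"url": "/data/cc3m/images/000001.jpg", "caption": "a dog running on the beach"},
    {"url": "/data/cc3m/images/000002.jpg", "caption": "a bowl of fruit on a wooden table"},
]

# PretrainDataset reads the meta file with sep='\t', so write it tab-separated.
pd.DataFrame(records).to_csv("/path/to/cc3m.csv", sep="\t", index=False)
```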
8 | * For each dataset, the meta file should be organized in the `.csv` format as following: 9 | 10 | ``` 11 | url caption 12 | /path/to/image1 caption1 13 | /path/to/image2 caption2 14 | ... 15 | ``` 16 | 17 | Alternatively, you may modify the [`PretrainDataset`](/data/dataset.py) implementation to adapt to your own meta file format. 18 | * Write a `.yaml` config file to specify the datasets for pre-training: 19 | 20 | ``` 21 | META: 22 | - '/path/to/cc3m.csv' 23 | - '/path/to/coco.csv' 24 | ... 25 | ``` 26 | 27 | ### Start pre-training 28 | 29 | We are now ready to start pre-training (please make sure that the original LLaMA weights are available in `/path/to/llama_model_weights`). 30 | 31 | ```bash 32 | . exps/pretrain.sh /path/to/llama_model_weights /path/to/pretrain-data-config.yaml /output/path 33 | ``` 34 | 35 | ## Fine-tuning 36 | 37 | ### Data 38 | 39 | * We fine-tune LLaMA-Adapter V2 on text-only as well as image-text instruction following datasets. 40 | * The following lists the datasets we use for training our release weights: 41 | 42 | | Name | Link | 43 | | ------------------------ | ------------------------------------------------------------------------------------------------------------ | 44 | | alpaca_gpt4_data.json | [File Link](https://github.com/Instruction-Tuning-with-GPT-4/GPT-4-LLM/blob/main/data/alpaca_gpt4_data.json) | 45 | | alpaca_gpt4_data_zh.json | [File Link](https://github.com/Instruction-Tuning-with-GPT-4/GPT-4-LLM/blob/main/data/alpaca_gpt4_data_zh.json) | 46 | | llava_instruct_150k.json | [File Link](https://huggingface.co/datasets/liuhaotian/LLaVA-Instruct-150K/raw/main/llava_instruct_150k.json) | 47 | | alpaca_data_zh_51k.json | [File Link](https://github.com/ymcui/Chinese-LLaMA-Alpaca/blob/main/data/alpaca_data_zh_51k.json) | 48 | * Similar to pre-training, write a `.yaml` config file to specify the datasets for fine-tuning: 49 | 50 | ``` 51 | META: 52 | - '/path/to/alpaca_gpt4_data.json' 53 | - '/path/to/alpaca_gpt4_data_zh.json' 54 | ... 55 | ``` 56 | 57 | ### Start fine-tuning 58 | 59 | ```bash 60 | . 
exps/finetune.sh \ 61 | /path/to/llama_model_weights /path/to/pre-trained/checkpoint.pth \ 62 | /path/to/finetune-data-config.yaml /output/path 63 | ``` 64 | 65 | ### Test and Save 66 | 67 | ```python 68 | import os 69 | from llama.llama_adapter import LLaMA_adapter 70 | import util.misc as misc 71 | import util.extract_adapter_from_checkpoint as extract 72 | from PIL import Image 73 | import cv2 74 | import torch 75 | import llama 76 | 77 | device = "cuda" if torch.cuda.is_available() else "cpu" 78 | 79 | llama_dir = "path/to/llama/" 80 | llama_type = '7B' 81 | llama_ckpt_dir = os.path.join(llama_dir, llama_type) 82 | llama_tokenzier_path = os.path.join(llama_dir, 'tokenizer.model') 83 | model = LLaMA_adapter(llama_ckpt_dir, llama_tokenzier_path) 84 | 85 | misc.load_model(model, 'path/to/finetune/checkpoint.pth') 86 | model.eval() 87 | model.to(device) 88 | 89 | prompt = llama.format_prompt('your prompt') 90 | img = Image.fromarray(cv2.imread("your image")) 91 | img = model.clip_transform(img).unsqueeze(0).to(device) 92 | 93 | result = model.generate(img, [prompt])[0] 94 | print(result) 95 | 96 | extract.save(model,'path/to/adapter-7B.pth','BIAS') # Please end it with -llama_type.pth 97 | ``` 98 | -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/engine_finetune.py: -------------------------------------------------------------------------------- 1 | import math 2 | import sys 3 | from typing import Iterable 4 | 5 | import torch 6 | 7 | import util.misc as misc 8 | import util.lr_sched as lr_sched 9 | 10 | from llama import LLaMA_adapter 11 | 12 | def train_one_epoch(model: LLaMA_adapter, 13 | data_loader: Iterable, optimizer: torch.optim.Optimizer, 14 | device: torch.device, epoch: int, loss_scaler, 15 | log_writer=None, 16 | args=None): 17 | model.train(True) 18 | # model.module.set_default_trainability() 19 | 20 | metric_logger = misc.MetricLogger(delimiter=" ") 21 | metric_logger.add_meter('lr', misc.SmoothedValue(window_size=1, fmt='{value:.6f}')) 22 | header = 'Epoch: [{}]'.format(epoch) 23 | print_freq = 10 24 | 25 | accum_iter = args.accum_iter 26 | 27 | optimizer.zero_grad() 28 | 29 | if log_writer is not None: 30 | print('log_dir: {}'.format(log_writer.log_dir)) 31 | for data_iter_step, (examples, labels, example_mask, imgs) in enumerate(metric_logger.log_every(data_loader, print_freq, header)): 32 | # we use a per iteration (instead of per epoch) lr scheduler 33 | if data_iter_step % accum_iter == 0: 34 | lr_sched.adjust_learning_rate(optimizer, data_iter_step / len(data_loader) + epoch, args) 35 | 36 | imgs = imgs.to(device, non_blocking=True) 37 | with torch.cuda.amp.autocast(): 38 | c_loss, m_loss = model(examples, labels, imgs) 39 | loss = c_loss + m_loss * 0 40 | loss_value = loss.item() 41 | c_loss_value = c_loss.item() 42 | m_loss_value = m_loss 43 | if not math.isfinite(loss_value): 44 | print("Loss is {}, stopping training".format(loss_value)) 45 | sys.exit(1) 46 | 47 | loss /= accum_iter 48 | loss_scaler(loss, optimizer, parameters=model.parameters(), 49 | update_grad=(data_iter_step + 1) % accum_iter == 0) 50 | if (data_iter_step + 1) % accum_iter == 0: 51 | optimizer.zero_grad() 52 | 53 | torch.cuda.synchronize() 54 | 55 | metric_logger.update(closs=c_loss_value) 56 | metric_logger.update(mloss=m_loss_value) 57 | 58 | lr = optimizer.param_groups[0]["lr"] 59 | metric_logger.update(lr=lr) 60 | 61 | loss_value_reduce = misc.all_reduce_mean(loss_value) 62 | c_loss_value_reduce = 
misc.all_reduce_mean(c_loss_value) 63 | m_loss_value_reduce = misc.all_reduce_mean(m_loss_value) 64 | if log_writer is not None and (data_iter_step + 1) % accum_iter == 0: 65 | """ We use epoch_1000x as the x-axis in tensorboard. 66 | This calibrates different curves when batch size changes. 67 | """ 68 | epoch_1000x = int((data_iter_step / len(data_loader) + epoch) * 1000) 69 | log_writer.add_scalar('c_train_loss', c_loss_value_reduce, epoch_1000x) 70 | log_writer.add_scalar('m_train_loss', m_loss_value_reduce, epoch_1000x) 71 | log_writer.add_scalar('lr', lr, epoch_1000x) 72 | 73 | 74 | # gather the stats from all processes 75 | metric_logger.synchronize_between_processes() 76 | print("Averaged stats:", metric_logger) 77 | return {k: meter.global_avg for k, meter in metric_logger.meters.items()} 78 | -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/engine_pretrain.py: -------------------------------------------------------------------------------- 1 | import math 2 | import sys 3 | from typing import Iterable 4 | 5 | import torch 6 | 7 | import util.misc as misc 8 | import util.lr_sched as lr_sched 9 | 10 | from llama import LLaMA_adapter 11 | 12 | def train_one_epoch(model: LLaMA_adapter, 13 | data_loader: Iterable, optimizer: torch.optim.Optimizer, 14 | device: torch.device, epoch: int, loss_scaler, 15 | log_writer=None, 16 | args=None): 17 | model.train(True) 18 | # model.module.set_default_trainability() 19 | 20 | metric_logger = misc.MetricLogger(delimiter=" ") 21 | metric_logger.add_meter('lr', misc.SmoothedValue(window_size=1, fmt='{value:.6f}')) 22 | header = 'Epoch: [{}]'.format(epoch) 23 | print_freq = 10 24 | 25 | accum_iter = args.accum_iter 26 | 27 | optimizer.zero_grad() 28 | 29 | if log_writer is not None: 30 | print('log_dir: {}'.format(log_writer.log_dir)) 31 | for data_iter_step, (examples, labels, example_mask, imgs) in enumerate(metric_logger.log_every(data_loader, print_freq, header)): 32 | # we use a per iteration (instead of per epoch) lr scheduler 33 | if data_iter_step % accum_iter == 0: 34 | lr_sched.adjust_learning_rate(optimizer, data_iter_step / len(data_loader) + epoch, args) 35 | 36 | imgs = imgs.to(device, non_blocking=True) 37 | with torch.cuda.amp.autocast(): 38 | c_loss, m_loss = model(examples, labels, imgs) 39 | loss = c_loss + m_loss * 0 40 | loss_value = loss.item() 41 | c_loss_value = c_loss.item() 42 | m_loss_value = m_loss 43 | if not math.isfinite(loss_value): 44 | print("Loss is {}, stopping training".format(loss_value)) 45 | sys.exit(1) 46 | 47 | loss /= accum_iter 48 | loss_scaler(loss, optimizer, parameters=model.parameters(), 49 | update_grad=(data_iter_step + 1) % accum_iter == 0) 50 | if (data_iter_step + 1) % accum_iter == 0: 51 | optimizer.zero_grad() 52 | 53 | torch.cuda.synchronize() 54 | 55 | metric_logger.update(closs=c_loss_value) 56 | metric_logger.update(mloss=m_loss_value) 57 | 58 | lr = optimizer.param_groups[0]["lr"] 59 | metric_logger.update(lr=lr) 60 | 61 | loss_value_reduce = misc.all_reduce_mean(loss_value) 62 | c_loss_value_reduce = misc.all_reduce_mean(c_loss_value) 63 | m_loss_value_reduce = misc.all_reduce_mean(m_loss_value) 64 | if log_writer is not None and (data_iter_step + 1) % accum_iter == 0: 65 | """ We use epoch_1000x as the x-axis in tensorboard. 66 | This calibrates different curves when batch size changes. 
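For example, with 1000 iterations per epoch, iteration 250 of epoch 3 is logged at x = int((250 / 1000 + 3) * 1000) = 3250, so every epoch spans exactly 1000 ticks on the x-axis regardless of the effective batch size.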
67 | """ 68 | epoch_1000x = int((data_iter_step / len(data_loader) + epoch) * 1000) 69 | log_writer.add_scalar('c_train_loss', c_loss_value_reduce, epoch_1000x) 70 | log_writer.add_scalar('m_train_loss', m_loss_value_reduce, epoch_1000x) 71 | log_writer.add_scalar('lr', lr, epoch_1000x) 72 | 73 | 74 | # gather the stats from all processes 75 | metric_logger.synchronize_between_processes() 76 | print("Averaged stats:", metric_logger) 77 | return {k: meter.global_avg for k, meter in metric_logger.meters.items()} 78 | -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/exps/finetune.sh: -------------------------------------------------------------------------------- 1 | #!/usr/bin/bash 2 | 3 | LLAMA_PATH="$1" 4 | PRETRAINED_PATH="$2" # path to pre-trained checkpoint 5 | CONFIG="$3" 6 | OUTPUT_DIR="$4" 7 | 8 | mkdir -p $OUTPUT_DIR 9 | 10 | python -u -m torch.distributed.launch --master_port=1112 --nproc_per_node=8 --use_env \ 11 | main_finetune.py --data_config "$CONFIG" --batch_size 4 \ 12 | --epochs 4 --warmup_epochs 1 --blr 10e-4 --weight_decay 0.02 \ 13 | --llama_path "$LLAMA_PATH" \ 14 | --output_dir "$OUTPUT_DIR" \ 15 | --pretrained_path "$PRETRAINED_PATH" \ 16 | &>> "$OUTPUT_DIR"/output.log & -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/exps/pretrain.sh: -------------------------------------------------------------------------------- 1 | #!/usr/bin/bash 2 | 3 | LLAMA_PATH="$1" 4 | CONFIG="$2" 5 | OUTPUT_DIR="$3" 6 | 7 | mkdir -p "$OUTPUT_DIR" 8 | 9 | python -u -m torch.distributed.launch --master_port=1112 --nproc_per_node=8 --use_env \ 10 | main_pretrain.py --data_config "$CONFIG" --batch_size 4 \ 11 | --epochs 150 --split_epoch 50 --warmup_epochs 5 --blr 1.0e-4 --weight_decay 0.05 \ 12 | --llama_path "$LLAMA_PATH" \ 13 | --output_dir "$OUTPUT_DIR" \ 14 | &>> "$OUTPUT_DIR"/output.log & -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/finetune_data_config.yaml: -------------------------------------------------------------------------------- 1 | META: 2 | - 'test_llama.json' 3 | 4 | 5 | -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/gradio_app.py: -------------------------------------------------------------------------------- 1 | import cv2 2 | import gradio as gr 3 | import torch 4 | from PIL import Image 5 | 6 | import llama 7 | 8 | 9 | device = "cuda" if torch.cuda.is_available() else "cpu" 10 | 11 | llama_dir = "/path/to/LLaMA/" 12 | 13 | model, preprocess = llama.load("BIAS-7B", llama_dir, device) 14 | model.half() 15 | model.eval() 16 | 17 | def multi_modal_generate( 18 | img_path: str, 19 | prompt: str, 20 | max_gen_len=256, 21 | temperature: float = 0.1, 22 | top_p: float = 0.75, 23 | ): 24 | try: 25 | img = Image.fromarray(cv2.imread(img_path)) 26 | except: 27 | return "" 28 | 29 | img = preprocess(img).unsqueeze(0).half().to(device) 30 | prompt = llama.format_prompt(prompt) 31 | 32 | result = model.generate(img, [prompt], 33 | max_gen_len=max_gen_len, 34 | temperature=temperature, 35 | top_p=top_p) 36 | print(result[0]) 37 | return result[0] 38 | 39 | 40 | def create_multi_modal_demo(): 41 | with gr.Blocks() as instruct_demo: 42 | with gr.Row(): 43 | with gr.Column(): 44 | img = gr.Image(label='Input', type='filepath') 45 | question = gr.Textbox(lines=2, label="Prompt") 46 | max_len = 
gr.Slider(minimum=1, maximum=512, 47 | value=256, label="Max length") 48 | with gr.Accordion(label='Advanced options', open=False): 49 | temp = gr.Slider(minimum=0, maximum=1, 50 | value=0.1, label="Temperature") 51 | top_p = gr.Slider(minimum=0, maximum=1, 52 | value=0.75, label="Top p") 53 | 54 | run_botton = gr.Button("Run") 55 | 56 | with gr.Column(): 57 | outputs = gr.Textbox(lines=10, label="Output") 58 | 59 | inputs = [img, question, max_len, temp, top_p] 60 | 61 | examples = [ 62 | ["../docs/logo_v1.png", "Please introduce this painting.", 256, 0.1, 0.75], 63 | ] 64 | 65 | gr.Examples( 66 | examples=examples, 67 | inputs=inputs, 68 | outputs=outputs, 69 | fn=multi_modal_generate, 70 | cache_examples=False 71 | ) 72 | run_botton.click(fn=multi_modal_generate, 73 | inputs=inputs, outputs=outputs) 74 | return instruct_demo 75 | 76 | 77 | description = """ 78 | # LLaMA-Adapter V2🚀 79 | The official demo for **LLaMA-Adapter V2: Parameter-Efficient Visual Instruction Model**. 80 | 81 | Please refer to our [arXiv paper](https://arxiv.org/abs/2304.15010) and [github](https://github.com/ZrrSkywalker/LLaMA-Adapter) for more details. 82 | 83 | The demo for **LLaMA-Adapter V1** is available at: [Huggingface Spaces](https://huggingface.co/spaces/csuhan/LLaMA-Adapter). 84 | """ 85 | 86 | with gr.Blocks(css="h1,p {text-align: center;}") as demo: 87 | gr.Markdown(description) 88 | with gr.TabItem("Multi-Modal Interaction"): 89 | create_multi_modal_demo() 90 | 91 | demo.queue(api_open=True, concurrency_count=1).launch(share=True) 92 | -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/llama/__init__.py: -------------------------------------------------------------------------------- 1 | from .llama import ModelArgs, Transformer 2 | from .tokenizer import Tokenizer 3 | from .llama_adapter import * 4 | from .utils import format_prompt -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/llama/tokenizer.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Meta Platforms, Inc. and affiliates. 2 | # This software may be used and distributed according to the terms of the GNU General Public License version 3. 
3 | 4 | from sentencepiece import SentencePieceProcessor 5 | from logging import getLogger 6 | from typing import List 7 | import os 8 | 9 | 10 | logger = getLogger() 11 | 12 | 13 | class Tokenizer: 14 | def __init__(self, model_path: str): 15 | # reload tokenizer 16 | assert os.path.isfile(model_path), model_path 17 | self.sp_model = SentencePieceProcessor(model_file=model_path) 18 | logger.info(f"Reloaded SentencePiece model from {model_path}") 19 | 20 | # BOS / EOS token IDs 21 | self.n_words: int = self.sp_model.vocab_size() 22 | self.bos_id: int = self.sp_model.bos_id() 23 | self.eos_id: int = self.sp_model.eos_id() 24 | self.pad_id: int = self.sp_model.pad_id() 25 | logger.info( 26 | f"#words: {self.n_words} - BOS ID: {self.bos_id} - EOS ID: {self.eos_id}" 27 | ) 28 | assert self.sp_model.vocab_size() == self.sp_model.get_piece_size() 29 | 30 | def encode(self, s: str, bos: bool, eos: bool) -> List[int]: 31 | assert type(s) is str 32 | t = self.sp_model.encode(s) 33 | if bos: 34 | t = [self.bos_id] + t 35 | if eos: 36 | t = t + [self.eos_id] 37 | return t 38 | 39 | def decode(self, t: List[int]) -> str: 40 | return self.sp_model.decode(t) 41 | -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/llama/utils.py: -------------------------------------------------------------------------------- 1 | import os 2 | import urllib 3 | import hashlib 4 | import warnings 5 | 6 | from tqdm import tqdm 7 | import torch 8 | 9 | 10 | def sample_top_p(probs, p): 11 | probs_sort, probs_idx = torch.sort(probs, dim=-1, descending=True) 12 | probs_sum = torch.cumsum(probs_sort, dim=-1) 13 | mask = probs_sum - probs_sort > p 14 | probs_sort[mask] = 0.0 15 | probs_sort.div_(probs_sort.sum(dim=-1, keepdim=True)) 16 | next_token = torch.multinomial(probs_sort, num_samples=1) 17 | next_token = torch.gather(probs_idx, -1, next_token) 18 | return next_token 19 | 20 | 21 | def format_prompt(instruction, input=None): 22 | 23 | PROMPT_DICT = { 24 | "prompt_input": ( 25 | "Below is an instruction that describes a task, paired with an input that provides further context. " 26 | "Write a response that appropriately completes the request.\n\n" 27 | "### Instruction:\n{instruction}\n\n### Input:\n{input}\n\n### Response:" 28 | ), 29 | "prompt_no_input": ( 30 | "Below is an instruction that describes a task. 
" 31 | "Write a response that appropriately completes the request.\n\n" 32 | "### Instruction:\n{instruction}\n\n### Response:" 33 | ), 34 | } 35 | if input is None: 36 | return PROMPT_DICT['prompt_no_input'].format_map({'instruction': instruction}) 37 | else: 38 | return PROMPT_DICT["prompt_input"].format_map({'instruction': instruction, 'input': input}) 39 | 40 | 41 | def _download(url: str, root: str): 42 | os.makedirs(root, exist_ok=True) 43 | filename = os.path.basename(url) 44 | # assume the url is https://some/path/sha256_model.pth 45 | expected_sha256 = url.split("/")[-1].split('_')[0] 46 | # expected_sha256 = url.split("/")[-2] 47 | download_target = os.path.join(root, filename) 48 | 49 | if os.path.exists(download_target) and not os.path.isfile(download_target): 50 | raise RuntimeError(f"{download_target} exists and is not a regular file") 51 | 52 | if os.path.isfile(download_target): 53 | if hashlib.sha256(open(download_target, "rb").read()).hexdigest() == expected_sha256: 54 | return download_target 55 | else: 56 | warnings.warn(f"{download_target} exists, but the SHA256 checksum does not match; re-downloading the file") 57 | 58 | with urllib.request.urlopen(url) as source, open(download_target, "wb") as output: 59 | with tqdm(total=int(source.info().get("Content-Length")), ncols=80, unit='iB', unit_scale=True, unit_divisor=1024) as loop: 60 | while True: 61 | buffer = source.read(8192) 62 | if not buffer: 63 | break 64 | 65 | output.write(buffer) 66 | loop.update(len(buffer)) 67 | 68 | if hashlib.sha256(open(download_target, "rb").read()).hexdigest() != expected_sha256: 69 | raise RuntimeError("Model has been downloaded but the SHA256 checksum does not not match") 70 | 71 | return download_target 72 | -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/main_finetune.py: -------------------------------------------------------------------------------- 1 | import torch 2 | import torch.backends.cudnn as cudnn 3 | from torch.utils.tensorboard import SummaryWriter 4 | from torch.utils.data import Dataset 5 | 6 | import util.misc as misc 7 | from util.misc import NativeScalerWithGradNormCount as NativeScaler 8 | from llama.llama_adapter import LLaMA_adapter 9 | 10 | from data.dataset import FinetuneDataset, transform_train 11 | 12 | import argparse 13 | import datetime 14 | import json 15 | import numpy as np 16 | import os 17 | import time 18 | from pathlib import Path 19 | 20 | from engine_finetune import train_one_epoch 21 | 22 | 23 | def get_args_parser(): 24 | parser = argparse.ArgumentParser('llama_adapterV2 pre-training', add_help=False) 25 | parser.add_argument('--batch_size', default=64, type=int, 26 | help='Batch size per GPU (effective batch size is batch_size * accum_iter * # gpus') 27 | parser.add_argument('--epochs', default=400, type=int) 28 | parser.add_argument('--accum_iter', default=1, type=int, 29 | help='Accumulate gradient iterations (for increasing the effective batch size under memory constraints)') 30 | 31 | # Model parameters 32 | parser.add_argument('--llama_type', default='7B', type=str, 33 | help='Type of LLaMA model') # 34 | parser.add_argument('--llama_path', default='/path/to/llama', type=str, 35 | help='path to LLaMA pretrained checkpoint') 36 | parser.add_argument('--pretrained_path', default='/path/to/pretrained', type=str, 37 | help='path to checkpoint from pretrain stage') 38 | parser.add_argument('--max_words', default=512, type=int, 39 | help='max number of input words') 40 | 
41 | # Optimizer parameters 42 | parser.add_argument('--weight_decay', type=float, default=0.05, 43 | help='weight decay (default: 0.05)') 44 | 45 | parser.add_argument('--lr', type=float, default=None, metavar='LR', 46 | help='learning rate (absolute lr)') 47 | parser.add_argument('--blr', type=float, default=1e-3, metavar='LR', 48 | help='base learning rate: absolute_lr = base_lr * total_batch_size / 256') 49 | parser.add_argument('--min_lr', type=float, default=0., metavar='LR', 50 | help='lower lr bound for cyclic schedulers that hit 0') 51 | 52 | parser.add_argument('--warmup_epochs', type=int, default=40, metavar='N', 53 | help='epochs to warmup LR') 54 | 55 | # Dataset parameters 56 | parser.add_argument('--data_config', default='configs/data/finetune/EN.yaml', type=str, 57 | help='dataset config path') 58 | parser.add_argument('--num_workers', default=10, type=int) 59 | parser.add_argument('--pin_mem', action='store_true', 60 | help='Pin CPU memory in DataLoader for more efficient (sometimes) transfer to GPU.') 61 | parser.add_argument('--no_pin_mem', action='store_false', dest='pin_mem') 62 | parser.set_defaults(pin_mem=True) 63 | 64 | 65 | parser.add_argument('--output_dir', default='./output', 66 | help='path where to save, empty for no saving') 67 | parser.add_argument('--log_dir', default='./output', 68 | help='path where to tensorboard log') 69 | parser.add_argument('--device', default='cuda', 70 | help='device to use for training / testing') 71 | parser.add_argument('--seed', default=0, type=int) 72 | 73 | 74 | parser.add_argument('--start_epoch', default=0, type=int, metavar='N', 75 | help='start epoch') 76 | 77 | # distributed training parameters 78 | parser.add_argument('--world_size', default=1, type=int, 79 | help='number of distributed processes') 80 | parser.add_argument('--local_rank', default=-1, type=int) 81 | parser.add_argument('--dist_on_itp', action='store_true') 82 | parser.add_argument('--dist_url', default='env://', 83 | help='url used to set up distributed training') 84 | 85 | return parser 86 | 87 | 88 | def main(args): 89 | misc.init_distributed_mode(args) 90 | 91 | print('job dir: {}'.format(os.path.dirname(os.path.realpath(__file__)))) 92 | print("{}".format(args).replace(', ', ',\n')) 93 | 94 | device = torch.device(args.device) 95 | 96 | # fix the seed for reproducibility 97 | seed = args.seed + misc.get_rank() 98 | torch.manual_seed(seed) 99 | np.random.seed(seed) 100 | cudnn.benchmark = True 101 | 102 | # define the model 103 | llama_type = args.llama_type 104 | llama_ckpt_dir = os.path.join(args.llama_path, llama_type) 105 | llama_tokenzier_path = os.path.join(args.llama_path, 'tokenizer.model') 106 | model = LLaMA_adapter(llama_ckpt_dir, llama_tokenzier_path) 107 | 108 | model.to(device) 109 | 110 | model_without_ddp = model 111 | print("Model = %s" % str(model_without_ddp)) 112 | 113 | print("Trainable Params:") 114 | print([(key, val.shape) for key, val in model.named_parameters() if val.requires_grad]) 115 | 116 | if args.distributed: 117 | model = torch.nn.parallel.DistributedDataParallel(model, device_ids=[args.gpu], find_unused_parameters=True) 118 | model_without_ddp = model.module 119 | 120 | # training detail 121 | eff_batch_size = args.batch_size * args.accum_iter * misc.get_world_size() 122 | 123 | if args.lr is None: # only base_lr is specified 124 | args.lr = args.blr * eff_batch_size / 256 125 | 126 | print("base lr: %.2e" % (args.lr * 256 / eff_batch_size)) 127 | print("actual lr: %.2e" % args.lr) 128 | 129 | print("accumulate grad 
iterations: %d" % args.accum_iter) 130 | print("effective batch size: %d" % eff_batch_size) 131 | 132 | # following timm: set wd as 0 for bias and norm layers 133 | param_groups = misc.add_weight_decay(model_without_ddp, args.weight_decay) 134 | optimizer = torch.optim.AdamW(param_groups, lr=args.lr, betas=(0.9, 0.95)) 135 | print(optimizer) 136 | loss_scaler = NativeScaler() 137 | 138 | misc.load_model(model_without_ddp, args.pretrained_path) 139 | 140 | 141 | dataset_train = FinetuneDataset(args.data_config, transform=transform_train, 142 | max_words=args.max_words, tokenizer_path=llama_tokenzier_path) 143 | print(dataset_train) 144 | num_tasks = misc.get_world_size() 145 | global_rank = misc.get_rank() 146 | sampler_train = torch.utils.data.DistributedSampler( 147 | dataset_train, num_replicas=num_tasks, rank=global_rank, shuffle=True 148 | ) 149 | print("Sampler_train = %s" % str(sampler_train)) 150 | 151 | data_loader_train = torch.utils.data.DataLoader( 152 | dataset_train, sampler=sampler_train, 153 | batch_size=args.batch_size, 154 | num_workers=args.num_workers, 155 | pin_memory=args.pin_mem, 156 | drop_last=True, 157 | ) 158 | 159 | # SummaryWrite 160 | if global_rank == 0 and args.log_dir is not None: 161 | os.makedirs(args.log_dir, exist_ok=True) 162 | log_writer = SummaryWriter(log_dir=args.log_dir) 163 | else: 164 | log_writer = None 165 | 166 | 167 | print(f"Start training for {args.epochs} epochs") 168 | start_time = time.time() 169 | for epoch in range(args.start_epoch, args.epochs): 170 | if args.distributed: 171 | data_loader_train.sampler.set_epoch(epoch) 172 | 173 | train_stats = train_one_epoch( 174 | model, data_loader_train, 175 | optimizer, device, epoch, loss_scaler, 176 | log_writer=log_writer, 177 | args=args 178 | ) 179 | 180 | if args.output_dir and (epoch % 5 == 0 or epoch + 1 == args.epochs): 181 | misc.save_model( 182 | args=args, model=model, model_without_ddp=model_without_ddp, optimizer=optimizer, 183 | loss_scaler=loss_scaler, epoch=epoch) 184 | 185 | log_stats = {**{f'train_{k}': v for k, v in train_stats.items()}, 186 | 'epoch': epoch, 187 | **{f'val_{k}': v for k, v in train_stats.items()}} 188 | 189 | if args.output_dir and misc.is_main_process(): 190 | if log_writer is not None: 191 | log_writer.flush() 192 | with open(os.path.join(args.output_dir, "log.txt"), mode="a", encoding="utf-8") as f: 193 | f.write(json.dumps(log_stats) + "\n") 194 | 195 | total_time = time.time() - start_time 196 | total_time_str = str(datetime.timedelta(seconds=int(total_time))) 197 | print('Training time {}'.format(total_time_str)) 198 | 199 | 200 | if __name__ == '__main__': 201 | args = get_args_parser() 202 | args = args.parse_args() 203 | if args.output_dir: 204 | Path(args.output_dir).mkdir(parents=True, exist_ok=True) 205 | main(args) 206 | -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/main_pretrain.py: -------------------------------------------------------------------------------- 1 | import torch 2 | import torch.backends.cudnn as cudnn 3 | from torch.utils.tensorboard import SummaryWriter 4 | from torch.utils.data import Dataset 5 | 6 | import util.misc as misc 7 | from util.misc import NativeScalerWithGradNormCount as NativeScaler 8 | from llama.llama_adapter import LLaMA_adapter 9 | 10 | from data.dataset import PretrainDataset, transform_train 11 | 12 | import argparse 13 | import datetime 14 | import json 15 | import numpy as np 16 | import os 17 | import time 18 | from pathlib 
import Path 19 | 20 | from engine_pretrain import train_one_epoch 21 | 22 | 23 | def get_args_parser(): 24 | parser = argparse.ArgumentParser('llama_adapterV2 pre-training', add_help=False) 25 | parser.add_argument('--batch_size', default=64, type=int, 26 | help='Batch size per GPU (effective batch size is batch_size * accum_iter * # gpus') 27 | parser.add_argument('--epochs', default=400, type=int) 28 | parser.add_argument('--accum_iter', default=1, type=int, 29 | help='Accumulate gradient iterations (for increasing the effective batch size under memory constraints)') 30 | 31 | # Model parameters 32 | parser.add_argument('--llama_type', default='7B', type=str, 33 | help='Type of LLaMA model') # 34 | parser.add_argument('--llama_path', default='/path/to/llama', type=str, 35 | help='path to LLaMA pretrained checkpoint') 36 | parser.add_argument('--max_words', default=96, type=int, 37 | help='max number of input words') 38 | 39 | # Optimizer parameters 40 | parser.add_argument('--weight_decay', type=float, default=0.05, 41 | help='weight decay (default: 0.05)') 42 | 43 | parser.add_argument('--lr', type=float, default=None, metavar='LR', 44 | help='learning rate (absolute lr)') 45 | parser.add_argument('--blr', type=float, default=1e-3, metavar='LR', 46 | help='base learning rate: absolute_lr = base_lr * total_batch_size / 256') 47 | parser.add_argument('--min_lr', type=float, default=0., metavar='LR', 48 | help='lower lr bound for cyclic schedulers that hit 0') 49 | 50 | parser.add_argument('--warmup_epochs', type=int, default=40, metavar='N', 51 | help='epochs to warmup LR') 52 | 53 | # Dataset parameters 54 | parser.add_argument('--data_config', default='configs/data/pretrain/EN.yaml', type=str, 55 | help='dataset config path') 56 | parser.add_argument('--num_workers', default=10, type=int) 57 | parser.add_argument('--pin_mem', action='store_true', 58 | help='Pin CPU memory in DataLoader for more efficient (sometimes) transfer to GPU.') 59 | parser.add_argument('--no_pin_mem', action='store_false', dest='pin_mem') 60 | parser.set_defaults(pin_mem=True) 61 | 62 | 63 | parser.add_argument('--output_dir', default='./output', 64 | help='path where to save, empty for no saving') 65 | parser.add_argument('--log_dir', default='./output', 66 | help='path where to tensorboard log') 67 | parser.add_argument('--device', default='cuda', 68 | help='device to use for training / testing') 69 | parser.add_argument('--seed', default=0, type=int) 70 | 71 | parser.add_argument('--start_epoch', default=0, type=int, metavar='N', 72 | help='start epoch') 73 | 74 | # distributed training parameters 75 | parser.add_argument('--world_size', default=1, type=int, 76 | help='number of distributed processes') 77 | parser.add_argument('--local_rank', default=-1, type=int) 78 | parser.add_argument('--dist_on_itp', action='store_true') 79 | parser.add_argument('--dist_url', default='env://', 80 | help='url used to set up distributed training') 81 | 82 | parser.add_argument('--split_epoch', type=int, default=50) 83 | 84 | return parser 85 | 86 | 87 | def main(args): 88 | misc.init_distributed_mode(args) 89 | 90 | print('job dir: {}'.format(os.path.dirname(os.path.realpath(__file__)))) 91 | print("{}".format(args).replace(', ', ',\n')) 92 | 93 | device = torch.device(args.device) 94 | 95 | # fix the seed for reproducibility 96 | seed = args.seed + misc.get_rank() 97 | torch.manual_seed(seed) 98 | np.random.seed(seed) 99 | cudnn.benchmark = True 100 | 101 | # define the model 102 | llama_type = args.llama_type 103 | 
llama_ckpt_dir = os.path.join(args.llama_path, llama_type) 104 | llama_tokenzier_path = os.path.join(args.llama_path, 'tokenizer.model') 105 | model = LLaMA_adapter(llama_ckpt_dir, llama_tokenzier_path, phase="pretrain") 106 | 107 | model.to(device) 108 | 109 | model_without_ddp = model 110 | print("Model = %s" % str(model_without_ddp)) 111 | 112 | print("Trainable Params:") 113 | print([(key, val.shape) for key, val in model.named_parameters() if val.requires_grad]) 114 | 115 | if args.distributed: 116 | model = torch.nn.parallel.DistributedDataParallel(model, device_ids=[args.gpu], find_unused_parameters=True) 117 | model_without_ddp = model.module 118 | 119 | # training detail 120 | eff_batch_size = args.batch_size * args.accum_iter * misc.get_world_size() 121 | 122 | if args.lr is None: # only base_lr is specified 123 | args.lr = args.blr * eff_batch_size / 256 124 | 125 | print("base lr: %.2e" % (args.lr * 256 / eff_batch_size)) 126 | print("actual lr: %.2e" % args.lr) 127 | 128 | print("accumulate grad iterations: %d" % args.accum_iter) 129 | print("effective batch size: %d" % eff_batch_size) 130 | 131 | # following timm: set wd as 0 for bias and norm layers 132 | param_groups = misc.add_weight_decay(model_without_ddp, args.weight_decay) 133 | optimizer = torch.optim.AdamW(param_groups, lr=args.lr, betas=(0.9, 0.95)) 134 | print(optimizer) 135 | loss_scaler = NativeScaler() 136 | 137 | 138 | 139 | dataset_train = PretrainDataset(args.data_config, transform=transform_train, 140 | max_words=args.max_words, tokenizer_path=llama_tokenzier_path) 141 | print(dataset_train) 142 | num_tasks = misc.get_world_size() 143 | global_rank = misc.get_rank() 144 | sampler_train = misc.DistributedSubEpochSampler( 145 | dataset_train, num_replicas=num_tasks, rank=global_rank, split_epoch=args.split_epoch, shuffle=True 146 | ) 147 | print("Sampler_train = %s" % str(sampler_train)) 148 | 149 | data_loader_train = torch.utils.data.DataLoader( 150 | dataset_train, sampler=sampler_train, 151 | batch_size=args.batch_size, 152 | num_workers=args.num_workers, 153 | pin_memory=args.pin_mem, 154 | drop_last=True, 155 | ) 156 | 157 | # SummaryWrite 158 | if global_rank == 0 and args.log_dir is not None: 159 | os.makedirs(args.log_dir, exist_ok=True) 160 | log_writer = SummaryWriter(log_dir=args.log_dir) 161 | else: 162 | log_writer = None 163 | 164 | 165 | print(f"Start training for {args.epochs} epochs") 166 | start_time = time.time() 167 | for epoch in range(args.start_epoch, args.epochs): 168 | if args.distributed: 169 | data_loader_train.sampler.set_epoch(epoch) 170 | 171 | train_stats = train_one_epoch( 172 | model, data_loader_train, 173 | optimizer, device, epoch, loss_scaler, 174 | log_writer=log_writer, 175 | args=args 176 | ) 177 | 178 | if args.output_dir and (epoch % 2 == 0 or epoch + 1 == args.epochs): 179 | misc.save_model( 180 | args=args, model=model, model_without_ddp=model_without_ddp, optimizer=optimizer, 181 | loss_scaler=loss_scaler, epoch=epoch) 182 | 183 | log_stats = {**{f'train_{k}': v for k, v in train_stats.items()}, 184 | 'epoch': epoch} 185 | 186 | if args.output_dir and misc.is_main_process(): 187 | if log_writer is not None: 188 | log_writer.flush() 189 | with open(os.path.join(args.output_dir, "log.txt"), mode="a", encoding="utf-8") as f: 190 | f.write(json.dumps(log_stats) + "\n") 191 | 192 | total_time = time.time() - start_time 193 | total_time_str = str(datetime.timedelta(seconds=int(total_time))) 194 | print('Training time {}'.format(total_time_str)) 195 | 196 | 197 | if 
__name__ == '__main__': 198 | args = get_args_parser() 199 | args = args.parse_args() 200 | if args.output_dir: 201 | Path(args.output_dir).mkdir(parents=True, exist_ok=True) 202 | main(args) 203 | -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/requirements.txt: -------------------------------------------------------------------------------- 1 | --extra-index-url https://download.pytorch.org/whl/cu117 2 | torch==2.0.0+cu117 3 | torchvision==0.15.1+cu117 4 | tensorboard 5 | fairscale 6 | sentencepiece 7 | Pillow 8 | opencv-python 9 | gradio 10 | tqdm 11 | tenacity 12 | openai 13 | git+https://github.com/csuhan/timm_0_3_2.git 14 | git+https://github.com/openai/CLIP.git -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/util/evaluate_mme.py: -------------------------------------------------------------------------------- 1 | import os 2 | import glob 3 | import argparse 4 | from tqdm import tqdm 5 | import PIL 6 | from PIL import Image 7 | import torch 8 | import torch.distributed as dist 9 | from torch.utils.data import Dataset 10 | import cv2 11 | from llama.llama_adapter import LLaMA_adapter 12 | 13 | DATA_DIR = "./MME_Benchmark_release_version" 14 | 15 | def get_image(image): 16 | if type(image) is str: 17 | try: 18 | return Image.open(image).convert("RGB") 19 | except Exception as e: 20 | print(f"Fail to read image: {image}") 21 | exit(-1) 22 | elif type(image) is Image.Image: 23 | return image 24 | elif type(image) is PIL.JpegImagePlugin.JpegImageFile: 25 | return image 26 | elif type(image) is PIL.PngImagePlugin.PngImageFile: 27 | return image 28 | elif type(image) is PIL.MpoImagePlugin.MpoImageFile: 29 | return image 30 | else: 31 | raise NotImplementedError(f"Invalid type of Image: {type(image)}") 32 | 33 | 34 | class MMEDataset(Dataset): 35 | def __init__( 36 | self, 37 | dataset_name 38 | ): 39 | self.dataset_name = dataset_name 40 | self.dataset = [] 41 | jpg_sets = ["artwork", "celebrity", "color", "count", "existence", "landmark", "OCR", "position", "posters", "scene"] 42 | png_sets = ["code_reasoning", "commonsense_reasoning", "numerical_calculation", "text_translation"] 43 | image_suffix = '.jpg' if dataset_name in jpg_sets else ".png" 44 | 45 | assert (dataset_name in jpg_sets) or (dataset_name in png_sets), f"Invalid dataset name for MME benchmark: {dataset_name}" 46 | 47 | if os.path.exists(f"{DATA_DIR}/{dataset_name}/images") and os.path.exists(f"{DATA_DIR}/{dataset_name}/questions_answers_YN"): 48 | question_files = os.listdir(f"{DATA_DIR}/{dataset_name}/questions_answers_YN") 49 | for question_file in question_files: 50 | image_file_name = os.path.join(DATA_DIR, dataset_name, "images", question_file.replace('.txt', image_suffix)) 51 | with open(os.path.join(DATA_DIR, dataset_name, "questions_answers_YN", question_file), 'r', encoding='utf-8') as f: 52 | for line in f.readlines(): 53 | try: 54 | question, gt_answer = line.replace('\n', '').split('\t') 55 | self.dataset.append({ 56 | "image_path": image_file_name, 57 | "gt_answers": gt_answer, 58 | "question": question 59 | }) 60 | except: 61 | pass 62 | 63 | else: 64 | question_files = glob.glob(f"{DATA_DIR}/{dataset_name}/*.txt") 65 | for question_file in question_files: 66 | image_file_name = question_file.replace(".txt", image_suffix) 67 | with open(question_file, 'r', encoding='utf-8') as f: 68 | for line in f.readlines(): 69 | try: 70 | question, gt_answer = 
line.replace('\n', '').split('\t') 71 | self.dataset.append({ 72 | "image_path": image_file_name, 73 | "gt_answers": gt_answer, 74 | "question": question 75 | }) 76 | except: 77 | pass 78 | 79 | def __len__(self): 80 | return len(self.dataset) 81 | 82 | def __getitem__(self, idx): 83 | return self.dataset[idx] 84 | 85 | 86 | def get_args_parser(): 87 | parser = argparse.ArgumentParser('Single-turn (conversation) demo', add_help=False) 88 | # Model parameters 89 | parser.add_argument('--llama_path', default='/path/to/llama', type=str, 90 | help='path to LLaMA pretrained checkpoint') 91 | parser.add_argument('--pretrained_path', default='/path/to/pretrained', type=str, 92 | help='directory containing pre-trained checkpoints') 93 | parser.add_argument('--lora', default=16, type=int) 94 | parser.add_argument('--output_path', default='/path/to/output_results', type=str) 95 | return parser 96 | 97 | 98 | if __name__ == "__main__": 99 | args = get_args_parser().parse_args() 100 | 101 | device = "cuda" if torch.cuda.is_available() else "cpu" 102 | 103 | llama_dir = args.llama_path 104 | llama_type = '7B' 105 | llama_ckpt_dir = os.path.join(llama_dir, llama_type) 106 | llama_tokenzier_path = os.path.join(llama_dir, 'tokenizer.model') 107 | 108 | model_path = args.pretrained_path 109 | # load llama_adapter weights and model_cfg 110 | print(f'Loading LLaMA-Adapter from {model_path}') 111 | ckpt = torch.load(model_path, map_location='cpu') 112 | 113 | w_bias = True 114 | w_lora = args.lora > 0 115 | print('Lora:', w_lora) 116 | lora_rank = args.lora 117 | model = LLaMA_adapter( 118 | llama_ckpt_dir, llama_tokenzier_path, 119 | max_seq_len=512, max_batch_size=32, 120 | clip_model='ViT-L/14', 121 | v_embed_dim=768, v_depth=8, 122 | v_num_heads=16, v_mlp_ratio=4.0, 123 | query_len=10, query_layer=31, 124 | w_bias=w_bias, 125 | w_lora=w_lora, 126 | lora_rank=lora_rank, 127 | w_new_gate=w_lora, # for compatibility 128 | phase='finetune') 129 | 130 | load_result = model.load_state_dict(ckpt['model'], strict=False) 131 | print(load_result) 132 | 133 | model = model.to(device) 134 | model.half() 135 | model.eval() 136 | preprocess = model.clip_transform 137 | 138 | prompt_format = ( 139 | "Below is an instruction that describes a task. 
" 140 | "Write a response that appropriately completes the request using a single word or phrase.\n\n" 141 | "### Instruction:\n{instruction}\n\n### Response:" 142 | ) 143 | 144 | def multi_modal_generate( 145 | img_path: str, 146 | prompt: str, 147 | max_gen_len=30, 148 | temperature: float = 0, 149 | top_p: float = 0.75, 150 | ): 151 | img = Image.fromarray(cv2.imread(img_path)) 152 | img = preprocess(img).unsqueeze(0).half().to(device) 153 | prompt = prompt_format.format_map({'instruction': prompt}) 154 | 155 | result = model.generate(img, [prompt], 156 | max_gen_len=max_gen_len, 157 | temperature=temperature, 158 | top_p=top_p) 159 | return result[0] 160 | 161 | 162 | result = {} 163 | dataset_names = ["artwork", "celebrity", "color", "count", "existence", "OCR", "position", "posters", "scene", "code_reasoning", "commonsense_reasoning", "numerical_calculation", "text_translation", "landmark"] # landmark (03d5e3bfc958be38.jpg) 164 | answer_path = args.output_path 165 | batch_size = 1 166 | 167 | print("Starting...") 168 | for dataset_name in dataset_names: 169 | dataset = MMEDataset(dataset_name) 170 | 171 | predictions = [] 172 | with torch.no_grad(): 173 | for data in tqdm(dataset, desc=f"Inferencing {dataset_name}"): 174 | pred = multi_modal_generate(data['image_path'], data['question']) 175 | predictions.append({'image_path': data['image_path'], 'question': data['question'], 'answer': pred, 'gt_answers': data['gt_answers']}) 176 | 177 | os.makedirs(answer_path, exist_ok=True) 178 | prediction_file = os.path.join(answer_path, f"{dataset_name}.txt") 179 | out_datas = [ 180 | f"{data['image_path']}\t{data['question']}\t{data['gt_answers']}\t{data['answer']}" 181 | for data in predictions 182 | ] 183 | with open(prediction_file, 'w') as f: 184 | f.write('\n'.join(out_datas)) -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/util/extract_adapter_from_checkpoint.py: -------------------------------------------------------------------------------- 1 | import torch 2 | 3 | def save(full_model, path, model_type = 'BIAS'): 4 | if model_type == 'BIAS': 5 | keys = [ 6 | f'visual_blocks.{i}.{key}.{suffix}' 7 | for i in range(8) 8 | for key in ['norm1', 'attn.qkv', 'attn.proj', 'norm2', 'mlp.fc1', 'mlp.fc2'] 9 | for suffix in ['weight', 'bias'] 10 | ] + [ 11 | f'llama.layers.{i}.{key}' 12 | for i in range(32) 13 | for key in ['attention.gate', 'attention.wq.bias', 'attention.wo.bias', 'feed_forward.w1.bias', 'feed_forward.w2.bias', 'feed_forward.w3.bias', 'attention_norm.weight', 'ffn_norm.weight'] 14 | ] + [ 15 | f'{base_key}.{suffix}' 16 | for base_key in ['clip_proj_norm', 'visual_proj_norm', 'visual_proj', 'clip_proj'] 17 | for suffix in ['weight', 'bias'] 18 | ] + ['llama.norm.weight', 'visual_query.weight', 'adapter_query.weight'] 19 | 20 | 21 | elif model_type == 'LORA': 22 | keys = [ 23 | f'visual_blocks.{i}.{key}.{suffix}' 24 | for i in range(8) 25 | for key in [f'norm{j}' for j in range(1, 3)] + ['attn.qkv', 'attn.proj', 'mlp.fc1', 'mlp.fc2'] 26 | for suffix in ['weight', 'bias'] 27 | ] + [ 28 | f'llama.layers.{i}.{key}' 29 | for i in range(32) 30 | for key in ['attention.gate', 'attention.wq.bias', 'attention.wo.bias', 'feed_forward.w1.bias', 'feed_forward.w2.bias', 'feed_forward.w3.bias', 'attention_norm.weight', 'ffn_norm.weight'] 31 | + [f'attention.lora_wk_l{j}.weight' for j in range(1, 3)] 32 | + [f'attention.lora_wo_l{j}.weight' for j in range(1, 3)] 33 | + [f'feed_forward.lora_w{k}_l{j}.weight' for k in 
range(1, 4) for j in range(1, 3)] 34 | + [f'attention.lora_wq_l{j}.weight' for j in range(1, 3)] 35 | + [f'attention.lora_wv_l{j}.weight' for j in range(1, 3)] 36 | + ['attention.new_gate'] 37 | ] + [ 38 | f'{base_key}.{suffix}' 39 | for base_key in ['clip_proj_norm', 'visual_proj_norm', 'visual_proj', 'clip_proj'] 40 | for suffix in ['weight', 'bias'] 41 | ] + ['llama.norm.weight', 'visual_query.weight', 'adapter_query.weight'] 42 | 43 | ## TODO: Add other model types 44 | 45 | full_model_state_dict = full_model.state_dict() 46 | small_weights = {key: full_model_state_dict[key] for key in keys} 47 | if model_type == 'BIAS': 48 | wrapped_small_weights = {'model': small_weights,'config': {'w_bias': True, 'w_lora': False, 'lora_rank': 16}} 49 | elif model_type == 'LORA': 50 | wrapped_small_weights = {'model': small_weights,'config': {'w_bias': True, 'w_lora': True, 'lora_rank': 16}} 51 | # Save the wrapped small weights 52 | torch.save(wrapped_small_weights, path) -------------------------------------------------------------------------------- /challenge/llama_adapter_v2_multimodal7b/util/lr_sched.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Meta Platforms, Inc. and affiliates. 2 | # All rights reserved. 3 | 4 | # This source code is licensed under the license found in the 5 | # LICENSE file in the root directory of this source tree. 6 | 7 | import math 8 | 9 | def adjust_learning_rate(optimizer, epoch, args): 10 | """Decay the learning rate with half-cycle cosine after warmup""" 11 | if epoch < args.warmup_epochs: 12 | lr = args.lr * epoch / args.warmup_epochs 13 | else: 14 | lr = args.min_lr + (args.lr - args.min_lr) * 0.5 * \ 15 | (1. + math.cos(math.pi * (epoch - args.warmup_epochs) / (args.epochs - args.warmup_epochs))) 16 | for param_group in optimizer.param_groups: 17 | if "lr_scale" in param_group: 18 | param_group["lr"] = lr * param_group["lr_scale"] 19 | else: 20 | param_group["lr"] = lr 21 | return lr 22 | -------------------------------------------------------------------------------- /challenge/prepare_submission.py: -------------------------------------------------------------------------------- 1 | import json 2 | 3 | # Please fill in your team information here 4 | method = "" # -- name of the method 5 | team = "" # -- name of the team, !!!identical to the Google Form!!! 6 | authors = [""] # -- list of str, authors 7 | email = "" # -- e-mail address 8 | institution = "" # -- institution or company 9 | country = "" # -- country or region 10 | 11 | 12 | def main(): 13 | with open('output.json', 'r') as file: 14 | output_res = json.load(file) 15 | 16 | submission_content = { 17 | "method": method, 18 | "team": team, 19 | "authors": authors, 20 | "email": email, 21 | "institution": institution, 22 | "country": country, 23 | "results": output_res 24 | } 25 | 26 | with open('submission.json', 'w') as file: 27 | json.dump(submission_content, file, indent=4) 28 | 29 | if __name__ == "__main__": 30 | main() 31 | -------------------------------------------------------------------------------- /docs/data_details.md: -------------------------------------------------------------------------------- 1 | ## Features of the DriveLM-Data 2 | 3 | - 🛣 Completeness in functionality (covering **Perception**, **Prediction**, and **Planning** QA pairs). 4 | 5 | 6 |
9 | 10 | 11 | - 🔜 Reasoning for future events that have not yet happened. 12 | - Many **"What If"**-style questions: imagine the future by language. 13 | 14 | 15 |
18 | 19 | - ♻ Task-driven decomposition. 20 | - **One** scene-level description into **many** frame-level trajectories & planning QA pairs. 21 | 22 |
25 | 26 | ## How about the annotation process? 27 | 28 | The annotation process is different for DriveLM-nuScenes and DriveLM-CARLA. 29 | 30 |
33 | 34 | **For DriveLM-nuScenes**, we divide the annotation process into three steps: 35 | 36 | 1️⃣ Keyframe selection. Given all frames in one clip, the annotator selects the keyframes that need annotation. The criterion is that those frames should involve changes in ego-vehicle movement status (lane changes, sudden stops, start after a stop, etc.). 37 | 38 | 2️⃣ Key objects selection. Given keyframes, the annotator needs to pick up key objects in the six surrounding images. The criterion is that those objects should be able to affect the action of the ego vehicle (traffic signals, pedestrians crossing the road, other vehicles that move in the direction of the ego vehicle, etc.). 39 | 40 | 3️⃣ Question and answer annotation. Given those key objects, we automatically generate questions regarding single or multiple objects about perception, prediction, and planning. More details can be found in our data. 41 | 42 | **For DriveLM-CARLA**, we employ an automated annotation approach: 43 | 44 | We collect data using CARLA 0.9.14 in the Leaderboard 2.0 framework with a privileged rule-based expert. We set up a series of routes in urban, residential, and rural areas and execute the expert on these routes. During this process, we collect the necessary sensor data, generate relevant QAs based on privileged information about objects and the scene, and organize the logical relationships to connect this series of QAs into a graph. 45 | -------------------------------------------------------------------------------- /docs/data_prep_nus.md: -------------------------------------------------------------------------------- 1 | ## Download data 2 | We kindly hope you to fill out the [form](https://docs.google.com/forms/d/e/1FAIpQLSeX6CR3u-15IV-TKx2uPv1wiKjydjZ__NNW98H4nR5JZtQa2Q/viewform) before downloading. To get started, download nuScenes subset image data and DriveLM-nuScenes QA json files below. For v1.1 data, please visit the [DriveLM/challenge](https://github.com/OpenDriveLab/DriveLM/tree/main/challenge) folder. 3 | 4 | 7 | 8 | | nuScenes subset images | DriveLM-nuScenes version-1.0| 9 | |-------|-------| 10 | | [Google Drive](https://drive.google.com/file/d/1DeosPGYeM2gXSChjMODGsQChZyYDmaUz/view?usp=sharing) | [Google Drive](https://drive.google.com/file/d/1LK7pYHytv64neN1626u6eTQBy1Uf4IQH/view?usp=sharing) | 11 | |[Baidu Netdisk](https://pan.baidu.com/s/11xvxPzUY5xTIsJQrYFogqg?pwd=mk95)|[Baidu Netdisk](https://pan.baidu.com/s/1PAdotDY0MN3nkz8w_XhDsw?pwd=l4wf) | 12 | |[HuggingFace](https://huggingface.co/datasets/OpenDriveLab/DriveLM/blob/main/drivelm_nus_imgs_train.zip)|[HuggingFace](https://huggingface.co/datasets/OpenDriveLab/DriveLM/blob/main/v1_0_train_nus.json) 13 | 14 | You can also download the full nuScenes dataset [HERE](https://www.nuscenes.org/download) to enable video input. 15 | 16 | Our DriveLM dataset contains a collection of questions and answers. Currently, only the training set is publicly available. The dataset is named `v1_0_train_nus.json`. 17 | 18 | 19 | 20 | 21 | ## Prepare the dataset 22 | 23 | Organize the data structure as follows: 24 | 25 | ``` 26 | DriveLM 27 | ├── data/ 28 | │ ├── QA_dataset_nus/ 29 | │ │ ├── v1_0_train_nus.json 30 | │ ├── nuscenes/ 31 | │ │ ├── samples/ 32 | ``` 33 | 34 | 35 | #### File structure 36 | 37 | The QA pairs are in the `v1_0_train_nus.json`. Below is the json file structure. 
All `coordinates` mentioned are referenced from the `upper-left` corner of the respective camera, with the `right` and `bottom` directions serving as the positive x and y axes, respectively. 38 | ``` 39 | v1_0_train_nus.json 40 | ├── scene_token:{ 41 | │ ├── "scene_description": "The ego vehicle proceeds along the current road, preparing to enter the main road after a series of consecutive right turns.", 42 | │ ├── "key_frames":{ 43 | │ │ ├── "frame_token_1":{ 44 | │ │ │ ├── "key_object_infos":{"": {"Category": "Vehicle", "Status": "Moving", "Visual_description": "White Sedan", "2d_bbox": [x_min, y_min, x_max, y_max]}, ...}, 45 | │ │ │ ├── "QA":{ 46 | │ │ │ │ ├── "perception":[ 47 | │ │ │ │ │ ├── {"Q": "What are the important objects in the current scene?", "A": "The important objects are , , ...", "C": None, "con_up": None, "con_down": None, "cluster": None, "layer": None}, 48 | │ │ │ │ │ ├── {"Q": "xxx", "A": "xxx", "C": None, "con_up": None, "con_down": None, "cluster": None, "layer": None}, ... 49 | │ │ │ │ ├── ], 50 | │ │ │ │ ├── "prediction":[ 51 | │ │ │ │ │ ├── {"Q": "What is the future state of ?", "A": "Slightly offset to the left in maneuvering.", "C": None, "con_up": None, "con_down": None, "cluster": None, "layer": None}, ... 52 | │ │ │ │ ├── ], 53 | │ │ │ │ ├── "planning":[ 54 | │ │ │ │ │ ├── {"Q": "In this scenario, what are safe actions to take for the ego vehicle?", "A": "Brake gently to a stop, turn right, turn left.", "C": None, "con_up": None, "con_down": None, "cluster": None, "layer": None}, ... 55 | │ │ │ │ ├── ], 56 | │ │ │ │ ├── "behavior":[ 57 | │ │ │ │ │ ├── {"Q": "Predict the behavior of the ego vehicle.", "A": "The ego vehicle is going straight. The ego vehicle is driving slowly.", "C": None, "con_up": None, "con_down": None, "cluster": None, "layer": None} 58 | │ │ │ │ ├── ] 59 | │ │ │ ├── }, 60 | │ │ │ ├── "image_paths":{ 61 | │ │ │ │ ├── "CAM_FRONT": "xxx", 62 | │ │ │ │ ├── "CAM_FRONT_LEFT": "xxx", 63 | │ │ │ │ ├── "CAM_FRONT_RIGHT": "xxx", 64 | │ │ │ │ ├── "CAM_BACK": "xxx", 65 | │ │ │ │ ├── "CAM_BACK_LEFT": "xxx", 66 | │ │ │ │ ├── "CAM_BACK_RIGHT": "xxx", 67 | │ │ │ ├── } 68 | │ │ ├── }, 69 | │ │ ├── "frame_token_2":{ 70 | │ │ │ ├── "key_object_infos":{"": {"Category": "Traffic element", "Status": "None", "Visual_description": "Stop sign", "2d_bbox": [x_min, y_min, x_max, y_max]}, ...}, 71 | │ │ │ ├── "QA":{ 72 | │ │ │ │ ├── "perception":[...], 73 | │ │ │ │ ├── "prediction":[...], 74 | │ │ │ │ ├── "planning":[...], 75 | │ │ │ │ ├── "behavior":[...] 76 | │ │ │ ├── }, 77 | │ │ │ ├── "image_paths":{...} 78 | │ │ ├── } 79 | │ ├── } 80 | ├── } 81 | ``` 82 | 83 | - `scene_token` is the same as in nuScenes dataset. 84 | - `scene_description` is a one-sentence summary of ego-vehicle behavior in the about 20-second video clip (the notion of a scene in nuScenes dataset). 85 | - Under `key_frames`, each key frame is identified by the `frame_token`, which corresponds to the `token` in the nuScenes dataset. 86 | - The `key_object_infos` is a mapping between `c tag` (i.e. \) and more information about the related key objects such as the category, the status, the visual description, and the 2d bounding box. 87 | - `QA` is divided into different tasks, and QA pairs under each task are formulated as a list of dictionaries. Each dictionary encompasses keys of `Q` (question), `A` (answer), `C` (context), `con_up`, `con_down`, `cluster`, and `layer`. 
Currently, the values of context related keys are set to None, serving as a tentative placeholder for future fields related to DriveLM-CARLA. 88 | 89 | 90 | **Note:** The `c tag` label is used to indicate key objects selected during the annotation process. These objects include not only those present in the ground truth but also objects that are not, such as landmarks and traffic lights. Each key frame contains a minimum of three and a maximum of six key objects. The organization format of the `c tag` is ``, where c is the identifier, CAM indicates the camera where the key object’s center point is situated, and x, y represent the horizontal and vertical coordinates of the 2D bounding box in the respective camera’s coordinate system with the `upper-left` corner as the `origin`, and the `right` and `bottom` as the `positive x and y axes`, respectively. 91 | 92 | In contrast to the `c tag`, for the question "Identify all the traffic elements in the front view," the output is presented as a list formatted as `[(c, s, x1, y1, x2, y2), ...]`. Here, `c` denotes the category, `s` represents the status, and `x1, y1, x2, y2` indicate the offsets of the top-left and bottom-right corners of the box relative to the center point. 93 | 94 | 95 |
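As an illustration of how these fields can be consumed, the sketch below walks the JSON hierarchy described above and splits a `c tag` into its identifier, camera, and pixel coordinates. This is a minimal example rather than part of the official toolkit: the file path is a placeholder for your local copy, the tag pattern assumes identifiers spelled like `c1`, `c2` in the `<c,CAM,x,y>` format documented here, and only the keys listed above are used.

```python
import json
import re

# Minimal sketch (not part of the official toolkit): walk the QA hierarchy of
# v1_0_train_nus.json and parse c tags such as <c1,CAM_FRONT,1075.5,382.8>.
# The path below is a placeholder; point it to your local copy of the file.
with open("data/QA_dataset_nus/v1_0_train_nus.json", "r") as f:
    data = json.load(f)

# <identifier, camera, x, y> -- the identifier spelling (c1, c2, ...) is an assumption
C_TAG = re.compile(r"<(c\d+),([A-Z_]+),([\d.]+),([\d.]+)>")

def parse_c_tag(tag):
    """Split a c tag string into (identifier, camera, x, y)."""
    m = C_TAG.fullmatch(tag)
    if m is None:
        raise ValueError(f"not a valid c tag: {tag}")
    identifier, camera, x, y = m.groups()
    return identifier, camera, float(x), float(y)

for scene_token, scene in data.items():
    for frame_token, frame in scene["key_frames"].items():
        # key_object_infos maps c tags to category, status, visual description and 2d bbox
        for tag, info in frame["key_object_infos"].items():
            identifier, camera, x, y = parse_c_tag(tag)
            print(identifier, camera, x, y, info["Category"], info["2d_bbox"])
        # QA pairs are grouped by task: perception, prediction, planning, behavior
        for task, qa_list in frame["QA"].items():
            for qa in qa_list:
                question, answer = qa["Q"], qa["A"]
```

Anything beyond the keys documented above (for example, the exact spelling of the identifiers in the released JSON) should be verified against `v1_0_train_nus.json` itself.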
96 | data 97 |
98 | 99 | -------------------------------------------------------------------------------- /docs/gvqa.md: -------------------------------------------------------------------------------- 1 | ### What is GVQA? 2 | The most exciting aspect of the dataset is that the questions and answers (`QA pairs`) are connected in a graph-style structure, with QA pairs as every node and potential logical progression as the edges. The reason for doing this in the AD domain is that AD tasks are well-defined per stage, from raw sensor input to final control action through perception, prediction and planning. 3 | 4 | Its key difference to prior VQA tasks for AD is the availability of logical dependencies between QAs, which can be used to guide the answering process. Below is a demo video illustrating the idea. 5 | 6 | https://github.com/OpenDriveLab/DriveLM/assets/54334254/988472a8-d7b9-4685-b4b8-7a0e77f68265 7 | -------------------------------------------------------------------------------- /environment.yml: -------------------------------------------------------------------------------- 1 | name: drivelm 2 | channels: 3 | - omgarcia 4 | - conda-forge 5 | - defaults 6 | dependencies: 7 | - _libgcc_mutex=0.1=main 8 | - _openmp_mutex=5.1=1_gnu 9 | - appdirs=1.4.4=pyhd3eb1b0_0 10 | - blas=1.0=mkl 11 | - brotlipy=0.7.0=py38h27cfd23_1003 12 | - ca-certificates=2023.7.22=hbcca054_0 13 | - certifi=2023.7.22=pyhd8ed1ab_0 14 | - cffi=1.15.1=py38h5eee18b_3 15 | - cryptography=41.0.2=py38h22a60cf_0 16 | - cudatoolkit=11.7.0=hd8887f6_10 17 | - gcc-6=6.1.0=2 18 | - gmp=6.1.0=1 19 | - idna=3.4=py38h06a4308_0 20 | - intel-openmp=2023.1.0=hdb19cb5_46305 21 | - isl=0.17.1=0 22 | - ld_impl_linux-64=2.38=h1181459_1 23 | - libffi=3.4.4=h6a678d5_0 24 | - libgcc-ng=11.2.0=h1234567_1 25 | - libgfortran-ng=11.2.0=h00389a5_1 26 | - libgfortran5=11.2.0=h1234567_1 27 | - libgomp=11.2.0=h1234567_1 28 | - libstdcxx-ng=11.2.0=h1234567_1 29 | - mkl=2023.1.0=h6d00ec8_46342 30 | - mkl-service=2.4.0=py38h5eee18b_1 31 | - mkl_fft=1.3.6=py38h417a72b_1 32 | - mkl_random=1.2.2=py38h417a72b_1 33 | - mpc=1.0.1=0 34 | - mpfr=3.1.2=0 35 | - ncurses=6.4=h6a678d5_0 36 | - openssl=3.0.10=h7f8727e_2 37 | - pip=23.2.1=py38h06a4308_0 38 | - pooch=1.4.0=pyhd3eb1b0_0 39 | - pycparser=2.21=pyhd3eb1b0_0 40 | - pyopenssl=23.2.0=py38h06a4308_0 41 | - pysocks=1.7.1=py38h06a4308_0 42 | - python=3.8.17=h955ad1f_0 43 | - readline=8.2=h5eee18b_0 44 | - sqlite=3.41.2=h5eee18b_0 45 | - tbb=2021.8.0=hdb19cb5_0 46 | - tk=8.6.12=h1ccaba5_0 47 | - wheel=0.38.4=py38h06a4308_0 48 | - xz=5.4.2=h5eee18b_0 49 | - zlib=1.2.13=h5eee18b_0 50 | - pip: 51 | - absl-py==1.4.0 52 | - accelerate==0.21.0 53 | - addict==2.4.0 54 | - aiohttp==3.8.5 55 | - aiosignal==1.3.1 56 | - aliyun-python-sdk-core==2.13.36 57 | - aliyun-python-sdk-kms==2.16.1 58 | - ansi2html==1.8.0 59 | - antlr4-python3-runtime==4.9.3 60 | - anyio==3.7.1 61 | - argon2-cffi==23.1.0 62 | - argon2-cffi-bindings==21.2.0 63 | - arrow==1.2.3 64 | - asttokens==2.2.1 65 | - async-lru==2.0.4 66 | - async-timeout==4.0.2 67 | - attrs==23.1.0 68 | - babel==2.12.1 69 | - backcall==0.2.0 70 | - beautifulsoup4==4.12.2 71 | - bert-score 72 | - bitsandbytes==0.41.1 73 | - black==23.7.0 74 | - bleach==6.0.0 75 | - cachetools==5.3.1 76 | - cchardet==2.1.7 77 | - chardet==5.2.0 78 | - charset-normalizer==3.2.0 79 | - click==8.1.6 80 | - cmake==3.27.0 81 | - colorama==0.4.6 82 | - colorlog==6.7.0 83 | - comm==0.1.4 84 | - configargparse==1.7 85 | - contourpy==1.1.0 86 | # - cosine-annealing-warmup # no need for torch lightning 87 | - 
crcmod==1.7 88 | - cycler==0.11.0 89 | - dash==2.13.0 90 | - dash-core-components==2.0.0 91 | - dash-html-components==2.0.0 92 | - dash-table==5.0.0 93 | - datasets==2.14.3 94 | - debugpy==1.6.7.post1 95 | - decorator==5.1.1 96 | - defusedxml==0.7.1 97 | - descartes==1.1.0 98 | - dill==0.3.7 99 | - docker-pycreds==0.4.0 100 | - evaluate==0.4.0 101 | - exceptiongroup==1.1.3 102 | - executing==1.2.0 103 | - fastjsonschema==2.18.0 104 | - filelock==3.12.2 105 | - fire==0.5.0 106 | - flake8==6.1.0 107 | - flask==2.2.5 108 | - fonttools==4.42.0 109 | - fqdn==1.5.1 110 | - frozenlist==1.4.0 111 | - fsspec==2023.6.0 112 | - gitdb==4.0.10 113 | - gitpython==3.1.32 114 | - google-auth 115 | - google-auth-oauthlib 116 | - grpcio==1.56.2 117 | - huggingface-hub==0.16.4 118 | - hydra-core==1.3.2 119 | - imageio==2.31.1 120 | - importlib-metadata==6.8.0 121 | - importlib-resources==6.0.0 122 | - iniconfig==2.0.0 123 | - inquirerpy==0.3.4 124 | - ipykernel==6.25.1 125 | - ipython==8.12.2 126 | - ipython-genutils==0.2.0 127 | - ipywidgets==8.1.0 128 | - isoduration==20.11.0 129 | - itsdangerous==2.1.2 130 | - jedi==0.19.0 131 | - jinja2==3.1.2 132 | - jmespath==0.10.0 133 | - joblib==1.3.1 134 | - json5==0.9.14 135 | - jsonpointer==2.4 136 | - jsonschema==4.19.0 137 | - jsonschema-specifications==2023.7.1 138 | - jupyter==1.0.0 139 | - jupyter-client==8.3.1 140 | - jupyter-console==6.6.3 141 | - jupyter-core==5.3.1 142 | - jupyter-events==0.7.0 143 | - jupyter-lsp==2.2.0 144 | - jupyter-server==2.7.2 145 | - jupyter-server-terminals==0.4.4 146 | - jupyterlab==4.0.5 147 | - jupyterlab-pygments==0.2.2 148 | - jupyterlab-server==2.24.0 149 | - jupyterlab-widgets==3.0.8 150 | - kiwisolver==1.4.4 151 | # - language-evaluation # should install separately 152 | - lazy-loader==0.3 153 | - lightning-utilities==0.9.0 154 | - line-profiler==4.0.3 155 | - lit==16.0.6 156 | - llvmlite==0.31.0 157 | - lyft-dataset-sdk==0.0.8 158 | - markdown==3.4.4 159 | - markdown-it-py==3.0.0 160 | - markupsafe==2.1.3 161 | - matplotlib==3.5.2 162 | - matplotlib-inline==0.1.6 163 | - mccabe==0.7.0 164 | - mdurl==0.1.2 165 | - mistune==2.0.5 166 | # - mmcv==1.4.0 # no need for loading drivelm, need for loading nuScenes 167 | # - mmdet==2.14.0 # no need for loading drivelm, need for loading nuScenes 168 | # - mmengine==0.8.4 # no need for loading drivelm, need for loading nuScenes 169 | # - mmsegmentation==0.14.1 # no need for loading drivelm, need for loading nuScenes 170 | - model-index==0.1.11 171 | - more-itertools==10.1.0 172 | - mpmath==1.3.0 173 | - multidict==6.0.4 174 | - multiprocess==0.70.15 175 | - mypy-extensions==1.0.0 176 | - nbclient==0.8.0 177 | - nbconvert==7.4.0 178 | - nbformat==5.5.0 179 | - nest-asyncio==1.5.7 180 | - networkx==2.2 181 | - nltk==3.8.1 182 | - notebook==7.0.2 183 | - notebook-shim==0.2.3 184 | - numba==0.48.0 185 | - numpy 186 | - nuscenes-devkit==1.1.10 187 | - nvidia-cublas-cu11==11.10.3.66 188 | - nvidia-cuda-cupti-cu11==11.7.101 189 | - nvidia-cuda-nvrtc-cu11==11.7.99 190 | - nvidia-cuda-runtime-cu11==11.7.99 191 | - nvidia-cudnn-cu11==8.5.0.96 192 | - nvidia-cufft-cu11==10.9.0.58 193 | - nvidia-curand-cu11==10.2.10.91 194 | - nvidia-cusolver-cu11==11.4.0.1 195 | - nvidia-cusparse-cu11==11.7.4.91 196 | - nvidia-nccl-cu11==2.14.3 197 | - nvidia-nvtx-cu11==11.7.91 198 | - oauthlib==3.2.2 199 | - omegaconf==2.3.0 200 | # - open3d # visualization packaage, no need for loading drivelm 201 | - opencv-python==4.8.0.74 202 | # - opendatalab==0.0.10 # data download tools, no need for loading drivelm 
203 | # - openmim==0.3.9 # mmlab package manager, no need for loading drivelm 204 | # - openxlab==0.0.22 # mmlab package, no need for loading drivelm 205 | - ordered-set==4.1.0 206 | - oss2==2.17.0 207 | - overrides==7.4.0 208 | - packaging==23.1 209 | - pandas==1.4.4 210 | - pandocfilters==1.5.0 211 | - parso==0.8.3 212 | - pathspec==0.11.2 213 | - pathtools==0.1.2 214 | - peft==0.4.0 215 | - pexpect==4.8.0 216 | - pfzy==0.3.4 217 | - pickleshare==0.7.5 218 | - pillow==10.0.0 219 | - pkgutil-resolve-name==1.3.10 220 | - platformdirs==3.10.0 221 | - plotly==5.16.1 222 | - pluggy==1.3.0 223 | - plyfile==1.0.1 224 | - prettytable==3.8.0 225 | - prometheus-client==0.17.1 226 | - prompt-toolkit==3.0.39 227 | - protobuf==4.23.4 228 | - psutil==5.9.5 229 | - ptyprocess==0.7.0 230 | - pure-eval==0.2.2 231 | - pyarrow==12.0.1 232 | - pyasn1==0.5.0 233 | - pyasn1-modules==0.3.0 234 | - pycocotools==2.0.7 235 | - pycodestyle==2.11.0 236 | - pycryptodome==3.18.0 237 | - pydeprecate==0.3.2 238 | - pyflakes==3.1.0 239 | - pygments==2.16.1 240 | - pyparsing==3.0.9 241 | - pyquaternion==0.9.9 242 | - pytest==7.4.0 243 | - python-dateutil==2.8.2 244 | - python-json-logger==2.0.7 245 | - pytorch-lightning==1.7.0 246 | - pytz==2023.3 247 | - pywavelets==1.4.1 248 | - pyyaml==6.0.1 249 | - pyzmq==25.1.1 250 | - qtconsole==5.4.3 251 | - qtpy==2.4.0 252 | - referencing==0.30.2 253 | - regex==2023.6.3 254 | - requests 255 | - requests-oauthlib 256 | - responses==0.18.0 257 | - retrying==1.3.4 258 | - rfc3339-validator==0.1.4 259 | - rfc3986-validator==0.1.1 260 | - rich==13.4.2 261 | - rouge-score==0.1.2 262 | - rpds-py==0.10.0 263 | - rsa==4.9 264 | - safetensors==0.3.1 265 | - scikit-image==0.19.3 266 | - scikit-learn==1.3.0 267 | - scipy==1.7.3 268 | - send2trash==1.8.2 269 | - sentencepiece==0.1.99 270 | - sentry-sdk==1.29.2 271 | - setproctitle==1.3.2 272 | - setuptools==60.2.0 273 | - shapely==1.8.5 274 | - six==1.16.0 275 | - smmap==5.0.0 276 | - sniffio==1.3.0 277 | - soupsieve==2.4.1 278 | - stack-data==0.6.2 279 | - sympy==1.12 280 | - tabulate==0.9.0 281 | - tenacity==8.2.3 282 | - tensorboard==2.13.0 283 | - tensorboard-data-server==0.7.1 284 | - termcolor==2.3.0 285 | - terminado==0.17.1 286 | - terminaltables==3.1.10 287 | - threadpoolctl==3.2.0 288 | - tifffile==2023.7.10 289 | - tinycss2==1.2.1 290 | - tokenizers==0.13.3 291 | - tomli==2.0.1 292 | - torch==2.0.1 293 | - torchaudio==2.0.2 294 | - torchmetrics==0.11.1 295 | - torchvision==0.15.2 296 | - tornado==6.3.3 297 | - tqdm==4.65.0 298 | - traitlets==5.9.0 299 | - transformers==4.31.0 300 | - trimesh==2.35.39 301 | - triton==2.0.0 302 | - typing-extensions==4.7.1 303 | - tzdata==2023.3 304 | - uri-template==1.3.0 305 | - urllib3==2.0.4 306 | - wandb==0.15.8 307 | - wcwidth==0.2.6 308 | - webcolors==1.13 309 | - webencodings==0.5.1 310 | - websocket-client==1.6.2 311 | - werkzeug==2.2.3 312 | - widgetsnbextension==4.0.8 313 | - xxhash==3.3.0 314 | - yapf==0.40.1 315 | - yarl==1.9.2 316 | - zipp==3.16.2 317 | -------------------------------------------------------------------------------- /index.html: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 6 | 7 |

You will be redirected to opendrivelab.com/DriveLM/ soon!

8 | 9 | 10 | --------------------------------------------------------------------------------