├── .gitignore ├── .pre-commit-config.yaml ├── CODE_OF_CONDUCT.md ├── CONTRIBUTING.md ├── FAQ.md ├── LICENSE ├── LLaMA-Adapter-V2-arXiv.pdf ├── LLaMA-Adapter-arXiv.pdf ├── MODEL_CARD.md ├── README.md ├── README_llama.md ├── alpaca_finetuning_v1 ├── engine_finetuning.py ├── extract_adapter_from_checkpoint.py ├── finetuning.py ├── finetuning.sh ├── llama │ ├── __init__.py │ ├── generation.py │ ├── model.py │ └── tokenizer.py ├── models_llama_adapter.py └── util │ ├── datasets.py │ ├── lars.py │ ├── lr_decay.py │ ├── lr_sched.py │ ├── misc.py │ └── pos_embed.py ├── docs ├── chat_demo.png ├── langchain_LLaMA_AdapterV2_demo.ipynb ├── langchain_integration.md ├── logo_v1.png ├── logo_v2.png ├── logo_v3.png ├── logo_v4.png ├── multi_model_example_1.png ├── multi_model_example_2.png ├── multi_model_example_3.png ├── multi_model_example_4.png ├── multimodal.png ├── pipeline.png └── youtube.png ├── download.sh ├── example.py ├── generate.sh ├── gorilla ├── README.md ├── alpaca_finetuning_v1 │ ├── engine_finetuning.py │ ├── extract_adapter_from_checkpoint.py │ ├── finetuning.py │ ├── finetuning_hf.sh │ ├── finetuning_tf.sh │ ├── finetuning_th.sh │ ├── llama │ │ ├── __init__.py │ │ ├── generation.py │ │ ├── model.py │ │ └── tokenizer.py │ ├── models_llama_adapter.py │ └── util │ │ ├── datasets.py │ │ ├── lars.py │ │ ├── lr_decay.py │ │ ├── lr_sched.py │ │ ├── misc.py │ │ └── pos_embed.py ├── finetune │ ├── configs │ │ └── finetune │ │ │ ├── EN.yaml │ │ │ ├── gorilla_hf.yaml │ │ │ ├── gorilla_tf.yaml │ │ │ └── gorilla_th.yaml │ ├── conversation.py │ ├── data │ │ └── alpaca.py │ ├── data_preprocess.py │ ├── demo.py │ ├── engine_finetune.py │ ├── engine_pretrain.py │ ├── exps │ │ └── train │ │ │ ├── base │ │ │ └── run.sh │ │ │ └── rev │ │ │ └── run.sh │ ├── global_configs.py │ ├── main_finetune.py │ ├── main_pretrain.py │ ├── model │ │ ├── LLM │ │ │ ├── __init__.py │ │ │ ├── llama.py │ │ │ └── revllama.py │ │ ├── __init__.py │ │ ├── meta.py │ │ └── tokenizer.py │ ├── params.json │ ├── scripts │ │ ├── finetune │ │ │ ├── finetune_7B_gorilla_hf.sh │ │ │ ├── finetune_7B_gorilla_tf.sh │ │ │ └── finetune_7B_gorilla_th.sh │ │ └── tools │ │ │ ├── debug_finetune_131_7B.sh │ │ │ └── merge130.sh │ ├── submitit_pretrain.py │ ├── tools │ │ └── get_consolidated_ckpt.py │ ├── transformer.py │ └── util │ │ ├── crop.py │ │ ├── lr_decay.py │ │ ├── lr_sched.py │ │ ├── misc.py │ │ └── pos_embed.py ├── gorilla-main │ ├── .github │ │ └── ISSUE_TEMPLATE │ │ │ ├── apibench.md │ │ │ ├── custom-template.md │ │ │ ├── feature_request.md │ │ │ └── hosted-gorilla-.md │ ├── .gitignore │ ├── LICENSE │ ├── README.md │ ├── data │ │ ├── README.md │ │ ├── api │ │ │ ├── huggingface_api.jsonl │ │ │ ├── tensorflowhub_api.jsonl │ │ │ └── torchhub_api.jsonl │ │ ├── apibench │ │ │ ├── huggingface_eval.json │ │ │ ├── huggingface_train.json │ │ │ ├── tensorflow_eval.json │ │ │ ├── tensorflow_train.json │ │ │ ├── torchhub_eval.json │ │ │ └── torchhub_train.json │ │ └── apizoo │ │ │ └── shawnharmsen1.json │ ├── eval │ │ ├── README.md │ │ ├── eval-data │ │ │ ├── questions │ │ │ │ ├── huggingface │ │ │ │ │ ├── questions_huggingface_0_shot.jsonl │ │ │ │ │ ├── questions_huggingface_bm25.jsonl │ │ │ │ │ ├── questions_huggingface_gpt_index.jsonl │ │ │ │ │ └── questions_huggingface_oracle.jsonl │ │ │ │ ├── tensorflowhub │ │ │ │ │ ├── questions_tensorflowhub_0_shot.jsonl │ │ │ │ │ ├── questions_tensorflowhub_bm25.jsonl │ │ │ │ │ ├── questions_tensorflowhub_gpt_index.jsonl │ │ │ │ │ └── questions_tensorflowhub_oracle.jsonl │ │ │ │ └── torchhub │ │ │ │ │ ├── 
questions_torchhub_0_shot.jsonl │ │ │ │ │ ├── questions_torchhub_bm25.jsonl │ │ │ │ │ ├── questions_torchhub_gpt_index.jsonl │ │ │ │ │ └── questions_torchhub_oracle.jsonl │ │ │ └── responses │ │ │ │ ├── huggingface │ │ │ │ ├── response_huggingface_Gorilla_FT_0_shot.jsonl │ │ │ │ ├── response_huggingface_Gorilla_FT_bm25.jsonl │ │ │ │ ├── response_huggingface_Gorilla_FT_gpt_index.jsonl │ │ │ │ ├── response_huggingface_Gorilla_FT_oracle.jsonl │ │ │ │ ├── response_huggingface_Gorilla_RT_0_shot.jsonl │ │ │ │ ├── response_huggingface_Gorilla_RT_bm25.jsonl │ │ │ │ ├── response_huggingface_Gorilla_RT_gpt_index.jsonl │ │ │ │ └── response_huggingface_Gorilla_RT_oracle.jsonl │ │ │ │ ├── tensorflowhub │ │ │ │ ├── response_tensorflowhub_Gorilla_FT_0_shot.jsonl │ │ │ │ ├── response_tensorflowhub_Gorilla_FT_bm25.jsonl │ │ │ │ ├── response_tensorflowhub_Gorilla_FT_gpt_index.jsonl │ │ │ │ ├── response_tensorflowhub_Gorilla_FT_oracle.jsonl │ │ │ │ ├── response_tensorflowhub_Gorilla_RT_0_shot.jsonl │ │ │ │ ├── response_tensorflowhub_Gorilla_RT_bm25.jsonl │ │ │ │ ├── response_tensorflowhub_Gorilla_RT_gpt_index.jsonl │ │ │ │ └── response_tensorflowhub_Gorilla_RT_oracle.jsonl │ │ │ │ └── torchhub │ │ │ │ ├── response_torchhub_Gorilla_FT_0_shot.jsonl │ │ │ │ ├── response_torchhub_Gorilla_FT_bm25.jsonl │ │ │ │ ├── response_torchhub_Gorilla_FT_gpt_index.jsonl │ │ │ │ ├── response_torchhub_Gorilla_FT_oracle.jsonl │ │ │ │ ├── response_torchhub_Gorilla_RT_0_shot.jsonl │ │ │ │ ├── response_torchhub_Gorilla_RT_bm25.jsonl │ │ │ │ ├── response_torchhub_Gorilla_RT_gpt_index.jsonl │ │ │ │ └── response_torchhub_Gorilla_RT_oracle.jsonl │ │ ├── eval-scripts │ │ │ ├── ast_eval_hf.py │ │ │ ├── ast_eval_tf.py │ │ │ ├── ast_eval_th.py │ │ │ └── codebleu │ │ │ │ ├── __init__.py │ │ │ │ ├── bleu.py │ │ │ │ ├── dataflow_match.py │ │ │ │ ├── keywords │ │ │ │ ├── c_sharp.txt │ │ │ │ ├── java.txt │ │ │ │ └── python.txt │ │ │ │ ├── parser │ │ │ │ ├── DFG.py │ │ │ │ ├── __init__.py │ │ │ │ ├── build.py │ │ │ │ ├── build.sh │ │ │ │ ├── tree-sitter-python │ │ │ │ │ ├── .gitattributes │ │ │ │ │ ├── .github │ │ │ │ │ │ └── workflows │ │ │ │ │ │ │ └── ci.yml │ │ │ │ │ ├── .gitignore │ │ │ │ │ ├── .npmignore │ │ │ │ │ ├── Cargo.toml │ │ │ │ │ ├── LICENSE │ │ │ │ │ ├── README.md │ │ │ │ │ ├── binding.gyp │ │ │ │ │ ├── bindings │ │ │ │ │ │ ├── node │ │ │ │ │ │ │ ├── binding.cc │ │ │ │ │ │ │ └── index.js │ │ │ │ │ │ └── rust │ │ │ │ │ │ │ ├── README.md │ │ │ │ │ │ │ ├── build.rs │ │ │ │ │ │ │ └── lib.rs │ │ │ │ │ ├── examples │ │ │ │ │ │ ├── compound-statement-without-trailing-newline.py │ │ │ │ │ │ ├── crlf-line-endings.py │ │ │ │ │ │ ├── mixed-spaces-tabs.py │ │ │ │ │ │ ├── multiple-newlines.py │ │ │ │ │ │ ├── python2-grammar-crlf.py │ │ │ │ │ │ ├── python2-grammar.py │ │ │ │ │ │ ├── python3-grammar-crlf.py │ │ │ │ │ │ ├── python3-grammar.py │ │ │ │ │ │ ├── python3.8_grammar.py │ │ │ │ │ │ ├── simple-statements-without-trailing-newline.py │ │ │ │ │ │ ├── tabs.py │ │ │ │ │ │ └── trailing-whitespace.py │ │ │ │ │ ├── grammar.js │ │ │ │ │ ├── package.json │ │ │ │ │ ├── queries │ │ │ │ │ │ ├── highlights.scm │ │ │ │ │ │ └── tags.scm │ │ │ │ │ ├── script │ │ │ │ │ │ ├── known_failures.txt │ │ │ │ │ │ └── parse-examples │ │ │ │ │ ├── src │ │ │ │ │ │ ├── grammar.json │ │ │ │ │ │ ├── node-types.json │ │ │ │ │ │ ├── parser.c │ │ │ │ │ │ ├── scanner.cc │ │ │ │ │ │ └── tree_sitter │ │ │ │ │ │ │ └── parser.h │ │ │ │ │ └── test │ │ │ │ │ │ ├── corpus │ │ │ │ │ │ ├── errors.txt │ │ │ │ │ │ ├── expressions.txt │ │ │ │ │ │ ├── literals.txt │ │ │ │ │ │ ├── 
pattern_matching.txt │ │ │ │ │ │ └── statements.txt │ │ │ │ │ │ └── highlight │ │ │ │ │ │ ├── keywords.py │ │ │ │ │ │ ├── parameters.py │ │ │ │ │ │ └── pattern_matching.py │ │ │ │ └── utils.py │ │ │ │ ├── readme.txt │ │ │ │ ├── syntax_check.py │ │ │ │ ├── syntax_match.py │ │ │ │ ├── utils.py │ │ │ │ └── weighted_ngram_match.py │ │ └── get_llm_responses.py │ ├── inference │ │ ├── README.md │ │ ├── apply_delta.py │ │ ├── example_questions │ │ │ └── example_questions.jsonl │ │ ├── gorilla_eval.py │ │ ├── requirements.txt │ │ └── serve │ │ │ ├── conv_template.py │ │ │ ├── gorilla_cli.py │ │ │ └── gorilla_falcon_cli.py │ └── requirements.txt └── inference │ ├── CODE_OF_CONDUCT.md │ ├── CONTRIBUTING.md │ ├── FAQ.md │ ├── LICENSE │ ├── MODEL_CARD.md │ ├── README.md │ ├── download.sh │ ├── example.py │ ├── gorilla_inference_full_finetune.py │ ├── gorilla_inference_llama_adapter_v1.py │ ├── llama │ ├── __init__.py │ ├── generation.py │ ├── model.py │ └── tokenizer.py │ ├── llama_for_adapter │ ├── __init__.py │ ├── generation.py │ ├── model.py │ └── tokenizer.py │ ├── requirements.txt │ └── setup.py ├── imagebind_LLM ├── ImageBind │ ├── .assets │ │ ├── bird_audio.wav │ │ ├── bird_image.jpg │ │ ├── car_audio.wav │ │ ├── car_image.jpg │ │ ├── dog_audio.wav │ │ └── dog_image.jpg │ ├── .gitignore │ ├── CODE_OF_CONDUCT.md │ ├── CONTRIBUTING.md │ ├── LICENSE │ ├── README.md │ ├── bpe │ │ └── bpe_simple_vocab_16e6.txt.gz │ ├── data.py │ ├── demo.py │ ├── model_card.md │ ├── models │ │ ├── __init__.py │ │ ├── helpers.py │ │ ├── imagebind_model.py │ │ ├── multimodal_preprocessors.py │ │ ├── pointbert │ │ │ ├── PointTransformer_8192point.yaml │ │ │ ├── checkpoint.py │ │ │ ├── dvae.py │ │ │ ├── logger.py │ │ │ ├── misc.py │ │ │ └── point_encoder.py │ │ └── transformer.py │ └── requirements.txt ├── README.md ├── convert_ckpt.py ├── data │ └── dataset.py ├── demo.py ├── demo_3d.py ├── docs │ └── train.md ├── engine_finetune.py ├── engine_pretrain.py ├── examples │ ├── airplane.pt │ ├── car.pt │ ├── door.pt │ ├── girl.jpg │ ├── girl_bgm.wav │ └── toilet.pt ├── exps │ ├── finetune.sh │ ├── finetune_ENCN.sh │ └── pretrain.sh ├── gradio_app.py ├── image_generate.py ├── llama │ ├── __init__.py │ ├── llama.py │ ├── llama_adapter.py │ ├── tokenizer.py │ └── utils.py ├── main_finetune.py ├── main_pretrain.py ├── requirements.txt ├── tools │ └── get_chinese_llama.py └── util │ ├── lr_sched.py │ └── misc.py ├── llama ├── __init__.py ├── generation.py ├── model.py └── tokenizer.py ├── llama_adapter_v2_chat65b ├── README.md ├── chat_demo.py ├── checkpoints │ └── model_zoo.md ├── conversation.py ├── environment.yml ├── llama │ ├── __init__.py │ ├── generation.py │ ├── model.py │ └── tokenizer.py ├── models_llama_adapter.py ├── scripts │ ├── srun_chat_llama65b_bias_scale_norm.sh │ └── torchrun_chat_llama65b_bias_scale_norm.sh └── util │ └── misc.py ├── llama_adapter_v2_multimodal7b ├── README.md ├── data │ └── dataset.py ├── demo.py ├── docs │ ├── eval.md │ └── train.md ├── engine_finetune.py ├── engine_pretrain.py ├── exps │ ├── finetune.sh │ └── pretrain.sh ├── gradio_app.py ├── llama │ ├── __init__.py │ ├── llama.py │ ├── llama_adapter.py │ ├── tokenizer.py │ └── utils.py ├── main_finetune.py ├── main_pretrain.py ├── requirements.txt └── util │ ├── evaluate_mme.py │ ├── extract_adapter_from_checkpoint.py │ ├── lr_sched.py │ └── misc.py ├── pyproject.toml ├── requirements.txt ├── setup.cfg ├── setup.py └── utils └── quantization.py /.pre-commit-config.yaml: 
-------------------------------------------------------------------------------- 1 | default_language_version: 2 | python: python3 3 | 4 | repos: 5 | - repo: https://github.com/pre-commit/pre-commit-hooks 6 | rev: v3.2.0 7 | hooks: 8 | - id: trailing-whitespace 9 | - id: end-of-file-fixer 10 | - id: check-yaml 11 | 12 | - repo: https://github.com/PyCQA/isort 13 | rev: 5.10.1 14 | hooks: 15 | - id: isort 16 | name: Format imports 17 | 18 | - repo: https://github.com/psf/black 19 | rev: 22.3.0 20 | hooks: 21 | - id: black 22 | name: Format code 23 | 24 | - repo: https://github.com/asottile/blacken-docs 25 | rev: v1.12.1 26 | hooks: 27 | - id: blacken-docs 28 | args: [--line-length=120] 29 | additional_dependencies: [black==21.12b0] 30 | 31 | - repo: https://github.com/charliermarsh/ruff-pre-commit 32 | rev: "v0.0.237" 33 | hooks: 34 | - id: ruff 35 | args: ["--fix"] 36 | -------------------------------------------------------------------------------- /CODE_OF_CONDUCT.md: -------------------------------------------------------------------------------- 1 | # Code of Conduct 2 | 3 | ## Our Pledge 4 | 5 | In the interest of fostering an open and welcoming environment, we as 6 | contributors and maintainers pledge to make participation in our project and 7 | our community a harassment-free experience for everyone, regardless of age, body 8 | size, disability, ethnicity, sex characteristics, gender identity and expression, 9 | level of experience, education, socio-economic status, nationality, personal 10 | appearance, race, religion, or sexual identity and orientation. 11 | 12 | ## Our Standards 13 | 14 | Examples of behavior that contributes to creating a positive environment 15 | include: 16 | 17 | * Using welcoming and inclusive language 18 | * Being respectful of differing viewpoints and experiences 19 | * Gracefully accepting constructive criticism 20 | * Focusing on what is best for the community 21 | * Showing empathy towards other community members 22 | 23 | Examples of unacceptable behavior by participants include: 24 | 25 | * The use of sexualized language or imagery and unwelcome sexual attention or 26 | advances 27 | * Trolling, insulting/derogatory comments, and personal or political attacks 28 | * Public or private harassment 29 | * Publishing others' private information, such as a physical or electronic 30 | address, without explicit permission 31 | * Other conduct which could reasonably be considered inappropriate in a 32 | professional setting 33 | 34 | ## Our Responsibilities 35 | 36 | Project maintainers are responsible for clarifying the standards of acceptable 37 | behavior and are expected to take appropriate and fair corrective action in 38 | response to any instances of unacceptable behavior. 39 | 40 | Project maintainers have the right and responsibility to remove, edit, or 41 | reject comments, commits, code, wiki edits, issues, and other contributions 42 | that are not aligned to this Code of Conduct, or to ban temporarily or 43 | permanently any contributor for other behaviors that they deem inappropriate, 44 | threatening, offensive, or harmful. 45 | 46 | ## Scope 47 | 48 | This Code of Conduct applies within all project spaces, and it also applies when 49 | an individual is representing the project or its community in public spaces. 50 | Examples of representing a project or community include using an official 51 | project e-mail address, posting via an official social media account, or acting 52 | as an appointed representative at an online or offline event. 
Representation of 53 | a project may be further defined and clarified by project maintainers. 54 | 55 | This Code of Conduct also applies outside the project spaces when there is a 56 | reasonable belief that an individual's behavior may have a negative impact on 57 | the project or its community. 58 | 59 | ## Enforcement 60 | 61 | Instances of abusive, harassing, or otherwise unacceptable behavior may be 62 | reported by contacting the project team at . All 63 | complaints will be reviewed and investigated and will result in a response that 64 | is deemed necessary and appropriate to the circumstances. The project team is 65 | obligated to maintain confidentiality with regard to the reporter of an incident. 66 | Further details of specific enforcement policies may be posted separately. 67 | 68 | Project maintainers who do not follow or enforce the Code of Conduct in good 69 | faith may face temporary or permanent repercussions as determined by other 70 | members of the project's leadership. 71 | 72 | ## Attribution 73 | 74 | This Code of Conduct is adapted from the [Contributor Covenant][homepage], version 1.4, 75 | available at https://www.contributor-covenant.org/version/1/4/code-of-conduct.html 76 | 77 | [homepage]: https://www.contributor-covenant.org 78 | 79 | For answers to common questions about this code of conduct, see 80 | https://www.contributor-covenant.org/faq -------------------------------------------------------------------------------- /CONTRIBUTING.md: -------------------------------------------------------------------------------- 1 | # Contributing to LLaMA 2 | We want to make contributing to this project as easy and transparent as 3 | possible. 4 | 5 | ## Pull Requests 6 | We actively welcome your pull requests. 7 | 8 | 1. Fork the repo and create your branch from `main`. 9 | 2. If you've added code that should be tested, add tests. 10 | 3. If you've changed APIs, update the documentation. 11 | 4. Ensure the test suite passes. 12 | 5. Make sure your code lints. 13 | 6. If you haven't already, complete the Contributor License Agreement ("CLA"). 14 | 15 | ## Contributor License Agreement ("CLA") 16 | In order to accept your pull request, we need you to submit a CLA. You only need 17 | to do this once to work on any of Meta's open source projects. 18 | 19 | Complete your CLA here: 20 | 21 | ## Issues 22 | We use GitHub issues to track public bugs. Please ensure your description is 23 | clear and has sufficient instructions to be able to reproduce the issue. 24 | 25 | Meta has a [bounty program](https://www.facebook.com/whitehat/) for the safe 26 | disclosure of security bugs. In those cases, please go through the process 27 | outlined on that page and do not file a public issue. 28 | 29 | ## License 30 | By contributing to LLaMA, you agree that your contributions will be licensed 31 | under the LICENSE file in the root directory of this source tree. -------------------------------------------------------------------------------- /FAQ.md: -------------------------------------------------------------------------------- 1 | # FAQ 2 | ## 1. The download.sh script doesn't work on default bash in MacOS X: 3 | 4 | Please see answers from these issues: 5 | - https://github.com/facebookresearch/llama/issues/41#issuecomment-1451290160 6 | - https://github.com/facebookresearch/llama/issues/53#issue-1606582963 7 | 8 | 9 | ## 2. Generations are bad! 10 | 11 | Keep in mind these models are not finetuned for question answering.
As such, they should be prompted so that the expected answer is the natural continuation of the prompt. 12 | 13 | Here are a few examples of prompts (from [issue#69](https://github.com/facebookresearch/llama/issues/69)) geared towards finetuned models, and how to modify them to get the expected results: 14 | - Do not prompt with "What is the meaning of life? Be concise and do not repeat yourself." but with "I believe the meaning of life is" 15 | - Do not prompt with "Explain the theory of relativity." but with "Simply put, the theory of relativity states that" 16 | - Do not prompt with "Ten easy steps to build a website..." but with "Building a website can be done in 10 simple steps:\n" 17 | 18 | To be able to directly prompt the models with questions / instructions, you can either: 19 | - Prompt it with few-shot examples so that the model understands the task you have in mind. 20 | - Finetune the models on datasets of instructions to make them more robust to input prompts. 21 | 22 | We've updated `example.py` with more sample prompts. Overall, always keep in mind that models are very sensitive to prompts (particularly when they have not been finetuned). 23 | 24 | ## 3. CUDA Out of memory errors 25 | 26 | The `example.py` file pre-allocates a cache according to these settings: 27 | ```python 28 | model_args: ModelArgs = ModelArgs(max_seq_len=max_seq_len, max_batch_size=max_batch_size, **params) 29 | ``` 30 | 31 | Accounting for 14GB of memory for the model weights (7B model), this leaves 16GB available for the decoding cache, which stores 2 * 2 * n_layers * max_batch_size * max_seq_len * n_heads * head_dim bytes. 32 | 33 | With default parameters, this cache was about 17GB (2 * 2 * 32 * 32 * 1024 * 32 * 128) for the 7B model. 34 | 35 | We've added command line options to `example.py` and changed the default `max_seq_len` to 512, which should allow decoding on 30GB GPUs. 36 | 37 | Feel free to lower these settings according to your hardware. 38 | 39 | ## 4. Other languages 40 | The model was trained primarily on English, but also on a few other languages with Latin or Cyrillic alphabets. 41 | 42 | For instance, LLaMA was trained on Wikipedia for the 20 following languages: bg, ca, cs, da, de, en, es, fr, hr, hu, it, nl, pl, pt, ro, ru, sl, sr, sv, uk. 43 | 44 | LLaMA's tokenizer splits unseen characters into UTF-8 bytes; as a result, it might also be able to process other languages like Chinese or Japanese, even though they use different characters.
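To see this byte fallback in action, here is a minimal sketch using the `Tokenizer` wrapper from `llama/tokenizer.py`; it assumes `tokenizer.model` has already been fetched via `download.sh`, and the path below is a placeholder to replace with your own `TARGET_FOLDER`:

```python
# Minimal sketch (not part of the repo): inspect how the SentencePiece tokenizer
# handles non-Latin text. Assumes tokenizer.model was downloaded with download.sh;
# replace the placeholder path with your own TARGET_FOLDER.
from llama.tokenizer import Tokenizer

tok = Tokenizer(model_path="/path/to/TARGET_FOLDER/tokenizer.model")  # placeholder path

text = "祝你一天过得愉快"
ids = tok.encode(text, bos=False, eos=False)

print(ids)                                         # token ids
print([tok.sp_model.id_to_piece(i) for i in ids])  # characters absent from the vocab appear as byte pieces like <0xE7>
print(tok.decode(ids))                             # decodes back to the original string
```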
45 | 46 | Although the fraction of these languages in the training was negligible, LLaMA still showcases some abilities in Chinese-English translation: 47 | 48 | ``` 49 | Prompt = "J'aime le chocolat = I like chocolate\n祝你一天过得愉快 =" 50 | Output = "I wish you a nice day" 51 | ``` -------------------------------------------------------------------------------- /LLaMA-Adapter-V2-arXiv.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenGVLab/LLaMA-Adapter/521a09da84f70f6913d54b7421afa24010319e47/LLaMA-Adapter-V2-arXiv.pdf -------------------------------------------------------------------------------- /LLaMA-Adapter-arXiv.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenGVLab/LLaMA-Adapter/521a09da84f70f6913d54b7421afa24010319e47/LLaMA-Adapter-arXiv.pdf -------------------------------------------------------------------------------- /README_llama.md: -------------------------------------------------------------------------------- 1 | # LLaMA 2 | 3 | This repository is intended as a minimal, hackable and readable example to load [LLaMA](https://ai.facebook.com/blog/large-language-model-llama-meta-ai/) ([arXiv](https://arxiv.org/abs/2302.13971v1)) models and run inference. 4 | In order to download the checkpoints and tokenizer, fill this [google form](https://forms.gle/jk851eBVbX1m5TAv5) 5 | 6 | ## Setup 7 | 8 | In a conda env with pytorch / cuda available, run: 9 | ``` 10 | pip install -r requirements.txt 11 | ``` 12 | Then in this repository: 13 | ``` 14 | pip install -e . 15 | ``` 16 | 17 | ## Download 18 | 19 | Once your request is approved, you will receive links to download the tokenizer and model files. 20 | Edit the `download.sh` script with the signed url provided in the email to download the model weights and tokenizer. 21 | 22 | ## Inference 23 | 24 | The provided `example.py` can be run on a single or multi-gpu node with `torchrun` and will output completions for two pre-defined prompts. Using `TARGET_FOLDER` as defined in `download.sh`: 25 | ``` 26 | torchrun --nproc_per_node MP example.py --ckpt_dir $TARGET_FOLDER/model_size --tokenizer_path $TARGET_FOLDER/tokenizer.model 27 | ``` 28 | 29 | Different models require different MP values: 30 | 31 | | Model | MP | 32 | |--------|----| 33 | | 7B | 1 | 34 | | 13B | 2 | 35 | | 33B | 4 | 36 | | 65B | 8 | 37 | 38 | ## FAQ 39 | 40 | - [1. The download.sh script doesn't work on default bash in MacOS X](FAQ.md#1) 41 | - [2. Generations are bad!](FAQ.md#2) 42 | - [3. CUDA Out of memory errors](FAQ.md#3) 43 | - [4. Other languages](FAQ.md#4) 44 | 45 | ## Reference 46 | 47 | LLaMA: Open and Efficient Foundation Language Models -- https://arxiv.org/abs/2302.13971 48 | 49 | ``` 50 | @article{touvron2023llama, 51 | title={LLaMA: Open and Efficient Foundation Language Models}, 52 | author={Touvron, Hugo and Lavril, Thibaut and Izacard, Gautier and Martinet, Xavier and Lachaux, Marie-Anne and Lacroix, Timoth{\'e}e and Rozi{\`e}re, Baptiste and Goyal, Naman and Hambro, Eric and Azhar, Faisal and Rodriguez, Aurelien and Joulin, Armand and Grave, Edouard and Lample, Guillaume}, 53 | journal={arXiv preprint arXiv:2302.13971}, 54 | year={2023} 55 | } 56 | ``` 57 | 58 | ## Model Card 59 | See [MODEL_CARD.md](MODEL_CARD.md) 60 | 61 | ## License 62 | See the [LICENSE](LICENSE) file. 
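As a companion to FAQ item 3 linked above (CUDA out-of-memory errors), here is a rough back-of-envelope sketch of the decoding-cache arithmetic; the 7B hyper-parameters are the ones quoted in the FAQ, and other model sizes would need the values from their own `params.json`:

```python
# Back-of-envelope KV-cache size, following the formula quoted in FAQ #3:
# 2 (keys and values) * 2 bytes (fp16) * n_layers * max_batch_size * max_seq_len * n_heads * head_dim
def kv_cache_bytes(n_layers: int, max_batch_size: int, max_seq_len: int, n_heads: int, head_dim: int) -> int:
    return 2 * 2 * n_layers * max_batch_size * max_seq_len * n_heads * head_dim

# 7B values from the FAQ: 32 layers, batch size 32, seq len 1024, 32 heads, head_dim 128
print(kv_cache_bytes(32, 32, 1024, 32, 128) / 1e9)  # ~17.2 GB, matching the "about 17GB" figure
# Lowering max_seq_len to 512 (the new default in example.py) roughly halves the cache:
print(kv_cache_bytes(32, 32, 512, 32, 128) / 1e9)   # ~8.6 GB
```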
63 | -------------------------------------------------------------------------------- /alpaca_finetuning_v1/extract_adapter_from_checkpoint.py: -------------------------------------------------------------------------------- 1 | import torch 2 | 3 | model = torch.load("./checkpoint/checkpoint-4.pth", map_location="cpu") 4 | new_model = dict() 5 | weight_list = ["layers." + str(i) + ".attention.gate" for i in range(32)] 6 | old_weight_list = ["layers." + str(i) + ".attention.gate" for i in range(32)] 7 | weight_list = weight_list + ["adapter_query.weight"] 8 | 9 | print(weight_list) 10 | print(model["model"]["adapter_query.weight"].shape) 11 | 12 | for i in range(len(weight_list)): 13 | new_model[weight_list[i]] = model["model"][weight_list[i]] 14 | 15 | torch.save(new_model, "adapter_adapter_len10_layer30_epoch5.pth") 16 | -------------------------------------------------------------------------------- /alpaca_finetuning_v1/finetuning.sh: -------------------------------------------------------------------------------- 1 | torchrun --nproc_per_node 8 finetuning.py \ 2 | --model Llama7B_adapter \ 3 | --llama_model_path $TARGET_FOLDER/ \ 4 | --data_path $DATA_PATH/alpaca_data.json \ 5 | --adapter_layer 30 \ 6 | --adapter_len 10 \ 7 | --max_seq_len 512 \ 8 | --batch_size 4 \ 9 | --epochs 5 \ 10 | --warmup_epochs 2 \ 11 | --blr 9e-3 \ 12 | --weight_decay 0.02 \ 13 | --output_dir ./checkpoint/ 14 | -------------------------------------------------------------------------------- /alpaca_finetuning_v1/llama/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Meta Platforms, Inc. and affiliates. 2 | # This software may be used and distributed according to the terms of the GNU General Public License version 3. 3 | 4 | from .generation import LLaMA 5 | from .model import ModelArgs, Transformer 6 | from .tokenizer import Tokenizer 7 | -------------------------------------------------------------------------------- /alpaca_finetuning_v1/llama/generation.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Meta Platforms, Inc. and affiliates. 2 | # This software may be used and distributed according to the terms of the GNU General Public License version 3. 
3 | 4 | from typing import List 5 | 6 | import torch 7 | 8 | from llama.model import Transformer 9 | from llama.tokenizer import Tokenizer 10 | 11 | 12 | class LLaMA: 13 | def __init__(self, model: Transformer, tokenizer: Tokenizer): 14 | self.model = model 15 | self.tokenizer = tokenizer 16 | 17 | def generate( 18 | self, 19 | prompts: List[str], 20 | max_gen_len: int, 21 | temperature: float = 0.8, 22 | top_p: float = 0.95, 23 | ) -> List[str]: 24 | bsz = len(prompts) 25 | params = self.model.params 26 | assert bsz <= params.max_batch_size, (bsz, params.max_batch_size) 27 | 28 | prompt_tokens = [self.tokenizer.encode(x, bos=True, eos=False) for x in prompts] 29 | 30 | min_prompt_size = min([len(t) for t in prompt_tokens]) 31 | max_prompt_size = max([len(t) for t in prompt_tokens]) 32 | 33 | total_len = min(params.max_seq_len, max_gen_len + max_prompt_size) 34 | 35 | tokens = torch.full((bsz, total_len), self.tokenizer.pad_id).cuda().long() 36 | for k, t in enumerate(prompt_tokens): 37 | tokens[k, : len(t)] = torch.tensor(t).long() 38 | input_text_mask = tokens != self.tokenizer.pad_id 39 | start_pos = min_prompt_size 40 | prev_pos = 0 41 | for cur_pos in range(start_pos, total_len): 42 | logits = self.model.forward_only(tokens[:, prev_pos:cur_pos], prev_pos) 43 | if temperature > 0: 44 | probs = torch.softmax(logits / temperature, dim=-1) 45 | next_token = sample_top_p(probs, top_p) 46 | else: 47 | next_token = torch.argmax(logits, dim=-1) 48 | next_token = next_token.reshape(-1) 49 | # only replace token if prompt has already been generated 50 | next_token = torch.where(input_text_mask[:, cur_pos], tokens[:, cur_pos], next_token) 51 | tokens[:, cur_pos] = next_token 52 | prev_pos = cur_pos 53 | 54 | decoded = [] 55 | for i, t in enumerate(tokens.tolist()): 56 | # cut to max gen len 57 | t = t[: len(prompt_tokens[i]) + max_gen_len] 58 | # cut to eos tok if any 59 | try: 60 | t = t[: t.index(self.tokenizer.eos_id)] 61 | except ValueError: 62 | pass 63 | decoded.append(self.tokenizer.decode(t)) 64 | return decoded 65 | 66 | 67 | def sample_top_p(probs, p): 68 | probs_sort, probs_idx = torch.sort(probs, dim=-1, descending=True) 69 | probs_sum = torch.cumsum(probs_sort, dim=-1) 70 | mask = probs_sum - probs_sort > p 71 | probs_sort[mask] = 0.0 72 | probs_sort.div_(probs_sort.sum(dim=-1, keepdim=True)) 73 | next_token = torch.multinomial(probs_sort, num_samples=1) 74 | next_token = torch.gather(probs_idx, -1, next_token) 75 | return next_token 76 | -------------------------------------------------------------------------------- /alpaca_finetuning_v1/llama/tokenizer.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Meta Platforms, Inc. and affiliates. 2 | # This software may be used and distributed according to the terms of the GNU General Public License version 3. 
3 | 4 | import os 5 | from logging import getLogger 6 | from typing import List 7 | 8 | from sentencepiece import SentencePieceProcessor 9 | 10 | logger = getLogger() 11 | 12 | 13 | class Tokenizer: 14 | def __init__(self, model_path: str): 15 | # reload tokenizer 16 | assert os.path.isfile(model_path), model_path 17 | self.sp_model = SentencePieceProcessor(model_file=model_path) 18 | logger.info(f"Reloaded SentencePiece model from {model_path}") 19 | 20 | # BOS / EOS token IDs 21 | self.n_words: int = self.sp_model.vocab_size() 22 | self.bos_id: int = self.sp_model.bos_id() 23 | self.eos_id: int = self.sp_model.eos_id() 24 | self.pad_id: int = self.sp_model.pad_id() 25 | logger.info(f"#words: {self.n_words} - BOS ID: {self.bos_id} - EOS ID: {self.eos_id}") 26 | assert self.sp_model.vocab_size() == self.sp_model.get_piece_size() 27 | 28 | def encode(self, s: str, bos: bool, eos: bool) -> List[int]: 29 | assert type(s) is str 30 | t = self.sp_model.encode(s) 31 | if bos: 32 | t = [self.bos_id] + t 33 | if eos: 34 | t = t + [self.eos_id] 35 | return t 36 | 37 | def decode(self, t: List[int]) -> str: 38 | return self.sp_model.decode(t) 39 | -------------------------------------------------------------------------------- /alpaca_finetuning_v1/models_llama_adapter.py: -------------------------------------------------------------------------------- 1 | import json 2 | 3 | import torch 4 | 5 | from llama import ModelArgs, Tokenizer, Transformer 6 | 7 | 8 | def Llama7B_adapter(args, **kwargs): 9 | 10 | llama_model_path = args.llama_model_path 11 | model_name = "7B" 12 | 13 | checkpoint = torch.load(llama_model_path + model_name + "/consolidated.00.pth", map_location="cpu") 14 | print(llama_model_path + model_name + "/consolidated.00.pth") 15 | 16 | with open(llama_model_path + model_name + "/params.json", "r") as f: 17 | params = json.loads(f.read()) 18 | 19 | model_args: ModelArgs = ModelArgs( 20 | max_seq_len=args.max_seq_len, 21 | max_batch_size=32, 22 | adapter_len=args.adapter_len, 23 | adapter_layer=args.adapter_layer, 24 | **params 25 | ) 26 | tokenizer = Tokenizer(model_path=llama_model_path + "/tokenizer.model") 27 | 28 | model_args.vocab_size = tokenizer.n_words 29 | torch.set_default_tensor_type(torch.cuda.HalfTensor) 30 | model_llama_adapter = Transformer(model_args) 31 | torch.set_default_tensor_type(torch.FloatTensor) 32 | model_llama_adapter.load_state_dict(checkpoint, strict=False) 33 | 34 | for name, param in model_llama_adapter.named_parameters(): 35 | if "adapter" not in name: 36 | param.requires_grad = False 37 | else: 38 | param.requires_grad = True 39 | param.data = param.data.float() 40 | 41 | for name, param in model_llama_adapter.layers[-1 * args.adapter_layer :].named_parameters(): 42 | if "gate" in name or "adapter" in name: 43 | param.data = param.data.float() 44 | param.requires_grad = True 45 | 46 | return model_llama_adapter 47 | 48 | 49 | # set recommended archs 50 | Llama7B_adapter = Llama7B_adapter 51 | -------------------------------------------------------------------------------- /alpaca_finetuning_v1/util/datasets.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Meta Platforms, Inc. and affiliates. 2 | # All rights reserved. 3 | 4 | # This source code is licensed under the license found in the 5 | # LICENSE file in the root directory of this source tree. 
6 | # -------------------------------------------------------- 7 | # References: 8 | # DeiT: https://github.com/facebookresearch/deit 9 | # -------------------------------------------------------- 10 | 11 | import os 12 | 13 | import PIL 14 | from timm.data import create_transform 15 | from timm.data.constants import IMAGENET_DEFAULT_MEAN, IMAGENET_DEFAULT_STD 16 | from torchvision import datasets, transforms 17 | 18 | 19 | def build_dataset(is_train, args): 20 | transform = build_transform(is_train, args) 21 | 22 | root = os.path.join(args.data_path, "train" if is_train else "val") 23 | dataset = datasets.ImageFolder(root, transform=transform) 24 | 25 | print(dataset) 26 | 27 | return dataset 28 | 29 | 30 | def build_transform(is_train, args): 31 | mean = IMAGENET_DEFAULT_MEAN 32 | std = IMAGENET_DEFAULT_STD 33 | # train transform 34 | if is_train: 35 | # this should always dispatch to transforms_imagenet_train 36 | transform = create_transform( 37 | input_size=args.input_size, 38 | is_training=True, 39 | color_jitter=args.color_jitter, 40 | auto_augment=args.aa, 41 | interpolation="bicubic", 42 | re_prob=args.reprob, 43 | re_mode=args.remode, 44 | re_count=args.recount, 45 | mean=mean, 46 | std=std, 47 | ) 48 | return transform 49 | 50 | # eval transform 51 | t = [] 52 | if args.input_size <= 224: 53 | crop_pct = 224 / 256 54 | else: 55 | crop_pct = 1.0 56 | size = int(args.input_size / crop_pct) 57 | t.append( 58 | transforms.Resize(size, interpolation=PIL.Image.BICUBIC), # to maintain same ratio w.r.t. 224 images 59 | ) 60 | t.append(transforms.CenterCrop(args.input_size)) 61 | 62 | t.append(transforms.ToTensor()) 63 | t.append(transforms.Normalize(mean, std)) 64 | return transforms.Compose(t) 65 | -------------------------------------------------------------------------------- /alpaca_finetuning_v1/util/lars.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Meta Platforms, Inc. and affiliates. 2 | # All rights reserved. 3 | 4 | # This source code is licensed under the license found in the 5 | # LICENSE file in the root directory of this source tree. 6 | # -------------------------------------------------------- 7 | # LARS optimizer, implementation from MoCo v3: 8 | # https://github.com/facebookresearch/moco-v3 9 | # -------------------------------------------------------- 10 | 11 | import torch 12 | 13 | 14 | class LARS(torch.optim.Optimizer): 15 | """ 16 | LARS optimizer, no rate scaling or weight decay for parameters <= 1D. 
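Each multi-dimensional parameter's update is rescaled in step() by trust_coefficient * ||param|| / ||update||, so layers whose gradients are small relative to their weights still receive proportionate updates.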
17 | """ 18 | def __init__(self, params, lr=0, weight_decay=0, momentum=0.9, trust_coefficient=0.001): 19 | defaults = dict(lr=lr, weight_decay=weight_decay, momentum=momentum, trust_coefficient=trust_coefficient) 20 | super().__init__(params, defaults) 21 | 22 | @torch.no_grad() 23 | def step(self): 24 | for g in self.param_groups: 25 | for p in g['params']: 26 | dp = p.grad 27 | 28 | if dp is None: 29 | continue 30 | 31 | if p.ndim > 1: # if not normalization gamma/beta or bias 32 | dp = dp.add(p, alpha=g['weight_decay']) 33 | param_norm = torch.norm(p) 34 | update_norm = torch.norm(dp) 35 | one = torch.ones_like(param_norm) 36 | q = torch.where(param_norm > 0., 37 | torch.where(update_norm > 0, 38 | (g['trust_coefficient'] * param_norm / update_norm), one), 39 | one) 40 | dp = dp.mul(q) 41 | 42 | param_state = self.state[p] 43 | if 'mu' not in param_state: 44 | param_state['mu'] = torch.zeros_like(p) 45 | mu = param_state['mu'] 46 | mu.mul_(g['momentum']).add_(dp) 47 | p.add_(mu, alpha=-g['lr']) -------------------------------------------------------------------------------- /alpaca_finetuning_v1/util/lr_decay.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Meta Platforms, Inc. and affiliates. 2 | # All rights reserved. 3 | 4 | # This source code is licensed under the license found in the 5 | # LICENSE file in the root directory of this source tree. 6 | # -------------------------------------------------------- 7 | # References: 8 | # ELECTRA https://github.com/google-research/electra 9 | # BEiT: https://github.com/microsoft/unilm/tree/master/beit 10 | # -------------------------------------------------------- 11 | 12 | import json 13 | 14 | 15 | def param_groups_lrd(model, weight_decay=0.05, no_weight_decay_list=[], layer_decay=.75): 16 | """ 17 | Parameter groups for layer-wise lr decay 18 | Following BEiT: https://github.com/microsoft/unilm/blob/master/beit/optim_factory.py#L58 19 | """ 20 | param_group_names = {} 21 | param_groups = {} 22 | 23 | num_layers = len(model.blocks) + 1 24 | 25 | layer_scales = list(layer_decay ** (num_layers - i) for i in range(num_layers + 1)) 26 | 27 | for n, p in model.named_parameters(): 28 | if not p.requires_grad: 29 | continue 30 | 31 | # no decay: all 1D parameters and model specific ones 32 | if p.ndim == 1 or n in no_weight_decay_list: 33 | g_decay = "no_decay" 34 | this_decay = 0. 
35 | else: 36 | g_decay = "decay" 37 | this_decay = weight_decay 38 | 39 | layer_id = get_layer_id_for_vit(n, num_layers) 40 | group_name = "layer_%d_%s" % (layer_id, g_decay) 41 | 42 | if group_name not in param_group_names: 43 | this_scale = layer_scales[layer_id] 44 | 45 | param_group_names[group_name] = { 46 | "lr_scale": this_scale, 47 | "weight_decay": this_decay, 48 | "params": [], 49 | } 50 | param_groups[group_name] = { 51 | "lr_scale": this_scale, 52 | "weight_decay": this_decay, 53 | "params": [], 54 | } 55 | 56 | param_group_names[group_name]["params"].append(n) 57 | param_groups[group_name]["params"].append(p) 58 | 59 | # print("parameter groups: \n%s" % json.dumps(param_group_names, indent=2)) 60 | 61 | return list(param_groups.values()) 62 | 63 | 64 | def get_layer_id_for_vit(name, num_layers): 65 | """ 66 | Assign a parameter with its layer id 67 | Following BEiT: https://github.com/microsoft/unilm/blob/master/beit/optim_factory.py#L33 68 | """ 69 | if name in ['cls_token', 'pos_embed']: 70 | return 0 71 | elif name.startswith('patch_embed'): 72 | return 0 73 | elif name.startswith('blocks'): 74 | return int(name.split('.')[1]) + 1 75 | else: 76 | return num_layers -------------------------------------------------------------------------------- /alpaca_finetuning_v1/util/lr_sched.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Meta Platforms, Inc. and affiliates. 2 | # All rights reserved. 3 | 4 | # This source code is licensed under the license found in the 5 | # LICENSE file in the root directory of this source tree. 6 | 7 | import math 8 | 9 | 10 | def adjust_learning_rate(optimizer, epoch, args): 11 | """Decay the learning rate with half-cycle cosine after warmup""" 12 | if epoch < args.warmup_epochs: 13 | lr = args.lr * epoch / args.warmup_epochs 14 | else: 15 | lr = args.min_lr + (args.lr - args.min_lr) * 0.5 * ( 16 | 1.0 + math.cos(math.pi * (epoch - args.warmup_epochs) / (args.epochs - args.warmup_epochs)) 17 | ) 18 | for param_group in optimizer.param_groups: 19 | if "lr_scale" in param_group: 20 | param_group["lr"] = lr * param_group["lr_scale"] 21 | else: 22 | param_group["lr"] = lr 23 | return lr 24 | -------------------------------------------------------------------------------- /docs/chat_demo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenGVLab/LLaMA-Adapter/521a09da84f70f6913d54b7421afa24010319e47/docs/chat_demo.png -------------------------------------------------------------------------------- /docs/logo_v1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenGVLab/LLaMA-Adapter/521a09da84f70f6913d54b7421afa24010319e47/docs/logo_v1.png -------------------------------------------------------------------------------- /docs/logo_v2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenGVLab/LLaMA-Adapter/521a09da84f70f6913d54b7421afa24010319e47/docs/logo_v2.png -------------------------------------------------------------------------------- /docs/logo_v3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenGVLab/LLaMA-Adapter/521a09da84f70f6913d54b7421afa24010319e47/docs/logo_v3.png -------------------------------------------------------------------------------- /docs/logo_v4.png: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenGVLab/LLaMA-Adapter/521a09da84f70f6913d54b7421afa24010319e47/docs/logo_v4.png -------------------------------------------------------------------------------- /docs/multi_model_example_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenGVLab/LLaMA-Adapter/521a09da84f70f6913d54b7421afa24010319e47/docs/multi_model_example_1.png -------------------------------------------------------------------------------- /docs/multi_model_example_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenGVLab/LLaMA-Adapter/521a09da84f70f6913d54b7421afa24010319e47/docs/multi_model_example_2.png -------------------------------------------------------------------------------- /docs/multi_model_example_3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenGVLab/LLaMA-Adapter/521a09da84f70f6913d54b7421afa24010319e47/docs/multi_model_example_3.png -------------------------------------------------------------------------------- /docs/multi_model_example_4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenGVLab/LLaMA-Adapter/521a09da84f70f6913d54b7421afa24010319e47/docs/multi_model_example_4.png -------------------------------------------------------------------------------- /docs/multimodal.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenGVLab/LLaMA-Adapter/521a09da84f70f6913d54b7421afa24010319e47/docs/multimodal.png -------------------------------------------------------------------------------- /docs/pipeline.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenGVLab/LLaMA-Adapter/521a09da84f70f6913d54b7421afa24010319e47/docs/pipeline.png -------------------------------------------------------------------------------- /docs/youtube.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenGVLab/LLaMA-Adapter/521a09da84f70f6913d54b7421afa24010319e47/docs/youtube.png -------------------------------------------------------------------------------- /download.sh: -------------------------------------------------------------------------------- 1 | # Copyright (c) Meta Platforms, Inc. and affiliates. 2 | # This software may be used and distributed according to the terms of the GNU General Public License version 3. 
3 | 4 | PRESIGNED_URL="" # replace with presigned url from email 5 | MODEL_SIZE="7B,13B,30B,65B" # edit this list with the model sizes you wish to download 6 | TARGET_FOLDER="" # where all files should end up 7 | 8 | declare -A N_SHARD_DICT 9 | 10 | N_SHARD_DICT["7B"]="0" 11 | N_SHARD_DICT["13B"]="1" 12 | N_SHARD_DICT["30B"]="3" 13 | N_SHARD_DICT["65B"]="7" 14 | 15 | echo "Downloading tokenizer" 16 | wget ${PRESIGNED_URL/'*'/"tokenizer.model"} -O ${TARGET_FOLDER}"/tokenizer.model" 17 | wget ${PRESIGNED_URL/'*'/"tokenizer_checklist.chk"} -O ${TARGET_FOLDER}"/tokenizer_checklist.chk" 18 | 19 | (cd ${TARGET_FOLDER} && md5sum -c tokenizer_checklist.chk) 20 | 21 | for i in ${MODEL_SIZE//,/ } 22 | do 23 | echo "Downloading ${i}" 24 | mkdir -p ${TARGET_FOLDER}"/${i}" 25 | for s in $(seq -f "0%g" 0 ${N_SHARD_DICT[$i]}) 26 | do 27 | wget ${PRESIGNED_URL/'*'/"${i}/consolidated.${s}.pth"} -O ${TARGET_FOLDER}"/${i}/consolidated.${s}.pth" 28 | done 29 | wget ${PRESIGNED_URL/'*'/"${i}/params.json"} -O ${TARGET_FOLDER}"/${i}/params.json" 30 | wget ${PRESIGNED_URL/'*'/"${i}/checklist.chk"} -O ${TARGET_FOLDER}"/${i}/checklist.chk" 31 | echo "Checking checksums" 32 | (cd ${TARGET_FOLDER}"/${i}" && md5sum -c checklist.chk) 33 | done -------------------------------------------------------------------------------- /generate.sh: -------------------------------------------------------------------------------- 1 | torchrun --nproc_per_node 1 example.py \ 2 | --ckpt_dir /data1/llma/7B \ 3 | --tokenizer_path /data1/llma/tokenizer.model \ 4 | --adapter_path llama_adapter_len10_layer30_release.pth \ 5 | --quantizer False 6 | 7 | -------------------------------------------------------------------------------- /gorilla/alpaca_finetuning_v1/extract_adapter_from_checkpoint.py: -------------------------------------------------------------------------------- 1 | import torch 2 | import argparse 3 | 4 | args = argparse.ArgumentParser("extract", add_help=False) 5 | 6 | args.add_argument("--model_path", type=str) 7 | 8 | args = args.parse_args() 9 | 10 | model = torch.load(args.model_path, map_location="cpu") 11 | new_model = dict() 12 | weight_list = ["layers." + str(i) + ".attention.gate" for i in range(32)] 13 | old_weight_list = ["layers." 
+ str(i) + ".attention.gate" for i in range(32)] 14 | weight_list = weight_list + ["adapter_query.weight"] 15 | 16 | print(weight_list) 17 | print(model["model"]["adapter_query.weight"].shape) 18 | 19 | for i in range(len(weight_list)): 20 | new_model[weight_list[i]] = model["model"][weight_list[i]] 21 | 22 | save_path = args.model_path.replace('.pth', '-adapter.pth') 23 | torch.save(new_model, save_path) 24 | -------------------------------------------------------------------------------- /gorilla/alpaca_finetuning_v1/finetuning_hf.sh: -------------------------------------------------------------------------------- 1 | llama_path="/data1/llma/7B" 2 | 3 | torchrun --nproc_per_node 2 --master_port=29501 finetuning.py \ 4 | --model Llama7B_adapter \ 5 | --llama_model_path "$llama_path"/ \ 6 | --data_path ../gorilla-main/data/apibench/huggingface_train.json \ 7 | --adapter_layer 30 \ 8 | --adapter_len 10 \ 9 | --max_seq_len 512 \ 10 | --batch_size 4 \ 11 | --epochs 10 \ 12 | --warmup_epochs 2 \ 13 | --blr 8e-1 \ 14 | --weight_decay 0.02 \ 15 | --output_dir ./checkpoint/exp_hf -------------------------------------------------------------------------------- /gorilla/alpaca_finetuning_v1/finetuning_tf.sh: -------------------------------------------------------------------------------- 1 | llama_path="/data1/llma/7B" 2 | 3 | torchrun --nproc_per_node 6 --master_port=29502 finetuning.py \ 4 | --model Llama7B_adapter \ 5 | --llama_model_path "$llama_path"/ \ 6 | --data_path ../gorilla-main/data/apibench/tensorflow_train.json \ 7 | --adapter_layer 30 \ 8 | --adapter_len 10 \ 9 | --max_seq_len 512 \ 10 | --batch_size 4 \ 11 | --epochs 5 \ 12 | --warmup_epochs 2 \ 13 | --blr 6e-2 \ 14 | --weight_decay 0.02 \ 15 | --output_dir ./checkpoint/exp_tf 16 | -------------------------------------------------------------------------------- /gorilla/alpaca_finetuning_v1/finetuning_th.sh: -------------------------------------------------------------------------------- 1 | llama_path="/data1/llma/7B" 2 | 3 | torchrun --nproc_per_node 1 finetuning.py \ 4 | --model Llama7B_adapter \ 5 | --llama_model_path "$llama_path"/ \ 6 | --data_path ../gorilla-main/data/apibench/torchhub_train.json \ 7 | --adapter_layer 30 \ 8 | --adapter_len 10 \ 9 | --max_seq_len 512 \ 10 | --batch_size 4 \ 11 | --epochs 5 \ 12 | --warmup_epochs 2 \ 13 | --blr 9e-3 \ 14 | --weight_decay 0.02 \ 15 | --output_dir ./checkpoint/exp_th 16 | -------------------------------------------------------------------------------- /gorilla/alpaca_finetuning_v1/llama/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Meta Platforms, Inc. and affiliates. 2 | # This software may be used and distributed according to the terms of the GNU General Public License version 3. 3 | 4 | from .generation import LLaMA 5 | from .model import ModelArgs, Transformer 6 | from .tokenizer import Tokenizer 7 | -------------------------------------------------------------------------------- /gorilla/alpaca_finetuning_v1/llama/generation.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Meta Platforms, Inc. and affiliates. 2 | # This software may be used and distributed according to the terms of the GNU General Public License version 3. 
3 | 4 | from typing import List 5 | 6 | import torch 7 | 8 | from llama.model import Transformer 9 | from llama.tokenizer import Tokenizer 10 | 11 | 12 | class LLaMA: 13 | def __init__(self, model: Transformer, tokenizer: Tokenizer): 14 | self.model = model 15 | self.tokenizer = tokenizer 16 | 17 | def generate( 18 | self, 19 | prompts: List[str], 20 | max_gen_len: int, 21 | temperature: float = 0.8, 22 | top_p: float = 0.95, 23 | ) -> List[str]: 24 | bsz = len(prompts) 25 | params = self.model.params 26 | assert bsz <= params.max_batch_size, (bsz, params.max_batch_size) 27 | 28 | prompt_tokens = [self.tokenizer.encode(x, bos=True, eos=False) for x in prompts] 29 | 30 | min_prompt_size = min([len(t) for t in prompt_tokens]) 31 | max_prompt_size = max([len(t) for t in prompt_tokens]) 32 | 33 | total_len = min(params.max_seq_len, max_gen_len + max_prompt_size) 34 | 35 | tokens = torch.full((bsz, total_len), self.tokenizer.pad_id).cuda().long() 36 | for k, t in enumerate(prompt_tokens): 37 | tokens[k, : len(t)] = torch.tensor(t).long() 38 | input_text_mask = tokens != self.tokenizer.pad_id 39 | start_pos = min_prompt_size 40 | prev_pos = 0 41 | for cur_pos in range(start_pos, total_len): 42 | logits = self.model.forward_only(tokens[:, prev_pos:cur_pos], prev_pos) 43 | if temperature > 0: 44 | probs = torch.softmax(logits / temperature, dim=-1) 45 | next_token = sample_top_p(probs, top_p) 46 | else: 47 | next_token = torch.argmax(logits, dim=-1) 48 | next_token = next_token.reshape(-1) 49 | # only replace token if prompt has already been generated 50 | next_token = torch.where(input_text_mask[:, cur_pos], tokens[:, cur_pos], next_token) 51 | tokens[:, cur_pos] = next_token 52 | prev_pos = cur_pos 53 | 54 | decoded = [] 55 | for i, t in enumerate(tokens.tolist()): 56 | # cut to max gen len 57 | t = t[: len(prompt_tokens[i]) + max_gen_len] 58 | # cut to eos tok if any 59 | try: 60 | t = t[: t.index(self.tokenizer.eos_id)] 61 | except ValueError: 62 | pass 63 | decoded.append(self.tokenizer.decode(t)) 64 | return decoded 65 | 66 | 67 | def sample_top_p(probs, p): 68 | probs_sort, probs_idx = torch.sort(probs, dim=-1, descending=True) 69 | probs_sum = torch.cumsum(probs_sort, dim=-1) 70 | mask = probs_sum - probs_sort > p 71 | probs_sort[mask] = 0.0 72 | probs_sort.div_(probs_sort.sum(dim=-1, keepdim=True)) 73 | next_token = torch.multinomial(probs_sort, num_samples=1) 74 | next_token = torch.gather(probs_idx, -1, next_token) 75 | return next_token 76 | -------------------------------------------------------------------------------- /gorilla/alpaca_finetuning_v1/llama/tokenizer.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Meta Platforms, Inc. and affiliates. 2 | # This software may be used and distributed according to the terms of the GNU General Public License version 3. 
3 | 4 | import os 5 | from logging import getLogger 6 | from typing import List 7 | 8 | from sentencepiece import SentencePieceProcessor 9 | 10 | logger = getLogger() 11 | 12 | 13 | class Tokenizer: 14 | def __init__(self, model_path: str): 15 | # reload tokenizer 16 | assert os.path.isfile(model_path), model_path 17 | self.sp_model = SentencePieceProcessor(model_file=model_path) 18 | logger.info(f"Reloaded SentencePiece model from {model_path}") 19 | 20 | # BOS / EOS token IDs 21 | self.n_words: int = self.sp_model.vocab_size() 22 | self.bos_id: int = self.sp_model.bos_id() 23 | self.eos_id: int = self.sp_model.eos_id() 24 | self.pad_id: int = self.sp_model.pad_id() 25 | logger.info(f"#words: {self.n_words} - BOS ID: {self.bos_id} - EOS ID: {self.eos_id}") 26 | assert self.sp_model.vocab_size() == self.sp_model.get_piece_size() 27 | 28 | def encode(self, s: str, bos: bool, eos: bool) -> List[int]: 29 | assert type(s) is str 30 | t = self.sp_model.encode(s) 31 | if bos: 32 | t = [self.bos_id] + t 33 | if eos: 34 | t = t + [self.eos_id] 35 | return t 36 | 37 | def decode(self, t: List[int]) -> str: 38 | return self.sp_model.decode(t) 39 | -------------------------------------------------------------------------------- /gorilla/alpaca_finetuning_v1/models_llama_adapter.py: -------------------------------------------------------------------------------- 1 | import json 2 | 3 | import torch 4 | 5 | from llama import ModelArgs, Tokenizer, Transformer 6 | 7 | 8 | def Llama7B_adapter(args, **kwargs): 9 | 10 | llama_model_path = args.llama_model_path 11 | model_name = "7B" 12 | 13 | checkpoint = torch.load(llama_model_path + "/consolidated.00.pth", map_location="cpu") 14 | print(llama_model_path + "/consolidated.00.pth") 15 | 16 | with open(llama_model_path + "/params.json", "r") as f: 17 | params = json.loads(f.read()) 18 | 19 | model_args: ModelArgs = ModelArgs( 20 | max_seq_len=args.max_seq_len, 21 | max_batch_size=32, 22 | adapter_len=args.adapter_len, 23 | adapter_layer=args.adapter_layer, 24 | **params 25 | ) 26 | tokenizer = Tokenizer(model_path=llama_model_path + "/tokenizer.model") 27 | 28 | model_args.vocab_size = tokenizer.n_words 29 | torch.set_default_tensor_type(torch.cuda.HalfTensor) 30 | model_llama_adapter = Transformer(model_args) 31 | torch.set_default_tensor_type(torch.FloatTensor) 32 | model_llama_adapter.load_state_dict(checkpoint, strict=False) 33 | 34 | for name, param in model_llama_adapter.named_parameters(): 35 | if "adapter" not in name: 36 | param.requires_grad = False 37 | else: 38 | param.requires_grad = True 39 | param.data = param.data.float() 40 | 41 | for name, param in model_llama_adapter.layers[-1 * args.adapter_layer :].named_parameters(): 42 | if "gate" in name or "adapter" in name: 43 | param.data = param.data.float() 44 | param.requires_grad = True 45 | 46 | return model_llama_adapter 47 | 48 | 49 | # set recommended archs 50 | Llama7B_adapter = Llama7B_adapter 51 | -------------------------------------------------------------------------------- /gorilla/alpaca_finetuning_v1/util/datasets.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Meta Platforms, Inc. and affiliates. 2 | # All rights reserved. 3 | 4 | # This source code is licensed under the license found in the 5 | # LICENSE file in the root directory of this source tree. 
6 | # -------------------------------------------------------- 7 | # References: 8 | # DeiT: https://github.com/facebookresearch/deit 9 | # -------------------------------------------------------- 10 | 11 | import os 12 | 13 | import PIL 14 | from timm.data import create_transform 15 | from timm.data.constants import IMAGENET_DEFAULT_MEAN, IMAGENET_DEFAULT_STD 16 | from torchvision import datasets, transforms 17 | 18 | 19 | def build_dataset(is_train, args): 20 | transform = build_transform(is_train, args) 21 | 22 | root = os.path.join(args.data_path, "train" if is_train else "val") 23 | dataset = datasets.ImageFolder(root, transform=transform) 24 | 25 | print(dataset) 26 | 27 | return dataset 28 | 29 | 30 | def build_transform(is_train, args): 31 | mean = IMAGENET_DEFAULT_MEAN 32 | std = IMAGENET_DEFAULT_STD 33 | # train transform 34 | if is_train: 35 | # this should always dispatch to transforms_imagenet_train 36 | transform = create_transform( 37 | input_size=args.input_size, 38 | is_training=True, 39 | color_jitter=args.color_jitter, 40 | auto_augment=args.aa, 41 | interpolation="bicubic", 42 | re_prob=args.reprob, 43 | re_mode=args.remode, 44 | re_count=args.recount, 45 | mean=mean, 46 | std=std, 47 | ) 48 | return transform 49 | 50 | # eval transform 51 | t = [] 52 | if args.input_size <= 224: 53 | crop_pct = 224 / 256 54 | else: 55 | crop_pct = 1.0 56 | size = int(args.input_size / crop_pct) 57 | t.append( 58 | transforms.Resize(size, interpolation=PIL.Image.BICUBIC), # to maintain same ratio w.r.t. 224 images 59 | ) 60 | t.append(transforms.CenterCrop(args.input_size)) 61 | 62 | t.append(transforms.ToTensor()) 63 | t.append(transforms.Normalize(mean, std)) 64 | return transforms.Compose(t) 65 | -------------------------------------------------------------------------------- /gorilla/alpaca_finetuning_v1/util/lars.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Meta Platforms, Inc. and affiliates. 2 | # All rights reserved. 3 | 4 | # This source code is licensed under the license found in the 5 | # LICENSE file in the root directory of this source tree. 6 | # -------------------------------------------------------- 7 | # LARS optimizer, implementation from MoCo v3: 8 | # https://github.com/facebookresearch/moco-v3 9 | # -------------------------------------------------------- 10 | 11 | import torch 12 | 13 | 14 | class LARS(torch.optim.Optimizer): 15 | """ 16 | LARS optimizer, no rate scaling or weight decay for parameters <= 1D. 
17 | """ 18 | def __init__(self, params, lr=0, weight_decay=0, momentum=0.9, trust_coefficient=0.001): 19 | defaults = dict(lr=lr, weight_decay=weight_decay, momentum=momentum, trust_coefficient=trust_coefficient) 20 | super().__init__(params, defaults) 21 | 22 | @torch.no_grad() 23 | def step(self): 24 | for g in self.param_groups: 25 | for p in g['params']: 26 | dp = p.grad 27 | 28 | if dp is None: 29 | continue 30 | 31 | if p.ndim > 1: # if not normalization gamma/beta or bias 32 | dp = dp.add(p, alpha=g['weight_decay']) 33 | param_norm = torch.norm(p) 34 | update_norm = torch.norm(dp) 35 | one = torch.ones_like(param_norm) 36 | q = torch.where(param_norm > 0., 37 | torch.where(update_norm > 0, 38 | (g['trust_coefficient'] * param_norm / update_norm), one), 39 | one) 40 | dp = dp.mul(q) 41 | 42 | param_state = self.state[p] 43 | if 'mu' not in param_state: 44 | param_state['mu'] = torch.zeros_like(p) 45 | mu = param_state['mu'] 46 | mu.mul_(g['momentum']).add_(dp) 47 | p.add_(mu, alpha=-g['lr']) -------------------------------------------------------------------------------- /gorilla/alpaca_finetuning_v1/util/lr_decay.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Meta Platforms, Inc. and affiliates. 2 | # All rights reserved. 3 | 4 | # This source code is licensed under the license found in the 5 | # LICENSE file in the root directory of this source tree. 6 | # -------------------------------------------------------- 7 | # References: 8 | # ELECTRA https://github.com/google-research/electra 9 | # BEiT: https://github.com/microsoft/unilm/tree/master/beit 10 | # -------------------------------------------------------- 11 | 12 | import json 13 | 14 | 15 | def param_groups_lrd(model, weight_decay=0.05, no_weight_decay_list=[], layer_decay=.75): 16 | """ 17 | Parameter groups for layer-wise lr decay 18 | Following BEiT: https://github.com/microsoft/unilm/blob/master/beit/optim_factory.py#L58 19 | """ 20 | param_group_names = {} 21 | param_groups = {} 22 | 23 | num_layers = len(model.blocks) + 1 24 | 25 | layer_scales = list(layer_decay ** (num_layers - i) for i in range(num_layers + 1)) 26 | 27 | for n, p in model.named_parameters(): 28 | if not p.requires_grad: 29 | continue 30 | 31 | # no decay: all 1D parameters and model specific ones 32 | if p.ndim == 1 or n in no_weight_decay_list: 33 | g_decay = "no_decay" 34 | this_decay = 0. 
35 | else: 36 | g_decay = "decay" 37 | this_decay = weight_decay 38 | 39 | layer_id = get_layer_id_for_vit(n, num_layers) 40 | group_name = "layer_%d_%s" % (layer_id, g_decay) 41 | 42 | if group_name not in param_group_names: 43 | this_scale = layer_scales[layer_id] 44 | 45 | param_group_names[group_name] = { 46 | "lr_scale": this_scale, 47 | "weight_decay": this_decay, 48 | "params": [], 49 | } 50 | param_groups[group_name] = { 51 | "lr_scale": this_scale, 52 | "weight_decay": this_decay, 53 | "params": [], 54 | } 55 | 56 | param_group_names[group_name]["params"].append(n) 57 | param_groups[group_name]["params"].append(p) 58 | 59 | # print("parameter groups: \n%s" % json.dumps(param_group_names, indent=2)) 60 | 61 | return list(param_groups.values()) 62 | 63 | 64 | def get_layer_id_for_vit(name, num_layers): 65 | """ 66 | Assign a parameter with its layer id 67 | Following BEiT: https://github.com/microsoft/unilm/blob/master/beit/optim_factory.py#L33 68 | """ 69 | if name in ['cls_token', 'pos_embed']: 70 | return 0 71 | elif name.startswith('patch_embed'): 72 | return 0 73 | elif name.startswith('blocks'): 74 | return int(name.split('.')[1]) + 1 75 | else: 76 | return num_layers -------------------------------------------------------------------------------- /gorilla/alpaca_finetuning_v1/util/lr_sched.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Meta Platforms, Inc. and affiliates. 2 | # All rights reserved. 3 | 4 | # This source code is licensed under the license found in the 5 | # LICENSE file in the root directory of this source tree. 6 | 7 | import math 8 | 9 | 10 | def adjust_learning_rate(optimizer, epoch, args): 11 | """Decay the learning rate with half-cycle cosine after warmup""" 12 | if epoch < args.warmup_epochs: 13 | lr = args.lr * epoch / args.warmup_epochs 14 | else: 15 | lr = args.min_lr + (args.lr - args.min_lr) * 0.5 * ( 16 | 1.0 + math.cos(math.pi * (epoch - args.warmup_epochs) / (args.epochs - args.warmup_epochs)) 17 | ) 18 | for param_group in optimizer.param_groups: 19 | if "lr_scale" in param_group: 20 | param_group["lr"] = lr * param_group["lr_scale"] 21 | else: 22 | param_group["lr"] = lr 23 | return lr 24 | -------------------------------------------------------------------------------- /gorilla/finetune/configs/finetune/EN.yaml: -------------------------------------------------------------------------------- 1 | META: 2 | - '../data/alpaca_gpt4_data.json' -------------------------------------------------------------------------------- /gorilla/finetune/configs/finetune/gorilla_hf.yaml: -------------------------------------------------------------------------------- 1 | META: 2 | - '../gorilla-main/data/apibench/huggingface_train.json' -------------------------------------------------------------------------------- /gorilla/finetune/configs/finetune/gorilla_tf.yaml: -------------------------------------------------------------------------------- 1 | META: 2 | - '../gorilla-main/data/apibench/tensorflow_train.json' -------------------------------------------------------------------------------- /gorilla/finetune/configs/finetune/gorilla_th.yaml: -------------------------------------------------------------------------------- 1 | META: 2 | - '../gorilla-main/data/apibench/torchhub_train.json' -------------------------------------------------------------------------------- /gorilla/finetune/data_preprocess.py: -------------------------------------------------------------------------------- 1 | import json 2 
| 3 | PROMPT_DICT = { 4 | "prompt_input": ( 5 | "Below is an instruction that describes a task, paired with an input that provides further context. " 6 | "Write a response that appropriately completes the request.\n\n" 7 | "### Instruction:\n{instruction}\n\n### Input:\n{input}\n\n### Response:" 8 | ), 9 | "prompt_no_input": ( 10 | "Below is an instruction that describes a task. " 11 | "Write a response that appropriately completes the request.\n\n" 12 | "### Instruction:\n{instruction}\n\n### Response:" 13 | ), 14 | } 15 | import pdb 16 | pdb.set_trace() 17 | 18 | datas = json.load(open('/home/pgao/stanford_alpaca/stanford_alpaca/alpaca_data.json')) 19 | prompt_input, prompt_no_input = PROMPT_DICT["prompt_input"], PROMPT_DICT["prompt_no_input"] 20 | sources = [ 21 | prompt_input.format_map(example) if example.get("input", "") != "" else prompt_no_input.format_map(example) 22 | for example in datas 23 | ] 24 | 25 | 26 | targets = [f"{example['output']}" for example in datas] 27 | examples = [s + t for s, t in zip(sources, targets)] 28 | for strings in (examples, sources): 29 | print(strings) 30 | 31 | -------------------------------------------------------------------------------- /gorilla/finetune/exps/train/base/run.sh: -------------------------------------------------------------------------------- 1 | exp_name="train/base_wamrup2000_lr_decay_1800000_batch16_32gpu_accmulation_4_lr_0005_adam_095_09_weight_decay_0_dot_1_clip_2" 2 | mkdir -p output/"$exp_name" 3 | 4 | srun -p alpha_vl --gres=gpu:8 --cpus-per-task 16 -n32 \ 5 | --ntasks-per-node=8 --quotatype=reserved python -u main_pretrain.py --batch_size 16 \ 6 | --llama_type llama --weight_decay 0.1 --output_dir output/"$exp_name" \ 7 | --accum_iter 4 --warmup_iters 2000 --lr_decay_iters 1800000 --lr 0.0005 --min_lr 0.00005 --clip_grad 2 \ 8 | 2>&1 | tee -a output/"$exp_name"/output.log 9 | -------------------------------------------------------------------------------- /gorilla/finetune/exps/train/rev/run.sh: -------------------------------------------------------------------------------- 1 | exp_name="train/rev/wamrup2000_lr_decay_1800000_batch16_32gpu_accmulation_4_lr_0005_adam_095_09_weight_decay_0_dot_1_clip_2" 2 | mkdir -p output/"$exp_name" 3 | 4 | srun -p alpha_vl --gres=gpu:8 --cpus-per-task 16 -n32 \ 5 | --ntasks-per-node=8 --quotatype=reserved python -u main_pretrain.py --batch_size 16 \ 6 | --llama_type revllama --reversible_grad --weight_decay 0.1 --output_dir output/"$exp_name" \ 7 | --accum_iter 4 --warmup_iters 2000 --lr_decay_iters 1800000 --lr 0.0005 --min_lr 0.00005 --clip_grad 2 \ 8 | 2>&1 | tee -a output/"$exp_name"/output.log 9 | -------------------------------------------------------------------------------- /gorilla/finetune/global_configs.py: -------------------------------------------------------------------------------- 1 | tokenizer_path = '/data1/llma/tokenizer.model' 2 | petrel_conf = "/mnt/petrelfs/share_data/gaopeng/ldy/petreloss_all.conf" 3 | petrel_prefix = "cluster_p_ssd:s3://falcon-refinedweb/data" 4 | data_meta_path = "/mnt/petrelfs/share_data/gaopeng/ldy/falcon_list.json" 5 | -------------------------------------------------------------------------------- /gorilla/finetune/model/LLM/__init__.py: -------------------------------------------------------------------------------- 1 | from . import llama 2 | from . 
import revllama -------------------------------------------------------------------------------- /gorilla/finetune/model/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/OpenGVLab/LLaMA-Adapter/521a09da84f70f6913d54b7421afa24010319e47/gorilla/finetune/model/__init__.py -------------------------------------------------------------------------------- /gorilla/finetune/model/meta.py: -------------------------------------------------------------------------------- 1 | import torch 2 | import torch.nn as nn 3 | import json 4 | from .tokenizer import Tokenizer 5 | from . import LLM 6 | from global_configs import tokenizer_path 7 | 8 | 9 | class MetaModel(nn.Module): 10 | """ Meta wrapper that builds a LLaMA-family Transformer (llama / revllama) and computes its language-modeling loss 11 | """ 12 | def __init__(self, llama_type, reversible_grad: bool, llama_config): 13 | super().__init__() 14 | 15 | self.criterion = torch.nn.CrossEntropyLoss(ignore_index=0) 16 | 17 | ModelArgs = LLM.__dict__[llama_type].ModelArgs 18 | Transformer = LLM.__dict__[llama_type].Transformer 19 | 20 | with open(llama_config, "r") as f: 21 | params = json.loads(f.read()) 22 | model_args: ModelArgs = ModelArgs( 23 | max_seq_len=2048, max_batch_size=32, **params 24 | ) 25 | tokenizer = Tokenizer(model_path=tokenizer_path) 26 | model_args.vocab_size = tokenizer.n_words 27 | if reversible_grad: 28 | if hasattr(model_args, "reversible_gradient"): 29 | model_args.reversible_gradient = True 30 | else: 31 | raise KeyError(f"{ModelArgs} object has no attribute reversible_gradient") 32 | 33 | model = Transformer(model_args) 34 | self.llma = model 35 | for name, param in self.named_parameters(): 36 | if param.requires_grad: 37 | print(f"Trainable param: {name}, {param.shape}, {param.dtype}") 38 | count = sum(p.numel() for p in self.parameters() if p.requires_grad) 39 | print(f"Parameter count: {count}") 40 | 41 | def forward(self, examples, labels): 42 | output = self.llma(examples) 43 | output = output[:, :-1, :] 44 | labels = labels[:, 1:] 45 | 46 | if labels.sum() == 0: 47 | c_loss = output.mean() * 0 48 | else: 49 | c_loss = self.criterion(output.reshape(-1, 32000), labels.flatten()) 50 | pred = 0 51 | mask = 0 52 | return c_loss, c_loss, pred, mask -------------------------------------------------------------------------------- /gorilla/finetune/model/tokenizer.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Meta Platforms, Inc. and affiliates. 2 | # This software may be used and distributed according to the terms of the GNU General Public License version 3.
3 | 4 | from sentencepiece import SentencePieceProcessor 5 | from logging import getLogger 6 | from typing import List 7 | import os 8 | 9 | 10 | logger = getLogger() 11 | 12 | 13 | class Tokenizer: 14 | def __init__(self, model_path: str): 15 | # reload tokenizer 16 | assert os.path.isfile(model_path), model_path 17 | self.sp_model = SentencePieceProcessor(model_file=model_path) 18 | logger.info(f"Reloaded SentencePiece model from {model_path}") 19 | 20 | # BOS / EOS token IDs 21 | self.n_words: int = self.sp_model.vocab_size() 22 | self.bos_id: int = self.sp_model.bos_id() 23 | self.eos_id: int = self.sp_model.eos_id() 24 | self.pad_id: int = self.sp_model.pad_id() 25 | logger.info( 26 | f"#words: {self.n_words} - BOS ID: {self.bos_id} - EOS ID: {self.eos_id}" 27 | ) 28 | assert self.sp_model.vocab_size() == self.sp_model.get_piece_size() 29 | 30 | def encode(self, s: str, bos: bool, eos: bool) -> List[int]: 31 | assert type(s) is str 32 | t = self.sp_model.encode(s) 33 | if bos: 34 | t = [self.bos_id] + t 35 | if eos: 36 | t = t + [self.eos_id] 37 | return t 38 | 39 | def decode(self, t: List[int]) -> str: 40 | return self.sp_model.decode(t) 41 | -------------------------------------------------------------------------------- /gorilla/finetune/params.json: -------------------------------------------------------------------------------- 1 | {"dim": 2048, "multiple_of": 256, "n_heads": 16, "n_layers": 12, "norm_eps": 1e-06, "vocab_size": -1} 2 | -------------------------------------------------------------------------------- /gorilla/finetune/scripts/finetune/finetune_7B_gorilla_hf.sh: -------------------------------------------------------------------------------- 1 | data_parallel="$1" 2 | mp="$2" 3 | llama_path="/data1/llma/7B" 4 | 5 | exp_name=finetune_"$data_parallel"_mp"$mp"_bsz2_accum_4_gpu8_lr_00002_warmup1_epoch3_max_len512_gorilla_huggingface_consolidate 6 | mkdir -p output/"$exp_name" 7 | 8 | python -u -m torch.distributed.launch --master_port=1112 --nproc_per_node=8 --use_env main_finetune.py \ 9 | --llama_type llama --weight_decay 0.1 --output_dir output/"$exp_name" \ 10 | --accum_iter 4 --batch_size 2 --warmup_epochs 1 --epochs 3 --lr 0.00002 --min_lr 0.000005 --clip_grad 2 \ 11 | --llama_config "$llama_path"/params.json \ 12 | --data_parallel "$data_parallel" --model_parallel_size "$mp" \ 13 | --max_words 512 --data_config configs/finetune/gorilla_hf.yaml --llama_tokenizer_path "$llama_path"/tokenizer.model \ 14 | --pretrained_path "$llama_path" --pretrained_type meta_ori --checkpointing \ 15 | --save_consolidated 2>&1 | tee -a output/"$exp_name"/output.log -------------------------------------------------------------------------------- /gorilla/finetune/scripts/finetune/finetune_7B_gorilla_tf.sh: -------------------------------------------------------------------------------- 1 | data_parallel="$1" 2 | mp="$2" 3 | llama_path="/data1/llma/7B" 4 | 5 | exp_name=finetune_"$data_parallel"_mp"$mp"_bsz2_accum_4_gpu8_lr_00002_warmup1_epoch3_max_len512_gorilla_tensorflow_consolidate 6 | mkdir -p output/"$exp_name" 7 | 8 | python -u -m torch.distributed.launch --master_port=1112 --nproc_per_node=8 --use_env main_finetune.py \ 9 | --llama_type llama --weight_decay 0.1 --output_dir output/"$exp_name" \ 10 | --accum_iter 4 --batch_size 2 --warmup_epochs 1 --epochs 3 --lr 0.00002 --min_lr 0.000005 --clip_grad 2 \ 11 | --llama_config "$llama_path"/params.json \ 12 | --data_parallel "$data_parallel" --model_parallel_size "$mp" \ 13 | --max_words 512 --data_config 
configs/finetune/gorilla_tf.yaml --llama_tokenizer_path "$llama_path"/tokenizer.model \ 14 | --pretrained_path "$llama_path" --pretrained_type meta_ori --checkpointing \ 15 | --save_consolidated 2>&1 | tee -a output/"$exp_name"/output.log 16 | -------------------------------------------------------------------------------- /gorilla/finetune/scripts/finetune/finetune_7B_gorilla_th.sh: -------------------------------------------------------------------------------- 1 | data_parallel="$1" 2 | mp="$2" 3 | llama_path="/data1/llma/7B" 4 | 5 | exp_name=finetune_"$data_parallel"_mp"$mp"_bsz2_accum_4_gpu8_lr_00002_warmup1_epoch3_max_len512_gorilla_torchhub_consolidate 6 | mkdir -p output/"$exp_name" 7 | 8 | python -u -m torch.distributed.launch --master_port=1112 --nproc_per_node=8 --use_env main_finetune.py \ 9 | --llama_type llama --weight_decay 0.1 --output_dir output/"$exp_name" \ 10 | --accum_iter 4 --batch_size 2 --warmup_epochs 1 --epochs 3 --lr 0.00002 --min_lr 0.000005 --clip_grad 2 \ 11 | --llama_config "$llama_path"/params.json \ 12 | --data_parallel "$data_parallel" --model_parallel_size "$mp" \ 13 | --max_words 512 --data_config configs/finetune/gorilla_th.yaml --llama_tokenizer_path "$llama_path"/tokenizer.model \ 14 | --pretrained_path "$llama_path" --pretrained_type meta_ori --checkpointing \ 15 | --save_consolidated 2>&1 | tee -a output/"$exp_name"/output.log 16 | -------------------------------------------------------------------------------- /gorilla/finetune/scripts/tools/debug_finetune_131_7B.sh: -------------------------------------------------------------------------------- 1 | load_dir="$1" 2 | save_dir="$2" 3 | 4 | exp_name=tool/get_consolidated_ckpt 5 | mkdir -p output/"$exp_name" 6 | mkdir -p "$save_dir" 7 | 8 | python -u -m torch.distributed.launch --master_port=1112 --nproc_per_node=8 --use_env \ 9 | tools/get_consolidated_ckpt.py \ 10 | --llama_type llama \ 11 | --llama_config /data1/llma/7B/params.json \ 12 | --data_parallel sdp --model_parallel_size 1 \ 13 | --load_dir "$load_dir" --save_dir "$save_dir" \ 14 | 2>&1 | tee -a output/"$exp_name"/output.log 15 | -------------------------------------------------------------------------------- /gorilla/finetune/scripts/tools/merge130.sh: -------------------------------------------------------------------------------- 1 | load_dir="$1" 2 | save_dir="$2" 3 | 4 | exp_name=tool/get_consolidated_ckpt 5 | mkdir -p output/"$exp_name" 6 | mkdir -p "$save_dir" 7 | 8 | python -u -m torch.distributed.launch --master_port=1112 --nproc_per_node=8 --use_env \ 9 | tools/get_consolidated_ckpt.py \ 10 | --llama_type llama \ 11 | --llama_config /data1/llma/7B/params.json \ 12 | --data_parallel sdp --model_parallel_size 1 \ 13 | --load_dir "$load_dir" --save_dir "$save_dir" \ 14 | 2>&1 | tee -a output/"$exp_name"/output.log 15 | -------------------------------------------------------------------------------- /gorilla/finetune/util/crop.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Meta Platforms, Inc. and affiliates. 2 | # All rights reserved. 3 | 4 | # This source code is licensed under the license found in the 5 | # LICENSE file in the root directory of this source tree. 6 | 7 | import math 8 | 9 | import torch 10 | 11 | from torchvision import transforms 12 | from torchvision.transforms import functional as F 13 | 14 | 15 | class RandomResizedCrop(transforms.RandomResizedCrop): 16 | """ 17 | RandomResizedCrop for matching TF/TPU implementation: no for-loop is used. 
18 | This may lead to results different with torchvision's version. 19 | Following BYOL's TF code: 20 | https://github.com/deepmind/deepmind-research/blob/master/byol/utils/dataset.py#L206 21 | """ 22 | @staticmethod 23 | def get_params(img, scale, ratio): 24 | width, height = F._get_image_size(img) 25 | area = height * width 26 | 27 | target_area = area * torch.empty(1).uniform_(scale[0], scale[1]).item() 28 | log_ratio = torch.log(torch.tensor(ratio)) 29 | aspect_ratio = torch.exp( 30 | torch.empty(1).uniform_(log_ratio[0], log_ratio[1]) 31 | ).item() 32 | 33 | w = int(round(math.sqrt(target_area * aspect_ratio))) 34 | h = int(round(math.sqrt(target_area / aspect_ratio))) 35 | 36 | w = min(w, width) 37 | h = min(h, height) 38 | 39 | i = torch.randint(0, height - h + 1, size=(1,)).item() 40 | j = torch.randint(0, width - w + 1, size=(1,)).item() 41 | 42 | return i, j, h, w -------------------------------------------------------------------------------- /gorilla/finetune/util/lr_decay.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Meta Platforms, Inc. and affiliates. 2 | # All rights reserved. 3 | 4 | # This source code is licensed under the license found in the 5 | # LICENSE file in the root directory of this source tree. 6 | # -------------------------------------------------------- 7 | # References: 8 | # ELECTRA https://github.com/google-research/electra 9 | # BEiT: https://github.com/microsoft/unilm/tree/master/beit 10 | # -------------------------------------------------------- 11 | 12 | import json 13 | 14 | 15 | def param_groups_lrd(model, weight_decay=0.05, no_weight_decay_list=[], layer_decay=.75): 16 | """ 17 | Parameter groups for layer-wise lr decay 18 | Following BEiT: https://github.com/microsoft/unilm/blob/master/beit/optim_factory.py#L58 19 | """ 20 | param_group_names = {} 21 | param_groups = {} 22 | 23 | num_layers = len(model.blocks) + 1 24 | 25 | layer_scales = list(layer_decay ** (num_layers - i) for i in range(num_layers + 1)) 26 | 27 | for n, p in model.named_parameters(): 28 | if not p.requires_grad: 29 | continue 30 | 31 | # no decay: all 1D parameters and model specific ones 32 | if p.ndim == 1 or n in no_weight_decay_list: 33 | g_decay = "no_decay" 34 | this_decay = 0. 
35 | else: 36 | g_decay = "decay" 37 | this_decay = weight_decay 38 | 39 | layer_id = get_layer_id_for_vit(n, num_layers) 40 | group_name = "layer_%d_%s" % (layer_id, g_decay) 41 | 42 | if group_name not in param_group_names: 43 | this_scale = layer_scales[layer_id] 44 | 45 | param_group_names[group_name] = { 46 | "lr_scale": this_scale, 47 | "weight_decay": this_decay, 48 | "params": [], 49 | } 50 | param_groups[group_name] = { 51 | "lr_scale": this_scale, 52 | "weight_decay": this_decay, 53 | "params": [], 54 | } 55 | 56 | param_group_names[group_name]["params"].append(n) 57 | param_groups[group_name]["params"].append(p) 58 | 59 | # print("parameter groups: \n%s" % json.dumps(param_group_names, indent=2)) 60 | 61 | return list(param_groups.values()) 62 | 63 | 64 | def get_layer_id_for_vit(name, num_layers): 65 | """ 66 | Assign a parameter with its layer id 67 | Following BEiT: https://github.com/microsoft/unilm/blob/master/beit/optim_factory.py#L33 68 | """ 69 | if name in ['cls_token', 'pos_embed']: 70 | return 0 71 | elif name.startswith('patch_embed'): 72 | return 0 73 | elif name.startswith('blocks'): 74 | return int(name.split('.')[1]) + 1 75 | else: 76 | return num_layers -------------------------------------------------------------------------------- /gorilla/finetune/util/lr_sched.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Meta Platforms, Inc. and affiliates. 2 | # All rights reserved. 3 | 4 | # This source code is licensed under the license found in the 5 | # LICENSE file in the root directory of this source tree. 6 | 7 | import math 8 | 9 | def adjust_learning_rate(optimizer, it, args): 10 | """Decay the learning rate with half-cycle cosine after warmup""" 11 | if it < args.warmup_iters: # 1) linear warmup for warmup_iters steps 12 | lr = args.lr * it / args.warmup_iters 13 | elif it > args.lr_decay_iters: # 2) if it > lr_decay_iters, return min learning rate 14 | lr = args.min_lr 15 | else: # 3) in between, use cosine decay down to min learning rate 16 | decay_ratio = (it - args.warmup_iters) / (args.lr_decay_iters - args.warmup_iters) 17 | assert 0 <= decay_ratio <= 1 18 | coeff = 0.5 * (1.0 + math.cos(math.pi * decay_ratio)) # coeff ranges 0..1 19 | lr = args.min_lr + (args.lr - args.min_lr) * coeff 20 | 21 | for param_group in optimizer.param_groups: 22 | if "lr_scale" in param_group: 23 | param_group["lr"] = lr * param_group["lr_scale"] 24 | else: 25 | param_group["lr"] = lr 26 | return lr 27 | 28 | 29 | def adjust_learning_rate_epoch(optimizer, epoch, args): 30 | """Decay the learning rate with half-cycle cosine after warmup""" 31 | if epoch < args.warmup_epochs: 32 | lr = args.lr * epoch / args.warmup_epochs 33 | else: 34 | lr = args.min_lr + (args.lr - args.min_lr) * 0.5 * \ 35 | (1. 
+ math.cos(math.pi * (epoch - args.warmup_epochs) / (args.epochs - args.warmup_epochs))) 36 | for param_group in optimizer.param_groups: 37 | if "lr_scale" in param_group: 38 | param_group["lr"] = lr * param_group["lr_scale"] 39 | else: 40 | param_group["lr"] = lr 41 | return lr 42 | -------------------------------------------------------------------------------- /gorilla/gorilla-main/.github/ISSUE_TEMPLATE/apibench.md: -------------------------------------------------------------------------------- 1 | --- 2 | name: APIBench 3 | about: Create a report to help us improve APIBench 4 | title: "[Apibench] " 5 | labels: apibench-data 6 | assignees: '' 7 | 8 | --- 9 | 10 | **Describe the issue** 11 | A clear and concise description of what the issue is. 12 | 13 | **ID datapoint** 14 | 1. Datapoint permalink: (If more than one, include as a python list of strings) 15 | 2. Provider: TorchHub/HuggingFace/TensorFlow Hub 16 | 3. Gorilla repo commit #: 17 | 18 | **What is the issue** 19 | 20 | **Proposed Changes** 21 | 22 | { 23 | 'previous_datapoint':[], 24 | 'updated_datapoint':[] 25 | } 26 | 27 | **Additional context** 28 | Add any other context about the problem here. 29 | -------------------------------------------------------------------------------- /gorilla/gorilla-main/.github/ISSUE_TEMPLATE/custom-template.md: -------------------------------------------------------------------------------- 1 | --- 2 | name: Custom template 3 | about: Custom template 4 | title: '' 5 | labels: '' 6 | assignees: '' 7 | 8 | --- 9 | 10 | 11 | -------------------------------------------------------------------------------- /gorilla/gorilla-main/.github/ISSUE_TEMPLATE/feature_request.md: -------------------------------------------------------------------------------- 1 | --- 2 | name: Feature request 3 | about: Suggest an idea for this project 4 | title: "[feature] " 5 | labels: enhancement 6 | assignees: '' 7 | 8 | --- 9 | 10 | **Is the feature request related to a problem?** 11 | Ex. I'd like to see [...] 12 | 13 | **Describe the solution you'd like** 14 | When I run [X], I want to see [Y] 15 | 16 | **Additional context** 17 | Add any other context or screenshots about the feature request here. 18 | -------------------------------------------------------------------------------- /gorilla/gorilla-main/.github/ISSUE_TEMPLATE/hosted-gorilla-.md: -------------------------------------------------------------------------------- 1 | --- 2 | name: 'Hosted Gorilla ' 3 | about: Issues when using hosted Gorilla 4 | title: "[bug] Hosted Gorilla: " 5 | labels: hosted-gorilla 6 | assignees: '' 7 | 8 | --- 9 | 10 | **Describe the bug** 11 | A clear and concise description of what the bug is. 12 | 13 | **To Reproduce** 14 | Steps to reproduce the behavior: 15 | 1. I tried '...' on and