├── .devcontainer
    ├── Dockerfile
    ├── devcontainer.env
    ├── devcontainer.json
    └── postCreateCommand.sh
├── .dockerignore
├── .editorconfig
├── .gitattributes
├── .github
    └── ISSUE_TEMPLATE
    │   ├── 1-usage.yaml
    │   ├── 2-feature-request.yaml
    │   ├── 3-question.yaml
    │   └── 4-discussion.yaml
├── .gitignore
├── LICENSE
├── README.md
├── cog.yaml
├── docs
    ├── Customize_Component.md
    ├── Data.md
    ├── Evaluation.md
    ├── Finetune_Custom_Data.md
    ├── Intel.md
    ├── LLaVA_Bench.md
    ├── LLaVA_from_LLaMA2.md
    ├── LoRA.md
    ├── MODEL_ZOO.md
    ├── ScienceQA.md
    ├── Windows.md
    └── macOS.md
├── evaluation
    ├── evaluate_final.py
    ├── inference.py
    └── llm_generate.py
├── images
    ├── demo_cli.gif
    ├── llava_example_cmp.png
    ├── llava_logo.png
    └── llava_v1_5_radar.jpg
├── llava
    ├── __init__.py
    ├── constants.py
    ├── conversation.py
    ├── eval
    │   ├── eval_gpt_review.py
    │   ├── eval_gpt_review_bench.py
    │   ├── eval_gpt_review_visual.py
    │   ├── eval_pope.py
    │   ├── eval_science_qa.py
    │   ├── eval_science_qa_gpt4.py
    │   ├── eval_science_qa_gpt4_requery.py
    │   ├── eval_textvqa.py
    │   ├── generate_webpage_data_from_table.py
    │   ├── m4c_evaluator.py
    │   ├── model_qa.py
    │   ├── model_vqa.py
    │   ├── model_vqa_loader.py
    │   ├── model_vqa_mmbench.py
    │   ├── model_vqa_science.py
    │   ├── qa_baseline_gpt35.py
    │   ├── run_llava.py
    │   ├── summarize_gpt_review.py
    │   └── webpage
    │   │   ├── figures
    │   │       ├── alpaca.png
    │   │       ├── bard.jpg
    │   │       ├── chatgpt.svg
    │   │       ├── llama.jpg
    │   │       ├── swords_FILL0_wght300_GRAD0_opsz48.svg
    │   │       └── vicuna.jpeg
    │   │   ├── index.html
    │   │   ├── script.js
    │   │   └── styles.css
    ├── mm_utils.py
    ├── model
    │   ├── __init__.py
    │   ├── apply_delta.py
    │   ├── builder.py
    │   ├── consolidate.py
    │   ├── depth
    │   │   ├── DA-2K.md
    │   │   ├── LICENSE
    │   │   ├── README.md
    │   │   ├── app.py
    │   │   ├── assets
    │   │   │   ├── DA-2K.png
    │   │   │   ├── examples
    │   │   │   │   ├── demo01.jpg
    │   │   │   │   ├── demo02.jpg
    │   │   │   │   ├── demo03.jpg
    │   │   │   │   ├── demo04.jpg
    │   │   │   │   ├── demo05.jpg
    │   │   │   │   ├── demo06.jpg
    │   │   │   │   ├── demo07.jpg
    │   │   │   │   ├── demo08.jpg
    │   │   │   │   ├── demo09.jpg
    │   │   │   │   ├── demo10.jpg
    │   │   │   │   ├── demo11.jpg
    │   │   │   │   ├── demo12.jpg
    │   │   │   │   ├── demo13.jpg
    │   │   │   │   ├── demo14.jpg
    │   │   │   │   ├── demo15.jpg
    │   │   │   │   ├── demo16.jpg
    │   │   │   │   ├── demo17.jpg
    │   │   │   │   ├── demo18.jpg
    │   │   │   │   ├── demo19.jpg
    │   │   │   │   └── demo20.jpg
    │   │   │   ├── examples_video
    │   │   │   │   ├── basketball.mp4
    │   │   │   │   └── ferris_wheel.mp4
    │   │   │   └── teaser.png
    │   │   ├── depth_anything_v2
    │   │   │   ├── dinov2.py
    │   │   │   ├── dinov2_layers
    │   │   │   │   ├── __init__.py
    │   │   │   │   ├── attention.py
    │   │   │   │   ├── block.py
    │   │   │   │   ├── drop_path.py
    │   │   │   │   ├── layer_scale.py
    │   │   │   │   ├── mlp.py
    │   │   │   │   ├── patch_embed.py
    │   │   │   │   └── swiglu_ffn.py
    │   │   │   ├── dpt.py
    │   │   │   └── util
    │   │   │   │   ├── blocks.py
    │   │   │   │   └── transform.py
    │   │   ├── metric_depth
    │   │   │   ├── README.md
    │   │   │   ├── assets
    │   │   │   │   └── compare_zoedepth.png
    │   │   │   ├── dataset
    │   │   │   │   ├── hypersim.py
    │   │   │   │   ├── kitti.py
    │   │   │   │   ├── splits
    │   │   │   │   │   ├── hypersim
    │   │   │   │   │   │   ├── train.txt
    │   │   │   │   │   │   └── val.txt
    │   │   │   │   │   ├── kitti
    │   │   │   │   │   │   └── val.txt
    │   │   │   │   │   └── vkitti2
    │   │   │   │   │   │   └── train.txt
    │   │   │   │   ├── transform.py
    │   │   │   │   └── vkitti2.py
    │   │   │   ├── depth_anything_v2
    │   │   │   │   ├── dinov2.py
    │   │   │   │   ├── dinov2_layers
    │   │   │   │   │   ├── __init__.py
    │   │   │   │   │   ├── attention.py
    │   │   │   │   │   ├── block.py
    │   │   │   │   │   ├── drop_path.py
    │   │   │   │   │   ├── layer_scale.py
    │   │   │   │   │   ├── mlp.py
    │   │   │   │   │   ├── patch_embed.py
    │   │   │   │   │   └── swiglu_ffn.py
    │   │   │   │   ├── dpt.py
    │   │   │   │   └── util
    │   │   │   │   │   ├── blocks.py
    │   │   │   │   │   └── transform.py
    │   │   │   ├── depth_to_pointcloud.py
    │   │   │   ├── dist_train.sh
    │   │   │   ├── requirements.txt
    │   │   │   ├── run.py
    │   │   │   ├── train.py
    │   │   │   └── util
    │   │   │   │   ├── dist_helper.py
    │   │   │   │   ├── loss.py
    │   │   │   │   ├── metric.py
    │   │   │   │   └── utils.py
    │   │   ├── requirements.txt
    │   │   ├── run.py
    │   │   └── run_video.py
    │   ├── depth_encoding.py
    │   ├── language_model
    │   │   ├── llava_llama.py
    │   │   ├── llava_mistral.py
    │   │   └── llava_mpt.py
    │   ├── llava_arch.py
    │   ├── make_delta.py
    │   ├── multimodal_encoder
    │   │   ├── builder.py
    │   │   └── clip_encoder.py
    │   ├── multimodal_projector
    │   │   └── builder.py
    │   └── utils.py
    ├── serve
    │   ├── __init__.py
    │   ├── cli.py
    │   ├── controller.py
    │   ├── examples
    │   │   ├── extreme_ironing.jpg
    │   │   └── waterview.jpg
    │   ├── gradio_web_server.py
    │   ├── model_worker.py
    │   ├── register_worker.py
    │   ├── sglang_worker.py
    │   └── test_message.py
    ├── train
    │   ├── llama_flash_attn_monkey_patch.py
    │   ├── llama_xformers_attn_monkey_patch.py
    │   ├── llava_trainer.py
    │   ├── train.py
    │   ├── train_mem.py
    │   └── train_xformers.py
    └── utils.py
├── predict.py
├── pyproject.toml
└── scripts
    ├── convert_gqa_for_eval.py
    ├── convert_mmbench_for_submission.py
    ├── convert_mmvet_for_eval.py
    ├── convert_seed_for_submission.py
    ├── convert_sqa_to_llava.py
    ├── convert_sqa_to_llava_base_prompt.py
    ├── convert_vizwiz_for_submission.py
    ├── convert_vqav2_for_submission.py
    ├── extract_mm_projector.py
    ├── finetune.sh
    ├── finetune_full_schedule.sh
    ├── finetune_lora.sh
    ├── finetune_qlora.sh
    ├── finetune_sqa.sh
    ├── merge_lora_weights.py
    ├── pretrain.sh
    ├── pretrain_xformers.sh
    ├── sqa_eval_batch.sh
    ├── sqa_eval_gather.sh
    ├── upload_pypi.sh
    └── v1_5
        ├── eval
            ├── gqa.sh
            ├── llavabench.sh
            ├── mmbench.sh
            ├── mmbench_cn.sh
            ├── mme.sh
            ├── mmvet.sh
            ├── pope.sh
            ├── qbench.sh
            ├── qbench_zh.sh
            ├── seed.sh
            ├── sqa.sh
            ├── textvqa.sh
            ├── vizwiz.sh
            └── vqav2.sh
        ├── finetune.sh
        ├── finetune_task.sh
        ├── finetune_task_lora.sh
        └── pretrain.sh


/.devcontainer/Dockerfile:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/.devcontainer/Dockerfile


--------------------------------------------------------------------------------
/.devcontainer/devcontainer.env:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/.devcontainer/devcontainer.env


--------------------------------------------------------------------------------
/.devcontainer/devcontainer.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/.devcontainer/devcontainer.json


--------------------------------------------------------------------------------
/.devcontainer/postCreateCommand.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/.devcontainer/postCreateCommand.sh


--------------------------------------------------------------------------------
/.dockerignore:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/.dockerignore


--------------------------------------------------------------------------------
/.editorconfig:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/.editorconfig


--------------------------------------------------------------------------------
/.gitattributes:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/.gitattributes


--------------------------------------------------------------------------------
/.github/ISSUE_TEMPLATE/1-usage.yaml:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/.github/ISSUE_TEMPLATE/1-usage.yaml


--------------------------------------------------------------------------------
/.github/ISSUE_TEMPLATE/2-feature-request.yaml:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/.github/ISSUE_TEMPLATE/2-feature-request.yaml


--------------------------------------------------------------------------------
/.github/ISSUE_TEMPLATE/3-question.yaml:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/.github/ISSUE_TEMPLATE/3-question.yaml


--------------------------------------------------------------------------------
/.github/ISSUE_TEMPLATE/4-discussion.yaml:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/.github/ISSUE_TEMPLATE/4-discussion.yaml


--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/.gitignore


--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/LICENSE


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/README.md


--------------------------------------------------------------------------------
/cog.yaml:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/cog.yaml


--------------------------------------------------------------------------------
/docs/Customize_Component.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/docs/Customize_Component.md


--------------------------------------------------------------------------------
/docs/Data.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/docs/Data.md


--------------------------------------------------------------------------------
/docs/Evaluation.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/docs/Evaluation.md


--------------------------------------------------------------------------------
/docs/Finetune_Custom_Data.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/docs/Finetune_Custom_Data.md


--------------------------------------------------------------------------------
/docs/Intel.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/docs/Intel.md


--------------------------------------------------------------------------------
/docs/LLaVA_Bench.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/docs/LLaVA_Bench.md


--------------------------------------------------------------------------------
/docs/LLaVA_from_LLaMA2.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/docs/LLaVA_from_LLaMA2.md


--------------------------------------------------------------------------------
/docs/LoRA.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/docs/LoRA.md


--------------------------------------------------------------------------------
/docs/MODEL_ZOO.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/docs/MODEL_ZOO.md


--------------------------------------------------------------------------------
/docs/ScienceQA.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/docs/ScienceQA.md


--------------------------------------------------------------------------------
/docs/Windows.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/docs/Windows.md


--------------------------------------------------------------------------------
/docs/macOS.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/docs/macOS.md


--------------------------------------------------------------------------------
/evaluation/evaluate_final.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/evaluation/evaluate_final.py


--------------------------------------------------------------------------------
/evaluation/inference.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/evaluation/inference.py


--------------------------------------------------------------------------------
/evaluation/llm_generate.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/evaluation/llm_generate.py


--------------------------------------------------------------------------------
/images/demo_cli.gif:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/images/demo_cli.gif


--------------------------------------------------------------------------------
/images/llava_example_cmp.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/images/llava_example_cmp.png


--------------------------------------------------------------------------------
/images/llava_logo.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/images/llava_logo.png


--------------------------------------------------------------------------------
/images/llava_v1_5_radar.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/images/llava_v1_5_radar.jpg


--------------------------------------------------------------------------------
/llava/__init__.py:
--------------------------------------------------------------------------------
1 | from .model import LlavaLlamaForCausalLM
2 | 


--------------------------------------------------------------------------------
/llava/constants.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/constants.py


--------------------------------------------------------------------------------
/llava/conversation.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/conversation.py


--------------------------------------------------------------------------------
/llava/eval/eval_gpt_review.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/eval_gpt_review.py


--------------------------------------------------------------------------------
/llava/eval/eval_gpt_review_bench.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/eval_gpt_review_bench.py


--------------------------------------------------------------------------------
/llava/eval/eval_gpt_review_visual.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/eval_gpt_review_visual.py


--------------------------------------------------------------------------------
/llava/eval/eval_pope.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/eval_pope.py


--------------------------------------------------------------------------------
/llava/eval/eval_science_qa.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/eval_science_qa.py


--------------------------------------------------------------------------------
/llava/eval/eval_science_qa_gpt4.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/eval_science_qa_gpt4.py


--------------------------------------------------------------------------------
/llava/eval/eval_science_qa_gpt4_requery.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/eval_science_qa_gpt4_requery.py


--------------------------------------------------------------------------------
/llava/eval/eval_textvqa.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/eval_textvqa.py


--------------------------------------------------------------------------------
/llava/eval/generate_webpage_data_from_table.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/generate_webpage_data_from_table.py


--------------------------------------------------------------------------------
/llava/eval/m4c_evaluator.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/m4c_evaluator.py


--------------------------------------------------------------------------------
/llava/eval/model_qa.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/model_qa.py


--------------------------------------------------------------------------------
/llava/eval/model_vqa.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/model_vqa.py


--------------------------------------------------------------------------------
/llava/eval/model_vqa_loader.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/model_vqa_loader.py


--------------------------------------------------------------------------------
/llava/eval/model_vqa_mmbench.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/model_vqa_mmbench.py


--------------------------------------------------------------------------------
/llava/eval/model_vqa_science.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/model_vqa_science.py


--------------------------------------------------------------------------------
/llava/eval/qa_baseline_gpt35.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/qa_baseline_gpt35.py


--------------------------------------------------------------------------------
/llava/eval/run_llava.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/run_llava.py


--------------------------------------------------------------------------------
/llava/eval/summarize_gpt_review.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/summarize_gpt_review.py


--------------------------------------------------------------------------------
/llava/eval/webpage/figures/alpaca.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/webpage/figures/alpaca.png


--------------------------------------------------------------------------------
/llava/eval/webpage/figures/bard.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/webpage/figures/bard.jpg


--------------------------------------------------------------------------------
/llava/eval/webpage/figures/chatgpt.svg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/webpage/figures/chatgpt.svg


--------------------------------------------------------------------------------
/llava/eval/webpage/figures/llama.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/webpage/figures/llama.jpg


--------------------------------------------------------------------------------
/llava/eval/webpage/figures/swords_FILL0_wght300_GRAD0_opsz48.svg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/webpage/figures/swords_FILL0_wght300_GRAD0_opsz48.svg


--------------------------------------------------------------------------------
/llava/eval/webpage/figures/vicuna.jpeg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/webpage/figures/vicuna.jpeg


--------------------------------------------------------------------------------
/llava/eval/webpage/index.html:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/webpage/index.html


--------------------------------------------------------------------------------
/llava/eval/webpage/script.js:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/webpage/script.js


--------------------------------------------------------------------------------
/llava/eval/webpage/styles.css:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/eval/webpage/styles.css


--------------------------------------------------------------------------------
/llava/mm_utils.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/mm_utils.py


--------------------------------------------------------------------------------
/llava/model/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/__init__.py


--------------------------------------------------------------------------------
/llava/model/apply_delta.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/apply_delta.py


--------------------------------------------------------------------------------
/llava/model/builder.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/builder.py


--------------------------------------------------------------------------------
/llava/model/consolidate.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/consolidate.py


--------------------------------------------------------------------------------
/llava/model/depth/DA-2K.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/DA-2K.md


--------------------------------------------------------------------------------
/llava/model/depth/LICENSE:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/LICENSE


--------------------------------------------------------------------------------
/llava/model/depth/README.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/README.md


--------------------------------------------------------------------------------
/llava/model/depth/app.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/app.py


--------------------------------------------------------------------------------
/llava/model/depth/assets/DA-2K.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/DA-2K.png


--------------------------------------------------------------------------------
/llava/model/depth/assets/examples/demo01.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/examples/demo01.jpg


--------------------------------------------------------------------------------
/llava/model/depth/assets/examples/demo02.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/examples/demo02.jpg


--------------------------------------------------------------------------------
/llava/model/depth/assets/examples/demo03.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/examples/demo03.jpg


--------------------------------------------------------------------------------
/llava/model/depth/assets/examples/demo04.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/examples/demo04.jpg


--------------------------------------------------------------------------------
/llava/model/depth/assets/examples/demo05.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/examples/demo05.jpg


--------------------------------------------------------------------------------
/llava/model/depth/assets/examples/demo06.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/examples/demo06.jpg


--------------------------------------------------------------------------------
/llava/model/depth/assets/examples/demo07.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/examples/demo07.jpg


--------------------------------------------------------------------------------
/llava/model/depth/assets/examples/demo08.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/examples/demo08.jpg


--------------------------------------------------------------------------------
/llava/model/depth/assets/examples/demo09.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/examples/demo09.jpg


--------------------------------------------------------------------------------
/llava/model/depth/assets/examples/demo10.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/examples/demo10.jpg


--------------------------------------------------------------------------------
/llava/model/depth/assets/examples/demo11.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/examples/demo11.jpg


--------------------------------------------------------------------------------
/llava/model/depth/assets/examples/demo12.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/examples/demo12.jpg


--------------------------------------------------------------------------------
/llava/model/depth/assets/examples/demo13.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/examples/demo13.jpg


--------------------------------------------------------------------------------
/llava/model/depth/assets/examples/demo14.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/examples/demo14.jpg


--------------------------------------------------------------------------------
/llava/model/depth/assets/examples/demo15.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/examples/demo15.jpg


--------------------------------------------------------------------------------
/llava/model/depth/assets/examples/demo16.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/examples/demo16.jpg


--------------------------------------------------------------------------------
/llava/model/depth/assets/examples/demo17.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/examples/demo17.jpg


--------------------------------------------------------------------------------
/llava/model/depth/assets/examples/demo18.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/examples/demo18.jpg


--------------------------------------------------------------------------------
/llava/model/depth/assets/examples/demo19.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/examples/demo19.jpg


--------------------------------------------------------------------------------
/llava/model/depth/assets/examples/demo20.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/examples/demo20.jpg


--------------------------------------------------------------------------------
/llava/model/depth/assets/examples_video/basketball.mp4:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/examples_video/basketball.mp4


--------------------------------------------------------------------------------
/llava/model/depth/assets/examples_video/ferris_wheel.mp4:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/examples_video/ferris_wheel.mp4


--------------------------------------------------------------------------------
/llava/model/depth/assets/teaser.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/assets/teaser.png


--------------------------------------------------------------------------------
/llava/model/depth/depth_anything_v2/dinov2.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/depth_anything_v2/dinov2.py


--------------------------------------------------------------------------------
/llava/model/depth/depth_anything_v2/dinov2_layers/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/depth_anything_v2/dinov2_layers/__init__.py


--------------------------------------------------------------------------------
/llava/model/depth/depth_anything_v2/dinov2_layers/attention.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/depth_anything_v2/dinov2_layers/attention.py


--------------------------------------------------------------------------------
/llava/model/depth/depth_anything_v2/dinov2_layers/block.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/depth_anything_v2/dinov2_layers/block.py


--------------------------------------------------------------------------------
/llava/model/depth/depth_anything_v2/dinov2_layers/drop_path.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/depth_anything_v2/dinov2_layers/drop_path.py


--------------------------------------------------------------------------------
/llava/model/depth/depth_anything_v2/dinov2_layers/layer_scale.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/depth_anything_v2/dinov2_layers/layer_scale.py


--------------------------------------------------------------------------------
/llava/model/depth/depth_anything_v2/dinov2_layers/mlp.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/depth_anything_v2/dinov2_layers/mlp.py


--------------------------------------------------------------------------------
/llava/model/depth/depth_anything_v2/dinov2_layers/patch_embed.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/depth_anything_v2/dinov2_layers/patch_embed.py


--------------------------------------------------------------------------------
/llava/model/depth/depth_anything_v2/dinov2_layers/swiglu_ffn.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/depth_anything_v2/dinov2_layers/swiglu_ffn.py


--------------------------------------------------------------------------------
/llava/model/depth/depth_anything_v2/dpt.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/depth_anything_v2/dpt.py


--------------------------------------------------------------------------------
/llava/model/depth/depth_anything_v2/util/blocks.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/depth_anything_v2/util/blocks.py


--------------------------------------------------------------------------------
/llava/model/depth/depth_anything_v2/util/transform.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/depth_anything_v2/util/transform.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/README.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/README.md


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/assets/compare_zoedepth.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/assets/compare_zoedepth.png


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/dataset/hypersim.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/dataset/hypersim.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/dataset/kitti.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/dataset/kitti.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/dataset/splits/hypersim/train.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/dataset/splits/hypersim/train.txt


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/dataset/splits/hypersim/val.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/dataset/splits/hypersim/val.txt


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/dataset/splits/kitti/val.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/dataset/splits/kitti/val.txt


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/dataset/splits/vkitti2/train.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/dataset/splits/vkitti2/train.txt


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/dataset/transform.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/dataset/transform.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/dataset/vkitti2.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/dataset/vkitti2.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/depth_anything_v2/dinov2.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/depth_anything_v2/dinov2.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/depth_anything_v2/dinov2_layers/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/depth_anything_v2/dinov2_layers/__init__.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/depth_anything_v2/dinov2_layers/attention.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/depth_anything_v2/dinov2_layers/attention.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/depth_anything_v2/dinov2_layers/block.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/depth_anything_v2/dinov2_layers/block.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/depth_anything_v2/dinov2_layers/drop_path.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/depth_anything_v2/dinov2_layers/drop_path.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/depth_anything_v2/dinov2_layers/layer_scale.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/depth_anything_v2/dinov2_layers/layer_scale.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/depth_anything_v2/dinov2_layers/mlp.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/depth_anything_v2/dinov2_layers/mlp.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/depth_anything_v2/dinov2_layers/patch_embed.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/depth_anything_v2/dinov2_layers/patch_embed.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/depth_anything_v2/dinov2_layers/swiglu_ffn.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/depth_anything_v2/dinov2_layers/swiglu_ffn.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/depth_anything_v2/dpt.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/depth_anything_v2/dpt.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/depth_anything_v2/util/blocks.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/depth_anything_v2/util/blocks.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/depth_anything_v2/util/transform.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/depth_anything_v2/util/transform.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/depth_to_pointcloud.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/depth_to_pointcloud.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/dist_train.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/dist_train.sh


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/requirements.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/requirements.txt


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/run.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/run.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/train.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/train.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/util/dist_helper.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/util/dist_helper.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/util/loss.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/util/loss.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/util/metric.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/util/metric.py


--------------------------------------------------------------------------------
/llava/model/depth/metric_depth/util/utils.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/metric_depth/util/utils.py


--------------------------------------------------------------------------------
/llava/model/depth/requirements.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/requirements.txt


--------------------------------------------------------------------------------
/llava/model/depth/run.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/run.py


--------------------------------------------------------------------------------
/llava/model/depth/run_video.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth/run_video.py


--------------------------------------------------------------------------------
/llava/model/depth_encoding.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/depth_encoding.py


--------------------------------------------------------------------------------
/llava/model/language_model/llava_llama.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/language_model/llava_llama.py


--------------------------------------------------------------------------------
/llava/model/language_model/llava_mistral.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/language_model/llava_mistral.py


--------------------------------------------------------------------------------
/llava/model/language_model/llava_mpt.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/language_model/llava_mpt.py


--------------------------------------------------------------------------------
/llava/model/llava_arch.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/llava_arch.py


--------------------------------------------------------------------------------
/llava/model/make_delta.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/make_delta.py


--------------------------------------------------------------------------------
/llava/model/multimodal_encoder/builder.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/multimodal_encoder/builder.py


--------------------------------------------------------------------------------
/llava/model/multimodal_encoder/clip_encoder.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/multimodal_encoder/clip_encoder.py


--------------------------------------------------------------------------------
/llava/model/multimodal_projector/builder.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/multimodal_projector/builder.py


--------------------------------------------------------------------------------
/llava/model/utils.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/model/utils.py


--------------------------------------------------------------------------------
/llava/serve/__init__.py:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/llava/serve/cli.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/serve/cli.py


--------------------------------------------------------------------------------
/llava/serve/controller.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/serve/controller.py


--------------------------------------------------------------------------------
/llava/serve/examples/extreme_ironing.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/serve/examples/extreme_ironing.jpg


--------------------------------------------------------------------------------
/llava/serve/examples/waterview.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/serve/examples/waterview.jpg


--------------------------------------------------------------------------------
/llava/serve/gradio_web_server.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/serve/gradio_web_server.py


--------------------------------------------------------------------------------
/llava/serve/model_worker.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/serve/model_worker.py


--------------------------------------------------------------------------------
/llava/serve/register_worker.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/serve/register_worker.py


--------------------------------------------------------------------------------
/llava/serve/sglang_worker.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/serve/sglang_worker.py


--------------------------------------------------------------------------------
/llava/serve/test_message.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/serve/test_message.py


--------------------------------------------------------------------------------
/llava/train/llama_flash_attn_monkey_patch.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/train/llama_flash_attn_monkey_patch.py


--------------------------------------------------------------------------------
/llava/train/llama_xformers_attn_monkey_patch.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/train/llama_xformers_attn_monkey_patch.py


--------------------------------------------------------------------------------
/llava/train/llava_trainer.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/train/llava_trainer.py


--------------------------------------------------------------------------------
/llava/train/train.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/train/train.py


--------------------------------------------------------------------------------
/llava/train/train_mem.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/train/train_mem.py


--------------------------------------------------------------------------------
/llava/train/train_xformers.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/train/train_xformers.py


--------------------------------------------------------------------------------
/llava/utils.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/llava/utils.py


--------------------------------------------------------------------------------
/predict.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/predict.py


--------------------------------------------------------------------------------
/pyproject.toml:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/pyproject.toml


--------------------------------------------------------------------------------
/scripts/convert_gqa_for_eval.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/convert_gqa_for_eval.py


--------------------------------------------------------------------------------
/scripts/convert_mmbench_for_submission.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/convert_mmbench_for_submission.py


--------------------------------------------------------------------------------
/scripts/convert_mmvet_for_eval.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/convert_mmvet_for_eval.py


--------------------------------------------------------------------------------
/scripts/convert_seed_for_submission.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/convert_seed_for_submission.py


--------------------------------------------------------------------------------
/scripts/convert_sqa_to_llava.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/convert_sqa_to_llava.py


--------------------------------------------------------------------------------
/scripts/convert_sqa_to_llava_base_prompt.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/convert_sqa_to_llava_base_prompt.py


--------------------------------------------------------------------------------
/scripts/convert_vizwiz_for_submission.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/convert_vizwiz_for_submission.py


--------------------------------------------------------------------------------
/scripts/convert_vqav2_for_submission.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/convert_vqav2_for_submission.py


--------------------------------------------------------------------------------
/scripts/extract_mm_projector.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/extract_mm_projector.py


--------------------------------------------------------------------------------
/scripts/finetune.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/finetune.sh


--------------------------------------------------------------------------------
/scripts/finetune_full_schedule.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/finetune_full_schedule.sh


--------------------------------------------------------------------------------
/scripts/finetune_lora.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/finetune_lora.sh


--------------------------------------------------------------------------------
/scripts/finetune_qlora.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/finetune_qlora.sh


--------------------------------------------------------------------------------
/scripts/finetune_sqa.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/finetune_sqa.sh


--------------------------------------------------------------------------------
/scripts/merge_lora_weights.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/merge_lora_weights.py


--------------------------------------------------------------------------------
/scripts/pretrain.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/pretrain.sh


--------------------------------------------------------------------------------
/scripts/pretrain_xformers.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/pretrain_xformers.sh


--------------------------------------------------------------------------------
/scripts/sqa_eval_batch.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/sqa_eval_batch.sh


--------------------------------------------------------------------------------
/scripts/sqa_eval_gather.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/sqa_eval_gather.sh


--------------------------------------------------------------------------------
/scripts/upload_pypi.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/upload_pypi.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/gqa.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/v1_5/eval/gqa.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/llavabench.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/v1_5/eval/llavabench.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/mmbench.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/v1_5/eval/mmbench.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/mmbench_cn.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/v1_5/eval/mmbench_cn.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/mme.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/v1_5/eval/mme.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/mmvet.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/v1_5/eval/mmvet.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/pope.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/v1_5/eval/pope.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/qbench.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/v1_5/eval/qbench.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/qbench_zh.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/v1_5/eval/qbench_zh.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/seed.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/v1_5/eval/seed.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/sqa.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/v1_5/eval/sqa.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/textvqa.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/v1_5/eval/textvqa.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/vizwiz.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/v1_5/eval/vizwiz.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/vqav2.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/v1_5/eval/vqav2.sh


--------------------------------------------------------------------------------
/scripts/v1_5/finetune.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/v1_5/finetune.sh


--------------------------------------------------------------------------------
/scripts/v1_5/finetune_task.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/v1_5/finetune_task.sh


--------------------------------------------------------------------------------
/scripts/v1_5/finetune_task_lora.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/v1_5/finetune_task_lora.sh


--------------------------------------------------------------------------------
/scripts/v1_5/pretrain.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/cpystan/SD-VLM/HEAD/scripts/v1_5/pretrain.sh


--------------------------------------------------------------------------------