├── LICENSE
├── README.md
├── assets
    ├── -twitter-blue.svg
    ├── Paper-Arxiv-orange.svg
    ├── case.png
    ├── data.png
    └── main.png
├── cog.yaml
├── docs
    ├── Customize_Component.md
    ├── Data.md
    ├── Evaluation.md
    ├── Finetune_Custom_Data.md
    ├── Intel.md
    ├── LLaVA_Bench.md
    ├── LLaVA_from_LLaMA2.md
    ├── LoRA.md
    ├── MODEL_ZOO.md
    ├── ScienceQA.md
    ├── Windows.md
    └── macOS.md
├── images
    ├── demo_cli.gif
    ├── llava_example_cmp.png
    ├── llava_logo.png
    └── llava_v1_5_radar.jpg
├── llava
    ├── __init__.py
    ├── constants.py
    ├── conversation.py
    ├── eval
    │   ├── eval_gpt_review.py
    │   ├── eval_gpt_review_bench.py
    │   ├── eval_gpt_review_visual.py
    │   ├── eval_pope.py
    │   ├── eval_science_qa.py
    │   ├── eval_science_qa_gpt4.py
    │   ├── eval_science_qa_gpt4_requery.py
    │   ├── eval_textvqa.py
    │   ├── generate_webpage_data_from_table.py
    │   ├── m4c_evaluator.py
    │   ├── model_qa.py
    │   ├── model_vqa.py
    │   ├── model_vqa_loader.py
    │   ├── model_vqa_mmbench.py
    │   ├── model_vqa_science.py
    │   ├── qa_baseline_gpt35.py
    │   ├── run_llava.py
    │   ├── summarize_gpt_review.py
    │   ├── table
    │   │   ├── answer
    │   │   │   ├── answer_alpaca-13b.jsonl
    │   │   │   ├── answer_bard.jsonl
    │   │   │   ├── answer_gpt35.jsonl
    │   │   │   ├── answer_llama-13b.jsonl
    │   │   │   └── answer_vicuna-13b.jsonl
    │   │   ├── caps_boxes_coco2014_val_80.jsonl
    │   │   ├── model.jsonl
    │   │   ├── prompt.jsonl
    │   │   ├── question.jsonl
    │   │   ├── results
    │   │   │   ├── test_sqa_llava_13b_v0.json
    │   │   │   └── test_sqa_llava_lcs_558k_sqa_12e_vicuna_v1_3_13b.json
    │   │   ├── review
    │   │   │   ├── review_alpaca-13b_vicuna-13b.jsonl
    │   │   │   ├── review_bard_vicuna-13b.jsonl
    │   │   │   ├── review_gpt35_vicuna-13b.jsonl
    │   │   │   └── review_llama-13b_vicuna-13b.jsonl
    │   │   ├── reviewer.jsonl
    │   │   └── rule.json
    │   └── webpage
    │   │   ├── figures
    │   │       ├── alpaca.png
    │   │       ├── bard.jpg
    │   │       ├── chatgpt.svg
    │   │       ├── llama.jpg
    │   │       ├── swords_FILL0_wght300_GRAD0_opsz48.svg
    │   │       └── vicuna.jpeg
    │   │   ├── index.html
    │   │   ├── script.js
    │   │   └── styles.css
    ├── mm_utils.py
    ├── model
    │   ├── __init__.py
    │   ├── apply_delta.py
    │   ├── builder.py
    │   ├── consolidate.py
    │   ├── language_model
    │   │   ├── llava_llama.py
    │   │   ├── llava_mistral.py
    │   │   └── llava_mpt.py
    │   ├── llava_arch.py
    │   ├── make_delta.py
    │   ├── multimodal_encoder
    │   │   ├── builder.py
    │   │   └── clip_encoder.py
    │   ├── multimodal_projector
    │   │   └── builder.py
    │   └── utils.py
    ├── serve
    │   ├── __init__.py
    │   ├── cli.py
    │   ├── controller.py
    │   ├── examples
    │   │   ├── extreme_ironing.jpg
    │   │   └── waterview.jpg
    │   ├── gradio_web_server.py
    │   ├── model_worker.py
    │   ├── register_worker.py
    │   ├── sglang_worker.py
    │   └── test_message.py
    ├── train
    │   ├── llama_flash_attn_monkey_patch.py
    │   ├── llama_xformers_attn_monkey_patch.py
    │   ├── llava_trainer.py
    │   ├── train.py
    │   ├── train_dpo.py
    │   ├── train_dpo_inherent.py
    │   ├── train_mem.py
    │   └── train_xformers.py
    └── utils.py
├── playground
    └── data
    │   ├── coco2014_val_gpt4_qa_30x3.jsonl
    │   ├── coco2014_val_qa_eval
    │       ├── qa90_gpt4_answer.jsonl
    │       └── qa90_questions.jsonl
    │   └── prompts
    │       ├── complex_reasoning
    │           ├── 000_caps.txt
    │           ├── 000_conv.txt
    │           ├── 001_caps.txt
    │           ├── 001_conv.txt
    │           ├── 002_caps.txt
    │           ├── 002_conv.txt
    │           └── system_message.txt
    │       ├── conversation
    │           ├── 000_caps.txt
    │           ├── 000_conv.txt
    │           ├── 001_caps.txt
    │           ├── 001_conv.txt
    │           └── system_message.txt
    │       └── detail_description
    │           ├── 000_caps.txt
    │           ├── 000_conv.txt
    │           ├── 001_caps.txt
    │           ├── 001_conv.txt
    │           ├── 002_caps.txt
    │           ├── 002_conv.txt
    │           └── system_message.txt
├── povid_infer.py
├── predict.py
├── pyproject.toml
├── scripts
    ├── convert_gqa_for_eval.py
    ├── convert_mmbench_for_submission.py
    ├── convert_mmvet_for_eval.py
    ├── convert_seed_for_submission.py
    ├── convert_sqa_to_llava.py
    ├── convert_sqa_to_llava_base_prompt.py
    ├── convert_vizwiz_for_submission.py
    ├── convert_vqav2_for_submission.py
    ├── extract_mm_projector.py
    ├── finetune.sh
    ├── finetune_full_schedule.sh
    ├── finetune_lora.sh
    ├── finetune_qlora.sh
    ├── finetune_sqa.sh
    ├── merge_lora_weights.py
    ├── pretrain.sh
    ├── pretrain_xformers.sh
    ├── run_dpo.sh
    ├── run_povid.sh
    ├── sqa_eval_batch.sh
    ├── sqa_eval_gather.sh
    ├── upload_pypi.sh
    ├── v1_5
    │   ├── eval
    │   │   ├── gqa.sh
    │   │   ├── llavabench.sh
    │   │   ├── mmbench.sh
    │   │   ├── mmbench_cn.sh
    │   │   ├── mme.sh
    │   │   ├── mmvet.sh
    │   │   ├── pope.sh
    │   │   ├── qbench.sh
    │   │   ├── qbench_zh.sh
    │   │   ├── seed.sh
    │   │   ├── sqa.sh
    │   │   ├── textvqa.sh
    │   │   ├── vizwiz.sh
    │   │   └── vqav2.sh
    │   ├── finetune.sh
    │   ├── finetune_lora.sh
    │   ├── finetune_task.sh
    │   ├── finetune_task_lora.sh
    │   └── pretrain.sh
    ├── zero2.json
    ├── zero3.json
    └── zero3_offload.json
└── tool
    ├── dpo_trainer.py
    └── dpo_trainer_inherent.py


/LICENSE:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/LICENSE


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/README.md


--------------------------------------------------------------------------------
/assets/-twitter-blue.svg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/assets/-twitter-blue.svg


--------------------------------------------------------------------------------
/assets/Paper-Arxiv-orange.svg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/assets/Paper-Arxiv-orange.svg


--------------------------------------------------------------------------------
/assets/case.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/assets/case.png


--------------------------------------------------------------------------------
/assets/data.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/assets/data.png


--------------------------------------------------------------------------------
/assets/main.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/assets/main.png


--------------------------------------------------------------------------------
/cog.yaml:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/cog.yaml


--------------------------------------------------------------------------------
/docs/Customize_Component.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/docs/Customize_Component.md


--------------------------------------------------------------------------------
/docs/Data.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/docs/Data.md


--------------------------------------------------------------------------------
/docs/Evaluation.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/docs/Evaluation.md


--------------------------------------------------------------------------------
/docs/Finetune_Custom_Data.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/docs/Finetune_Custom_Data.md


--------------------------------------------------------------------------------
/docs/Intel.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/docs/Intel.md


--------------------------------------------------------------------------------
/docs/LLaVA_Bench.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/docs/LLaVA_Bench.md


--------------------------------------------------------------------------------
/docs/LLaVA_from_LLaMA2.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/docs/LLaVA_from_LLaMA2.md


--------------------------------------------------------------------------------
/docs/LoRA.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/docs/LoRA.md


--------------------------------------------------------------------------------
/docs/MODEL_ZOO.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/docs/MODEL_ZOO.md


--------------------------------------------------------------------------------
/docs/ScienceQA.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/docs/ScienceQA.md


--------------------------------------------------------------------------------
/docs/Windows.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/docs/Windows.md


--------------------------------------------------------------------------------
/docs/macOS.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/docs/macOS.md


--------------------------------------------------------------------------------
/images/demo_cli.gif:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/images/demo_cli.gif


--------------------------------------------------------------------------------
/images/llava_example_cmp.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/images/llava_example_cmp.png


--------------------------------------------------------------------------------
/images/llava_logo.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/images/llava_logo.png


--------------------------------------------------------------------------------
/images/llava_v1_5_radar.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/images/llava_v1_5_radar.jpg


--------------------------------------------------------------------------------
/llava/__init__.py:
--------------------------------------------------------------------------------
1 | from .model import LlavaLlamaForCausalLM
2 | 


--------------------------------------------------------------------------------
/llava/constants.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/constants.py


--------------------------------------------------------------------------------
/llava/conversation.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/conversation.py


--------------------------------------------------------------------------------
/llava/eval/eval_gpt_review.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/eval_gpt_review.py


--------------------------------------------------------------------------------
/llava/eval/eval_gpt_review_bench.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/eval_gpt_review_bench.py


--------------------------------------------------------------------------------
/llava/eval/eval_gpt_review_visual.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/eval_gpt_review_visual.py


--------------------------------------------------------------------------------
/llava/eval/eval_pope.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/eval_pope.py


--------------------------------------------------------------------------------
/llava/eval/eval_science_qa.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/eval_science_qa.py


--------------------------------------------------------------------------------
/llava/eval/eval_science_qa_gpt4.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/eval_science_qa_gpt4.py


--------------------------------------------------------------------------------
/llava/eval/eval_science_qa_gpt4_requery.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/eval_science_qa_gpt4_requery.py


--------------------------------------------------------------------------------
/llava/eval/eval_textvqa.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/eval_textvqa.py


--------------------------------------------------------------------------------
/llava/eval/generate_webpage_data_from_table.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/generate_webpage_data_from_table.py


--------------------------------------------------------------------------------
/llava/eval/m4c_evaluator.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/m4c_evaluator.py


--------------------------------------------------------------------------------
/llava/eval/model_qa.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/model_qa.py


--------------------------------------------------------------------------------
/llava/eval/model_vqa.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/model_vqa.py


--------------------------------------------------------------------------------
/llava/eval/model_vqa_loader.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/model_vqa_loader.py


--------------------------------------------------------------------------------
/llava/eval/model_vqa_mmbench.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/model_vqa_mmbench.py


--------------------------------------------------------------------------------
/llava/eval/model_vqa_science.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/model_vqa_science.py


--------------------------------------------------------------------------------
/llava/eval/qa_baseline_gpt35.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/qa_baseline_gpt35.py


--------------------------------------------------------------------------------
/llava/eval/run_llava.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/run_llava.py


--------------------------------------------------------------------------------
/llava/eval/summarize_gpt_review.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/summarize_gpt_review.py


--------------------------------------------------------------------------------
/llava/eval/table/answer/answer_alpaca-13b.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/table/answer/answer_alpaca-13b.jsonl


--------------------------------------------------------------------------------
/llava/eval/table/answer/answer_bard.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/table/answer/answer_bard.jsonl


--------------------------------------------------------------------------------
/llava/eval/table/answer/answer_gpt35.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/table/answer/answer_gpt35.jsonl


--------------------------------------------------------------------------------
/llava/eval/table/answer/answer_llama-13b.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/table/answer/answer_llama-13b.jsonl


--------------------------------------------------------------------------------
/llava/eval/table/answer/answer_vicuna-13b.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/table/answer/answer_vicuna-13b.jsonl


--------------------------------------------------------------------------------
/llava/eval/table/caps_boxes_coco2014_val_80.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/table/caps_boxes_coco2014_val_80.jsonl


--------------------------------------------------------------------------------
/llava/eval/table/model.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/table/model.jsonl


--------------------------------------------------------------------------------
/llava/eval/table/prompt.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/table/prompt.jsonl


--------------------------------------------------------------------------------
/llava/eval/table/question.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/table/question.jsonl


--------------------------------------------------------------------------------
/llava/eval/table/results/test_sqa_llava_13b_v0.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/table/results/test_sqa_llava_13b_v0.json


--------------------------------------------------------------------------------
/llava/eval/table/results/test_sqa_llava_lcs_558k_sqa_12e_vicuna_v1_3_13b.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/table/results/test_sqa_llava_lcs_558k_sqa_12e_vicuna_v1_3_13b.json


--------------------------------------------------------------------------------
/llava/eval/table/review/review_alpaca-13b_vicuna-13b.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/table/review/review_alpaca-13b_vicuna-13b.jsonl


--------------------------------------------------------------------------------
/llava/eval/table/review/review_bard_vicuna-13b.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/table/review/review_bard_vicuna-13b.jsonl


--------------------------------------------------------------------------------
/llava/eval/table/review/review_gpt35_vicuna-13b.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/table/review/review_gpt35_vicuna-13b.jsonl


--------------------------------------------------------------------------------
/llava/eval/table/review/review_llama-13b_vicuna-13b.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/table/review/review_llama-13b_vicuna-13b.jsonl


--------------------------------------------------------------------------------
/llava/eval/table/reviewer.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/table/reviewer.jsonl


--------------------------------------------------------------------------------
/llava/eval/table/rule.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/table/rule.json


--------------------------------------------------------------------------------
/llava/eval/webpage/figures/alpaca.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/webpage/figures/alpaca.png


--------------------------------------------------------------------------------
/llava/eval/webpage/figures/bard.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/webpage/figures/bard.jpg


--------------------------------------------------------------------------------
/llava/eval/webpage/figures/chatgpt.svg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/webpage/figures/chatgpt.svg


--------------------------------------------------------------------------------
/llava/eval/webpage/figures/llama.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/webpage/figures/llama.jpg


--------------------------------------------------------------------------------
/llava/eval/webpage/figures/swords_FILL0_wght300_GRAD0_opsz48.svg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/webpage/figures/swords_FILL0_wght300_GRAD0_opsz48.svg


--------------------------------------------------------------------------------
/llava/eval/webpage/figures/vicuna.jpeg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/webpage/figures/vicuna.jpeg


--------------------------------------------------------------------------------
/llava/eval/webpage/index.html:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/webpage/index.html


--------------------------------------------------------------------------------
/llava/eval/webpage/script.js:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/webpage/script.js


--------------------------------------------------------------------------------
/llava/eval/webpage/styles.css:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/eval/webpage/styles.css


--------------------------------------------------------------------------------
/llava/mm_utils.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/mm_utils.py


--------------------------------------------------------------------------------
/llava/model/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/model/__init__.py


--------------------------------------------------------------------------------
/llava/model/apply_delta.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/model/apply_delta.py


--------------------------------------------------------------------------------
/llava/model/builder.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/model/builder.py


--------------------------------------------------------------------------------
/llava/model/consolidate.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/model/consolidate.py


--------------------------------------------------------------------------------
/llava/model/language_model/llava_llama.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/model/language_model/llava_llama.py


--------------------------------------------------------------------------------
/llava/model/language_model/llava_mistral.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/model/language_model/llava_mistral.py


--------------------------------------------------------------------------------
/llava/model/language_model/llava_mpt.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/model/language_model/llava_mpt.py


--------------------------------------------------------------------------------
/llava/model/llava_arch.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/model/llava_arch.py


--------------------------------------------------------------------------------
/llava/model/make_delta.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/model/make_delta.py


--------------------------------------------------------------------------------
/llava/model/multimodal_encoder/builder.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/model/multimodal_encoder/builder.py


--------------------------------------------------------------------------------
/llava/model/multimodal_encoder/clip_encoder.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/model/multimodal_encoder/clip_encoder.py


--------------------------------------------------------------------------------
/llava/model/multimodal_projector/builder.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/model/multimodal_projector/builder.py


--------------------------------------------------------------------------------
/llava/model/utils.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/model/utils.py


--------------------------------------------------------------------------------
/llava/serve/__init__.py:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/llava/serve/cli.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/serve/cli.py


--------------------------------------------------------------------------------
/llava/serve/controller.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/serve/controller.py


--------------------------------------------------------------------------------
/llava/serve/examples/extreme_ironing.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/serve/examples/extreme_ironing.jpg


--------------------------------------------------------------------------------
/llava/serve/examples/waterview.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/serve/examples/waterview.jpg


--------------------------------------------------------------------------------
/llava/serve/gradio_web_server.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/serve/gradio_web_server.py


--------------------------------------------------------------------------------
/llava/serve/model_worker.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/serve/model_worker.py


--------------------------------------------------------------------------------
/llava/serve/register_worker.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/serve/register_worker.py


--------------------------------------------------------------------------------
/llava/serve/sglang_worker.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/serve/sglang_worker.py


--------------------------------------------------------------------------------
/llava/serve/test_message.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/serve/test_message.py


--------------------------------------------------------------------------------
/llava/train/llama_flash_attn_monkey_patch.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/train/llama_flash_attn_monkey_patch.py


--------------------------------------------------------------------------------
/llava/train/llama_xformers_attn_monkey_patch.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/train/llama_xformers_attn_monkey_patch.py


--------------------------------------------------------------------------------
/llava/train/llava_trainer.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/train/llava_trainer.py


--------------------------------------------------------------------------------
/llava/train/train.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/train/train.py


--------------------------------------------------------------------------------
/llava/train/train_dpo.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/train/train_dpo.py


--------------------------------------------------------------------------------
/llava/train/train_dpo_inherent.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/train/train_dpo_inherent.py


--------------------------------------------------------------------------------
/llava/train/train_mem.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/train/train_mem.py


--------------------------------------------------------------------------------
/llava/train/train_xformers.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/train/train_xformers.py


--------------------------------------------------------------------------------
/llava/utils.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/llava/utils.py


--------------------------------------------------------------------------------
/playground/data/coco2014_val_gpt4_qa_30x3.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/playground/data/coco2014_val_gpt4_qa_30x3.jsonl


--------------------------------------------------------------------------------
/playground/data/coco2014_val_qa_eval/qa90_gpt4_answer.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/playground/data/coco2014_val_qa_eval/qa90_gpt4_answer.jsonl


--------------------------------------------------------------------------------
/playground/data/coco2014_val_qa_eval/qa90_questions.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/playground/data/coco2014_val_qa_eval/qa90_questions.jsonl


--------------------------------------------------------------------------------
/playground/data/prompts/complex_reasoning/000_caps.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/playground/data/prompts/complex_reasoning/000_caps.txt


--------------------------------------------------------------------------------
/playground/data/prompts/complex_reasoning/000_conv.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/playground/data/prompts/complex_reasoning/000_conv.txt


--------------------------------------------------------------------------------
/playground/data/prompts/complex_reasoning/001_caps.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/playground/data/prompts/complex_reasoning/001_caps.txt


--------------------------------------------------------------------------------
/playground/data/prompts/complex_reasoning/001_conv.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/playground/data/prompts/complex_reasoning/001_conv.txt


--------------------------------------------------------------------------------
/playground/data/prompts/complex_reasoning/002_caps.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/playground/data/prompts/complex_reasoning/002_caps.txt


--------------------------------------------------------------------------------
/playground/data/prompts/complex_reasoning/002_conv.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/playground/data/prompts/complex_reasoning/002_conv.txt


--------------------------------------------------------------------------------
/playground/data/prompts/complex_reasoning/system_message.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/playground/data/prompts/complex_reasoning/system_message.txt


--------------------------------------------------------------------------------
/playground/data/prompts/conversation/000_caps.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/playground/data/prompts/conversation/000_caps.txt


--------------------------------------------------------------------------------
/playground/data/prompts/conversation/000_conv.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/playground/data/prompts/conversation/000_conv.txt


--------------------------------------------------------------------------------
/playground/data/prompts/conversation/001_caps.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/playground/data/prompts/conversation/001_caps.txt


--------------------------------------------------------------------------------
/playground/data/prompts/conversation/001_conv.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/playground/data/prompts/conversation/001_conv.txt


--------------------------------------------------------------------------------
/playground/data/prompts/conversation/system_message.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/playground/data/prompts/conversation/system_message.txt


--------------------------------------------------------------------------------
/playground/data/prompts/detail_description/000_caps.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/playground/data/prompts/detail_description/000_caps.txt


--------------------------------------------------------------------------------
/playground/data/prompts/detail_description/000_conv.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/playground/data/prompts/detail_description/000_conv.txt


--------------------------------------------------------------------------------
/playground/data/prompts/detail_description/001_caps.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/playground/data/prompts/detail_description/001_caps.txt


--------------------------------------------------------------------------------
/playground/data/prompts/detail_description/001_conv.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/playground/data/prompts/detail_description/001_conv.txt


--------------------------------------------------------------------------------
/playground/data/prompts/detail_description/002_caps.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/playground/data/prompts/detail_description/002_caps.txt


--------------------------------------------------------------------------------
/playground/data/prompts/detail_description/002_conv.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/playground/data/prompts/detail_description/002_conv.txt


--------------------------------------------------------------------------------
/playground/data/prompts/detail_description/system_message.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/playground/data/prompts/detail_description/system_message.txt


--------------------------------------------------------------------------------
/povid_infer.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/povid_infer.py


--------------------------------------------------------------------------------
/predict.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/predict.py


--------------------------------------------------------------------------------
/pyproject.toml:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/pyproject.toml


--------------------------------------------------------------------------------
/scripts/convert_gqa_for_eval.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/convert_gqa_for_eval.py


--------------------------------------------------------------------------------
/scripts/convert_mmbench_for_submission.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/convert_mmbench_for_submission.py


--------------------------------------------------------------------------------
/scripts/convert_mmvet_for_eval.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/convert_mmvet_for_eval.py


--------------------------------------------------------------------------------
/scripts/convert_seed_for_submission.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/convert_seed_for_submission.py


--------------------------------------------------------------------------------
/scripts/convert_sqa_to_llava.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/convert_sqa_to_llava.py


--------------------------------------------------------------------------------
/scripts/convert_sqa_to_llava_base_prompt.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/convert_sqa_to_llava_base_prompt.py


--------------------------------------------------------------------------------
/scripts/convert_vizwiz_for_submission.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/convert_vizwiz_for_submission.py


--------------------------------------------------------------------------------
/scripts/convert_vqav2_for_submission.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/convert_vqav2_for_submission.py


--------------------------------------------------------------------------------
/scripts/extract_mm_projector.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/extract_mm_projector.py


--------------------------------------------------------------------------------
/scripts/finetune.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/finetune.sh


--------------------------------------------------------------------------------
/scripts/finetune_full_schedule.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/finetune_full_schedule.sh


--------------------------------------------------------------------------------
/scripts/finetune_lora.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/finetune_lora.sh


--------------------------------------------------------------------------------
/scripts/finetune_qlora.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/finetune_qlora.sh


--------------------------------------------------------------------------------
/scripts/finetune_sqa.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/finetune_sqa.sh


--------------------------------------------------------------------------------
/scripts/merge_lora_weights.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/merge_lora_weights.py


--------------------------------------------------------------------------------
/scripts/pretrain.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/pretrain.sh


--------------------------------------------------------------------------------
/scripts/pretrain_xformers.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/pretrain_xformers.sh


--------------------------------------------------------------------------------
/scripts/run_dpo.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/run_dpo.sh


--------------------------------------------------------------------------------
/scripts/run_povid.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/run_povid.sh


--------------------------------------------------------------------------------
/scripts/sqa_eval_batch.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/sqa_eval_batch.sh


--------------------------------------------------------------------------------
/scripts/sqa_eval_gather.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/sqa_eval_gather.sh


--------------------------------------------------------------------------------
/scripts/upload_pypi.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/upload_pypi.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/gqa.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/v1_5/eval/gqa.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/llavabench.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/v1_5/eval/llavabench.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/mmbench.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/v1_5/eval/mmbench.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/mmbench_cn.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/v1_5/eval/mmbench_cn.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/mme.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/v1_5/eval/mme.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/mmvet.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/v1_5/eval/mmvet.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/pope.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/v1_5/eval/pope.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/qbench.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/v1_5/eval/qbench.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/qbench_zh.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/v1_5/eval/qbench_zh.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/seed.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/v1_5/eval/seed.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/sqa.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/v1_5/eval/sqa.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/textvqa.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/v1_5/eval/textvqa.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/vizwiz.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/v1_5/eval/vizwiz.sh


--------------------------------------------------------------------------------
/scripts/v1_5/eval/vqav2.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/v1_5/eval/vqav2.sh


--------------------------------------------------------------------------------
/scripts/v1_5/finetune.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/v1_5/finetune.sh


--------------------------------------------------------------------------------
/scripts/v1_5/finetune_lora.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/v1_5/finetune_lora.sh


--------------------------------------------------------------------------------
/scripts/v1_5/finetune_task.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/v1_5/finetune_task.sh


--------------------------------------------------------------------------------
/scripts/v1_5/finetune_task_lora.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/v1_5/finetune_task_lora.sh


--------------------------------------------------------------------------------
/scripts/v1_5/pretrain.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/v1_5/pretrain.sh


--------------------------------------------------------------------------------
/scripts/zero2.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/zero2.json


--------------------------------------------------------------------------------
/scripts/zero3.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/zero3.json


--------------------------------------------------------------------------------
/scripts/zero3_offload.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/scripts/zero3_offload.json


--------------------------------------------------------------------------------
/tool/dpo_trainer.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/tool/dpo_trainer.py


--------------------------------------------------------------------------------
/tool/dpo_trainer_inherent.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/YiyangZhou/POVID/HEAD/tool/dpo_trainer_inherent.py


--------------------------------------------------------------------------------