├── .gitignore ├── README.md ├── assets └── InternSR.png ├── dataset ├── __init__.py ├── egoexo_bench.py ├── mmscan │ ├── __init__.py │ ├── evaluator │ │ ├── gpt_evaluation.py │ │ ├── metrics │ │ │ ├── box_metric.py │ │ │ └── lang_metric.py │ │ ├── qa_evaluation.py │ │ └── vg_evaluation.py │ ├── mmscan.py │ └── utils │ │ ├── box_utils.py │ │ ├── data_io.py │ │ ├── euler_utils.py │ │ ├── lang_utils.py │ │ └── task_utils.py ├── mmscan_2d.py ├── mmsi_bench.py ├── ost_bench.py └── utils │ ├── __init__.py │ ├── egoexobench.py │ ├── image_base.py │ ├── judge_util.py │ ├── multiple_choice.py │ └── video_base.py ├── eval_tool ├── __init__.py ├── config.py ├── inference.py ├── inference_video.py └── tools.py ├── requirements.txt ├── scripts ├── eval_mmscan_gpt.py ├── eval_mmscan_qa.py ├── llava3d │ ├── llava_mmscan_qa.sh │ ├── model_mmscan_qa.py │ └── multiprocess_llava_mmscan_qa.sh └── run.py ├── setup.py ├── utils ├── __init__.py ├── base_utils │ ├── __init__.py │ ├── file.py │ ├── log.py │ ├── misc.py │ └── vlm.py ├── matching_util.py ├── mp_util.py └── result_transfer.py └── vlm ├── __init__.py ├── api ├── __init__.py ├── base.py ├── claude.py ├── gemini.py ├── gpt.py └── hf_chat_model.py ├── base.py ├── internvl ├── __init__.py ├── gui_template.yaml ├── internvl_chat.py └── utils.py ├── llava ├── __init__.py ├── llava.py └── llava_xtuner.py ├── llava_3d ├── llava │ ├── __init__.py │ ├── constants.py │ ├── conversation.py │ ├── eval │ │ ├── capeval │ │ │ ├── bleu │ │ │ │ ├── __init__.py │ │ │ │ ├── bleu.py │ │ │ │ └── bleu_scorer.py │ │ │ ├── cider │ │ │ │ ├── __init__.py │ │ │ │ ├── cider.py │ │ │ │ └── cider_scorer.py │ │ │ ├── get_stanford_models.sh │ │ │ ├── meteor │ │ │ │ ├── __init__.py │ │ │ │ ├── data │ │ │ │ │ └── paraphrase-en.gz │ │ │ │ ├── meteor-1.5.jar │ │ │ │ └── meteor.py │ │ │ └── rouge │ │ │ │ ├── __init__.py │ │ │ │ └── rouge.py │ │ ├── eval_gpt_review.py │ │ ├── eval_gpt_review_bench.py │ │ ├── eval_gpt_review_visual.py │ │ ├── eval_pope.py │ │ ├── eval_science_qa.py │ │ ├── eval_science_qa_gpt4.py │ │ ├── eval_science_qa_gpt4_requery.py │ │ ├── eval_textvqa.py │ │ ├── generate_webpage_data_from_table.py │ │ ├── m4c_evaluator.py │ │ ├── model_mmscan_obj_caption.py │ │ ├── model_mmscan_qa.py │ │ ├── model_openeqa.py │ │ ├── model_qa.py │ │ ├── model_scan2cap.py │ │ ├── model_scanqa.py │ │ ├── model_sqa3d.py │ │ ├── model_vqa.py │ │ ├── model_vqa_loader.py │ │ ├── model_vqa_mmbench.py │ │ ├── model_vqa_science.py │ │ ├── qa_baseline_gpt35.py │ │ ├── run_llava.py │ │ ├── run_llava_3d.py │ │ ├── scanqa_evaluator.py │ │ ├── sqa3d_evaluator.py │ │ ├── summarize_gpt_review.py │ │ ├── table │ │ │ ├── answer │ │ │ │ ├── answer_alpaca-13b.jsonl │ │ │ │ ├── answer_bard.jsonl │ │ │ │ ├── answer_gpt35.jsonl │ │ │ │ ├── answer_llama-13b.jsonl │ │ │ │ └── answer_vicuna-13b.jsonl │ │ │ ├── caps_boxes_coco2014_val_80.jsonl │ │ │ ├── model.jsonl │ │ │ ├── prompt.jsonl │ │ │ ├── question.jsonl │ │ │ ├── review │ │ │ │ ├── review_alpaca-13b_vicuna-13b.jsonl │ │ │ │ ├── review_bard_vicuna-13b.jsonl │ │ │ │ ├── review_gpt35_vicuna-13b.jsonl │ │ │ │ └── review_llama-13b_vicuna-13b.jsonl │ │ │ └── reviewer.jsonl │ │ └── webpage │ │ │ ├── figures │ │ │ ├── alpaca.png │ │ │ ├── chatgpt.svg │ │ │ ├── swords_FILL0_wght300_GRAD0_opsz48.svg │ │ │ └── vicuna.jpeg │ │ │ ├── index.html │ │ │ ├── script.js │ │ │ └── styles.css │ ├── mm_utils.py │ ├── model │ │ ├── __init__.py │ │ ├── apply_delta.py │ │ ├── builder.py │ │ ├── consolidate.py │ │ ├── language_model │ │ │ ├── llava_llama.py │ │ │ ├── llava_mistral.py │ │ │ └── llava_mpt.py │ │ ├── llava_arch.py │ │ ├── make_delta.py │ │ ├── multimodal_encoder │ │ │ ├── builder.py │ │ │ ├── clip_encoder.py │ │ │ ├── position_encodings.py │ │ │ ├── spatial_aware_module.py │ │ │ ├── unproject.py │ │ │ ├── video_encoder.py │ │ │ └── video_processor.py │ │ ├── multimodal_projector │ │ │ └── builder.py │ │ └── utils.py │ ├── train │ │ ├── llama_flash_attn_monkey_patch.py │ │ ├── llama_xformers_attn_monkey_patch.py │ │ ├── llava_trainer.py │ │ ├── train.py │ │ ├── train_mem.py │ │ └── train_xformers.py │ └── utils.py └── pyproject.toml ├── misc ├── blip2_instruct_vicuna13b.yaml ├── blip2_instruct_vicuna7b.yaml ├── minigpt4_13b_eval.yaml ├── minigpt4_7b_eval.yaml └── minigptv2_eval.yaml └── qwen2_vl ├── __init__.py ├── model.py └── prompt.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/.gitignore -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/README.md -------------------------------------------------------------------------------- /assets/InternSR.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/assets/InternSR.png -------------------------------------------------------------------------------- /dataset/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/__init__.py -------------------------------------------------------------------------------- /dataset/egoexo_bench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/egoexo_bench.py -------------------------------------------------------------------------------- /dataset/mmscan/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/mmscan/__init__.py -------------------------------------------------------------------------------- /dataset/mmscan/evaluator/gpt_evaluation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/mmscan/evaluator/gpt_evaluation.py -------------------------------------------------------------------------------- /dataset/mmscan/evaluator/metrics/box_metric.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/mmscan/evaluator/metrics/box_metric.py -------------------------------------------------------------------------------- /dataset/mmscan/evaluator/metrics/lang_metric.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/mmscan/evaluator/metrics/lang_metric.py -------------------------------------------------------------------------------- /dataset/mmscan/evaluator/qa_evaluation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/mmscan/evaluator/qa_evaluation.py -------------------------------------------------------------------------------- /dataset/mmscan/evaluator/vg_evaluation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/mmscan/evaluator/vg_evaluation.py -------------------------------------------------------------------------------- /dataset/mmscan/mmscan.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/mmscan/mmscan.py -------------------------------------------------------------------------------- /dataset/mmscan/utils/box_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/mmscan/utils/box_utils.py -------------------------------------------------------------------------------- /dataset/mmscan/utils/data_io.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/mmscan/utils/data_io.py -------------------------------------------------------------------------------- /dataset/mmscan/utils/euler_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/mmscan/utils/euler_utils.py -------------------------------------------------------------------------------- /dataset/mmscan/utils/lang_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/mmscan/utils/lang_utils.py -------------------------------------------------------------------------------- /dataset/mmscan/utils/task_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/mmscan/utils/task_utils.py -------------------------------------------------------------------------------- /dataset/mmscan_2d.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/mmscan_2d.py -------------------------------------------------------------------------------- /dataset/mmsi_bench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/mmsi_bench.py -------------------------------------------------------------------------------- /dataset/ost_bench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/ost_bench.py -------------------------------------------------------------------------------- /dataset/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/utils/__init__.py -------------------------------------------------------------------------------- /dataset/utils/egoexobench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/utils/egoexobench.py -------------------------------------------------------------------------------- /dataset/utils/image_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/utils/image_base.py -------------------------------------------------------------------------------- /dataset/utils/judge_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/utils/judge_util.py -------------------------------------------------------------------------------- /dataset/utils/multiple_choice.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/utils/multiple_choice.py -------------------------------------------------------------------------------- /dataset/utils/video_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/dataset/utils/video_base.py -------------------------------------------------------------------------------- /eval_tool/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/eval_tool/__init__.py -------------------------------------------------------------------------------- /eval_tool/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/eval_tool/config.py -------------------------------------------------------------------------------- /eval_tool/inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/eval_tool/inference.py -------------------------------------------------------------------------------- /eval_tool/inference_video.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/eval_tool/inference_video.py -------------------------------------------------------------------------------- /eval_tool/tools.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/eval_tool/tools.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/requirements.txt -------------------------------------------------------------------------------- /scripts/eval_mmscan_gpt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/scripts/eval_mmscan_gpt.py -------------------------------------------------------------------------------- /scripts/eval_mmscan_qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/scripts/eval_mmscan_qa.py -------------------------------------------------------------------------------- /scripts/llava3d/llava_mmscan_qa.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/scripts/llava3d/llava_mmscan_qa.sh -------------------------------------------------------------------------------- /scripts/llava3d/model_mmscan_qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/scripts/llava3d/model_mmscan_qa.py -------------------------------------------------------------------------------- /scripts/llava3d/multiprocess_llava_mmscan_qa.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/scripts/llava3d/multiprocess_llava_mmscan_qa.sh -------------------------------------------------------------------------------- /scripts/run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/scripts/run.py -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/setup.py -------------------------------------------------------------------------------- /utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/utils/__init__.py -------------------------------------------------------------------------------- /utils/base_utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/utils/base_utils/__init__.py -------------------------------------------------------------------------------- /utils/base_utils/file.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/utils/base_utils/file.py -------------------------------------------------------------------------------- /utils/base_utils/log.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/utils/base_utils/log.py -------------------------------------------------------------------------------- /utils/base_utils/misc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/utils/base_utils/misc.py -------------------------------------------------------------------------------- /utils/base_utils/vlm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/utils/base_utils/vlm.py -------------------------------------------------------------------------------- /utils/matching_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/utils/matching_util.py -------------------------------------------------------------------------------- /utils/mp_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/utils/mp_util.py -------------------------------------------------------------------------------- /utils/result_transfer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/utils/result_transfer.py -------------------------------------------------------------------------------- /vlm/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/__init__.py -------------------------------------------------------------------------------- /vlm/api/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/api/__init__.py -------------------------------------------------------------------------------- /vlm/api/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/api/base.py -------------------------------------------------------------------------------- /vlm/api/claude.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/api/claude.py -------------------------------------------------------------------------------- /vlm/api/gemini.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/api/gemini.py -------------------------------------------------------------------------------- /vlm/api/gpt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/api/gpt.py -------------------------------------------------------------------------------- /vlm/api/hf_chat_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/api/hf_chat_model.py -------------------------------------------------------------------------------- /vlm/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/base.py -------------------------------------------------------------------------------- /vlm/internvl/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/internvl/__init__.py -------------------------------------------------------------------------------- /vlm/internvl/gui_template.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/internvl/gui_template.yaml -------------------------------------------------------------------------------- /vlm/internvl/internvl_chat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/internvl/internvl_chat.py -------------------------------------------------------------------------------- /vlm/internvl/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/internvl/utils.py -------------------------------------------------------------------------------- /vlm/llava/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava/__init__.py -------------------------------------------------------------------------------- /vlm/llava/llava.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava/llava.py -------------------------------------------------------------------------------- /vlm/llava/llava_xtuner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava/llava_xtuner.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/__init__.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/constants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/constants.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/conversation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/conversation.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/capeval/bleu/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/capeval/bleu/bleu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/capeval/bleu/bleu.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/capeval/bleu/bleu_scorer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/capeval/bleu/bleu_scorer.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/capeval/cider/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/capeval/cider/cider.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/capeval/cider/cider.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/capeval/cider/cider_scorer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/capeval/cider/cider_scorer.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/capeval/get_stanford_models.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/capeval/get_stanford_models.sh -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/capeval/meteor/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/capeval/meteor/data/paraphrase-en.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/capeval/meteor/data/paraphrase-en.gz -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/capeval/meteor/meteor-1.5.jar: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/capeval/meteor/meteor-1.5.jar -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/capeval/meteor/meteor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/capeval/meteor/meteor.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/capeval/rouge/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/capeval/rouge/rouge.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/capeval/rouge/rouge.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/eval_gpt_review.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/eval_gpt_review.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/eval_gpt_review_bench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/eval_gpt_review_bench.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/eval_gpt_review_visual.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/eval_gpt_review_visual.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/eval_pope.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/eval_pope.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/eval_science_qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/eval_science_qa.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/eval_science_qa_gpt4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/eval_science_qa_gpt4.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/eval_science_qa_gpt4_requery.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/eval_science_qa_gpt4_requery.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/eval_textvqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/eval_textvqa.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/generate_webpage_data_from_table.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/generate_webpage_data_from_table.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/m4c_evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/m4c_evaluator.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/model_mmscan_obj_caption.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/model_mmscan_obj_caption.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/model_mmscan_qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/model_mmscan_qa.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/model_openeqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/model_openeqa.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/model_qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/model_qa.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/model_scan2cap.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/model_scan2cap.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/model_scanqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/model_scanqa.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/model_sqa3d.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/model_sqa3d.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/model_vqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/model_vqa.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/model_vqa_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/model_vqa_loader.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/model_vqa_mmbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/model_vqa_mmbench.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/model_vqa_science.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/model_vqa_science.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/qa_baseline_gpt35.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/qa_baseline_gpt35.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/run_llava.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/run_llava.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/run_llava_3d.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/run_llava_3d.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/scanqa_evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/scanqa_evaluator.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/sqa3d_evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/sqa3d_evaluator.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/summarize_gpt_review.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/summarize_gpt_review.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/table/answer/answer_alpaca-13b.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/table/answer/answer_alpaca-13b.jsonl -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/table/answer/answer_bard.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/table/answer/answer_bard.jsonl -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/table/answer/answer_gpt35.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/table/answer/answer_gpt35.jsonl -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/table/answer/answer_llama-13b.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/table/answer/answer_llama-13b.jsonl -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/table/answer/answer_vicuna-13b.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/table/answer/answer_vicuna-13b.jsonl -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/table/caps_boxes_coco2014_val_80.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/table/caps_boxes_coco2014_val_80.jsonl -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/table/model.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/table/model.jsonl -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/table/prompt.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/table/prompt.jsonl -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/table/question.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/table/question.jsonl -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/table/review/review_alpaca-13b_vicuna-13b.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/table/review/review_alpaca-13b_vicuna-13b.jsonl -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/table/review/review_bard_vicuna-13b.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/table/review/review_bard_vicuna-13b.jsonl -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/table/review/review_gpt35_vicuna-13b.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/table/review/review_gpt35_vicuna-13b.jsonl -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/table/review/review_llama-13b_vicuna-13b.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/table/review/review_llama-13b_vicuna-13b.jsonl -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/table/reviewer.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/table/reviewer.jsonl -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/webpage/figures/alpaca.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/webpage/figures/alpaca.png -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/webpage/figures/chatgpt.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/webpage/figures/chatgpt.svg -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/webpage/figures/swords_FILL0_wght300_GRAD0_opsz48.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/webpage/figures/swords_FILL0_wght300_GRAD0_opsz48.svg -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/webpage/figures/vicuna.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/webpage/figures/vicuna.jpeg -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/webpage/index.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/webpage/index.html -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/webpage/script.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/webpage/script.js -------------------------------------------------------------------------------- /vlm/llava_3d/llava/eval/webpage/styles.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/eval/webpage/styles.css -------------------------------------------------------------------------------- /vlm/llava_3d/llava/mm_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/mm_utils.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/model/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/model/__init__.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/model/apply_delta.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/model/apply_delta.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/model/builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/model/builder.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/model/consolidate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/model/consolidate.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/model/language_model/llava_llama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/model/language_model/llava_llama.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/model/language_model/llava_mistral.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/model/language_model/llava_mistral.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/model/language_model/llava_mpt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/model/language_model/llava_mpt.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/model/llava_arch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/model/llava_arch.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/model/make_delta.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/model/make_delta.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/model/multimodal_encoder/builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/model/multimodal_encoder/builder.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/model/multimodal_encoder/clip_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/model/multimodal_encoder/clip_encoder.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/model/multimodal_encoder/position_encodings.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/model/multimodal_encoder/position_encodings.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/model/multimodal_encoder/spatial_aware_module.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/model/multimodal_encoder/spatial_aware_module.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/model/multimodal_encoder/unproject.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/model/multimodal_encoder/unproject.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/model/multimodal_encoder/video_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/model/multimodal_encoder/video_encoder.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/model/multimodal_encoder/video_processor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/model/multimodal_encoder/video_processor.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/model/multimodal_projector/builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/model/multimodal_projector/builder.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/model/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/model/utils.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/train/llama_flash_attn_monkey_patch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/train/llama_flash_attn_monkey_patch.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/train/llama_xformers_attn_monkey_patch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/train/llama_xformers_attn_monkey_patch.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/train/llava_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/train/llava_trainer.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/train/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/train/train.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/train/train_mem.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/train/train_mem.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/train/train_xformers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/train/train_xformers.py -------------------------------------------------------------------------------- /vlm/llava_3d/llava/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/llava/utils.py -------------------------------------------------------------------------------- /vlm/llava_3d/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/llava_3d/pyproject.toml -------------------------------------------------------------------------------- /vlm/misc/blip2_instruct_vicuna13b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/misc/blip2_instruct_vicuna13b.yaml -------------------------------------------------------------------------------- /vlm/misc/blip2_instruct_vicuna7b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/misc/blip2_instruct_vicuna7b.yaml -------------------------------------------------------------------------------- /vlm/misc/minigpt4_13b_eval.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/misc/minigpt4_13b_eval.yaml -------------------------------------------------------------------------------- /vlm/misc/minigpt4_7b_eval.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/misc/minigpt4_7b_eval.yaml -------------------------------------------------------------------------------- /vlm/misc/minigptv2_eval.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/misc/minigptv2_eval.yaml -------------------------------------------------------------------------------- /vlm/qwen2_vl/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/qwen2_vl/__init__.py -------------------------------------------------------------------------------- /vlm/qwen2_vl/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/qwen2_vl/model.py -------------------------------------------------------------------------------- /vlm/qwen2_vl/prompt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/InternRobotics/InternSR/HEAD/vlm/qwen2_vl/prompt.py --------------------------------------------------------------------------------