├── .gitignore ├── LICENSE ├── README.md ├── assets └── Main_VANE-Bench Flow_v7.png └── scripts ├── calc_lmm_vqa_accuracy.py ├── closed_source_models ├── CGM.py ├── QAGM.py ├── eval_vqa_gemini.py ├── evaluate_vqa_GPT.py └── utils.py └── open_source_models ├── README.md ├── TimeChat ├── .gitignore ├── LICENSE ├── LICENSE_Lavis.md ├── LICENSE_Minigpt4.md ├── README.md ├── demo.ipynb ├── docs │ └── DATA.md ├── environment.yml ├── eval.sh ├── eval_configs │ └── timechat.yaml ├── evaluate.py ├── examples │ └── hotdog.mp4 ├── figs │ ├── arch.png │ ├── case_dvc.png │ ├── case_tvg.png │ ├── case_vhd.png │ ├── logo.png │ └── teaser.png ├── inference_vanebench.py ├── prompts │ ├── alignment_image.txt │ ├── concise_description.txt │ ├── concise_image_description.txt │ ├── dvc_description.txt │ ├── dvc_description_with_asr.txt │ ├── dvc_description_zeroshot.txt │ ├── dvc_post_check.txt │ ├── tvg_description.txt │ ├── tvg_description_zeroshot.txt │ ├── tvg_post_check.txt │ ├── vhd_description.txt │ ├── vhd_description_zeroshot.txt │ └── vhd_post_check.txt ├── timechat │ ├── __init__.py │ ├── common │ │ ├── __init__.py │ │ ├── config.py │ │ ├── dist_utils.py │ │ ├── gradcam.py │ │ ├── logger.py │ │ ├── optims.py │ │ ├── registry.py │ │ └── utils.py │ ├── configs │ │ ├── datasets │ │ │ ├── cc_sbu │ │ │ │ ├── align.yaml │ │ │ │ └── defaults.yaml │ │ │ ├── instruct │ │ │ │ ├── charades_instruct.yaml │ │ │ │ ├── llava_instruct.yaml │ │ │ │ ├── qvhighlights_instruct.yaml │ │ │ │ ├── time_instruct.yaml │ │ │ │ ├── valley72k_instruct.yaml │ │ │ │ ├── webvid_instruct.yaml │ │ │ │ └── youcook2_instruct.yaml │ │ │ ├── laion │ │ │ │ └── defaults.yaml │ │ │ └── webvid │ │ │ │ └── defaults.yaml │ │ ├── default.yaml │ │ └── models │ │ │ ├── minigpt4.yaml │ │ │ └── timechat.yaml │ ├── conversation │ │ ├── __init__.py │ │ ├── conversation_video.py │ │ └── conversation_video_batch.py │ ├── datasets │ │ ├── __init__.py │ │ ├── builders │ │ │ ├── __init__.py │ │ │ ├── base_dataset_builder.py │ │ │ ├── image_text_pair_builder.py │ │ │ ├── instruct_builder.py │ │ │ └── video_caption_builder.py │ │ ├── data_utils.py │ │ └── datasets │ │ │ ├── __init__.py │ │ │ ├── base_dataset.py │ │ │ ├── caption_datasets.py │ │ │ ├── cc_sbu_dataset.py │ │ │ ├── dataloader_utils.py │ │ │ ├── laion_dataset.py │ │ │ ├── llava_instruct_dataset.py │ │ │ ├── video_instruct_dataset.py │ │ │ └── webvid_datasets.py │ ├── models │ │ ├── Qformer.py │ │ ├── __init__.py │ │ ├── base_model.py │ │ ├── blip2.py │ │ ├── blip2_outputs.py │ │ ├── eva_vit.py │ │ ├── modeling_llama.py │ │ └── timechat.py │ ├── processors │ │ ├── __init__.py │ │ ├── base_processor.py │ │ ├── blip_processors.py │ │ ├── functional_video.py │ │ ├── randaugment.py │ │ ├── transforms_video.py │ │ └── video_processor.py │ ├── runners │ │ ├── __init__.py │ │ ├── runner_base.py │ │ └── test.py │ └── tasks │ │ ├── __init__.py │ │ ├── base_task.py │ │ ├── image_text_pretrain.py │ │ └── video_text_pretrain.py ├── train.py ├── train_configs │ ├── stage2_finetune_charades.yaml │ ├── stage2_finetune_qvhighlights.yaml │ ├── stage2_finetune_time104k_valley72k.yaml │ └── stage2_finetune_youcook2.yaml └── utils │ ├── asr │ ├── asr.py │ ├── asr_data_process.py │ ├── clean_asr.py │ └── extract_audio.py │ ├── compress_video_data.py │ ├── construct_it_data │ ├── merge.py │ ├── process_action_data.py │ ├── process_dvc_data.py │ ├── process_grounding_data.py │ ├── process_highlight_data.py │ └── process_tsg_data.py │ ├── format_dvc.py │ ├── format_tvg.py │ ├── format_vhd.py │ ├── get_coco_format.py │ ├── process_hirest.py │ └── process_valley.py ├── Video-LLaMA ├── LICENSE ├── LICENSE_Lavis.md ├── LICENSE_Minigpt4.md ├── README.md ├── README_Vicuna.md ├── apply_delta.py ├── demo_audiovideo.py ├── demo_video.py ├── environment.yml ├── eval_configs │ ├── video_llama_eval_only_vl.yaml │ └── video_llama_eval_withaudio.yaml ├── examples │ ├── IronMan.mp4 │ ├── Iron_clothes.jpg │ ├── JonSnow.jpg │ ├── Statue_of_Liberty.jpg │ ├── United_States_Capitol.jpg │ ├── applausing.mp4 │ ├── birthday.mp4 │ ├── boat.mp4 │ ├── dog.jpg │ ├── dog_barking.mp4 │ ├── silence_girl.mp4 │ └── skateboarding_dog.mp4 ├── figs │ ├── architecture.png │ ├── architecture_v2.png │ ├── birthday_demo.gif │ ├── demo.gif │ └── video_llama_logo.jpg ├── inference_vanebench.py ├── playground.ipynb ├── prompts │ └── alignment_image.txt ├── requirement.txt ├── setup.py ├── train.py ├── train_configs │ ├── audiobranch_stage1_pretrain.yaml │ ├── audiobranch_stage2_finetune.yaml │ ├── visionbranch_stage1_pretrain.yaml │ └── visionbranch_stage2_finetune.yaml └── video_llama │ ├── __init__.py │ ├── common │ ├── __init__.py │ ├── config.py │ ├── dist_utils.py │ ├── gradcam.py │ ├── logger.py │ ├── optims.py │ ├── registry.py │ └── utils.py │ ├── configs │ ├── datasets │ │ ├── cc_sbu │ │ │ ├── align.yaml │ │ │ └── defaults.yaml │ │ ├── instruct │ │ │ ├── llava_instruct.yaml │ │ │ └── webvid_instruct.yaml │ │ ├── laion │ │ │ └── defaults.yaml │ │ └── webvid │ │ │ └── defaults.yaml │ ├── default.yaml │ └── models │ │ ├── minigpt4.yaml │ │ └── video_llama.yaml │ ├── conversation │ ├── __init__.py │ └── conversation_video.py │ ├── datasets │ ├── __init__.py │ ├── builders │ │ ├── __init__.py │ │ ├── base_dataset_builder.py │ │ ├── image_text_pair_builder.py │ │ ├── instruct_builder.py │ │ └── video_caption_builder.py │ ├── data_utils.py │ └── datasets │ │ ├── __init__.py │ │ ├── base_dataset.py │ │ ├── caption_datasets.py │ │ ├── cc_sbu_dataset.py │ │ ├── dataloader_utils.py │ │ ├── laion_dataset.py │ │ ├── llava_instruct_dataset.py │ │ ├── video_instruct_dataset.py │ │ └── webvid_datasets.py │ ├── models │ ├── ImageBind │ │ ├── .assets │ │ │ ├── bird_audio.wav │ │ │ ├── bird_image.jpg │ │ │ ├── car_audio.wav │ │ │ ├── car_image.jpg │ │ │ ├── dog_audio.wav │ │ │ └── dog_image.jpg │ │ ├── CODE_OF_CONDUCT.md │ │ ├── CONTRIBUTING.md │ │ ├── LICENSE │ │ ├── README.md │ │ ├── bpe │ │ │ └── bpe_simple_vocab_16e6.txt.gz │ │ ├── data.py │ │ ├── model_card.md │ │ ├── models │ │ │ ├── __init__.py │ │ │ ├── helpers.py │ │ │ ├── imagebind_model.py │ │ │ ├── multimodal_preprocessors.py │ │ │ └── transformer.py │ │ └── requirements.txt │ ├── Qformer.py │ ├── __init__.py │ ├── base_model.py │ ├── blip2.py │ ├── blip2_outputs.py │ ├── eva_vit.py │ ├── modeling_llama.py │ └── video_llama.py │ ├── processors │ ├── .ipynb_checkpoints │ │ └── video_processor-checkpoint.py │ ├── __init__.py │ ├── base_processor.py │ ├── blip_processors.py │ ├── functional_video.py │ ├── randaugment.py │ ├── transforms_video.py │ └── video_processor.py │ ├── runners │ ├── __init__.py │ ├── runner_base.py │ └── test.py │ └── tasks │ ├── __init__.py │ ├── base_task.py │ ├── image_text_pretrain.py │ └── video_text_pretrain.py ├── Video-LLaVA ├── LICENSE ├── README.md ├── TRAIN_AND_VALIDATE.md ├── assets │ ├── demo.mp4 │ ├── gradio.gif │ ├── imagecli.gif │ ├── main.jpg │ ├── res_img.jpg │ ├── res_vi.jpg │ ├── video_llava_result.jpg │ └── videocli.gif ├── pyproject.toml ├── scripts │ ├── convert_gqa_for_eval.py │ ├── convert_mmbench_for_submission.py │ ├── convert_mmvet_for_eval.py │ ├── convert_seed_for_submission.py │ ├── convert_sqa_to_llava.py │ ├── convert_sqa_to_llava_base_prompt.py │ ├── convert_vizwiz_for_submission.py │ ├── convert_vqav2_for_submission.py │ ├── eval_gpt_mmvet.py │ ├── finetune.sh │ ├── finetune_full_schedule.sh │ ├── finetune_lora.sh │ ├── finetune_qlora.sh │ ├── finetune_sqa.sh │ ├── merge_lora_weights.py │ ├── pretrain.sh │ ├── sqa_eval_batch.sh │ ├── sqa_eval_gather.sh │ ├── v1_5 │ │ ├── eval │ │ │ ├── eval_benchmark_1_correctness.sh │ │ │ ├── eval_benchmark_2_detail.sh │ │ │ ├── eval_benchmark_3_contextual.sh │ │ │ ├── eval_benchmark_4_temporal.sh │ │ │ ├── eval_benchmark_5_consistency.sh │ │ │ ├── eval_image_gqa.sh │ │ │ ├── eval_image_llavabench.sh │ │ │ ├── eval_image_mmbench.sh │ │ │ ├── eval_image_mmvet.sh │ │ │ ├── eval_image_pope.sh │ │ │ ├── eval_image_sqa.sh │ │ │ ├── eval_image_textvqa.sh │ │ │ ├── eval_image_vizwiz.sh │ │ │ ├── eval_image_vqav2.sh │ │ │ ├── eval_qa_activitynet.sh │ │ │ ├── eval_qa_msrvtt.sh │ │ │ ├── eval_qa_msvd.sh │ │ │ ├── eval_qa_tgif.sh │ │ │ ├── run_benchmark_1_correctness.sh │ │ │ ├── run_benchmark_2_detail.sh │ │ │ ├── run_benchmark_3_contextual.sh │ │ │ ├── run_benchmark_4_temporal.sh │ │ │ ├── run_benchmark_5_consistency.sh │ │ │ ├── run_qa_activitynet.sh │ │ │ ├── run_qa_msrvtt.sh │ │ │ ├── run_qa_msvd.sh │ │ │ └── run_qa_tgif.sh │ │ ├── finetune.sh │ │ ├── finetune_lora.sh │ │ └── pretrain.sh │ ├── zero2.json │ ├── zero2_offload.json │ ├── zero3.json │ └── zero3_offload.json └── videollava │ ├── __init__.py │ ├── constants.py │ ├── conversation.py │ ├── eval │ ├── eval_gpt_mmvet.py │ ├── eval_gpt_review.py │ ├── eval_gpt_review_bench.py │ ├── eval_gpt_review_visual.py │ ├── eval_gqa.py │ ├── eval_mmlu.py │ ├── eval_pope.py │ ├── eval_science_qa.py │ ├── eval_science_qa_gpt4.py │ ├── eval_science_qa_gpt4_requery.py │ ├── eval_textvqa.py │ ├── generate_webpage_data_from_table.py │ ├── inference_video_llava_vanebench.py │ ├── m4c_evaluator.py │ ├── model_qa.py │ ├── model_vqa.py │ ├── model_vqa_loader.py │ ├── model_vqa_mmbench.py │ ├── model_vqa_qbench.py │ ├── model_vqa_science.py │ ├── qa_baseline_gpt35.py │ ├── run_llava.py │ ├── summarize_gpt_review.py │ ├── table │ │ ├── answer │ │ │ ├── answer_alpaca-13b.jsonl │ │ │ ├── answer_bard.jsonl │ │ │ ├── answer_gpt35.jsonl │ │ │ ├── answer_llama-13b.jsonl │ │ │ └── answer_vicuna-13b.jsonl │ │ ├── caps_boxes_coco2014_val_80.jsonl │ │ ├── model.jsonl │ │ ├── prompt.jsonl │ │ ├── question.jsonl │ │ ├── results │ │ │ ├── test_sqa_llava_13b_v0.json │ │ │ └── test_sqa_llava_lcs_558k_sqa_12e_vicuna_v1_3_13b.json │ │ ├── review │ │ │ ├── review_alpaca-13b_vicuna-13b.jsonl │ │ │ ├── review_bard_vicuna-13b.jsonl │ │ │ ├── review_gpt35_vicuna-13b.jsonl │ │ │ └── review_llama-13b_vicuna-13b.jsonl │ │ ├── reviewer.jsonl │ │ └── rule.json │ ├── video │ │ ├── eval_benchmark_1_correctness.py │ │ ├── eval_benchmark_2_detailed_orientation.py │ │ ├── eval_benchmark_3_context.py │ │ ├── eval_benchmark_4_temporal.py │ │ ├── eval_benchmark_5_consistency.py │ │ ├── eval_video_qa.py │ │ ├── run_inference_benchmark_consistency.py │ │ ├── run_inference_benchmark_general.py │ │ ├── run_inference_video_qa.py │ │ └── run_inference_video_qa_act.py │ └── webpage │ │ ├── figures │ │ ├── alpaca.png │ │ ├── bard.jpg │ │ ├── chatgpt.svg │ │ ├── llama.jpg │ │ ├── swords_FILL0_wght300_GRAD0_opsz48.svg │ │ └── vicuna.jpeg │ │ ├── index.html │ │ ├── script.js │ │ └── styles.css │ ├── mm_utils.py │ ├── model │ ├── __init__.py │ ├── __pycache__ │ │ ├── __init__.cpython-310.pyc │ │ ├── builder.cpython-310.pyc │ │ └── llava_arch.cpython-310.pyc │ ├── apply_delta.py │ ├── builder.py │ ├── consolidate.py │ ├── language_model │ │ ├── __pycache__ │ │ │ ├── llava_llama.cpython-310.pyc │ │ │ └── llava_mpt.cpython-310.pyc │ │ ├── llava_llama.py │ │ ├── llava_mpt.py │ │ └── mpt │ │ │ ├── __pycache__ │ │ │ ├── adapt_tokenizer.cpython-310.pyc │ │ │ ├── attention.cpython-310.pyc │ │ │ ├── blocks.cpython-310.pyc │ │ │ ├── configuration_mpt.cpython-310.pyc │ │ │ ├── custom_embedding.cpython-310.pyc │ │ │ ├── flash_attn_triton.cpython-310.pyc │ │ │ ├── hf_prefixlm_converter.cpython-310.pyc │ │ │ ├── meta_init_context.cpython-310.pyc │ │ │ ├── modeling_mpt.cpython-310.pyc │ │ │ ├── norm.cpython-310.pyc │ │ │ └── param_init_fns.cpython-310.pyc │ │ │ ├── adapt_tokenizer.py │ │ │ ├── attention.py │ │ │ ├── blocks.py │ │ │ ├── configuration_mpt.py │ │ │ ├── custom_embedding.py │ │ │ ├── flash_attn_triton.py │ │ │ ├── hf_prefixlm_converter.py │ │ │ ├── meta_init_context.py │ │ │ ├── modeling_mpt.py │ │ │ ├── norm.py │ │ │ └── param_init_fns.py │ ├── llava_arch.py │ ├── make_delta.py │ ├── multimodal_encoder │ │ ├── __pycache__ │ │ │ ├── builder.cpython-310.pyc │ │ │ └── clip_encoder.cpython-310.pyc │ │ ├── builder.py │ │ ├── clip_encoder.py │ │ └── languagebind │ │ │ ├── __init__.py │ │ │ ├── __pycache__ │ │ │ └── __init__.cpython-310.pyc │ │ │ ├── audio │ │ │ ├── __pycache__ │ │ │ │ ├── configuration_audio.cpython-310.pyc │ │ │ │ ├── modeling_audio.cpython-310.pyc │ │ │ │ ├── processing_audio.cpython-310.pyc │ │ │ │ └── tokenization_audio.cpython-310.pyc │ │ │ ├── configuration_audio.py │ │ │ ├── modeling_audio.py │ │ │ ├── processing_audio.py │ │ │ └── tokenization_audio.py │ │ │ ├── depth │ │ │ ├── __pycache__ │ │ │ │ ├── configuration_depth.cpython-310.pyc │ │ │ │ ├── modeling_depth.cpython-310.pyc │ │ │ │ ├── processing_depth.cpython-310.pyc │ │ │ │ └── tokenization_depth.cpython-310.pyc │ │ │ ├── configuration_depth.py │ │ │ ├── modeling_depth.py │ │ │ ├── processing_depth.py │ │ │ └── tokenization_depth.py │ │ │ ├── image │ │ │ ├── __pycache__ │ │ │ │ ├── configuration_image.cpython-310.pyc │ │ │ │ ├── modeling_image.cpython-310.pyc │ │ │ │ ├── processing_image.cpython-310.pyc │ │ │ │ └── tokenization_image.cpython-310.pyc │ │ │ ├── configuration_image.py │ │ │ ├── modeling_image.py │ │ │ ├── processing_image.py │ │ │ └── tokenization_image.py │ │ │ ├── thermal │ │ │ ├── __pycache__ │ │ │ │ ├── configuration_thermal.cpython-310.pyc │ │ │ │ ├── modeling_thermal.cpython-310.pyc │ │ │ │ ├── processing_thermal.cpython-310.pyc │ │ │ │ └── tokenization_thermal.cpython-310.pyc │ │ │ ├── configuration_thermal.py │ │ │ ├── modeling_thermal.py │ │ │ ├── processing_thermal.py │ │ │ └── tokenization_thermal.py │ │ │ └── video │ │ │ ├── __pycache__ │ │ │ ├── configuration_video.cpython-310.pyc │ │ │ ├── modeling_video.cpython-310.pyc │ │ │ ├── processing_video.cpython-310.pyc │ │ │ └── tokenization_video.cpython-310.pyc │ │ │ ├── configuration_video.py │ │ │ ├── modeling_video.py │ │ │ ├── processing_video.py │ │ │ └── tokenization_video.py │ ├── multimodal_projector │ │ ├── __pycache__ │ │ │ └── builder.cpython-310.pyc │ │ └── builder.py │ └── utils.py │ ├── serve │ ├── __init__.py │ ├── cli.py │ ├── controller.py │ ├── gradio_utils.py │ ├── gradio_web_server.py │ ├── model_worker.py │ ├── register_worker.py │ ├── test_message.py │ └── utils.py │ ├── train │ ├── llama_flash_attn_monkey_patch.py │ ├── llama_xformers_attn_monkey_patch.py │ ├── llava_trainer.py │ ├── train.py │ ├── train_mem.py │ └── train_xformers.py │ └── utils.py └── assets ├── INSTALL.md ├── INSTALL.md~3a0823e459c80f147e9ef5c670cec3bb277419e8 └── PREDICTIONS.md /.gitignore: -------------------------------------------------------------------------------- 1 | .DS_Store 2 | .env 3 | **/__pycache__/ 4 | *.pyc -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/README.md -------------------------------------------------------------------------------- /assets/Main_VANE-Bench Flow_v7.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/assets/Main_VANE-Bench Flow_v7.png -------------------------------------------------------------------------------- /scripts/calc_lmm_vqa_accuracy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/calc_lmm_vqa_accuracy.py -------------------------------------------------------------------------------- /scripts/closed_source_models/CGM.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/closed_source_models/CGM.py -------------------------------------------------------------------------------- /scripts/closed_source_models/QAGM.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/closed_source_models/QAGM.py -------------------------------------------------------------------------------- /scripts/closed_source_models/eval_vqa_gemini.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/closed_source_models/eval_vqa_gemini.py -------------------------------------------------------------------------------- /scripts/closed_source_models/evaluate_vqa_GPT.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/closed_source_models/evaluate_vqa_GPT.py -------------------------------------------------------------------------------- /scripts/closed_source_models/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/closed_source_models/utils.py -------------------------------------------------------------------------------- /scripts/open_source_models/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/README.md -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/.gitignore -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/LICENSE -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/LICENSE_Lavis.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/LICENSE_Lavis.md -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/LICENSE_Minigpt4.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/LICENSE_Minigpt4.md -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/README.md -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/demo.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/demo.ipynb -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/docs/DATA.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/docs/DATA.md -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/environment.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/environment.yml -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/eval.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/eval.sh -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/eval_configs/timechat.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/eval_configs/timechat.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/evaluate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/evaluate.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/examples/hotdog.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/examples/hotdog.mp4 -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/figs/arch.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/figs/arch.png -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/figs/case_dvc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/figs/case_dvc.png -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/figs/case_tvg.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/figs/case_tvg.png -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/figs/case_vhd.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/figs/case_vhd.png -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/figs/logo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/figs/logo.png -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/figs/teaser.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/figs/teaser.png -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/inference_vanebench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/inference_vanebench.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/prompts/alignment_image.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/prompts/alignment_image.txt -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/prompts/concise_description.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/prompts/concise_description.txt -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/prompts/concise_image_description.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/prompts/concise_image_description.txt -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/prompts/dvc_description.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/prompts/dvc_description.txt -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/prompts/dvc_description_with_asr.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/prompts/dvc_description_with_asr.txt -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/prompts/dvc_description_zeroshot.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/prompts/dvc_description_zeroshot.txt -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/prompts/dvc_post_check.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/prompts/dvc_post_check.txt -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/prompts/tvg_description.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/prompts/tvg_description.txt -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/prompts/tvg_description_zeroshot.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/prompts/tvg_description_zeroshot.txt -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/prompts/tvg_post_check.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/prompts/tvg_post_check.txt -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/prompts/vhd_description.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/prompts/vhd_description.txt -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/prompts/vhd_description_zeroshot.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/prompts/vhd_description_zeroshot.txt -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/prompts/vhd_post_check.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/prompts/vhd_post_check.txt -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/__init__.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/common/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/common/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/common/config.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/common/dist_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/common/dist_utils.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/common/gradcam.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/common/gradcam.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/common/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/common/logger.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/common/optims.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/common/optims.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/common/registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/common/registry.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/common/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/common/utils.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/configs/datasets/cc_sbu/align.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/configs/datasets/cc_sbu/align.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/configs/datasets/cc_sbu/defaults.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/configs/datasets/cc_sbu/defaults.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/configs/datasets/instruct/charades_instruct.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/configs/datasets/instruct/charades_instruct.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/configs/datasets/instruct/llava_instruct.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/configs/datasets/instruct/llava_instruct.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/configs/datasets/instruct/qvhighlights_instruct.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/configs/datasets/instruct/qvhighlights_instruct.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/configs/datasets/instruct/time_instruct.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/configs/datasets/instruct/time_instruct.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/configs/datasets/instruct/valley72k_instruct.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/configs/datasets/instruct/valley72k_instruct.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/configs/datasets/instruct/webvid_instruct.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/configs/datasets/instruct/webvid_instruct.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/configs/datasets/instruct/youcook2_instruct.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/configs/datasets/instruct/youcook2_instruct.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/configs/datasets/laion/defaults.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/configs/datasets/laion/defaults.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/configs/datasets/webvid/defaults.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/configs/datasets/webvid/defaults.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/configs/default.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/configs/default.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/configs/models/minigpt4.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/configs/models/minigpt4.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/configs/models/timechat.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/configs/models/timechat.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/conversation/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/conversation/conversation_video.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/conversation/conversation_video.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/conversation/conversation_video_batch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/conversation/conversation_video_batch.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/datasets/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/datasets/builders/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/datasets/builders/__init__.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/datasets/builders/base_dataset_builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/datasets/builders/base_dataset_builder.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/datasets/builders/image_text_pair_builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/datasets/builders/image_text_pair_builder.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/datasets/builders/instruct_builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/datasets/builders/instruct_builder.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/datasets/builders/video_caption_builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/datasets/builders/video_caption_builder.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/datasets/data_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/datasets/data_utils.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/datasets/datasets/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/datasets/datasets/base_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/datasets/datasets/base_dataset.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/datasets/datasets/caption_datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/datasets/datasets/caption_datasets.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/datasets/datasets/cc_sbu_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/datasets/datasets/cc_sbu_dataset.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/datasets/datasets/dataloader_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/datasets/datasets/dataloader_utils.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/datasets/datasets/laion_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/datasets/datasets/laion_dataset.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/datasets/datasets/llava_instruct_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/datasets/datasets/llava_instruct_dataset.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/datasets/datasets/video_instruct_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/datasets/datasets/video_instruct_dataset.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/datasets/datasets/webvid_datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/datasets/datasets/webvid_datasets.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/models/Qformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/models/Qformer.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/models/__init__.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/models/base_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/models/base_model.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/models/blip2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/models/blip2.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/models/blip2_outputs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/models/blip2_outputs.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/models/eva_vit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/models/eva_vit.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/models/modeling_llama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/models/modeling_llama.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/models/timechat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/models/timechat.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/processors/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/processors/__init__.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/processors/base_processor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/processors/base_processor.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/processors/blip_processors.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/processors/blip_processors.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/processors/functional_video.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/processors/functional_video.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/processors/randaugment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/processors/randaugment.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/processors/transforms_video.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/processors/transforms_video.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/processors/video_processor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/processors/video_processor.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/runners/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/runners/__init__.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/runners/runner_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/runners/runner_base.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/runners/test.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/tasks/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/tasks/__init__.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/tasks/base_task.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/tasks/base_task.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/tasks/image_text_pretrain.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/tasks/image_text_pretrain.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/timechat/tasks/video_text_pretrain.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/timechat/tasks/video_text_pretrain.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/train.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/train_configs/stage2_finetune_charades.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/train_configs/stage2_finetune_charades.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/train_configs/stage2_finetune_qvhighlights.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/train_configs/stage2_finetune_qvhighlights.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/train_configs/stage2_finetune_time104k_valley72k.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/train_configs/stage2_finetune_time104k_valley72k.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/train_configs/stage2_finetune_youcook2.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/train_configs/stage2_finetune_youcook2.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/utils/asr/asr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/utils/asr/asr.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/utils/asr/asr_data_process.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/utils/asr/asr_data_process.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/utils/asr/clean_asr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/utils/asr/clean_asr.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/utils/asr/extract_audio.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/utils/asr/extract_audio.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/utils/compress_video_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/utils/compress_video_data.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/utils/construct_it_data/merge.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/utils/construct_it_data/merge.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/utils/construct_it_data/process_action_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/utils/construct_it_data/process_action_data.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/utils/construct_it_data/process_dvc_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/utils/construct_it_data/process_dvc_data.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/utils/construct_it_data/process_grounding_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/utils/construct_it_data/process_grounding_data.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/utils/construct_it_data/process_highlight_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/utils/construct_it_data/process_highlight_data.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/utils/construct_it_data/process_tsg_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/utils/construct_it_data/process_tsg_data.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/utils/format_dvc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/utils/format_dvc.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/utils/format_tvg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/utils/format_tvg.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/utils/format_vhd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/utils/format_vhd.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/utils/get_coco_format.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/utils/get_coco_format.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/utils/process_hirest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/utils/process_hirest.py -------------------------------------------------------------------------------- /scripts/open_source_models/TimeChat/utils/process_valley.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/TimeChat/utils/process_valley.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/LICENSE -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/LICENSE_Lavis.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/LICENSE_Lavis.md -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/LICENSE_Minigpt4.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/LICENSE_Minigpt4.md -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/README.md -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/README_Vicuna.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/README_Vicuna.md -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/apply_delta.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/apply_delta.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/demo_audiovideo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/demo_audiovideo.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/demo_video.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/demo_video.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/environment.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/environment.yml -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/eval_configs/video_llama_eval_only_vl.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/eval_configs/video_llama_eval_only_vl.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/eval_configs/video_llama_eval_withaudio.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/eval_configs/video_llama_eval_withaudio.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/examples/IronMan.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/examples/IronMan.mp4 -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/examples/Iron_clothes.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/examples/Iron_clothes.jpg -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/examples/JonSnow.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/examples/JonSnow.jpg -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/examples/Statue_of_Liberty.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/examples/Statue_of_Liberty.jpg -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/examples/United_States_Capitol.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/examples/United_States_Capitol.jpg -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/examples/applausing.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/examples/applausing.mp4 -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/examples/birthday.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/examples/birthday.mp4 -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/examples/boat.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/examples/boat.mp4 -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/examples/dog.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/examples/dog.jpg -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/examples/dog_barking.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/examples/dog_barking.mp4 -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/examples/silence_girl.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/examples/silence_girl.mp4 -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/examples/skateboarding_dog.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/examples/skateboarding_dog.mp4 -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/figs/architecture.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/figs/architecture.png -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/figs/architecture_v2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/figs/architecture_v2.png -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/figs/birthday_demo.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/figs/birthday_demo.gif -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/figs/demo.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/figs/demo.gif -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/figs/video_llama_logo.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/figs/video_llama_logo.jpg -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/inference_vanebench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/inference_vanebench.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/playground.ipynb: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/prompts/alignment_image.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/prompts/alignment_image.txt -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/requirement.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/requirement.txt -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/setup.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/train.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/train_configs/audiobranch_stage1_pretrain.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/train_configs/audiobranch_stage1_pretrain.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/train_configs/audiobranch_stage2_finetune.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/train_configs/audiobranch_stage2_finetune.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/train_configs/visionbranch_stage1_pretrain.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/train_configs/visionbranch_stage1_pretrain.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/train_configs/visionbranch_stage2_finetune.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/train_configs/visionbranch_stage2_finetune.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/__init__.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/common/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/common/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/common/config.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/common/dist_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/common/dist_utils.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/common/gradcam.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/common/gradcam.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/common/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/common/logger.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/common/optims.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/common/optims.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/common/registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/common/registry.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/common/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/common/utils.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/configs/datasets/cc_sbu/align.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/configs/datasets/cc_sbu/align.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/configs/datasets/cc_sbu/defaults.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/configs/datasets/cc_sbu/defaults.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/configs/datasets/instruct/llava_instruct.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/configs/datasets/instruct/llava_instruct.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/configs/datasets/instruct/webvid_instruct.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/configs/datasets/instruct/webvid_instruct.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/configs/datasets/laion/defaults.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/configs/datasets/laion/defaults.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/configs/datasets/webvid/defaults.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/configs/datasets/webvid/defaults.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/configs/default.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/configs/default.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/configs/models/minigpt4.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/configs/models/minigpt4.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/configs/models/video_llama.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/configs/models/video_llama.yaml -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/conversation/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/conversation/conversation_video.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/conversation/conversation_video.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/datasets/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/datasets/builders/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/datasets/builders/__init__.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/datasets/builders/base_dataset_builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/datasets/builders/base_dataset_builder.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/datasets/builders/image_text_pair_builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/datasets/builders/image_text_pair_builder.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/datasets/builders/instruct_builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/datasets/builders/instruct_builder.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/datasets/builders/video_caption_builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/datasets/builders/video_caption_builder.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/datasets/data_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/datasets/data_utils.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/datasets/datasets/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/datasets/datasets/base_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/datasets/datasets/base_dataset.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/datasets/datasets/caption_datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/datasets/datasets/caption_datasets.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/datasets/datasets/cc_sbu_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/datasets/datasets/cc_sbu_dataset.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/datasets/datasets/dataloader_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/datasets/datasets/dataloader_utils.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/datasets/datasets/laion_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/datasets/datasets/laion_dataset.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/datasets/datasets/llava_instruct_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/datasets/datasets/llava_instruct_dataset.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/datasets/datasets/video_instruct_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/datasets/datasets/video_instruct_dataset.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/datasets/datasets/webvid_datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/datasets/datasets/webvid_datasets.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/.assets/bird_audio.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/.assets/bird_audio.wav -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/.assets/bird_image.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/.assets/bird_image.jpg -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/.assets/car_audio.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/.assets/car_audio.wav -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/.assets/car_image.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/.assets/car_image.jpg -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/.assets/dog_audio.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/.assets/dog_audio.wav -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/.assets/dog_image.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/.assets/dog_image.jpg -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/CODE_OF_CONDUCT.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/CODE_OF_CONDUCT.md -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/CONTRIBUTING.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/CONTRIBUTING.md -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/LICENSE -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/README.md -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/bpe/bpe_simple_vocab_16e6.txt.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/bpe/bpe_simple_vocab_16e6.txt.gz -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/data.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/model_card.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/model_card.md -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/models/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/models/helpers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/models/helpers.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/models/imagebind_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/models/imagebind_model.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/models/multimodal_preprocessors.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/models/multimodal_preprocessors.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/models/transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/models/transformer.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/ImageBind/requirements.txt -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/Qformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/Qformer.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/__init__.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/base_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/base_model.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/blip2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/blip2.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/blip2_outputs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/blip2_outputs.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/eva_vit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/eva_vit.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/modeling_llama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/modeling_llama.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/models/video_llama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/models/video_llama.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/processors/.ipynb_checkpoints/video_processor-checkpoint.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/processors/.ipynb_checkpoints/video_processor-checkpoint.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/processors/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/processors/__init__.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/processors/base_processor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/processors/base_processor.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/processors/blip_processors.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/processors/blip_processors.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/processors/functional_video.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/processors/functional_video.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/processors/randaugment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/processors/randaugment.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/processors/transforms_video.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/processors/transforms_video.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/processors/video_processor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/processors/video_processor.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/runners/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/runners/__init__.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/runners/runner_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/runners/runner_base.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/runners/test.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/tasks/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/tasks/__init__.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/tasks/base_task.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/tasks/base_task.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/tasks/image_text_pretrain.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/tasks/image_text_pretrain.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaMA/video_llama/tasks/video_text_pretrain.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaMA/video_llama/tasks/video_text_pretrain.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/LICENSE -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/README.md -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/TRAIN_AND_VALIDATE.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/TRAIN_AND_VALIDATE.md -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/assets/demo.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/assets/demo.mp4 -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/assets/gradio.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/assets/gradio.gif -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/assets/imagecli.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/assets/imagecli.gif -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/assets/main.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/assets/main.jpg -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/assets/res_img.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/assets/res_img.jpg -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/assets/res_vi.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/assets/res_vi.jpg -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/assets/video_llava_result.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/assets/video_llava_result.jpg -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/assets/videocli.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/assets/videocli.gif -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/pyproject.toml -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/convert_gqa_for_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/convert_gqa_for_eval.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/convert_mmbench_for_submission.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/convert_mmbench_for_submission.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/convert_mmvet_for_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/convert_mmvet_for_eval.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/convert_seed_for_submission.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/convert_seed_for_submission.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/convert_sqa_to_llava.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/convert_sqa_to_llava.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/convert_sqa_to_llava_base_prompt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/convert_sqa_to_llava_base_prompt.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/convert_vizwiz_for_submission.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/convert_vizwiz_for_submission.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/convert_vqav2_for_submission.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/convert_vqav2_for_submission.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/eval_gpt_mmvet.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/eval_gpt_mmvet.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/finetune.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/finetune.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/finetune_full_schedule.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/finetune_full_schedule.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/finetune_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/finetune_lora.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/finetune_qlora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/finetune_qlora.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/finetune_sqa.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/finetune_sqa.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/merge_lora_weights.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/merge_lora_weights.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/pretrain.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/pretrain.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/sqa_eval_batch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/sqa_eval_batch.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/sqa_eval_gather.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/sqa_eval_gather.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_benchmark_1_correctness.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_benchmark_1_correctness.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_benchmark_2_detail.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_benchmark_2_detail.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_benchmark_3_contextual.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_benchmark_3_contextual.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_benchmark_4_temporal.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_benchmark_4_temporal.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_benchmark_5_consistency.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_benchmark_5_consistency.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_image_gqa.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_image_gqa.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_image_llavabench.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_image_llavabench.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_image_mmbench.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_image_mmbench.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_image_mmvet.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_image_mmvet.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_image_pope.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_image_pope.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_image_sqa.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_image_sqa.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_image_textvqa.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_image_textvqa.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_image_vizwiz.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_image_vizwiz.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_image_vqav2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_image_vqav2.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_qa_activitynet.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_qa_activitynet.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_qa_msrvtt.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_qa_msrvtt.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_qa_msvd.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_qa_msvd.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_qa_tgif.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/eval_qa_tgif.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/run_benchmark_1_correctness.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/run_benchmark_1_correctness.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/run_benchmark_2_detail.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/run_benchmark_2_detail.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/run_benchmark_3_contextual.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/run_benchmark_3_contextual.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/run_benchmark_4_temporal.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/run_benchmark_4_temporal.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/run_benchmark_5_consistency.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/run_benchmark_5_consistency.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/run_qa_activitynet.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/run_qa_activitynet.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/run_qa_msrvtt.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/run_qa_msrvtt.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/run_qa_msvd.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/run_qa_msvd.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/run_qa_tgif.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/eval/run_qa_tgif.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/finetune.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/finetune.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/finetune_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/finetune_lora.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/v1_5/pretrain.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/v1_5/pretrain.sh -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/zero2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/zero2.json -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/zero2_offload.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/zero2_offload.json -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/zero3.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/zero3.json -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/scripts/zero3_offload.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/scripts/zero3_offload.json -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/__init__.py: -------------------------------------------------------------------------------- 1 | from .model import LlavaLlamaForCausalLM 2 | -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/constants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/constants.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/conversation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/conversation.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/eval_gpt_mmvet.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/eval_gpt_mmvet.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/eval_gpt_review.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/eval_gpt_review.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/eval_gpt_review_bench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/eval_gpt_review_bench.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/eval_gpt_review_visual.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/eval_gpt_review_visual.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/eval_gqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/eval_gqa.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/eval_mmlu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/eval_mmlu.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/eval_pope.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/eval_pope.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/eval_science_qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/eval_science_qa.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/eval_science_qa_gpt4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/eval_science_qa_gpt4.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/eval_science_qa_gpt4_requery.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/eval_science_qa_gpt4_requery.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/eval_textvqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/eval_textvqa.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/generate_webpage_data_from_table.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/generate_webpage_data_from_table.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/inference_video_llava_vanebench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/inference_video_llava_vanebench.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/m4c_evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/m4c_evaluator.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/model_qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/model_qa.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/model_vqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/model_vqa.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/model_vqa_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/model_vqa_loader.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/model_vqa_mmbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/model_vqa_mmbench.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/model_vqa_qbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/model_vqa_qbench.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/model_vqa_science.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/model_vqa_science.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/qa_baseline_gpt35.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/qa_baseline_gpt35.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/run_llava.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/run_llava.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/summarize_gpt_review.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/summarize_gpt_review.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/table/answer/answer_alpaca-13b.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/table/answer/answer_alpaca-13b.jsonl -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/table/answer/answer_bard.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/table/answer/answer_bard.jsonl -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/table/answer/answer_gpt35.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/table/answer/answer_gpt35.jsonl -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/table/answer/answer_llama-13b.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/table/answer/answer_llama-13b.jsonl -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/table/answer/answer_vicuna-13b.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/table/answer/answer_vicuna-13b.jsonl -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/table/caps_boxes_coco2014_val_80.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/table/caps_boxes_coco2014_val_80.jsonl -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/table/model.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/table/model.jsonl -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/table/prompt.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/table/prompt.jsonl -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/table/question.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/table/question.jsonl -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/table/results/test_sqa_llava_13b_v0.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/table/results/test_sqa_llava_13b_v0.json -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/table/results/test_sqa_llava_lcs_558k_sqa_12e_vicuna_v1_3_13b.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/table/results/test_sqa_llava_lcs_558k_sqa_12e_vicuna_v1_3_13b.json -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/table/review/review_alpaca-13b_vicuna-13b.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/table/review/review_alpaca-13b_vicuna-13b.jsonl -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/table/review/review_bard_vicuna-13b.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/table/review/review_bard_vicuna-13b.jsonl -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/table/review/review_gpt35_vicuna-13b.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/table/review/review_gpt35_vicuna-13b.jsonl -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/table/review/review_llama-13b_vicuna-13b.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/table/review/review_llama-13b_vicuna-13b.jsonl -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/table/reviewer.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/table/reviewer.jsonl -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/table/rule.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/table/rule.json -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/video/eval_benchmark_1_correctness.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/video/eval_benchmark_1_correctness.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/video/eval_benchmark_2_detailed_orientation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/video/eval_benchmark_2_detailed_orientation.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/video/eval_benchmark_3_context.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/video/eval_benchmark_3_context.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/video/eval_benchmark_4_temporal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/video/eval_benchmark_4_temporal.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/video/eval_benchmark_5_consistency.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/video/eval_benchmark_5_consistency.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/video/eval_video_qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/video/eval_video_qa.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/video/run_inference_benchmark_consistency.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/video/run_inference_benchmark_consistency.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/video/run_inference_benchmark_general.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/video/run_inference_benchmark_general.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/video/run_inference_video_qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/video/run_inference_video_qa.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/video/run_inference_video_qa_act.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/video/run_inference_video_qa_act.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/webpage/figures/alpaca.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/webpage/figures/alpaca.png -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/webpage/figures/bard.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/webpage/figures/bard.jpg -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/webpage/figures/chatgpt.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/webpage/figures/chatgpt.svg -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/webpage/figures/llama.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/webpage/figures/llama.jpg -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/webpage/figures/swords_FILL0_wght300_GRAD0_opsz48.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/webpage/figures/swords_FILL0_wght300_GRAD0_opsz48.svg -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/webpage/figures/vicuna.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/webpage/figures/vicuna.jpeg -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/webpage/index.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/webpage/index.html -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/webpage/script.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/webpage/script.js -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/eval/webpage/styles.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/eval/webpage/styles.css -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/mm_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/mm_utils.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/__init__.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/__pycache__/__init__.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/__pycache__/__init__.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/__pycache__/builder.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/__pycache__/builder.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/__pycache__/llava_arch.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/__pycache__/llava_arch.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/apply_delta.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/apply_delta.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/builder.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/consolidate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/consolidate.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/__pycache__/llava_llama.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/__pycache__/llava_llama.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/__pycache__/llava_mpt.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/__pycache__/llava_mpt.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/llava_llama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/llava_llama.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/llava_mpt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/llava_mpt.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/__pycache__/adapt_tokenizer.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/__pycache__/adapt_tokenizer.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/__pycache__/attention.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/__pycache__/attention.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/__pycache__/blocks.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/__pycache__/blocks.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/__pycache__/configuration_mpt.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/__pycache__/configuration_mpt.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/__pycache__/custom_embedding.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/__pycache__/custom_embedding.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/__pycache__/flash_attn_triton.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/__pycache__/flash_attn_triton.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/__pycache__/hf_prefixlm_converter.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/__pycache__/hf_prefixlm_converter.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/__pycache__/meta_init_context.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/__pycache__/meta_init_context.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/__pycache__/modeling_mpt.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/__pycache__/modeling_mpt.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/__pycache__/norm.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/__pycache__/norm.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/__pycache__/param_init_fns.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/__pycache__/param_init_fns.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/adapt_tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/adapt_tokenizer.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/attention.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/blocks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/blocks.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/configuration_mpt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/configuration_mpt.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/custom_embedding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/custom_embedding.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/flash_attn_triton.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/flash_attn_triton.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/hf_prefixlm_converter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/hf_prefixlm_converter.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/meta_init_context.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/meta_init_context.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/modeling_mpt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/modeling_mpt.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/norm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/norm.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/param_init_fns.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/language_model/mpt/param_init_fns.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/llava_arch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/llava_arch.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/make_delta.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/make_delta.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/__pycache__/builder.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/__pycache__/builder.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/__pycache__/clip_encoder.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/__pycache__/clip_encoder.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/builder.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/clip_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/clip_encoder.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/__init__.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/__pycache__/__init__.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/__pycache__/__init__.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/audio/__pycache__/configuration_audio.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/audio/__pycache__/configuration_audio.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/audio/__pycache__/modeling_audio.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/audio/__pycache__/modeling_audio.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/audio/__pycache__/processing_audio.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/audio/__pycache__/processing_audio.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/audio/__pycache__/tokenization_audio.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/audio/__pycache__/tokenization_audio.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/audio/configuration_audio.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/audio/configuration_audio.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/audio/modeling_audio.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/audio/modeling_audio.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/audio/processing_audio.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/audio/processing_audio.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/audio/tokenization_audio.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/audio/tokenization_audio.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/depth/__pycache__/configuration_depth.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/depth/__pycache__/configuration_depth.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/depth/__pycache__/modeling_depth.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/depth/__pycache__/modeling_depth.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/depth/__pycache__/processing_depth.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/depth/__pycache__/processing_depth.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/depth/__pycache__/tokenization_depth.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/depth/__pycache__/tokenization_depth.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/depth/configuration_depth.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/depth/configuration_depth.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/depth/modeling_depth.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/depth/modeling_depth.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/depth/processing_depth.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/depth/processing_depth.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/depth/tokenization_depth.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/depth/tokenization_depth.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/image/__pycache__/configuration_image.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/image/__pycache__/configuration_image.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/image/__pycache__/modeling_image.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/image/__pycache__/modeling_image.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/image/__pycache__/processing_image.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/image/__pycache__/processing_image.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/image/__pycache__/tokenization_image.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/image/__pycache__/tokenization_image.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/image/configuration_image.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/image/configuration_image.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/image/modeling_image.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/image/modeling_image.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/image/processing_image.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/image/processing_image.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/image/tokenization_image.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/image/tokenization_image.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/thermal/__pycache__/configuration_thermal.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/thermal/__pycache__/configuration_thermal.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/thermal/__pycache__/modeling_thermal.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/thermal/__pycache__/modeling_thermal.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/thermal/__pycache__/processing_thermal.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/thermal/__pycache__/processing_thermal.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/thermal/__pycache__/tokenization_thermal.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/thermal/__pycache__/tokenization_thermal.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/thermal/configuration_thermal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/thermal/configuration_thermal.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/thermal/modeling_thermal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/thermal/modeling_thermal.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/thermal/processing_thermal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/thermal/processing_thermal.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/thermal/tokenization_thermal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/thermal/tokenization_thermal.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/video/__pycache__/configuration_video.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/video/__pycache__/configuration_video.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/video/__pycache__/modeling_video.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/video/__pycache__/modeling_video.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/video/__pycache__/processing_video.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/video/__pycache__/processing_video.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/video/__pycache__/tokenization_video.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/video/__pycache__/tokenization_video.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/video/configuration_video.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/video/configuration_video.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/video/modeling_video.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/video/modeling_video.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/video/processing_video.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/video/processing_video.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/video/tokenization_video.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_encoder/languagebind/video/tokenization_video.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_projector/__pycache__/builder.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_projector/__pycache__/builder.cpython-310.pyc -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_projector/builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/multimodal_projector/builder.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/model/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/model/utils.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/serve/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/serve/cli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/serve/cli.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/serve/controller.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/serve/controller.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/serve/gradio_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/serve/gradio_utils.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/serve/gradio_web_server.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/serve/gradio_web_server.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/serve/model_worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/serve/model_worker.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/serve/register_worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/serve/register_worker.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/serve/test_message.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/serve/test_message.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/serve/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/serve/utils.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/train/llama_flash_attn_monkey_patch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/train/llama_flash_attn_monkey_patch.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/train/llama_xformers_attn_monkey_patch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/train/llama_xformers_attn_monkey_patch.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/train/llava_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/train/llava_trainer.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/train/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/train/train.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/train/train_mem.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/train/train_mem.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/train/train_xformers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/train/train_xformers.py -------------------------------------------------------------------------------- /scripts/open_source_models/Video-LLaVA/videollava/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/Video-LLaVA/videollava/utils.py -------------------------------------------------------------------------------- /scripts/open_source_models/assets/INSTALL.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/assets/INSTALL.md -------------------------------------------------------------------------------- /scripts/open_source_models/assets/INSTALL.md~3a0823e459c80f147e9ef5c670cec3bb277419e8: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/assets/INSTALL.md~3a0823e459c80f147e9ef5c670cec3bb277419e8 -------------------------------------------------------------------------------- /scripts/open_source_models/assets/PREDICTIONS.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rohit901/VANE-Bench/HEAD/scripts/open_source_models/assets/PREDICTIONS.md --------------------------------------------------------------------------------