├── LICENSE ├── README.md ├── VLMEvalKit ├── .gitignore ├── .pre-commit-config.yaml ├── LICENSE ├── README.md ├── assets │ ├── LOGO.svg │ └── apple.jpg ├── debug_load.py ├── docs │ ├── en │ │ ├── .readthedocs.yaml │ │ ├── ConfigSystem.md │ │ ├── Contributors.md │ │ ├── Development.md │ │ ├── EvalByLMDeploy.md │ │ ├── Makefile │ │ ├── Quickstart.md │ │ ├── _static │ │ │ ├── css │ │ │ │ └── readthedocs.css │ │ │ ├── image │ │ │ │ ├── logo.svg │ │ │ │ └── logo_icon.svg │ │ │ └── js │ │ │ │ └── custom.js │ │ ├── _templates │ │ │ ├── 404.html │ │ │ ├── autosummary │ │ │ │ └── class.rst │ │ │ └── callable.rst │ │ ├── conf.py │ │ ├── docutils.conf │ │ └── index.rst │ ├── ja │ │ └── README_ja.md │ └── zh-CN │ │ ├── .readthedocs.yaml │ │ ├── ConfigSystem.md │ │ ├── Development.md │ │ ├── EvalByLMDeploy.md │ │ ├── Makefile │ │ ├── Quickstart.md │ │ ├── README_zh-CN.md │ │ ├── _static │ │ ├── css │ │ │ └── readthedocs.css │ │ ├── image │ │ │ ├── logo.svg │ │ │ └── logo_icon.svg │ │ └── js │ │ │ └── custom.js │ │ ├── _templates │ │ ├── 404.html │ │ ├── autosummary │ │ │ └── class.rst │ │ └── callable.rst │ │ ├── conf.py │ │ ├── cp_origin_docs.sh │ │ ├── docutils.conf │ │ └── index.rst ├── eval_zyc_api.sh ├── eval_zyc_moonvit.sh ├── eval_zyc_vituhd.sh ├── eval_zyc_vituhd_noupscale.sh ├── llava │ ├── __init__.py │ ├── constants.py │ ├── conversation.py │ ├── eval │ │ ├── eval_ai2d.py │ │ ├── eval_chartqa.py │ │ ├── eval_docvqa.py │ │ ├── eval_gpt_review.py │ │ ├── eval_gpt_review_bench.py │ │ ├── eval_gpt_review_visual.py │ │ ├── eval_pope.py │ │ ├── eval_rec.py │ │ ├── eval_science_qa.py │ │ ├── eval_science_qa_gpt4.py │ │ ├── eval_science_qa_gpt4_requery.py │ │ ├── eval_textvqa.py │ │ ├── evaluate_interleave.py │ │ ├── generate_webpage_data_from_table.py │ │ ├── m4c_evaluator.py │ │ ├── model_qa.py │ │ ├── model_vqa.py │ │ ├── model_vqa_loader.py │ │ ├── model_vqa_mmbench.py │ │ ├── model_vqa_science.py │ │ ├── qa_baseline_gpt35.py │ │ ├── run_llava.py │ │ └── summarize_gpt_review.py │ ├── mm_utils.py │ ├── model │ │ ├── __init__.py │ │ ├── apply_delta.py │ │ ├── builder.py │ │ ├── builder_new.bk │ │ ├── consolidate.py │ │ ├── language_model │ │ │ ├── llava_gemma.py │ │ │ ├── llava_llama.py │ │ │ ├── llava_mistral.py │ │ │ ├── llava_mixtral.py │ │ │ ├── llava_mpt.py │ │ │ ├── llava_qwen.py │ │ │ ├── llava_qwen3.py │ │ │ ├── llava_qwen_moe.py │ │ │ └── modeling_llama.py │ │ ├── llava_arch.py │ │ ├── make_delta.py │ │ ├── multimodal_encoder │ │ │ ├── adapt_clip_vision_model.py │ │ │ ├── attn_res.py │ │ │ ├── builder.py │ │ │ ├── clip_encoder.py │ │ │ ├── dev_eva_clip │ │ │ │ ├── eva_clip │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── bpe_simple_vocab_16e6.txt.gz │ │ │ │ │ ├── constants.py │ │ │ │ │ ├── eva_vit_model.py │ │ │ │ │ ├── factory.py │ │ │ │ │ ├── hf_configs.py │ │ │ │ │ ├── hf_model.py │ │ │ │ │ ├── loss.py │ │ │ │ │ ├── model.py │ │ │ │ │ ├── modified_resnet.py │ │ │ │ │ ├── openai.py │ │ │ │ │ ├── pretrained.py │ │ │ │ │ ├── rope.py │ │ │ │ │ ├── timm_model.py │ │ │ │ │ ├── tokenizer.py │ │ │ │ │ ├── transform.py │ │ │ │ │ ├── transformer.py │ │ │ │ │ └── utils.py │ │ │ │ └── eva_vit.py │ │ │ ├── eva_clip │ │ │ │ ├── eva_clip_encoder.py │ │ │ │ ├── eva_clip_processors.py │ │ │ │ ├── eva_vit.py │ │ │ │ └── factory.py │ │ │ ├── hf_vision.py │ │ │ ├── hubconf.py │ │ │ ├── imagebind.py │ │ │ ├── modeling_moonvit.py │ │ │ ├── modeling_qwen2_5vl.py │ │ │ ├── modeling_siglip2.py │ │ │ ├── modeling_siglip2_cjm.py │ │ │ ├── modeling_siglip2_ps8.py │ │ │ ├── modeling_swin_siglip2.py │ │ │ ├── modeling_swin_siglip2_new.py │ │ │ ├── modeling_swin_siglip2_zyc.py │ │ │ ├── open_clip_encoder.py │ │ │ └── siglip_encoder.py │ │ ├── multimodal_projector │ │ │ ├── adapt_spatial_resampler.py │ │ │ ├── builder.py │ │ │ ├── llava_mlp.py │ │ │ ├── merger.py │ │ │ ├── mlp.py │ │ │ ├── mlp_v2.py │ │ │ ├── percive_sampler.py │ │ │ ├── pooler_projector.py │ │ │ ├── resampler.py │ │ │ └── uhd_v1_resampler.py │ │ ├── multimodal_resampler │ │ │ ├── builder.py │ │ │ ├── masked_drop.py │ │ │ ├── perceiver.py │ │ │ ├── qformer.py │ │ │ └── spatial_pool.py │ │ └── utils.py │ ├── serve │ │ ├── __init__.py │ │ ├── cli.py │ │ ├── controller.py │ │ ├── examples │ │ │ ├── extreme_ironing.jpg │ │ │ └── waterview.jpg │ │ ├── gradio_multi_image.py │ │ ├── gradio_web_server.py │ │ ├── model_worker.py │ │ ├── register_worker.py │ │ ├── sglang_worker.py │ │ └── test_message.py │ ├── slice_process.py │ ├── train │ │ ├── llama_flash_attn_monkey_patch.py │ │ ├── llava_trainer.py │ │ ├── llava_trainer_eval.py │ │ ├── train.py │ │ ├── train_dpo.py │ │ └── train_mem.py │ └── utils.py ├── requirements.txt ├── requirements │ └── docs.txt ├── run.py ├── scripts │ ├── AI2D_preproc.ipynb │ ├── apires_scan.py │ ├── auto_run.py │ ├── cover.sh │ ├── data_browser.py │ ├── mmb_eval_gradio.py │ ├── run.sh │ ├── srun.sh │ ├── summarize.py │ └── visualize.ipynb ├── setup.py ├── test_vlm_load.py └── vlmeval │ ├── __init__.py │ ├── api │ ├── __init__.py │ ├── base.py │ ├── bluelm_v_api.py │ ├── claude.py │ ├── cloudwalk.py │ ├── doubao_vl_api.py │ ├── gemini.py │ ├── glm_vision.py │ ├── gpt.py │ ├── hf_chat_model.py │ ├── hunyuan.py │ ├── jt_vl_chat.py │ ├── lmdeploy.py │ ├── mug_u.py │ ├── qwen_api.py │ ├── qwen_vl_api.py │ ├── reka.py │ ├── sensechat_vision.py │ ├── siliconflow.py │ ├── stepai.py │ ├── taichu.py │ └── taiyi.py │ ├── config.py │ ├── dataset │ ├── GUI │ │ ├── __init__.py │ │ ├── screenspot.py │ │ └── screenspot_pro.py │ ├── Omnidocbench │ │ ├── __init__.py │ │ ├── data_preprocess.py │ │ ├── metrics.py │ │ ├── omnidocbench.py │ │ ├── requirements.txt │ │ └── utils.py │ ├── __init__.py │ ├── cgbench.py │ ├── charxiv.py │ ├── cmmmu.py │ ├── creation.py │ ├── dude.py │ ├── dynamath.py │ ├── emma.py │ ├── gobench.py │ ├── image_base.py │ ├── image_caption.py │ ├── image_ccocr.py │ ├── image_mcq.py │ ├── image_mt.py │ ├── image_shortqa.py │ ├── image_vqa.py │ ├── image_yorn.py │ ├── longvideobench.py │ ├── megabench.py │ ├── miabench.py │ ├── mlvu.py │ ├── mmalignbench.py │ ├── mmbench_video.py │ ├── mmgenbench.py │ ├── mmifeval.py │ ├── mmlongbench.py │ ├── mmmath.py │ ├── moat.py │ ├── moviechat1k.py │ ├── mvbench.py │ ├── qbench_video.py │ ├── slidevqa.py │ ├── spatial457.py │ ├── tamperbench.py │ ├── tempcompass.py │ ├── text_base.py │ ├── text_mcq.py │ ├── utils │ │ ├── __init__.py │ │ ├── ccocr_evaluator │ │ │ ├── README.md │ │ │ ├── __init__.py │ │ │ ├── common.py │ │ │ ├── doc_parsing_evaluator.py │ │ │ ├── kie_evaluator.py │ │ │ └── ocr_evaluator.py │ │ ├── cgbench.py │ │ ├── crpe.py │ │ ├── hrbench.py │ │ ├── judge_util.py │ │ ├── llavabench.py │ │ ├── logicvista.py │ │ ├── longvideobench.py │ │ ├── mathv.py │ │ ├── mathverse.py │ │ ├── mathvista.py │ │ ├── megabench │ │ │ ├── README.md │ │ │ ├── __init__.py │ │ │ ├── aggregation │ │ │ │ ├── mean_agg.py │ │ │ │ ├── min_agg.py │ │ │ │ └── unsupported_agg.py │ │ │ ├── aggregation_type.py │ │ │ ├── evaluator.py │ │ │ ├── metric_type.py │ │ │ ├── parsing │ │ │ │ ├── answer_str_parse.py │ │ │ │ ├── common │ │ │ │ │ ├── parsers.py │ │ │ │ │ └── utils.py │ │ │ │ ├── dummy_parse.py │ │ │ │ └── json_parse.py │ │ │ ├── requirements.txt │ │ │ ├── response_parse_type.py │ │ │ ├── scoring │ │ │ │ ├── ascii_art_gpt4o_judge.py │ │ │ │ ├── chess_jaccard.py │ │ │ │ ├── common │ │ │ │ │ ├── conversions.py │ │ │ │ │ ├── metrics.py │ │ │ │ │ └── transformations.py │ │ │ │ ├── constrained_generation.py │ │ │ │ ├── coordinate_sequence_match.py │ │ │ │ ├── dict_equality.py │ │ │ │ ├── dict_exact_match_agg_recall.py │ │ │ │ ├── dict_jaccard_agg_jaccard.py │ │ │ │ ├── dict_nbbox_iou_tuple_agg_jaccard.py │ │ │ │ ├── dict_set_equality_agg_jaccard.py │ │ │ │ ├── exact_str_match.py │ │ │ │ ├── exact_str_match_case_insensitive.py │ │ │ │ ├── general_numerical_match.py │ │ │ │ ├── geo_proximity.py │ │ │ │ ├── gleu.py │ │ │ │ ├── jaccard.py │ │ │ │ ├── latex_expr_equality.py │ │ │ │ ├── longest_common_list_prefix_ratio.py │ │ │ │ ├── mse.py │ │ │ │ ├── multi_ref_phrase.py │ │ │ │ ├── nbbox_iou.py │ │ │ │ ├── near_str_match.py │ │ │ │ ├── nli_entailment.py │ │ │ │ ├── normalized_similarity_damerau_levenshtein.py │ │ │ │ ├── number_rel_diff_ratio.py │ │ │ │ ├── positive_int_match.py │ │ │ │ ├── program_judge.py │ │ │ │ ├── sacrebleu_bleu.py │ │ │ │ ├── sequence_equality.py │ │ │ │ ├── set_equality.py │ │ │ │ ├── set_precision.py │ │ │ │ ├── simple_str_match.py │ │ │ │ ├── symbolic_planning.py │ │ │ │ ├── unsupported_scoring.py │ │ │ │ ├── vlm_as_judge.py │ │ │ │ ├── xml_nbbox_iou.py │ │ │ │ ├── xml_norm_point_distance.py │ │ │ │ └── xml_norm_point_in_bbox.py │ │ │ └── utils.py │ │ ├── mlvu.py │ │ ├── mmbench_video.py │ │ ├── mmdu.py │ │ ├── mmif │ │ │ ├── __init__.py │ │ │ └── function_and_compare.py │ │ ├── mmniah.py │ │ ├── mmsci.py │ │ ├── mmsci4eval_req.txt │ │ ├── mmvet.py │ │ ├── moviechat1k.py │ │ ├── multiple_choice.py │ │ ├── mvbench.py │ │ ├── naturalbench.py │ │ ├── ocr_reasoning.py │ │ ├── ocrbench.py │ │ ├── olympiadbench.py │ │ ├── omni3dbench.py │ │ ├── physic.py │ │ ├── physics_eval_utils.py │ │ ├── phyx.py │ │ ├── qbench_video.py │ │ ├── qspatial.py │ │ ├── shortqa.py │ │ ├── spatial457.py │ │ ├── tablevqabench.py │ │ ├── tallyqa.py │ │ ├── tamperbench.py │ │ ├── tdbench.py │ │ ├── tempcompass.py │ │ ├── vdc.py │ │ ├── vgrpbench │ │ │ ├── __init__.py │ │ │ ├── configs │ │ │ │ └── formating-prompt │ │ │ │ │ ├── aquarium │ │ │ │ │ └── filter_prompt.json │ │ │ │ │ ├── battleships │ │ │ │ │ └── filter_prompt.json │ │ │ │ │ ├── binairo │ │ │ │ │ └── filter_prompt.json │ │ │ │ │ ├── coloredsudoku │ │ │ │ │ └── filter_prompt.json │ │ │ │ │ ├── fieldexplore │ │ │ │ │ └── filter_prompt.json │ │ │ │ │ ├── futoshiki │ │ │ │ │ └── filter_prompt.json │ │ │ │ │ ├── hitori │ │ │ │ │ └── filter_prompt.json │ │ │ │ │ ├── jigsawsudoku │ │ │ │ │ └── filter_prompt.json │ │ │ │ │ ├── kakurasu │ │ │ │ │ └── filter_prompt.json │ │ │ │ │ ├── kakuro │ │ │ │ │ └── filter_prompt.json │ │ │ │ │ ├── killersudoku │ │ │ │ │ └── filter_prompt.json │ │ │ │ │ ├── lightup │ │ │ │ │ └── filter_prompt.json │ │ │ │ │ ├── nonogram │ │ │ │ │ └── filter_prompt.json │ │ │ │ │ ├── oddevensudoku │ │ │ │ │ └── filter_prompt.json │ │ │ │ │ ├── renzoku │ │ │ │ │ └── filter_prompt.json │ │ │ │ │ ├── skyscraper │ │ │ │ │ └── filter_prompt.json │ │ │ │ │ ├── starbattle │ │ │ │ │ └── filter_prompt.json │ │ │ │ │ ├── sudoku │ │ │ │ │ └── filter_prompt.json │ │ │ │ │ ├── thermometers │ │ │ │ │ └── filter_prompt.json │ │ │ │ │ └── treesandtents │ │ │ │ │ └── filter_prompt.json │ │ │ ├── evaluation.py │ │ │ ├── puzzles │ │ │ │ ├── aquarium.py │ │ │ │ ├── battleships.py │ │ │ │ ├── binairo.py │ │ │ │ ├── coloredsudoku.py │ │ │ │ ├── common_constriants.py │ │ │ │ ├── common_get_game_factory.py │ │ │ │ ├── common_get_prompt.py │ │ │ │ ├── common_puzzle_factory.py │ │ │ │ ├── fieldexplore.py │ │ │ │ ├── futoshiki.py │ │ │ │ ├── hitori.py │ │ │ │ ├── jigsawsudoku.py │ │ │ │ ├── kakurasu.py │ │ │ │ ├── kakuro.py │ │ │ │ ├── killersudoku.py │ │ │ │ ├── lightup.py │ │ │ │ ├── nonogram.py │ │ │ │ ├── oddevensudoku.py │ │ │ │ ├── renzoku.py │ │ │ │ ├── skyscraper.py │ │ │ │ ├── starbattle.py │ │ │ │ ├── sudoku.py │ │ │ │ ├── thermometers.py │ │ │ │ └── treesandtents.py │ │ │ └── score.py │ │ ├── video_mmlu.py │ │ ├── videoholmes.py │ │ ├── videomme.py │ │ ├── visulogic.py │ │ ├── vlm2bench.py │ │ ├── vmcbench.py │ │ ├── vqa_eval.py │ │ ├── wemath.py │ │ ├── worldsense.py │ │ └── yorn.py │ ├── vcr.py │ ├── vdc.py │ ├── video_base.py │ ├── video_concat_dataset.py │ ├── video_dataset_config.py │ ├── video_holmes.py │ ├── video_mmlu.py │ ├── videomme.py │ ├── vl_rewardbench.py │ ├── vlm2bench.py │ ├── wildvision.py │ └── worldsense.py │ ├── inference.py │ ├── inference_mt.py │ ├── inference_video.py │ ├── smp │ ├── __init__.py │ ├── file.py │ ├── log.py │ ├── misc.py │ └── vlm.py │ ├── tools.py │ ├── utils │ ├── __init__.py │ ├── extract_utils.py │ ├── matching_util.py │ ├── mp_util.py │ └── result_transfer.py │ └── vlm │ ├── __init__.py │ ├── aki.py │ ├── aria.py │ ├── base.py │ ├── bunnyllama3.py │ ├── cambrian.py │ ├── chameleon.py │ ├── cogvlm.py │ ├── deepseek_vl.py │ ├── deepseek_vl2.py │ ├── eagle_x.py │ ├── emu.py │ ├── falcon_vlm.py │ ├── flash_vl.py │ ├── gemma.py │ ├── h2ovl_mississippi.py │ ├── idefics.py │ ├── instructblip.py │ ├── janus.py │ ├── kimi_vl.py │ ├── kosmos.py │ ├── llama4.py │ ├── llama_vision.py │ ├── llava │ ├── __init__.py │ ├── llava.py │ └── llava_xtuner.py │ ├── llava_qwen2_base_new.py │ ├── llava_qwen2_uhd_v3.py │ ├── llava_uhd_siglip2_2048.py │ ├── llava_uhd_v3.py │ ├── long_vita.py │ ├── mantis.py │ ├── mgm.py │ ├── minicpm_v.py │ ├── minigpt4.py │ ├── minimonkey.py │ ├── misc │ ├── blip2_instruct_vicuna13b.yaml │ ├── blip2_instruct_vicuna7b.yaml │ ├── minigpt4_13b_eval.yaml │ ├── minigpt4_7b_eval.yaml │ └── minigptv2_eval.yaml │ ├── mixsense.py │ ├── mmalaya.py │ ├── molmo.py │ ├── monkey.py │ ├── moondream.py │ ├── mplug_owl2.py │ ├── mplug_owl3.py │ ├── nvlm.py │ ├── ola │ ├── __init__.py │ ├── ola │ │ ├── arguments.py │ │ ├── constants.py │ │ ├── conversation.py │ │ ├── datasets │ │ │ ├── __init__.py │ │ │ └── preprocess.py │ │ ├── mm_utils.py │ │ ├── model │ │ │ ├── __init__.py │ │ │ ├── builder.py │ │ │ ├── language_model │ │ │ │ └── ola_qwen.py │ │ │ ├── multimodal_encoder │ │ │ │ ├── builder.py │ │ │ │ └── oryx_vit.py │ │ │ ├── multimodal_projector │ │ │ │ ├── builder.py │ │ │ │ └── pooler_projector.py │ │ │ ├── multimodal_resampler │ │ │ │ ├── builder.py │ │ │ │ └── perceiver.py │ │ │ ├── ola_arch.py │ │ │ ├── speech_encoder │ │ │ │ ├── beats │ │ │ │ │ ├── BEATs.py │ │ │ │ │ ├── Tokenizers.py │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── backbone.py │ │ │ │ │ ├── kaldi.py │ │ │ │ │ ├── modules.py │ │ │ │ │ └── quantizer.py │ │ │ │ ├── builder.py │ │ │ │ └── speech_encoder.py │ │ │ └── speech_projector │ │ │ │ ├── builder.py │ │ │ │ └── speech_projector.py │ │ └── utils.py │ └── ola_model.py │ ├── omchat.py │ ├── omnilmm.py │ ├── open_flamingo.py │ ├── ovis │ ├── __init__.py │ ├── ovis.py │ └── utils │ │ ├── __init__.py │ │ └── mdp3.py │ ├── pandagpt.py │ ├── parrot.py │ ├── phi3_vision.py │ ├── phi4_multimodal.py │ ├── pixtral.py │ ├── points.py │ ├── qh_360vl.py │ ├── qwen2_vl │ ├── __init__.py │ ├── model.py │ └── prompt.py │ ├── qwen_vl.py │ ├── rbdash.py │ ├── ristretto.py │ ├── ross.py │ ├── sail_vl.py │ ├── slime.py │ ├── smolvlm.py │ ├── transcore_m.py │ ├── ursa │ ├── __init__.py │ ├── ursa_chat.py │ └── ursa_model │ │ ├── __init__.py │ │ ├── clip_encoder.py │ │ ├── configuration_ursa.py │ │ ├── image_processing_vlm.py │ │ ├── modeling_ursa.py │ │ ├── processing_ursa.py │ │ ├── projector.py │ │ ├── sam.py │ │ └── siglip_vit.py │ ├── valley │ ├── __init__.py │ ├── requirements_valley.txt │ └── valley.py │ ├── video_llm │ ├── __init__.py │ ├── chat_uni_vi.py │ ├── configs │ │ ├── llama_vid │ │ │ └── processor │ │ │ │ └── clip-patch14-224 │ │ │ │ ├── config.json │ │ │ │ └── preprocessor_config.json │ │ └── videochat2_hd.json │ ├── llama_vid.py │ ├── pllava.py │ ├── video_chatgpt.py │ ├── video_llava.py │ └── videochat2.py │ ├── vila.py │ ├── vintern_chat.py │ ├── visualglm.py │ ├── vita.py │ ├── vlaa_thinker.py │ ├── vlm_r1.py │ ├── vxverse.py │ ├── wemm.py │ ├── wethink_vl.py │ ├── xcomposer │ ├── __init__.py │ ├── sharecaptioner.py │ ├── xcomposer.py │ ├── xcomposer2.py │ ├── xcomposer2_4KHD.py │ └── xcomposer2d5.py │ ├── xgen_mm.py │ └── yi_vl.py ├── cog.yaml ├── featup ├── __init__.py ├── adaptive_conv_cuda │ ├── __init__.py │ ├── adaptive_conv.cpp │ ├── adaptive_conv.py │ ├── adaptive_conv_cuda.cpp │ └── adaptive_conv_kernel.cu ├── configs │ ├── implicit_upsampler.yaml │ ├── jbu_upsampler.yaml │ ├── train_probe.yaml │ └── validate_train_probe.yaml ├── datasets │ ├── COCO.py │ ├── DAVIS.py │ ├── DOC.py │ ├── DocSceneText.py │ ├── EmbeddingFile.py │ ├── HTML.py │ ├── HighResEmbs.py │ ├── ImageNetSubset.py │ ├── JitteredImage.py │ ├── SCENE.py │ ├── SampleImage.py │ ├── __init__.py │ └── util.py ├── downsamplers.py ├── featurizers │ ├── CLIP.py │ ├── CLIPLarge.py │ ├── ClipEncoder.py │ ├── DINO.py │ ├── DINOv2.py │ ├── DeepLabV3.py │ ├── MAE.py │ ├── MIDAS.py │ ├── MaskCLIP.py │ ├── ResNet.py │ ├── __init__.py │ ├── dinov2 │ │ ├── __init__.py │ │ └── layers │ │ │ ├── __init__.py │ │ │ ├── attention.py │ │ │ ├── block.py │ │ │ ├── dino_head.py │ │ │ ├── drop_path.py │ │ │ ├── layer_scale.py │ │ │ ├── mlp.py │ │ │ ├── patch_embed.py │ │ │ └── swiglu_ffn.py │ ├── maskclip │ │ ├── README.md │ │ ├── __init__.py │ │ ├── bpe_simple_vocab_16e6.txt.gz │ │ ├── clip.py │ │ ├── interpolate.py │ │ ├── model.py │ │ └── simple_tokenizer.py │ ├── modules │ │ ├── __init__.py │ │ ├── layers.py │ │ ├── resnet.py │ │ └── vgg.py │ ├── siglip.py │ └── util.py ├── layers.py ├── losses.py ├── plotting.py ├── upsamplers.py ├── util.py └── validate_probes.py ├── figs ├── LLaVA_UHD_v3.png ├── ViT-UHD-performance-figure.png ├── ViTUHD-performace.png ├── github_banner.png ├── github_banner_puretext.png ├── mllm_numeric_figure_pt1.png ├── mllm_numeric_figure_pt2.png ├── performance&efficiency&radar.jpg └── radar_and_mllm_perfo.png ├── llava.egg-info ├── PKG-INFO ├── SOURCES.txt ├── dependency_links.txt ├── requires.txt └── top_level.txt ├── llava ├── __init__.py ├── __pycache__ │ ├── __init__.cpython-310.pyc │ ├── constants.cpython-310.pyc │ ├── conversation.cpython-310.pyc │ ├── mm_utils.cpython-310.pyc │ ├── slice_process.cpython-310.pyc │ └── utils.cpython-310.pyc ├── constants.py ├── conversation.py ├── mm_utils.py ├── model │ ├── __init__.py │ ├── __pycache__ │ │ ├── __init__.cpython-310.pyc │ │ └── llava_arch.cpython-310.pyc │ ├── builder.py │ ├── consolidate.py │ ├── language_model │ │ ├── __pycache__ │ │ │ ├── llava_llama.cpython-310.pyc │ │ │ ├── llava_mistral.cpython-310.pyc │ │ │ ├── llava_mixtral.cpython-310.pyc │ │ │ ├── llava_qwen.cpython-310.pyc │ │ │ └── llava_qwen3.cpython-310.pyc │ │ ├── llava_llama.py │ │ ├── llava_qwen.py │ │ └── llava_qwen3.py │ ├── llava_arch.py │ ├── multimodal_encoder │ │ ├── __pycache__ │ │ │ ├── builder.cpython-310.pyc │ │ │ ├── hf_vision.cpython-310.pyc │ │ │ ├── imagebind.cpython-310.pyc │ │ │ ├── modeling_moonvit.cpython-310.pyc │ │ │ ├── modeling_siglip2.cpython-310.pyc │ │ │ ├── modeling_swin_siglip2.cpython-310.pyc │ │ │ └── modeling_swin_siglip2_zyc.cpython-310.pyc │ │ ├── builder.py │ │ ├── modeling_moonvit.py │ │ └── modeling_siglip2.py │ ├── multimodal_projector │ │ ├── __pycache__ │ │ │ ├── builder.cpython-310.pyc │ │ │ ├── llava_mlp.cpython-310.pyc │ │ │ ├── merger.cpython-310.pyc │ │ │ ├── resampler.cpython-310.pyc │ │ │ └── uhd_v1_resampler.cpython-310.pyc │ │ ├── builder.py │ │ ├── llava_mlp.py │ │ ├── merger.py │ │ ├── resampler.py │ │ └── uhd_v1_resampler.py │ ├── multimodal_resampler │ │ ├── __pycache__ │ │ │ ├── builder.cpython-310.pyc │ │ │ ├── masked_drop.cpython-310.pyc │ │ │ ├── perceiver.cpython-310.pyc │ │ │ ├── qformer.cpython-310.pyc │ │ │ └── spatial_pool.cpython-310.pyc │ │ ├── builder.py │ │ ├── masked_drop.py │ │ ├── perceiver.py │ │ ├── qformer.py │ │ └── spatial_pool.py │ └── utils.py ├── serve │ ├── __init__.py │ ├── cli.py │ ├── controller.py │ ├── gradio_multi_image.py │ ├── gradio_web_server.py │ ├── model_worker.py │ ├── register_worker.py │ ├── sglang_worker.py │ └── test_message.py ├── slice_process.py ├── train │ ├── __pycache__ │ │ ├── llava_trainer.cpython-310.pyc │ │ └── train.cpython-310.pyc │ ├── llava_trainer.py │ ├── train.py │ └── train_mem.py └── utils.py ├── pyproject.toml ├── requirements.bak ├── scripts ├── archived │ ├── convert_gqa_for_eval.py │ ├── convert_mmvet_for_eval.py │ ├── convert_sqa_to_llava.py │ ├── convert_sqa_to_llava_base_prompt.py │ ├── convert_vizwiz_for_submission.py │ ├── convert_vqav2_for_submission.py │ ├── data_info.py │ ├── dpo_data_info.py │ ├── finetune.sh │ ├── finetune_1.5.sh │ ├── finetune_full_schedule.sh │ ├── finetune_lora.sh │ ├── finetune_mixtral.sh │ ├── finetune_mixtral_1.5.sh │ ├── finetune_mixtral_1.6_336px_anyres.sh │ ├── finetune_mixtral_1.6_336px_anyres_freeze_vision.sh │ ├── finetune_mixtral_1.6_336px_anyres_lmms_eval.sh │ ├── finetune_mixtral_copy.sh │ ├── finetune_qlora.sh │ ├── finetune_sqa.sh │ ├── merge_lora_weights.py │ ├── pretrain.sh │ ├── quick_check.py │ ├── sqa_eval_batch.sh │ └── sqa_eval_gather.sh ├── convert_gqa_for_eval.py ├── interleave │ ├── eval_all.sh │ ├── eval_interleave_3d.sh │ └── eval_multiprocess.sh ├── train │ ├── README.md │ ├── direct_finetune_clip.sh │ ├── direct_finetune_siglip_a4.sh │ ├── dpo.sh │ ├── dpo_ov7b.sh │ ├── finetune_ov.sh │ ├── finetune_si.sh │ ├── mid_stage.yaml │ ├── onevision.yaml │ ├── pretrain_clip.sh │ ├── pretrain_siglip.sh │ └── single_image.yaml ├── v1_5 │ └── eval │ │ ├── ai2d.sh │ │ ├── chartqa.sh │ │ ├── deepform.sh │ │ ├── docvqa_test.sh │ │ ├── docvqa_val.sh │ │ ├── estvqa.sh │ │ ├── gqa.sh │ │ ├── infographics.sh │ │ ├── llavabench.sh │ │ ├── mmbench.sh │ │ ├── mmbench_cn.sh │ │ ├── mme.sh │ │ ├── mmvet.sh │ │ ├── pope.sh │ │ ├── qbench.sh │ │ ├── qbench_zh.sh │ │ ├── rec.sh │ │ ├── sqa.sh │ │ ├── textvqa.sh │ │ ├── vizwiz.sh │ │ └── vqav2.sh ├── video │ ├── demo │ │ └── video_demo.sh │ ├── eval │ │ ├── activitynet_eval.sh │ │ ├── video_chatgpt_benchmark_eval_shard.sh │ │ ├── video_description_from_t2v.sh │ │ ├── video_detail_description_eval_only.sh │ │ └── video_detail_description_eval_shard.sh │ └── train │ │ ├── SO400M_Qwen2_72B_ov_to_video_am9.sh │ │ ├── SO400M_Qwen2_7B_ov_to_video_am9.sh │ │ └── exp.yaml ├── zero2.json ├── zero2_fused_adamw.json ├── zero2_new.json ├── zero2_offload.json ├── zero2_old.json ├── zero3.json ├── zero3_offload.json └── zero3pp.json ├── setup.py ├── setup_train_env.sh ├── train.sh ├── train_moonvit.sh └── trl ├── __init__.py ├── __pycache__ ├── __init__.cpython-310.pyc ├── core.cpython-310.pyc └── import_utils.cpython-310.pyc ├── core.py ├── environment ├── __init__.py ├── __pycache__ │ ├── __init__.cpython-310.pyc │ └── base_environment.cpython-310.pyc └── base_environment.py ├── extras ├── __init__.py ├── __pycache__ │ ├── __init__.cpython-310.pyc │ ├── best_of_n_sampler.cpython-310.pyc │ └── dataset_formatting.cpython-310.pyc ├── best_of_n_sampler.py └── dataset_formatting.py ├── import_utils.py ├── models ├── __init__.py ├── __pycache__ │ ├── __init__.cpython-310.pyc │ ├── modeling_base.cpython-310.pyc │ ├── modeling_value_head.cpython-310.pyc │ └── utils.cpython-310.pyc ├── modeling_base.py ├── modeling_sd_base.py ├── modeling_value_head.py └── utils.py └── trainer ├── __init__.py ├── __pycache__ ├── __init__.cpython-310.pyc ├── base.cpython-310.pyc ├── ddpo_config.cpython-310.pyc ├── dpo_trainer.cpython-310.pyc ├── iterative_sft_trainer.cpython-310.pyc ├── model_config.cpython-310.pyc ├── ppo_config.cpython-310.pyc ├── ppo_trainer.cpython-310.pyc ├── reward_config.cpython-310.pyc ├── reward_trainer.cpython-310.pyc ├── sft_trainer.cpython-310.pyc └── utils.cpython-310.pyc ├── base.py ├── ddpo_config.py ├── ddpo_trainer.py ├── dpo_trainer.py ├── iterative_sft_trainer.py ├── model_config.py ├── ppo_config.py ├── ppo_trainer.py ├── reward_config.py ├── reward_trainer.py ├── sft_trainer.py └── utils.py /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/README.md -------------------------------------------------------------------------------- /VLMEvalKit/.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/.gitignore -------------------------------------------------------------------------------- /VLMEvalKit/.pre-commit-config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/.pre-commit-config.yaml -------------------------------------------------------------------------------- /VLMEvalKit/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/LICENSE -------------------------------------------------------------------------------- /VLMEvalKit/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/README.md -------------------------------------------------------------------------------- /VLMEvalKit/assets/LOGO.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/assets/LOGO.svg -------------------------------------------------------------------------------- /VLMEvalKit/assets/apple.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/assets/apple.jpg -------------------------------------------------------------------------------- /VLMEvalKit/debug_load.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/debug_load.py -------------------------------------------------------------------------------- /VLMEvalKit/docs/en/.readthedocs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/en/.readthedocs.yaml -------------------------------------------------------------------------------- /VLMEvalKit/docs/en/ConfigSystem.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/en/ConfigSystem.md -------------------------------------------------------------------------------- /VLMEvalKit/docs/en/Contributors.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/en/Contributors.md -------------------------------------------------------------------------------- /VLMEvalKit/docs/en/Development.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/en/Development.md -------------------------------------------------------------------------------- /VLMEvalKit/docs/en/EvalByLMDeploy.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/en/EvalByLMDeploy.md -------------------------------------------------------------------------------- /VLMEvalKit/docs/en/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/en/Makefile -------------------------------------------------------------------------------- /VLMEvalKit/docs/en/Quickstart.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/en/Quickstart.md -------------------------------------------------------------------------------- /VLMEvalKit/docs/en/_static/css/readthedocs.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/en/_static/css/readthedocs.css -------------------------------------------------------------------------------- /VLMEvalKit/docs/en/_static/image/logo.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/en/_static/image/logo.svg -------------------------------------------------------------------------------- /VLMEvalKit/docs/en/_static/image/logo_icon.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/en/_static/image/logo_icon.svg -------------------------------------------------------------------------------- /VLMEvalKit/docs/en/_static/js/custom.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/en/_static/js/custom.js -------------------------------------------------------------------------------- /VLMEvalKit/docs/en/_templates/404.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/en/_templates/404.html -------------------------------------------------------------------------------- /VLMEvalKit/docs/en/_templates/autosummary/class.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/en/_templates/autosummary/class.rst -------------------------------------------------------------------------------- /VLMEvalKit/docs/en/_templates/callable.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/en/_templates/callable.rst -------------------------------------------------------------------------------- /VLMEvalKit/docs/en/conf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/en/conf.py -------------------------------------------------------------------------------- /VLMEvalKit/docs/en/docutils.conf: -------------------------------------------------------------------------------- 1 | [html writers] 2 | table_style: colwidths-auto 3 | -------------------------------------------------------------------------------- /VLMEvalKit/docs/en/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/en/index.rst -------------------------------------------------------------------------------- /VLMEvalKit/docs/ja/README_ja.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/ja/README_ja.md -------------------------------------------------------------------------------- /VLMEvalKit/docs/zh-CN/.readthedocs.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/zh-CN/.readthedocs.yaml -------------------------------------------------------------------------------- /VLMEvalKit/docs/zh-CN/ConfigSystem.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/zh-CN/ConfigSystem.md -------------------------------------------------------------------------------- /VLMEvalKit/docs/zh-CN/Development.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/zh-CN/Development.md -------------------------------------------------------------------------------- /VLMEvalKit/docs/zh-CN/EvalByLMDeploy.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/zh-CN/EvalByLMDeploy.md -------------------------------------------------------------------------------- /VLMEvalKit/docs/zh-CN/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/zh-CN/Makefile -------------------------------------------------------------------------------- /VLMEvalKit/docs/zh-CN/Quickstart.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/zh-CN/Quickstart.md -------------------------------------------------------------------------------- /VLMEvalKit/docs/zh-CN/README_zh-CN.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/zh-CN/README_zh-CN.md -------------------------------------------------------------------------------- /VLMEvalKit/docs/zh-CN/_static/css/readthedocs.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/zh-CN/_static/css/readthedocs.css -------------------------------------------------------------------------------- /VLMEvalKit/docs/zh-CN/_static/image/logo.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/zh-CN/_static/image/logo.svg -------------------------------------------------------------------------------- /VLMEvalKit/docs/zh-CN/_static/image/logo_icon.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/zh-CN/_static/image/logo_icon.svg -------------------------------------------------------------------------------- /VLMEvalKit/docs/zh-CN/_static/js/custom.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/zh-CN/_static/js/custom.js -------------------------------------------------------------------------------- /VLMEvalKit/docs/zh-CN/_templates/404.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/zh-CN/_templates/404.html -------------------------------------------------------------------------------- /VLMEvalKit/docs/zh-CN/_templates/autosummary/class.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/zh-CN/_templates/autosummary/class.rst -------------------------------------------------------------------------------- /VLMEvalKit/docs/zh-CN/_templates/callable.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/zh-CN/_templates/callable.rst -------------------------------------------------------------------------------- /VLMEvalKit/docs/zh-CN/conf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/zh-CN/conf.py -------------------------------------------------------------------------------- /VLMEvalKit/docs/zh-CN/cp_origin_docs.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/zh-CN/cp_origin_docs.sh -------------------------------------------------------------------------------- /VLMEvalKit/docs/zh-CN/docutils.conf: -------------------------------------------------------------------------------- 1 | [html writers] 2 | table_style: colwidths-auto 3 | -------------------------------------------------------------------------------- /VLMEvalKit/docs/zh-CN/index.rst: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/docs/zh-CN/index.rst -------------------------------------------------------------------------------- /VLMEvalKit/eval_zyc_api.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/eval_zyc_api.sh -------------------------------------------------------------------------------- /VLMEvalKit/eval_zyc_moonvit.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/eval_zyc_moonvit.sh -------------------------------------------------------------------------------- /VLMEvalKit/eval_zyc_vituhd.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/eval_zyc_vituhd.sh -------------------------------------------------------------------------------- /VLMEvalKit/eval_zyc_vituhd_noupscale.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/eval_zyc_vituhd_noupscale.sh -------------------------------------------------------------------------------- /VLMEvalKit/llava/__init__.py: -------------------------------------------------------------------------------- 1 | from .model import LlavaLlamaForCausalLM 2 | -------------------------------------------------------------------------------- /VLMEvalKit/llava/constants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/constants.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/conversation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/conversation.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/eval_ai2d.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/eval_ai2d.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/eval_chartqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/eval_chartqa.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/eval_docvqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/eval_docvqa.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/eval_gpt_review.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/eval_gpt_review.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/eval_gpt_review_bench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/eval_gpt_review_bench.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/eval_gpt_review_visual.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/eval_gpt_review_visual.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/eval_pope.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/eval_pope.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/eval_rec.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/eval_rec.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/eval_science_qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/eval_science_qa.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/eval_science_qa_gpt4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/eval_science_qa_gpt4.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/eval_science_qa_gpt4_requery.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/eval_science_qa_gpt4_requery.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/eval_textvqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/eval_textvqa.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/evaluate_interleave.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/evaluate_interleave.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/generate_webpage_data_from_table.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/generate_webpage_data_from_table.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/m4c_evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/m4c_evaluator.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/model_qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/model_qa.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/model_vqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/model_vqa.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/model_vqa_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/model_vqa_loader.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/model_vqa_mmbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/model_vqa_mmbench.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/model_vqa_science.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/model_vqa_science.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/qa_baseline_gpt35.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/qa_baseline_gpt35.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/run_llava.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/run_llava.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/eval/summarize_gpt_review.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/eval/summarize_gpt_review.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/mm_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/mm_utils.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/__init__.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/apply_delta.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/apply_delta.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/builder.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/builder_new.bk: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/builder_new.bk -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/consolidate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/consolidate.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/language_model/llava_gemma.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/language_model/llava_gemma.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/language_model/llava_llama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/language_model/llava_llama.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/language_model/llava_mistral.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/language_model/llava_mistral.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/language_model/llava_mixtral.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/language_model/llava_mixtral.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/language_model/llava_mpt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/language_model/llava_mpt.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/language_model/llava_qwen.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/language_model/llava_qwen.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/language_model/llava_qwen3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/language_model/llava_qwen3.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/language_model/llava_qwen_moe.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/language_model/llava_qwen_moe.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/language_model/modeling_llama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/language_model/modeling_llama.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/llava_arch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/llava_arch.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/make_delta.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/make_delta.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/adapt_clip_vision_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/adapt_clip_vision_model.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/attn_res.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/attn_res.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/builder.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/clip_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/clip_encoder.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/dev_eva_clip/eva_clip/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/dev_eva_clip/eva_clip/__init__.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/dev_eva_clip/eva_clip/loss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/dev_eva_clip/eva_clip/loss.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/dev_eva_clip/eva_clip/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/dev_eva_clip/eva_clip/model.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/dev_eva_clip/eva_clip/openai.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/dev_eva_clip/eva_clip/openai.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/dev_eva_clip/eva_clip/rope.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/dev_eva_clip/eva_clip/rope.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/dev_eva_clip/eva_clip/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/dev_eva_clip/eva_clip/utils.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/dev_eva_clip/eva_vit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/dev_eva_clip/eva_vit.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/eva_clip/eva_clip_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/eva_clip/eva_clip_encoder.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/eva_clip/eva_clip_processors.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/eva_clip/eva_clip_processors.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/eva_clip/eva_vit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/eva_clip/eva_vit.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/eva_clip/factory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/eva_clip/factory.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/hf_vision.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/hf_vision.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/hubconf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/hubconf.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/imagebind.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/imagebind.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/modeling_moonvit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/modeling_moonvit.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/modeling_qwen2_5vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/modeling_qwen2_5vl.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/modeling_siglip2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/modeling_siglip2.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/modeling_siglip2_cjm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/modeling_siglip2_cjm.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/modeling_siglip2_ps8.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/modeling_siglip2_ps8.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/modeling_swin_siglip2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/modeling_swin_siglip2.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/modeling_swin_siglip2_new.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/modeling_swin_siglip2_new.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/modeling_swin_siglip2_zyc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/modeling_swin_siglip2_zyc.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/open_clip_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/open_clip_encoder.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_encoder/siglip_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_encoder/siglip_encoder.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_projector/adapt_spatial_resampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_projector/adapt_spatial_resampler.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_projector/builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_projector/builder.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_projector/llava_mlp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_projector/llava_mlp.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_projector/merger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_projector/merger.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_projector/mlp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_projector/mlp.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_projector/mlp_v2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_projector/mlp_v2.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_projector/percive_sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_projector/percive_sampler.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_projector/pooler_projector.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_projector/pooler_projector.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_projector/resampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_projector/resampler.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_projector/uhd_v1_resampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_projector/uhd_v1_resampler.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_resampler/builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_resampler/builder.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_resampler/masked_drop.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_resampler/masked_drop.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_resampler/perceiver.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_resampler/perceiver.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_resampler/qformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_resampler/qformer.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/multimodal_resampler/spatial_pool.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/multimodal_resampler/spatial_pool.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/model/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/model/utils.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/serve/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /VLMEvalKit/llava/serve/cli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/serve/cli.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/serve/controller.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/serve/controller.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/serve/examples/extreme_ironing.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/serve/examples/extreme_ironing.jpg -------------------------------------------------------------------------------- /VLMEvalKit/llava/serve/examples/waterview.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/serve/examples/waterview.jpg -------------------------------------------------------------------------------- /VLMEvalKit/llava/serve/gradio_multi_image.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/serve/gradio_multi_image.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/serve/gradio_web_server.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/serve/gradio_web_server.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/serve/model_worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/serve/model_worker.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/serve/register_worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/serve/register_worker.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/serve/sglang_worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/serve/sglang_worker.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/serve/test_message.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/serve/test_message.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/slice_process.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/slice_process.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/train/llama_flash_attn_monkey_patch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/train/llama_flash_attn_monkey_patch.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/train/llava_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/train/llava_trainer.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/train/llava_trainer_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/train/llava_trainer_eval.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/train/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/train/train.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/train/train_dpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/train/train_dpo.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/train/train_mem.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/train/train_mem.py -------------------------------------------------------------------------------- /VLMEvalKit/llava/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/llava/utils.py -------------------------------------------------------------------------------- /VLMEvalKit/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/requirements.txt -------------------------------------------------------------------------------- /VLMEvalKit/requirements/docs.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/requirements/docs.txt -------------------------------------------------------------------------------- /VLMEvalKit/run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/run.py -------------------------------------------------------------------------------- /VLMEvalKit/scripts/AI2D_preproc.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/scripts/AI2D_preproc.ipynb -------------------------------------------------------------------------------- /VLMEvalKit/scripts/apires_scan.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/scripts/apires_scan.py -------------------------------------------------------------------------------- /VLMEvalKit/scripts/auto_run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/scripts/auto_run.py -------------------------------------------------------------------------------- /VLMEvalKit/scripts/cover.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/scripts/cover.sh -------------------------------------------------------------------------------- /VLMEvalKit/scripts/data_browser.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/scripts/data_browser.py -------------------------------------------------------------------------------- /VLMEvalKit/scripts/mmb_eval_gradio.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/scripts/mmb_eval_gradio.py -------------------------------------------------------------------------------- /VLMEvalKit/scripts/run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/scripts/run.sh -------------------------------------------------------------------------------- /VLMEvalKit/scripts/srun.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/scripts/srun.sh -------------------------------------------------------------------------------- /VLMEvalKit/scripts/summarize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/scripts/summarize.py -------------------------------------------------------------------------------- /VLMEvalKit/scripts/visualize.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/scripts/visualize.ipynb -------------------------------------------------------------------------------- /VLMEvalKit/setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/setup.py -------------------------------------------------------------------------------- /VLMEvalKit/test_vlm_load.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/test_vlm_load.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/__init__.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/api/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/api/__init__.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/api/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/api/base.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/api/bluelm_v_api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/api/bluelm_v_api.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/api/claude.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/api/claude.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/api/cloudwalk.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/api/cloudwalk.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/api/doubao_vl_api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/api/doubao_vl_api.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/api/gemini.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/api/gemini.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/api/glm_vision.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/api/glm_vision.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/api/gpt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/api/gpt.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/api/hf_chat_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/api/hf_chat_model.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/api/hunyuan.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/api/hunyuan.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/api/jt_vl_chat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/api/jt_vl_chat.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/api/lmdeploy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/api/lmdeploy.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/api/mug_u.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/api/mug_u.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/api/qwen_api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/api/qwen_api.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/api/qwen_vl_api.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/api/qwen_vl_api.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/api/reka.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/api/reka.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/api/sensechat_vision.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/api/sensechat_vision.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/api/siliconflow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/api/siliconflow.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/api/stepai.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/api/stepai.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/api/taichu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/api/taichu.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/api/taiyi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/api/taiyi.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/config.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/GUI/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/GUI/screenspot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/GUI/screenspot.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/GUI/screenspot_pro.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/GUI/screenspot_pro.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/Omnidocbench/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/Omnidocbench/data_preprocess.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/Omnidocbench/data_preprocess.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/Omnidocbench/metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/Omnidocbench/metrics.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/Omnidocbench/omnidocbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/Omnidocbench/omnidocbench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/Omnidocbench/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/Omnidocbench/requirements.txt -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/Omnidocbench/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/Omnidocbench/utils.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/__init__.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/cgbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/cgbench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/charxiv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/charxiv.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/cmmmu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/cmmmu.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/creation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/creation.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/dude.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/dude.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/dynamath.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/dynamath.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/emma.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/emma.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/gobench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/gobench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/image_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/image_base.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/image_caption.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/image_caption.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/image_ccocr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/image_ccocr.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/image_mcq.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/image_mcq.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/image_mt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/image_mt.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/image_shortqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/image_shortqa.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/image_vqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/image_vqa.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/image_yorn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/image_yorn.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/longvideobench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/longvideobench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/megabench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/megabench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/miabench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/miabench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/mlvu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/mlvu.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/mmalignbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/mmalignbench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/mmbench_video.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/mmbench_video.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/mmgenbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/mmgenbench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/mmifeval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/mmifeval.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/mmlongbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/mmlongbench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/mmmath.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/mmmath.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/moat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/moat.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/moviechat1k.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/moviechat1k.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/mvbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/mvbench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/qbench_video.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/qbench_video.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/slidevqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/slidevqa.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/spatial457.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/spatial457.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/tamperbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/tamperbench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/tempcompass.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/tempcompass.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/text_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/text_base.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/text_mcq.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/text_mcq.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/__init__.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/ccocr_evaluator/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/ccocr_evaluator/README.md -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/ccocr_evaluator/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/ccocr_evaluator/__init__.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/ccocr_evaluator/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/ccocr_evaluator/common.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/ccocr_evaluator/doc_parsing_evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/ccocr_evaluator/doc_parsing_evaluator.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/ccocr_evaluator/kie_evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/ccocr_evaluator/kie_evaluator.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/ccocr_evaluator/ocr_evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/ccocr_evaluator/ocr_evaluator.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/cgbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/cgbench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/crpe.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/crpe.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/hrbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/hrbench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/judge_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/judge_util.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/llavabench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/llavabench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/logicvista.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/logicvista.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/longvideobench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/longvideobench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/mathv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/mathv.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/mathverse.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/mathverse.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/mathvista.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/mathvista.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/README.md -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/__init__.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/aggregation/mean_agg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/aggregation/mean_agg.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/aggregation/min_agg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/aggregation/min_agg.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/aggregation/unsupported_agg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/aggregation/unsupported_agg.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/aggregation_type.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/aggregation_type.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/evaluator.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/metric_type.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/metric_type.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/parsing/answer_str_parse.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/parsing/answer_str_parse.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/parsing/common/parsers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/parsing/common/parsers.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/parsing/common/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/parsing/common/utils.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/parsing/dummy_parse.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/parsing/dummy_parse.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/parsing/json_parse.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/parsing/json_parse.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/requirements.txt -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/response_parse_type.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/response_parse_type.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/chess_jaccard.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/chess_jaccard.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/common/conversions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/common/conversions.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/common/metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/common/metrics.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/dict_equality.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/dict_equality.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/exact_str_match.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/exact_str_match.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/geo_proximity.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/geo_proximity.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/gleu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/gleu.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/jaccard.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/jaccard.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/latex_expr_equality.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/latex_expr_equality.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/mse.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/mse.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/multi_ref_phrase.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/multi_ref_phrase.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/nbbox_iou.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/nbbox_iou.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/near_str_match.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/near_str_match.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/nli_entailment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/nli_entailment.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/positive_int_match.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/positive_int_match.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/program_judge.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/program_judge.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/sacrebleu_bleu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/sacrebleu_bleu.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/sequence_equality.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/sequence_equality.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/set_equality.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/set_equality.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/set_precision.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/set_precision.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/simple_str_match.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/simple_str_match.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/symbolic_planning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/symbolic_planning.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/unsupported_scoring.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/unsupported_scoring.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/vlm_as_judge.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/vlm_as_judge.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/xml_nbbox_iou.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/scoring/xml_nbbox_iou.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/megabench/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/megabench/utils.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/mlvu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/mlvu.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/mmbench_video.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/mmbench_video.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/mmdu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/mmdu.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/mmif/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/mmif/function_and_compare.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/mmif/function_and_compare.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/mmniah.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/mmniah.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/mmsci.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/mmsci.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/mmsci4eval_req.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/mmsci4eval_req.txt -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/mmvet.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/mmvet.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/moviechat1k.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/moviechat1k.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/multiple_choice.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/multiple_choice.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/mvbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/mvbench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/naturalbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/naturalbench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/ocr_reasoning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/ocr_reasoning.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/ocrbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/ocrbench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/olympiadbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/olympiadbench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/omni3dbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/omni3dbench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/physic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/physic.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/physics_eval_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/physics_eval_utils.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/phyx.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/phyx.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/qbench_video.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/qbench_video.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/qspatial.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/qspatial.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/shortqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/shortqa.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/spatial457.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/spatial457.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/tablevqabench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/tablevqabench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/tallyqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/tallyqa.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/tamperbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/tamperbench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/tdbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/tdbench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/tempcompass.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/tempcompass.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vdc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vdc.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/evaluation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/evaluation.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/aquarium.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/aquarium.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/battleships.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/battleships.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/binairo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/binairo.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/coloredsudoku.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/coloredsudoku.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/common_constriants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/common_constriants.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/common_get_prompt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/common_get_prompt.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/fieldexplore.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/fieldexplore.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/futoshiki.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/futoshiki.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/hitori.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/hitori.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/jigsawsudoku.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/jigsawsudoku.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/kakurasu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/kakurasu.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/kakuro.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/kakuro.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/killersudoku.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/killersudoku.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/lightup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/lightup.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/nonogram.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/nonogram.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/oddevensudoku.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/oddevensudoku.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/renzoku.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/renzoku.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/skyscraper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/skyscraper.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/starbattle.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/starbattle.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/sudoku.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/sudoku.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/thermometers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/thermometers.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/treesandtents.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/puzzles/treesandtents.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vgrpbench/score.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vgrpbench/score.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/video_mmlu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/video_mmlu.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/videoholmes.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/videoholmes.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/videomme.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/videomme.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/visulogic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/visulogic.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vlm2bench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vlm2bench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vmcbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vmcbench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/vqa_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/vqa_eval.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/wemath.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/wemath.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/worldsense.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/worldsense.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/utils/yorn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/utils/yorn.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/vcr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/vcr.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/vdc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/vdc.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/video_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/video_base.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/video_concat_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/video_concat_dataset.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/video_dataset_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/video_dataset_config.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/video_holmes.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/video_holmes.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/video_mmlu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/video_mmlu.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/videomme.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/videomme.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/vl_rewardbench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/vl_rewardbench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/vlm2bench.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/vlm2bench.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/wildvision.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/wildvision.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/dataset/worldsense.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/dataset/worldsense.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/inference.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/inference_mt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/inference_mt.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/inference_video.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/inference_video.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/smp/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/smp/__init__.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/smp/file.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/smp/file.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/smp/log.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/smp/log.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/smp/misc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/smp/misc.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/smp/vlm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/smp/vlm.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/tools.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/tools.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/utils/__init__.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/utils/extract_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/utils/extract_utils.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/utils/matching_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/utils/matching_util.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/utils/mp_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/utils/mp_util.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/utils/result_transfer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/utils/result_transfer.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/__init__.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/aki.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/aki.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/aria.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/aria.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/base.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/bunnyllama3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/bunnyllama3.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/cambrian.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/cambrian.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/chameleon.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/chameleon.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/cogvlm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/cogvlm.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/deepseek_vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/deepseek_vl.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/deepseek_vl2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/deepseek_vl2.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/eagle_x.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/eagle_x.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/emu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/emu.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/falcon_vlm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/falcon_vlm.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/flash_vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/flash_vl.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/gemma.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/gemma.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/h2ovl_mississippi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/h2ovl_mississippi.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/idefics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/idefics.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/instructblip.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/instructblip.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/janus.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/janus.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/kimi_vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/kimi_vl.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/kosmos.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/kosmos.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/llama4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/llama4.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/llama_vision.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/llama_vision.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/llava/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/llava/__init__.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/llava/llava.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/llava/llava.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/llava/llava_xtuner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/llava/llava_xtuner.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/llava_qwen2_base_new.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/llava_qwen2_base_new.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/llava_qwen2_uhd_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/llava_qwen2_uhd_v3.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/llava_uhd_siglip2_2048.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/llava_uhd_siglip2_2048.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/llava_uhd_v3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/llava_uhd_v3.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/long_vita.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/long_vita.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/mantis.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/mantis.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/mgm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/mgm.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/minicpm_v.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/minicpm_v.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/minigpt4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/minigpt4.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/minimonkey.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/minimonkey.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/misc/blip2_instruct_vicuna13b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/misc/blip2_instruct_vicuna13b.yaml -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/misc/blip2_instruct_vicuna7b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/misc/blip2_instruct_vicuna7b.yaml -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/misc/minigpt4_13b_eval.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/misc/minigpt4_13b_eval.yaml -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/misc/minigpt4_7b_eval.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/misc/minigpt4_7b_eval.yaml -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/misc/minigptv2_eval.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/misc/minigptv2_eval.yaml -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/mixsense.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/mixsense.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/mmalaya.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/mmalaya.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/molmo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/molmo.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/monkey.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/monkey.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/moondream.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/moondream.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/mplug_owl2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/mplug_owl2.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/mplug_owl3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/mplug_owl3.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/nvlm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/nvlm.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/__init__.py: -------------------------------------------------------------------------------- 1 | from .ola_model import Ola 2 | -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/arguments.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/arguments.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/constants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/constants.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/conversation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/conversation.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/datasets/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/datasets/preprocess.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/datasets/preprocess.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/mm_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/mm_utils.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/model/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/model/__init__.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/model/builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/model/builder.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/model/language_model/ola_qwen.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/model/language_model/ola_qwen.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/model/multimodal_encoder/builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/model/multimodal_encoder/builder.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/model/multimodal_encoder/oryx_vit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/model/multimodal_encoder/oryx_vit.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/model/multimodal_projector/builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/model/multimodal_projector/builder.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/model/multimodal_resampler/builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/model/multimodal_resampler/builder.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/model/multimodal_resampler/perceiver.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/model/multimodal_resampler/perceiver.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/model/ola_arch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/model/ola_arch.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/model/speech_encoder/beats/BEATs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/model/speech_encoder/beats/BEATs.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/model/speech_encoder/beats/Tokenizers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/model/speech_encoder/beats/Tokenizers.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/model/speech_encoder/beats/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/model/speech_encoder/beats/backbone.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/model/speech_encoder/beats/backbone.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/model/speech_encoder/beats/kaldi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/model/speech_encoder/beats/kaldi.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/model/speech_encoder/beats/modules.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/model/speech_encoder/beats/modules.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/model/speech_encoder/beats/quantizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/model/speech_encoder/beats/quantizer.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/model/speech_encoder/builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/model/speech_encoder/builder.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/model/speech_encoder/speech_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/model/speech_encoder/speech_encoder.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/model/speech_projector/builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/model/speech_projector/builder.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/model/speech_projector/speech_projector.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/model/speech_projector/speech_projector.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola/utils.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ola/ola_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ola/ola_model.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/omchat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/omchat.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/omnilmm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/omnilmm.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/open_flamingo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/open_flamingo.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ovis/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ovis/__init__.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ovis/ovis.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ovis/ovis.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ovis/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ovis/utils/mdp3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ovis/utils/mdp3.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/pandagpt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/pandagpt.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/parrot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/parrot.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/phi3_vision.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/phi3_vision.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/phi4_multimodal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/phi4_multimodal.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/pixtral.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/pixtral.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/points.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/points.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/qh_360vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/qh_360vl.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/qwen2_vl/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/qwen2_vl/__init__.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/qwen2_vl/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/qwen2_vl/model.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/qwen2_vl/prompt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/qwen2_vl/prompt.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/qwen_vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/qwen_vl.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/rbdash.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/rbdash.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ristretto.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ristretto.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ross.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ross.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/sail_vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/sail_vl.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/slime.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/slime.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/smolvlm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/smolvlm.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/transcore_m.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/transcore_m.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ursa/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ursa/__init__.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ursa/ursa_chat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ursa/ursa_chat.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ursa/ursa_model/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ursa/ursa_model/__init__.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ursa/ursa_model/clip_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ursa/ursa_model/clip_encoder.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ursa/ursa_model/configuration_ursa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ursa/ursa_model/configuration_ursa.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ursa/ursa_model/image_processing_vlm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ursa/ursa_model/image_processing_vlm.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ursa/ursa_model/modeling_ursa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ursa/ursa_model/modeling_ursa.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ursa/ursa_model/processing_ursa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ursa/ursa_model/processing_ursa.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ursa/ursa_model/projector.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ursa/ursa_model/projector.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ursa/ursa_model/sam.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ursa/ursa_model/sam.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/ursa/ursa_model/siglip_vit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/ursa/ursa_model/siglip_vit.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/valley/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/valley/__init__.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/valley/requirements_valley.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/valley/requirements_valley.txt -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/valley/valley.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/valley/valley.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/video_llm/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/video_llm/__init__.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/video_llm/chat_uni_vi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/video_llm/chat_uni_vi.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/video_llm/configs/videochat2_hd.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/video_llm/configs/videochat2_hd.json -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/video_llm/llama_vid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/video_llm/llama_vid.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/video_llm/pllava.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/video_llm/pllava.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/video_llm/video_chatgpt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/video_llm/video_chatgpt.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/video_llm/video_llava.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/video_llm/video_llava.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/video_llm/videochat2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/video_llm/videochat2.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/vila.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/vila.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/vintern_chat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/vintern_chat.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/visualglm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/visualglm.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/vita.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/vita.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/vlaa_thinker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/vlaa_thinker.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/vlm_r1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/vlm_r1.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/vxverse.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/vxverse.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/wemm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/wemm.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/wethink_vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/wethink_vl.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/xcomposer/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/xcomposer/__init__.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/xcomposer/sharecaptioner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/xcomposer/sharecaptioner.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/xcomposer/xcomposer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/xcomposer/xcomposer.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/xcomposer/xcomposer2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/xcomposer/xcomposer2.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/xcomposer/xcomposer2_4KHD.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/xcomposer/xcomposer2_4KHD.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/xcomposer/xcomposer2d5.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/xcomposer/xcomposer2d5.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/xgen_mm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/xgen_mm.py -------------------------------------------------------------------------------- /VLMEvalKit/vlmeval/vlm/yi_vl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/VLMEvalKit/vlmeval/vlm/yi_vl.py -------------------------------------------------------------------------------- /cog.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/cog.yaml -------------------------------------------------------------------------------- /featup/__init__.py: -------------------------------------------------------------------------------- 1 | from featup.upsamplers import JBULearnedRange -------------------------------------------------------------------------------- /featup/adaptive_conv_cuda/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /featup/adaptive_conv_cuda/adaptive_conv.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/adaptive_conv_cuda/adaptive_conv.cpp -------------------------------------------------------------------------------- /featup/adaptive_conv_cuda/adaptive_conv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/adaptive_conv_cuda/adaptive_conv.py -------------------------------------------------------------------------------- /featup/adaptive_conv_cuda/adaptive_conv_cuda.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/adaptive_conv_cuda/adaptive_conv_cuda.cpp -------------------------------------------------------------------------------- /featup/adaptive_conv_cuda/adaptive_conv_kernel.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/adaptive_conv_cuda/adaptive_conv_kernel.cu -------------------------------------------------------------------------------- /featup/configs/implicit_upsampler.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/configs/implicit_upsampler.yaml -------------------------------------------------------------------------------- /featup/configs/jbu_upsampler.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/configs/jbu_upsampler.yaml -------------------------------------------------------------------------------- /featup/configs/train_probe.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/configs/train_probe.yaml -------------------------------------------------------------------------------- /featup/configs/validate_train_probe.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/configs/validate_train_probe.yaml -------------------------------------------------------------------------------- /featup/datasets/COCO.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/datasets/COCO.py -------------------------------------------------------------------------------- /featup/datasets/DAVIS.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/datasets/DAVIS.py -------------------------------------------------------------------------------- /featup/datasets/DOC.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/datasets/DOC.py -------------------------------------------------------------------------------- /featup/datasets/DocSceneText.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/datasets/DocSceneText.py -------------------------------------------------------------------------------- /featup/datasets/EmbeddingFile.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/datasets/EmbeddingFile.py -------------------------------------------------------------------------------- /featup/datasets/HTML.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/datasets/HTML.py -------------------------------------------------------------------------------- /featup/datasets/HighResEmbs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/datasets/HighResEmbs.py -------------------------------------------------------------------------------- /featup/datasets/ImageNetSubset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/datasets/ImageNetSubset.py -------------------------------------------------------------------------------- /featup/datasets/JitteredImage.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/datasets/JitteredImage.py -------------------------------------------------------------------------------- /featup/datasets/SCENE.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/datasets/SCENE.py -------------------------------------------------------------------------------- /featup/datasets/SampleImage.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/datasets/SampleImage.py -------------------------------------------------------------------------------- /featup/datasets/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /featup/datasets/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/datasets/util.py -------------------------------------------------------------------------------- /featup/downsamplers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/downsamplers.py -------------------------------------------------------------------------------- /featup/featurizers/CLIP.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/CLIP.py -------------------------------------------------------------------------------- /featup/featurizers/CLIPLarge.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/CLIPLarge.py -------------------------------------------------------------------------------- /featup/featurizers/ClipEncoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/ClipEncoder.py -------------------------------------------------------------------------------- /featup/featurizers/DINO.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/DINO.py -------------------------------------------------------------------------------- /featup/featurizers/DINOv2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/DINOv2.py -------------------------------------------------------------------------------- /featup/featurizers/DeepLabV3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/DeepLabV3.py -------------------------------------------------------------------------------- /featup/featurizers/MAE.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/MAE.py -------------------------------------------------------------------------------- /featup/featurizers/MIDAS.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/MIDAS.py -------------------------------------------------------------------------------- /featup/featurizers/MaskCLIP.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/MaskCLIP.py -------------------------------------------------------------------------------- /featup/featurizers/ResNet.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/ResNet.py -------------------------------------------------------------------------------- /featup/featurizers/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /featup/featurizers/dinov2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /featup/featurizers/dinov2/layers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/dinov2/layers/__init__.py -------------------------------------------------------------------------------- /featup/featurizers/dinov2/layers/attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/dinov2/layers/attention.py -------------------------------------------------------------------------------- /featup/featurizers/dinov2/layers/block.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/dinov2/layers/block.py -------------------------------------------------------------------------------- /featup/featurizers/dinov2/layers/dino_head.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/dinov2/layers/dino_head.py -------------------------------------------------------------------------------- /featup/featurizers/dinov2/layers/drop_path.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/dinov2/layers/drop_path.py -------------------------------------------------------------------------------- /featup/featurizers/dinov2/layers/layer_scale.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/dinov2/layers/layer_scale.py -------------------------------------------------------------------------------- /featup/featurizers/dinov2/layers/mlp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/dinov2/layers/mlp.py -------------------------------------------------------------------------------- /featup/featurizers/dinov2/layers/patch_embed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/dinov2/layers/patch_embed.py -------------------------------------------------------------------------------- /featup/featurizers/dinov2/layers/swiglu_ffn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/dinov2/layers/swiglu_ffn.py -------------------------------------------------------------------------------- /featup/featurizers/maskclip/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/maskclip/README.md -------------------------------------------------------------------------------- /featup/featurizers/maskclip/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/maskclip/__init__.py -------------------------------------------------------------------------------- /featup/featurizers/maskclip/bpe_simple_vocab_16e6.txt.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/maskclip/bpe_simple_vocab_16e6.txt.gz -------------------------------------------------------------------------------- /featup/featurizers/maskclip/clip.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/maskclip/clip.py -------------------------------------------------------------------------------- /featup/featurizers/maskclip/interpolate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/maskclip/interpolate.py -------------------------------------------------------------------------------- /featup/featurizers/maskclip/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/maskclip/model.py -------------------------------------------------------------------------------- /featup/featurizers/maskclip/simple_tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/maskclip/simple_tokenizer.py -------------------------------------------------------------------------------- /featup/featurizers/modules/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /featup/featurizers/modules/layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/modules/layers.py -------------------------------------------------------------------------------- /featup/featurizers/modules/resnet.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/modules/resnet.py -------------------------------------------------------------------------------- /featup/featurizers/modules/vgg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/modules/vgg.py -------------------------------------------------------------------------------- /featup/featurizers/siglip.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/siglip.py -------------------------------------------------------------------------------- /featup/featurizers/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/featurizers/util.py -------------------------------------------------------------------------------- /featup/layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/layers.py -------------------------------------------------------------------------------- /featup/losses.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/losses.py -------------------------------------------------------------------------------- /featup/plotting.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/plotting.py -------------------------------------------------------------------------------- /featup/upsamplers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/upsamplers.py -------------------------------------------------------------------------------- /featup/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/util.py -------------------------------------------------------------------------------- /featup/validate_probes.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/featup/validate_probes.py -------------------------------------------------------------------------------- /figs/LLaVA_UHD_v3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/figs/LLaVA_UHD_v3.png -------------------------------------------------------------------------------- /figs/ViT-UHD-performance-figure.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/figs/ViT-UHD-performance-figure.png -------------------------------------------------------------------------------- /figs/ViTUHD-performace.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/figs/ViTUHD-performace.png -------------------------------------------------------------------------------- /figs/github_banner.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/figs/github_banner.png -------------------------------------------------------------------------------- /figs/github_banner_puretext.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/figs/github_banner_puretext.png -------------------------------------------------------------------------------- /figs/mllm_numeric_figure_pt1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/figs/mllm_numeric_figure_pt1.png -------------------------------------------------------------------------------- /figs/mllm_numeric_figure_pt2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/figs/mllm_numeric_figure_pt2.png -------------------------------------------------------------------------------- /figs/performance&efficiency&radar.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/figs/performance&efficiency&radar.jpg -------------------------------------------------------------------------------- /figs/radar_and_mllm_perfo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/figs/radar_and_mllm_perfo.png -------------------------------------------------------------------------------- /llava.egg-info/PKG-INFO: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava.egg-info/PKG-INFO -------------------------------------------------------------------------------- /llava.egg-info/SOURCES.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava.egg-info/SOURCES.txt -------------------------------------------------------------------------------- /llava.egg-info/dependency_links.txt: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /llava.egg-info/requires.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava.egg-info/requires.txt -------------------------------------------------------------------------------- /llava.egg-info/top_level.txt: -------------------------------------------------------------------------------- 1 | llava 2 | trl 3 | -------------------------------------------------------------------------------- /llava/__init__.py: -------------------------------------------------------------------------------- 1 | from .model import LlavaLlamaForCausalLM 2 | -------------------------------------------------------------------------------- /llava/__pycache__/__init__.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/__pycache__/__init__.cpython-310.pyc -------------------------------------------------------------------------------- /llava/__pycache__/constants.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/__pycache__/constants.cpython-310.pyc -------------------------------------------------------------------------------- /llava/__pycache__/conversation.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/__pycache__/conversation.cpython-310.pyc -------------------------------------------------------------------------------- /llava/__pycache__/mm_utils.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/__pycache__/mm_utils.cpython-310.pyc -------------------------------------------------------------------------------- /llava/__pycache__/slice_process.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/__pycache__/slice_process.cpython-310.pyc -------------------------------------------------------------------------------- /llava/__pycache__/utils.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/__pycache__/utils.cpython-310.pyc -------------------------------------------------------------------------------- /llava/constants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/constants.py -------------------------------------------------------------------------------- /llava/conversation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/conversation.py -------------------------------------------------------------------------------- /llava/mm_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/mm_utils.py -------------------------------------------------------------------------------- /llava/model/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/__init__.py -------------------------------------------------------------------------------- /llava/model/__pycache__/__init__.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/__pycache__/__init__.cpython-310.pyc -------------------------------------------------------------------------------- /llava/model/__pycache__/llava_arch.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/__pycache__/llava_arch.cpython-310.pyc -------------------------------------------------------------------------------- /llava/model/builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/builder.py -------------------------------------------------------------------------------- /llava/model/consolidate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/consolidate.py -------------------------------------------------------------------------------- /llava/model/language_model/__pycache__/llava_llama.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/language_model/__pycache__/llava_llama.cpython-310.pyc -------------------------------------------------------------------------------- /llava/model/language_model/__pycache__/llava_mistral.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/language_model/__pycache__/llava_mistral.cpython-310.pyc -------------------------------------------------------------------------------- /llava/model/language_model/__pycache__/llava_mixtral.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/language_model/__pycache__/llava_mixtral.cpython-310.pyc -------------------------------------------------------------------------------- /llava/model/language_model/__pycache__/llava_qwen.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/language_model/__pycache__/llava_qwen.cpython-310.pyc -------------------------------------------------------------------------------- /llava/model/language_model/__pycache__/llava_qwen3.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/language_model/__pycache__/llava_qwen3.cpython-310.pyc -------------------------------------------------------------------------------- /llava/model/language_model/llava_llama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/language_model/llava_llama.py -------------------------------------------------------------------------------- /llava/model/language_model/llava_qwen.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/language_model/llava_qwen.py -------------------------------------------------------------------------------- /llava/model/language_model/llava_qwen3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/language_model/llava_qwen3.py -------------------------------------------------------------------------------- /llava/model/llava_arch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/llava_arch.py -------------------------------------------------------------------------------- /llava/model/multimodal_encoder/__pycache__/builder.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_encoder/__pycache__/builder.cpython-310.pyc -------------------------------------------------------------------------------- /llava/model/multimodal_encoder/__pycache__/hf_vision.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_encoder/__pycache__/hf_vision.cpython-310.pyc -------------------------------------------------------------------------------- /llava/model/multimodal_encoder/__pycache__/imagebind.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_encoder/__pycache__/imagebind.cpython-310.pyc -------------------------------------------------------------------------------- /llava/model/multimodal_encoder/builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_encoder/builder.py -------------------------------------------------------------------------------- /llava/model/multimodal_encoder/modeling_moonvit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_encoder/modeling_moonvit.py -------------------------------------------------------------------------------- /llava/model/multimodal_encoder/modeling_siglip2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_encoder/modeling_siglip2.py -------------------------------------------------------------------------------- /llava/model/multimodal_projector/__pycache__/builder.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_projector/__pycache__/builder.cpython-310.pyc -------------------------------------------------------------------------------- /llava/model/multimodal_projector/__pycache__/llava_mlp.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_projector/__pycache__/llava_mlp.cpython-310.pyc -------------------------------------------------------------------------------- /llava/model/multimodal_projector/__pycache__/merger.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_projector/__pycache__/merger.cpython-310.pyc -------------------------------------------------------------------------------- /llava/model/multimodal_projector/__pycache__/resampler.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_projector/__pycache__/resampler.cpython-310.pyc -------------------------------------------------------------------------------- /llava/model/multimodal_projector/builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_projector/builder.py -------------------------------------------------------------------------------- /llava/model/multimodal_projector/llava_mlp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_projector/llava_mlp.py -------------------------------------------------------------------------------- /llava/model/multimodal_projector/merger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_projector/merger.py -------------------------------------------------------------------------------- /llava/model/multimodal_projector/resampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_projector/resampler.py -------------------------------------------------------------------------------- /llava/model/multimodal_projector/uhd_v1_resampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_projector/uhd_v1_resampler.py -------------------------------------------------------------------------------- /llava/model/multimodal_resampler/__pycache__/builder.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_resampler/__pycache__/builder.cpython-310.pyc -------------------------------------------------------------------------------- /llava/model/multimodal_resampler/__pycache__/masked_drop.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_resampler/__pycache__/masked_drop.cpython-310.pyc -------------------------------------------------------------------------------- /llava/model/multimodal_resampler/__pycache__/perceiver.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_resampler/__pycache__/perceiver.cpython-310.pyc -------------------------------------------------------------------------------- /llava/model/multimodal_resampler/__pycache__/qformer.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_resampler/__pycache__/qformer.cpython-310.pyc -------------------------------------------------------------------------------- /llava/model/multimodal_resampler/__pycache__/spatial_pool.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_resampler/__pycache__/spatial_pool.cpython-310.pyc -------------------------------------------------------------------------------- /llava/model/multimodal_resampler/builder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_resampler/builder.py -------------------------------------------------------------------------------- /llava/model/multimodal_resampler/masked_drop.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_resampler/masked_drop.py -------------------------------------------------------------------------------- /llava/model/multimodal_resampler/perceiver.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_resampler/perceiver.py -------------------------------------------------------------------------------- /llava/model/multimodal_resampler/qformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_resampler/qformer.py -------------------------------------------------------------------------------- /llava/model/multimodal_resampler/spatial_pool.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/multimodal_resampler/spatial_pool.py -------------------------------------------------------------------------------- /llava/model/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/model/utils.py -------------------------------------------------------------------------------- /llava/serve/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /llava/serve/cli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/serve/cli.py -------------------------------------------------------------------------------- /llava/serve/controller.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/serve/controller.py -------------------------------------------------------------------------------- /llava/serve/gradio_multi_image.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/serve/gradio_multi_image.py -------------------------------------------------------------------------------- /llava/serve/gradio_web_server.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/serve/gradio_web_server.py -------------------------------------------------------------------------------- /llava/serve/model_worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/serve/model_worker.py -------------------------------------------------------------------------------- /llava/serve/register_worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/serve/register_worker.py -------------------------------------------------------------------------------- /llava/serve/sglang_worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/serve/sglang_worker.py -------------------------------------------------------------------------------- /llava/serve/test_message.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/serve/test_message.py -------------------------------------------------------------------------------- /llava/slice_process.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/slice_process.py -------------------------------------------------------------------------------- /llava/train/__pycache__/llava_trainer.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/train/__pycache__/llava_trainer.cpython-310.pyc -------------------------------------------------------------------------------- /llava/train/__pycache__/train.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/train/__pycache__/train.cpython-310.pyc -------------------------------------------------------------------------------- /llava/train/llava_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/train/llava_trainer.py -------------------------------------------------------------------------------- /llava/train/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/train/train.py -------------------------------------------------------------------------------- /llava/train/train_mem.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/train/train_mem.py -------------------------------------------------------------------------------- /llava/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/llava/utils.py -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/pyproject.toml -------------------------------------------------------------------------------- /requirements.bak: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/requirements.bak -------------------------------------------------------------------------------- /scripts/archived/convert_gqa_for_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/convert_gqa_for_eval.py -------------------------------------------------------------------------------- /scripts/archived/convert_mmvet_for_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/convert_mmvet_for_eval.py -------------------------------------------------------------------------------- /scripts/archived/convert_sqa_to_llava.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/convert_sqa_to_llava.py -------------------------------------------------------------------------------- /scripts/archived/convert_sqa_to_llava_base_prompt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/convert_sqa_to_llava_base_prompt.py -------------------------------------------------------------------------------- /scripts/archived/convert_vizwiz_for_submission.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/convert_vizwiz_for_submission.py -------------------------------------------------------------------------------- /scripts/archived/convert_vqav2_for_submission.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/convert_vqav2_for_submission.py -------------------------------------------------------------------------------- /scripts/archived/data_info.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/data_info.py -------------------------------------------------------------------------------- /scripts/archived/dpo_data_info.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/dpo_data_info.py -------------------------------------------------------------------------------- /scripts/archived/finetune.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/finetune.sh -------------------------------------------------------------------------------- /scripts/archived/finetune_1.5.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/finetune_1.5.sh -------------------------------------------------------------------------------- /scripts/archived/finetune_full_schedule.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/finetune_full_schedule.sh -------------------------------------------------------------------------------- /scripts/archived/finetune_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/finetune_lora.sh -------------------------------------------------------------------------------- /scripts/archived/finetune_mixtral.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/finetune_mixtral.sh -------------------------------------------------------------------------------- /scripts/archived/finetune_mixtral_1.5.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/finetune_mixtral_1.5.sh -------------------------------------------------------------------------------- /scripts/archived/finetune_mixtral_1.6_336px_anyres.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/finetune_mixtral_1.6_336px_anyres.sh -------------------------------------------------------------------------------- /scripts/archived/finetune_mixtral_1.6_336px_anyres_freeze_vision.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/finetune_mixtral_1.6_336px_anyres_freeze_vision.sh -------------------------------------------------------------------------------- /scripts/archived/finetune_mixtral_1.6_336px_anyres_lmms_eval.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/finetune_mixtral_1.6_336px_anyres_lmms_eval.sh -------------------------------------------------------------------------------- /scripts/archived/finetune_mixtral_copy.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/finetune_mixtral_copy.sh -------------------------------------------------------------------------------- /scripts/archived/finetune_qlora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/finetune_qlora.sh -------------------------------------------------------------------------------- /scripts/archived/finetune_sqa.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/finetune_sqa.sh -------------------------------------------------------------------------------- /scripts/archived/merge_lora_weights.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/merge_lora_weights.py -------------------------------------------------------------------------------- /scripts/archived/pretrain.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/pretrain.sh -------------------------------------------------------------------------------- /scripts/archived/quick_check.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/quick_check.py -------------------------------------------------------------------------------- /scripts/archived/sqa_eval_batch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/sqa_eval_batch.sh -------------------------------------------------------------------------------- /scripts/archived/sqa_eval_gather.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/archived/sqa_eval_gather.sh -------------------------------------------------------------------------------- /scripts/convert_gqa_for_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/convert_gqa_for_eval.py -------------------------------------------------------------------------------- /scripts/interleave/eval_all.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/interleave/eval_all.sh -------------------------------------------------------------------------------- /scripts/interleave/eval_interleave_3d.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/interleave/eval_interleave_3d.sh -------------------------------------------------------------------------------- /scripts/interleave/eval_multiprocess.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/interleave/eval_multiprocess.sh -------------------------------------------------------------------------------- /scripts/train/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/train/README.md -------------------------------------------------------------------------------- /scripts/train/direct_finetune_clip.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/train/direct_finetune_clip.sh -------------------------------------------------------------------------------- /scripts/train/direct_finetune_siglip_a4.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/train/direct_finetune_siglip_a4.sh -------------------------------------------------------------------------------- /scripts/train/dpo.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/train/dpo.sh -------------------------------------------------------------------------------- /scripts/train/dpo_ov7b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/train/dpo_ov7b.sh -------------------------------------------------------------------------------- /scripts/train/finetune_ov.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/train/finetune_ov.sh -------------------------------------------------------------------------------- /scripts/train/finetune_si.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/train/finetune_si.sh -------------------------------------------------------------------------------- /scripts/train/mid_stage.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/train/mid_stage.yaml -------------------------------------------------------------------------------- /scripts/train/onevision.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/train/onevision.yaml -------------------------------------------------------------------------------- /scripts/train/pretrain_clip.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/train/pretrain_clip.sh -------------------------------------------------------------------------------- /scripts/train/pretrain_siglip.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/train/pretrain_siglip.sh -------------------------------------------------------------------------------- /scripts/train/single_image.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/train/single_image.yaml -------------------------------------------------------------------------------- /scripts/v1_5/eval/ai2d.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/v1_5/eval/ai2d.sh -------------------------------------------------------------------------------- /scripts/v1_5/eval/chartqa.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/v1_5/eval/chartqa.sh -------------------------------------------------------------------------------- /scripts/v1_5/eval/deepform.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/v1_5/eval/deepform.sh -------------------------------------------------------------------------------- /scripts/v1_5/eval/docvqa_test.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/v1_5/eval/docvqa_test.sh -------------------------------------------------------------------------------- /scripts/v1_5/eval/docvqa_val.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/v1_5/eval/docvqa_val.sh -------------------------------------------------------------------------------- /scripts/v1_5/eval/estvqa.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/v1_5/eval/estvqa.sh -------------------------------------------------------------------------------- /scripts/v1_5/eval/gqa.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/v1_5/eval/gqa.sh -------------------------------------------------------------------------------- /scripts/v1_5/eval/infographics.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/v1_5/eval/infographics.sh -------------------------------------------------------------------------------- /scripts/v1_5/eval/llavabench.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/v1_5/eval/llavabench.sh -------------------------------------------------------------------------------- /scripts/v1_5/eval/mmbench.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/v1_5/eval/mmbench.sh -------------------------------------------------------------------------------- /scripts/v1_5/eval/mmbench_cn.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/v1_5/eval/mmbench_cn.sh -------------------------------------------------------------------------------- /scripts/v1_5/eval/mme.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/v1_5/eval/mme.sh -------------------------------------------------------------------------------- /scripts/v1_5/eval/mmvet.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/v1_5/eval/mmvet.sh -------------------------------------------------------------------------------- /scripts/v1_5/eval/pope.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/v1_5/eval/pope.sh -------------------------------------------------------------------------------- /scripts/v1_5/eval/qbench.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/v1_5/eval/qbench.sh -------------------------------------------------------------------------------- /scripts/v1_5/eval/qbench_zh.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/v1_5/eval/qbench_zh.sh -------------------------------------------------------------------------------- /scripts/v1_5/eval/rec.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/v1_5/eval/rec.sh -------------------------------------------------------------------------------- /scripts/v1_5/eval/sqa.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/v1_5/eval/sqa.sh -------------------------------------------------------------------------------- /scripts/v1_5/eval/textvqa.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/v1_5/eval/textvqa.sh -------------------------------------------------------------------------------- /scripts/v1_5/eval/vizwiz.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/v1_5/eval/vizwiz.sh -------------------------------------------------------------------------------- /scripts/v1_5/eval/vqav2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/v1_5/eval/vqav2.sh -------------------------------------------------------------------------------- /scripts/video/demo/video_demo.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/video/demo/video_demo.sh -------------------------------------------------------------------------------- /scripts/video/eval/activitynet_eval.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/video/eval/activitynet_eval.sh -------------------------------------------------------------------------------- /scripts/video/eval/video_chatgpt_benchmark_eval_shard.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/video/eval/video_chatgpt_benchmark_eval_shard.sh -------------------------------------------------------------------------------- /scripts/video/eval/video_description_from_t2v.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/video/eval/video_description_from_t2v.sh -------------------------------------------------------------------------------- /scripts/video/eval/video_detail_description_eval_only.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/video/eval/video_detail_description_eval_only.sh -------------------------------------------------------------------------------- /scripts/video/eval/video_detail_description_eval_shard.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/video/eval/video_detail_description_eval_shard.sh -------------------------------------------------------------------------------- /scripts/video/train/SO400M_Qwen2_72B_ov_to_video_am9.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/video/train/SO400M_Qwen2_72B_ov_to_video_am9.sh -------------------------------------------------------------------------------- /scripts/video/train/SO400M_Qwen2_7B_ov_to_video_am9.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/video/train/SO400M_Qwen2_7B_ov_to_video_am9.sh -------------------------------------------------------------------------------- /scripts/video/train/exp.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/video/train/exp.yaml -------------------------------------------------------------------------------- /scripts/zero2.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/zero2.json -------------------------------------------------------------------------------- /scripts/zero2_fused_adamw.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/zero2_fused_adamw.json -------------------------------------------------------------------------------- /scripts/zero2_new.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/zero2_new.json -------------------------------------------------------------------------------- /scripts/zero2_offload.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/zero2_offload.json -------------------------------------------------------------------------------- /scripts/zero2_old.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/zero2_old.json -------------------------------------------------------------------------------- /scripts/zero3.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/zero3.json -------------------------------------------------------------------------------- /scripts/zero3_offload.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/zero3_offload.json -------------------------------------------------------------------------------- /scripts/zero3pp.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/scripts/zero3pp.json -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/setup.py -------------------------------------------------------------------------------- /setup_train_env.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/setup_train_env.sh -------------------------------------------------------------------------------- /train.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/train.sh -------------------------------------------------------------------------------- /train_moonvit.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/train_moonvit.sh -------------------------------------------------------------------------------- /trl/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/__init__.py -------------------------------------------------------------------------------- /trl/__pycache__/__init__.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/__pycache__/__init__.cpython-310.pyc -------------------------------------------------------------------------------- /trl/__pycache__/core.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/__pycache__/core.cpython-310.pyc -------------------------------------------------------------------------------- /trl/__pycache__/import_utils.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/__pycache__/import_utils.cpython-310.pyc -------------------------------------------------------------------------------- /trl/core.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/core.py -------------------------------------------------------------------------------- /trl/environment/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/environment/__init__.py -------------------------------------------------------------------------------- /trl/environment/__pycache__/__init__.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/environment/__pycache__/__init__.cpython-310.pyc -------------------------------------------------------------------------------- /trl/environment/__pycache__/base_environment.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/environment/__pycache__/base_environment.cpython-310.pyc -------------------------------------------------------------------------------- /trl/environment/base_environment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/environment/base_environment.py -------------------------------------------------------------------------------- /trl/extras/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/extras/__init__.py -------------------------------------------------------------------------------- /trl/extras/__pycache__/__init__.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/extras/__pycache__/__init__.cpython-310.pyc -------------------------------------------------------------------------------- /trl/extras/__pycache__/best_of_n_sampler.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/extras/__pycache__/best_of_n_sampler.cpython-310.pyc -------------------------------------------------------------------------------- /trl/extras/__pycache__/dataset_formatting.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/extras/__pycache__/dataset_formatting.cpython-310.pyc -------------------------------------------------------------------------------- /trl/extras/best_of_n_sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/extras/best_of_n_sampler.py -------------------------------------------------------------------------------- /trl/extras/dataset_formatting.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/extras/dataset_formatting.py -------------------------------------------------------------------------------- /trl/import_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/import_utils.py -------------------------------------------------------------------------------- /trl/models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/models/__init__.py -------------------------------------------------------------------------------- /trl/models/__pycache__/__init__.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/models/__pycache__/__init__.cpython-310.pyc -------------------------------------------------------------------------------- /trl/models/__pycache__/modeling_base.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/models/__pycache__/modeling_base.cpython-310.pyc -------------------------------------------------------------------------------- /trl/models/__pycache__/modeling_value_head.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/models/__pycache__/modeling_value_head.cpython-310.pyc -------------------------------------------------------------------------------- /trl/models/__pycache__/utils.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/models/__pycache__/utils.cpython-310.pyc -------------------------------------------------------------------------------- /trl/models/modeling_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/models/modeling_base.py -------------------------------------------------------------------------------- /trl/models/modeling_sd_base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/models/modeling_sd_base.py -------------------------------------------------------------------------------- /trl/models/modeling_value_head.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/models/modeling_value_head.py -------------------------------------------------------------------------------- /trl/models/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/models/utils.py -------------------------------------------------------------------------------- /trl/trainer/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/__init__.py -------------------------------------------------------------------------------- /trl/trainer/__pycache__/__init__.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/__pycache__/__init__.cpython-310.pyc -------------------------------------------------------------------------------- /trl/trainer/__pycache__/base.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/__pycache__/base.cpython-310.pyc -------------------------------------------------------------------------------- /trl/trainer/__pycache__/ddpo_config.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/__pycache__/ddpo_config.cpython-310.pyc -------------------------------------------------------------------------------- /trl/trainer/__pycache__/dpo_trainer.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/__pycache__/dpo_trainer.cpython-310.pyc -------------------------------------------------------------------------------- /trl/trainer/__pycache__/iterative_sft_trainer.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/__pycache__/iterative_sft_trainer.cpython-310.pyc -------------------------------------------------------------------------------- /trl/trainer/__pycache__/model_config.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/__pycache__/model_config.cpython-310.pyc -------------------------------------------------------------------------------- /trl/trainer/__pycache__/ppo_config.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/__pycache__/ppo_config.cpython-310.pyc -------------------------------------------------------------------------------- /trl/trainer/__pycache__/ppo_trainer.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/__pycache__/ppo_trainer.cpython-310.pyc -------------------------------------------------------------------------------- /trl/trainer/__pycache__/reward_config.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/__pycache__/reward_config.cpython-310.pyc -------------------------------------------------------------------------------- /trl/trainer/__pycache__/reward_trainer.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/__pycache__/reward_trainer.cpython-310.pyc -------------------------------------------------------------------------------- /trl/trainer/__pycache__/sft_trainer.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/__pycache__/sft_trainer.cpython-310.pyc -------------------------------------------------------------------------------- /trl/trainer/__pycache__/utils.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/__pycache__/utils.cpython-310.pyc -------------------------------------------------------------------------------- /trl/trainer/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/base.py -------------------------------------------------------------------------------- /trl/trainer/ddpo_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/ddpo_config.py -------------------------------------------------------------------------------- /trl/trainer/ddpo_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/ddpo_trainer.py -------------------------------------------------------------------------------- /trl/trainer/dpo_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/dpo_trainer.py -------------------------------------------------------------------------------- /trl/trainer/iterative_sft_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/iterative_sft_trainer.py -------------------------------------------------------------------------------- /trl/trainer/model_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/model_config.py -------------------------------------------------------------------------------- /trl/trainer/ppo_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/ppo_config.py -------------------------------------------------------------------------------- /trl/trainer/ppo_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/ppo_trainer.py -------------------------------------------------------------------------------- /trl/trainer/reward_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/reward_config.py -------------------------------------------------------------------------------- /trl/trainer/reward_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/reward_trainer.py -------------------------------------------------------------------------------- /trl/trainer/sft_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/sft_trainer.py -------------------------------------------------------------------------------- /trl/trainer/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/thunlp/LLaVA-UHD/HEAD/trl/trainer/utils.py --------------------------------------------------------------------------------