├── test ├── lmms_eval │ ├── __init__.py │ ├── api │ │ ├── __init__.py │ │ ├── instance.py │ │ ├── filter.py │ │ ├── samplers.py │ │ ├── group.py │ │ ├── registry.py │ │ └── model.py │ ├── caching │ │ ├── __init__.py │ │ └── cache.py │ ├── models │ │ ├── model_utils │ │ │ ├── __init__.py │ │ │ ├── __pycache__ │ │ │ │ ├── __init__.cpython-310.pyc │ │ │ │ ├── __init__.cpython-312.pyc │ │ │ │ ├── load_video.cpython-310.pyc │ │ │ │ └── load_video.cpython-312.pyc │ │ │ ├── audio_processing.py │ │ │ └── load_video.py │ │ ├── video_chatgpt │ │ │ ├── eval │ │ │ │ ├── __init__.py │ │ │ │ └── model_utils.py │ │ │ ├── __init__.py │ │ │ ├── model │ │ │ │ ├── __init__.py │ │ │ │ ├── consolidate.py │ │ │ │ ├── utils.py │ │ │ │ └── make_delta.py │ │ │ ├── constants.py │ │ │ ├── utils.py │ │ │ ├── video_conversation.py │ │ │ ├── single_video_inference.py │ │ │ └── inference.py │ │ ├── mplug_owl_video │ │ │ ├── tokenization_mplug_owl.py │ │ │ └── __init__.py │ │ ├── __init__.py │ │ ├── from_log.py │ │ ├── whisper_vllm.py │ │ ├── qwen_vl_api.py │ │ ├── llava_sglang.py │ │ ├── xcomposer2d5.py │ │ ├── reka.py │ │ └── batch_gpt4.py │ ├── tasks │ │ ├── _task_utils │ │ │ ├── gpt_eval_utils.py │ │ │ ├── file_utils.py │ │ │ ├── video_loader.py │ │ │ └── vqa_eval_metric.py │ │ ├── mindcube │ │ │ ├── mindcube_qwen.yaml │ │ │ ├── mindcube.yaml │ │ │ ├── mindcube_robo.yaml │ │ │ └── utils.py │ │ ├── omni3d_bench │ │ │ ├── omni3d_bench_qwen.yaml │ │ │ ├── omni3d_bench.yaml │ │ │ ├── omni3d_bench_robo.yaml │ │ │ └── utils.py │ │ ├── super_clevr │ │ │ ├── super_clevr_qwen.yaml │ │ │ ├── super_clevr.yaml │ │ │ ├── super_clevr_robo.yaml │ │ │ └── utils.py │ │ └── vsibench │ │ │ ├── vsibench.yaml │ │ │ ├── vsibench_robo.yaml │ │ │ ├── vsibench_qwen.yaml │ │ │ └── utils.py │ ├── loggers │ │ ├── __init__.py │ │ └── utils.py │ └── filters │ │ ├── decontamination.py │ │ ├── transformation.py │ │ ├── __init__.py │ │ └── selection.py ├── eval_robo.sh ├── eval_euclid.sh ├── eval_qwen.sh └── LICENSE ├── 
assert ├── arch.png ├── eval.png └── gain.png ├── requirements.txt ├── train ├── math.jinja ├── euclid.py ├── dist_train.sh ├── config.yaml ├── math.py └── model_merger.py └── README.md /test/lmms_eval/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /test/lmms_eval/api/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /test/lmms_eval/caching/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /test/lmms_eval/models/model_utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /test/lmms_eval/models/video_chatgpt/eval/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /test/lmms_eval/tasks/_task_utils/gpt_eval_utils.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /assert/arch.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/LiamLian0727/Euclids_Gift/HEAD/assert/arch.png -------------------------------------------------------------------------------- /assert/eval.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/LiamLian0727/Euclids_Gift/HEAD/assert/eval.png -------------------------------------------------------------------------------- /assert/gain.png: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/LiamLian0727/Euclids_Gift/HEAD/assert/gain.png -------------------------------------------------------------------------------- /test/lmms_eval/models/video_chatgpt/__init__.py: -------------------------------------------------------------------------------- 1 | from .model import VideoChatGPTLlamaForCausalLM 2 | -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- 1 | datasets>=4.1.1 2 | geo_evalute@git+https://github.com/LiamLian0727/geo_evalute.git@main -------------------------------------------------------------------------------- /test/lmms_eval/loggers/__init__.py: -------------------------------------------------------------------------------- 1 | from .evaluation_tracker import EvaluationTracker 2 | from .wandb_logger import WandbLogger 3 | -------------------------------------------------------------------------------- /test/lmms_eval/models/video_chatgpt/model/__init__.py: -------------------------------------------------------------------------------- 1 | from lmms_eval.models.video_chatgpt.model.video_chatgpt import ( 2 | VideoChatGPTConfig, 3 | VideoChatGPTLlamaForCausalLM, 4 | ) 5 | -------------------------------------------------------------------------------- /test/lmms_eval/models/model_utils/__pycache__/__init__.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/LiamLian0727/Euclids_Gift/HEAD/test/lmms_eval/models/model_utils/__pycache__/__init__.cpython-310.pyc -------------------------------------------------------------------------------- /test/lmms_eval/models/model_utils/__pycache__/__init__.cpython-312.pyc: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/LiamLian0727/Euclids_Gift/HEAD/test/lmms_eval/models/model_utils/__pycache__/__init__.cpython-312.pyc -------------------------------------------------------------------------------- /test/lmms_eval/models/model_utils/__pycache__/load_video.cpython-310.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/LiamLian0727/Euclids_Gift/HEAD/test/lmms_eval/models/model_utils/__pycache__/load_video.cpython-310.pyc -------------------------------------------------------------------------------- /test/lmms_eval/models/model_utils/__pycache__/load_video.cpython-312.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/LiamLian0727/Euclids_Gift/HEAD/test/lmms_eval/models/model_utils/__pycache__/load_video.cpython-312.pyc -------------------------------------------------------------------------------- /train/math.jinja: -------------------------------------------------------------------------------- 1 | {{ content | trim }} You FIRST think about the reasoning process as an internal monologue and then provide the final answer. The reasoning process MUST BE enclosed within <think> </think> tags. The final answer MUST BE put in \boxed{}. 
2 | -------------------------------------------------------------------------------- /test/lmms_eval/tasks/_task_utils/file_utils.py: -------------------------------------------------------------------------------- 1 | import os 2 | 3 | 4 | def generate_submission_file(file_name, args, subpath="submissions"): 5 | path = os.path.join(args.output_path, subpath) 6 | os.makedirs(path, exist_ok=True) 7 | path = os.path.join(path, file_name) 8 | return os.path.abspath(path) 9 | -------------------------------------------------------------------------------- /test/lmms_eval/models/video_chatgpt/constants.py: -------------------------------------------------------------------------------- 1 | CONTROLLER_HEART_BEAT_EXPIRATION = 30 2 | WORKER_HEART_BEAT_INTERVAL = 15 3 | 4 | LOGDIR = "." 5 | 6 | 7 | # Defining model 8 | DEFAULT_VIDEO_TOKEN = "