├── .asset ├── COCO.png ├── GD_GLIGEN.png ├── GD_SD.png ├── ODinW.png ├── arch.png ├── cat_dog.jpeg ├── cats.png ├── grounding_dino_logo.png ├── hero_figure.png ├── model_explan1.PNG └── model_explan2.PNG ├── .gitignore ├── EVALUATION.md ├── LICENSE ├── README.md ├── config.py ├── configs ├── evaluation_config.yaml ├── test_config.yaml └── train_config.yaml ├── demo ├── create_coco_dataset.py ├── gradio_app.py ├── image_editing_with_groundingdino_gligen.ipynb ├── image_editing_with_groundingdino_stablediffusion.ipynb ├── inference_on_a_image.py └── test_ap_on_coco.py ├── evaluate.py ├── groundingdino ├── __init__.py ├── config │ ├── GroundingDINO_SwinB_cfg.py │ ├── GroundingDINO_SwinT_OGC.py │ └── __init__.py ├── datasets │ ├── __init__.py │ ├── cocogrounding_eval.py │ ├── dataset.py │ └── transforms.py ├── models │ ├── GroundingDINO │ │ ├── __init__.py │ │ ├── backbone │ │ │ ├── __init__.py │ │ │ ├── backbone.py │ │ │ ├── position_encoding.py │ │ │ └── swin_transformer.py │ │ ├── bertwarper.py │ │ ├── csrc │ │ │ ├── MsDeformAttn │ │ │ │ ├── ms_deform_attn.h │ │ │ │ ├── ms_deform_attn_cpu.cpp │ │ │ │ ├── ms_deform_attn_cpu.h │ │ │ │ ├── ms_deform_attn_cuda.cu │ │ │ │ ├── ms_deform_attn_cuda.h │ │ │ │ └── ms_deform_im2col_cuda.cuh │ │ │ ├── cuda_version.cu │ │ │ └── vision.cpp │ │ ├── fuse_modules.py │ │ ├── groundingdino.py │ │ ├── ms_deform_attn.py │ │ ├── transformer.py │ │ ├── transformer_vanilla.py │ │ └── utils.py │ ├── __init__.py │ └── registry.py ├── util │ ├── __init__.py │ ├── box_ops.py │ ├── class_loss.py │ ├── evaluation.py │ ├── get_tokenlizer.py │ ├── inference.py │ ├── logger.py │ ├── lora.py │ ├── losses.py │ ├── matchers.py │ ├── misc.py │ ├── model_utils.py │ ├── slconfig.py │ ├── slio.py │ ├── time_counter.py │ ├── train.py │ ├── utils.py │ ├── visualizer.py │ └── vl_utils.py └── version.py ├── misc └── convert_text_to_csv.py ├── requirements.txt ├── results ├── after_train_0.jpg ├── after_train_1.jpg ├── after_train_2.jpg ├── before_train_0.jpg ├── before_train_1.jpg └── before_train_2.jpg ├── setup.py ├── test.py └── train.py /.asset/COCO.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/.asset/COCO.png -------------------------------------------------------------------------------- /.asset/GD_GLIGEN.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/.asset/GD_GLIGEN.png -------------------------------------------------------------------------------- /.asset/GD_SD.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/.asset/GD_SD.png -------------------------------------------------------------------------------- /.asset/ODinW.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/.asset/ODinW.png -------------------------------------------------------------------------------- /.asset/arch.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/.asset/arch.png -------------------------------------------------------------------------------- /.asset/cat_dog.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/.asset/cat_dog.jpeg -------------------------------------------------------------------------------- /.asset/cats.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/.asset/cats.png -------------------------------------------------------------------------------- /.asset/grounding_dino_logo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/.asset/grounding_dino_logo.png -------------------------------------------------------------------------------- /.asset/hero_figure.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/.asset/hero_figure.png -------------------------------------------------------------------------------- /.asset/model_explan1.PNG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/.asset/model_explan1.PNG -------------------------------------------------------------------------------- /.asset/model_explan2.PNG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/.asset/model_explan2.PNG -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/.gitignore -------------------------------------------------------------------------------- /EVALUATION.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/EVALUATION.md -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/README.md -------------------------------------------------------------------------------- /config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/config.py -------------------------------------------------------------------------------- /configs/evaluation_config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/configs/evaluation_config.yaml -------------------------------------------------------------------------------- /configs/test_config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/configs/test_config.yaml -------------------------------------------------------------------------------- /configs/train_config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/configs/train_config.yaml -------------------------------------------------------------------------------- /demo/create_coco_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/demo/create_coco_dataset.py -------------------------------------------------------------------------------- /demo/gradio_app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/demo/gradio_app.py -------------------------------------------------------------------------------- /demo/image_editing_with_groundingdino_gligen.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/demo/image_editing_with_groundingdino_gligen.ipynb -------------------------------------------------------------------------------- /demo/image_editing_with_groundingdino_stablediffusion.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/demo/image_editing_with_groundingdino_stablediffusion.ipynb -------------------------------------------------------------------------------- /demo/inference_on_a_image.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/demo/inference_on_a_image.py -------------------------------------------------------------------------------- /demo/test_ap_on_coco.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/demo/test_ap_on_coco.py -------------------------------------------------------------------------------- /evaluate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/evaluate.py -------------------------------------------------------------------------------- /groundingdino/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /groundingdino/config/GroundingDINO_SwinB_cfg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/config/GroundingDINO_SwinB_cfg.py -------------------------------------------------------------------------------- /groundingdino/config/GroundingDINO_SwinT_OGC.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/config/GroundingDINO_SwinT_OGC.py -------------------------------------------------------------------------------- /groundingdino/config/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /groundingdino/datasets/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /groundingdino/datasets/cocogrounding_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/datasets/cocogrounding_eval.py -------------------------------------------------------------------------------- /groundingdino/datasets/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/datasets/dataset.py -------------------------------------------------------------------------------- /groundingdino/datasets/transforms.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/datasets/transforms.py -------------------------------------------------------------------------------- /groundingdino/models/GroundingDINO/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/models/GroundingDINO/__init__.py -------------------------------------------------------------------------------- /groundingdino/models/GroundingDINO/backbone/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/models/GroundingDINO/backbone/__init__.py -------------------------------------------------------------------------------- /groundingdino/models/GroundingDINO/backbone/backbone.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/models/GroundingDINO/backbone/backbone.py -------------------------------------------------------------------------------- /groundingdino/models/GroundingDINO/backbone/position_encoding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/models/GroundingDINO/backbone/position_encoding.py -------------------------------------------------------------------------------- /groundingdino/models/GroundingDINO/backbone/swin_transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/models/GroundingDINO/backbone/swin_transformer.py -------------------------------------------------------------------------------- /groundingdino/models/GroundingDINO/bertwarper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/models/GroundingDINO/bertwarper.py -------------------------------------------------------------------------------- /groundingdino/models/GroundingDINO/csrc/MsDeformAttn/ms_deform_attn.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/models/GroundingDINO/csrc/MsDeformAttn/ms_deform_attn.h -------------------------------------------------------------------------------- /groundingdino/models/GroundingDINO/csrc/MsDeformAttn/ms_deform_attn_cpu.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/models/GroundingDINO/csrc/MsDeformAttn/ms_deform_attn_cpu.cpp -------------------------------------------------------------------------------- /groundingdino/models/GroundingDINO/csrc/MsDeformAttn/ms_deform_attn_cpu.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/models/GroundingDINO/csrc/MsDeformAttn/ms_deform_attn_cpu.h -------------------------------------------------------------------------------- /groundingdino/models/GroundingDINO/csrc/MsDeformAttn/ms_deform_attn_cuda.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/models/GroundingDINO/csrc/MsDeformAttn/ms_deform_attn_cuda.cu -------------------------------------------------------------------------------- /groundingdino/models/GroundingDINO/csrc/MsDeformAttn/ms_deform_attn_cuda.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/models/GroundingDINO/csrc/MsDeformAttn/ms_deform_attn_cuda.h -------------------------------------------------------------------------------- /groundingdino/models/GroundingDINO/csrc/MsDeformAttn/ms_deform_im2col_cuda.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/models/GroundingDINO/csrc/MsDeformAttn/ms_deform_im2col_cuda.cuh -------------------------------------------------------------------------------- /groundingdino/models/GroundingDINO/csrc/cuda_version.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/models/GroundingDINO/csrc/cuda_version.cu -------------------------------------------------------------------------------- /groundingdino/models/GroundingDINO/csrc/vision.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/models/GroundingDINO/csrc/vision.cpp -------------------------------------------------------------------------------- /groundingdino/models/GroundingDINO/fuse_modules.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/models/GroundingDINO/fuse_modules.py -------------------------------------------------------------------------------- /groundingdino/models/GroundingDINO/groundingdino.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/models/GroundingDINO/groundingdino.py -------------------------------------------------------------------------------- /groundingdino/models/GroundingDINO/ms_deform_attn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/models/GroundingDINO/ms_deform_attn.py -------------------------------------------------------------------------------- /groundingdino/models/GroundingDINO/transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/models/GroundingDINO/transformer.py -------------------------------------------------------------------------------- /groundingdino/models/GroundingDINO/transformer_vanilla.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/models/GroundingDINO/transformer_vanilla.py -------------------------------------------------------------------------------- /groundingdino/models/GroundingDINO/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/models/GroundingDINO/utils.py -------------------------------------------------------------------------------- /groundingdino/models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/models/__init__.py -------------------------------------------------------------------------------- /groundingdino/models/registry.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/models/registry.py -------------------------------------------------------------------------------- /groundingdino/util/__init__.py: -------------------------------------------------------------------------------- 1 | # Copyright (c) Facebook, Inc. and its affiliates. All Rights Reserved 2 | -------------------------------------------------------------------------------- /groundingdino/util/box_ops.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/util/box_ops.py -------------------------------------------------------------------------------- /groundingdino/util/class_loss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/util/class_loss.py -------------------------------------------------------------------------------- /groundingdino/util/evaluation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/util/evaluation.py -------------------------------------------------------------------------------- /groundingdino/util/get_tokenlizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/util/get_tokenlizer.py -------------------------------------------------------------------------------- /groundingdino/util/inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/util/inference.py -------------------------------------------------------------------------------- /groundingdino/util/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/util/logger.py -------------------------------------------------------------------------------- /groundingdino/util/lora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/util/lora.py -------------------------------------------------------------------------------- /groundingdino/util/losses.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/util/losses.py -------------------------------------------------------------------------------- /groundingdino/util/matchers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/util/matchers.py -------------------------------------------------------------------------------- /groundingdino/util/misc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/util/misc.py -------------------------------------------------------------------------------- /groundingdino/util/model_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/util/model_utils.py -------------------------------------------------------------------------------- /groundingdino/util/slconfig.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/util/slconfig.py -------------------------------------------------------------------------------- /groundingdino/util/slio.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/util/slio.py -------------------------------------------------------------------------------- /groundingdino/util/time_counter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/util/time_counter.py -------------------------------------------------------------------------------- /groundingdino/util/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/util/train.py -------------------------------------------------------------------------------- /groundingdino/util/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/util/utils.py -------------------------------------------------------------------------------- /groundingdino/util/visualizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/util/visualizer.py -------------------------------------------------------------------------------- /groundingdino/util/vl_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/groundingdino/util/vl_utils.py -------------------------------------------------------------------------------- /groundingdino/version.py: -------------------------------------------------------------------------------- 1 | __version__ = '0.1.0' 2 | -------------------------------------------------------------------------------- /misc/convert_text_to_csv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/misc/convert_text_to_csv.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/requirements.txt -------------------------------------------------------------------------------- /results/after_train_0.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/results/after_train_0.jpg -------------------------------------------------------------------------------- /results/after_train_1.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/results/after_train_1.jpg -------------------------------------------------------------------------------- /results/after_train_2.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/results/after_train_2.jpg -------------------------------------------------------------------------------- /results/before_train_0.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/results/before_train_0.jpg -------------------------------------------------------------------------------- /results/before_train_1.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/results/before_train_1.jpg -------------------------------------------------------------------------------- /results/before_train_2.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/results/before_train_2.jpg -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/setup.py -------------------------------------------------------------------------------- /test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/test.py -------------------------------------------------------------------------------- /train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/levy-tech-spark/AViD/HEAD/train.py --------------------------------------------------------------------------------