├── .gitignore ├── README.md ├── assets ├── example_video_lvd_gligen_zeroscope.gif ├── example_video_lvd_zeroscope.gif └── example_video_zeroscope_baseline.gif ├── cache ├── cache_demo_v0.1_gpt-4-1106-preview.json ├── cache_lvd_v0.1_gpt-3.5-turbo.json └── cache_lvd_v0.1_gpt-4-1106-preview.json ├── generate.py ├── generation ├── lvd.py ├── lvd_gligen.py ├── lvd_plus.py ├── modelscope_dpm.py └── zeroscope_dpm.py ├── models ├── __init__.py ├── attention.py ├── attention_processor.py ├── controllable_pipeline_text_to_video_synth.py ├── models.py ├── pipelines.py ├── transformer_2d.py ├── transformer_temporal.py ├── unet_2d_blocks.py ├── unet_2d_condition.py ├── unet_3d_blocks.py └── unet_3d_condition.py ├── prompt.py ├── prompt_batch.py ├── requirements.txt ├── scripts ├── eval_owl_vit.py ├── eval_stage_one.py └── upsample.py └── utils ├── __init__.py ├── attn.py ├── cache.py ├── eval ├── __init__.py ├── eval.py ├── lvd.py └── utils.py ├── guidance.py ├── latents.py ├── llm.py ├── parse.py ├── schedule.py ├── utils.py └── vis.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/.gitignore -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/README.md -------------------------------------------------------------------------------- /assets/example_video_lvd_gligen_zeroscope.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/assets/example_video_lvd_gligen_zeroscope.gif -------------------------------------------------------------------------------- /assets/example_video_lvd_zeroscope.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/assets/example_video_lvd_zeroscope.gif -------------------------------------------------------------------------------- /assets/example_video_zeroscope_baseline.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/assets/example_video_zeroscope_baseline.gif -------------------------------------------------------------------------------- /cache/cache_demo_v0.1_gpt-4-1106-preview.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/cache/cache_demo_v0.1_gpt-4-1106-preview.json -------------------------------------------------------------------------------- /cache/cache_lvd_v0.1_gpt-3.5-turbo.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/cache/cache_lvd_v0.1_gpt-3.5-turbo.json -------------------------------------------------------------------------------- /cache/cache_lvd_v0.1_gpt-4-1106-preview.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/cache/cache_lvd_v0.1_gpt-4-1106-preview.json -------------------------------------------------------------------------------- /generate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/generate.py -------------------------------------------------------------------------------- /generation/lvd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/generation/lvd.py -------------------------------------------------------------------------------- /generation/lvd_gligen.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/generation/lvd_gligen.py -------------------------------------------------------------------------------- /generation/lvd_plus.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/generation/lvd_plus.py -------------------------------------------------------------------------------- /generation/modelscope_dpm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/generation/modelscope_dpm.py -------------------------------------------------------------------------------- /generation/zeroscope_dpm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/generation/zeroscope_dpm.py -------------------------------------------------------------------------------- /models/__init__.py: -------------------------------------------------------------------------------- 1 | from .models import * 2 | -------------------------------------------------------------------------------- /models/attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/models/attention.py -------------------------------------------------------------------------------- /models/attention_processor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/models/attention_processor.py -------------------------------------------------------------------------------- /models/controllable_pipeline_text_to_video_synth.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/models/controllable_pipeline_text_to_video_synth.py -------------------------------------------------------------------------------- /models/models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/models/models.py -------------------------------------------------------------------------------- /models/pipelines.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/models/pipelines.py -------------------------------------------------------------------------------- /models/transformer_2d.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/models/transformer_2d.py -------------------------------------------------------------------------------- /models/transformer_temporal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/models/transformer_temporal.py -------------------------------------------------------------------------------- /models/unet_2d_blocks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/models/unet_2d_blocks.py -------------------------------------------------------------------------------- /models/unet_2d_condition.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/models/unet_2d_condition.py -------------------------------------------------------------------------------- /models/unet_3d_blocks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/models/unet_3d_blocks.py -------------------------------------------------------------------------------- /models/unet_3d_condition.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/models/unet_3d_condition.py -------------------------------------------------------------------------------- /prompt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/prompt.py -------------------------------------------------------------------------------- /prompt_batch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/prompt_batch.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/requirements.txt -------------------------------------------------------------------------------- /scripts/eval_owl_vit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/scripts/eval_owl_vit.py -------------------------------------------------------------------------------- /scripts/eval_stage_one.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/scripts/eval_stage_one.py -------------------------------------------------------------------------------- /scripts/upsample.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/scripts/upsample.py -------------------------------------------------------------------------------- /utils/__init__.py: -------------------------------------------------------------------------------- 1 | from .utils import * 2 | -------------------------------------------------------------------------------- /utils/attn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/utils/attn.py -------------------------------------------------------------------------------- /utils/cache.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/utils/cache.py -------------------------------------------------------------------------------- /utils/eval/__init__.py: -------------------------------------------------------------------------------- 1 | from .eval import * 2 | -------------------------------------------------------------------------------- /utils/eval/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/utils/eval/eval.py -------------------------------------------------------------------------------- /utils/eval/lvd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/utils/eval/lvd.py -------------------------------------------------------------------------------- /utils/eval/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/utils/eval/utils.py -------------------------------------------------------------------------------- /utils/guidance.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/utils/guidance.py -------------------------------------------------------------------------------- /utils/latents.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/utils/latents.py -------------------------------------------------------------------------------- /utils/llm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/utils/llm.py -------------------------------------------------------------------------------- /utils/parse.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/utils/parse.py -------------------------------------------------------------------------------- /utils/schedule.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/utils/schedule.py -------------------------------------------------------------------------------- /utils/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/utils/utils.py -------------------------------------------------------------------------------- /utils/vis.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/TonyLianLong/LLM-groundedVideoDiffusion/HEAD/utils/vis.py --------------------------------------------------------------------------------