├── .gitignore ├── License.txt ├── README.md ├── assets ├── pref_grpo_pipeline.png └── pref_grpo_reward_hacking.png ├── data ├── unigenbench_test_data.csv ├── unigenbench_train_data.txt └── video_prompts.txt ├── env_setup.sh ├── fastvideo ├── data_preprocess │ ├── preprocess_flux_embedding.py │ ├── preprocess_flux_rl_embeddings.sh │ ├── preprocess_qwen_image_rl_embeddings.sh │ ├── preprocess_qwenimage_embedding.py │ ├── preprocess_wan_2_1_embeddings.py │ └── preprocess_wan_2_1_rl_embeddings.sh ├── dataset │ ├── __init__.py │ ├── latent_datasets.py │ ├── latent_flux_rl_datasets.py │ ├── latent_qwenimage_rl_datasets.py │ ├── latent_rl_datasets.py │ ├── latent_wan_2_1_rl_datasets.py │ ├── t2v_datasets.py │ └── transform.py ├── distill │ ├── __init__.py │ ├── discriminator.py │ └── solver.py ├── models │ ├── flash_attn_no_pad.py │ ├── flux_hf │ │ └── pipeline_flux.py │ ├── hunyuan │ │ ├── __init__.py │ │ ├── constants.py │ │ ├── diffusion │ │ │ ├── __init__.py │ │ │ ├── pipelines │ │ │ │ ├── __init__.py │ │ │ │ └── pipeline_hunyuan_video.py │ │ │ └── schedulers │ │ │ │ ├── __init__.py │ │ │ │ └── scheduling_flow_match_discrete.py │ │ ├── idle_config.py │ │ ├── inference.py │ │ ├── modules │ │ │ ├── __init__.py │ │ │ ├── activation_layers.py │ │ │ ├── attenion.py │ │ │ ├── embed_layers.py │ │ │ ├── mlp_layers.py │ │ │ ├── models.py │ │ │ ├── modulate_layers.py │ │ │ ├── norm_layers.py │ │ │ ├── posemb_layers.py │ │ │ └── token_refiner.py │ │ ├── prompt_rewrite.py │ │ ├── text_encoder │ │ │ └── __init__.py │ │ ├── utils │ │ │ ├── __init__.py │ │ │ ├── data_utils.py │ │ │ ├── file_utils.py │ │ │ ├── helpers.py │ │ │ └── preprocess_text_encoder_tokenizer_utils.py │ │ └── vae │ │ │ ├── __init__.py │ │ │ ├── autoencoder_kl_causal_3d.py │ │ │ ├── unet_causal_3d_blocks.py │ │ │ └── vae.py │ ├── hunyuan_hf │ │ ├── modeling_hunyuan.py │ │ └── pipeline_hunyuan.py │ ├── mochi_hf │ │ ├── convert_diffusers_to_mochi.py │ │ ├── mochi_latents_utils.py │ │ ├── modeling_mochi.py │ │ ├── norm.py │ │ └── pipeline_mochi.py │ └── stable_diffusion │ │ ├── ddim_with_logprob.py │ │ └── pipeline_with_logprob.py ├── train_flux_pref_grpo.py ├── train_flux_pref_grpo_lora.py ├── train_flux_unifiedreward.py ├── train_flux_unifiedreward_lora.py ├── train_qwenimage_pref_grpo.py ├── train_qwenimage_pref_grpo_lora.py ├── train_qwenimage_unifiedreward.py ├── train_qwenimage_unifiedreward_lora.py ├── train_wan_2_1_pref_grpo.py ├── train_wan_2_1_pref_grpo_lora.py └── utils │ ├── checkpoint.py │ ├── communications.py │ ├── communications_flux.py │ ├── dataset_utils.py │ ├── env_utils.py │ ├── fsdp_util.py │ ├── fsdp_util_qwenimage.py │ ├── load.py │ ├── logging_.py │ ├── optimizer.py │ ├── parallel_states.py │ └── validation.py ├── inference ├── flux_dist_infer.sh ├── flux_multi_node_inference.py ├── qwen_image_dist_infer.sh ├── qwen_image_multi_node_inference.py ├── wan_dist_infer.sh └── wan_multi_node_inference.py ├── pyproject.toml ├── requirements-lint.txt ├── scripts ├── finetune_prefgrpo_flux.sh ├── finetune_prefgrpo_flux_lora.sh ├── finetune_prefgrpo_qwenimage_grpo.sh ├── finetune_prefgrpo_qwenimage_grpo_lora.sh ├── finetune_prefgrpo_wan_2_1.sh ├── finetune_prefgrpo_wan_2_1_lora.sh ├── finetune_unifiedreward_flux.sh ├── finetune_unifiedreward_flux_lora.sh ├── finetune_unifiedreward_qwenimage_grpo.sh └── finetune_unifiedreward_qwenimage_grpo_lora.sh └── vllm_utils ├── vllm_request.py ├── vllm_server_UnifiedReward.sh └── vllm_server_UnifiedReward_Think.sh /.gitignore: -------------------------------------------------------------------------------- 1 | .DS_Store 2 | -------------------------------------------------------------------------------- /License.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/License.txt -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/README.md -------------------------------------------------------------------------------- /assets/pref_grpo_pipeline.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/assets/pref_grpo_pipeline.png -------------------------------------------------------------------------------- /assets/pref_grpo_reward_hacking.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/assets/pref_grpo_reward_hacking.png -------------------------------------------------------------------------------- /data/unigenbench_test_data.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/data/unigenbench_test_data.csv -------------------------------------------------------------------------------- /data/unigenbench_train_data.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/data/unigenbench_train_data.txt -------------------------------------------------------------------------------- /data/video_prompts.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/data/video_prompts.txt -------------------------------------------------------------------------------- /env_setup.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/env_setup.sh -------------------------------------------------------------------------------- /fastvideo/data_preprocess/preprocess_flux_embedding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/data_preprocess/preprocess_flux_embedding.py -------------------------------------------------------------------------------- /fastvideo/data_preprocess/preprocess_flux_rl_embeddings.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/data_preprocess/preprocess_flux_rl_embeddings.sh -------------------------------------------------------------------------------- /fastvideo/data_preprocess/preprocess_qwen_image_rl_embeddings.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/data_preprocess/preprocess_qwen_image_rl_embeddings.sh -------------------------------------------------------------------------------- /fastvideo/data_preprocess/preprocess_qwenimage_embedding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/data_preprocess/preprocess_qwenimage_embedding.py -------------------------------------------------------------------------------- /fastvideo/data_preprocess/preprocess_wan_2_1_embeddings.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/data_preprocess/preprocess_wan_2_1_embeddings.py -------------------------------------------------------------------------------- /fastvideo/data_preprocess/preprocess_wan_2_1_rl_embeddings.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/data_preprocess/preprocess_wan_2_1_rl_embeddings.sh -------------------------------------------------------------------------------- /fastvideo/dataset/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/dataset/__init__.py -------------------------------------------------------------------------------- /fastvideo/dataset/latent_datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/dataset/latent_datasets.py -------------------------------------------------------------------------------- /fastvideo/dataset/latent_flux_rl_datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/dataset/latent_flux_rl_datasets.py -------------------------------------------------------------------------------- /fastvideo/dataset/latent_qwenimage_rl_datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/dataset/latent_qwenimage_rl_datasets.py -------------------------------------------------------------------------------- /fastvideo/dataset/latent_rl_datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/dataset/latent_rl_datasets.py -------------------------------------------------------------------------------- /fastvideo/dataset/latent_wan_2_1_rl_datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/dataset/latent_wan_2_1_rl_datasets.py -------------------------------------------------------------------------------- /fastvideo/dataset/t2v_datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/dataset/t2v_datasets.py -------------------------------------------------------------------------------- /fastvideo/dataset/transform.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/dataset/transform.py -------------------------------------------------------------------------------- /fastvideo/distill/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /fastvideo/distill/discriminator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/distill/discriminator.py -------------------------------------------------------------------------------- /fastvideo/distill/solver.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/distill/solver.py -------------------------------------------------------------------------------- /fastvideo/models/flash_attn_no_pad.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/flash_attn_no_pad.py -------------------------------------------------------------------------------- /fastvideo/models/flux_hf/pipeline_flux.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/flux_hf/pipeline_flux.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/constants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/constants.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/diffusion/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/diffusion/__init__.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/diffusion/pipelines/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/diffusion/pipelines/__init__.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/diffusion/pipelines/pipeline_hunyuan_video.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/diffusion/pipelines/pipeline_hunyuan_video.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/diffusion/schedulers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/diffusion/schedulers/__init__.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/diffusion/schedulers/scheduling_flow_match_discrete.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/diffusion/schedulers/scheduling_flow_match_discrete.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/idle_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/idle_config.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/inference.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/modules/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/modules/__init__.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/modules/activation_layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/modules/activation_layers.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/modules/attenion.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/modules/attenion.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/modules/embed_layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/modules/embed_layers.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/modules/mlp_layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/modules/mlp_layers.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/modules/models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/modules/models.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/modules/modulate_layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/modules/modulate_layers.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/modules/norm_layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/modules/norm_layers.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/modules/posemb_layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/modules/posemb_layers.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/modules/token_refiner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/modules/token_refiner.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/prompt_rewrite.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/prompt_rewrite.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/text_encoder/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/text_encoder/__init__.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/utils/data_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/utils/data_utils.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/utils/file_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/utils/file_utils.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/utils/helpers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/utils/helpers.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/utils/preprocess_text_encoder_tokenizer_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/utils/preprocess_text_encoder_tokenizer_utils.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/vae/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/vae/__init__.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/vae/autoencoder_kl_causal_3d.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/vae/autoencoder_kl_causal_3d.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/vae/unet_causal_3d_blocks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/vae/unet_causal_3d_blocks.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan/vae/vae.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan/vae/vae.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan_hf/modeling_hunyuan.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan_hf/modeling_hunyuan.py -------------------------------------------------------------------------------- /fastvideo/models/hunyuan_hf/pipeline_hunyuan.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/hunyuan_hf/pipeline_hunyuan.py -------------------------------------------------------------------------------- /fastvideo/models/mochi_hf/convert_diffusers_to_mochi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/mochi_hf/convert_diffusers_to_mochi.py -------------------------------------------------------------------------------- /fastvideo/models/mochi_hf/mochi_latents_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/mochi_hf/mochi_latents_utils.py -------------------------------------------------------------------------------- /fastvideo/models/mochi_hf/modeling_mochi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/mochi_hf/modeling_mochi.py -------------------------------------------------------------------------------- /fastvideo/models/mochi_hf/norm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/mochi_hf/norm.py -------------------------------------------------------------------------------- /fastvideo/models/mochi_hf/pipeline_mochi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/mochi_hf/pipeline_mochi.py -------------------------------------------------------------------------------- /fastvideo/models/stable_diffusion/ddim_with_logprob.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/stable_diffusion/ddim_with_logprob.py -------------------------------------------------------------------------------- /fastvideo/models/stable_diffusion/pipeline_with_logprob.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/models/stable_diffusion/pipeline_with_logprob.py -------------------------------------------------------------------------------- /fastvideo/train_flux_pref_grpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/train_flux_pref_grpo.py -------------------------------------------------------------------------------- /fastvideo/train_flux_pref_grpo_lora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/train_flux_pref_grpo_lora.py -------------------------------------------------------------------------------- /fastvideo/train_flux_unifiedreward.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/train_flux_unifiedreward.py -------------------------------------------------------------------------------- /fastvideo/train_flux_unifiedreward_lora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/train_flux_unifiedreward_lora.py -------------------------------------------------------------------------------- /fastvideo/train_qwenimage_pref_grpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/train_qwenimage_pref_grpo.py -------------------------------------------------------------------------------- /fastvideo/train_qwenimage_pref_grpo_lora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/train_qwenimage_pref_grpo_lora.py -------------------------------------------------------------------------------- /fastvideo/train_qwenimage_unifiedreward.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/train_qwenimage_unifiedreward.py -------------------------------------------------------------------------------- /fastvideo/train_qwenimage_unifiedreward_lora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/train_qwenimage_unifiedreward_lora.py -------------------------------------------------------------------------------- /fastvideo/train_wan_2_1_pref_grpo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/train_wan_2_1_pref_grpo.py -------------------------------------------------------------------------------- /fastvideo/train_wan_2_1_pref_grpo_lora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/train_wan_2_1_pref_grpo_lora.py -------------------------------------------------------------------------------- /fastvideo/utils/checkpoint.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/utils/checkpoint.py -------------------------------------------------------------------------------- /fastvideo/utils/communications.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/utils/communications.py -------------------------------------------------------------------------------- /fastvideo/utils/communications_flux.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/utils/communications_flux.py -------------------------------------------------------------------------------- /fastvideo/utils/dataset_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/utils/dataset_utils.py -------------------------------------------------------------------------------- /fastvideo/utils/env_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/utils/env_utils.py -------------------------------------------------------------------------------- /fastvideo/utils/fsdp_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/utils/fsdp_util.py -------------------------------------------------------------------------------- /fastvideo/utils/fsdp_util_qwenimage.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/utils/fsdp_util_qwenimage.py -------------------------------------------------------------------------------- /fastvideo/utils/load.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/utils/load.py -------------------------------------------------------------------------------- /fastvideo/utils/logging_.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/utils/logging_.py -------------------------------------------------------------------------------- /fastvideo/utils/optimizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/utils/optimizer.py -------------------------------------------------------------------------------- /fastvideo/utils/parallel_states.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/utils/parallel_states.py -------------------------------------------------------------------------------- /fastvideo/utils/validation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/fastvideo/utils/validation.py -------------------------------------------------------------------------------- /inference/flux_dist_infer.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/inference/flux_dist_infer.sh -------------------------------------------------------------------------------- /inference/flux_multi_node_inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/inference/flux_multi_node_inference.py -------------------------------------------------------------------------------- /inference/qwen_image_dist_infer.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/inference/qwen_image_dist_infer.sh -------------------------------------------------------------------------------- /inference/qwen_image_multi_node_inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/inference/qwen_image_multi_node_inference.py -------------------------------------------------------------------------------- /inference/wan_dist_infer.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/inference/wan_dist_infer.sh -------------------------------------------------------------------------------- /inference/wan_multi_node_inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/inference/wan_multi_node_inference.py -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/pyproject.toml -------------------------------------------------------------------------------- /requirements-lint.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/requirements-lint.txt -------------------------------------------------------------------------------- /scripts/finetune_prefgrpo_flux.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/scripts/finetune_prefgrpo_flux.sh -------------------------------------------------------------------------------- /scripts/finetune_prefgrpo_flux_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/scripts/finetune_prefgrpo_flux_lora.sh -------------------------------------------------------------------------------- /scripts/finetune_prefgrpo_qwenimage_grpo.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/scripts/finetune_prefgrpo_qwenimage_grpo.sh -------------------------------------------------------------------------------- /scripts/finetune_prefgrpo_qwenimage_grpo_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/scripts/finetune_prefgrpo_qwenimage_grpo_lora.sh -------------------------------------------------------------------------------- /scripts/finetune_prefgrpo_wan_2_1.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/scripts/finetune_prefgrpo_wan_2_1.sh -------------------------------------------------------------------------------- /scripts/finetune_prefgrpo_wan_2_1_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/scripts/finetune_prefgrpo_wan_2_1_lora.sh -------------------------------------------------------------------------------- /scripts/finetune_unifiedreward_flux.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/scripts/finetune_unifiedreward_flux.sh -------------------------------------------------------------------------------- /scripts/finetune_unifiedreward_flux_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/scripts/finetune_unifiedreward_flux_lora.sh -------------------------------------------------------------------------------- /scripts/finetune_unifiedreward_qwenimage_grpo.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/scripts/finetune_unifiedreward_qwenimage_grpo.sh -------------------------------------------------------------------------------- /scripts/finetune_unifiedreward_qwenimage_grpo_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/scripts/finetune_unifiedreward_qwenimage_grpo_lora.sh -------------------------------------------------------------------------------- /vllm_utils/vllm_request.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/vllm_utils/vllm_request.py -------------------------------------------------------------------------------- /vllm_utils/vllm_server_UnifiedReward.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/vllm_utils/vllm_server_UnifiedReward.sh -------------------------------------------------------------------------------- /vllm_utils/vllm_server_UnifiedReward_Think.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/CodeGoat24/Pref-GRPO/HEAD/vllm_utils/vllm_server_UnifiedReward_Think.sh --------------------------------------------------------------------------------