├── DAMSMencoders └── .gitignore ├── Framework.pdf ├── LICENSE ├── README.md ├── Xu_AttnGAN_Fine-Grained_Text_CVPR_2018_paper.pdf ├── code ├── .gitignore ├── GlobalAttention.py ├── bird.wav ├── cfg │ ├── DAMSM │ │ ├── bird.yml │ │ └── coco.yml │ ├── bird_attn2.yml │ ├── bird_attnDCGAN2.yml │ ├── coco_attn2.yml │ ├── eval_bird.yml │ ├── eval_bird_attnDCGAN2.yml │ └── eval_coco.yml ├── config.py ├── datasets.py ├── gui.py ├── ixtoword.txt ├── main.py ├── miscc │ ├── __init__.py │ ├── config.py │ ├── losses.py │ └── utils.py ├── model.py ├── pictures │ ├── Backgrounds_bird.jpg │ ├── computer.png │ ├── exit.png │ ├── logout.png │ ├── monitor.png │ ├── ok.png │ ├── play.png │ ├── speak.png │ └── stop.png ├── pretrain_DAMSM.py ├── recording.py └── trainer.py ├── data └── .gitignore ├── framework.png ├── howtouse1.jpg ├── howtouse2.png ├── howtouse3.png ├── howtouse4.png ├── models └── .gitignore ├── report.pdf └── sample.png /DAMSMencoders/.gitignore: -------------------------------------------------------------------------------- 1 | * 2 | !.gitignore 3 | -------------------------------------------------------------------------------- /Framework.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/Framework.pdf -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/README.md -------------------------------------------------------------------------------- /Xu_AttnGAN_Fine-Grained_Text_CVPR_2018_paper.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/Xu_AttnGAN_Fine-Grained_Text_CVPR_2018_paper.pdf -------------------------------------------------------------------------------- /code/.gitignore: -------------------------------------------------------------------------------- 1 | *.pyc 2 | !.gitignore -------------------------------------------------------------------------------- /code/GlobalAttention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/GlobalAttention.py -------------------------------------------------------------------------------- /code/bird.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/bird.wav -------------------------------------------------------------------------------- /code/cfg/DAMSM/bird.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/cfg/DAMSM/bird.yml -------------------------------------------------------------------------------- /code/cfg/DAMSM/coco.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/cfg/DAMSM/coco.yml -------------------------------------------------------------------------------- /code/cfg/bird_attn2.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/cfg/bird_attn2.yml -------------------------------------------------------------------------------- /code/cfg/bird_attnDCGAN2.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/cfg/bird_attnDCGAN2.yml -------------------------------------------------------------------------------- /code/cfg/coco_attn2.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/cfg/coco_attn2.yml -------------------------------------------------------------------------------- /code/cfg/eval_bird.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/cfg/eval_bird.yml -------------------------------------------------------------------------------- /code/cfg/eval_bird_attnDCGAN2.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/cfg/eval_bird_attnDCGAN2.yml -------------------------------------------------------------------------------- /code/cfg/eval_coco.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/cfg/eval_coco.yml -------------------------------------------------------------------------------- /code/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/config.py -------------------------------------------------------------------------------- /code/datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/datasets.py -------------------------------------------------------------------------------- /code/gui.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/gui.py -------------------------------------------------------------------------------- /code/ixtoword.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/ixtoword.txt -------------------------------------------------------------------------------- /code/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/main.py -------------------------------------------------------------------------------- /code/miscc/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/miscc/__init__.py -------------------------------------------------------------------------------- /code/miscc/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/miscc/config.py -------------------------------------------------------------------------------- /code/miscc/losses.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/miscc/losses.py -------------------------------------------------------------------------------- /code/miscc/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/miscc/utils.py -------------------------------------------------------------------------------- /code/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/model.py -------------------------------------------------------------------------------- /code/pictures/Backgrounds_bird.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/pictures/Backgrounds_bird.jpg -------------------------------------------------------------------------------- /code/pictures/computer.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/pictures/computer.png -------------------------------------------------------------------------------- /code/pictures/exit.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/pictures/exit.png -------------------------------------------------------------------------------- /code/pictures/logout.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/pictures/logout.png -------------------------------------------------------------------------------- /code/pictures/monitor.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/pictures/monitor.png -------------------------------------------------------------------------------- /code/pictures/ok.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/pictures/ok.png -------------------------------------------------------------------------------- /code/pictures/play.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/pictures/play.png -------------------------------------------------------------------------------- /code/pictures/speak.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/pictures/speak.png -------------------------------------------------------------------------------- /code/pictures/stop.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/pictures/stop.png -------------------------------------------------------------------------------- /code/pretrain_DAMSM.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/pretrain_DAMSM.py -------------------------------------------------------------------------------- /code/recording.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/recording.py -------------------------------------------------------------------------------- /code/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/code/trainer.py -------------------------------------------------------------------------------- /data/.gitignore: -------------------------------------------------------------------------------- 1 | * 2 | !.gitignore 3 | -------------------------------------------------------------------------------- /framework.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/framework.png -------------------------------------------------------------------------------- /howtouse1.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/howtouse1.jpg -------------------------------------------------------------------------------- /howtouse2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/howtouse2.png -------------------------------------------------------------------------------- /howtouse3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/howtouse3.png -------------------------------------------------------------------------------- /howtouse4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/howtouse4.png -------------------------------------------------------------------------------- /models/.gitignore: -------------------------------------------------------------------------------- 1 | * 2 | !README.md 3 | !.gitignore -------------------------------------------------------------------------------- /report.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/report.pdf -------------------------------------------------------------------------------- /sample.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/csyan5/AttnGAN-Audio-to-image-geneation/HEAD/sample.png --------------------------------------------------------------------------------