├── demo
    ├── __init__.py
    ├── asgi.py
    ├── wsgi.py
    ├── urls.py
    └── settings.py
├── grad_cam
    ├── __init__.py
    ├── tests.py
    ├── static
    │   ├── images
    │   │   ├── img1.jpg
    │   │   ├── img2.jpg
    │   │   ├── img3.jpg
    │   │   ├── img4.jpg
    │   │   ├── img5.jpg
    │   │   ├── img6.jpg
    │   │   ├── network.png
    │   │   └── team
    │   │   │   ├── devi.jpg
    │   │   │   ├── rama.jpeg
    │   │   │   ├── abhishek.jpg
    │   │   │   ├── deshraj.png
    │   │   │   ├── michael.jpg
    │   │   │   ├── stefan.jpg
    │   │   │   └── dhruv_batra.jpg
    │   └── css
    │   │   └── style.css
    ├── templates
    │   ├── form.html
    │   ├── upload_image_url.html
    │   ├── header_content.html
    │   ├── result.html
    │   ├── index_new.html
    │   ├── home.html
    │   ├── home_new.html
    │   ├── index.html
    │   ├── captioning
    │   │   └── captioning.html
    │   ├── base.html
    │   ├── classification
    │   │   └── classification.html
    │   └── vqa
    │   │   └── vqa.html
    ├── routing.py
    ├── consumers.py
    ├── urls.py
    ├── utils.py
    ├── admin.py
    ├── models.py
    ├── constants.py
    ├── home.html
    ├── sender.py
    └── views.py
├── Docker
    ├── deploy.sh
    ├── run_server.sh
    └── GradCAM
    │   └── Dockerfile
├── .gitignore
├── .gitmodules
├── uwsgi.ini
├── requirements.txt
├── manage.py
├── uwsgi_params
├── misc
    ├── DeconvReLU.lua
    ├── GuidedBackpropReLU.lua
    ├── prepro_ques.py
    └── utils.lua
├── models
    └── download_models.sh
├── gradcam_nginx.conf
├── INSTALLATION.md
├── README.md
├── worker_captioning.py
├── worker_classify.py
├── worker_vqa.py
├── classification.lua
├── captioning.lua
└── visual_question_answering.lua


/demo/__init__.py:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/grad_cam/__init__.py:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/Docker/deploy.sh:
--------------------------------------------------------------------------------
1 | python manage.py runserver 0.0.0.0:8000
2 | 


--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
1 | models/*
2 | !models/download_models.sh
3 | *.pyc
4 | media/
5 | 


--------------------------------------------------------------------------------
/grad_cam/tests.py:
--------------------------------------------------------------------------------
1 | from django.test import TestCase
2 | 
3 | # Create your tests here.
4 | 


--------------------------------------------------------------------------------
/grad_cam/static/images/img1.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Cloud-CV/Grad-CAM/HEAD/grad_cam/static/images/img1.jpg


--------------------------------------------------------------------------------
/grad_cam/static/images/img2.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Cloud-CV/Grad-CAM/HEAD/grad_cam/static/images/img2.jpg


--------------------------------------------------------------------------------
/grad_cam/static/images/img3.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Cloud-CV/Grad-CAM/HEAD/grad_cam/static/images/img3.jpg


--------------------------------------------------------------------------------
/grad_cam/static/images/img4.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Cloud-CV/Grad-CAM/HEAD/grad_cam/static/images/img4.jpg


--------------------------------------------------------------------------------
/grad_cam/static/images/img5.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Cloud-CV/Grad-CAM/HEAD/grad_cam/static/images/img5.jpg


--------------------------------------------------------------------------------
/grad_cam/static/images/img6.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Cloud-CV/Grad-CAM/HEAD/grad_cam/static/images/img6.jpg


--------------------------------------------------------------------------------
/Docker/run_server.sh:
--------------------------------------------------------------------------------
1 | # Build the Grad-CAM image from ./GradCAM/ and start it as a detached container.
2 | docker build -t cloudcv/grad-cam ./GradCAM/
3 | # Run the tag built above; "GradCAM" was never built and is not a valid (lowercase) image name.
4 | docker run -d --name cloudcv_grad_cam cloudcv/grad-cam


--------------------------------------------------------------------------------
/grad_cam/static/images/network.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Cloud-CV/Grad-CAM/HEAD/grad_cam/static/images/network.png


--------------------------------------------------------------------------------
/grad_cam/static/images/team/devi.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Cloud-CV/Grad-CAM/HEAD/grad_cam/static/images/team/devi.jpg


--------------------------------------------------------------------------------
/grad_cam/static/images/team/rama.jpeg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Cloud-CV/Grad-CAM/HEAD/grad_cam/static/images/team/rama.jpeg


--------------------------------------------------------------------------------
/grad_cam/static/images/team/abhishek.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Cloud-CV/Grad-CAM/HEAD/grad_cam/static/images/team/abhishek.jpg


--------------------------------------------------------------------------------
/grad_cam/static/images/team/deshraj.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Cloud-CV/Grad-CAM/HEAD/grad_cam/static/images/team/deshraj.png


--------------------------------------------------------------------------------
/grad_cam/static/images/team/michael.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Cloud-CV/Grad-CAM/HEAD/grad_cam/static/images/team/michael.jpg


--------------------------------------------------------------------------------
/grad_cam/static/images/team/stefan.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Cloud-CV/Grad-CAM/HEAD/grad_cam/static/images/team/stefan.jpg


--------------------------------------------------------------------------------
/grad_cam/static/images/team/dhruv_batra.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Cloud-CV/Grad-CAM/HEAD/grad_cam/static/images/team/dhruv_batra.jpg


--------------------------------------------------------------------------------
/demo/asgi.py:
--------------------------------------------------------------------------------
1 | import os
2 | from channels.asgi import get_channel_layer
3 | # Default to the project settings unless DJANGO_SETTINGS_MODULE is already set in the environment.
4 | os.environ.setdefault("DJANGO_SETTINGS_MODULE", "demo.settings")
5 | # Module-level channel layer; presumably what the ASGI server (e.g. daphne) is pointed at - confirm.
6 | channel_layer = get_channel_layer()
7 | 


--------------------------------------------------------------------------------
/.gitmodules:
--------------------------------------------------------------------------------
1 | [submodule "VQA_LSTM_CNN"]
2 | 	path = VQA_LSTM_CNN
3 | 	url = https://github.com/VT-vision-lab/VQA_LSTM_CNN.git
4 | [submodule "neuraltalk2"]
5 | 	path = neuraltalk2
6 | 	url = https://github.com/karpathy/neuraltalk2.git
7 | 


--------------------------------------------------------------------------------
/grad_cam/templates/form.html:
--------------------------------------------------------------------------------
1 | <!-- Write the html code for the form that will be used for sending the input to the backend -->
2 |     <div class="dz-message" style="color:#0000;">
3 |       <h4>Drop files here or click to upload.</h4>
4 |     </div>


--------------------------------------------------------------------------------
/uwsgi.ini:
--------------------------------------------------------------------------------
 1 | [uwsgi]
 2 | 
 3 | chdir = /home/ubuntu/Projects/Grad-CAM
 4 | module = demo.wsgi:application
 5 | master = true
 6 | processes = 10
 7 | socket = 0.0.0.0:8001
 8 | vacuum = true
 9 | python-autoreload = 1
10 | # buffer-size=32768
11 | daemonize = /var/log/uwsgi/gradcam.log
12 | 


--------------------------------------------------------------------------------
/grad_cam/static/css/style.css:
--------------------------------------------------------------------------------
 1 | .brand-logo{
 2 | 	font-weight: 300;
 3 | }
 4 | 
 5 | .demo_img{
 6 | 	height: 300px !important;
 7 | 	padding: 6px;
 8 | }
 9 | 
10 | #inputImage{
11 | 	max-width: 100% !important;
12 | }
13 | 
14 | #result{
15 | 	font-family: Roboto !important;
16 | }
17 | 
18 | 


--------------------------------------------------------------------------------
/requirements.txt:
--------------------------------------------------------------------------------
 1 | numpy==1.11.1
 2 | Django==1.9.8
 3 | Pillow==3.3.0
 4 | h5py==2.6.0
 5 | nltk==3.2.1
 6 | scipy==0.17.1
 7 | channels==0.17.2
 8 | asgi-redis==0.14.1
 9 | pika==0.10.0
10 | pyyaml==3.12
11 | uwsgi==2.0.13.1
12 | websocket-client==0.37.0
13 | daphne==0.15.0
14 | requests==2.11.1
15 | 


--------------------------------------------------------------------------------
/manage.py:
--------------------------------------------------------------------------------
 1 | #!/usr/bin/env python
 2 | import os
 3 | import sys
 4 | 
 5 | if __name__ == "__main__":
 6 |     os.environ.setdefault("DJANGO_SETTINGS_MODULE", "demo.settings")
 7 |     # Import only after the settings module default has been set above.
 8 |     from django.core.management import execute_from_command_line
 9 |     # Hand the full command line (e.g. `runserver`) to Django's management dispatcher.
10 |     execute_from_command_line(sys.argv)
11 | 


--------------------------------------------------------------------------------
/grad_cam/routing.py:
--------------------------------------------------------------------------------
 1 | from channels.routing import route, include
 2 | from grad_cam.consumers import ws_message, ws_connect
 3 | # Consumers for the two WebSocket events handled by this app.
 4 | ws_routing = [
 5 |     route("websocket.receive", ws_message),
 6 |     route("websocket.connect", ws_connect),
 7 | ]
 8 | # Top-level routing table: the WebSocket routes apply only to paths matching ^/chat.
 9 | channel_routing = [
10 |     include(ws_routing, path=r"^/chat"),
11 | ]
12 | 


--------------------------------------------------------------------------------
/grad_cam/templates/upload_image_url.html:
--------------------------------------------------------------------------------
1 | <div class="form-group">
2 | 	<input type="url" class="form-control col-sm-6" id="image_url" placeholder="Enter Image URL">
3 | </div>
4 | <button onClick="submitImageUsingUrl();" id="image_url_submit_btn" class="btn btn-default btn-primary" style="margin-top: 10px; margin-bottom: 10px;"> Submit </button>
5 | 


--------------------------------------------------------------------------------
/demo/wsgi.py:
--------------------------------------------------------------------------------
 1 | """
 2 | WSGI config for demo project.
 3 | 
 4 | It exposes the WSGI callable as a module-level variable named ``application``.
 5 | 
 6 | For more information on this file, see
 7 | https://docs.djangoproject.com/en/1.9/howto/deployment/wsgi/
 8 | """
 9 | 
10 | import os
11 | os.environ.setdefault("DJANGO_SETTINGS_MODULE", "demo.settings")
12 | 
13 | from django.core.wsgi import get_wsgi_application
14 | application = get_wsgi_application()
15 | 


--------------------------------------------------------------------------------
/grad_cam/consumers.py:
--------------------------------------------------------------------------------
 1 | from channels import Group
 2 | from grad_cam.utils import log_to_terminal
 3 | 
 4 | def ws_connect(message):
 5 |     # Consumer routed to "websocket.connect": only logs that a client opened a socket.
 6 |     print "User connnected via Socket"
 7 | 
 8 | def ws_message(message):
 9 |     print "Message recieved from client side and the content is ", message.content['text']
10 |     # The text frame sent by the client is used verbatim as the socket id, i.e. the Group name.
11 |     socketid = message.content['text']
12 |     # Add this connection's reply channel to that Group so Group(socketid).send() reaches it.
13 |     Group(socketid).add(message.reply_channel)
14 |     log_to_terminal(socketid, {"info": "User added to the Channel Group"})
15 | 


--------------------------------------------------------------------------------
/grad_cam/urls.py:
--------------------------------------------------------------------------------
 1 | from django.conf.urls import patterns, include, url
 2 | from grad_cam import views
 3 | 
 4 | urlpatterns = patterns('',
 5 |     # Order matters: patterns lack a trailing `$`, so r'^upload' would also match the upload-by-URL path if listed first.
 6 |     url(r'^vqa', views.vqa, name='vqa'),
 7 |     url(r'^upload/grad_cam_using_image_url/', views.upload_image_using_url, name='upload-url'),
 8 |     url(r'^upload', views.file_upload, name='upload'),
 9 |     url(r'^classification', views.classification, name='classification'),
10 |     url(r'^captioning', views.captioning, name='captioning'),
11 |     url(r'^$', views.home, name='home'),
12 | )
13 | 


--------------------------------------------------------------------------------
/demo/urls.py:
--------------------------------------------------------------------------------
 1 | from django.conf.urls import patterns, include, url
 2 | from django.contrib import admin
 3 | from django.conf import settings
 4 | 
 5 | admin.autodiscover()
 6 | 
 7 | urlpatterns = patterns('',
 8 |     # The admin site is matched first; every other path is delegated to grad_cam.urls.
 9 |     url(r'^admin/', include(admin.site.urls)),
10 |     url(r'^', include('grad_cam.urls')),
11 | )
12 | 
13 | 
14 | if settings.DEBUG:
15 |     # Debug only: serve files under MEDIA_ROOT at /media/ through django.views.static.serve.
16 |     urlpatterns += patterns('',
17 |         (r'^media/(?P<path>.*)$', 'django.views.static.serve', {
18 |         'document_root': settings.MEDIA_ROOT}))
19 | 


--------------------------------------------------------------------------------
/grad_cam/templates/header_content.html:
--------------------------------------------------------------------------------
 1 | <div class="container">
 2 |     <div class="page-header">
 3 |         <h1 align="center">CloudCV: Grad-CAM</h1>
 4 |         <h3 align="center">More details about the Grad-CAM dataset can be found <a href="#">here.</a></h3>
 5 |         <font size="4">
 6 |             <p style="text-align:center;"><font size="4">CloudCV can generate heatmaps for questions you ask about an image</font><br><br>
 7 |                 <span style="font-size: 14px;">Browsers currently supported: Google Chrome, Mozilla Firefox</span>
 8 |             </p>
 9 |         </font>
10 |         <br><br>
11 |     </div>
12 | </div>
13 | 


--------------------------------------------------------------------------------
/uwsgi_params:
--------------------------------------------------------------------------------
 1 | uwsgi_param  QUERY_STRING       $query_string;
 2 | uwsgi_param  REQUEST_METHOD     $request_method;
 3 | uwsgi_param  CONTENT_TYPE       $content_type;
 4 | uwsgi_param  CONTENT_LENGTH     $content_length;
 5 | 
 6 | uwsgi_param  REQUEST_URI        $request_uri;
 7 | uwsgi_param  PATH_INFO          $document_uri;
 8 | uwsgi_param  DOCUMENT_ROOT      $document_root;
 9 | uwsgi_param  SERVER_PROTOCOL    $server_protocol;
10 | uwsgi_param  HTTPS              $https if_not_empty;
11 | 
12 | uwsgi_param  REMOTE_ADDR        $remote_addr;
13 | uwsgi_param  REMOTE_PORT        $remote_port;
14 | uwsgi_param  SERVER_PORT        $server_port;
15 | uwsgi_param  SERVER_NAME        $server_name;
16 | 


--------------------------------------------------------------------------------
/misc/DeconvReLU.lua:
--------------------------------------------------------------------------------
 1 | --[[
 2 | 
 3 |     Implementation of DeconvReLU that backpropagates positive gradients
 4 |     irrespective of activations; From the paper:
 5 | 
 6 |     Visualizing and Understanding Convolutional Networks
 7 |     Matthew D. Zeiler, Rob Fergus
 8 |     https://arxiv.org/abs/1311.2901
 9 | 
10 | ]]--
11 | 
12 | local DeconvReLU = torch.class('nn.DeconvReLU', 'nn.Module')
13 | -- Forward pass: copy the input and zero every element that is not > 0 (a plain ReLU).
14 | function DeconvReLU:updateOutput(input)
15 |   self.output:resizeAs(input):copy(input)
16 |   return self.output:cmul(torch.gt(input,0):typeAs(input))
17 | end
18 | -- Backward pass: keep only the positive entries of gradOutput; `input` is used only for the mask's tensor type.
19 | function DeconvReLU:updateGradInput(input, gradOutput)
20 |   self.gradInput:resizeAs(gradOutput):copy(gradOutput)
21 |   return self.gradInput:cmul(torch.gt(gradOutput,0):typeAs(input))
22 | end
23 | 


--------------------------------------------------------------------------------
/misc/GuidedBackpropReLU.lua:
--------------------------------------------------------------------------------
 1 | --[[
 2 | 
 3 |     Implementation of GuidedBackpropReLU that backpropagates positive gradients
 4 |     to input elements with positive activations; From the paper:
 5 | 
 6 |     Striving for Simplicity: The All Convolutional Net
 7 |     Jost Tobias Springenberg, Alexey Dosovitskiy, Thomas Brox, Martin Riedmiller
 8 |     http://arxiv.org/abs/1412.6806
 9 | 
10 | ]]--
11 | 
12 | local GuidedBackpropReLU = torch.class('nn.GuidedBackpropReLU', 'nn.Module')
13 | -- Forward pass: copy the input and zero every element that is not > 0 (a plain ReLU).
14 | function GuidedBackpropReLU:updateOutput(input)
15 |   self.output:resizeAs(input):copy(input)
16 |   return self.output:cmul(torch.gt(input,0):typeAs(input))
17 | end
18 | -- Backward pass: pass a gradient only where both the forward input and the gradient itself are > 0.
19 | function GuidedBackpropReLU:updateGradInput(input, gradOutput)
20 |   self.gradInput:resizeAs(gradOutput):copy(gradOutput)
21 |   return self.gradInput:cmul(torch.gt(input,0):typeAs(input)):cmul(torch.gt(gradOutput,0):typeAs(input))
22 | end
23 | 


--------------------------------------------------------------------------------
/grad_cam/utils.py:
--------------------------------------------------------------------------------
 1 | from channels import Group
 2 | import json
 3 | 
 4 | def log_to_terminal(socketid, message):
 5 | 	"""Send `message`, JSON-encoded as the "text" payload, to the channel Group named `socketid`."""
 6 | 	Group(socketid).send({"text": json.dumps(message)})
 7 | 
 8 | # from django.conf import settings
 9 | # from grad_cam.torch_models import VqaTorchModel, ClassificationTorchModel, CaptioningTorchModel
10 | # from grad_cam.torch_models import VqaTorchModel
11 | 
12 | # import grad_cam.constants as constants
13 | 
14 | # import PyTorch
15 | # import PyTorchHelpers
16 | 
17 | 
18 | # def grad_cam_vqa(input_question, input_answer, image_path, output_dir):
19 | 
20 | #     return VqaTorchModel.predict(image_path, constants.VQA_CONFIG['input_sz'], constants.VQA_CONFIG['input_sz'], input_question, input_answer, output_dir)
21 | 
22 | 
23 | # def grad_cam_classification(image_path, label, output_dir):
24 | 
25 | #     return ClassificationTorchModel.predict(image_path, label, output_dir)
26 | 
27 | 
28 | # def grad_cam_captioning(image_path, caption, output_dir):
29 | 
30 | #     return CaptioningTorchModel.predict(image_path, constants.VQA_CONFIG['input_sz'], constants.VQA_CONFIG['input_sz'], caption, output_dir)
31 | 


--------------------------------------------------------------------------------
/grad_cam/templates/result.html:
--------------------------------------------------------------------------------
 1 |     <h4 id="resultHeading" class="center">Result of Grad-CAM Visual Question Answering</h4>
 2 |     <div class="ResultImage">
 3 |       
 4 |     </div>
 5 |       <div class="row" id="result" style="display:None;">
 6 |         <div class="row">
 7 |           <div class="col s4">
 8 |             <h5><b>Input Image</b></h5><img src="" id="inputImage" class="demo_img">
 9 |           </div>
10 |           <div class="col s8">
11 |             <h5><b>Question:</b></h5><h5 id="questionDisplay"></h5>
12 |             <h5><b>Predicted Answer:</b></h5><h5 id="outputAnswer"></h5>
13 |             <h5><b>Generating Visualizations for: </b></h5><h5 id="inputAnswer"></h5>
14 |           </div>
15 |         </div>
16 |           <div class="col s4">
17 |             <img class="demo_img" src="" id="img1">
18 |             <p class="center">Grad-CAM</p>
19 |           </div>
20 |           <div class="col s4">
21 |             <img class="demo_img" src="" id="img2">
22 |             <p class="center">Guided Backprop</p>
23 |           </div>
24 |           <div class="col s4">
25 |             <img class="demo_img" src="" id="img3">
26 |             <p class="center">Guided Grad-CAM</p>
27 |           </div>
28 |       </div>
29 |       <br>
30 | 


--------------------------------------------------------------------------------
/models/download_models.sh:
--------------------------------------------------------------------------------
 1 | #!/bin/sh
 2 | 
 3 | cd models
 4 | 
 5 | # AlexNet
 6 | # wget -c https://raw.githubusercontent.com/BVLC/caffe/master/models/bvlc_alexnet/deploy.prototxt -O bvlc_alexnet_deploy.prototxt
 7 | # wget -c http://dl.caffe.berkeleyvision.org/bvlc_alexnet.caffemodel
 8 | 
 9 | # VGG-16
10 | wget -c https://gist.githubusercontent.com/ksimonyan/211839e770f7b538e2d8/raw/c3ba00e272d9f48594acef1f67e5fd12aff7a806/VGG_ILSVRC_16_layers_deploy.prototxt
11 | wget -c http://www.robots.ox.ac.uk/~vgg/software/very_deep/caffe/VGG_ILSVRC_16_layers.caffemodel
12 | 
13 | # VGG-19
14 | wget -c https://gist.githubusercontent.com/ksimonyan/3785162f95cd2d5fee77/raw/bb2b4fe0a9bb0669211cf3d0bc949dfdda173e9e/VGG_ILSVRC_19_layers_deploy.prototxt
15 | wget -c http://www.robots.ox.ac.uk/~vgg/software/very_deep/caffe/VGG_ILSVRC_19_layers.caffemodel
16 | 
17 | cd ..
18 | 
19 | # VQA
20 | cd VQA_LSTM_CNN
21 | wget -c https://filebox.ece.vt.edu/~jiasenlu/codeRelease/vqaRelease/train_only/data_train_val.zip
22 | wget -c https://filebox.ece.vt.edu/~jiasenlu/codeRelease/vqaRelease/train_only/pretrained_lstm_train_val.t7.zip
23 | unzip data_train_val.zip
24 | unzip pretrained_lstm_train_val.t7.zip
25 | cd ..
26 | 
27 | # neuraltalk2 checkpoint; -c resumes/skips an existing download like the other fetches in this script
28 | cd neuraltalk2
29 | wget -c http://cs.stanford.edu/people/karpathy/neuraltalk2/checkpoint_v1.zip
30 | unzip checkpoint_v1.zip
31 | cd ..
32 | 


--------------------------------------------------------------------------------
/gradcam_nginx.conf:
--------------------------------------------------------------------------------
 1 | # gradcam_nginx.conf
 2 | 
 3 | # the upstream component nginx needs to connect to
 4 | upstream gradcam {
 5 |     server 127.0.0.1:8001; # for a web port socket (we'll use this first)
 6 | }
 7 | 
 8 | # configuration of the server
 9 | server {
10 |     # the port your site will be served on
11 |     listen      80;
12 |     charset     utf-8;
13 |     server_name gradcam.cloudcv.org;
14 | 
15 |     # max upload size
16 |     client_max_body_size 75M;   # adjust to taste
17 | 
18 |     # Django media
19 |     location /media  {
20 |         alias /home/ubuntu/Projects/Grad-CAM/media;  # your Django project's media files - amend as required
21 |     }
22 | 
23 |     location /static {
24 |         alias /home/ubuntu/Projects/Grad-CAM/static; # your Django project's static files - amend as required
25 |     }
26 | 
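27 |     # WebSocket endpoint: proxy /chat to the server on 127.0.0.1:9000, passing the Upgrade headers.
28 |     location /chat {
29 |         proxy_pass          http://127.0.0.1:9000;
30 |         proxy_http_version  1.1;
31 |         proxy_set_header    Upgrade $http_upgrade;
32 |         proxy_set_header    Connection "Upgrade";
33 |     }
34 |     # Finally, send all remaining (non-media, non-static, non-WebSocket) requests to the Django server.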
35 |     location / {
36 |         uwsgi_pass  gradcam;
37 |         include     /home/ubuntu/Projects/Grad-CAM/uwsgi_params; # the uwsgi_params file you installed
38 |         proxy_http_version  1.1;
39 |         proxy_set_header    Upgrade $http_upgrade;
40 |         proxy_set_header    Connection "Upgrade";
41 | 
42 |     }
43 | 
44 | }
45 | 


--------------------------------------------------------------------------------
/grad_cam/admin.py:
--------------------------------------------------------------------------------
 1 | from django.contrib import admin
 2 | from django.utils.html import format_html
 3 | # Register your models here.
 4 | from grad_cam.models import VqaJob, ClassificationJob, CaptioningJob
 5 | 
 6 | 
 7 | class VqaJobAdmin(admin.ModelAdmin):
 8 |     list_display = ('job_id', 'image_url', 'question', 'input_answer', 'predicted_answer', 'gcam_image_url', 'createdAt')
 9 | 
10 |     def image_url(self, obj):
11 |         return '<img src="%s" alt="%s" height="150px">' % (obj.image, obj.image)
12 |     image_url.allow_tags = True
13 | 
14 | 
15 |     def gcam_image_url(self, obj):
16 |         return '<img src="%s" alt="%s" height="150px">' % (obj.gcam_image, obj.gcam_image)
17 |     gcam_image_url.allow_tags = True
18 | 
19 | class ClassificationJobAdmin(admin.ModelAdmin):
20 |     list_display = ('job_id', 'image_url', 'input_label', 'predicted_label', 'gcam_image_url', 'createdAt')
21 | 
22 |     def image_url(self, obj):
23 |         return '<img src="%s" alt="%s" height="150px">' % (obj.image, obj.image)
24 |     image_url.allow_tags = True
25 | 
26 | 
27 |     def gcam_image_url(self, obj):
28 |         return '<img src="%s" alt="%s" height="150px">' % (obj.gcam_image, obj.gcam_image)
29 |     gcam_image_url.allow_tags = True
30 | 
31 | class CaptioningJobAdmin(admin.ModelAdmin):
32 |     list_display = ('job_id', 'show_image_url', 'input_caption', 'predicted_caption', 'show_gcam_image_url', 'createdAt')
33 | 
34 |     def show_image_url(self, obj):
35 |         return '<img src="%s" alt="%s" height="150px">' % (obj.image, obj.image)
36 |     show_image_url.allow_tags = True
37 | 
38 | 
39 |     def show_gcam_image_url(self, obj):
40 |         return '<img src="%s" alt="%s" height="150px">' % (obj.gcam_image, obj.gcam_image)
41 |     show_gcam_image_url.allow_tags = True
42 | 
43 | admin.site.register(VqaJob, VqaJobAdmin)
44 | admin.site.register(ClassificationJob, ClassificationJobAdmin)
45 | admin.site.register(CaptioningJob, CaptioningJobAdmin)
46 | 


--------------------------------------------------------------------------------
/grad_cam/models.py:
--------------------------------------------------------------------------------
 1 | from django.db import models
 2 | import uuid
 3 | 
 4 | class ClassificationJob(models.Model):
 5 |     job_id = models.CharField(max_length=1000, blank=True, null=True)
 6 |     image = models.CharField(max_length=1000, blank=True, null=True)
 7 |     input_label = models.CharField(max_length=1000, blank=True, null=True, default="")
 8 |     predicted_label = models.CharField(max_length=1000, blank=True, null=True)
 9 |     gcam_image = models.CharField(max_length=1000, blank=True, null=True)
10 |     createdAt = models.DateTimeField("Time", null=True, auto_now_add=True)
11 |     # Python 2 display hook: represent the row by its job_id ("None" when job_id is unset).
12 |     def __unicode__(self):
13 |         return str(self.job_id)
14 | 
15 | class VqaJob(models.Model):
16 |     job_id = models.CharField(max_length=1000, blank=True, null=True)
17 |     image = models.CharField(max_length=1000, blank=True, null=True)
18 |     input_answer = models.CharField(max_length=1000, blank=True, null=True, default="")
19 |     predicted_answer = models.CharField(max_length=1000, blank=True, null=True)
20 |     gcam_image = models.CharField(max_length=1000, blank=True, null=True)
21 |     question = models.CharField(max_length=1000, blank=True, null=True)
22 |     createdAt = models.DateTimeField("Time", null=True, auto_now_add=True)
23 |     # Python 2 display hook: represent the row by its job_id ("None" when job_id is unset).
24 |     def __unicode__(self):
25 |         return str(self.job_id)
26 | 
27 | class CaptioningJob(models.Model):
28 |     job_id = models.CharField(max_length=1000, blank=True, null=True)
29 |     image = models.CharField(max_length=1000, blank=True, null=True)
30 |     input_caption = models.CharField(max_length=1000, blank=True, null=True, default="")
31 |     predicted_caption = models.CharField(max_length=1000, blank=True, null=True)
32 |     gcam_image = models.CharField(max_length=1000, blank=True, null=True)
33 |     createdAt = models.DateTimeField("Time", null=True, auto_now_add=True)
34 |     # Python 2 display hook: represent the row by its job_id ("None" when job_id is unset).
35 |     def __unicode__(self):
36 |         return str(self.job_id)
37 | 


--------------------------------------------------------------------------------
/grad_cam/constants.py:
--------------------------------------------------------------------------------
 1 | from django.conf import settings
 2 | import os
 3 | 
 4 | COCO_IMAGES_PATH = os.path.join(settings.MEDIA_ROOT, 'coco', 'val2014')
 5 | 
 6 | VQA_GPUID = -1
 7 | 
 8 | VQA_CONFIG = {
 9 |     'proto_file': 'models/VGG_ILSVRC_19_layers_deploy.prototxt',
10 |     'model_file': 'models/VGG_ILSVRC_19_layers.caffemodel',
11 |     'input_sz': 224,
12 |     'backend': '',
13 |     'layer_name': 'relu5_4',
14 |     'model_path': 'VQA_LSTM_CNN/lstm_cpu.t7',
15 |     'input_encoding_size': 200,
16 |     'rnn_size': 512,
17 |     'rnn_layers': 2,
18 |     'common_embedding_size': 1024,
19 |     'num_output': 1000,
20 |     'seed': 123,
21 |     'image_dir': os.path.join(settings.BASE_DIR, 'media', 'grad_cam', 'vqa')
22 | }
23 | 
24 | # Fill in the '' placeholder above: VQA_GPUID == -1 selects the "nn" backend, any other id "cudnn".
25 | if VQA_GPUID == -1:
26 |     VQA_CONFIG['backend'] = "nn"
27 | else:
28 |     VQA_CONFIG['backend'] = "cudnn"
29 | 
30 | VQA_LUA_PATH = "visual_question_answering.lua"
31 | 
32 | CLASSIFICATION_GPUID = -1
33 | 
34 | CLASSIFICATION_CONFIG = {
35 |     'proto_file': 'models/VGG_ILSVRC_16_layers_deploy.prototxt',
36 |     'model_file': 'models/VGG_ILSVRC_16_layers.caffemodel',
37 |     'input_sz': 224,
38 |     'backend': 'cudnn',
39 |     'layer_name': 'relu5_3',
40 |     'seed': 123,
41 |     'image_dir': os.path.join(settings.BASE_DIR, 'media', 'grad_cam', 'classification')
42 | }
43 | 
44 | 
45 | CLASSIFICATION_LUA_PATH = "classification.lua"
46 | # Overrides the 'cudnn' default in CLASSIFICATION_CONFIG: GPU id -1 selects "nn", any other id "cudnn".
47 | if CLASSIFICATION_GPUID == -1:
48 |     CLASSIFICATION_CONFIG['backend'] = "nn"
49 | else:
50 |     CLASSIFICATION_CONFIG['backend'] = "cudnn"
51 | 
52 | CAPTIONING_GPUID = 0
53 | 
54 | CAPTIONING_CONFIG = {
55 |     'input_sz': 224,
56 |     'backend': 'cudnn',
57 |     'layer': 30,
58 |     'model_path': 'neuraltalk2/model_id1-501-1448236541.t7',
59 |     'seed': 123,
60 |     'image_dir': os.path.join(settings.BASE_DIR, 'media', 'grad_cam', 'captioning')
61 | }
62 | 
63 | CAPTIONING_LUA_PATH = "captioning.lua"
64 | # CAPTIONING_GPUID is 0 above, so this keeps "cudnn"; setting it to -1 would select the "nn" backend.
65 | if CAPTIONING_GPUID == -1:
66 |     CAPTIONING_CONFIG['backend'] = "nn"
67 | else:
68 |     CAPTIONING_CONFIG['backend'] = "cudnn"
69 | 


--------------------------------------------------------------------------------
/INSTALLATION.md:
--------------------------------------------------------------------------------
 1 | ## Installation Instructions
 2 | 
 3 | ### Installing the Essential requirements
 4 |     sudo apt-get install -y git python-pip python-dev
 5 |     sudo apt-get install -y python-dev
 6 |     sudo apt-get install -y autoconf automake libtool curl make g++ unzip
 7 |     sudo apt-get install -y libgflags-dev libgoogle-glog-dev liblmdb-dev
 8 |     sudo apt-get install libprotobuf-dev libleveldb-dev libsnappy-dev libopencv-dev libhdf5-serial-dev protobuf-compiler
 9 | 
10 | ### Install Torch
11 |     git clone https://github.com/torch/distro.git ~/torch --recursive
12 |     cd ~/torch; bash install-deps;
13 |     ./install.sh
14 |     source ~/.bashrc
15 | 
16 | ### Install PyTorch (Python Lua Wrapper)
17 |     git clone https://github.com/hughperkins/pytorch.git
18 |     cd pytorch
19 |     source ~/torch/install/bin/torch-activate
20 |     ./build.sh
21 | 
22 | ### Install RabbitMQ and Redis Server
23 |     sudo apt-get install -y redis-server rabbitmq-server
24 |     sudo rabbitmq-plugins enable rabbitmq_management
25 |     sudo service rabbitmq-server restart 
26 |     sudo service redis-server restart
27 | 
28 | ### Lua dependencies
29 |     luarocks install loadcaffe
30 | The following two dependencies are only required if you are going to use a GPU:
31 | 
32 |     luarocks install cudnn
33 |     luarocks install cunn
34 | 
35 | ### Cuda Installation
36 | 
37 | Note: CUDA and cuDNN are only required if you are going to use a GPU.
38 | 
39 | Download and install CUDA and cuDNN from the [NVIDIA website](https://developer.nvidia.com/cuda-downloads).
40 | 
41 | ### Install dependencies
42 |     git clone https://github.com/Cloud-CV/Grad-CAM.git
43 |     cd Grad-CAM
44 |     git submodule init && git submodule update
45 |     sh models/download_models.sh
46 |     pip install -r requirements.txt
47 |     python -m nltk.downloader all
48 | 
49 | ### Running the RabbitMQ workers and Development Server
50 | 
51 | Open 4 different terminal sessions and run one of the following commands in each:
52 | 
53 |     python worker_vqa.py
54 |     python worker_classify.py
55 |     python worker_captioning.py
56 |     python manage.py runserver
57 | 
58 | You are all set now. Visit http://127.0.0.1:8000 and you will have your demo running successfully.
59 | 


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
 1 | 
 2 | # Grad-CAM: Gradient-weighted Class Activation Mapping
 3 | 
 4 | [![Join the chat at https://gitter.im/Cloud-CV/Grad-CAM](https://badges.gitter.im/Cloud-CV/Grad-CAM.svg)](https://gitter.im/Cloud-CV/Grad-CAM?utm_source=badge&utm_medium=badge&utm_campaign=pr-badge&utm_content=badge)
 5 | 
 6 | Grad-CAM uses the class-specific gradient information flowing into the final convolutional layer of a CNN to produce a coarse localization map of the important regions in the image. It is a novel technique for making CNNs more 'transparent' by producing **visual explanations**, i.e., visualizations showing what evidence in the image supports a prediction. You can play with Grad-CAM demonstrations at the following links:
 7 | 
 8 | **Arxiv Paper Link**: https://arxiv.org/abs/1610.02391
 9 | 
10 | ### Grad-CAM VQA Demo: http://gradcam.cloudcv.org/vqa
11 | 
12 | 
13 | ![Imgur](http://i.imgur.com/6jB4lAq.gif)
14 | 
15 | ### Grad-CAM Classification Demo: http://gradcam.cloudcv.org/classification
16 | 
17 | 
18 | ![Imgur](http://i.imgur.com/a1IiQg4.gif)
19 | 
20 | ### Grad-CAM Captioning Demo: http://gradcam.cloudcv.org/captioning
21 | 
22 | 
23 | ![Imgur](http://i.imgur.com/BsOOpIn.gif)
24 | 
25 | ## Installing / Getting started
26 | 
27 | We use RabbitMQ to queue the submitted jobs. Also, we use Redis as backend for realtime communication using websockets.
28 | 
29 | All the instructions for setting up Grad-CAM from scratch can be found [here](https://github.com/Cloud-CV/Grad-CAM/blob/master/INSTALLATION.md).
30 | 
31 | Note: For best results, it's recommended to run the Grad-CAM demo on GPU-enabled machines.
32 | 
33 | ## Interested in Contributing?
34 | 
35 | Cloud-CV always welcomes new contributors who want to learn new cutting-edge technologies. If you'd like to contribute, please fork the repository and use a feature branch. Pull requests are warmly welcome.
36 | 
37 | If you have more questions about the project, you can talk to us on our [Gitter Channel](https://gitter.im/Cloud-CV/Grad-CAM).
38 | 
39 | ## Acknowledgements
40 | 
41 | - [VQA_LSTM_CNN](https://github.com/VT-vision-lab/VQA_LSTM_CNN)
42 | - [HieCoAttenVQA](https://github.com/jiasenlu/HieCoAttenVQA)
43 | - [NeuralTalk2](https://github.com/karpathy/neuraltalk2/)
44 | - [PyTorch](https://github.com/hughperkins/pytorch)
45 | 


--------------------------------------------------------------------------------
/grad_cam/home.html:
--------------------------------------------------------------------------------
 1 | {% load staticfiles %}
 2 | 
 3 | <!DOCTYPE html>
 4 | <html>
 5 | <head>
 6 |   <title>Grad-Cam</title>
 7 |   <!-- Compiled and minified CSS -->
 8 |   <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/materialize/0.97.6/css/materialize.min.css">
 9 |   <link href="http://fonts.googleapis.com/icon?family=Material+Icons" rel="stylesheet">
10 | 
11 |   <link rel="stylesheet" type="text/css" href="{% static 'css/style.css' %}">
12 |   <meta name="viewport" content="width=device-width, initial-scale=1.0"/>
13 |   <script type="text/javascript" src="https://code.jquery.com/jquery-2.1.1.min.js"></script>
14 |   <script type="text/javascript" src="https://cdnjs.cloudflare.com/ajax/libs/reconnecting-websocket/1.0.0/reconnecting-websocket.min.js"></script>
15 | </head>
16 | <body>
17 |   <nav>
18 |     <div class="nav-wrapper red darken-4">
19 |       <a href="#" class="brand-logo center">Gradient-weighted Class Activation Mapping Demo</a>
20 |     </div>
21 |   </nav>
22 |   <div class="container">
23 |     <h3 class="center">Visual Question Answering</h3>
24 |     <div class="row">
25 |       <form class="col s12" action="/demo/vqa/" method="POST" enctype="multipart/form-data" id="vqaForm">
26 |         {% csrf_token %}
27 |         <div class="file-field input-field col s10">
28 |           <div class="btn red darken-4">
29 |             <span>Image</span>
30 |             <input type="file" name="file" id="file" required>
31 |           </div>
32 |           <div class="file-path-wrapper">
33 |             <input class="file-path validate" type="text" placeholder="Upload Image" name="file">
34 |           </div>
35 |         </div>
36 |         <div class="input_field col s6">
37 |           <label for="question">Question</label>
38 |           <input id="question" type="text" class="validate" name="question" id="question" required>
39 |         </div>
40 |         <div class="input_field col s4">
41 |           <label for="answer">Answer(Optional)</label>
42 |           <input id="answer" type="text" name="answer" id="answer">
43 |         </div>
44 |         <div class="col s4">
45 |           <a class="waves-effect waves-light btn red darken-4" onclick="submitForm();"><i class="material-icons right">cloud</i>Submit</a>
46 |         </div>
47 |         </form>
48 |     </div>
49 |   </div>
50 | </body>
51 | </html>
52 | 


--------------------------------------------------------------------------------
/Docker/GradCAM/Dockerfile:
--------------------------------------------------------------------------------
 1 | # Start with CUDA Torch dependencies
 2 | FROM kaixhin/cuda-torch-deps:latest
 3 | 
 4 | MAINTAINER Deshraj <deshrajdry@gmail.com>
 5 | 
 6 | # Run Torch7 installation scripts
 7 | RUN cd /root/torch && \
 8 |   ./install.sh
 9 | 
10 | # Export environment variables manually
11 | ENV LUA_PATH='/root/.luarocks/share/lua/5.1/?.lua;/root/.luarocks/share/lua/5.1/?/init.lua;/root/torch/install/share/lua/5.1/?.lua;/root/torch/install/share/lua/5.1/?/init.lua;./?.lua;/root/torch/install/share/luajit-2.1.0-beta1/?.lua;/usr/local/share/lua/5.1/?.lua;/usr/local/share/lua/5.1/?/init.lua'
12 | ENV LUA_CPATH='/root/.luarocks/lib/lua/5.1/?.so;/root/torch/install/lib/lua/5.1/?.so;./?.so;/usr/local/lib/lua/5.1/?.so;/usr/local/lib/lua/5.1/loadall.so'
13 | ENV PATH=/root/torch/install/bin:$PATH
14 | ENV LD_LIBRARY_PATH=/root/torch/install/lib:$LD_LIBRARY_PATH
15 | ENV DYLD_LIBRARY_PATH=/root/torch/install/lib:$DYLD_LIBRARY_PATH
16 | ENV LUA_CPATH='/root/torch/install/lib/?.so;'$LUA_CPATH
17 | 
18 | RUN apt-get update
19 | RUN apt-get install -y python-dev libhdf5-serial-dev  libprotobuf-dev protobuf-compiler
20 | 
21 | # Install PyTorch
22 | RUN pip install numpy==1.11.1 pytest
23 | RUN git clone https://github.com/hughperkins/pytorch.git && cd pytorch && ./build.sh
24 | 
25 | # Clone the repository
26 | RUN git clone https://github.com/DESHRAJ/grad-cam.git
27 | 
28 | # Update git submodules
29 | RUN cd grad-cam && git submodule init && git submodule update
30 | 
31 | # Change relative path in lua for neuraltalk2
32 | RUN cd grad-cam && sed -i -e "s/local utils = require 'misc.utils'/local utils = require 'neuraltalk2.misc.utils'/g" neuraltalk2/misc/LanguageModel.lua
33 | RUN cd grad-cam && sed -i -e "s/local net_utils = require 'misc.net_utils'/local net_utils = require 'neuraltalk2.misc.net_utils'/g" neuraltalk2/misc/LanguageModel.lua
34 | RUN cd grad-cam && sed -i -e "s/local LSTM = require 'misc.LSTM'/local LSTM = require 'neuraltalk2.misc.LSTM'/g" neuraltalk2/misc/LanguageModel.lua
35 | 
36 | # Install python dependencies
37 | RUN cd grad-cam && pip install -r requirements.txt
38 | RUN python -m nltk.downloader all
39 | 
40 | # Install lua dependencies
41 | RUN luarocks install loadcaffe
42 | RUN luarocks install nn
43 | RUN luarocks install cunn
44 | RUN luarocks install cudnn
45 | 
46 | RUN apt-get install -y unzip wget
47 | 
48 | # Download the models
49 | RUN cd grad-cam && bash models/download_models.sh && pwd
50 | 
51 | WORKDIR /grad-cam
52 | 
53 | EXPOSE 80
54 | EXPOSE 8000
55 | 
56 | CMD  ["/bin/bash", "/grad-cam/Docker/deploy.sh"]
57 | 


--------------------------------------------------------------------------------
/misc/prepro_ques.py:
--------------------------------------------------------------------------------
 1 | """
 2 | Preprocesses a question
 3 | Adapted from https://github.com/VT-vision-lab/VQA_LSTM_CNN/blob/master/prepro.py
 4 | """
 5 | import copy
 6 | from random import shuffle, seed
 7 | import sys
 8 | import os.path
 9 | import argparse
10 | import glob
11 | import numpy as np
12 | from scipy.misc import imread, imresize
13 | import scipy.io
14 | import pdb
15 | import string
16 | import h5py
17 | from nltk.tokenize import word_tokenize
18 | import json
19 | 
20 | import re
21 | 
22 | 
def tokenize(sentence):
    """Split *sentence* on punctuation and whitespace, keeping the punctuation.

    The delimiter class is a capturing group, so ``re.split`` returns the
    delimiters too; empty strings, single spaces and newlines are then dropped.
    """
    pieces = re.split(r"([-.\"',:? !\$#@~()*&\^%;\[\]/\\\+<>\n=])", sentence)
    return [piece for piece in pieces if piece not in ('', ' ', '\n')]
25 | 
def prepro_question(s, method='nltk'):
    """Tokenize the question *s* and return the list of tokens.

    With ``method='nltk'`` (the default) the question is converted with
    ``str``, lower-cased and passed to NLTK's ``word_tokenize``.  Any other
    value hands *s* unchanged to the regex-based ``tokenize``.
    """
    if method != 'nltk':
        return tokenize(s)
    return word_tokenize(str(s).lower())
32 | 
def apply_vocab_question(tokens, wtoi):
    """Return *tokens* with every out-of-vocabulary word replaced by ``'UNK'``.

    *wtoi* maps words to indices.  ``len(wtoi) + 1`` is used as the "missing"
    marker, so a word whose stored index equals that value is also reported
    as ``'UNK'``.
    """
    missing = len(wtoi) + 1
    question = []
    for word in tokens:
        known = wtoi.get(word, missing) != missing
        question.append(word if known else 'UNK')
    return question
37 | 
def encode_question(ques, wtoi):
    """Encode the tokens of *ques* as a fixed-length array of vocabulary indices.

    Returns ``(label_arrays, label_length)``: a ``uint32`` array of 26 entries,
    zero-padded after the encoded tokens, and the number of tokens that were
    encoded (at most 26).  Each encoded token is printed.  A token among the
    first 26 that is missing from *wtoi* raises ``KeyError``.
    """
    max_length = 26
    label_length = min(max_length, len(ques))  # length of the encoded sequence
    label_arrays = np.zeros((max_length), dtype='uint32')

    # Pairing with range() stops after max_length tokens; the rest are ignored.
    for position, word in zip(range(max_length), ques):
        print(word)
        label_arrays[position] = wtoi[word]

    return label_arrays, label_length
49 | 
def feat_ques(question):
    """Encode *question* with the VQA vocabulary and dump it to ``ques_feat.json``.

    The vocabulary is read from ``VQA_LSTM_CNN/data_prepro.json`` (key
    ``ix_to_word``) and the result is written to ``ques_feat.json``; both
    paths are relative to the current working directory.

    Returns ``(ques, ques_length)``: the encoded question as a plain list and
    the number of encoded tokens.  The encoded list is also printed.
    """
    # tokenization and preprocessing of the question
    tokens = prepro_question(question)

    # Load the vocabulary file and invert it into a word -> index table.
    with open('VQA_LSTM_CNN/data_prepro.json', 'r') as f:
        itow = json.load(f)['ix_to_word']
    wtoi = {w: i for i, w in itow.items()}

    fin_ques = apply_vocab_question(tokens, wtoi)
    ques, ques_length = encode_question(fin_ques, wtoi)

    # Convert once and reuse for the JSON dump, the printout and the return value.
    encoded = ques.tolist()
    with open('ques_feat.json', 'w') as q_file:
        json.dump({'ques': encoded, 'ques_length': ques_length}, q_file)
    # Function-call form works on Python 2 and 3 and matches print(w) elsewhere in this file.
    print(encoded)

    return encoded, ques_length
70 | 
def main(params):
    """Encode the question stored under ``params['question']``.

    The encoded question and its length returned by ``feat_ques`` are
    unpacked but not used further; nothing is returned.
    """
    _encoded, _length = feat_ques(params['question'])
74 | 
if __name__ == "__main__":
    # Command-line entry point: the question is read from -d/--question and
    # passed to main() as a plain dict of parsed options.
    cli = argparse.ArgumentParser()
    cli.add_argument('-d', '--question', dest='question', default='what is the man doing', help='question string')
    main(vars(cli.parse_args()))
82 | 


--------------------------------------------------------------------------------
/demo/settings.py:
--------------------------------------------------------------------------------
  1 | """
  2 | Django settings for demo project.
  3 | 
  4 | For more information on this file, see
  5 | https://docs.djangoproject.com/en/1.6/topics/settings/
  6 | 
  7 | For the full list of settings and their values, see
  8 | https://docs.djangoproject.com/en/1.6/ref/settings/
  9 | """
 10 | 
 11 | # Build paths inside the project like this: os.path.join(BASE_DIR, ...)
 12 | import os
 13 | BASE_DIR = os.path.dirname(os.path.dirname(__file__))
 14 | 
 15 | 
 16 | # Quick-start development settings - unsuitable for production
 17 | # See https://docs.djangoproject.com/en/1.6/howto/deployment/checklist/
 18 | 
 19 | # SECURITY WARNING: keep the secret key used in production secret!
 20 | SECRET_KEY = 's^5q!)!rui+p&^&+bggew-as=wu@2#b9-=lac_mlu%xg9w&c9y'
 21 | 
 22 | # SECURITY WARNING: don't run with debug turned on in production!
 23 | DEBUG = True
 24 | 
 25 | TEMPLATE_DEBUG = True
 26 | 
 27 | ALLOWED_HOSTS = []
 28 | 
 29 | 
 30 | # Application definition
 31 | 
 32 | INSTALLED_APPS = (
 33 |     'django.contrib.admin',
 34 |     'django.contrib.auth',
 35 |     'django.contrib.contenttypes',
 36 |     'django.contrib.sessions',
 37 |     'django.contrib.messages',
 38 |     'django.contrib.staticfiles',
 39 |     'grad_cam',
 40 |     'channels',
 41 | )
 42 | 
 43 | MIDDLEWARE_CLASSES = (
 44 |     'django.contrib.sessions.middleware.SessionMiddleware',
 45 |     'django.middleware.common.CommonMiddleware',
 46 |     'django.middleware.csrf.CsrfViewMiddleware',
 47 |     'django.contrib.auth.middleware.AuthenticationMiddleware',
 48 |     'django.contrib.messages.middleware.MessageMiddleware',
 49 |     'django.middleware.clickjacking.XFrameOptionsMiddleware',
 50 | )
 51 | 
 52 | ROOT_URLCONF = 'demo.urls'
 53 | 
 54 | WSGI_APPLICATION = 'demo.wsgi.application'
 55 | 
 56 | 
 57 | # Database
 58 | # https://docs.djangoproject.com/en/1.6/ref/settings/#databases
 59 | 
 60 | DATABASES = {
 61 |     'default': {
 62 |         'ENGINE': 'django.db.backends.mysql', 
 63 |         'NAME': 'grad_cam',
 64 |         'USER': 'root',
 65 |         'PASSWORD': 'root123',
 66 |         'HOST': 'localhost',   # Or an IP Address that your DB is hosted on
 67 |         'PORT': '3306',
 68 |     }
 69 | }
 70 | # Internationalization
 71 | # https://docs.djangoproject.com/en/1.6/topics/i18n/
 72 | 
 73 | LANGUAGE_CODE = 'en-us'
 74 | 
 75 | TIME_ZONE = 'UTC'
 76 | 
 77 | USE_I18N = True
 78 | 
 79 | USE_L10N = True
 80 | 
 81 | USE_TZ = True
 82 | 
 83 | 
 84 | # Static files (CSS, JavaScript, Images)
 85 | # https://docs.djangoproject.com/en/1.6/howto/static-files/
 86 | 
 87 | STATIC_URL = '/static/'
 88 | 
 89 | STATIC_ROOT = os.path.join(BASE_DIR, 'static')
 90 | 
 91 | MEDIA_ROOT = os.path.join(BASE_DIR, 'media')
 92 | 
 93 | MEDIA_URL= "/media/"
 94 | 
 95 | CHANNEL_LAYERS = {
 96 |     "default": {
 97 |         "BACKEND": "asgi_redis.RedisChannelLayer",
 98 |         "CONFIG": {
 99 |             "hosts": [("localhost", 6379)],
100 |             "prefix": u"gradcam:",
101 |         },
102 |         "ROUTING": "grad_cam.routing.channel_routing",
103 |     },
104 | }
105 | 


--------------------------------------------------------------------------------
/grad_cam/sender.py:
--------------------------------------------------------------------------------
 1 | from django.conf import settings
 2 | from grad_cam.utils import log_to_terminal
 3 | 
 4 | import os
 5 | import pika
 6 | import sys
 7 | import json
 8 | 
 9 | 
def grad_cam_classification(image_path, label, out_dir, socketid):
    """Publish a classification job to the ``classify_task_queue`` RabbitMQ queue.

    The job is a JSON object with the keys ``image_path``, ``label``,
    ``output_dir`` and ``socketid``.  Progress messages are sent to the client
    identified by *socketid* through ``log_to_terminal``.
    """
    message = {
        'image_path': image_path,
        'label': label,
        'output_dir': out_dir,
        'socketid': socketid,
    }

    connection = pika.BlockingConnection(pika.ConnectionParameters(
            host='localhost'))
    try:
        channel = connection.channel()
        channel.queue_declare(queue='classify_task_queue', durable=True)

        log_to_terminal(socketid, {"terminal": "Publishing job to Classification Queue"})
        channel.basic_publish(exchange='',
                              routing_key='classify_task_queue',
                              body=json.dumps(message),
                              properties=pika.BasicProperties(
                                  delivery_mode=2,  # make message persistent
                              ))

        print(" [x] Sent %r" % message)
        log_to_terminal(socketid, {"terminal": "Job published successfully"})
    finally:
        # Release the broker connection even when declaring, publishing or logging fails.
        connection.close()
34 | 
35 | 
def grad_cam_vqa(input_question, input_answer, image_path, out_dir, socketid):
    """Publish a VQA job to the ``vqa_task_queue`` RabbitMQ queue.

    The job is a JSON object with the keys ``image_path``, ``input_question``,
    ``input_answer``, ``output_dir`` and ``socketid``.  Progress messages are
    sent to the client identified by *socketid* through ``log_to_terminal``.
    """
    message = {
        'image_path': image_path,
        'input_question': input_question,
        'input_answer': input_answer,
        'output_dir': out_dir,
        'socketid': socketid,
    }

    connection = pika.BlockingConnection(pika.ConnectionParameters(
            host='localhost'))
    try:
        channel = connection.channel()
        channel.queue_declare(queue='vqa_task_queue', durable=True)

        log_to_terminal(socketid, {"terminal": "Publishing job to VQA Queue"})
        channel.basic_publish(exchange='',
                              routing_key='vqa_task_queue',
                              body=json.dumps(message),
                              properties=pika.BasicProperties(
                                  delivery_mode=2,  # make message persistent
                              ))

        print(" [x] Sent %r" % message)
        log_to_terminal(socketid, {"terminal": "Job published successfully"})
    finally:
        # Release the broker connection even when declaring, publishing or logging fails.
        connection.close()
60 | 
61 | 
def grad_cam_captioning(image_path, caption, out_dir, socketid):
    """Publish a captioning job to the ``captioning_task_queue`` RabbitMQ queue.

    The job is a JSON object with the keys ``image_path``, ``caption``,
    ``output_dir`` and ``socketid``.  Progress messages are sent to the client
    identified by *socketid* through ``log_to_terminal``.
    """
    message = {
        'image_path': image_path,
        'caption': caption,
        'output_dir': out_dir,
        'socketid': socketid,
    }

    connection = pika.BlockingConnection(pika.ConnectionParameters(
            host='localhost'))
    try:
        channel = connection.channel()
        channel.queue_declare(queue='captioning_task_queue', durable=True)

        log_to_terminal(socketid, {"terminal": "Publishing job to Captioning Queue"})
        channel.basic_publish(exchange='',
                              routing_key='captioning_task_queue',
                              body=json.dumps(message),
                              properties=pika.BasicProperties(
                                  delivery_mode=2,  # make message persistent
                              ))

        print(" [x] Sent %r" % message)
        log_to_terminal(socketid, {"terminal": "Job published successfully"})
    finally:
        # Release the broker connection even when declaring, publishing or logging fails.
        connection.close()
85 | 


--------------------------------------------------------------------------------
/worker_captioning.py:
--------------------------------------------------------------------------------
 1 | from __future__ import absolute_import
 2 | import os
 3 | os.environ.setdefault('DJANGO_SETTINGS_MODULE', 'demo.settings')
 4 | 
 5 | import django
 6 | django.setup()
 7 | 
 8 | from django.conf import settings
 9 | from grad_cam.utils import log_to_terminal
10 | from grad_cam.models import CaptioningJob
11 | 
12 | import grad_cam.constants as constants
13 | import PyTorch
14 | import PyTorchHelpers
15 | import pika
16 | import time
17 | import yaml
18 | import json
19 | import traceback
20 | import urllib
21 | 
22 | # Close the database connection in order to make sure that MYSQL Timeout doesn't occur
23 | django.db.close_old_connections()
24 | 
25 | CaptioningModel = PyTorchHelpers.load_lua_class(constants.CAPTIONING_LUA_PATH, 'CaptioningTorchModel')
26 | CaptioningTorchModel = CaptioningModel(
27 |     constants.CAPTIONING_CONFIG['model_path'],
28 |     constants.CAPTIONING_CONFIG['backend'],
29 |     constants.CAPTIONING_CONFIG['input_sz'],
30 |     constants.CAPTIONING_CONFIG['layer'],
31 |     constants.CAPTIONING_CONFIG['seed'],
32 |     constants.CAPTIONING_GPUID,
33 | )
34 | 
35 | connection = pika.BlockingConnection(pika.ConnectionParameters(
36 |         host='localhost'))
37 | 
38 | channel = connection.channel()
39 | 
40 | channel.queue_declare(queue='captioning_task_queue', durable=True)
41 | print(' [*] Waiting for messages. To exit press CTRL+C')
42 | 
def callback(ch, method, properties, body):
    """Handle one message from ``captioning_task_queue``.

    Runs the captioning Grad-CAM model on the job described by *body*, stores a
    ``CaptioningJob`` row, sends the result paths to the client through
    ``log_to_terminal`` and acknowledges the message.

    On failure the traceback is printed and, when the job's ``socketid`` could
    be read, sent to the client; the message is not acknowledged.
    """
    try:
        print(" [x] Received %r" % body)
        body = yaml.safe_load(body) # using yaml instead of json.loads since that unicodes the string in value

        # Use the captioning model's own input size, the one it was constructed with.
        input_sz = constants.CAPTIONING_CONFIG['input_sz']
        result = CaptioningTorchModel.predict(body['image_path'], input_sz, input_sz, body['caption'], body['output_dir'])

        CaptioningJob.objects.create(job_id=body['socketid'], input_caption=body['caption'], image=str(result['input_image']).replace(settings.BASE_DIR, '')[1:], predicted_caption = result['pred_caption'], gcam_image=str(result['captioning_gcam']).replace(settings.BASE_DIR, '')[1:])

        # Close the database connection in order to make sure that MYSQL Timeout doesn't occur
        django.db.close_old_connections()

        # Strip BASE_DIR from the output paths.  The first three are also
        # percent-escaped with quote(); urlencode() only accepts mappings or
        # sequences of pairs and raises TypeError on a plain string.
        for key in ('input_image', 'captioning_gcam', 'captioning_gcam_raw'):
            result[key] = urllib.quote(str(result[key]).replace(settings.BASE_DIR, ''))
        for key in ('captioning_gb', 'captioning_gb_gcam'):
            result[key] = str(result[key]).replace(settings.BASE_DIR, '')

        log_to_terminal(body['socketid'], {"result": json.dumps(result)})
        log_to_terminal(body['socketid'], {"terminal": json.dumps(result)})
        log_to_terminal(body['socketid'], {"terminal": "Completed the Captioning job"})

        ch.basic_ack(delivery_tag = method.delivery_tag)

    except Exception:
        # print_exc() only prints and returns None; format_exc() returns the text to forward.
        traceback.print_exc()
        trace_text = traceback.format_exc()
        # body is still the raw payload when parsing failed, so only index it when it is a dict.
        socketid = body.get('socketid') if isinstance(body, dict) else None
        if socketid is not None:
            log_to_terminal(socketid, {"terminal": json.dumps({"Traceback": trace_text})})
69 | 
70 | channel.basic_consume(callback,
71 |                       queue='captioning_task_queue')
72 | 
73 | channel.start_consuming()
74 | 


--------------------------------------------------------------------------------
/worker_classify.py:
--------------------------------------------------------------------------------
 1 | from __future__ import absolute_import
 2 | import os
 3 | os.environ.setdefault('DJANGO_SETTINGS_MODULE', 'demo.settings')
 4 | 
 5 | import django
 6 | django.setup()
 7 | 
 8 | 
 9 | from django.conf import settings
10 | from grad_cam.utils import log_to_terminal
11 | from grad_cam.models import ClassificationJob
12 | import grad_cam.constants as constants
13 | import PyTorch
14 | import PyTorchHelpers
15 | import pika
16 | import time
17 | import yaml
18 | import json
19 | import traceback
20 | 
21 | # Close the database connection in order to make sure that MYSQL Timeout doesn't occur
22 | django.db.close_old_connections()
23 | 
24 | ClassificationModel = PyTorchHelpers.load_lua_class(constants.CLASSIFICATION_LUA_PATH, 'ClassificationTorchModel')
25 | ClassificationTorchModel = ClassificationModel(
26 |     constants.CLASSIFICATION_CONFIG['proto_file'],
27 |     constants.CLASSIFICATION_CONFIG['model_file'],
28 |     constants.CLASSIFICATION_CONFIG['backend'],
29 |     constants.CLASSIFICATION_CONFIG['input_sz'],
30 |     constants.CLASSIFICATION_CONFIG['layer_name'],
31 |     constants.CLASSIFICATION_CONFIG['seed'],
32 |     constants.CLASSIFICATION_GPUID,
33 | )
34 | 
35 | connection = pika.BlockingConnection(pika.ConnectionParameters(
36 |         host='localhost'))
37 | 
38 | channel = connection.channel()
39 | 
40 | channel.queue_declare(queue='classify_task_queue', durable=True)
41 | print(' [*] Waiting for messages. To exit press CTRL+C')
42 | 
def callback(ch, method, properties, body):
    """Handle one message from ``classify_task_queue``.

    Runs the classification Grad-CAM model on the job described by *body*,
    stores a ``ClassificationJob`` row, sends the result paths to the client
    through ``log_to_terminal`` and acknowledges the message.

    On failure the traceback is printed and, when the job's ``socketid`` could
    be read, sent to the client; the message is not acknowledged.
    """
    try:
        print(" [x] Received %r" % body)
        body = yaml.safe_load(body) # using yaml instead of json.loads since that unicodes the string in value

        result = ClassificationTorchModel.predict(body['image_path'], body['label'], body['output_dir'])

        ClassificationJob.objects.create(job_id=body['socketid'], input_label=body['label'], image=str(result['input_image']).replace(settings.BASE_DIR, '')[1:], predicted_label = result['pred_label'], gcam_image=str(result['classify_gcam']).replace(settings.BASE_DIR, '')[1:])

        # Close the database connection in order to make sure that MYSQL Timeout doesn't occur
        django.db.close_old_connections()

        # Strip BASE_DIR from the output paths before they are sent to the client.
        for key in ('input_image', 'classify_gcam', 'classify_gcam_raw', 'classify_gb', 'classify_gb_gcam'):
            result[key] = str(result[key]).replace(settings.BASE_DIR, '')

        print(result)

        # The leftover debug message to the placeholder socket id "Hello" is no longer sent.
        log_to_terminal(body['socketid'], {"terminal": json.dumps(result)})
        log_to_terminal(body['socketid'], {"result": json.dumps(result)})
        log_to_terminal(body['socketid'], {"terminal": "Completed the Classification Task"})

        ch.basic_ack(delivery_tag = method.delivery_tag)
    except Exception:
        # print_exc() only prints and returns None; format_exc() returns the text to forward.
        traceback.print_exc()
        trace_text = traceback.format_exc()
        # body is still the raw payload when parsing failed, so only index it when it is a dict.
        socketid = body.get('socketid') if isinstance(body, dict) else None
        if socketid is not None:
            log_to_terminal(socketid, {"terminal": json.dumps({"Traceback": trace_text})})
71 | 
72 | channel.basic_consume(callback,
73 |                       queue='classify_task_queue')
74 | 
75 | channel.start_consuming()
76 | 


--------------------------------------------------------------------------------
/worker_vqa.py:
--------------------------------------------------------------------------------
 1 | from __future__ import absolute_import
 2 | import os
 3 | os.environ.setdefault('DJANGO_SETTINGS_MODULE', 'demo.settings')
 4 | 
 5 | import django
 6 | django.setup()
 7 | 
 8 | from grad_cam.models import VqaJob
 9 | from django.conf import settings
10 | from grad_cam.utils import log_to_terminal
11 | 
12 | import grad_cam.constants as constants
13 | import PyTorch
14 | import PyTorchHelpers
15 | import pika
16 | import time
17 | import yaml
18 | import json
19 | import traceback
20 | 
21 | # Close the database connection in order to make sure that MYSQL Timeout doesn't occur
22 | django.db.close_old_connections()
23 | 
24 | # Loading the VQA Model forever
25 | VQAModel = PyTorchHelpers.load_lua_class(constants.VQA_LUA_PATH, 'VQATorchModel')
26 | VqaTorchModel = VQAModel(
27 |     constants.VQA_CONFIG['proto_file'],
28 |     constants.VQA_CONFIG['model_file'],
29 |     constants.VQA_CONFIG['input_sz'],
30 |     constants.VQA_CONFIG['backend'],
31 |     constants.VQA_CONFIG['layer_name'],
32 |     constants.VQA_CONFIG['model_path'],
33 |     constants.VQA_CONFIG['input_encoding_size'],
34 |     constants.VQA_CONFIG['rnn_size'],
35 |     constants.VQA_CONFIG['rnn_layers'],
36 |     constants.VQA_CONFIG['common_embedding_size'],
37 |     constants.VQA_CONFIG['num_output'],
38 |     constants.VQA_CONFIG['seed'],
39 |     constants.VQA_GPUID,
40 | )
41 | 
42 | connection = pika.BlockingConnection(pika.ConnectionParameters(
43 |         host='localhost'))
44 | 
45 | channel = connection.channel()
46 | 
47 | channel.queue_declare(queue='vqa_task_queue', durable=True)
48 | print(' [*] Waiting for messages. To exit press CTRL+C')
49 | 
def callback(ch, method, properties, body):
    """Handle one message from ``vqa_task_queue``.

    Runs the VQA Grad-CAM model on the job described by *body*, stores a
    ``VqaJob`` row, sends the result paths to the client through
    ``log_to_terminal`` and acknowledges the message.

    On failure the traceback is printed and, when the job's ``socketid`` could
    be read, sent to the client; the message is not acknowledged.
    """
    try:
        print(" [x] Received %r" % body)
        body = yaml.safe_load(body) # using yaml instead of json.loads since that unicodes the string in value

        input_sz = constants.VQA_CONFIG['input_sz']
        result = VqaTorchModel.predict(body['image_path'], input_sz, input_sz, body['input_question'], body['input_answer'], body['output_dir'])

        VqaJob.objects.create(job_id=body['socketid'], question=body['input_question'], input_answer=body['input_answer'], image=str(result['input_image']).replace(settings.BASE_DIR, '')[1:], predicted_answer = result['answer'], gcam_image=str(result['vqa_gcam']).replace(settings.BASE_DIR, '')[1:])

        # Close the database connection in order to make sure that MYSQL Timeout doesn't occur
        django.db.close_old_connections()

        # Strip BASE_DIR from the output paths before they are sent to the client.
        for key in ('input_image', 'vqa_gcam', 'vqa_gcam_raw', 'vqa_gb', 'vqa_gb_gcam'):
            result[key] = str(result[key]).replace(settings.BASE_DIR, '')

        log_to_terminal(body['socketid'], {"terminal": json.dumps(result)})
        log_to_terminal(body['socketid'], {"result": json.dumps(result)})
        log_to_terminal(body['socketid'], {"terminal": "Completed the Grad-CAM VQA task"})

        ch.basic_ack(delivery_tag = method.delivery_tag)
    except Exception:
        # print_exc() only prints and returns None; format_exc() returns the text to forward.
        traceback.print_exc()
        trace_text = traceback.format_exc()
        # body is still the raw payload when parsing failed, so only index it when it is a dict.
        socketid = body.get('socketid') if isinstance(body, dict) else None
        if socketid is not None:
            log_to_terminal(socketid, {"terminal": json.dumps({"Traceback": trace_text})})
75 | 
76 | channel.basic_consume(callback,
77 |                       queue='vqa_task_queue')
78 | 
79 | channel.start_consuming()
80 | 


--------------------------------------------------------------------------------
/grad_cam/templates/index_new.html:
--------------------------------------------------------------------------------
  1 | {% extends 'base.html' %}
  2 | 
  3 | {% block header_content %}
  4 | 
  5 | {% include 'header_content.html' %}
  6 | 
  7 | {% endblock %}
  8 | 
  9 | {% block form %}
 10 | 
 11 | <div class="container">
 12 |   <div class="page-header">
 13 |     <h2 id="userImages">Try CloudCV VQA On Your Images</h2>
 14 |   </div>
 15 | 
 16 |   <form id="fileupload" method="post" class="dropzone
 17 |   " action="{% url "upload" %}" enctype="multipart/form-data">
 18 |   {% csrf_token %}
 19 | 
 20 |   {% include 'form.html' %}
 21 |   </form>
 22 | 
 23 | {% endblock %}
 24 | 
 25 | {% block terminal %}
 26 | {% endblock %}
 27 | 
 28 | {% block result %}
 29 | 
 30 | {% include 'result.html' %}
 31 | 
 32 | {% endblock %}
 33 | 
 34 | </body>
 35 | <script type="text/javascript">
 36 |   // handle things after the file is uploaded on the server
 37 |   // 1. Navigate below to show the image thumbnail and a question and answer field
 38 |   var image_count = 0;
 39 |   function processResult(response_data){
 40 |         image_count = image_count + 1;
 41 | 
 42 |         $('#comments').prepend('<li>' + "Rendering results..." + '</li>');
 43 |         var parentDiv = document.getElementById("ResultImage");
 44 |         var imageDiv = document.createElement("div");
 45 |         var tableDiv = document.createElement("div");
 46 | 
 47 |         imageDiv.className = "col-md-5";
 48 |         imageDiv.style.paddingBottom="30px";
 49 | 
 50 |         imageDiv.style.clear="both";
 51 | 
 52 |         tableDiv.className="col-md-7";
 53 |         tableDiv.style.paddingBottom="30px";
 54 | 
 55 |         var newImage = document.createElement("img");
 56 |         newImage.style.height = "300px";
 57 |       newImage.className = "img-responsive";
 58 | 
 59 |         var newImageURL = response_data['uploaded_image_path'];
 60 |         var imID = "imDiv"+image_count;
 61 | 
 62 |         newImage.src = newImageURL;
 63 |         imageDiv.appendChild(newImage);
 64 |         parentDiv.appendChild(imageDiv);
 65 | 
 66 |         // Add question textbox and submit button here
 67 |         createButton(tableDiv, newImageURL, imID);
 68 | 
 69 |         var ansDiv = document.createElement("div");
 70 |         $(ansDiv).attr("id",imID);
 71 |         tableDiv.appendChild(ansDiv);
 72 |         parentDiv.appendChild(tableDiv);
 73 |         scrollToElement($(imageDiv));
 74 | 
 75 |     }
 76 | 
 77 |     function createButton(context, imgsrc, imageid){
 78 |         // generate question element 
 79 |         var questionArea = document.createElement("questionArea");
 80 |         $(questionArea).attr("rows","1");
 81 |         $(questionArea).attr("id","question"+imageid);
 82 |         // $(questionArea).attr("btid","bt"+imageid);
 83 |         $(questionArea).addClass("form-control")
 84 | 
 85 |         // Generate answer area 
 86 |         var answerArea = document.createElement("input");
 87 |         $(answerArea).attr("id","answer"+imageid);
 88 |         // $(answerArea).attr("btid","bt"+imageid);
 89 |         $(answerArea).addClass("form-control")
 90 |         var button = document.createElement("input");
 91 |         button.type = "button";
 92 |         button.value = "Submit";
 93 |         $(button).attr("onclick","submitQuestion('"+imgsrc+"','"+imageid+"')");
 94 |         $(button).attr("id","bt"+imageid);
 95 |         $(button).addClass("btn");
 96 |         $(button).addClass("btn-primary");
 97 | 
 98 |         
 99 |         context.appendChild(questionArea);
100 |         context.appendChild(answerArea);
101 |       
102 |         context.appendChild(document.createElement("br"));
103 |       }
104 | </script>
105 | 
106 | </html>
107 | 


--------------------------------------------------------------------------------
/classification.lua:
--------------------------------------------------------------------------------
-- Grad-CAM wrapper around a Caffe classification network (Torch7).
require 'torch'
require 'nn'
require 'image'
require 'loadcaffe'
-- NOTE: `utils` is assigned without `local`, so it becomes a global.
utils = require 'misc.utils'

-- Local alias of the preprocessing helper. The methods visible in this file
-- call utils.preprocess directly, so this alias appears to be unused.
local preprocess = utils.preprocess

-- Class handle; the methods below are attached to it.
local TorchModel = torch.class('ClassificationTorchModel')
 10 | 
 11 | function TorchModel:__init(proto_file, model_file, backend, input_sz, layer_name, seed, gpuid)
 12 | 
 13 |   self.proto_file = proto_file
 14 |   self.model_file = model_file
 15 |   self.backend = backend
 16 |   self.input_sz = input_sz
 17 |   self.layer_name = layer_name
 18 |   self.seed = seed
 19 |   self.gpuid = gpuid
 20 |   self:loadModel(proto_file, model_file, backend)
 21 |   torch.manualSeed(self.seed)
 22 |   -- GPU
 23 |   -- torch.setdefaulttensortype('torch.DoubleTensor')
 24 |   -- CPU
 25 |   torch.setdefaulttensortype('torch.FloatTensor')
 26 |   
 27 |   if gpuid >= 0 then
 28 |     require 'cunn'
 29 |     require 'cutorch'
 30 |     cutorch.setDevice(1)
 31 |     cutorch.manualSeed(seed)
 32 |   end
 33 | 
 34 | end
 35 | 
 36 | function TorchModel:loadModel(proto_file, model_file, backend)
 37 | 
 38 |   self.net = loadcaffe.load(proto_file, model_file, backend)
 39 |   self.net = self.net:float()
 40 | 
 41 |   -- Set to evaluate and remove softmax layer
 42 |   self.net:evaluate()
 43 |   self.net:remove()
 44 | 
 45 |   -- Create GB CNN here itself
 46 |   self.net_gb = self.net:clone()
 47 |   self.net_gb:replace(utils.guidedbackprop)
 48 |   self.net_gb = self.net_gb:float()
 49 | end
 50 | 
 51 | function TorchModel:predict(input_image_path, label, out_path)
 52 |   local img = utils.preprocess(input_image_path, input_sz, input_sz)
 53 | 
 54 |   if self.gpuid >= 0 then
 55 |     self.net:cuda()
 56 |     self.net_gb:cuda()
 57 |     img = img:cuda()
 58 |   else
 59 |     print("THIS GOT EXECUTED")
 60 |     img = img:float()
 61 |   end
 62 |   
 63 |   -- Forward pass
 64 |   local output = self.net:forward(img)
 65 |   local output_gb = self.net_gb:forward(img)
 66 | 
 67 |   -- Take argmax
 68 |   local score, pred_label = torch.max(output,1)
 69 | 
 70 |   if label == -1 then 
 71 |     print("No label provided, using predicted label ", pred_label:float())
 72 |     label = pred_label[1]
 73 |   end
 74 | 
 75 |   -- Set gradInput
 76 |   local doutput = utils.create_grad_input(self.net.modules[#self.net.modules], label)
 77 | 
 78 |   -- Grad-CAM
 79 |   local result = {}
 80 |   local gcam = utils.grad_cam(self.net, self.layer_name, doutput)
 81 |   gcam = image.scale(gcam:float(), self.input_sz, self.input_sz)
 82 |   local hm = utils.to_heatmap(gcam)
 83 | 
 84 |   image.save(out_path .. 'classify_gcam_raw_' .. label .. '.png', image.toDisplayTensor(gcam))
 85 |   result['classify_gcam_raw'] = out_path .. 'classify_gcam_raw_' .. label .. '.png'
 86 | 
 87 |   image.save(out_path .. 'classify_gcam_' .. label .. '.png', image.toDisplayTensor(hm))
 88 |   result['classify_gcam'] = out_path .. 'classify_gcam_' .. label .. '.png'
 89 | 
 90 |   -- Guided Backprop
 91 |   local gb_viz = self.net_gb:backward(img, doutput)
 92 |   
 93 |   -- BGR to RGB
 94 |   gb_viz = gb_viz:index(1, torch.LongTensor{3, 2, 1})
 95 |   image.save(out_path .. 'classify_gb_' .. label .. '.png', image.toDisplayTensor(gb_viz))
 96 |   result['classify_gb'] = out_path .. 'classify_gb_' .. label .. '.png'
 97 | 
 98 |   -- Guided Grad-CAM
 99 |   local gb_gcam = gb_viz:float():cmul(gcam:expandAs(gb_viz))
100 |   image.save(out_path .. 'classify_gb_gcam_' .. label .. '.png', image.toDisplayTensor(gb_gcam))
101 |   result['classify_gb_gcam'] = out_path .. 'classify_gb_gcam_' .. label .. '.png'
102 |   result['input_image'] = input_image_path
103 | 
104 |   result['label'] = label
105 |   result['pred_label'] = pred_label[1]
106 |   return result
107 | 
108 | end
109 | 


--------------------------------------------------------------------------------
/captioning.lua:
--------------------------------------------------------------------------------
-- Grad-CAM wrapper around a neuraltalk2 captioning checkpoint (Torch7).
require 'torch'
require 'nn'
require 'image'
-- NOTE: `utils` is assigned without `local`, so it becomes a global.
utils = require 'misc.utils'

-- Local alias of the preprocessing helper. The methods visible in this file
-- call utils.preprocess directly, so this alias appears to be unused.
local preprocess = utils.preprocess

-- Class handle; the methods below are attached to it.
local TorchModel = torch.class('CaptioningTorchModel')
  9 | 
 10 | function TorchModel:__init(model_path, backend, input_sz, layer, seed, gpuid)
 11 |   self.model_path = model_path
 12 |   self.backend = backend
 13 |   self.input_sz = input_sz
 14 |   self.layer = layer
 15 |   self.seed = seed
 16 |   self.gpuid = gpuid
 17 | 
 18 |   if self.gpuid >= 0 then
 19 |     require 'cunn'
 20 |     require 'cudnn'
 21 |     require 'cutorch'
 22 |     cutorch.setDevice(1)
 23 |     cutorch.manualSeed(self.seed)
 24 |   end
 25 |   
 26 |   self:loadModel(model_path)
 27 |   torch.manualSeed(self.seed)
 28 |   torch.setdefaulttensortype('torch.FloatTensor')
 29 | 
 30 | 
 31 |   -- neuraltalk2-specific dependencies
 32 |   -- https://github.com/karpathy/neuraltalk2
 33 | 
 34 | 
 35 | end
 36 | 
 37 | 
 38 | function TorchModel:loadModel(model_path)
 39 | 
 40 |   -- Load the models
 41 |   local lm_misc_utils = require 'neuraltalk2.misc.utils'
 42 |   require 'neuraltalk2.misc.LanguageModel'
 43 |   local net_utils = require 'neuraltalk2.misc.net_utils'
 44 | 
 45 | 
 46 |   self.net = torch.load(model_path)
 47 |   print(self.net)
 48 |   local cnn_lm_model = self.net
 49 |   local cnn = cnn_lm_model.protos.cnn
 50 |   local lm = cnn_lm_model.protos.lm
 51 |   local vocab = cnn_lm_model.vocab
 52 | 
 53 | 
 54 |   net_utils.unsanitize_gradients(cnn)
 55 |   local lm_modules = lm:getModulesList()
 56 |   for k,v in pairs(lm_modules) do
 57 |     net_utils.unsanitize_gradients(v)
 58 |   end
 59 | 
 60 | 
 61 |   -- Set to evaluate mode
 62 |   lm:evaluate()
 63 |   cnn:evaluate()
 64 |   self.cnn = cnn
 65 |   self.lm = lm
 66 |   self.net_utils = net_utils
 67 |   self.vocab = vocab
 68 | 
 69 | end
 70 | 
 71 | 
 72 | function TorchModel:predict(input_image_path, input_sz, input_sz, input_caption, out_path)
 73 |   print(input_image_path)
 74 |   local img = utils.preprocess(input_image_path, input_sz, input_sz)
 75 | 
 76 |   -- Clone & replace ReLUs for Guided Backprop
 77 |   local cnn_gb = self.cnn:clone()
 78 |   cnn_gb:replace(utils.guidedbackprop)
 79 | 
 80 |   -- Ship model to GPU
 81 |   if self.gpuid >= 0 then
 82 |     self.cnn:cuda()
 83 |     cnn_gb:cuda()
 84 |     img = img:cuda()
 85 |     self.lm:cuda()
 86 |   end
 87 | 
 88 |   -- Forward pass
 89 |   im_feats = self.cnn:forward(img)
 90 |   im_feat = im_feats:view(1, -1)
 91 |   im_feat_gb = cnn_gb:forward(img)
 92 | 
 93 |   -- get the prediction from model
 94 |   local seq, seqlogps = self.lm:sample(im_feat, sample_opts)
 95 |   seq[{{}, 1}] = seq
 96 | 
 97 |   local caption = self.net_utils.decode_sequence(self.vocab, seq)
 98 | 
 99 |   if input_caption == '' then
100 |     print("No caption provided, using generated caption for Grad-CAM.")
101 |     input_caption = caption[1]
102 |   end
103 | 
104 |   print("Generated caption: ", caption[1])
105 |   print("Grad-CAM caption: ", input_caption)
106 | 
107 |   local seq_length = self.seq_length or 16
108 | 
109 |   local labels = utils.sent_to_label(self.vocab, input_caption, seq_length)
110 |   if self.gpuid >=0 then labels = labels:cuda() end
111 | 
112 |   local logprobs = self.lm:forward({im_feat, labels})
113 | 
114 |   local doutput = utils.create_grad_input_lm(logprobs, labels)
115 |   if self.gpuid >=0 then doutput = doutput:cuda() end
116 | 
117 |   -- lm backward
118 |   local dlm, ddummy = unpack(self.lm:backward({im_feat, labels}, doutput))
119 |   local dcnn = dlm[1]
120 | 
121 |   -- Grad-CAM
122 |   local gcam = utils.grad_cam(self.cnn, self.layer, dcnn)
123 |   gcam = image.scale(gcam:float(), self.input_sz, self.input_sz)
124 | 
125 |   local result = {}
126 |   local hm = utils.to_heatmap(gcam)
127 | 
128 |   image.save(out_path .. 'captioning_gcam_raw_' .. input_caption .. '.png', image.toDisplayTensor(gcam))
129 |   result['captioning_gcam_raw'] = out_path .. 'captioning_gcam_raw_' .. input_caption .. '.png'
130 | 
131 |   image.save(out_path .. 'caption_gcam_'  .. input_caption .. '.png', image.toDisplayTensor(hm))
132 |   result['captioning_gcam'] = out_path .. 'caption_gcam_'  .. input_caption .. '.png'
133 | 
134 |   -- Guided Backprop
135 |   local gb_viz = cnn_gb:backward(img, dcnn)
136 | 
137 |   -- BGR to RGB
138 |   gb_viz = gb_viz:index(1, torch.LongTensor{3, 2, 1})
139 | 
140 |   image.save(out_path .. 'caption_gb_' .. input_caption .. '.png', image.toDisplayTensor(gb_viz))
141 |   result['captioning_gb'] = out_path .. 'caption_gb_' .. input_caption .. '.png'
142 | 
143 |   -- Guided Grad-CAM
144 |   local gb_gcam = gb_viz:float():cmul(gcam:expandAs(gb_viz))
145 |   image.save(out_path .. 'caption_gb_gcam_' .. input_caption .. '.png', image.toDisplayTensor(gb_gcam))
146 |   result['captioning_gb_gcam'] = out_path .. 'caption_gb_gcam_' .. input_caption .. '.png'
147 | 
148 |   result['input_image'] = input_image_path
149 |   result['input_caption'] = input_caption
150 |   result['pred_caption'] = caption[1]
151 | 
152 |   return result
153 | 
154 | end
155 | 


--------------------------------------------------------------------------------
/misc/utils.lua:
--------------------------------------------------------------------------------
  1 | local utils = {}
  2 | 
  3 | -- Preprocess the image before passing it to a Caffe model.
  4 | function utils.preprocess(path, width, height)
  5 |   local width = width or 224
  6 |   local height = height or 224
  7 |   -- load image
  8 |   local orig_image = image.load(path)
  9 | 
 10 |   -- handle greyscale and rgba images
 11 |   if orig_image:size(1) == 1 then
 12 |     orig_image = orig_image:repeatTensor(3, 1, 1)
 13 |   elseif orig_image:size(1) == 4 then
 14 |     orig_image = orig_image[{{1,3},{},{}}]
 15 |   end
 16 | 
 17 |   -- get the dimensions of the original image
 18 |   local im_height = orig_image:size(2)
 19 |   local im_width = orig_image:size(3)
 20 | 
 21 |   -- scale and subtract mean
 22 |   local img = image.scale(orig_image, width, height):double()
 23 |   local mean_pixel = torch.DoubleTensor({103.939, 116.779, 123.68})
 24 |   img = img:index(1, torch.LongTensor{3, 2, 1}):mul(255.0)
 25 |   mean_pixel = mean_pixel:view(3, 1, 1):expandAs(img)
 26 |   img:add(-1, mean_pixel)
 27 |   return img, im_height, im_width
 28 | end
 29 | 
 30 | -- Replace ReLUs with DeconvReLUs
 31 | function utils.deconv(m)
 32 |   require 'misc.DeconvReLU'
 33 |   local name = torch.typename(m)
 34 |   if name == 'nn.ReLU' or name == 'cudnn.ReLU' then
 35 |     return nn.DeconvReLU()
 36 |   else
 37 |     return m
 38 |   end
 39 | end
 40 | 
 41 | -- Replace ReLUs with DeconvReLUs
 42 | function utils.guidedbackprop(m)
 43 |   require 'misc.GuidedBackpropReLU'
 44 |   local name = torch.typename(m)
 45 |   if name == 'nn.ReLU' or name == 'cudnn.ReLU' then
 46 |     return nn.GuidedBackpropReLU()
 47 |   else
 48 |     return m
 49 |   end
 50 | end
 51 | 
 52 | -- Get layer id from name
 53 | function utils.cnn_layer_id(cnn, layer_name)
 54 |   for i = 1, #cnn.modules do
 55 |     local layer = cnn:get(i)
 56 |     local name = layer.name
 57 |     if name == layer_name then
 58 |       return i
 59 |     end
 60 |   end
 61 |   return -1
 62 | end
 63 | 
 64 | -- Synthesize gradInput tensor
 65 | function utils.create_grad_input(module, label)
 66 |   local doutput = module.output:clone():view(-1)
 67 |   doutput:fill(0)
 68 |   doutput[label] = 1
 69 |   return doutput
 70 | end
 71 | 
 72 | -- Creates gradInput for neuraltalk2 Language Model
 73 | function utils.create_grad_input_lm(input, labels)
 74 |   local output = torch.zeros(input:size()):fill(0)
 75 |   for t =1,labels:size(1) do
 76 |     if labels[t][1]~=0 then
 77 |       output[t+1][1][labels[t][1]] = 1
 78 |     end
 79 |   end
 80 |   return output
 81 | end
 82 | 
 83 | -- Generate Grad-CAM
 84 | function utils.grad_cam(cnn, layer_name, doutput)
 85 |   -- Split model into two
 86 |   local model1, model2 = nn.Sequential(), nn.Sequential()
 87 |   if tonumber(layer_name) == nil then
 88 | 
 89 |    for i = 1, #cnn.modules do
 90 |       model1:add(cnn:get(i))
 91 |       layer_id = i
 92 |       if cnn:get(i).name == layer_name then
 93 |         break
 94 |       end
 95 |     end
 96 |   else
 97 | 
 98 |     layer_id = tonumber(layer_name)
 99 |     for i = 1, #cnn.modules do
100 |       model1:add(cnn:get(i))
101 |       if i == layer_id then
102 |         break
103 |       end
104 |     end
105 |   end
106 | 
107 |   for i = layer_id+1, #cnn.modules do
108 |     model2:add(cnn:get(i))
109 |   end
110 | 
111 |   -- Get activations and gradients
112 |   model2:zeroGradParameters()
113 |   model2:backward(model1.output, doutput)
114 |   
115 |   -- Get the activations from model1 and and gradients from model2
116 |   local activations = model1.output:squeeze()
117 |   local gradients = model2.gradInput:squeeze()
118 | 
119 |   -- Global average pool gradients
120 |   local weights = torch.sum(gradients:view(activations:size(1), -1), 2)
121 | 
122 |   -- Summing and rectifying weighted activations across depth
123 |   local map = torch.sum(torch.cmul(activations, weights:view(activations:size(1), 1, 1):expandAs(activations)), 1)
124 |   map = map:cmul(torch.gt(map,0):typeAs(map))
125 | 
126 |   return map
127 | end
128 | 
-- Return a new table that maps every value of `t` back to its key.
-- When several keys share a value, whichever pair is visited last wins.
function utils.table_invert(t)
  local inverted = {}
  for key, value in pairs(t) do
    inverted[value] = key
  end
  return inverted
end
136 | 
-- Convert a sentence into a (seq_length x 1) tensor of vocabulary indices.
--
-- Parameters:
--   vocab      - table mapping index -> word (it is inverted here)
--   sent       - sentence; words are the maximal runs matching '%w+'
--   seq_length - number of rows of the returned tensor
--
-- Words that are not in the vocabulary are replaced by the 'UNK' entry.
-- Rows beyond the last word stay 0. Words beyond `seq_length` are dropped;
-- previously a longer sentence indexed past the end of the tensor and
-- raised an error.
function utils.sent_to_label(vocab, sent, seq_length)
  local inv_vocab = utils.table_invert(vocab)
  local labels = torch.zeros(seq_length, 1)
  local i = 0
  for word in sent:gmatch('%w+') do
    if i >= seq_length then
      break
    end
    -- we replace out of vocabulary words with UNK
    local ix_word = inv_vocab[word] or inv_vocab['UNK']
    i = i + 1
    labels[{{i},{1}}] = ix_word
  end
  return labels
end
152 | 
-- Convert a single-channel map into a 3-channel colour heatmap.
--
-- The map is first passed through image.toDisplayTensor; every pixel of its
-- first channel is then mapped through a four-segment colour ramp with
-- breakpoints at 0.25, 0.5 and 0.75.
function utils.to_heatmap(map)
  local display = image.toDisplayTensor(map)
  local rows, cols = display:size(2), display:size(3)
  local cmap = torch.Tensor(3, rows, cols):fill(1)

  for i = 1, rows do
    for j = 1, cols do
      local value = display[1][i][j]
      -- Channels default to 1; each segment overrides two of them.
      local c1, c2, c3 = 1, 1, 1
      if value <= 0.25 then
        c1, c2 = 0, 4*value
      elseif value <= 0.5 then
        c1, c3 = 0, 2 - 4*value
      elseif value <= 0.75 then
        c1, c3 = 4*value - 2, 0
      else
        c2, c3 = 4 - 4*value, 0
      end
      cmap[1][i][j] = c1
      cmap[2][i][j] = c2
      cmap[3][i][j] = c3
    end
  end
  return cmap
end
176 | 
177 | return utils
178 | 


--------------------------------------------------------------------------------
/visual_question_answering.lua:
--------------------------------------------------------------------------------
-- Grad-CAM wrapper around the VQA_LSTM_CNN model (Torch7).
require 'torch'
require 'nn'
require 'image'
require 'loadcaffe'
-- NOTE: `utils` is assigned without `local`, so it becomes a global.
utils = require 'misc.utils'

-- Local alias of the preprocessing helper. The methods visible in this file
-- call utils.preprocess directly, so this alias appears to be unused.
local preprocess = utils.preprocess

-- Class handle; the methods below are attached to it.
local TorchModel = torch.class('VQATorchModel')
 10 | 
 11 | function TorchModel:__init(proto_file, model_file, input_sz, backend, layer_name, model_path, input_encoding_size, rnn_size, rnn_layers, common_embedding_size, num_output, seed, gpuid)
 12 | 
 13 |   self.input_sz = input_sz
 14 |   self.layer_name = layer_name
 15 |   self.model_path = model_path
 16 |   self.input_encoding_size = input_encoding_size
 17 |   self.rnn_size = rnn_size
 18 |   self.rnn_layers = rnn_layers
 19 |   self.common_embedding_size = common_embedding_size
 20 |   self.num_output = num_output
 21 |   self.seed = seed
 22 |   self.gpuid = gpuid
 23 |   self:loadModel(proto_file, model_file, backend)
 24 | 
 25 |   torch.manualSeed(self.seed)
 26 |   -- For GPU
 27 |   torch.setdefaulttensortype('torch.FloatTensor')
 28 |   -- For CPU
 29 |   -- torch.setdefaulttensortype('torch.DoubleTensor')
 30 | 
 31 |   if self.gpuid >= 0 then
 32 |     require 'cunn'
 33 |     require 'cutorch'
 34 |     cutorch.setDevice(1)
 35 |     cutorch.manualSeed(self.seed)
 36 |   end
 37 |   collectgarbage()
 38 | end
 39 | 
-- Load the image CNN and assemble the VQA networks.
--
-- Reads self.gpuid, self.input_encoding_size, self.rnn_size,
-- self.rnn_layers, self.common_embedding_size, self.num_output and
-- self.model_path, so those must be set before this is called.
--
-- After the call the instance holds: net, cnn_gb, embedding_net_q,
-- encoder_net_buffer_q, vocabulary_size_q, multimodal_net, dummy_state_q
-- and json_file.
--
-- Side effects: assigns the globals opt, LSTM, cjson, embedding_w_q,
-- embedding_dw_q, encoder_w_q, encoder_dw_q, multimodal_w, multimodal_dw
-- and model_param. predict relies on the global `cjson`.
function TorchModel:loadModel(proto_file, model_file, backend)
  -- Load CNN
  self.net = loadcaffe.load(proto_file, model_file, backend)

  -- Set to evaluate and remove linear+softmax layer
  self.net:evaluate()
  self.net:remove()
  self.net:remove()
  self.net:add(nn.Normalize(2))

  -- Clone & replace ReLUs for Guided Backprop
  local cnn_gb = self.net:clone()
  cnn_gb:replace(utils.guidedbackprop)
  self.cnn_gb = cnn_gb
  -- VQA-specific dependencies
  -- https://github.com/VT-vision-lab/VQA_LSTM_CNN/blob/master/eval.lua

  -- Below is a hacky solution since opt.gpuid is used in VQA_LSTM_CNN/misc.RNNUtils
  -- (`opt` is deliberately a global so the required modules can see it)
  opt = {}
  opt.gpuid = self.gpuid

  require 'VQA_LSTM_CNN/misc.netdef'
  require 'VQA_LSTM_CNN/misc.RNNUtils'
  LSTM = require 'VQA_LSTM_CNN/misc.LSTM'
  cjson = require 'cjson'

  -- Load vocabulary
  -- NOTE(review): io.open's result is not checked, and file:read() with no
  -- argument reads a single line; this presumably relies on the JSON being
  -- stored on one line. Confirm.
  local file = io.open('VQA_LSTM_CNN/data_prepro.json','r')
  local text = file:read()
  file:close()
  local json_file = cjson.decode(text)
  -- Count the entries of ix_to_word to obtain the question vocabulary size
  local vocabulary_size_q = 0
  for i, w in pairs(json_file['ix_to_word']) do vocabulary_size_q = vocabulary_size_q + 1 end


  -- VQA model definition
  local embedding_net_q = nn.Sequential()
    :add(nn.Linear(vocabulary_size_q, self.input_encoding_size))
    :add(nn.Dropout(0.5))
    :add(nn.Tanh())

  local encoder_net_q = LSTM.lstm_conventional(self.input_encoding_size, self.rnn_size, 1, self.rnn_layers, 0.5)

  local multimodal_net = nn.Sequential()
    :add(netdef.AxB(2 * self.rnn_size * self.rnn_layers, 4096, self.common_embedding_size, 0.5))
    :add(nn.Dropout(0.5))
    :add(nn.Linear(self.common_embedding_size, self.num_output))

  local dummy_state_q = torch.Tensor(self.rnn_size * self.rnn_layers * 2):fill(0)
  local dummy_output_q = torch.Tensor(1):fill(0)

  -- Ship model to GPU
  -- NOTE(review): the constructor requires 'cunn' only after this method
  -- returns, so :cuda() here presumably depends on the package having been
  -- loaded already (e.g. by loadcaffe). Confirm.
  if self.gpuid >= 0 then
    embedding_net_q:cuda()
    encoder_net_q:cuda()
    multimodal_net:cuda()
    dummy_state_q = dummy_state_q:cuda()
    dummy_output_q = dummy_output_q:cuda()
  end

  -- Set to evaluate
  embedding_net_q:evaluate()
  encoder_net_q:evaluate()
  multimodal_net:evaluate()

  -- Zero gradients
  embedding_net_q:zeroGradParameters()
  encoder_net_q:zeroGradParameters()
  multimodal_net:zeroGradParameters()

  -- Load pretrained VQA model: fetch each network's flattened parameters
  -- and overwrite them with the weights stored in the checkpoint
  embedding_w_q, embedding_dw_q = embedding_net_q:getParameters()
  encoder_w_q, encoder_dw_q = encoder_net_q:getParameters()
  multimodal_w, multimodal_dw = multimodal_net:getParameters()

  model_param = torch.load(self.model_path)
  embedding_w_q:copy(model_param['embedding_w_q'])
  encoder_w_q:copy(model_param['encoder_w_q'])
  multimodal_w:copy(model_param['multimodal_w'])

  -- dupe_rnn is provided by the VQA_LSTM_CNN modules required above; 26 is
  -- presumably the maximum question length (TODO confirm)
  local encoder_net_buffer_q = dupe_rnn(encoder_net_q, 26)

  -- all below variables are used in predict method
  self.embedding_net_q = embedding_net_q
  self.encoder_net_buffer_q = encoder_net_buffer_q
  self.vocabulary_size_q = vocabulary_size_q
  self.multimodal_net = multimodal_net
  self.dummy_state_q = dummy_state_q
  self.json_file = json_file

end
131 | 
-- Quote `s` so that a POSIX shell passes it on as one literal argument.
local function shell_quote(s)
  local escaped = tostring(s):gsub("'", "'\\''")
  return "'" .. escaped .. "'"
end

-- Answer a question about one image and write Grad-CAM visualisations for
-- an answer.
--
-- Parameters:
--   input_image_path - path of the image
--   input_sz         - preprocessing size. The name appears twice in the
--                      signature (kept for caller compatibility); Lua binds
--                      the body's `input_sz` to the second occurrence.
--   input_question   - question text (untrusted user input)
--   input_answer     - answer to explain; when it is '' or not in the answer
--                      vocabulary the predicted answer is used instead
--   out_path         - prefix the output file names are appended to
--
-- Returns a table with the paths of the written PNGs (vqa_gcam_raw,
-- vqa_gcam, vqa_gb, vqa_gb_gcam) plus input_answer, answer and input_image.
--
-- NOTE(review): the tokenised question is exchanged through the fixed file
-- 'ques_feat.json' in the working directory, so concurrent calls from the
-- same directory can read each other's question.
function TorchModel:predict(input_image_path, input_sz, input_sz, input_question, input_answer, out_path)

  -- Load image
  local img = utils.preprocess(input_image_path, input_sz, input_sz)
  -- Ship CNNs and image to GPU
  if self.gpuid >= 0 then
    self.net:cuda()
    self.cnn_gb:cuda()
    img = img:cuda()
  end

  -- Forward pass. cnn_gb is forwarded only so that its backward pass below
  -- has activations to work with.
  local fv_im = self.net:forward(img)
  self.cnn_gb:forward(img)

  -- Tokenize question. The question comes from the user, so it is
  -- shell-quoted instead of being spliced between double quotes (which
  -- allowed command injection through `"`, `$()` or backticks).
  local status = os.execute('python misc/prepro_ques.py --question ' .. shell_quote(input_question))
  -- Lua 5.1 / LuaJIT return the exit status (0 on success); 5.2+ return true.
  if status ~= 0 and status ~= true then
    error('misc/prepro_ques.py failed while tokenizing the question')
  end
  local file = assert(io.open('ques_feat.json'), 'ques_feat.json was not produced by misc/prepro_ques.py')
  local text = file:read('*a')
  file:close()
  local q_feats = cjson.decode(text)

  local question = right_align(torch.LongTensor{q_feats.ques}, torch.LongTensor{q_feats.ques_length})
  local fv_sorted_q = sort_encoding_onehot_right_align(question, torch.LongTensor{q_feats.ques_length}, self.vocabulary_size_q)

  -- Ship question features to GPU
  if self.gpuid >= 0 then
    fv_sorted_q[1] = fv_sorted_q[1]:cuda()
    fv_sorted_q[3] = fv_sorted_q[3]:cuda()
    fv_sorted_q[4] = fv_sorted_q[4]:cuda()
  else
    fv_sorted_q[1] = fv_sorted_q[1]:double()
  end

  local question_max_length = fv_sorted_q[2]:size(1)

  -- Embedding forward
  local word_embedding_q = split_vector(self.embedding_net_q:forward(fv_sorted_q[1]), fv_sorted_q[2])

  -- Encoder forward
  local states_q = rnn_forward(self.encoder_net_buffer_q, torch.repeatTensor(self.dummy_state_q:fill(0), 1, 1), word_embedding_q, fv_sorted_q[2])

  -- Multimodal forward
  local tv_q = states_q[question_max_length + 1]:index(1, fv_sorted_q[4])
  local scores = self.multimodal_net:forward({tv_q, fv_im})

  -- Get predictions
  local _, pred = torch.max(scores:double(), 2)
  local answer = self.json_file['ix_to_ans'][tostring(pred[{1, 1}])]

  -- Pick the answer to explain: the requested one when it is known,
  -- otherwise the predicted one.
  local inv_vocab = utils.table_invert(self.json_file['ix_to_ans'])
  local answer_idx
  if input_answer ~= '' and inv_vocab[input_answer] ~= nil then
    answer_idx = inv_vocab[input_answer]
  else
    input_answer = answer
    answer_idx = inv_vocab[answer]
  end

  -- Set gradInput
  local doutput = utils.create_grad_input(self.multimodal_net.modules[#self.multimodal_net.modules], answer_idx)

  -- Multimodal backward; the second gradient is the one w.r.t. fv_im
  local tmp = self.multimodal_net:backward({tv_q, fv_im}, doutput:view(1,-1))
  local dcnn = tmp[2]

  local result = {}

  -- Saves `tensor` as "<out_path>vqa_<kind>_<answer>.png" and records the
  -- path under result['vqa_<kind>'].
  local function save(kind, tensor)
    local path = out_path .. 'vqa_' .. kind .. '_' .. input_answer .. '.png'
    image.save(path, image.toDisplayTensor(tensor))
    result['vqa_' .. kind] = path
  end

  -- Grad-CAM
  local gcam = utils.grad_cam(self.net, self.layer_name, dcnn)
  gcam = image.scale(gcam:float(), self.input_sz, self.input_sz)
  save('gcam_raw', gcam)
  save('gcam', utils.to_heatmap(gcam))

  -- Guided Backprop (channel order flipped back from BGR to RGB)
  local gb_viz = self.cnn_gb:backward(img, dcnn)
  gb_viz = gb_viz:index(1, torch.LongTensor{3, 2, 1})
  save('gb', gb_viz)

  -- Guided Grad-CAM
  local gb_gcam = gb_viz:float():cmul(gcam:expandAs(gb_viz))
  save('gb_gcam', gb_gcam)

  result['input_answer'] = input_answer
  result['answer'] = answer
  result['input_image'] = input_image_path
  return result
end
229 | 


--------------------------------------------------------------------------------
/grad_cam/views.py:
--------------------------------------------------------------------------------
  1 | from django.shortcuts import render
  2 | from django.http import JsonResponse
  3 | from django.conf import settings
  4 | from channels import Group
  5 | 
  6 | from grad_cam.sender import grad_cam_classification, grad_cam_vqa, grad_cam_captioning
  7 | from grad_cam.utils import log_to_terminal
  8 | import grad_cam.constants as constants
  9 | import uuid
 10 | import os
 11 | import random
 12 | import traceback
 13 | import urllib2
 14 | import requests
 15 | from urlparse import urlparse
 16 | from django.http import HttpResponse
 17 | 
 18 | 
 19 | def home(request, template_name="index.html"):
 20 |     return render(request, template_name,)
 21 | 
 22 | 
 23 | def vqa(request, template_name="vqa/vqa.html"):
 24 |     socketid = uuid.uuid4()
 25 |     if request.method == "POST":
 26 |         # get the parameters from client side
 27 |         try:
 28 |             socketid = request.POST.get('socketid')
 29 |             input_question = request.POST.get('question', '')
 30 |             input_answer = request.POST.get('answer', None)
 31 |             img_path = request.POST.get('img_path')
 32 |             img_path = urllib2.unquote(img_path)
 33 | 
 34 |             abs_image_path = settings.BASE_DIR + str(img_path)
 35 |             # abs_image_path = os.path.join(settings.BASE_DIR, str(img_path[1:]))
 36 |             out_dir = os.path.dirname(abs_image_path)
 37 |             # Run the VQA wrapper
 38 |             log_to_terminal(socketid, {"terminal": "Starting Visual Question Answering job..."})
 39 |             response = grad_cam_vqa(str(input_question), str(input_answer), str(abs_image_path), str(out_dir+"/"), socketid)
 40 |         except Exception, err:
 41 |             log_to_terminal(socketid, {"terminal": traceback.print_exc()})
 42 | 
 43 |     demo_images = get_demo_images(constants.COCO_IMAGES_PATH)
 44 |     return render(request, template_name, {"demo_images": demo_images, 'socketid': socketid})
 45 | 
 46 | 
 47 | def classification(request, template_name="classification/classification.html"):
 48 |     socketid = uuid.uuid4()
 49 |     if request.method == "POST":
 50 |         try:
 51 |             img_path = request.POST.get('img_path')
 52 |             img_path = urllib2.unquote(img_path)
 53 |             label = request.POST.get('label')
 54 |             socketid = request.POST.get('socketid')
 55 | 
 56 |             abs_image_path = os.path.join(settings.BASE_DIR, str(img_path[1:]))
 57 |             out_dir = os.path.dirname(abs_image_path)
 58 | 
 59 |             # Run the classification wrapper
 60 |             log_to_terminal(socketid, {"terminal": "Starting classification job on VGG_ILSVRC_16_layers.caffemodel"})
 61 |             response = grad_cam_classification(str(abs_image_path), int(label), str(out_dir+"/"), socketid)
 62 |         except Exception, err:
 63 |             log_to_terminal(socketid, {"terminal": traceback.print_exc()})
 64 |     demo_images = get_demo_images(constants.COCO_IMAGES_PATH)
 65 |     return render(request, template_name, {"demo_images": demo_images, 'socketid': socketid})
 66 | 
 67 | 
 68 | def captioning(request, template_name="captioning/captioning.html"):
 69 |     socketid = uuid.uuid4()
 70 |     if request.method == "POST":
 71 |         try:
 72 |             img_path = request.POST.get('img_path')
 73 |             img_path = urllib2.unquote(img_path)
 74 |             caption = request.POST.get('caption', '')
 75 |             socketid = request.POST.get('socketid')
 76 | 
 77 |             abs_image_path = os.path.join(settings.BASE_DIR, str(img_path[1:]))
 78 |             out_dir = os.path.dirname(abs_image_path)
 79 | 
 80 |             # Run the captioning wrapper
 81 |             log_to_terminal(socketid, {"terminal": "Starting Captioning job..."})
 82 |             response = grad_cam_captioning(str(abs_image_path), str(caption), str(out_dir+"/"), socketid)
 83 |         except Exception, err:
 84 |             log_to_terminal(socketid, {"terminal": traceback.print_exc()})
 85 | 
 86 |     demo_images = get_demo_images(constants.COCO_IMAGES_PATH)
 87 |     return render(request, template_name, {"demo_images": demo_images, 'socketid': socketid})
 88 | 
 89 | 
 90 | def file_upload(request):
 91 |     if request.method == "POST":
 92 |         image = request.FILES['file']
 93 |         demo_type = request.POST.get("type")
 94 | 
 95 |         if demo_type == "vqa":
 96 |             dir_type = constants.VQA_CONFIG['image_dir']
 97 |         elif demo_type == "classification":
 98 |             dir_type = constants.CLASSIFICATION_CONFIG['image_dir']
 99 |         elif demo_type == "captioning":
100 |             dir_type = constants.CAPTIONING_CONFIG['image_dir']
101 | 
102 |         random_uuid = uuid.uuid1()
103 |         # handle image upload
104 |         output_dir = os.path.join(dir_type, str(random_uuid))
105 | 
106 |         if not os.path.exists(output_dir):
107 |             os.makedirs(output_dir)
108 | 
109 |         img_path = os.path.join(output_dir, str(image))
110 |         handle_uploaded_file(image, img_path)
111 |         return JsonResponse({"file_path": img_path})
112 |     else:
113 |         pass
114 | 
115 | 
116 | 
def handle_uploaded_file(f, path):
    """Write every chunk yielded by ``f.chunks()`` to ``path``.

    The destination is opened in ``'wb+'`` mode, so an existing file is
    truncated.
    """
    with open(path, 'wb+') as out_file:
        out_file.writelines(f.chunks())
121 | 
122 | 
def get_demo_images(demo_images_path):
    """Return six image URLs to show as demo inputs.

    Six files are picked at random from the top level of
    ``demo_images_path`` and returned as URLs under
    ``MEDIA_URL/coco/val2014``. When that fails for any reason (for example
    the directory is missing or empty) the six bundled static images are
    returned instead.
    """
    try:
        # next(os.walk(...)) yields (dirpath, dirnames, filenames) for the
        # top-level directory only; index 2 is the list of file names.
        images_list = next(os.walk(demo_images_path))[2]
        demo_images = select_random_six_demo_images(images_list)

        demo_images = [os.path.join(settings.MEDIA_URL, 'coco', 'val2014', x) for x in demo_images]
    except Exception:
        # Deliberate best-effort fallback. `Exception` (rather than a bare
        # except) keeps SystemExit / KeyboardInterrupt from being swallowed.
        images = ['img1.jpg', 'img2.jpg', 'img3.jpg', 'img4.jpg', 'img5.jpg', 'img6.jpg']
        demo_images = [os.path.join(settings.STATIC_URL, 'images', x) for x in images]
    return demo_images
133 | 
134 | 
def select_random_six_demo_images(images_list):
    """Pick six file names at random, skipping generated result images.

    Names starting with ``classify``, ``vqa`` or ``caption`` are excluded.
    The six picks are independent, so a name may appear more than once.

    Filtering before sampling gives the same distribution as the earlier
    "draw six, start over if any is excluded" recursion, without the
    unbounded recursion when every file is excluded.

    Raises:
        IndexError: if no eligible file name is available.
    """
    prefixes = ('classify', 'vqa', 'caption')
    candidates = [name for name in images_list if not name.startswith(prefixes)]
    return [random.choice(candidates) for _ in range(6)]
142 | 
143 | 
144 | def upload_image_using_url(request):
145 |     if request.method == "POST":
146 |         try:
147 |             socketid = request.POST.get('socketid', None)
148 |             image_url = request.POST.get('src', None)
149 |             demo_type = request.POST.get('type')
150 | 
151 |             if demo_type == "vqa":
152 |                 dir_type = constants.VQA_CONFIG['image_dir']
153 |             elif demo_type == "classification":
154 |                 dir_type = constants.CLASSIFICATION_CONFIG['image_dir']
155 |             elif demo_type == "captioning":
156 |                 dir_type = constants.CAPTIONING_CONFIG['image_dir']
157 | 
158 |             img_name =  os.path.basename(urlparse(image_url).path)
159 |             response = requests.get(image_url, stream=True)
160 | 
161 |             if response.status_code == 200:
162 |                 random_uuid = uuid.uuid1()
163 |                 output_dir = os.path.join(dir_type, str(random_uuid))
164 | 
165 |                 if not os.path.exists(output_dir):
166 |                     os.makedirs(output_dir)
167 | 
168 |                 img_path = os.path.join(output_dir, str(img_name))
169 |                 with open(os.path.join(output_dir, img_name), 'wb+') as f:
170 |                     f.write(response.content)
171 | 
172 |                 img_path =  "/" + "/".join(img_path.split('/')[-5:])
173 |                 
174 |                 return JsonResponse({"file_path": img_path})
175 |             else:
176 |                 return HttpResponse("Please Enter the Correct URL.")
177 |         except:
178 |             return HttpResponse("No images matching this url.")
179 |     else:
180 |         return HttpResponse("Invalid request method.")
181 | 
182 | 
183 | def captioning_api(request):
184 |     if request.method == "POST":
185 |         try:
186 |             image = request.FILES['image']
187 |             caption = request.POST.get('caption', '')
188 | 
189 |             abs_image_path = os.path.join(settings.BASE_DIR, str(img_path[1:]))
190 |             out_dir = os.path.dirname(abs_image_path)
191 | 
192 |             # Run the captioning wrapper
193 |             log_to_terminal(socketid, {"terminal": "Starting Captioning job..."})
194 |             response = grad_cam_captioning(str(abs_image_path), str(caption), str(out_dir+"/"), socketid)
195 |         except Exception, err:
196 |             log_to_terminal(socketid, {"terminal": traceback.print_exc()})
197 | 
198 |     demo_images = get_demo_images(constants.COCO_IMAGES_PATH)
199 |     return render(request, template_name, {"demo_images": demo_images, 'socketid': socketid})
200 | 


--------------------------------------------------------------------------------
/grad_cam/templates/home.html:
--------------------------------------------------------------------------------
  1 | {% load static %}
  2 | <html lang="en">
  3 | <head>
  4 |     <meta charset="utf-8">
  5 |     <title>Grad-CAM: Gradient-weighted Class Activation Mapping</title>
  6 |     <meta name="description" content="Grad-CAM: Gradient-weighted Class Activation Mapping">
  7 |     <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 |     <link href='http://fonts.googleapis.com/css?family=Roboto:400,100,100italic,300,300italic,400italic,500,500italic,700,700italic,900italic,900' rel='stylesheet' type='text/css'>
  9 |     <link rel="stylesheet" href="//netdna.bootstrapcdn.com/bootstrap/3.0.0/css/bootstrap.min.css">
 10 |     <link rel="stylesheet" href="http://cloudcv.org/static/css/style.css">
 11 |     <link rel="stylesheet" href="https://maxcdn.bootstrapcdn.com/font-awesome/4.5.0/css/font-awesome.min.css">
 12 |     <link rel="stylesheet" href="//code.jquery.com/ui/1.12.0/themes/base/jquery-ui.css">
 13 | 
 14 |     <script src="/static/js/dropzone.js"></script>
 15 |     <script src="//ajax.googleapis.com/ajax/libs/jquery/1.10.2/jquery.min.js"></script>
 16 |     <script src="http://cloudcv.org/static/js/vendor/jquery.ui.widget.js"></script>
 17 |     <script src="http://cloudcv.org/node/socket.io/socket.io.js"></script>
 18 |     <script src="https://code.jquery.com/ui/1.12.0/jquery-ui.js"></script>
 19 |     <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/dropzone/4.3.0/min/dropzone.min.css">
 20 | </head>
 21 | <body>
 22 | 
 23 | <div class="navbar navbar-inverse navbar-fixed-top">
 24 |     <div class="container">
 25 |         <div class="navbar-header">
 26 |             <button type="button" class="navbar-toggle" data-toggle="collapse" data-target=".navbar-fixed-top .navbar-collapse">
 27 |                 <span class="icon-bar"></span>
 28 |                 <span class="icon-bar"></span>
 29 |                 <span class="icon-bar"></span>
 30 |             </button>
 31 |             <a class="navbar-brand" href="/">CloudCV</a>
 32 |         </div>
 33 |         <div class="navbar-collapse collapse">
 34 |             <ul class="nav navbar-nav">
 35 |                 <li id="image-stitching"><a  href="http://cloudcv.org/image-stitch">Image Stitching</a></li>
 36 |                  <li id = "object-detection" ><a href="http://objdetect.cloudcv.org">Object Detection</a></li>
 37 |                 <li id = "decaf-server"><a  href="http://cloudcv.org/decaf-server">Decaf-Server</a></li>
 38 |                 <li id = "classification" ><a href="http://cloudcv.org/classify">Classification</a></li>
 39 |                 <li id = "poi" ><a href="http://cloudcv.org/vip">VIP</a></li>
 40 |                 <li id="trainaclass"><a href="http://cloudcv.org/trainaclass">Train a new category</a></li>
 41 |                 <li id="vqa"><a href="http://cloudcv.org/vqa">VQA</a></li>
 42 |                 <li id="vqa"><a href="{% url 'home' %}">Grad-CAM</a></li>
 43 |             </ul>
 44 |         </div>
 45 |     </div>
 46 | </div>
 47 | 
 48 | 
 49 | <style>
 50 | p, h1, h2{
 51 |   font-weight: 300 !important;
 52 |   font-family: 'Roboto', sans-serif;
 53 | }
 54 | 
 55 | body{
 56 |   font-family: 'Roboto', sans-serif;
 57 | }
 58 | 
 59 | p{
 60 |   font-size: 16px;
 61 | }
 62 | .team{
 63 |   width: 75%;
 64 |   margin-bottom: 15px;
 65 |  }
 66 |  .member-name{
 67 |   cursor: auto;
 68 |  }
 69 | 
 70 |  .img-responsive{
 71 |   max-height: 100%;
 72 |   display: block;
 73 |   height: 150px; 
 74 |  }
 75 | </style>
 76 | 
 77 | {% block header_content %}
 78 | 
 79 |   <div class="container">
 80 |     <h1 align="center">Grad-CAM: Gradient-weighted Class Activation Mapping</h1>
 81 |   </div>
 82 | 
 83 | {% endblock %}
 84 | 
 85 | {% block slider %}
 86 | 
 87 | {% endblock %}
 88 | 
 89 | {% block abstract%}
 90 | <div class="container">
 91 |     <h2>Abstract</h2>
 92 |     <p>In recent research conducted by our lab (Machine Learning &amp; Perception group), we have developed novel techniques for making CNNs more 'transparent' by producing <b>visual explanations</b>, i.e., visualizations showing what evidence in the image supports a prediction. Research conducted in our lab has shown that models that explain their behavior are considered more trustworthy than typical "black-box" models.</p>
 93 | 
 94 |     <img src="{% static 'images/network.png' %}" width="80%" align="center">
 95 | </div>
 96 | {% endblock %}
 97 | 
 98 | {% block demo_links %}
 99 | 
100 | <div class="container">
101 |   <h2>Demonstration Links</h2>
102 |     <div class="row">
103 |       <div class="col-md-4">
104 |       <div class="card card-block">
105 |         <h3 class="card-title">Visual Question Answering</h3>
106 |         <p class="card-text">Some random text description about the demo goes here.</p>
107 |         <a target="_blank" href="{% url 'vqa' %}" class="btn btn-primary">Try Visual Question Answering Demo</a>
108 |       </div>
109 |     </div>
110 | 
111 |     <div class="col-md-4">
112 |       <div class="card card-block">
113 |         <h3 class="card-title">Classification</h3>
114 |         <p class="card-text">Some random text description about the demo goes here.</p>
115 |         <a target="_blank" href="{% url 'classification' %}" class="btn btn-primary">Try Classification Demo</a>
116 |       </div>
117 |     </div>
118 | 
119 |     <div class="col-md-4">
120 |       <div class="card card-block">
121 |         <h3 class="card-title">Captioning</h3>
122 |         <p class="card-text">Some random text description about the demo goes here.</p>
123 |         <a target="_blank" href="{% url 'captioning' %}" class="btn btn-primary">Try Captioning Demo</a>
124 |       </div>
125 |     </div>
126 | 
127 |   </div>
128 | </div>
129 | 
130 | {% endblock %}
131 | 
132 | {% block team %}
133 |   <div class="container">
134 |     <h2>Grad-CAM Team</h2>
135 |     <div class="row team">
136 |       <div class="col-sm-3" align="center">
137 |         <img src="{% static 'images/team/ram.jpeg'%}" class="img-responsive img-circle" alt="Cinque Terre">
138 |         <div class="member-name" align="center"><a  target="_blank" href="https://ramprs.github.io/">Ramprasaath R. Selvaraju</a></div>
139 |       </div>
140 |       <div class="col-sm-3" align="center">
141 |         <img src="{% static 'images/team/abhishek.jpg'%}" class="img-responsive img-circle" alt="Cinque Terre">
142 |         <div class="member-name" align="center"><a  target="_blank" href="http://abhishekdas.com/">Abhishek Das</a></div>
143 |       </div>
144 |       <div class="col-sm-3" align="center">
145 |         <img src="{% static 'images/team/rama.jpeg'%}" class="img-responsive img-circle" alt="Ramakrishna Vedantam">
146 |         <div class="member-name" align="center"><a  target="_blank" href="https://scholar.google.com/citations?user=v1CRzeAAAAAJ&hl=en">Ramakrishna Vedantam</a></div>
147 |       </div>
148 |       <div class="col-sm-3" align="center">
149 |         <img src="{% static 'images/team/michael.jpg'%}" class="img-responsive img-circle" alt="Cinque Terre">
150 |         <div class="member-name" align="center"><a  target="_blank" href="">Michael Cogswell</a></div>
151 |       </div>
152 |     </div>
153 | 
154 |     <div class="row team">
155 |       <div class="col-sm-3" align="center">
156 |         <img src="{% static 'images/team/stefan.jpg'%}" class="img-responsive img-circle" alt="Cinque Terre">
157 |         <div class="member-name" align="center"><a  target="_blank" href="https://computing.ece.vt.edu/~steflee/">Stefan Lee</a></div>
158 |       </div>
159 |       <div class="col-sm-3" align="center"> 
160 |         <img src="{% static 'images/team/deshraj.png'%}" class="img-responsive img-circle center" alt="Cinque Terre">
161 |         <div class="member-name" align="center"><a  target="_blank" href="https://www.linkedin.com/in/deshraj-yadav-34325975">Deshraj Yadav</a></div>
162 |       </div>
163 |       <div class="col-sm-3" align="center">
164 |         <img src="{% static 'images/team/devi.jpg'%}" class="img-responsive img-circle" alt="Devi Parikh">
165 |         <div class="member-name" align="center"><a  target="_blank" href="https://filebox.ece.vt.edu/~parikh/">Devi Parikh</a></div>
166 |       </div>
167 |       <div class="col-sm-3" align="center">
168 |         <img src="{% static 'images/team/dhruv_batra.jpg'%}" class="img-responsive img-circle" alt="Cinque Terre">
169 |         <div class="member-name" align="center"><a  target="_blank" href="https://filebox.ece.vt.edu/~dbatra/">Dhruv Batra</a></div>
170 |       </div>
171 |     </div>
172 | 
173 |   </div>
174 | {% endblock%}
175 | 
176 | {% block footer %}
177 | <!-- <div class="container">
178 |   <div id="footer">
179 |     <div id="footermsg" align="center"><p>Do you have questions ?</p></div>
180 |     <a href="">
181 |       <button type="button" class="btn btn-primary btn-lg">Sign up for email alerts</button>
182 |     </a>
183 | 
184 |     <div id="classicons">
185 |       <a href="https://twitter.com/cs231n">
186 |         <img src="twitter.svg">
187 |       </a>
188 |     </div>
189 | 
190 |   </div>
191 | </div> -->
192 | 
193 | {% endblock %}
194 | <script>
195 |   (function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
196 |   (i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
197 |   m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
198 |   })(window,document,'script','https://www.google-analytics.com/analytics.js','ga');
199 | 
200 |   ga('create', 'UA-53104159-4', 'auto');
201 |   ga('send', 'pageview');
202 | 
203 | </script>
204 | </body>
205 | </html>
206 | 


--------------------------------------------------------------------------------
/grad_cam/templates/home_new.html:
--------------------------------------------------------------------------------
  1 | {% load static %}
  2 | <html lang="en">
  3 | <head>
  4 |     <meta charset="utf-8">
  5 |     <title>Grad-CAM: Gradient-weighted Class Activation Mapping</title>
  6 |     <meta name="description" content="Grad-CAM: Gradient-weighted Class Activation Mapping">
  7 |     <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 |     <link href='http://fonts.googleapis.com/css?family=Roboto:400,100,100italic,300,300italic,400italic,500,500italic,700,700italic,900italic,900' rel='stylesheet' type='text/css'>
  9 |     <link rel="stylesheet" href="//netdna.bootstrapcdn.com/bootstrap/3.0.0/css/bootstrap.min.css">
 10 |     <link rel="stylesheet" href="http://cloudcv.org/static/css/style.css">
 11 |     <link rel="stylesheet" href="https://maxcdn.bootstrapcdn.com/font-awesome/4.5.0/css/font-awesome.min.css">
 12 |     <link rel="stylesheet" href="//code.jquery.com/ui/1.12.0/themes/base/jquery-ui.css">
 13 | 
 14 |     <script src="/static/js/dropzone.js"></script>
 15 |     <script src="//ajax.googleapis.com/ajax/libs/jquery/1.10.2/jquery.min.js"></script>
 16 |     <script src="http://cloudcv.org/static/js/vendor/jquery.ui.widget.js"></script>
 17 |     <script src="http://cloudcv.org/node/socket.io/socket.io.js"></script>
 18 |     <script src="https://code.jquery.com/ui/1.12.0/jquery-ui.js"></script>
 19 |     <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/dropzone/4.3.0/min/dropzone.min.css">
 20 | </head>
 21 | <body>
 22 | 
 23 | <div class="navbar navbar-inverse navbar-fixed-top">
 24 |     <div class="container">
 25 |         <div class="navbar-header">
 26 |             <button type="button" class="navbar-toggle" data-toggle="collapse" data-target=".navbar-fixed-top .navbar-collapse">
 27 |                 <span class="icon-bar"></span>
 28 |                 <span class="icon-bar"></span>
 29 |                 <span class="icon-bar"></span>
 30 |             </button>
 31 |             <a class="navbar-brand" href="/">CloudCV</a>
 32 |         </div>
 33 |         <div class="navbar-collapse collapse">
 34 |             <ul class="nav navbar-nav">
 35 |                 <li id="image-stitching"><a  href="http://cloudcv.org/image-stitch">Image Stitching</a></li>
 36 |                  <li id = "object-detection" ><a href="http://objdetect.cloudcv.org">Object Detection</a></li>
 37 |                 <li id = "decaf-server"><a  href="http://cloudcv.org/decaf-server">Decaf-Server</a></li>
 38 |                 <li id = "classification" ><a href="http://cloudcv.org/classify">Classification</a></li>
 39 |                 <li id = "poi" ><a href="http://cloudcv.org/vip">VIP</a></li>
 40 |                 <li id="trainaclass"><a href="http://cloudcv.org/trainaclass">Train a new category</a></li>
 41 |                 <li id="vqa"><a href="http://cloudcv.org/vqa">VQA</a></li>
 42 |                 <li id="vqa"><a href="{% url 'home' %}">Grad-CAM</a></li>
 43 |             </ul>
 44 |         </div>
 45 |     </div>
 46 | </div>
 47 | 
 48 | 
 49 | <style>
 50 | p, h1, h2{
 51 |   font-weight: 300 !important;
 52 |   font-family: 'Roboto', sans-serif;
 53 | }
 54 | 
 55 | body{
 56 |   font-family: 'Roboto', sans-serif;
 57 | }
 58 | 
 59 | p{
 60 |   font-size: 16px;
 61 | }
 62 | .team{
 63 |   width: 75%;
 64 |   margin-bottom: 15px;
 65 |  }
 66 |  .member-name{
 67 |   cursor: auto;
 68 |  }
 69 | 
 70 |  .img-responsive{
 71 |   max-height: 100%;
 72 |   display: block;
 73 |   height: 150px; 
 74 |  }
 75 |  .team_div{
 76 |   margin-top: 15px;
 77 |  }
 78 | 
 79 |  #network{
 80 |   margin-top: 15px;
 81 |  }
 82 | 
 83 |  .headings{
 84 |   margin-bottom: 15px;
 85 |  }
 86 | #team_heading{
 87 |   margin-bottom: 25px;
 88 | }
 89 | </style>
 90 | 
 91 | {% block header_content %}
 92 | 
 93 |   <div class="container">
 94 |     <h1 align="center">Grad-CAM: Gradient-weighted Class Activation Mapping</h1>
 95 |   </div>
 96 | 
 97 | {% endblock %}
 98 | 
 99 | {% block slider %}
100 | 
101 | {% endblock %}
102 | 
103 | {% block abstract%}
104 | <div class="container">
105 |     <h2 align="center" class="headings">Abstract</h2>
106 |     <p>In recent research conducted by our lab (Machine Learning &amp; Perception group), we have developed novel techniques for making CNNs more 'transparent' by producing <b>visual explanations</b>, i.e., visualizations showing what evidence in the image supports a prediction. Research conducted in our lab has shown that models that explain their behavior are considered more trustworthy than typical "black-box" models.</p>
107 | 
108 |     <img id="network" src="{% static 'images/network.png' %}" width="100%" align="center">
109 | </div>
110 | {% endblock %}
111 | 
112 | {% block demo_links %}
113 | 
114 | <div class="container">
115 |   <h2 align="center" class="headings">Demonstration Links</h2>
116 |     <div class="row">
117 |       <div class="col-md-4">
118 |       <div class="card text-center">
119 |         <h3 class="card-title" align="center">Visual Question Answering</h3>
120 |         <p class="card-text" align="center">Some random text description about the demo goes here.</p>
121 |         <a target="_blank" href="{% url 'vqa' %}" class="btn btn-primary" >Try Visual Question Answering Demo</a>
122 |       </div>
123 |     </div>
124 | 
125 |     <div class="col-md-4">
126 |       <div class="card text-center">
127 |         <h3 class="card-title" align="center">Classification</h3>
128 |         <p class="card-text" align="center">Some random text description about the demo goes here.</p>
129 |         <a target="_blank" href="{% url 'classification' %}" class="btn btn-primary" >Try Classification Demo</a>
130 |       </div>
131 |     </div>
132 | 
133 |     <div class="col-md-4">
134 |       <div class="card text-center">
135 |         <h3 class="card-title" align="center">Captioning</h3>
136 |         <p class="card-text" align="center">Some random text description about the demo goes here.</p>
137 |         <a target="_blank" href="{% url 'captioning' %}" class="btn btn-primary text-center">Try Captioning Demo</a>
138 |       </div>
139 |     </div>
140 | 
141 |   </div>
142 | </div>
143 | 
144 | {% endblock %}
145 | 
146 | {% block team %}
147 |   <div class="container team_div" align="center">
148 |     <h2 align="center" class="headings" id="team_heading">Grad-CAM Team</h2>
149 |     <div class="row team text-center">
150 |       <div class="col-sm-3" align="center">
151 |         <img src="{% static 'images/team/ram.jpeg'%}" class="img-responsive img-circle" alt="Cinque Terre">
152 |         <div class="member-name" align="center"><a  target="_blank" href="https://ramprs.github.io/">Ramprasaath R. Selvaraju</a></div>
153 |       </div>
154 |       <div class="col-sm-3" align="center">
155 |         <img src="{% static 'images/team/abhishek.jpg'%}" class="img-responsive img-circle" alt="Cinque Terre">
156 |         <div class="member-name" align="center"><a  target="_blank" href="http://abhishekdas.com/">Abhishek Das</a></div>
157 |       </div>
158 |       <div class="col-sm-3" align="center">
159 |         <img src="{% static 'images/team/rama.jpeg'%}" class="img-responsive img-circle" alt="Cinque Terre">
160 |         <div class="member-name" align="center"><a  target="_blank" href="https://scholar.google.com/citations?user=v1CRzeAAAAAJ&hl=en">Ramakrishna Vedantam</a></div>
161 |       </div>
162 |       <div class="col-sm-3" align="center">
163 |         <img src="{% static 'images/team/michael.jpg'%}" class="img-responsive img-circle" alt="Cinque Terre">
164 |         <div class="member-name" align="center"><a  target="_blank" href="">Michael Cogswell</a></div>
165 |       </div>
166 |     </div>
167 | 
168 |     <div class="row team">
169 |       <div class="col-sm-3" align="center">
170 |         <img src="{% static 'images/team/stefan.jpg'%}" class="img-responsive img-circle" alt="Cinque Terre">
171 |         <div class="member-name" align="center"><a  target="_blank" href="https://computing.ece.vt.edu/~steflee/">Stefan Lee</a></div>
172 |       </div>
173 |       <div class="col-sm-3" align="center"> 
174 |         <img src="{% static 'images/team/deshraj.png'%}" class="img-responsive img-circle center" alt="Cinque Terre">
175 |         <div class="member-name" align="center"><a  target="_blank" href="https://www.linkedin.com/in/deshraj-yadav-34325975">Deshraj Yadav</a></div>
176 |       </div>
177 |       <div class="col-sm-3" align="center">
178 |         <img src="{% static 'images/team/devi.jpg'%}" class="img-responsive img-circle" alt="Devi Parikh">
179 |         <div class="member-name" align="center"><a  target="_blank" href="https://filebox.ece.vt.edu/~parikh/">Devi Parikh</a></div>
180 |       </div>
181 |       <div class="col-sm-3" align="center">
182 |         <img src="{% static 'images/team/dhruv_batra.jpg'%}" class="img-responsive img-circle" alt="Cinque Terre">
183 |         <div class="member-name" align="center"><a  target="_blank" href="https://filebox.ece.vt.edu/~dbatra/">Dhruv Batra</a></div>
184 |       </div>
185 |     </div>
186 | 
187 |   </div>
188 | {% endblock%}
189 | 
190 | {% block footer %}
191 | <!-- <div class="container">
192 |   <div id="footer">
193 |     <div id="footermsg" align="center"><p>Do you have questions ?</p></div>
194 |     <a href="">
195 |       <button type="button" class="btn btn-primary btn-lg">Sign up for email alerts</button>
196 |     </a>
197 | 
198 |     <div id="classicons">
199 |       <a href="https://twitter.com/cs231n">
200 |         <img src="twitter.svg">
201 |       </a>
202 |     </div>
203 | 
204 |   </div>
205 | </div> -->
206 | 
207 | {% endblock %}
208 | <script>
209 |   (function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
210 |   (i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
211 |   m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
212 |   })(window,document,'script','https://www.google-analytics.com/analytics.js','ga');
213 | 
214 |   ga('create', 'UA-53104159-4', 'auto');
215 |   ga('send', 'pageview');
216 | 
217 | </script>
218 | </body>
219 | </html>
220 | 


--------------------------------------------------------------------------------
/grad_cam/templates/index.html:
--------------------------------------------------------------------------------
  1 | {% load static %}
  2 | <html lang="en">
  3 | <head>
  4 |     <meta charset="utf-8">
  5 |     <title>Grad-CAM: Gradient-weighted Class Activation Mapping</title>
  6 |     <meta name="description" content="Grad-CAM: Gradient-weighted Class Activation Mapping">
  7 |     <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 |     <link href='http://fonts.googleapis.com/css?family=Roboto:400,100,100italic,300,300italic,400italic,500,500italic,700,700italic,900italic,900' rel='stylesheet' type='text/css'>
  9 |     <link rel="stylesheet" href="//netdna.bootstrapcdn.com/bootstrap/3.0.0/css/bootstrap.min.css">
 10 |     <link rel="stylesheet" href="http://cloudcv.org/static/css/style.css">
 11 |     <link rel="stylesheet" href="https://maxcdn.bootstrapcdn.com/font-awesome/4.5.0/css/font-awesome.min.css">
 12 |     <link rel="stylesheet" href="//code.jquery.com/ui/1.12.0/themes/base/jquery-ui.css">
 13 | 
 14 |     <script src="/static/js/dropzone.js"></script>
 15 |     <script src="//ajax.googleapis.com/ajax/libs/jquery/1.10.2/jquery.min.js"></script>
 16 |     <script src="http://cloudcv.org/static/js/vendor/jquery.ui.widget.js"></script>
 17 |     <script src="http://cloudcv.org/node/socket.io/socket.io.js"></script>
 18 |     <script src="https://code.jquery.com/ui/1.12.0/jquery-ui.js"></script>
 19 |     <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/dropzone/4.3.0/min/dropzone.min.css">
 20 |     <script src="//netdna.bootstrapcdn.com/bootstrap/3.1.1/js/bootstrap.min.js"></script>
 21 | </head>
 22 | <body>
 23 | 
 24 |   <div class="navbar navbar-inverse navbar-fixed-top">
 25 |     <div class="container">
 26 |         <div class="navbar-header">
 27 |             <button type="button" class="navbar-toggle" data-toggle="collapse" data-target=".navbar-fixed-top .navbar-collapse">
 28 |                 <span class="icon-bar"></span>
 29 |                 <span class="icon-bar"></span>
 30 |                 <span class="icon-bar"></span>
 31 |             </button>
 32 |             <a class="navbar-brand" href="http://cloudcv.org">CloudCV</a>
 33 |         </div>
 34 |         <div class="navbar-collapse collapse">
 35 |             <ul class="nav navbar-nav">
 36 |               <li><a target="_blank" href="https://evalai.cloudcv.org">EvalAI</a></li>
 37 |               <li><a target="_blank" href="http://origami.cloudcv.org">Origami</a></li>
 38 |               <li><a target="_blank" href="http://fabrik.cloudcv.org">Fabrik</a></li>
 39 |               <li><a href="http://gsoc.cloudcv.org" target="_blank">GSoC</a></li>
 40 |               <li class="dropdown">
 41 |                 <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-haspopup="true" aria-expanded="false">Demos <span class="caret"></span></a>
 42 |                 <ul class="dropdown-menu">
 43 |                   <li><a href="http://visualchatbot.cloudcv.org" target="_blank">Visual Chatbot</a></li>
 44 |                   <li><a href="http://vqa.cloudcv.org" target="_blank">VQA</a></li>
 45 |                   <li><a href="http://gradcam.cloudcv.org" target="_blank">Grad-CAM</a></li>
 46 |                   <li><a href="http://dbs.cloudcv.org" target="_blank">DBS</a></li>
 47 |                 </ul>
 48 |               </li>
 49 |             </ul>
 50 |         </div>
 51 |     </div>
 52 | </div>
 53 | 
 54 | 
 55 | <style>
 56 | p, h1, h2, h3, a{
 57 |   font-weight: 300 !important;
 58 |   font-family: 'Roboto', sans-serif;
 59 | }
 60 | 
 61 | body{
 62 |   font-family: 'Roboto', sans-serif;
 63 | }
 64 | 
 65 | p{
 66 |   font-size: 16px;
 67 | }
 68 | .team{
 69 |   width: 75%;
 70 |   margin-bottom: 15px;
 71 |  }
 72 |  .member-name{
 73 |   cursor: auto;
 74 |   margin-top: 5px;
 75 |  }
 76 | 
 77 |  .img-responsive{
 78 |   max-height: 100%;
 79 |   display: block;
 80 |   height: 150px; 
 81 |  }
 82 |  .team_div{
 83 |   margin-top: 15px;
 84 |  }
 85 | 
 86 |  #network{
 87 |   margin-top: 15px;
 88 |  }
 89 | 
 90 |  .headings{
 91 |   margin-bottom: 15px;
 92 |  }
 93 | #team_heading{
 94 |   margin-bottom: 25px;
 95 | }
 96 | li a{
 97 |   font-size: 16px;
 98 | }
 99 | .navbar-brand{
100 |   font-size: 18px !important;
101 | }
102 | </style>
103 | 
104 | {% block header_content %}
105 | 
106 |   <div class="container">
107 |     <h1 align="center">Grad-CAM: Gradient-weighted Class Activation Mapping</h1>
108 |   </div>
109 | 
110 | {% endblock %}
111 | 
112 | {% block slider %}
113 | 
114 | {% endblock %}
115 | 
116 | {% block abstract%}
117 | <div class="container">
118 |     <h2 align="center" class="headings">Abstract</h2>
119 |     <p>We propose a technique for making Convolutional Neural Network (CNN)-based models more transparent by visualizing the regions of input that are "important" for predictions from these models - or visual explanations. Our approach, called Gradient-weighted Class Activation Mapping (Grad-CAM), uses the class-specific gradient information flowing into the final convolutional layer of a CNN to produce a coarse localization map of the important regions in the image. Grad-CAM is a strict generalization of the Class Activation Mapping. Unlike CAM, Grad-CAM requires no re-training and is broadly applicable to any CNN-based architectures. We also show how Grad-CAM may be combined with existing pixel-space visualizations to create a high-resolution class-discriminative visualization (Guided Grad-CAM). We generate Grad-CAM and Guided Grad-CAM visual explanations to better understand image classification, image captioning, and visual question answering (VQA) models. In the context of image classification models, our visualizations (a) lend insight into their failure modes showing that seemingly unreasonable predictions have reasonable explanations, and (b) outperform pixel-space gradient visualizations (Guided Backpropagation and Deconvolution) on the ILSVRC-15 weakly supervised localization task. For image captioning and VQA, our visualizations expose the somewhat surprising insight that common CNN + LSTM models can often be good at localizing discriminative input image regions despite not being trained on grounded image-text pairs.   Finally, we design and conduct human studies to measure if Guided Grad-CAM explanations help users establish trust in the predictions made by deep networks. Interestingly, we show that Guided Grad-CAM helps untrained users successfully discern a "stronger" deep network from a "weaker" one even when both networks make identical predictions.</p>
120 |     <p><b>Arxiv Paper link: </b><a href="https://arxiv.org/abs/1610.02391">https://arxiv.org/abs/1610.02391</a></p>
121 |     <img id="network" src="{% static 'images/network.png' %}" width="100%" align="center">
122 | </div>
123 | {% endblock %}
124 | 
125 | {% block demo_links %}
126 | 
127 | <div class="container">
128 |   <h2 align="center" class="headings">Demonstration Links</h2>
129 |     <div class="row">
130 |       <div class="col-md-4">
131 |       <div class="card text-center">
132 |         <h3 class="card-title" align="center">Visual Question Answering</h3>
133 |         <a target="_blank" href="{% url 'vqa' %}" class="btn btn-lg btn-primary" >Try Visual Question Answering Demo</a>
134 |       </div>
135 |     </div>
136 | 
137 |     <div class="col-md-4">
138 |       <div class="card text-center">
139 |         <h3 class="card-title" align="center">Classification</h3>
140 |         <a target="_blank" href="{% url 'classification' %}" class="btn btn-lg btn-primary" >Try Classification Demo</a>
141 |       </div>
142 |     </div>
143 | 
144 |     <div class="col-md-4">
145 |       <div class="card text-center">
146 |         <h3 class="card-title" align="center">Captioning</h3>
147 |         <a target="_blank" href="{% url 'captioning' %}" class="btn btn-lg btn-primary text-center">Try Captioning Demo</a>
148 |       </div>
149 |     </div>
150 | 
151 |   </div>
152 | </div>
153 | 
154 | {% endblock %}
155 | 
156 | {% block team %}{# Team roster; each photo's alt text is the member's name. NOTE(review): images/team/ram.jpeg is not in the repository's static/images/team listing - confirm the asset exists. #}
157 |   <div class="container team_div" align="center">
158 |     <h2 align="center" class="headings" id="team_heading">Grad-CAM Team</h2>
159 |     <div class="row team text-center">
160 |       <div class="col-sm-3" align="center">
161 |         <img src="{% static 'images/team/ram.jpeg'%}" class="img-responsive img-circle" alt="Ramprasaath R. Selvaraju">
162 |         <div class="member-name" align="center"><a  target="_blank" href="https://ramprs.github.io/">Ramprasaath R. Selvaraju</a></div>
163 |       </div>
164 |       <div class="col-sm-3" align="center">
165 |         <img src="{% static 'images/team/abhishek.jpg'%}" class="img-responsive img-circle" alt="Abhishek Das">
166 |         <div class="member-name" align="center"><a  target="_blank" href="http://abhishekdas.com/">Abhishek Das</a></div>
167 |       </div>
168 |       <div class="col-sm-3" align="center">
169 |         <img src="{% static 'images/team/rama.jpeg'%}" class="img-responsive img-circle" alt="Ramakrishna Vedantam">
170 |         <div class="member-name" align="center"><a  target="_blank" href="http://vrama91.github.io/">Ramakrishna Vedantam</a></div>
171 |       </div>
172 |       <div class="col-sm-3" align="center">
173 |         <img src="{% static 'images/team/michael.jpg'%}" class="img-responsive img-circle" alt="Michael Cogswell">
174 |         <div class="member-name" align="center"><a  target="_blank" href="http://mcogswell.io/">Michael Cogswell</a></div>
175 |       </div>
176 |     </div>
177 | 
178 |     <div class="row team">
179 |       <div class="col-sm-3" align="center"> 
180 |         <img src="{% static 'images/team/deshraj.png'%}" class="img-responsive img-circle center" alt="Deshraj Yadav">
181 |         <div class="member-name" align="center"><a  target="_blank" href="https://www.linkedin.com/in/deshraj-yadav-34325975">Deshraj Yadav</a></div>
182 |       </div>
183 |       <div class="col-sm-3" align="center">
184 |         <img src="{% static 'images/team/stefan.jpg'%}" class="img-responsive img-circle" alt="Stefan Lee">
185 |         <div class="member-name" align="center"><a  target="_blank" href="https://computing.ece.vt.edu/~steflee/">Stefan Lee</a></div>
186 |       </div>
187 |       <div class="col-sm-3" align="center">
188 |         <img src="{% static 'images/team/devi.jpg'%}" class="img-responsive img-circle" alt="Devi Parikh">
189 |         <div class="member-name" align="center"><a  target="_blank" href="https://filebox.ece.vt.edu/~parikh/">Devi Parikh</a></div>
190 |       </div>
191 |       <div class="col-sm-3" align="center">
192 |         <img src="{% static 'images/team/dhruv_batra.jpg'%}" class="img-responsive img-circle" alt="Dhruv Batra">
193 |         <div class="member-name" align="center"><a  target="_blank" href="https://filebox.ece.vt.edu/~dbatra/">Dhruv Batra</a></div>
194 |       </div>
195 |     </div>
196 | 
197 |   </div>
198 | {% endblock%}
199 | 
200 | {% block footer %}
201 | 
202 | {% endblock %}
203 | <script>
204 |   (function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
205 |   (i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
206 |   m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
207 |   })(window,document,'script','https://www.google-analytics.com/analytics.js','ga');
208 |   // The loader above defines a queueing `ga` stub and injects analytics.js asynchronously; the calls below create a tracker for property UA-53104159-4 and record one pageview.
209 |   ga('create', 'UA-53104159-4', 'auto');
210 |   ga('send', 'pageview');
211 | 
212 | </script>
213 | </body>
214 | </html>
215 | 


--------------------------------------------------------------------------------
/grad_cam/templates/captioning/captioning.html:
--------------------------------------------------------------------------------
  1 | {% extends 'base.html' %}
  2 | 
  3 | {% block header_content %}
  4 | 
  5 | <a href="https://github.com/Cloud-CV/Grad-CAM" target="_blank"><img style="position: fixed; top: 0; right: 0; border: 0; z-index:2000;" src="https://camo.githubusercontent.com/365986a132ccd6a44c23a9169022c0b5c890c387/68747470733a2f2f73332e616d617a6f6e6177732e636f6d2f6769746875622f726962626f6e732f666f726b6d655f72696768745f7265645f6161303030302e706e67" alt="Fork me on GitHub" data-canonical-src="https://s3.amazonaws.com/github/ribbons/forkme_right_red_aa0000.png"></a>
  6 | 
  7 | <div class="container">
  8 |     <div class="page-header">
  9 |         <h1 align="center">Grad-CAM: Gradient-weighted Class Activation Mapping</h1>
 10 |         <br><h4>Grad-CAM highlights regions of the image the captioning model looks at while making predictions.</h4>
 11 |         <font size="4">
 12 |             <p>
 13 |                 Torch code for Grad-CAM is available <a href="//github.com/ramprs/grad-cam">here</a>. Browsers currently supported by the demo: Google Chrome, Mozilla Firefox.
 14 |             </p>
 15 |         </font>
 16 |     </div>
 17 | </div>
 18 | 
 19 | {% endblock %}
 20 | 
 21 | {% block demo_images %}
 22 | 
 23 | <div class="container">
 24 |     <div class="page-header">
 25 |         <h2>Try Grad-CAM: Sample Images</h2>
 26 |         <br>
 27 |         <div class="row">
 28 |             <div class="col-md-8 col-xs-12">
 29 |                 <font size="4">Click on one of these images to send it to our servers (Or <a class="button_link" onclick="scrollToElement($('#userImages'))">upload</a>
 30 |                     your own images below)</font>
 31 |             </div>
 32 |             <div id="show-demo-images-btn" class="col-md-4">
 33 |             <button  class="btn btn-info">Show Demo Images</button>
 34 |             </div>
 35 |         </div>
 36 |          <div class="row hiddenDiv demoImages" id="demoImages1">
 37 |             <img src="/media/grad_cam/demo_captioning/COCO_val2014_000000125524.jpg"
 38 |                  onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
 39 |             <img src="/media/grad_cam/demo_captioning/COCO_val2014_000000396387.jpg"
 40 |                  onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
 41 |             <img src="/media/grad_cam/demo_captioning/COCO_val2014_000000008401.jpg"
 42 |                  onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
 43 |          </div>
 44 |          <div class="row hiddenDiv demoImages" id="demoImages2">
 45 |             <img src="/media/grad_cam/demo_captioning/COCO_val2014_000000381246.jpg"
 46 |                  onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
 47 |             <img src="/media/grad_cam/demo_captioning/COCO_val2014_000000223766.jpg"
 48 |                  onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
 49 |             <img src="/media/grad_cam/demo_captioning/COCO_val2014_000000096638.jpg"
 50 |                  onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
 51 |             <br>
 52 |          </div>
 53 |         <div class="row randomImages" id="demoImages3">
 54 |             <img src="{{ demo_images.0 }}"
 55 |                   onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
 56 |             <img src="{{ demo_images.1 }}"
 57 |                   onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
 58 |             <img src="{{ demo_images.2 }}"
 59 |                   onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
 60 |         </div>
 61 |         <div class="row randomImages" id="demoImages4">
 62 |             <img src="{{ demo_images.3 }}"
 63 |                   onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
 64 |             <img src="{{ demo_images.4 }}"
 65 |                   onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
 66 |             <img src="{{ demo_images.5 }}"
 67 |                   onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
 68 |              <br>
 69 |         </div>
 70 |         Note: nothing is pre-computed for these images. They are treated as a fresh upload with every click.
 71 |     </div>
 72 | </div>
 73 | 
 74 | 
 75 | {% endblock %}
 76 | 
 77 | {% block form %}
 78 | <style type="text/css">
 79 | 
 80 |   .caption {
 81 |     /*display: block;*/
 82 |     /*text-align: center;*/
 83 |     font-size: 18px !important;
 84 |     font-weight: bold;
 85 | }
 86 | 
 87 | #inputCaption, #predictedCaption{
 88 |     font-weight: bold;
 89 | }
 90 | 
 91 | .under
 92 | {
 93 | position:absolute;
 94 | /*left:0px;
 95 | top:0px;*/
 96 | z-index:-1;
 97 | }
 98 | 
 99 | .over
100 | {
101 | position:absolute;
102 | /*left:40px;*/
103 | /*top:10px;*/
104 | z-index:0;
105 | mix-blend-mode: multiply;
106 | }
107 | 
108 | #gradCamCaption{
109 |   position: relative;
110 |   padding-top: 350px;
111 | }
112 | 
113 | .finalImages{
114 |   width: 350px !important;
115 |   height: 350px !important;
116 |   padding: 6px;
117 | }
118 | 
119 | .resultText{
120 |   margin-bottom: 15px !important;
121 | }
122 | 
123 | </style>
124 | 
125 | <div class="container">
126 |   <div class="page-header">
127 |     <h2 id="userImages">Try Grad-CAM On Your Images</h2>
128 |   </div>
129 |   {% block url_content %}
130 |     {% include 'upload_image_url.html' %}
131 |   {% endblock %}
132 |   <div class="col-sm-12">
133 |     <h3 align="center">OR</h3>
134 |   </div>
135 |   <div class="container">    
136 |     <form id="my-dropzone" method="post" class="dropzone
137 |     " action="{% url "upload" %}" enctype="multipart/form-data">
138 |     <input type="hidden" id="demoType" name="demo_type" value=""> 
139 |     <input type="hidden" id="appType" name="type" value="captioning">
140 | 
141 |     {% csrf_token %}
142 | 
143 |     {% include 'form.html' %}
144 |     </form>
145 |   </div>
146 | 
147 | {% endblock %}
148 | 
149 | {% block result %}
150 | <script type="text/javascript">
151 |   // Overridden Dropzone options for the upload form whose id is "my-dropzone".
152 |   Dropzone.options.myDropzone = {
153 |     autoProcessQueue: true,
154 |     uploadMultiple: false,
155 |     maxFiles: 10,
156 |     // init registers the upload-success handler on the Dropzone instance.
157 |     init: function() {
158 |       var myDropzone = this;
159 |       this.hiddenFileInput.removeAttribute('multiple'); // the file picker then accepts one file per selection
160 |       myDropzone.on('success', function(file, data){
161 |         console.log(data);
162 |         $("#inputImageAfterUpload").attr('src', data['file_path']); // preview the image from the path in the response
163 |         $("#ResultDiv").show();
164 |         $("#show-grad-cam-result").hide(); // hide visualizations left over from a previous run
165 |         $("#demoType").val("uploadedImageType");
166 |         $("#question").val("");
167 |         $("#Caption").val("");
168 |         $('#comments').prepend('<br>');
169 |         $('#comments').prepend('<li>' + "Image uploaded successfully..." + '</li>');
170 |         scrollToElement($("#termstart")); // two animated scrolls in a row: terminal first, then the result area
171 |         scrollToElement($("#ResultDiv"));
172 |       });
173 |     }
174 |   }
175 | </script>
176 | 
177 | <script type="text/javascript">
178 | 
179 | 
180 | $(document).ready(function(){
181 |   var ws_scheme = window.location.protocol == "https:" ? "wss" : "ws";
182 |   var socket = new ReconnectingWebSocket(ws_scheme + '://' + window.location.host + "/chat" + window.location.pathname);
183 | 
184 |   socket.onopen = function() {
185 |       console.log("User connected to the socket with socketid "+ "{{socketid }}");
186 |       socket.send("{{ socketid }}");
187 |   }
188 | 
189 |   socket.onmessage = function(response) {
190 |     console.log("Getting response from the worker.....");
191 |     console.log(JSON.parse(response.data));
192 | 
193 |     response = JSON.parse(response.data);
194 | 
195 |     if ("info" in response){
196 |       console.log("Info is there as the key");
197 |     }
198 | 
199 |     if ("terminal" in response){
200 | 
201 |       $('#comments').prepend('<li>' + response['terminal'] + '</li>');
202 |     }
203 | 
204 |     if("result" in response){
205 | 
206 |       result = JSON.parse(response['result']);
207 |       var d = new Date();
208 |       $("#inputCaption").text(result['input_caption']);
209 |       $("#predictedCaption").text(result['pred_caption']);
210 |       $("#overImg1").attr("src", result['input_image']);
211 |       $("#img1").attr("src",result['captioning_gcam_raw']+"?"+d.getTime());
212 |       $("#img2").attr("src",result['captioning_gb']+"?"+d.getTime());
213 |       $("#img3").attr("src",result['captioning_gb_gcam']+"?"+d.getTime());
214 |       $("#show-grad-cam-result").show();
215 |       scrollToElement($("#show-grad-cam-result"));
216 |       $('#comments').prepend('<br>');
217 |     }
218 |   }
219 | });
220 | 
221 |   var getLocation = function(href) { // parse a URL by letting the browser resolve it on an <a> element
222 |       var l = document.createElement("a"); // detached element; it is never added to the page
223 |       l.href = href;
224 |       return l; // callers read parsed parts from it, e.g. .pathname
225 |   };
226 | 
227 | function submitDemoImage(src){ // click handler of the sample images: stage `src` as the input image
228 |   var img_path = getLocation(src).pathname; // keep only the path part of the clicked image URL
229 |   $("#inputImageAfterUpload").attr('src', img_path);
230 |   $("#show-grad-cam-result").hide(); // hide visualizations left over from a previous run
231 |   $("#Caption").val("");
232 |   $("#ResultDiv").show(); // reveals the caption box and Submit button; this function itself posts nothing
233 |   scrollToElement($("#termstart"));
234 |   $('#comments').prepend('<br>');
235 |   $('#comments').prepend('<li>' + "Submitted demo image" + '</li>');
236 |   scrollToElement($("#ResultDiv"));
237 | }
238 | 
239 | function submitImageForCaptioning () { // POST the staged image path and the optional caption to the 'captioning' URL
240 |   var caption = $("#Caption").val();
241 |   var l = $("#inputImageAfterUpload")[0].src;
242 |   var img_path = getLocation(l).pathname; // only the path is sent, not the full URL
243 |   // The socket id travels with the request (presumably so results can be pushed back over the websocket); the HTTP response itself is only logged.
244 |   $.ajax({
245 |     type    : 'POST', // define the type of HTTP verb we want to use (POST for our form)
246 |     url     : '{% url 'captioning' %}', // the url where we want to POST
247 |     data    : { 'img_path': img_path, 'csrfmiddlewaretoken': "{{ csrf_token }}", 'caption': caption, 'socketid': "{{ socketid }}"} // our data object
248 |   })// using the done promise callback
249 |   .done(function(response) {
250 |     console.log("Ajax call completed successfully"); // the response body is not used
251 |   });
252 | }
253 | 
254 | function submitImageUsingUrl(){
255 |   var src = document.getElementById("image_url").value;
256 |   $('#comments').prepend('<br>');
257 |   $('#comments').prepend('<li>' + "Starting the Image Download process." + '</li>');
258 | 
259 |   scrollToElement($("#termstart"));
260 |   scrollToElement($("#resultHeading"));
261 | 
262 |   $.ajax({
263 |     type : "POST",
264 |     url  : '{% url 'upload-url' %}',
265 |     data : {'src': src  , 'socketid': "{{socketid}}", 'csrfmiddlewaretoken': '{{ csrf_token }}', type:"captioning"}
266 |   }).done(function(data){
267 |     console.log(data);
268 |     $("#inputImageAfterUpload").attr('src', data["file_path"]);
269 |     $("#label").val("");
270 |     $("#show-grad-cam-result").hide();
271 |     $("#ResultDiv").show();
272 |   });
273 | };
274 | 
275 | $("#image_url").keydown(function(e){ // pressing Enter (key code 13) in the URL box clicks the submit button
276 |   if (e.which === 13){
277 |     $("#image_url_submit_btn").click();
278 |   }
279 | });
280 | // Pasting into the URL box also submits; the zero-delay timeout defers the click until after the paste event (presumably so the field already holds the pasted text).
281 | $('#image_url').on('paste', function(){
282 |   setTimeout(function(){
283 |     $("#image_url_submit_btn").click();
284 |   }, 0);
285 | });
286 | 
287 | </script>
288 | <br>
289 |   <div class="page-header">
290 |     <h2 id="resultHeading" class="center">Result of Grad-CAM for Captioning</h2>
291 |   </div>
292 | <div id="ResultDiv" class="row" style="padding-bottom:50px; display:None;">
293 |   <div class="col-md-5" style="padding-bottom: 30px; clear: both;">
294 |     <img class="img-responsive" src="" style="height: 300px;" id="inputImageAfterUpload">
295 |   </div>
296 |   <div class="col-md-7" style="padding-bottom: 30px;">
297 |     <input id="Caption" class="form-control" name="caption" placeholder="Enter the caption...(Optional)"><br>
298 |     <input type="button" value="Submit" onclick="submitImageForCaptioning()" class="btn btn-primary">
299 | </div>
300 | </div>
301 | 
302 | <div class="row demoImages" style="display:None;" id="show-grad-cam-result" >
303 | 
304 |   <div class="col-md-12 resultText">
305 |     <h3 style="display: inline;" align="center">Predicted Caption : &nbsp;</h3>
306 |     <h3 id="predictedCaption" style="display: inline;" class="center"></h3>
307 |   </div>
308 | 
309 |   <div class="col-md-12 resultText">
310 |     <h3 style="display: inline;" class="center">Generating Grad-CAM visualizations for: &nbsp;</h3>
311 |     <h3 id="inputCaption" style="display: inline;" align="center"></h3>
312 |   </div>
313 | 
314 |   <div class="col-md-4">
315 |     <img src="" class="col-md-12 finalImages" id="img2">
316 |       <p class="caption" style="font-size: 14 px;" align="left">Guided Backprop</p>
317 |   </div>
318 | 
319 |   <div class="col-md-4">
320 |     <img src="" class="over col-md-12 finalImages" id="overImg1" />
321 |     <img src="" class="under col-md-12 finalImages" id="img1">
322 |     <p class="caption" style="font-size: 14 px;" align="left" id="gradCamCaption">Grad-CAM</p>
323 |   </div>
324 | 
325 |   <div class="col-md-4">
326 |     <img src="" class="col-md-12 finalImages" id="img3">
327 |       <p class="caption" style="font-size: 14 px; padding-left: 5px;" align="left">Guided Grad-CAM</p>
328 |   </div>
329 | 
330 | </div>
331 | {% endblock %}
332 | 
333 | {% block credits %}
334 | <h2 class="page-header"> Credits </h2>
335 |   <font size="4">
336 |     <a href="https://github.com/karpathy/neuraltalk2">Code for Neuraltalk2</a><br>
337 |     Built by <a href="http://github.com/DESHRAJ" target="_blank">@deshraj</a>
338 |     <br><br>
339 |   </font>
340 |   <br>
341 | </div>
342 | {# base.html emits more markup, its scripts and the closing body/html tags after this block, so they are not closed here. #}
343 | <script type="text/javascript" src="https://cdnjs.cloudflare.com/ajax/libs/reconnecting-websocket/1.0.0/reconnecting-websocket.min.js"></script>
344 | 
345 | {% endblock %}
346 | 


--------------------------------------------------------------------------------
/grad_cam/templates/base.html:
--------------------------------------------------------------------------------
  1 | <html lang="en">
  2 | <head>
  3 |     <meta charset="utf-8">
  4 |     <title>Grad-CAM: Gradient-weighted Class Activation Mapping</title>
  5 |     <meta name="description" content="CloudCV: Large Scale Distributed Computer Vision as a Cloud Service">
  6 |     <meta name="viewport" content="width=device-width, initial-scale=1.0">
  7 |     <link href='http://fonts.googleapis.com/css?family=Roboto:400,100,100italic,300,300italic,400italic,500,500italic,700,700italic,900italic,900' rel='stylesheet' type='text/css'>
  8 |     <link rel="stylesheet" href="//netdna.bootstrapcdn.com/bootstrap/3.0.0/css/bootstrap.min.css">
  9 |     <link rel="stylesheet" href="http://cloudcv.org/static/css/style.css">
 10 |     <link rel="stylesheet" href="https://maxcdn.bootstrapcdn.com/font-awesome/4.5.0/css/font-awesome.min.css">
 11 |     <link rel="stylesheet" href="//code.jquery.com/ui/1.12.0/themes/base/jquery-ui.css">
 12 | 
 13 |     <script src="/static/js/dropzone.js"></script>
 14 |     <script src="//ajax.googleapis.com/ajax/libs/jquery/1.10.2/jquery.min.js"></script>
 15 |     <script src="http://cloudcv.org/static/js/vendor/jquery.ui.widget.js"></script>
 16 |     <script src="http://cloudcv.org/node/socket.io/socket.io.js"></script>
 17 |     <script src="https://code.jquery.com/ui/1.12.0/jquery-ui.js"></script>
 18 |     <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/dropzone/4.3.0/min/dropzone.min.css">
 19 | </head>
 20 | <body>
 21 | 
 22 | <div class="navbar navbar-inverse navbar-fixed-top">
 23 |     <div class="container">
 24 |         <div class="navbar-header">
 25 |             <button type="button" class="navbar-toggle" data-toggle="collapse" data-target=".navbar-fixed-top .navbar-collapse">
 26 |                 <span class="icon-bar"></span>
 27 |                 <span class="icon-bar"></span>
 28 |                 <span class="icon-bar"></span>
 29 |             </button>
 30 |             <a class="navbar-brand" href="http://cloudcv.org">CloudCV</a>
 31 |         </div>
 32 |         <div class="navbar-collapse collapse">
 33 |             <ul class="nav navbar-nav">
 34 |               <li><a target="_blank" href="https://evalai.cloudcv.org">EvalAI</a></li>
 35 |               <li><a target="_blank" href="http://origami.cloudcv.org">Origami</a></li>
 36 |               <li><a target="_blank" href="http://fabrik.cloudcv.org">Fabrik</a></li>
 37 |               <li><a href="http://gsoc.cloudcv.org" target="_blank">GSoC</a></li>
 38 |               <li class="dropdown">
 39 |                 <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-haspopup="true" aria-expanded="false">Demos<span class="caret"></span></a>
 40 |                 <ul class="dropdown-menu">
 41 |                   <li><a href="http://visualchatbot.cloudcv.org" target="_blank">Visual Chatbot</a></li>
 42 |                   <li><a href="http://vqa.cloudcv.org" target="_blank">VQA</a></li>
 43 |                   <li><a href="http://gradcam.cloudcv.org" target="_blank">Grad-CAM</a></li>
 44 |                   <li><a href="http://dbs.cloudcv.org" target="_blank">DBS</a></li>
 45 |                 </ul>
 46 |               </li>
 47 |             </ul>
 48 |         </div>
 49 |     </div>
 50 | </div>
 51 | 
 52 | 
 53 | <style>
 54 |   .hiddenDiv{
 55 |       display: none;
 56 |   }
 57 |   .button_link {
 58 |   cursor: pointer;
 59 |   }
 60 |   .demo_img{
 61 |   height: 300px !important;
 62 |       padding: 6px;
 63 | 
 64 |   }
 65 |   .demo_img:hover {
 66 |   border: 6px solid black;
 67 |       padding: 0px;
 68 |   cursor: pointer;
 69 |   }
 70 |   #show-demo-images-btn{
 71 |       text-align: right;
 72 |   }
 73 |   @media(max-width: 540px){
 74 |       #show-demo-images-btn{
 75 |         text-align: center;
 76 | 
 77 |       }
 78 |   }
 79 | 
 80 | .dz-upload { 
 81 |     display: block; 
 82 |     background-color: red; 
 83 |     height: 10px;
 84 |     width: 0%;
 85 | }
 86 | 
 87 | p, h1,h2,h3,h4, font, body{
 88 |   font-weight: 300 !important;
 89 |   font-family: 'Roboto', sans-serif !important;
 90 | }
 91 | 
 92 | 
 93 | </style>
 94 | 
 95 | <div id="socket-error" class="modal hide fade" tabindex="-1" data-width="760">
 96 |   <div class="modal-header">
 97 |     <button type="button" class="close" data-dismiss="modal" aria-hidden="true">×</button>
 98 |     <h3>Socket Error</h3>
 99 |   </div>
100 |   <div class="modal-body">
101 |     <div class="row-fluid">
102 |       Socket connection cannot be established on port 8000 which is required to communicate with the CloudCV Servers. Please make sure that port 8000 is open and not blocked by firewall on your system.<br>
103 |     </div>
104 |   </div>
105 |   <div class="modal-footer">
106 |     <button type="button" data-dismiss="modal" class="btn">Close</button>
107 |   </div>
108 | </div>
109 | 
110 | {% block header_content %}
111 | 
112 |   <div class="container">
113 |       <div class="page-header">
114 |         <h1 align="center">CloudCV Sample Demo Heading </h1>
115 |         <h3 align="center">More details about the VQA dataset can be found <a href="http://visualqa.org/">here.</a></h3>
116 |         <h3 align="center">State-of-the-art VQA model and code available <a href="https://github.com/VT-vision-lab/VQA_LSTM_CNN">here</a></h3>
117 |         <br>
118 |         <font size="4">
119 |           <p style="text-align:center;"><font size="4">CloudCV can answer questions you ask about an image</font><br><br>
120 |               <span style="font-size: 14px;">Browsers currently supported: Google Chrome, Mozilla Firefox</span>
121 |           </p>
122 |         </font>
123 |       <br><br>
124 |     </div>
125 |   </div>
126 | 
127 | {% endblock %}
128 | 
129 | {% block demo_images %}
130 | 
131 | <div class="container">
132 |     <div class="page-header">
133 |         <h2>Try Grad-CAM: Sample Images</h2>
134 |         <br>
135 |         <div class="row">
136 |             <div class="col-md-8 col-xs-12">
137 |                 <font size="4">Click on one of these images to send it to our servers (Or <a class="button_link" onclick="scrollToElement($('#userImages'))">upload</a>
138 |                     your own images below)</font>
139 |             </div>
140 |             <div id="show-demo-images-btn" class="col-md-4">
141 |             <button  class="btn btn-info">Show Demo Images</button>
142 |             </div>
143 |         </div>
144 |          <div class="row hiddenDiv demoImages" id="demoImages1">
145 |             <img src="/media/grad_cam/demo_vqa/COCO_val2014_000000003501.jpg "
146 |                  onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
147 |             <img src="/media/grad_cam/demo_vqa/firehydrant.jpg"
148 |                  onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
149 |             <img src="/media/grad_cam/demo_vqa/COCO_val2014_000000237618.jpg"
150 |                  onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
151 |          </div>
152 |          <div class="row hiddenDiv demoImages" id="demoImages2">
153 |             <img src="/media/grad_cam/demo_vqa/COCO_val2014_000000184402.jpg"
154 |                  onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
155 |             <img src="/media/grad_cam/demo_vqa/COCO_val2014_000000393056.jpg"
156 |                  onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
157 |             <img src="/media/grad_cam/demo_vqa/COCO_val2014_000000240731.jpg"
158 |                  onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
159 |             <br>
160 |          </div>
161 |         <div class="row randomImages" id="demoImages3">
162 |             <img src="{{ demo_images.0 }}"
163 |                   onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
164 |             <img src="{{ demo_images.1 }}"
165 |                   onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
166 |             <img src="{{ demo_images.2 }}"
167 |                   onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
168 |         </div>
169 |         <div class="row randomImages" id="demoImages4">
170 |             <img src="{{ demo_images.3 }}"
171 |                   onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
172 |             <img src="{{ demo_images.4 }}"
173 |                   onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
174 |             <img src="{{ demo_images.5 }}"
175 |                   onclick="submitDemoImage(this.src)" class="demo_img col-md-4"></img>
176 |              <br>
177 |         </div>
178 |         Note: nothing is pre-computed for these images. They are treated as a fresh upload with every click.
179 |     </div>
180 | </div>
181 | 
182 | 
183 | {% endblock %}
184 | 
185 | {% block form %}
186 | {% endblock %}
187 | 
188 | {% block terminal %}
189 | 
190 | <div class="container">
191 |         <h3 id="termstart">Terminal: </h3>
192 | 
193 |         <div id="Console"
194 |              style="height:300px; color: #FFFFFF; background-color: #2B2A2B; overflow:scroll; padding: 10px;">
195 |             <ul id="comments" style='list-style-type:none;'>
196 |             </ul>
197 |         </div>
198 |         <br>
199 | 
200 |         <div id="underTheHood">
201 |             <p><h3>How it works</h3></p>
202 |           <font size="4">
203 |                 <ol>
204 |                     <li>You upload an image.</li>
205 |                     <li>Your request is sent to our servers with GPUs courtesy NVIDIA.</li>
206 |                     <li>Our servers run our deep-learning based algorithm.</li>
207 |                     <li>Results and updates are shown in real-time.</li>    
208 |                 </ol>
209 |             </font><br><br>
210 |         </div>
211 | 
212 | {% endblock %}
213 | 
214 | {% block result %}
215 | 
216 | {% endblock %}
217 | 
218 | {% block credits %}
219 | 
220 |   <div id="creditSection">
221 |     <h3> Credits </h3>
222 |     <font size="4">
223 |       <a href="#">Sample Credit Link Section</a><br>
224 |         Deshraj Yadav, Harsh Agarwal, Dhruv Batra
225 |       <br><br>
226 |     </font>
227 |     <br>
228 |   </div>
229 | {% endblock %}
230 | 
231 |   </div>
232 | 
233 | <script>
234 |     var socketid;
235 |     var demo_running=0;
236 |     // Page-level globals: socketid is declared without a value and demo_running starts at 0; no other code in base.html reads or writes them.
237 | </script>
238 | <script>
239 |     var isOpera = (!!window.opr && !!opr.addons) || !!window.opera || navigator.userAgent.indexOf(' OPR/') >= 0; // browser-sniffing flags, evaluated once when this script runs
240 |     var isFirefox = typeof InstallTrigger !== 'undefined';
241 |     var isSafari = Object.prototype.toString.call(window.HTMLElement).indexOf('Constructor') > 0;
242 |     var isIE = /*@cc_on!@*/false || !!document.documentMode;
243 |     var isEdge = !isIE && !!window.StyleMedia;
244 |     var isChrome = !!window.chrome && !!window.chrome.webstore; // NOTE(review): window.chrome.webstore appears to be absent in recent Chrome releases, so this may report false - confirm before relying on it
245 |     var isBlink = (isChrome || isOpera) && !!window.CSS; // no other code in base.html reads these flags
246 |     var getUrlParameter = function getUrlParameter(sParam) {
247 |         var sPageURL = decodeURIComponent(window.location.search.substring(1)),
248 |             sURLVariables = sPageURL.split('&'),
249 |             sParameterName,
250 |             i;
251 | 
252 |         for (i = 0; i < sURLVariables.length; i++) {
253 |             sParameterName = sURLVariables[i].split('=');
254 | 
255 |             if (sParameterName[0] === sParam) {
256 |                 return sParameterName[1] === undefined ? true : sParameterName[1];
257 |             }
258 |         }
259 |     };
260 | 
261 | </script>
262 | 
263 | <script>
264 |   function scrollToElement(dstElement) {
265 |     try
266 |     {
267 |       var scrollPixels = dstElement.offset().top - $(".navbar-fixed-top").height()-30;
268 |       $('html, body').animate({
269 |       scrollTop: scrollPixels
270 |       }, 2000);
271 |     }
272 |     catch(err)
273 |     {
274 |         console.log(err);
275 |     }
276 |   }
277 | 
278 |   function submitForm(src, id){
279 |       //Change the image to loading jpeg
280 |       console.log("Submitted question.");
281 |       $('#comments').prepend('<li>' + "Asking the question..." + '</li>');
282 |       console.log(src);
283 | 
284 |       var txtArea = document.getElementById("txt"+id);
285 | 
286 |       $.ajax({
287 |         type    : 'POST', // define the type of HTTP verb we want to use (POST for our form)
288 |         url     : '{% url 'upload' %}', // the url where we want to POST
289 |         data    : {'src':src, } // our data object
290 |       })
291 |     .done(function(data) {
292 |       data = JSON.parse(data);
293 |       console.log(data);
294 |     });
295 |   }
296 | 
297 | </script>
298 | 
299 | <script>
300 | 
301 |   $(document).ready(function() {
302 |     $("#show-demo-images-btn button").click(function() {
303 |         if($(this).text() == "Show Demo Images") {
304 |             $(this).text("Show Random Images");
305 |             $('#demoImages3').hide();
306 |             $('#demoImages4').hide();
307 |             $('#demoImages1').show();
308 |             $('#demoImages2').show();
309 |         } else if($(this).text() == "Show Random Images") {
310 |             $(this).text("Show Demo Images");
311 |             $('#demoImages1').hide();
312 |             $('#demoImages2').hide();
313 |             $('#demoImages3').show();
314 |             $('#demoImages4').show();
315 |         } else {
316 |             alert("An error occured. We will fix it soon.");
317 |         }
318 |     });
319 |   });
320 | 
321 | </script>
322 | 
323 | <script type="text/javascript">
324 |     $("#question").keypress(function(event) { // Enter (key code 13) in a non-empty #question moves focus to #answer
325 |         if (event.which == 13) {
326 |           if ($("#question").val().length){
327 |             console.log("shift focus to answer");
328 |             $("#answer").focus();
329 |           }
330 |         }
331 |     });
332 |     // Enter in #answer submits the VQA request; submitImageForVqa is not defined in base.html (presumably supplied by the VQA page - confirm).
333 |         $("#answer").keypress(function(event) {
334 |         if (event.which == 13) {
335 |             submitImageForVqa();
336 |             console.log("submited the form");
337 |         }
338 |     });
339 |     // Enter in #Caption submits the captioning request; submitImageForCaptioning is defined in captioning/captioning.html.
340 |         $("#Caption").keypress(function(event) {
341 |         if (event.which == 13) {
342 |             submitImageForCaptioning();
343 |             console.log("submited the form");
344 |         }
345 |     });
346 |     // Enter in #label submits the classification request; submitImageForClassification is not defined in base.html (presumably supplied by the classification page - confirm).
347 |         $("#label").keypress(function(event) {
348 |         if (event.which == 13) {
349 |             submitImageForClassification();
350 |             console.log("submited the form");
351 |         }
352 |     });
353 | </script>
354 | <script>
355 |   (function(i,s,o,g,r,a,m){i['GoogleAnalyticsObject']=r;i[r]=i[r]||function(){
356 |   (i[r].q=i[r].q||[]).push(arguments)},i[r].l=1*new Date();a=s.createElement(o),
357 |   m=s.getElementsByTagName(o)[0];a.async=1;a.src=g;m.parentNode.insertBefore(a,m)
358 |   })(window,document,'script','https://www.google-analytics.com/analytics.js','ga');
359 |   // The loader above defines window.ga as a queueing stub and injects analytics.js asynchronously; the calls below go through that stub.
360 |   ga('create', 'UA-53104159-4', 'auto');
361 |   ga('send', 'pageview');
362 | 
363 | </script>
364 | </body>
365 | </html>
366 | 


--------------------------------------------------------------------------------
/grad_cam/templates/classification/classification.html:
--------------------------------------------------------------------------------
  1 | {% extends 'base.html' %}
  2 | 
  3 | {% block header_content %}
  4 | <!-- "Fork me on GitHub" ribbon, fixed to the top-right corner of the viewport -->
  5 | <a href="https://github.com/Cloud-CV/Grad-CAM" target="_blank"><img style="position: fixed; top: 0; right: 0; border: 0; z-index:2000;" src="https://camo.githubusercontent.com/365986a132ccd6a44c23a9169022c0b5c890c387/68747470733a2f2f73332e616d617a6f6e6177732e636f6d2f6769746875622f726962626f6e732f666f726b6d655f72696768745f7265645f6161303030302e706e67" alt="Fork me on GitHub" data-canonical-src="https://s3.amazonaws.com/github/ribbons/forkme_right_red_aa0000.png"></a>
  6 | <!-- Page title, one-line description of the classification demo, and a link to the Torch code -->
  7 | <div class="container">
  8 |     <div class="page-header">
  9 |         <h1 align="center">Grad-CAM: Gradient-weighted Class Activation Mapping</h1>
 10 |         <br><h4>Grad-CAM highlights regions of the image the classification model looks at while making predictions.</h4>
 11 |         <font size="4">
 12 |             <p>
 13 |                 Torch code for Grad-CAM is available <a href="//github.com/ramprs/grad-cam">here</a>. Browsers currently supported by the demo: Google Chrome, Mozilla Firefox.
 14 |             </p>
 15 |         </font>
 16 |     </div>
 17 | </div>
 18 | 
 19 | {% endblock %}
 20 | 
 21 | 
 22 | {% block demo_images %}
 23 | <!-- Sample gallery: rows 1-2 are fixed demo images (class hiddenDiv, presumably hidden by CSS until toggled), rows 3-4 come from the demo_images context variable; clicking any image calls submitDemoImage(). -->
 24 | <div class="container">
 25 |     <div class="page-header">
 26 |         <h2>Try Grad-CAM: Sample Images</h2>
 27 |         <br>
 28 |         <div class="row">
 29 |             <div class="col-md-8 col-xs-12">
 30 |                 <font size="4">Click on one of these images to send it to our servers (Or <a class="button_link" onclick="scrollToElement($('#userImages'))">upload</a>
 31 |                     your own images below)</font>
 32 |             </div>
 33 |             <div id="show-demo-images-btn" class="col-md-4">
 34 |             <button  class="btn btn-info">Show Demo Images</button>
 35 |             </div>
 36 |         </div>
 37 |          <div class="row hiddenDiv demoImages" id="demoImages1">
 38 |             <img src="/media/grad_cam/demo_classification/COCO_train2014_000000114269.jpg" alt="Demo image"
 39 |                  onclick="submitDemoImage(this.src)" class="demo_img col-md-4">
 40 |             <img src="/media/grad_cam/demo_classification/COCO_train2014_000000125586.jpg" alt="Demo image"
 41 |                  onclick="submitDemoImage(this.src)" class="demo_img col-md-4">
 42 |             <img src="/media/grad_cam/demo_classification/COCO_train2014_000000527338.jpg" alt="Demo image"
 43 |                  onclick="submitDemoImage(this.src)" class="demo_img col-md-4">
 44 |          </div>
 45 |          <div class="row hiddenDiv demoImages" id="demoImages2">
 46 |             <img src="/media/grad_cam/demo_vqa/COCO_val2014_000000184402.jpg" alt="Demo image"
 47 |                  onclick="submitDemoImage(this.src)" class="demo_img col-md-4">
 48 |             <img src="/media/grad_cam/demo_vqa/COCO_val2014_000000393056.jpg" alt="Demo image"
 49 |                  onclick="submitDemoImage(this.src)" class="demo_img col-md-4">
 50 |             <img src="/media/grad_cam/demo_vqa/COCO_val2014_000000240731.jpg" alt="Demo image"
 51 |                  onclick="submitDemoImage(this.src)" class="demo_img col-md-4">
 52 |             <br>
 53 |          </div>
 54 |         <div class="row randomImages" id="demoImages3">
 55 |             <img src="{{ demo_images.0 }}" alt="Random sample image"
 56 |                   onclick="submitDemoImage(this.src)" class="demo_img col-md-4">
 57 |             <img src="{{ demo_images.1 }}" alt="Random sample image"
 58 |                   onclick="submitDemoImage(this.src)" class="demo_img col-md-4">
 59 |             <img src="{{ demo_images.2 }}" alt="Random sample image"
 60 |                   onclick="submitDemoImage(this.src)" class="demo_img col-md-4">
 61 |         </div>
 62 |         <div class="row randomImages" id="demoImages4">
 63 |             <img src="{{ demo_images.3 }}" alt="Random sample image"
 64 |                   onclick="submitDemoImage(this.src)" class="demo_img col-md-4">
 65 |             <img src="{{ demo_images.4 }}" alt="Random sample image"
 66 |                   onclick="submitDemoImage(this.src)" class="demo_img col-md-4">
 67 |             <img src="{{ demo_images.5 }}" alt="Random sample image"
 68 |                   onclick="submitDemoImage(this.src)" class="demo_img col-md-4">
 69 |              <br>
 70 |         </div>
 71 |         Note: nothing is pre-computed for these images. They are treated as a fresh upload with every click.
 72 |     </div>
 73 | </div>
 74 | </div>
 75 | <!-- NOTE(review): the last closing div above has no opening tag inside this block; presumably it pairs with one in base.html - confirm. -->
 76 | {% endblock %}
 77 | 
 78 | 
 79 | {% block form %}
 80 | <!-- Upload section: submit an image by URL (included partial) or through the Dropzone form below -->
 81 | <div class="container">
 82 |   <div class="page-header">
 83 |     <h2 id="userImages">Try Grad-CAM On Your Images</h2>
 84 |   </div>
 85 |   {% block url_content %}
 86 |     {% include 'upload_image_url.html' %}
 87 |   {% endblock %}
 88 |   <div class="col-sm-12">
 89 |     <h3 align="center">OR</h3>
 90 |   </div>
 91 |   <div class="container">
 92 |     <form id="my-dropzone" method="post" class="dropzone
 93 |     " action="{% url "upload" %}" enctype="multipart/form-data">
 94 |     {% csrf_token %}
 95 |       <input type="hidden" id="demoType" name="demo_type" value=""> 
 96 |       <input type="hidden" id="appType" name="type" value="classification">
 97 |     <!-- demoType starts empty and is set to "uploadedImageType" by the Dropzone success handler; appType presumably tells the upload view which demo posted the file - confirm -->
 98 |     {% include 'form.html' %}
 99 |     </form>
100 |   </div>
101 | <!-- NOTE(review): the outer container opened at the top of this block is not closed here; presumably a later block closes it - confirm. -->
102 | {% endblock %}
103 | 
104 | {% block result %}
105 | <style type="text/css">
106 | /* Caption text under each result image; the !important size wins over the inline font-size set on those elements */
107 |   .caption {
108 |     /*display: block;*/
109 |     /*text-align: center;*/
110 |     font-size: 18px !important;
111 |     font-weight: bold;
112 | }
113 | /* Elements that display the requested and the predicted label text */
114 | #inputLabel, #predictedLabel{
115 |     font-weight: bold;
116 | }
117 | /* .under / .over: two absolutely positioned layers; .over has the higher z-index and is multiply-blended with what is behind it */
118 | .under{
119 | position:absolute;
120 | /*left:0px;
121 | top:0px;*/
122 | z-index:-1;
123 | }
124 | 
125 | .over
126 | {
127 | position:absolute;
128 | /*left:40px;*/
129 | /*top:10px;*/
130 | z-index:0;
131 | mix-blend-mode: multiply;
132 | }
133 | /* 350px top padding, presumably to push the caption below the absolutely positioned 350px-high images - confirm */
134 | #gradCamCaption{
135 |   position: relative;
136 |   padding-top: 350px;
137 | }
138 | /* Fixed 350x350 box for each result image */
139 | .finalImages{
140 |   width: 350px !important;
141 |   height: 350px !important;
142 |   padding: 6px;
143 | }
144 | /* Bottom spacing for the result text rows */
145 | .resultText{
146 |   margin-bottom: 15px !important;
147 | }
148 | </style>
149 | 
150 | <script type="text/javascript">
151 | 
152 | var labels={"1":"tench","2":"goldfish","3":"great white shark","4":"tiger shark","5":"hammerhead","6":"electric ray","7":"stingray","8":"cock","9":"hen","10":"ostrich","11":"brambling","12":"goldfinch","13":"house finch","14":"junco","15":"indigo bunting","16":"robin","17":"bulbul","18":"jay","19":"magpie","20":"chickadee","21":"water ouzel","22":"kite","23":"bald eagle","24":"vulture","25":"great grey owl","26":"European fire salamander","27":"common newt","28":"eft","29":"spotted salamander","30":"axolotl","31":"bullfrog","32":"tree frog","33":"tailed frog","34":"loggerhead","35":"leatherback turtle","36":"mud turtle","37":"terrapin","38":"box turtle","39":"banded gecko","40":"common iguana","41":"American chameleon","42":"whiptail","43":"agama","44":"frilled lizard","45":"alligator lizard","46":"Gila monster","47":"green lizard","48":"African chameleon","49":"Komodo dragon","50":"African crocodile","51":"American alligator","52":"triceratops","53":"thunder snake","54":"ringneck snake","55":"hognose snake","56":"green snake","57":"king snake","58":"garter snake","59":"water snake","60":"vine snake","61":"night snake","62":"boa constrictor","63":"rock python","64":"Indian cobra","65":"green mamba","66":"sea snake","67":"horned viper","68":"diamondback","69":"sidewinder","70":"trilobite","71":"harvestman","72":"scorpion","73":"black and gold garden spider","74":"barn spider","75":"garden spider","76":"black widow","77":"tarantula","78":"wolf spider","79":"tick","80":"centipede","81":"black grouse","82":"ptarmigan","83":"ruffed grouse","84":"prairie chicken","85":"peacock","86":"quail","87":"partridge","88":"African grey","89":"macaw","90":"sulphur-crested cockatoo","91":"lorikeet","92":"coucal","93":"bee eater","94":"hornbill","95":"hummingbird","96":"jacamar","97":"toucan","98":"drake","99":"red-breasted merganser","100":"goose","101":"black 
swan","102":"tusker","103":"echidna","104":"platypus","105":"wallaby","106":"koala","107":"wombat","108":"jellyfish","109":"sea anemone","110":"brain coral","111":"flatworm","112":"nematode","113":"conch","114":"snail","115":"slug","116":"sea slug","117":"chiton","118":"chambered nautilus","119":"Dungeness crab","120":"rock crab","121":"fiddler crab","122":"king crab","123":"American lobster","124":"spiny lobster","125":"crayfish","126":"hermit crab","127":"isopod","128":"white stork","129":"black stork","130":"spoonbill","131":"flamingo","132":"little blue heron","133":"American egret","134":"bittern","135":"crane","136":"limpkin","137":"European gallinule","138":"American coot","139":"bustard","140":"ruddy turnstone","141":"red-backed sandpiper","142":"redshank","143":"dowitcher","144":"oystercatcher","145":"pelican","146":"king penguin","147":"albatross","148":"grey whale","149":"killer whale","150":"dugong","151":"sea lion","152":"Chihuahua","153":"Japanese spaniel","154":"Maltese dog","155":"Pekinese","156":"Shih-Tzu","157":"Blenheim spaniel","158":"papillon","159":"toy terrier","160":"Rhodesian ridgeback","161":"Afghan hound","162":"basset","163":"beagle","164":"bloodhound","165":"bluetick","166":"black-and-tan coonhound","167":"Walker hound","168":"English foxhound","169":"redbone","170":"borzoi","171":"Irish wolfhound","172":"Italian greyhound","173":"whippet","174":"Ibizan hound","175":"Norwegian elkhound","176":"otterhound","177":"Saluki","178":"Scottish deerhound","179":"Weimaraner","180":"Staffordshire bullterrier","181":"American Staffordshire terrier","182":"Bedlington terrier","183":"Border terrier","184":"Kerry blue terrier","185":"Irish terrier","186":"Norfolk terrier","187":"Norwich terrier","188":"Yorkshire terrier","189":"wire-haired fox terrier","190":"Lakeland terrier","191":"Sealyham terrier","192":"Airedale","193":"cairn","194":"Australian terrier","195":"Dandie Dinmont","196":"Boston bull","197":"miniature schnauzer","198":"giant 
schnauzer","199":"standard schnauzer","200":"Scotch terrier","201":"Tibetan terrier","202":"silky terrier","203":"soft-coated wheaten terrier","204":"West Highland white terrier","205":"Lhasa","206":"flat-coated retriever","207":"curly-coated retriever","208":"golden retriever","209":"Labrador retriever","210":"Chesapeake Bay retriever","211":"German short-haired pointer","212":"vizsla","213":"English setter","214":"Irish setter","215":"Gordon setter","216":"Brittany spaniel","217":"clumber","218":"English springer","219":"Welsh springer spaniel","220":"cocker spaniel","221":"Sussex spaniel","222":"Irish water spaniel","223":"kuvasz","224":"schipperke","225":"groenendael","226":"malinois","227":"briard","228":"kelpie","229":"komondor","230":"Old English sheepdog","231":"Shetland sheepdog","232":"collie","233":"Border collie","234":"Bouvier des Flandres","235":"Rottweiler","236":"German shepherd","237":"Doberman","238":"miniature pinscher","239":"Greater Swiss Mountain dog","240":"Bernese mountain dog","241":"Appenzeller","242":"EntleBucher","243":"boxer","244":"bull mastiff","245":"Tibetan mastiff","246":"French bulldog","247":"Great Dane","248":"Saint Bernard","249":"Eskimo dog","250":"malamute","251":"Siberian husky","252":"dalmatian","253":"affenpinscher","254":"basenji","255":"pug","256":"Leonberg","257":"Newfoundland","258":"Great Pyrenees","259":"Samoyed","260":"Pomeranian","261":"chow","262":"keeshond","263":"Brabancon griffon","264":"Pembroke","265":"Cardigan","266":"toy poodle","267":"miniature poodle","268":"standard poodle","269":"Mexican hairless","270":"timber wolf","271":"white wolf","272":"red wolf","273":"coyote","274":"dingo","275":"dhole","276":"African hunting dog","277":"hyena","278":"red fox","279":"kit fox","280":"Arctic fox","281":"grey fox","282":"tabby","283":"tiger cat","284":"Persian cat","285":"Siamese cat","286":"Egyptian cat","287":"cougar","288":"lynx","289":"leopard","290":"snow 
leopard","291":"jaguar","292":"lion","293":"tiger","294":"cheetah","295":"brown bear","296":"American black bear","297":"ice bear","298":"sloth bear","299":"mongoose","300":"meerkat","301":"tiger beetle","302":"ladybug","303":"ground beetle","304":"long-horned beetle","305":"leaf beetle","306":"dung beetle","307":"rhinoceros beetle","308":"weevil","309":"fly","310":"bee","311":"ant","312":"grasshopper","313":"cricket","314":"walking stick","315":"cockroach","316":"mantis","317":"cicada","318":"leafhopper","319":"lacewing","320":"dragonfly","321":"damselfly","322":"admiral","323":"ringlet","324":"monarch","325":"cabbage butterfly","326":"sulphur butterfly","327":"lycaenid","328":"starfish","329":"sea urchin","330":"sea cucumber","331":"wood rabbit","332":"hare","333":"Angora","334":"hamster","335":"porcupine","336":"fox squirrel","337":"marmot","338":"beaver","339":"guinea pig","340":"sorrel","341":"zebra","342":"hog","343":"wild boar","344":"warthog","345":"hippopotamus","346":"ox","347":"water buffalo","348":"bison","349":"ram","350":"bighorn","351":"ibex","352":"hartebeest","353":"impala","354":"gazelle","355":"Arabian camel","356":"llama","357":"weasel","358":"mink","359":"polecat","360":"black-footed ferret","361":"otter","362":"skunk","363":"badger","364":"armadillo","365":"three-toed sloth","366":"orangutan","367":"gorilla","368":"chimpanzee","369":"gibbon","370":"siamang","371":"guenon","372":"patas","373":"baboon","374":"macaque","375":"langur","376":"colobus","377":"proboscis monkey","378":"marmoset","379":"capuchin","380":"howler monkey","381":"titi","382":"spider monkey","383":"squirrel monkey","384":"Madagascar cat","385":"indri","386":"Indian elephant","387":"African elephant","388":"lesser panda","389":"giant panda","390":"barracouta","391":"eel","392":"coho","393":"rock beauty","394":"anemone fish","395":"sturgeon","396":"gar","397":"lionfish","398":"puffer","399":"abacus","400":"abaya","401":"academic gown","402":"accordion","403":"acoustic 
guitar","404":"aircraft carrier","405":"airliner","406":"airship","407":"altar","408":"ambulance","409":"amphibian","410":"analog clock","411":"apiary","412":"apron","413":"ashcan","414":"assault rifle","415":"backpack","416":"bakery","417":"balance beam","418":"balloon","419":"ballpoint","420":"Band Aid","421":"banjo","422":"bannister","423":"barbell","424":"barber chair","425":"barbershop","426":"barn","427":"barometer","428":"barrel","429":"barrow","430":"baseball","431":"basketball","432":"bassinet","433":"bassoon","434":"bathing cap","435":"bath towel","436":"bathtub","437":"beach wagon","438":"beacon","439":"beaker","440":"bearskin","441":"beer bottle","442":"beer glass","443":"bell cote","444":"bib","445":"bicycle-built-for-two","446":"bikini","447":"binder","448":"binoculars","449":"birdhouse","450":"boathouse","451":"bobsled","452":"bolo tie","453":"bonnet","454":"bookcase","455":"bookshop","456":"bottlecap","457":"bow","458":"bow tie","459":"brass","460":"brassiere","461":"breakwater","462":"breastplate","463":"broom","464":"bucket","465":"buckle","466":"bulletproof vest","467":"bullet train","468":"butcher shop","469":"cab","470":"caldron","471":"candle","472":"cannon","473":"canoe","474":"can opener","475":"cardigan","476":"car mirror","477":"carousel","478":"carpenter's kit","479":"carton","480":"car wheel","481":"cash machine","482":"cassette","483":"cassette player","484":"castle","485":"catamaran","486":"CD player","487":"cello","488":"cellular telephone","489":"chain","490":"chainlink fence","491":"chain mail","492":"chain saw","493":"chest","494":"chiffonier","495":"chime","496":"china cabinet","497":"Christmas stocking","498":"church","499":"cinema","500":"cleaver","501":"cliff dwelling","502":"cloak","503":"clog","504":"cocktail shaker","505":"coffee mug","506":"coffeepot","507":"coil","508":"combination lock","509":"computer keyboard","510":"confectionery","511":"container ship","512":"convertible","513":"corkscrew","514":"cornet","515":"cowboy 
boot","516":"cowboy hat","517":"cradle","518":"crane","519":"crash helmet","520":"crate","521":"crib","522":"Crock Pot","523":"croquet ball","524":"crutch","525":"cuirass","526":"dam","527":"desk","528":"desktop computer","529":"dial telephone","530":"diaper","531":"digital clock","532":"digital watch","533":"dining table","534":"dishrag","535":"dishwasher","536":"disk brake","537":"dock","538":"dogsled","539":"dome","540":"doormat","541":"drilling platform","542":"drum","543":"drumstick","544":"dumbbell","545":"Dutch oven","546":"electric fan","547":"electric guitar","548":"electric locomotive","549":"entertainment center","550":"envelope","551":"espresso maker","552":"face powder","553":"feather boa","554":"file","555":"fireboat","556":"fire engine","557":"fire screen","558":"flagpole","559":"flute","560":"folding chair","561":"football helmet","562":"forklift","563":"fountain","564":"fountain pen","565":"four-poster","566":"freight car","567":"French horn","568":"frying pan","569":"fur coat","570":"garbage truck","571":"gasmask","572":"gas pump","573":"goblet","574":"go-kart","575":"golf ball","576":"golfcart","577":"gondola","578":"gong","579":"gown","580":"grand piano","581":"greenhouse","582":"grille","583":"grocery store","584":"guillotine","585":"hair slide","586":"hair spray","587":"half track","588":"hammer","589":"hamper","590":"hand blower","591":"hand-held computer","592":"handkerchief","593":"hard disc","594":"harmonica","595":"harp","596":"harvester","597":"hatchet","598":"holster","599":"home theater","600":"honeycomb","601":"hook","602":"hoopskirt","603":"horizontal bar","604":"horse cart","605":"hourglass","606":"iPod","607":"iron","608":"jack-o'-lantern","609":"jean","610":"jeep","611":"jersey","612":"jigsaw puzzle","613":"jinrikisha","614":"joystick","615":"kimono","616":"knee pad","617":"knot","618":"lab coat","619":"ladle","620":"lampshade","621":"laptop","622":"lawn mower","623":"lens cap","624":"letter 
opener","625":"library","626":"lifeboat","627":"lighter","628":"limousine","629":"liner","630":"lipstick","631":"Loafer","632":"lotion","633":"loudspeaker","634":"loupe","635":"lumbermill","636":"magnetic compass","637":"mailbag","638":"mailbox","639":"maillot","640":"maillot","641":"manhole cover","642":"maraca","643":"marimba","644":"mask","645":"matchstick","646":"maypole","647":"maze","648":"measuring cup","649":"medicine chest","650":"megalith","651":"microphone","652":"microwave","653":"military uniform","654":"milk can","655":"minibus","656":"miniskirt","657":"minivan","658":"missile","659":"mitten","660":"mixing bowl","661":"mobile home","662":"Model T","663":"modem","664":"monastery","665":"monitor","666":"moped","667":"mortar","668":"mortarboard","669":"mosque","670":"mosquito net","671":"motor scooter","672":"mountain bike","673":"mountain tent","674":"mouse","675":"mousetrap","676":"moving van","677":"muzzle","678":"nail","679":"neck brace","680":"necklace","681":"nipple","682":"notebook","683":"obelisk","684":"oboe","685":"ocarina","686":"odometer","687":"oil filter","688":"organ","689":"oscilloscope","690":"overskirt","691":"oxcart","692":"oxygen mask","693":"packet","694":"paddle","695":"paddlewheel","696":"padlock","697":"paintbrush","698":"pajama","699":"palace","700":"panpipe","701":"paper towel","702":"parachute","703":"parallel bars","704":"park bench","705":"parking meter","706":"passenger car","707":"patio","708":"pay-phone","709":"pedestal","710":"pencil box","711":"pencil sharpener","712":"perfume","713":"Petri dish","714":"photocopier","715":"pick","716":"pickelhaube","717":"picket fence","718":"pickup","719":"pier","720":"piggy bank","721":"pill bottle","722":"pillow","723":"ping-pong ball","724":"pinwheel","725":"pirate","726":"pitcher","727":"plane","728":"planetarium","729":"plastic bag","730":"plate rack","731":"plow","732":"plunger","733":"Polaroid camera","734":"pole","735":"police van","736":"poncho","737":"pool table","738":"pop 
bottle","739":"pot","740":"potter's wheel","741":"power drill","742":"prayer rug","743":"printer","744":"prison","745":"projectile","746":"projector","747":"puck","748":"punching bag","749":"purse","750":"quill","751":"quilt","752":"racer","753":"racket","754":"radiator","755":"radio","756":"radio telescope","757":"rain barrel","758":"recreational vehicle","759":"reel","760":"reflex camera","761":"refrigerator","762":"remote control","763":"restaurant","764":"revolver","765":"rifle","766":"rocking chair","767":"rotisserie","768":"rubber eraser","769":"rugby ball","770":"rule","771":"running shoe","772":"safe","773":"safety pin","774":"saltshaker","775":"sandal","776":"sarong","777":"sax","778":"scabbard","779":"scale","780":"school bus","781":"schooner","782":"scoreboard","783":"screen","784":"screw","785":"screwdriver","786":"seat belt","787":"sewing machine","788":"shield","789":"shoe shop","790":"shoji","791":"shopping basket","792":"shopping cart","793":"shovel","794":"shower cap","795":"shower curtain","796":"ski","797":"ski mask","798":"sleeping bag","799":"slide rule","800":"sliding door","801":"slot","802":"snorkel","803":"snowmobile","804":"snowplow","805":"soap dispenser","806":"soccer ball","807":"sock","808":"solar dish","809":"sombrero","810":"soup bowl","811":"space bar","812":"space heater","813":"space shuttle","814":"spatula","815":"speedboat","816":"spider web","817":"spindle","818":"sports car","819":"spotlight","820":"stage","821":"steam locomotive","822":"steel arch bridge","823":"steel drum","824":"stethoscope","825":"stole","826":"stone wall","827":"stopwatch","828":"stove","829":"strainer","830":"streetcar","831":"stretcher","832":"studio couch","833":"stupa","834":"submarine","835":"suit","836":"sundial","837":"sunglass","838":"sunglasses","839":"sunscreen","840":"suspension bridge","841":"swab","842":"sweatshirt","843":"swimming trunks","844":"swing","845":"switch","846":"syringe","847":"table lamp","848":"tank","849":"tape 
player","850":"teapot","851":"teddy","852":"television","853":"tennis ball","854":"thatch","855":"theater curtain","856":"thimble","857":"thresher","858":"throne","859":"tile roof","860":"toaster","861":"tobacco shop","862":"toilet seat","863":"torch","864":"totem pole","865":"tow truck","866":"toyshop","867":"tractor","868":"trailer truck","869":"tray","870":"trench coat","871":"tricycle","872":"trimaran","873":"tripod","874":"triumphal arch","875":"trolleybus","876":"trombone","877":"tub","878":"turnstile","879":"typewriter keyboard","880":"umbrella","881":"unicycle","882":"upright","883":"vacuum","884":"vase","885":"vault","886":"velvet","887":"vending machine","888":"vestment","889":"viaduct","890":"violin","891":"volleyball","892":"waffle iron","893":"wall clock","894":"wallet","895":"wardrobe","896":"warplane","897":"washbasin","898":"washer","899":"water bottle","900":"water jug","901":"water tower","902":"whiskey jug","903":"whistle","904":"wig","905":"window screen","906":"window shade","907":"Windsor tie","908":"wine bottle","909":"wing","910":"wok","911":"wooden spoon","912":"wool","913":"worm fence","914":"wreck","915":"yawl","916":"yurt","917":"web site","918":"comic book","919":"crossword puzzle","920":"street sign","921":"traffic light","922":"book jacket","923":"menu","924":"plate","925":"guacamole","926":"consomme","927":"hot pot","928":"trifle","929":"ice cream","930":"ice lolly","931":"French loaf","932":"bagel","933":"pretzel","934":"cheeseburger","935":"hotdog","936":"mashed potato","937":"head cabbage","938":"broccoli","939":"cauliflower","940":"zucchini","941":"spaghetti squash","942":"acorn squash","943":"butternut squash","944":"cucumber","945":"artichoke","946":"bell pepper","947":"cardoon","948":"mushroom","949":"Granny Smith","950":"strawberry","951":"orange","952":"lemon","953":"fig","954":"pineapple","955":"banana","956":"jackfruit","957":"custard apple","958":"pomegranate","959":"hay","960":"carbonara","961":"chocolate 
sauce","962":"dough","963":"meat loaf","964":"pizza","965":"potpie","966":"burrito","967":"red wine","968":"espresso","969":"cup","970":"eggnog","971":"alp","972":"bubble","973":"cliff","974":"coral reef","975":"geyser","976":"lakeside","977":"promontory","978":"sandbar","979":"seashore","980":"valley","981":"volcano","982":"ballplayer","983":"groom","984":"scuba diver","985":"rapeseed","986":"daisy","987":"yellow lady's slipper","988":"corn","989":"acorn","990":"hip","991":"buckeye","992":"coral fungus","993":"agaric","994":"gyromitra","995":"stinkhorn","996":"earthstar","997":"hen-of-the-woods","998":"bolete","999":"ear","1000":"toilet tissue"};
153 | 
154 | $(document).ready(function(){
155 |   var arr = $.map(labels, function(el) { return el });
156 |   $( "#label" ).autocomplete({
157 |     source: arr
158 |   });
159 | });
160 | 
161 | var getLocation = function(href) {
162 |     var l = document.createElement("a");
163 |     l.href = href;
164 |     return l;
165 | };
166 | 
167 | function submitDemoImage(src){
168 |   var img_path = getLocation(src).pathname;
169 |   $("#inputImageAfterUpload").attr('src', img_path);
170 |   $("#label").val("");
171 |   $("#show-grad-cam-result").hide();
172 |   $("#ResultDiv").show();
173 |   scrollToElement($("#termstart"));
174 |   $('#comments').prepend('<br>');
175 |   $('#comments').prepend('<li>' + "Submitted demo image" + '</li>');
176 |   scrollToElement($("#ResultDiv"));
177 | }
178 | 
179 | function submitImageForClassification () {
180 |   var label = $("#label").val();
181 |   var label_id = null;
182 |   $.each(labels, function(index, value) {
183 |         if(value == label){
184 |           label_id = index;
185 |           return false;
186 |         }
187 | 
188 |         label_id = -1;
189 |   });
190 | 
191 |   console.log("The label id is " + label_id);
192 | 
193 |   var l = $("#inputImageAfterUpload")[0].src;
194 |   var img_path = getLocation(l).pathname;
195 | 
196 |   var data = { 'img_path': img_path, 'label': label_id};
197 | 
198 |   $.ajax({
199 |     type    : 'POST', // define the type of HTTP verb we want to use (POST for our form)
200 |     url     : '{% url 'classification' %}', // the url where we want to POST
201 |     data    : { 'img_path': img_path, 'csrfmiddlewaretoken': "{{ csrf_token }}", 'label': label_id, 'socketid': "{{socketid}}"} // our data object
202 |   }) // using the done promise callback
203 |   .done(function(response) {
204 |     console.log("Ajax call completes");
205 |   });
206 | }
207 | 
208 | $(document).ready(function(){
209 |   var ws_scheme = window.location.protocol == "https:" ? "wss" : "ws";
210 |   var socket = new WebSocket(ws_scheme + '://' + window.location.host + "/chat" + window.location.pathname);
211 |   console.log(socket);
212 |   socket.onopen = function() {
213 |       this.send("{{ socketid}}");
214 |       console.log("User connected to the socket with socketid "+ "{{socketid}}");
215 |   }
216 | 
217 |   socket.onmessage = function(response) {
218 |     console.log("Getting response from the worker.....");
219 |     console.log(JSON.parse(response.data));
220 | 
221 |     response = JSON.parse(response.data);
222 | 
223 |     if ("info" in response) {
224 |       console.log("Info is there as the key");
225 |     }
226 | 
227 |     if ("terminal" in response) {
228 |       $('#comments').prepend('<li>' + response['terminal'] + '</li>');
229 |     }
230 | 
231 |     if("result" in response){
232 | 
233 |       result = JSON.parse(response['result']);
234 |       console.log(result);
235 | 
236 |       console.log(result['classify_gcam_raw']);
237 |       console.log(result['classify_gb']);
238 |       console.log(result['classify_gb_gcam']);
239 |       console.log("Result key exists");
240 | 
241 |       $("#inputLabel").text(labels[result['label']]);
242 |       $("#predictedLabel").text(labels[result['pred_label']]);
243 |       $("#overImg1").attr("src", result['input_image']);
244 | 
245 |       var d = new Date();
246 |       $("#img1").attr("src",result['classify_gcam_raw']+"?"+d.getTime());
247 |       $("#img2").attr("src",result['classify_gb']+"?"+d.getTime());
248 |       $("#img3").attr("src",result['classify_gb_gcam']+"?"+d.getTime());
249 |       $("#show-grad-cam-result").show();
250 |       scrollToElement($("#show-grad-cam-result"));
251 |       $('#comments').prepend('<br>');
252 |     }
253 |   }
254 | });
255 | 
256 | function submitImageUsingUrl(){
257 |   var src = document.getElementById("image_url").value;
258 |   $('#comments').prepend('<br>');
259 |   $('#comments').prepend('<li>' + "Starting the Image Download process." + '</li>');
260 | 
261 |   scrollToElement($("#termstart"));
262 |   scrollToElement($("#resultHeading"));
263 | 
264 |   $.ajax({
265 |     type : "POST",
266 |     url  : '{% url 'upload-url' %}',
267 |     data : {'src': src  , 'socketid': "{{socketid}}", 'csrfmiddlewaretoken': '{{ csrf_token }}', type:"classification"}
268 |   }).done(function(data){
269 |     console.log(data);
270 |     $("#inputImageAfterUpload").attr('src', data["file_path"]);
271 |     $("#label").val("");
272 |     $("#show-grad-cam-result").hide();
273 |     $("#ResultDiv").show();
274 |   });
275 | };
276 | 
277 | $("#image_url").keydown(function(e){
278 |   if (e.which === 13){
279 |     $("#image_url_submit_btn").click();
280 |   }
281 | });
282 | 
283 | $('#image_url').on('paste', function(){
284 |   setTimeout(function(){
285 |     $("#image_url_submit_btn").click();
286 |   }, 0);
287 | });
288 | 
289 | </script>
290 | 
291 | <script type="text/javascript">
292 |   // Overriden 
293 |   Dropzone.options.myDropzone = {
294 |     autoProcessQueue: true,
295 |     uploadMultiple: false,
296 |     maxFiles: 10,
297 | 
298 |     init: function() {
299 |       var myDropzone = this;
300 |       this.hiddenFileInput.removeAttribute('multiple');
301 | 
302 |       myDropzone.on('success', function(file, data){
303 |         console.log(data);
304 |         $("#inputImageAfterUpload").attr('src', data['file_path']);
305 |         $("#show-grad-cam-result").hide();
306 |         $("#ResultDiv").show();
307 |         $("#demoType").val("uploadedImageType");
308 |         $("#label").val("");
309 |         scrollToElement($("#ResultDiv"));
310 |       });
311 |     }
312 |   }
313 | </script>
314 | 
315 | <script type="text/javascript">
316 | 
317 | </script>
318 | <br>
319 |   <div class="page-header">
320 |     <h2 id="resultHeading" class="center">Result of Grad-CAM for Classification</h2>
321 |   </div>
322 | <div id="ResultDiv" class="row" style="padding-bottom:50px; display:None;">
323 |   <div class="col-md-5" style="padding-bottom: 30px; clear: both;">
324 |     <img class="img-responsive" src="" style="height: 300px;" id="inputImageAfterUpload">
325 |   </div>
326 |   <div class="col-md-7" style="padding-bottom: 30px;">
327 |   <input id="label" class="form-control" name="label" placeholder="Start typing label...(Optional)" >
328 |     <br>
329 |     <input type="button" value="Submit" onclick="submitImageForClassification()" class="btn btn-primary">
330 |   </div>
331 | </div>
332 |   <div class="row demoImages" style="display:None;" id="show-grad-cam-result" >
333 | 
334 |   <div class="col-md-12 resultText">
335 |     <h3 style="display: inline;" align="center">Predicted Label : &nbsp;</h3>
336 |     <h3 id="predictedLabel" style="display: inline;" class="center"></h3>
337 |   </div>
338 | 
339 |     <div class="col-md-12 resultText">
340 |       <h3 style="display: inline;" class="center">Generating Grad-CAM visualizations for: &nbsp;</h3>
341 |       <h3 style="display: inline;" class="center" id="inputLabel"></h3> 
342 |     </div>
343 | 
344 |     <div class="col-md-4">
345 |       <img src="" class="col-md-12 finalImages" id="img2">
346 |         <p class="caption" style="font-size: 14px;" align="left">Guided Backprop</p>
347 |     </div>
348 |     <div class="col-md-4">
349 |       <img src="" class="over col-md-12 finalImages" id="overImg1" />
350 |       <img src="" class="under col-md-12 finalImages" id="img1">
351 |       <p class="caption" style="font-size: 14px;" align="left" id="gradCamCaption">Grad-CAM</p>
352 |     </div>
353 |     <div class="col-md-4">
354 |       <img src="" class="col-md-12 finalImages" id="img3">
355 |         <p class="caption" style="font-size: 14px; padding-left: 5px;" align="left">Guided Grad-CAM</p>
356 |     </div>
357 | </div>
358 | {% endblock %}
359 | 
360 | {% block credits %}
361 | <h2 class="page-header"> Credits </h2>
362 | <font size="4">
363 |   Built by <a href="http://github.com/DESHRAJ" target="_blank">@deshraj</a>
364 |   <br><br>
365 | </font>
366 | 
367 |  <br>
368 | </div>
369 | 
370 | </body>
371 | <script type="text/javascript" src="https://cdnjs.cloudflare.com/ajax/libs/reconnecting-websocket/1.0.0/reconnecting-websocket.min.js"></script>
372 | 
373 | </html>
374 | {% endblock %}
375 | 


--------------------------------------------------------------------------------
/grad_cam/templates/vqa/vqa.html:
--------------------------------------------------------------------------------
   1 | {% extends 'base.html' %}
   2 | 
   3 | 
   4 | {% block header_content %}
   5 | 
   6 | <a href="https://github.com/Cloud-CV/Grad-CAM" target="_blank"><img style="position: fixed; top: 0; right: 0; border: 0; z-index:2000;" src="https://camo.githubusercontent.com/365986a132ccd6a44c23a9169022c0b5c890c387/68747470733a2f2f73332e616d617a6f6e6177732e636f6d2f6769746875622f726962626f6e732f666f726b6d655f72696768745f7265645f6161303030302e706e67" alt="Fork me on GitHub" data-canonical-src="https://s3.amazonaws.com/github/ribbons/forkme_right_red_aa0000.png"></a>
   7 | 
   8 | <div class="container">
   9 |     <div class="page-header">
  10 |         <h1 align="center">Grad-CAM: Gradient-weighted Class Activation Mapping</h1>
  11 |         <br><h4>Grad-CAM highlights regions of the image the VQA model looks at while making predictions.</h4>
  12 |         <font size="4">
  13 |             <p>
  14 |                 Torch code for Grad-CAM is available <a href="//github.com/ramprs/grad-cam">here</a>. Browsers currently supported by the demo: Google Chrome, Mozilla Firefox.
  15 |             </p>
  16 |         </font>
  17 |     </div>
  18 | </div>
  19 | 
  20 | {% endblock %}
  21 | 
  22 | {% block form %}
  23 | <style type="text/css">
  24 | /* Caption text: large and bold. */
  25 | .caption {
  26 |   font-size: 18px !important;
  27 |   font-weight: bold;
  28 | }
  29 | 
  30 | #inputAnswer, #predictedAnswer {
  31 |   font-weight: bold;
  32 | }
  33 | 
  34 | /* Lower layer (z-index -1) for elements stacked beneath an .over element. */
  35 | .under {
  36 |   position: absolute;
  37 |   z-index: -1;
  38 | }
  39 | 
  40 | /* Upper layer (z-index 0), multiply-blended with whatever is drawn beneath it. */
  41 | .over {
  42 |   position: absolute;
  43 |   z-index: 0;
  44 |   mix-blend-mode: multiply;
  45 | }
  46 | 
  47 | /* Top padding equals the .finalImages height; presumably keeps the caption clear of the absolutely positioned images. */
  48 | #gradCamCaption {
  49 |   position: relative;
  50 |   padding-top: 350px;
  51 | }
  52 | 
  53 | .finalImages {
  54 |   width: 350px !important;
  55 |   height: 350px !important;
  56 |   padding: 6px;
  57 | }
  58 | 
  59 | .resultText {
  60 |   margin-bottom: 15px !important;
  61 | }
  62 | </style>
  63 | 
  64 | <div class="container">
  65 |   <div class="page-header">
  66 |     <h2 id="userImages">Try Grad-CAM on your images</h2>
  67 |   </div>
  68 |   {% block url_content %}
  69 |   {% include 'upload_image_url.html' %}
  70 |   {% endblock %}
  71 |   <div class="col-sm-12">
  72 |     <h3 align="center">OR</h3>
  73 |   </div>
  74 |     
  75 |   <div class="container">
  76 |     <form id="my-dropzone" method="post" class="dropzone" action="{% url "upload" %}" enctype="multipart/form-data">
  77 |     <input type="hidden" id="demoType" name="demo_type" value=""> 
  78 |     <input type="hidden" id="appType" name="type" value="vqa"> 
  79 |     {% csrf_token %}
  80 | 
  81 |     {% include 'form.html' %}
  82 |     </form>
  83 |   </div>
  84 | 
  85 | {% endblock %}
  86 | 
  87 | 
  88 | {% block result %}
  89 | 
  90 | 
  91 | <script type="text/javascript">
  92 | 
  93 | var answers = {
  94 |   "1":"yes",
  95 |   "2":"no",
  96 |   "3":"2",
  97 |   "4":"1",
  98 |   "5":"white",
  99 |   "6":"3",
 100 |   "7":"red",
 101 |   "8":"blue",
 102 |   "9":"4",
 103 |   "10":"green",
 104 |   "11":"black",
 105 |   "12":"yellow",
 106 |   "13":"brown",
 107 |   "14":"5",
 108 |   "15":"tennis",
 109 |   "16":"baseball",
 110 |   "17":"right",
 111 |   "18":"orange",
 112 |   "19":"bathroom",
 113 |   "20":"left",
 114 |   "21":"6",
 115 |   "22":"wood",
 116 |   "23":"frisbee",
 117 |   "24":"0",
 118 |   "25":"pink",
 119 |   "26":"pizza",
 120 |   "27":"gray",
 121 |   "28":"kitchen",
 122 |   "29":"skateboarding",
 123 |   "30":"cat",
 124 |   "31":"7",
 125 |   "32":"black and white",
 126 |   "33":"skiing",
 127 |   "34":"8",
 128 |   "35":"dog",
 129 |   "36":"surfing",
 130 |   "37":"water",
 131 |   "38":"snow",
 132 |   "39":"skateboard",
 133 |   "40":"10",
 134 |   "41":"wii",
 135 |   "42":"surfboard",
 136 |   "43":"man",
 137 |   "44":"kite",
 138 |   "45":"grass",
 139 |   "46":"purple",
 140 |   "47":"giraffe",
 141 |   "48":"eating",
 142 |   "49":"broccoli",
 143 |   "50":"stop",
 144 |   "51":"elephant",
 145 |   "52":"phone",
 146 |   "53":"apple",
 147 |   "54":"train",
 148 |   "55":"winter",
 149 |   "56":"umbrella",
 150 |   "57":"sheep",
 151 |   "58":"silver",
 152 |   "59":"horse",
 153 |   "60":"banana",
 154 |   "61":"motorcycle",
 155 |   "62":"9",
 156 |   "63":"laptop",
 157 |   "64":"beach",
 158 |   "65":"sunny",
 159 |   "66":"cake",
 160 |   "67":"brick",
 161 |   "68":"wine",
 162 |   "69":"woman",
 163 |   "70":"hat",
 164 |   "71":"12",
 165 |   "72":"bear",
 166 |   "73":"flowers",
 167 |   "74":"food",
 168 |   "75":"bananas",
 169 |   "76":"table",
 170 |   "77":"soccer",
 171 |   "78":"living room",
 172 |   "79":"female",
 173 |   "80":"bench",
 174 |   "81":"cow",
 175 |   "82":"bus",
 176 |   "83":"zebra",
 177 |   "84":"snowboarding",
 178 |   "85":"male",
 179 |   "86":"kites",
 180 |   "87":"11",
 181 |   "88":"hot dog",
 182 |   "89":"tennis racket",
 183 |   "90":"trees",
 184 |   "91":"helmet",
 185 |   "92":"night",
 186 |   "93":"fence",
 187 |   "94":"teddy bear",
 188 |   "95":"down",
 189 |   "96":"tile",
 190 |   "97":"tan",
 191 |   "98":"standing",
 192 |   "99":"camera",
 193 |   "100":"airport",
 194 |   "101":"outside",
 195 |   "102":"bat",
 196 |   "103":"bird",
 197 |   "104":"donut",
 198 |   "105":"cloudy",
 199 |   "106":"bed",
 200 |   "107":"christmas",
 201 |   "108":"zoo",
 202 |   "109":"tree",
 203 |   "110":"metal",
 204 |   "111":"cheese",
 205 |   "112":"20",
 206 |   "113":"bedroom",
 207 |   "114":"car",
 208 |   "115":"red and white",
 209 |   "116":"fork",
 210 |   "117":"palm",
 211 |   "118":"plane",
 212 |   "119":"cows",
 213 |   "120":"glass",
 214 |   "121":"bike",
 215 |   "122":"beer",
 216 |   "123":"chinese",
 217 |   "124":"suitcase",
 218 |   "125":"sitting",
 219 |   "126":"old",
 220 |   "127":"sandwich",
 221 |   "128":"carrots",
 222 |   "129":"boat",
 223 |   "130":"stripes",
 224 |   "131":"skis",
 225 |   "132":"blonde",
 226 |   "133":"glasses",
 227 |   "134":"15",
 228 |   "135":"up",
 229 |   "136":"chocolate",
 230 |   "137":"cell phone",
 231 |   "138":"13",
 232 |   "139":"nike",
 233 |   "140":"tv",
 234 |   "141":"walking",
 235 |   "142":"airplane",
 236 |   "143":"sand",
 237 |   "144":"chair",
 238 |   "145":"open",
 239 |   "146":"horses",
 240 |   "147":"birthday",
 241 |   "148":"mountains",
 242 |   "149":"fruit",
 243 |   "150":"fire hydrant",
 244 |   "151":"sunglasses",
 245 |   "152":"scissors",
 246 |   "153":"ocean",
 247 |   "154":"donuts",
 248 |   "155":"cold",
 249 |   "156":"wall",
 250 |   "157":"truck",
 251 |   "158":"tie",
 252 |   "159":"coffee",
 253 |   "160":"fall",
 254 |   "161":"many",
 255 |   "162":"girl",
 256 |   "163":"clear",
 257 |   "164":"usa",
 258 |   "165":"street",
 259 |   "166":"round",
 260 |   "167":"day",
 261 |   "168":"blue and white",
 262 |   "169":"toilet",
 263 |   "170":"plaid",
 264 |   "171":"snowboard",
 265 |   "172":"25",
 266 |   "173":"cooking",
 267 |   "174":"nothing",
 268 |   "175":"ski poles",
 269 |   "176":"wedding",
 270 |   "177":"wetsuit",
 271 |   "178":"knife",
 272 |   "179":"boy",
 273 |   "180":"ball",
 274 |   "181":"breakfast",
 275 |   "182":"sleeping",
 276 |   "183":"mirror",
 277 |   "184":"asian",
 278 |   "185":"africa",
 279 |   "186":"people",
 280 |   "187":"afternoon",
 281 |   "188":"toothbrush",
 282 |   "189":"plate",
 283 |   "190":"paper",
 284 |   "191":"on table",
 285 |   "192":"elephants",
 286 |   "193":"square",
 287 |   "194":"stone",
 288 |   "195":"mountain",
 289 |   "196":"window",
 290 |   "197":"dirt",
 291 |   "198":"couch",
 292 |   "199":"clock",
 293 |   "200":"city",
 294 |   "201":"no one",
 295 |   "202":"evening",
 296 |   "203":"14",
 297 |   "204":"zebras",
 298 |   "205":"happy",
 299 |   "206":"chicken",
 300 |   "207":"building",
 301 |   "208":"sun",
 302 |   "209":"backpack",
 303 |   "210":"police",
 304 |   "211":"playing wii",
 305 |   "212":"daytime",
 306 |   "213":"fish",
 307 |   "214":"luggage",
 308 |   "215":"flying kite",
 309 |   "216":"plastic",
 310 |   "217":"lot",
 311 |   "218":"spoon",
 312 |   "219":"on wall",
 313 |   "220":"park",
 314 |   "221":"england",
 315 |   "222":"remote",
 316 |   "223":"picture",
 317 |   "224":"oranges",
 318 |   "225":"brushing teeth",
 319 |   "226":"birds",
 320 |   "227":"restaurant",
 321 |   "228":"refrigerator",
 322 |   "229":"pine",
 323 |   "230":"50",
 324 |   "231":"watch",
 325 |   "232":"very",
 326 |   "233":"jeans",
 327 |   "234":"graffiti",
 328 |   "235":"brown and white",
 329 |   "236":"summer",
 330 |   "237":"rainy",
 331 |   "238":"background",
 332 |   "239":"talking on phone",
 333 |   "240":"sidewalk",
 334 |   "241":"safety",
 335 |   "242":"leaves",
 336 |   "243":"hay",
 337 |   "244":"concrete",
 338 |   "245":"carrot",
 339 |   "246":"16",
 340 |   "247":"motorcycles",
 341 |   "248":"bicycle",
 342 |   "249":"american",
 343 |   "250":"none",
 344 |   "251":"in water",
 345 |   "252":"child",
 346 |   "253":"umbrellas",
 347 |   "254":"overcast",
 348 |   "255":"gold",
 349 |   "256":"giraffes",
 350 |   "257":"field",
 351 |   "258":"wii remote",
 352 |   "259":"playing tennis",
 353 |   "260":"microwave",
 354 |   "261":"catcher",
 355 |   "262":"resting",
 356 |   "263":"floor",
 357 |   "264":"towel",
 358 |   "265":"rocks",
 359 |   "266":"ground",
 360 |   "267":"24",
 361 |   "268":"pepperoni",
 362 |   "269":"milk",
 363 |   "270":"london",
 364 |   "271":"coca cola",
 365 |   "272":"circle",
 366 |   "273":"books",
 367 |   "274":"30",
 368 |   "275":"heart",
 369 |   "276":"floral",
 370 |   "277":"checkered",
 371 |   "278":"vegetables",
 372 |   "279":"racket",
 373 |   "280":"church",
 374 |   "281":"apples",
 375 |   "282":"tomato",
 376 |   "283":"surfboards",
 377 |   "284":"middle",
 378 |   "285":"in air",
 379 |   "286":"double decker",
 380 |   "287":"vase",
 381 |   "288":"small",
 382 |   "289":"rainbow",
 383 |   "290":"person",
 384 |   "291":"on",
 385 |   "292":"light",
 386 |   "293":"flower",
 387 |   "294":"box",
 388 |   "295":"bag",
 389 |   "296":"pitcher",
 390 |   "297":"closed",
 391 |   "298":"bridge",
 392 |   "299":"shadow",
 393 |   "300":"rain",
 394 |   "301":"new york",
 395 |   "302":"sink",
 396 |   "303":"morning",
 397 |   "304":"clouds",
 398 |   "305":"bowl",
 399 |   "306":"gas",
 400 |   "307":"umpire",
 401 |   "308":"rock",
 402 |   "309":"parking meter",
 403 |   "310":"keyboard",
 404 |   "311":"taking picture",
 405 |   "312":"grazing",
 406 |   "313":"sandals",
 407 |   "314":"inside",
 408 |   "315":"100",
 409 |   "316":"striped",
 410 |   "317":"leather",
 411 |   "318":"bread",
 412 |   "319":"triangle",
 413 |   "320":"lights",
 414 |   "321":"drinking",
 415 |   "322":"baby",
 416 |   "323":"wire",
 417 |   "324":"reading",
 418 |   "325":"ketchup",
 419 |   "326":"blanket",
 420 |   "327":"salad",
 421 |   "328":"rope",
 422 |   "329":"china",
 423 |   "330":"sunset",
 424 |   "331":"purse",
 425 |   "332":"on left",
 426 |   "333":"computer",
 427 |   "334":"adidas",
 428 |   "335":"wilson",
 429 |   "336":"roses",
 430 |   "337":"road",
 431 |   "338":"18",
 432 |   "339":"jumping",
 433 |   "340":"dessert",
 434 |   "341":"canada",
 435 |   "342":"bears",
 436 |   "343":"river",
 437 |   "344":"hot dogs",
 438 |   "345":"goggles",
 439 |   "346":"young",
 440 |   "347":"texting",
 441 |   "348":"hotel",
 442 |   "349":"glove",
 443 |   "350":"dell",
 444 |   "351":"skate park",
 445 |   "352":"shorts",
 446 |   "353":"passenger",
 447 |   "354":"on plate",
 448 |   "355":"house",
 449 |   "356":"electric",
 450 |   "357":"desk",
 451 |   "358":"book",
 452 |   "359":"17",
 453 |   "360":"train station",
 454 |   "361":"soup",
 455 |   "362":"playing",
 456 |   "363":"photographer",
 457 |   "364":"oven",
 458 |   "365":"mouse",
 459 |   "366":"counter",
 460 |   "367":"cars",
 461 |   "368":"tracks",
 462 |   "369":"shirt",
 463 |   "370":"rose",
 464 |   "371":"red and yellow",
 465 |   "372":"rectangle",
 466 |   "373":"plant",
 467 |   "374":"olives",
 468 |   "375":"office",
 469 |   "376":"home",
 470 |   "377":"electricity",
 471 |   "378":"beige",
 472 |   "379":"windows",
 473 |   "380":"seagull",
 474 |   "381":"red and blue",
 475 |   "382":"guitar",
 476 |   "383":"gloves",
 477 |   "384":"star",
 478 |   "385":"spinach",
 479 |   "386":"shade",
 480 |   "387":"noon",
 481 |   "388":"large",
 482 |   "389":"delta",
 483 |   "390":"top",
 484 |   "391":"tennis ball",
 485 |   "392":"stop sign",
 486 |   "393":"smoke",
 487 |   "394":"wind",
 488 |   "395":"sky",
 489 |   "396":"sign",
 490 |   "397":"on ground",
 491 |   "398":"jacket",
 492 |   "399":"helmets",
 493 |   "400":"flying",
 494 |   "401":"branch",
 495 |   "402":"tabby",
 496 |   "403":"decoration",
 497 |   "404":"cutting board",
 498 |   "405":"bottom",
 499 |   "406":"tomatoes",
 500 |   "407":"tennis court",
 501 |   "408":"taking off",
 502 |   "409":"steam",
 503 |   "410":"stainless steel",
 504 |   "411":"sneakers",
 505 |   "412":"rug",
 506 |   "413":"lettuce",
 507 |   "414":"cup",
 508 |   "415":"basket",
 509 |   "416":"short",
 510 |   "417":"lemon",
 511 |   "418":"jet",
 512 |   "419":"indoors",
 513 |   "420":"head",
 514 |   "421":"both",
 515 |   "422":"wii controller",
 516 |   "423":"toy",
 517 |   "424":"stove",
 518 |   "425":"real",
 519 |   "426":"orange juice",
 520 |   "427":"oak",
 521 |   "428":"mustard",
 522 |   "429":"lab",
 523 |   "430":"clay",
 524 |   "431":"calm",
 525 |   "432":"blinds",
 526 |   "433":"white and blue",
 527 |   "434":"trash can",
 528 |   "435":"toilet paper",
 529 |   "436":"red and black",
 530 |   "437":"peppers",
 531 |   "438":"long",
 532 |   "439":"hot",
 533 |   "440":"hand",
 534 |   "441":"flag",
 535 |   "442":"fan",
 536 |   "443":"spring",
 537 |   "444":"ski",
 538 |   "445":"shoes",
 539 |   "446":"ponytail",
 540 |   "447":"fire",
 541 |   "448":"blue and yellow",
 542 |   "449":"40",
 543 |   "450":"water skiing",
 544 |   "451":"urban",
 545 |   "452":"swimming",
 546 |   "453":"school",
 547 |   "454":"samsung",
 548 |   "455":"protection",
 549 |   "456":"pictures",
 550 |   "457":"pepsi",
 551 |   "458":"parking",
 552 |   "459":"on desk",
 553 |   "460":"market",
 554 |   "461":"flip flops",
 555 |   "462":"tea",
 556 |   "463":"talking",
 557 |   "464":"suit",
 558 |   "465":"scarf",
 559 |   "466":"posing",
 560 |   "467":"polar",
 561 |   "468":"on bed",
 562 |   "469":"landing",
 563 |   "470":"english",
 564 |   "471":"diamond",
 565 |   "472":"collar",
 566 |   "473":"at camera",
 567 |   "474":"trash",
 568 |   "475":"raining",
 569 |   "476":"parrot",
 570 |   "477":"oval",
 571 |   "478":"laying down",
 572 |   "479":"good",
 573 |   "480":"bricks",
 574 |   "481":"boats",
 575 |   "482":"away",
 576 |   "483":"shelf",
 577 |   "484":"running",
 578 |   "485":"rice",
 579 |   "486":"pole",
 580 |   "487":"meat",
 581 |   "488":"lake",
 582 |   "489":"india",
 583 |   "490":"fridge",
 584 |   "491":"fork and knife",
 585 |   "492":"clothes",
 586 |   "493":"carpet",
 587 |   "494":"unknown",
 588 |   "495":"turkey",
 589 |   "496":"straw",
 590 |   "497":"playing frisbee",
 591 |   "498":"parasailing",
 592 |   "499":"lamp",
 593 |   "500":"cross",
 594 |   "501":"color",
 595 |   "502":"chef",
 596 |   "503":"bottle",
 597 |   "504":"boots",
 598 |   "505":"yellow and blue",
 599 |   "506":"strawberries",
 600 |   "507":"skateboards",
 601 |   "508":"polo",
 602 |   "509":"orange and white",
 603 |   "510":"one way",
 604 |   "511":"headphones",
 605 |   "512":"balance",
 606 |   "513":"strawberry",
 607 |   "514":"steel",
 608 |   "515":"p",
 609 |   "516":"octagon",
 610 |   "517":"military",
 611 |   "518":"headband",
 612 |   "519":"front",
 613 |   "520":"fries",
 614 |   "521":"dogs",
 615 |   "522":"dinner",
 616 |   "523":"bicycles",
 617 |   "524":"19",
 618 |   "525":"skateboarder",
 619 |   "526":"pillow",
 620 |   "527":"parking lot",
 621 |   "528":"parade",
 622 |   "529":"napkin",
 623 |   "530":"flying kites",
 624 |   "531":"cutting cake",
 625 |   "532":"cowboy",
 626 |   "533":"blender",
 627 |   "534":"bikes",
 628 |   "535":"23",
 629 |   "536":"shower",
 630 |   "537":"ring",
 631 |   "538":"pug",
 632 |   "539":"polar bear",
 633 |   "540":"on sidewalk",
 634 |   "541":"mercedes",
 635 |   "542":"japan",
 636 |   "543":"hydrant",
 637 |   "544":"granite",
 638 |   "545":"german",
 639 |   "546":"dirty",
 640 |   "547":"cutting",
 641 |   "548":"collie",
 642 |   "549":"carriage",
 643 |   "550":"asia",
 644 |   "551":"2 feet",
 645 |   "552":"tower",
 646 |   "553":"soda",
 647 |   "554":"reflection",
 648 |   "555":"outdoors",
 649 |   "556":"off",
 650 |   "557":"ford",
 651 |   "558":"dunkin donuts",
 652 |   "559":"duck",
 653 |   "560":"coke",
 654 |   "561":"clean",
 655 |   "562":"chain link",
 656 |   "563":"beef",
 657 |   "564":"above",
 658 |   "565":"wine glass",
 659 |   "566":"surf",
 660 |   "567":"spanish",
 661 |   "568":"pen",
 662 |   "569":"mcdonald's",
 663 |   "570":"indian",
 664 |   "571":"hit ball",
 665 |   "572":"fake",
 666 |   "573":"dusk",
 667 |   "574":"dress",
 668 |   "575":"chopsticks",
 669 |   "576":"bracelet",
 670 |   "577":"baseball bat",
 671 |   "578":"air",
 672 |   "579":"22",
 673 |   "580":"21",
 674 |   "581":"wool",
 675 |   "582":"w",
 676 |   "583":"ski lift",
 677 |   "584":"siamese",
 678 |   "585":"painting",
 679 |   "586":"onions",
 680 |   "587":"men",
 681 |   "588":"lighthouse",
 682 |   "589":"italy",
 683 |   "590":"ice cream",
 684 |   "591":"honda",
 685 |   "592":"gray and white",
 686 |   "593":"grapes",
 687 |   "594":"football",
 688 |   "595":"downhill",
 689 |   "596":"candles",
 690 |   "597":"bmw",
 691 |   "598":"200",
 692 |   "599":"white and red",
 693 |   "600":"watching",
 694 |   "601":"seagulls",
 695 |   "602":"red white and blue",
 696 |   "603":"ramp",
 697 |   "604":"poles",
 698 |   "605":"plants",
 699 |   "606":"owl",
 700 |   "607":"nowhere",
 701 |   "608":"no parking",
 702 |   "609":"net",
 703 |   "610":"necklace",
 704 |   "611":"lunch",
 705 |   "612":"kia",
 706 |   "613":"jump",
 707 |   "614":"ham",
 708 |   "615":"green and white",
 709 |   "616":"fishing",
 710 |   "617":"fire truck",
 711 |   "618":"ducks",
 712 |   "619":"bow",
 713 |   "620":"bacon",
 714 |   "621":"27",
 715 |   "622":"warm",
 716 |   "623":"tulips",
 717 |   "624":"slow",
 718 |   "625":"on floor",
 719 |   "626":"on counter",
 720 |   "627":"north",
 721 |   "628":"marble",
 722 |   "629":"in bowl",
 723 |   "630":"fedora",
 724 |   "631":"door",
 725 |   "632":"dock",
 726 |   "633":"big ben",
 727 |   "634":"batting",
 728 |   "635":"b",
 729 |   "636":"3 feet",
 730 |   "637":"van",
 731 |   "638":"toyota",
 732 |   "639":"terrier",
 733 |   "640":"tennis rackets",
 734 |   "641":"stuffed animal",
 735 |   "642":"riding",
 736 |   "643":"pot",
 737 |   "644":"pepper",
 738 |   "645":"on tracks",
 739 |   "646":"krispy kreme",
 740 |   "647":"fedex",
 741 |   "648":"dodgers",
 742 |   "649":"dining room",
 743 |   "650":"crosswalk",
 744 |   "651":"cigarette",
 745 |   "652":"big",
 746 |   "653":"basketball",
 747 |   "654":"bandana",
 748 |   "655":"bakery",
 749 |   "656":"back",
 750 |   "657":"art",
 751 |   "658":"visor",
 752 |   "659":"teddy bears",
 753 |   "660":"suitcases",
 754 |   "661":"sugar",
 755 |   "662":"stairs",
 756 |   "663":"sparrow",
 757 |   "664":"shoe",
 758 |   "665":"serve",
 759 |   "666":"public",
 760 |   "667":"paint",
 761 |   "668":"newspaper",
 762 |   "669":"monkey",
 763 |   "670":"low",
 764 |   "671":"face",
 765 |   "672":"candle",
 766 |   "673":"black and red",
 767 |   "674":"apartment",
 768 |   "675":"african",
 769 |   "676":"a",
 770 |   "677":"35",
 771 |   "678":"28",
 772 |   "679":"wet",
 773 |   "680":"united",
 774 |   "681":"tattoo",
 775 |   "682":"statue",
 776 |   "683":"starbucks",
 777 |   "684":"sprinkles",
 778 |   "685":"sailboat",
 779 |   "686":"parsley",
 780 |   "687":"on right",
 781 |   "688":"on grass",
 782 |   "689":"log",
 783 |   "690":"i don't know",
 784 |   "691":"hello kitty",
 785 |   "692":"go",
 786 |   "693":"giants",
 787 |   "694":"game",
 788 |   "695":"french",
 789 |   "696":"fast",
 790 |   "697":"eagle",
 791 |   "698":"children",
 792 |   "699":"cell phones",
 793 |   "700":"broken",
 794 |   "701":"bell",
 795 |   "702":"behind",
 796 |   "703":"batter",
 797 |   "704":"38",
 798 |   "705":"work",
 799 |   "706":"wooden",
 800 |   "707":"wicker",
 801 |   "708":"watermelon",
 802 |   "709":"washington",
 803 |   "710":"very tall",
 804 |   "711":"typing",
 805 |   "712":"tank top",
 806 |   "713":"t",
 807 |   "714":"surfer",
 808 |   "715":"snowy",
 809 |   "716":"sausage",
 810 |   "717":"red and green",
 811 |   "718":"phones",
 812 |   "719":"obama",
 813 |   "720":"nighttime",
 814 |   "721":"moving",
 815 |   "722":"ladder",
 816 |   "723":"hats",
 817 |   "724":"german shepherd",
 818 |   "725":"full",
 819 |   "726":"foil",
 820 |   "727":"fireplace",
 821 |   "728":"cross country",
 822 |   "729":"chihuahua",
 823 |   "730":"chicago",
 824 |   "731":"catching",
 825 |   "732":"c",
 826 |   "733":"55",
 827 |   "734":"yellow and red",
 828 |   "735":"working",
 829 |   "736":"white and black",
 830 |   "737":"vertical",
 831 |   "738":"vanilla",
 832 |   "739":"traveling",
 833 |   "740":"towels",
 834 |   "741":"tiger",
 835 |   "742":"stuffed animals",
 836 |   "743":"stick",
 837 |   "744":"south",
 838 |   "745":"sad",
 839 |   "746":"red sox",
 840 |   "747":"potatoes",
 841 |   "748":"playing baseball",
 842 |   "749":"pigeon",
 843 |   "750":"orioles",
 844 |   "751":"one on right",
 845 |   "752":"museum",
 846 |   "753":"medium",
 847 |   "754":"mask",
 848 |   "755":"magnets",
 849 |   "756":"little",
 850 |   "757":"horns",
 851 |   "758":"hair dryer",
 852 |   "759":"foreground",
 853 |   "760":"eggs",
 854 |   "761":"east",
 855 |   "762":"daisy",
 856 |   "763":"cumulus",
 857 |   "764":"cone",
 858 |   "765":"commercial",
 859 |   "766":"ceiling",
 860 |   "767":"cargo",
 861 |   "768":"bun",
 862 |   "769":"bucket",
 863 |   "770":"bar",
 864 |   "771":"women",
 865 |   "772":"white and brown",
 866 |   "773":"waves",
 867 |   "774":"united states",
 868 |   "775":"twin",
 869 |   "776":"tray",
 870 |   "777":"transportation",
 871 |   "778":"scooter",
 872 |   "779":"sandwiches",
 873 |   "780":"roman numerals",
 874 |   "781":"roman",
 875 |   "782":"pasta",
 876 |   "783":"navy",
 877 |   "784":"lion",
 878 |   "785":"library",
 879 |   "786":"laptops",
 880 |   "787":"high",
 881 |   "788":"harley",
 882 |   "789":"garbage",
 883 |   "790":"flags",
 884 |   "791":"cleaning",
 885 |   "792":"cats",
 886 |   "793":"butterfly",
 887 |   "794":"butter",
 888 |   "795":"bus stop",
 889 |   "796":"bulldog",
 890 |   "797":"basil",
 891 |   "798":"apron",
 892 |   "799":"60",
 893 |   "800":"vest",
 894 |   "801":"tail",
 895 |   "802":"swinging",
 896 |   "803":"sweater",
 897 |   "804":"subway",
 898 |   "805":"station",
 899 |   "806":"stars",
 900 |   "807":"smile",
 901 |   "808":"shrimp",
 902 |   "809":"shallow",
 903 |   "810":"runway",
 904 |   "811":"playing game",
 905 |   "812":"pineapple",
 906 |   "813":"pickles",
 907 |   "814":"pelican",
 908 |   "815":"peace",
 909 |   "816":"party",
 910 |   "817":"outdoor",
 911 |   "818":"on street",
 912 |   "819":"microphone",
 913 |   "820":"harley davidson",
 914 |   "821":"green and yellow",
 915 |   "822":"glazed",
 916 |   "823":"europe",
 917 |   "824":"driving",
 918 |   "825":"cookies",
 919 |   "826":"ceramic",
 920 |   "827":"cart",
 921 |   "828":"calico",
 922 |   "829":"bikini",
 923 |   "830":"32",
 924 |   "831":"10 feet",
 925 |   "832":"yellow and black",
 926 |   "833":"wild",
 927 |   "834":"uphill",
 928 |   "835":"tusks",
 929 |   "836":"tall",
 930 |   "837":"steak",
 931 |   "838":"sony",
 932 |   "839":"smiling",
 933 |   "840":"serving",
 934 |   "841":"sauce",
 935 |   "842":"railing",
 936 |   "843":"pork",
 937 |   "844":"polka dot",
 938 |   "845":"pigeons",
 939 |   "846":"pickle",
 940 |   "847":"parked",
 941 |   "848":"on tower",
 942 |   "849":"mushrooms",
 943 |   "850":"lots",
 944 |   "851":"leash",
 945 |   "852":"handle",
 946 |   "853":"halloween",
 947 |   "854":"hair",
 948 |   "855":"grill",
 949 |   "856":"golden retriever",
 950 |   "857":"goat",
 951 |   "858":"french fries",
 952 |   "859":"forward",
 953 |   "860":"egg",
 954 |   "861":"crane",
 955 |   "862":"cleats",
 956 |   "863":"cherry",
 957 |   "864":"chandelier",
 958 |   "865":"chain",
 959 |   "866":"camouflage",
 960 |   "867":"british airways",
 961 |   "868":"barn",
 962 |   "869":"bags",
 963 |   "870":"45",
 964 |   "871":"x",
 965 |   "872":"west",
 966 |   "873":"wave",
 967 |   "874":"watching tv",
 968 |   "875":"wagon",
 969 |   "876":"vases",
 970 |   "877":"straight",
 971 |   "878":"store",
 972 |   "879":"soccer ball",
 973 |   "880":"smoothie",
 974 |   "881":"selfie",
 975 |   "882":"racing",
 976 |   "883":"pizza cutter",
 977 |   "884":"pig",
 978 |   "885":"pier",
 979 |   "886":"piano",
 980 |   "887":"oil",
 981 |   "888":"nokia",
 982 |   "889":"modern",
 983 |   "890":"laying",
 984 |   "891":"kids",
 985 |   "892":"gothic",
 986 |   "893":"germany",
 987 |   "894":"garage",
 988 |   "895":"finch",
 989 |   "896":"empty",
 990 |   "897":"desert",
 991 |   "898":"deer",
 992 |   "899":"corn",
 993 |   "900":"cook",
 994 |   "901":"cones",
 995 |   "902":"circles",
 996 |   "903":"catching frisbee",
 997 |   "904":"candy",
 998 |   "905":"california",
 999 |   "906":"black and yellow",
1000 |   "907":"beard",
1001 |   "908":"barbed wire",
1002 |   "909":"army",
1003 |   "910":"all",
1004 |   "911":"adult",
1005 |   "912":"33",
1006 |   "913":"26",
1007 |   "914":"wires",
1008 |   "915":"water bottle",
1009 |   "916":"washington dc",
1010 |   "917":"waiting",
1011 |   "918":"toothbrushes",
1012 |   "919":"toaster oven",
1013 |   "920":"taxi",
1014 |   "921":"tag",
1015 |   "922":"suv",
1016 |   "923":"string",
1017 |   "924":"stool",
1018 |   "925":"setting",
1019 |   "926":"santa",
1020 |   "927":"power lines",
1021 |   "928":"poodle",
1022 |   "929":"pilot",
1023 |   "930":"owner",
1024 |   "931":"one on left",
1025 |   "932":"on building",
1026 |   "933":"italian",
1027 |   "934":"hungry",
1028 |   "935":"harness",
1029 |   "936":"half",
1030 |   "937":"france",
1031 |   "938":"fell",
1032 |   "939":"emirates",
1033 |   "940":"dry",
1034 |   "941":"dirt bike",
1035 |   "942":"controller",
1036 |   "943":"can",
1037 |   "944":"bull",
1038 |   "945":"british",
1039 |   "946":"bowling",
1040 |   "947":"bib",
1041 |   "948":"behind fence",
1042 |   "949":"baseball field",
1043 |   "950":"australia",
1044 |   "951":"asphalt",
1045 |   "952":"animals",
1046 |   "953":"44",
1047 |   "954":"29",
1048 |   "955":"2013",
1049 |   "956":"150",
1050 |   "957":"yellow and white",
1051 |   "958":"woods",
1052 |   "959":"volleyball",
1053 |   "960":"vegetable",
1054 |   "961":"traffic light",
1055 |   "962":"traffic",
1056 |   "963":"throwing",
1057 |   "964":"thin",
1058 |   "965":"swan",
1059 |   "966":"skull",
1060 |   "967":"skier",
1061 |   "968":"ship",
1062 |   "969":"san francisco",
1063 |   "970":"rural",
1064 |   "971":"polka dots",
1065 |   "972":"pitching",
1066 |   "973":"panda",
1067 |   "974":"out",
1068 |   "975":"nintendo",
1069 |   "976":"mozzarella",
1070 |   "977":"maple",
1071 |   "978":"man on right",
1072 |   "979":"man on left",
1073 |   "980":"m",
1074 |   "981":"lilies",
1075 |   "982":"kite flying",
1076 |   "983":"in field",
1077 |   "984":"ice",
1078 |   "985":"hospital",
1079 |   "986":"farm",
1080 |   "987":"do not enter",
1081 |   "988":"dark",
1082 |   "989":"daisies",
1083 |   "990":"curly",
1084 |   "991":"cupcake",
1085 |   "992":"cucumber",
1086 |   "993":"corner",
1087 |   "994":"clock tower",
1088 |   "995":"chips",
1089 |   "996":"cheesecake",
1090 |   "997":"chairs",
1091 |   "998":"center",
1092 |   "999":"cardboard",
1093 |   "1000":"business"
1094 | }
1095 | 
1096 |   $(document).ready(function(){
1097 |     var arr = $.map(answers, function(el) { return el });
1098 |     $( "#answer" ).autocomplete({
1099 |       source: arr
1100 |     });
1101 |   });
1102 | 
1103 |   // Overriden 
1104 |   Dropzone.options.myDropzone = {
1105 |     uploadMultiple: false,
1106 |     autoProcessQueue: true,
1107 |     maxFiles: 10,
1108 | 
1109 |     init: function() {
1110 |       var myDropzone = this;
1111 |       this.hiddenFileInput.removeAttribute('multiple');
1112 |       myDropzone.on('success', function(file, data){
1113 |         console.log(data);
1114 |         $("#inputImageAfterUpload").attr('src', data['file_path']);
1115 |         $("#ResultDiv").show();
1116 |         $("#show-grad-cam-result").hide();
1117 |         $("#demoType").val("uploadedImageType");
1118 |         $("#question").val("");
1119 |         $("#answer").val("");
1120 |         scrollToElement($("#termstart"));
1121 |         $('#comments').prepend('<br>');
1122 |         $('#comments').prepend('<li>' + "Image uploaded successfully..." + '</li>');
1123 |         scrollToElement($("#resultHeading"));
1124 |       });
1125 |     }
1126 |   }
1127 | </script>
1128 | 
1129 | <script type="text/javascript">
1130 | 
1131 | 
1132 | $(document).ready(function(){
1133 |   var ws_scheme = window.location.protocol == "https:" ? "wss" : "ws";
1134 |   var socket = new ReconnectingWebSocket(ws_scheme + '://' + window.location.host + "/chat" + window.location.pathname);
1135 | 
1136 |   socket.onopen = function() {
1137 |       console.log("User connected to the socket with socketid "+ "{{socketid}}");
1138 |       socket.send("{{ socketid }}");
1139 |   }
1140 | 
1141 |   socket.onmessage = function(response) {
1142 |     console.log("Getting response from the worker.....");
1143 |     console.log(JSON.parse(response.data));
1144 | 
1145 |     response = JSON.parse(response.data);
1146 | 
1147 |     if ("info" in response){
1148 |       console.log("Info is there as the key");
1149 |     }
1150 | 
1151 |     if ("terminal" in response) {
1152 |       $('#comments').prepend('<li>' + response['terminal'] + '</li>');
1153 |     }
1154 | 
1155 |     if("result" in response){
1156 | 
1157 |       result = JSON.parse(response['result']);
1158 |       console.log(result);
1159 |       var d = new Date();
1160 |       $("#overImg1").attr("src", result['input_image']);
1161 |       $("#img1").attr("src",result['vqa_gcam_raw']+"?"+d.getTime());
1162 |       $("#img2").attr("src",result['vqa_gb']+"?"+d.getTime());
1163 |       $("#img3").attr("src",result['vqa_gb_gcam']+"?"+d.getTime());
1164 |       $("#predictedAnswer").text(result['answer']);
1165 |       $("#inputAnswer").text(result['input_answer']);
1166 |       $("#show-grad-cam-result").show();
1167 |       scrollToElement($("#show-grad-cam-result"));
1168 |     }
1169 | 
1170 |   }
1171 | });
1172 | 
1173 |   var getLocation = function(href) {
1174 |       var l = document.createElement("a");
1175 |       l.href = href;
1176 |       return l;
1177 |   };
1178 | 
1179 | function submitDemoImage(src){
1180 |   $("#demoType").val("demoImageType");
1181 |   $("#show-grad-cam-result").hide();
1182 |   $("#question").val("");
1183 |   $("#answer").val("");
1184 |   var img_path = getLocation(src).pathname;
1185 |   $("#inputImageAfterUpload").attr('src', img_path);
1186 |   $("#ResultDiv").show();
1187 |   $('#comments').prepend('<br>');
1188 |   $('#comments').prepend('<li>' + "Submitted demo image" + '</li>');
1189 |   scrollToElement($("#termstart"));
1190 |   scrollToElement($("#resultHeading"));
1191 | }
1192 | 
1193 | function submitImageForVqa () {
1194 |   $("#show-grad-cam-result").hide();
1195 |   var question = $("#question").val();
1196 |   if (question){
1197 | 
1198 |   var answer = $("#answer").val();
1199 |   var demo_type = $("#demoType").val();
1200 |   var l = $("#inputImageAfterUpload")[0].src;
1201 |   var img_path = getLocation(l).pathname;
1202 | 
1203 |   $.ajax({
1204 |     type    : 'POST', // define the type of HTTP verb we want to use (POST for our form)
1205 |     url     : '{% url 'vqa' %}', // the url where we want to POST
1206 |     data    : { 'img_path': img_path, 'csrfmiddlewaretoken': '{{ csrf_token }}', 'question': question, 'answer': answer, 'socketid': "{{socketid}}"} // our data object
1207 |   })// using the done promise callback
1208 |   .done(function(response) {
1209 |     console.log("Ajax call completed successfully.")
1210 |   });
1211 |   }
1212 |   else{
1213 |     $('#comments').prepend('<li>' + "Enter the question to submit the job" + '</li>');
1214 |   }
1215 | }
1216 | 
1217 | function submitImageUsingUrl(){
1218 |   var src = document.getElementById("image_url").value;
1219 |   $('#comments').prepend('<br>');
1220 |   $('#comments').prepend('<li>' + "Starting the Image Download process." + '</li>');
1221 | 
1222 |   scrollToElement($("#termstart"));
1223 |   scrollToElement($("#resultHeading"));
1224 | 
1225 |   $.ajax({
1226 |     type : "POST",
1227 |     url  : '{% url 'upload-url' %}',
1228 |     data : {'src': src  , 'socketid': "{{socketid}}", 'csrfmiddlewaretoken': '{{ csrf_token }}', type:"vqa"}
1229 |   }).done(function(data){
1230 |     console.log(data);
1231 |     $("#inputImageAfterUpload").attr('src', data["file_path"]);
1232 |     $("#label").val("");
1233 |     $("#show-grad-cam-result").hide();
1234 |     $("#ResultDiv").show();
1235 |   });
1236 | };
1237 | 
1238 | $("#image_url").keydown(function(e){
1239 |   if (e.which === 13){
1240 |     $("#image_url_submit_btn").click();
1241 |   }
1242 | });
1243 | 
1244 | $('#image_url').on('paste', function(){
1245 |   setTimeout(function(){
1246 |     $("#image_url_submit_btn").click();
1247 |   }, 0);
1248 | });
1249 | 
1250 | </script>
1251 | <br>
1252 |   <div class="page-header">
1253 |     <h2 id="resultHeading" class="center">Result of Grad-CAM for Visual Question Answering</h2>
1254 |   </div>
1255 |   <br>
1256 | <div id="ResultDiv" class="row" style="display:None;">
1257 |   <div class="col-md-5" style="padding-bottom: 30px; clear: both;">
1258 |     <img class="img-responsive" src="" style="height: 300px;" id="inputImageAfterUpload">
1259 |   </div>
1260 |   <div class="col-md-7" style="padding-bottom: 30px;">
1261 |   <input id="question" class="form-control" name="question" placeholder="Enter the question" required><br>
1262 |   <input id="answer" class="form-control" name="answer" placeholder="Answer(Optional)"><br>
1263 |     <input type="button" value="Submit" onclick="submitImageForVqa()" class="btn btn-primary">
1264 |   </div>
1265 | </div>
1266 |   <div class="row demoImages" style="display:None;" id="show-grad-cam-result" > <!-- hidden until the websocket handler shows it -->
1267 |     <div class="col-md-12 resultText">
1268 |       <h3 style="display: inline;" align="center">Predicted Answer : &nbsp;</h3>
1269 |       <h3 id="predictedAnswer" style="display: inline;" class="center"></h3>
1270 |     </div>
1271 | 
1272 |     <div class="col-md-12 resultText">
1273 |       <h3 style="display: inline;" class="center">Generating Grad-CAM visualizations for: &nbsp;</h3>
1274 |       <h3 id="inputAnswer" style="display: inline;" align="center"></h3>
1275 |     </div>
1276 | 
1277 |   <div class="row">
1278 |     <!-- Result panels; the img src values are filled in by the websocket "result" handler. -->
1279 |     <div class="col-md-4">
1280 |       <img src="" class="col-md-12 finalImages" id="img2">
1281 |         <p class="caption" style="font-size: 14px;" align="left">Guided Backprop</p>
1282 |     </div>
1283 |     <div class="col-md-4">
1284 |       <img src="" class="over col-md-12 finalImages" id="overImg1" />
1285 |       <img src="" class="under col-md-12 finalImages" id="img1">
1286 |       <p class="caption" style="font-size: 14px;" align="left" id="gradCamCaption">Grad-CAM</p>
1287 |     </div>
1288 |     <div class="col-md-4">
1289 |       <img src="" class="col-md-12 finalImages" id="img3">
1290 |         <p class="caption" style="font-size: 14px; padding-left: 5px;" align="left">Guided Grad-CAM</p>
1291 |     </div>
1292 |   </div>
1293 |   </div>
1294 | {% endblock %}
1295 | 
1296 | {% block credits %}
1297 | <h2 class="page-header"> Credits </h2>
1298 | <font size="4">
1299 |   <a href="https://github.com/VT-vision-lab/VQA_LSTM_CNN">Code for VQA Model</a><br>
1300 |     Built by <a href="http://github.com/DESHRAJ" target="_blank">@deshraj</a><br>
1301 |   <br><br>
1302 | </font>
1303 | <br>
1304 |   </div>
1305 | 
1306 | </body>
1307 | <script type="text/javascript" src="https://cdnjs.cloudflare.com/ajax/libs/reconnecting-websocket/1.0.0/reconnecting-websocket.min.js"></script>
1308 | </html>
1309 | {% endblock %}
1310 | 


--------------------------------------------------------------------------------