├── .coveragerc
├── .gitignore
├── .travis.yml
├── LICENSE
├── README.md
├── experiments
    └── BigARTM_run_example.ipynb
├── library.md
├── presentation
    ├── article meeting.pdf
    ├── article meeting.tex
    ├── bibl.bib
    └── imgs
    │   ├── nade black.png
    │   ├── nade.png
    │   ├── rnn-encoder-decoder white.png
    │   └── rnn-encoder-decoder.png
├── requirements.txt
├── setup.py
└── snippet_ranger
    ├── __init__.py
    ├── __main__.py
    ├── data
        ├── matplotlib_dependent_reps.txt
        ├── numpy_dependent_reps.txt
        ├── pandas_dependent_reps.txt
        ├── tensorflow_dependent_reps.txt
        └── tqdm_dependent_reps.txt
    ├── librariesio_fetcher.py
    ├── model2
        ├── __init__.py
        ├── base_split.py
        ├── snippet2bow.py
        ├── snippet2df.py
        └── source2func.py
    ├── models
        ├── __init__.py
        └── snippet.py
    ├── pylib2uast.py
    ├── tests
        ├── __init__.py
        ├── data
        │   ├── snippet_test_repo.asdf
        │   ├── source_test_repo.asdf
        │   ├── test_lib.asdf
        │   ├── test_lib
        │   │   ├── __init__.py
        │   │   └── example.py
        │   ├── test_librariesio_data
        │   │   ├── projects-1.0.0-2017-06-15.csv
        │   │   └── repository_dependencies-1.0.0-2017-06-15.csv
        │   └── test_repo
        │   │   └── example.py
        ├── models.py
        ├── test_librariesio_fetcher.py
        ├── test_main.py
        ├── test_snippet.py
        ├── test_source2func.py
        └── test_utils.py
    └── utils.py


/.coveragerc:
--------------------------------------------------------------------------------
 1 | 
 2 | [run]
 3 | branch = True
 4 | source = snippet_ranger
 5 | 
 6 | [report]
 7 | exclude_lines =
 8 |     no cover
 9 |     raise NotImplementedError
10 |     if __name__ == "__main__":
11 | ignore_errors = True
12 | omit =
13 |     snippet_ranger/tests/*
14 | 


--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
 1 | # Mac specific
 2 | *.DS_Store
 3 | 
 4 | # Python
 5 | */__pycache__/*
 6 | *.pyc
 7 | 
 8 | # tex files
 9 | *.aux
10 | *.bbl
11 | *.blg
12 | *.fdb_latexmk
13 | *.fls
14 | *.log
15 | *.nav
16 | *.out
17 | *.snm
18 | *.synctex.gz
19 | *.toc
20 | *.vrb
21 | 
22 | # jupyter notebooks
23 | *.ipynb_checkpoints/
24 | 
25 | # pycharm
26 | .idea
27 | 
28 | # libraries.io data
29 | data/Libraries/*


--------------------------------------------------------------------------------
/.travis.yml:
--------------------------------------------------------------------------------
 1 | language: python
 2 | sudo: false
 3 | dist: trusty
 4 | services:
 5 | - docker
 6 | cache:
 7 |   directories:
 8 |   - "$HOME/.cache/pip"
 9 | _install: &_install
10 |   - gimme 1.8
11 |   - source ~/.gimme/envs/latest.env
12 |   - pip install --upgrade pip
13 |   - pip install -r requirements.txt codecov
14 |   - pip install -e .
15 | _coverage: &_coverage
16 |   - SCRIPT="coverage run --concurrency=multiprocessing -m unittest discover && coverage combine"
17 | matrix:
18 |   include:
19 |     - python: 3.4
20 |       env: *_coverage
21 |       install: *_install
22 |     - python: 3.5
23 |       env: *_coverage
24 |       install: *_install
25 |     - python: 3.6
26 |       env: SCRIPT="pep8 --max-line-length=99 ."
27 |       install: pip install pep8
28 |     - python: 3.6
29 |       env: *_coverage
30 |       install: *_install
31 |       after_success:
32 |         - codecov
33 |   fast_finish: true
34 | script:
35 | - (eval "$SCRIPT")
36 | notifications:
37 |   email: false
38 | 


--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
  1 |                                  Apache License
  2 |                            Version 2.0, January 2004
  3 |                         http://www.apache.org/licenses/
  4 | 
  5 |    TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
  6 | 
  7 |    1. Definitions.
  8 | 
  9 |       "License" shall mean the terms and conditions for use, reproduction,
 10 |       and distribution as defined by Sections 1 through 9 of this document.
 11 | 
 12 |       "Licensor" shall mean the copyright owner or entity authorized by
 13 |       the copyright owner that is granting the License.
 14 | 
 15 |       "Legal Entity" shall mean the union of the acting entity and all
 16 |       other entities that control, are controlled by, or are under common
 17 |       control with that entity. For the purposes of this definition,
 18 |       "control" means (i) the power, direct or indirect, to cause the
 19 |       direction or management of such entity, whether by contract or
 20 |       otherwise, or (ii) ownership of fifty percent (50%) or more of the
 21 |       outstanding shares, or (iii) beneficial ownership of such entity.
 22 | 
 23 |       "You" (or "Your") shall mean an individual or Legal Entity
 24 |       exercising permissions granted by this License.
 25 | 
 26 |       "Source" form shall mean the preferred form for making modifications,
 27 |       including but not limited to software source code, documentation
 28 |       source, and configuration files.
 29 | 
 30 |       "Object" form shall mean any form resulting from mechanical
 31 |       transformation or translation of a Source form, including but
 32 |       not limited to compiled object code, generated documentation,
 33 |       and conversions to other media types.
 34 | 
 35 |       "Work" shall mean the work of authorship, whether in Source or
 36 |       Object form, made available under the License, as indicated by a
 37 |       copyright notice that is included in or attached to the work
 38 |       (an example is provided in the Appendix below).
 39 | 
 40 |       "Derivative Works" shall mean any work, whether in Source or Object
 41 |       form, that is based on (or derived from) the Work and for which the
 42 |       editorial revisions, annotations, elaborations, or other modifications
 43 |       represent, as a whole, an original work of authorship. For the purposes
 44 |       of this License, Derivative Works shall not include works that remain
 45 |       separable from, or merely link (or bind by name) to the interfaces of,
 46 |       the Work and Derivative Works thereof.
 47 | 
 48 |       "Contribution" shall mean any work of authorship, including
 49 |       the original version of the Work and any modifications or additions
 50 |       to that Work or Derivative Works thereof, that is intentionally
 51 |       submitted to Licensor for inclusion in the Work by the copyright owner
 52 |       or by an individual or Legal Entity authorized to submit on behalf of
 53 |       the copyright owner. For the purposes of this definition, "submitted"
 54 |       means any form of electronic, verbal, or written communication sent
 55 |       to the Licensor or its representatives, including but not limited to
 56 |       communication on electronic mailing lists, source code control systems,
 57 |       and issue tracking systems that are managed by, or on behalf of, the
 58 |       Licensor for the purpose of discussing and improving the Work, but
 59 |       excluding communication that is conspicuously marked or otherwise
 60 |       designated in writing by the copyright owner as "Not a Contribution."
 61 | 
 62 |       "Contributor" shall mean Licensor and any individual or Legal Entity
 63 |       on behalf of whom a Contribution has been received by Licensor and
 64 |       subsequently incorporated within the Work.
 65 | 
 66 |    2. Grant of Copyright License. Subject to the terms and conditions of
 67 |       this License, each Contributor hereby grants to You a perpetual,
 68 |       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
 69 |       copyright license to reproduce, prepare Derivative Works of,
 70 |       publicly display, publicly perform, sublicense, and distribute the
 71 |       Work and such Derivative Works in Source or Object form.
 72 | 
 73 |    3. Grant of Patent License. Subject to the terms and conditions of
 74 |       this License, each Contributor hereby grants to You a perpetual,
 75 |       worldwide, non-exclusive, no-charge, royalty-free, irrevocable
 76 |       (except as stated in this section) patent license to make, have made,
 77 |       use, offer to sell, sell, import, and otherwise transfer the Work,
 78 |       where such license applies only to those patent claims licensable
 79 |       by such Contributor that are necessarily infringed by their
 80 |       Contribution(s) alone or by combination of their Contribution(s)
 81 |       with the Work to which such Contribution(s) was submitted. If You
 82 |       institute patent litigation against any entity (including a
 83 |       cross-claim or counterclaim in a lawsuit) alleging that the Work
 84 |       or a Contribution incorporated within the Work constitutes direct
 85 |       or contributory patent infringement, then any patent licenses
 86 |       granted to You under this License for that Work shall terminate
 87 |       as of the date such litigation is filed.
 88 | 
 89 |    4. Redistribution. You may reproduce and distribute copies of the
 90 |       Work or Derivative Works thereof in any medium, with or without
 91 |       modifications, and in Source or Object form, provided that You
 92 |       meet the following conditions:
 93 | 
 94 |       (a) You must give any other recipients of the Work or
 95 |           Derivative Works a copy of this License; and
 96 | 
 97 |       (b) You must cause any modified files to carry prominent notices
 98 |           stating that You changed the files; and
 99 | 
100 |       (c) You must retain, in the Source form of any Derivative Works
101 |           that You distribute, all copyright, patent, trademark, and
102 |           attribution notices from the Source form of the Work,
103 |           excluding those notices that do not pertain to any part of
104 |           the Derivative Works; and
105 | 
106 |       (d) If the Work includes a "NOTICE" text file as part of its
107 |           distribution, then any Derivative Works that You distribute must
108 |           include a readable copy of the attribution notices contained
109 |           within such NOTICE file, excluding those notices that do not
110 |           pertain to any part of the Derivative Works, in at least one
111 |           of the following places: within a NOTICE text file distributed
112 |           as part of the Derivative Works; within the Source form or
113 |           documentation, if provided along with the Derivative Works; or,
114 |           within a display generated by the Derivative Works, if and
115 |           wherever such third-party notices normally appear. The contents
116 |           of the NOTICE file are for informational purposes only and
117 |           do not modify the License. You may add Your own attribution
118 |           notices within Derivative Works that You distribute, alongside
119 |           or as an addendum to the NOTICE text from the Work, provided
120 |           that such additional attribution notices cannot be construed
121 |           as modifying the License.
122 | 
123 |       You may add Your own copyright statement to Your modifications and
124 |       may provide additional or different license terms and conditions
125 |       for use, reproduction, or distribution of Your modifications, or
126 |       for any such Derivative Works as a whole, provided Your use,
127 |       reproduction, and distribution of the Work otherwise complies with
128 |       the conditions stated in this License.
129 | 
130 |    5. Submission of Contributions. Unless You explicitly state otherwise,
131 |       any Contribution intentionally submitted for inclusion in the Work
132 |       by You to the Licensor shall be under the terms and conditions of
133 |       this License, without any additional terms or conditions.
134 |       Notwithstanding the above, nothing herein shall supersede or modify
135 |       the terms of any separate license agreement you may have executed
136 |       with Licensor regarding such Contributions.
137 | 
138 |    6. Trademarks. This License does not grant permission to use the trade
139 |       names, trademarks, service marks, or product names of the Licensor,
140 |       except as required for reasonable and customary use in describing the
141 |       origin of the Work and reproducing the content of the NOTICE file.
142 | 
143 |    7. Disclaimer of Warranty. Unless required by applicable law or
144 |       agreed to in writing, Licensor provides the Work (and each
145 |       Contributor provides its Contributions) on an "AS IS" BASIS,
146 |       WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
147 |       implied, including, without limitation, any warranties or conditions
148 |       of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
149 |       PARTICULAR PURPOSE. You are solely responsible for determining the
150 |       appropriateness of using or redistributing the Work and assume any
151 |       risks associated with Your exercise of permissions under this License.
152 | 
153 |    8. Limitation of Liability. In no event and under no legal theory,
154 |       whether in tort (including negligence), contract, or otherwise,
155 |       unless required by applicable law (such as deliberate and grossly
156 |       negligent acts) or agreed to in writing, shall any Contributor be
157 |       liable to You for damages, including any direct, indirect, special,
158 |       incidental, or consequential damages of any character arising as a
159 |       result of this License or out of the use or inability to use the
160 |       Work (including but not limited to damages for loss of goodwill,
161 |       work stoppage, computer failure or malfunction, or any and all
162 |       other commercial damages or losses), even if such Contributor
163 |       has been advised of the possibility of such damages.
164 | 
165 |    9. Accepting Warranty or Additional Liability. While redistributing
166 |       the Work or Derivative Works thereof, You may choose to offer,
167 |       and charge a fee for, acceptance of support, warranty, indemnity,
168 |       or other liability obligations and/or rights consistent with this
169 |       License. However, in accepting such obligations, You may act only
170 |       on Your own behalf and on Your sole responsibility, not on behalf
171 |       of any other Contributor, and only if You agree to indemnify,
172 |       defend, and hold each Contributor harmless for any liability
173 |       incurred by, or claims asserted against, such Contributor by reason
174 |       of your accepting any such warranty or additional liability.
175 | 
176 |    END OF TERMS AND CONDITIONS
177 | 
178 |    APPENDIX: How to apply the Apache License to your work.
179 | 
180 |       To apply the Apache License to your work, attach the following
181 |       boilerplate notice, with the fields enclosed by brackets "{}"
182 |       replaced with your own identifying information. (Don't include
183 |       the brackets!)  The text should be enclosed in the appropriate
184 |       comment syntax for the file format. We also recommend that a
185 |       file or class name and description of purpose be included on the
186 |       same "printed page" as the copyright notice for easier
187 |       identification within third-party archives.
188 | 
189 |    Copyright {yyyy} {name of copyright owner}
190 | 
191 |    Licensed under the Apache License, Version 2.0 (the "License");
192 |    you may not use this file except in compliance with the License.
193 |    You may obtain a copy of the License at
194 | 
195 |        http://www.apache.org/licenses/LICENSE-2.0
196 | 
197 |    Unless required by applicable law or agreed to in writing, software
198 |    distributed under the License is distributed on an "AS IS" BASIS,
199 |    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
200 |    See the License for the specific language governing permissions and
201 |    limitations under the License.
202 | 


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
  1 | ## Snippet ranger
  2 | 
  3 | [![Build Status](https://travis-ci.org/src-d/snippet-ranger.svg)](https://travis-ci.org/src-d/snippet-ranger) 
  4 | [![codecov](https://codecov.io/github/src-d/snippet-ranger/coverage.svg)](https://codecov.io/gh/src-d/snippet-ranger)
  5 | 
  6 | This tool is built on top of [ast2vec](https://github.com/src-d/ast2vec) Machine Learning models.
  7 | 
  8 | Provides API and tools to train and use models for ecosystem exploratory snippet mining.
  9 | It can help you learn new libraries faster and speed up coding.
 10 | The module allows you to train and use hierarchical topic model on top of
 11 | [babelfish](https://github.com/bblfsh) UAST for any library you want.
 12 | 
 13 | Now Snippet ranger is under **active development**.
 14 | 
 15 | ## Install
 16 | 
 17 | ```
 18 | pip3 install git+https://github.com/src-d/snippet-ranger
 19 | ```
 20 | 
 21 | ## Usage
 22 | 
 23 | The project exposes two interfaces: API and command line. The command line is
 24 | 
 25 | ```
 26 | snippet_ranger --help
 27 | ```
 28 | 
 29 | ## Pipeline for dataset collection
 30 | 
 31 | **1. Get list of dependent repositories.**
 32 | 
 33 | You should have the libraries.io (v1.0.0) dataset on your disk. 
 34 | You can download it here: https://libraries.io/data
 35 | 
 36 | Example for `numpy` library:
 37 | ```
 38 | snippet_ranger dependent_reps --librariesio_data ../libio/ -o . --libraries numpy:https://github.com/numpy/numpy
 39 | ```
 40 | 
 41 | There are examples of output files in the [data folder](https://github.com/src-d/snippet-ranger/tree/master/snippet_ranger/data). 
 42 | You can use them to try snippet_ranger without needing to download the libraries.io dataset.
 43 | 
 44 | **2. Clone repositories**
 45 | 
 46 | Use `ast2vec clone` for it. It requires enry. Install it via `ast2vec enry` if you do not have it.
 47 | Example:
 48 | ```
 49 | ast2vec clone --ignore -o data/repos/numpy -t 16 --languages Python --linguist ./enry numpy.txt
 50 | ```
 51 | 
 52 | You can skip the second step if you do not want to store repositories.
 53 | But enry installation is necessary.
 54 | 
 55 | **3. Convert to Source [modelforge](https://github.com/src-d/modelforge) models**
 56 | 
 57 | Use `ast2vec repos2source` for it.
 58 | You should have bblfsh server running. 
 59 | Please use v0.7.0 of the bblfsh server and v0.8.2 of the Python driver:
 60 | ```
 61 | BBLFSH_DRIVER_IMAGES="python=docker://bblfsh/python-driver:v0.8.2" docker run -e BBLFSH_DRIVER_IMAGES --rm --privileged -d -p 9432:9432 --name bblfsh bblfsh/server:v0.7.0 --log-level DEBUG
 62 | ```
 63 | 
 64 | Example:
 65 | ```
 66 | ast2vec repos2source -p 2 -t 8 --organize-files 2 -o data/sources $( find data/repos/numpy -maxdepth 1 -mindepth 1 -type d | xargs)
 67 | ```
 68 | If you skipped the second step, replace `data/repos/numpy` with `data/numpy_dependent_reps.txt`:
 69 | ```
 70 | ast2vec repos2source -p 2 -t 8 --organize-files 2 -o data/sources data/numpy_dependent_reps.txt
 71 | ```
 72 | 
 73 | Check [ast2vec topic modeling instructions](https://github.com/src-d/ast2vec/blob/master/topic_modeling.md#fetch-repositories-and-save-them-as-source-models)
 74 | to learn more about parameters.
 75 | 
 76 | **4. Get UAST for the library**
 77 | 
 78 | If you use a Python library, you should install it first to avoid losing autogenerated files. 
 79 | The UAST is built from the installation directory:
 80 | ```
 81 | snippet_ranger pylib2uast -p 1 -o ./data/libraries_uasts numpy
 82 | ```
 83 | 
 84 | You can use other languages which are supported by [bblfsh](https://doc.bblf.sh).
 85 | Just download the library sources and run `ast2vec repo2uast` for it.
 86 | 
 87 | **5. Extract snippets from Source model**
 88 | 
 89 | Use `snippet_ranger source2func` for it.
 90 | 
 91 | This command does the following:
 92 |   * Filter out files without library usage. 
 93 |   * Split files into functions, or take the full file if there are no functions (just a script).
 94 |   * Filter out split results without library function calls.
 95 | 
 96 | More ways of snippet extraction can be added later. 
 97 | 
 98 | Example:
 99 | ```
100 | snippet_ranger source2func -p 8 --library_name numpy --library_uast ./data/libraries_uasts/numpy.asdf -o ./data/funcs/numpy/ ./data/sources/numpy
101 | ```
102 | 
103 | If you get several `All functions are filtered and you get empty model.` errors, it is OK.
104 | 
105 | **6. Create vowpal wabbit dataset**
106 | 
107 | Here you have two ways. The default one is to use all simple identifiers as tokens for document modeling, 
108 | as described in points 3-4 of 
109 | [ast2vec topic modeling instructions](https://github.com/src-d/ast2vec/blob/master/topic_modeling.md).
110 | 
111 | The other one is to use only specific identifiers, which can be found in the library UAST.
112 | For now, it is only about function calls (fc).
113 | Use `snippet2fc_df` and `snippet2fc_bow` for the second approach.
114 | 
115 | Example:
116 | ```
117 | mkdir ./data/dfs_fc
118 | snippet_ranger snippet2fc_df  -p 8 --library_name numpy --library_uast ./data/libraries_uasts/numpy.asdf ./data/funcs/numpy/ ./data/dfs_fc/numpy.asdf
119 | snippet_ranger snippet2fc_bow -p 8 --df ./data/dfs_fc/numpy.asdf -v 1000000 ./data/funcs/numpy/ ./data/bows_fc/numpy
120 | ```
121 | 
122 | Then you need to do the same as in points 5-7 of 
123 | [ast2vec topic modeling](https://github.com/src-d/ast2vec/blob/master/topic_modeling.md):
124 | 
125 | ```
126 | python3 -m ast2vec join-bow -p 16 --bow ./data/bows_fc/numpy ./data/bows_fc/numpy.asdf
127 | python3 -m ast2vec bow2vw --bow ./data/bows_fc/numpy.asdf -o ./data/vowpal_wabbit/numpy_fc.txt
128 | ```
129 | 
130 | ## Fit shallow and hierarchical topic model
131 | 
132 | **Ongoing**
133 | 
134 | You should install BigARTM library. 
135 | Easy way is to use `ast2vec bigartm` command (not implemented yet).
136 | 
137 | You can check out the 
138 | [simple draft experiment using BigARTM Python API notebook](https://github.com/src-d/snippet-ranger/blob/master/experiments/BigARTM_run_example.ipynb).
139 | 
140 | ## Contributions
141 | [![PEP8](https://img.shields.io/badge/code%20style-pep8-orange.svg)](https://www.python.org/dev/peps/pep-0008/)
142 | 
143 | We use [PEP8](https://www.python.org/dev/peps/pep-0008/) with line length 99. All the tests
144 | must pass:
145 | 
146 | ```
147 | python3 -m unittest discover /path/to/snippet-ranger
148 | ```
149 | 
150 | ## License
151 | 
152 | Apache 2.0.
153 | 


--------------------------------------------------------------------------------
/library.md:
--------------------------------------------------------------------------------
 1 | 
 2 | # Topic modeling
 3 | 
 4 | ## BigARTM
 5 | * [BigARTM](http://bigartm.org) main site
 6 | * BigARTM [Tutorial on Probabilistic Topic Modeling: Additive Regularization for Stochastic Matrix Factorization](http://www.machinelearning.ru/wiki/images/1/1f/Voron14aist.pdf)
 7 | * BigARTM [Additive Regularization for Topic Models of Text Collections](http://www.machinelearning.ru/wiki/images/2/21/Voron14dan-eng.pdf)
 8 | * Main idea: Additive Regularization of Topic Models
 9 | * hARTM for hierarchical topic modeling. [presentation](http://www.machinelearning.ru/wiki/images/d/dc/2.Chirkova.pdf)
10 | 
11 | ## Other
12 | * [Collaborative deep learning for recommender systems](https://arxiv.org/pdf/1409.2944.pdf). [code](https://github.com/js05212/MXNet-for-CDL/blob/master/collaborative-dl.ipynb).
13 | > We generalize recent advances in deep learning from i.i.d. input to non-i.i.d. (CF-based) input and propose in this paper a hierarchical Bayesian model called collaborative deep learning (CDL), which jointly performs deep representation learning for the content information and collaborative filtering for the ratings (feedback) matrix. Extensive experiments on three real-world datasets from different domains show that CDL can significantly advance the state of the art.
14 | * [Scalable Deep Poisson Factor Analysis for Topic Modeling](http://proceedings.mlr.press/v37/gan15.pdf), [matlab code](https://github.com/zhegan27/dpfa_icml2015)
15 | 
16 | # DocNADE for document representation
17 | 
18 | * [DocNADE](http://proceedings.mlr.press/v15/larochelle11a/larochelle11a.pdf) and [post how to use it](http://blog.aylien.com/tensorflow-implementation-neural-autoregressive-topic-model-docnade/) to get document representation.
19 | 
20 | # Deep learning way
21 | 
22 | Another way to solve a similar task.
23 | 
24 | * [Deep API learning, Xiaodong Gu, Hongyu Zhang, Dongmei Zhang, and Sunghun Kim](https://arxiv.org/pdf/1605.08535v1.pdf)
25 |     > We propose DeepAPI, a deep learning based approach to generate API usage sequences for a given natural language query. DeepAPI adapts a neural language model named RNN Encoder-Decoder. It encodes a word sequence (user query) into a fixed-length context vector, and generates an API sequence based on the context vector. We also augment the RNN Encoder-Decoder by considering the importance of individual APIs. We empirically evaluate our approach with more than 7 million annotated code snippets collected from GitHub. The results show that our approach generates largely accurate API sequences and outperforms the related approaches.
26 | 
27 |     * RNN Encoder-Decoder
28 |         > the API learning problem as a machine translation problem: given a natural language query x = x1 , ..., xn where xt is a key word, we aim to translate it into an API sequence y = y1,...,ym where yt is an API
29 |     * Learns on 
30 |         > a corpus of annotated API sequences, i.e., ⟨API sequence, annotation⟩ pairs,
31 | 
32 | # Probabilistic way. Interesting Sequence Mining
33 | 
34 | * [MAST-group.](https://mast-group.github.io/) Probabilistic API Miner. [github](https://github.com/mast-group/api-mining), article [Parameter-Free Probabilistic API Mining across GitHub](https://arxiv.org/pdf/1512.05558.pdf).
35 |     > PAM is a near parameter-free probabilistic algorithm for mining the most interesting API patterns from a list of API call sequences. PAM largely avoids returning redundant and spurious sequences, unlike API mining approaches based on frequent pattern mining.
36 |     
37 |     > the hand-written examples actually have limited coverage of real API usages.
38 | 
39 | * [MAST-group.](https://mast-group.github.io/) Interesting Sequence Miner [github](https://github.com/mast-group/sequence-mining), article [A Subsequence Interleaving Model for Sequential Pattern Mining](https://arxiv.org/pdf/1602.05012.pdf)
40 |     > ISM is a novel algorithm that mines the subsequences that are most interesting under a probabilistic model of a sequence database. Our model is able to efficiently infer interesting subsequences directly from the database.
41 | 
42 | ### Related works from articles
43 | * MAPO
44 |     * Use code search engines for finding snippets.
45 |     * Clustering by method according to a distance metric, computed as an average of the similarity of method names, class names, and the called API methods themselves.
46 |     * For each cluster, MAPO mines the most frequent API calls using SPAM
47 | * UP-Miner
48 |     * extends MAPO
49 |     * use BIDE algorithm. It returns only the frequent sequences that have no subsequences with the same frequency 
50 |     * clustering distance metric based on the set of all API call sequence n-grams
51 | * SNIFF
52 |     * finds abstract code examples relevant to a natural language query expressing a desired task. 
53 |     * annotates publicly available source code with API documentation and the annotated code is then indexed for searching.
54 | 
55 | # Can be useful
56 | 
57 | * [Searching and Skimming: An Exploratory Study. Jamie Starke, Chris Luce, Jonathan Sillito University of Calgary
58 | Calgary, Canada](http://people.ucalgary.ca/~sillito/work/icsm2009.pdf)
59 |     > We conducted a formative study in which programmers were asked to perform corrective tasks to a system they were initially unfamiliar with. Our analysis focused specifically on how programmers decide what to search for, and how they decide which results are relevant to their task. Based on our analysis, we present five observations about our participant’s approach to finding information and some of the challenges they faced. We also discuss the implications these observations have for the design of source code search tools.
60 | 
61 | # Other articles
62 | 
63 | * [Code Search via Topic-Enriched Dependence Graph Matching](http://ink.library.smu.edu.sg/cgi/viewcontent.cgi?article=2396&context=sis_research)
64 |     > In this paper, we propose a semantic dependence search engine that integrates both kinds of techniques and can retrieve code snippets based on expressive user queries describing both topics and dependencies. Users can specify their search targets in a free form format describing desired topics (i.e., high-level semantic or functionality of the target code); a specialized graph query language allows users to describe low-level data and control dependencies in code and thus helps to refine the queries described in the free format. Our empirical evaluation on a number of software maintenance tasks shows that our search engine can efficiently locate desired code fragments accurately.
65 |     
66 |     * Use LDA and structural and semantic representations (system dependence graphs (SDGs)) of code.
67 |     * Has a special and overcomplicated query language
68 | 
69 | * [Improving Topic Model Source Code Summarization Paul W. McBurney, Cheng Liu, Collin McMillan, and Tim Weninger](https://www3.nd.edu/~cmc/papers/mcburney_icpcera_2014.pdf)
70 |     > In this paper, we present an emerging source code summarization technique that uses topic modeling to select keywords and topics as summaries for source code. Our approach organizes the topics in source code into a hierarchy, with more general topics near the top of the hierarchy. In this way, we present the software’s highest-level functionality first, before lower-level details. This is an advantage over previous approaches based on topic models, that only present groups of related keywords without a hierarchy. We conducted a preliminary user study that found our approach selects keywords and topics that the participants found to be accurate in a majority of cases.
71 | 
72 |     * Topic modeling for code summarization task. Task of creating a brief description of a section of source code.
73 |     
74 |     * It uses the HDTM algorithm, which analyses a graph of documents. 
75 |      > Our technique employs the HDTM algorithm described by Weninger et. al [29] to extract a topic hierarchy for a software system, then we display the hierarchy to programmers in a navigable web interface.
76 | 
77 |     * We can use this approach to extract names and keywords in themes
78 |     > Code summarization techniques based on topic models are described extensively in software engineering literature [19]. But as a recent study by Panichella et. al points out, these techniques often “have rather low performance when applied on software data” [19].
79 |     
80 | * [API usage pattern recommendation for software development](http://www.sciencedirect.com/science/article/pii/S0164121216301200)
81 |     > Our approach represents the source code as a network of object usages where an object usage is a set of method calls invoked on a single API class. We automatically extract usage patterns by clustering the data based on the co-existence relations between object usages. We conduct an empirical study using a corpus of 11,510 Android applications. The results demonstrate that our approach can effectively mine API usage patterns with high completeness and low redundancy. We observe 18% and 38% improvement on F-measure and response time respectively comparing to usage pattern extraction using frequent-sequence mining.
82 |     
83 |     > Specifically, we show that our approach outperforms the baseline in mining less frequently used API usage patterns. In addition, the ranking quality of our approach is better than Codota which is an online commercial usage pattern recommendation service for Android development.
84 |     
85 | * [Multimodal Code Search by Shaowei Wang](http://ink.library.smu.edu.sg/cgi/viewcontent.cgi?article=1118&context=etd_coll)
86 |     > In this dissertation, we propose a multimodal code search engine, which employs novel techniques that allow developers to effectively find code elements of interest by processing developers’ inputs in various input forms including free-form texts, an SQL-like domain-specific language, code examples, execution traces, and user feedback.  Our evaluations show that our approaches improve over state-of-the-art approaches significantly.
87 |     
88 |     It is a large piece of work with an interesting literature review. I think it can be helpful.
89 | 
90 | # Libs & Tools
91 | 
92 | * https://libraries.io/data
93 | 
94 |     Can be useful to get a list of libraries and the projects that use a specific library.
95 | 


--------------------------------------------------------------------------------
/presentation/article meeting.pdf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/src-d/snippet-ranger/06247e0492d59b859fe48dea0428171b252770ef/presentation/article meeting.pdf


--------------------------------------------------------------------------------
/presentation/article meeting.tex:
--------------------------------------------------------------------------------
  1 | \documentclass[10pt,aspectratio=1610]{beamer}
  2 | 
  3 | \usetheme[progressbar=frametitle,sectionpage=none,background=light]{metropolis}
  4 | 
  5 | %%––––––––––––––––––––––––––––––––––––––––––––––––
  6 | % Define styles
  7 | %%––––––––––––––––––––––––––––––––––––––––––––––––
  8 | 
  9 | %%––––––––––––––––––––––––––––––––––––––––––––––––
 10 | % Setting up colors
 11 | \definecolor{logoblue1}{RGB}{35, 121, 181}
 12 | \definecolor{logoblue2}{RGB}{88, 145, 202}
 13 | \definecolor{darkblue}{RGB}{25, 41, 54}
 14 | \definecolor{lightgrey}{RGB}{134, 143, 161}
 15 | \definecolor{greytext}{RGB}{102, 118, 128}
 16 | \definecolor{darktext}{RGB}{29, 43, 52}
 17 | \definecolor{green}{RGB}{0, 184, 44}
 18 | \definecolor{vividblue}{RGB}{15, 117, 183}
 19 | \definecolor{orange}{RGB}{246, 177, 70}
 20 | \definecolor{lightblue}{RGB}{244, 247, 251}
 21 | \definecolor{white}{RGB}{255, 255, 255}
 22 | \definecolor{red}{RGB}{183, 25, 29}
 23 | 
 24 | \setbeamercolor{frametitle}{bg=darkblue, fg=lightblue}
 25 | \setbeamercolor{background canvas}{bg=black}
 26 | \setbeamercolor{normal text}{fg=lightblue}
 27 | %%––––––––––––––––––––––––––––––––––––––––––––––––
 28 | 
 29 | %%––––––––––––––––––––––––––––––––––––––––––––––––
 30 | % Setting up fonts
 31 | \usepackage{lato}
 32 | \usepackage{roboto}
 33 | \usepackage{montserrat}
 34 | 
 35 | \setbeamerfont{frametitle}{family=\flafamily, size*={18}{18}}
 36 | % \setbeamerfont{footline}{family=\fontfamily{montserrat}}
 37 | % \setbeamerfont{normal text}{family=\roboto, size*={16}{18}}
 38 | 
 39 | % Setting up fonts for bibliography style
 40 | \setbeamerfont{bibliography entry author}{size=\small}
 41 | \setbeamerfont{bibliography entry title}{size=\small}
 42 | \setbeamerfont{bibliography entry location}{size=\small}
 43 | \setbeamerfont{bibliography entry note}{size=\small}
 44 | \setbeamerfont{bibliography item}{size=\small}
 45 | %%––––––––––––––––––––––––––––––––––––––––––––––––
 46 | 
 47 | \usepackage{appendixnumberbeamer}
 48 | 
 49 | \usepackage{booktabs}
 50 | \usepackage[scale=2]{ccicons}
 51 | 
 52 | \usepackage{pgfplots}
 53 | \usepgfplotslibrary{dateplot}
 54 | 
 55 | \usepackage{xspace}
 56 | \newcommand{\themename}{\textbf{\textsc{metropolis}}\xspace}
 57 | 
 58 | \usepackage{hyperref}
 59 | \hypersetup{
 60 |   colorlinks, 
 61 |   urlcolor=vividblue, 
 62 |   citecolor=lightblue, 
 63 |   linkcolor=lightblue
 64 | }
 65 | 
 66 | \setbeamertemplate{frame footer}{{\large\textcolor{logoblue1}{source}\textcolor{logoblue2}{\{d\}}}}
 67 | 
 68 | 
 69 | \title{Exploratory code search and snippet suggestion}
 70 | \subtitle{Article review}
 71 | \date{\today}
 72 | \author{Slavnov Konstantin\\konstantin@sourced.tech}
 73 | %\titlegraphic{\hfill\includegraphics[height=1.5cm]{logo.png}}
 74 | 
 75 | \begin{document}
 76 | 
 77 | \maketitle
 78 | 
 79 | \section{Introduction}
 80 | 
 81 |   
 82 | 
 83 | \begin{frame}[fragile]{Introduction}
 84 | 
 85 |   What is the \textbf{fastest} way to learn a new library? 
 86 | 
 87 |   New framework investigation ways:
 88 |   \begin{itemize}
 89 |     \item Documentation reading;
 90 |     \item Ask stackoverflow;
 91 |     \item \alert<2>{Just start to use it;}
 92 |     \item \alert<2>{Search code examples;}
 93 |     \item etc
 94 |   \end{itemize}
 95 | 
 96 |   \vfill
 97 |   \pause
 98 |   \textbf{Insights} from Searching and Skimming: An Exploratory Study \cite{starke2009searching}.
 99 | 
100 | \end{frame}
101 | \begin{frame}[fragile]{Ways to solve}
102 |   Let's build a machine learning assistant! 
103 | 
104 |   Approaches:
105 |   \begin{itemize}
106 |     \item \alert<2>{Topic modeling}
107 |     \item Hierarchical clustering
108 |     \item Deep learning way
109 |     \item Probabilistic way
110 |   \end{itemize}
111 | \end{frame}
112 | 
113 | 
114 | \section{Approaches}
115 | 
116 | \begin{frame}{Topic modeling}
117 |   Scheme
118 |   \begin{itemize}
119 |     \item Get a codebase of library usage
120 |     \item Build a hierarchical topic modeling for codebase
121 |     \item Show it for user API query
122 |     \item ???
123 |     \item PROFIT!
124 |   \end{itemize}
125 | \end{frame}
126 | 
127 | \begin{frame}{Flat topic model. Reminder}
128 |   \begin{itemize}
129 |     \item Documents $d \in D$
130 |     \item Tokens (words) $w \in W$
131 |     \item Topics $t \in T$
132 |     \item Document-token counters $n_{dw}$\\[3mm]
133 |   \end{itemize}
134 |   Flat topic model:\\[-1mm]
135 |   $$
136 |     P_{wd} = \dfrac{n_{dw}}{\sum_{w' \in W} n_{dw'}} = p(w \mid d) \approx \sum_{t \in T} p(w \mid t)\, p(t \mid d) = \sum_{t \in T} \phi_{wt} \theta_{td} = \{\Phi \Theta\}_{wd}
137 |   $$
138 |   or just
139 |   $$
140 |       P \approx \Phi \Theta
141 |   $$
142 |   \pause
143 |   Applying MLE:
144 |   $$
145 |     L(\Phi, \Theta) = \sum_{d\in D}
146 |       \sum_{w \in d} n_{dw} \ln 
147 |         \sum_t \phi_{wt} \theta_{td} \quad
148 |     \longrightarrow \max_{\Phi, \Theta \text{ -- stochastic}}
149 |   $$
150 | 
151 |   EM-algorithm is used for training.
152 | \end{frame}
153 | 
154 | \begin{frame}{Flat topic model.}
155 | 
156 |    \href{http://bigartm.org}{BigARTM} is a good tool for it.
157 | 
158 |   What we can do:
159 |   \begin{itemize}
160 |     \item Add regularisers: \quad 
161 |       $$ L(\Phi, \Theta) + R(\Phi, \Theta) 
162 |          \longrightarrow \max $$
163 |     \item Add modalities $m \in M$. 
164 |       $$W = \bigsqcup_{m \in M} W_m  \text{ and } \Phi = [\Phi_1 | \cdots | \Phi_n ]$$
165 |   \end{itemize}
166 |   \vspace{5mm}
167 |   \pause
168 |   Let's build \textbf{topic hierarchies}.
169 |   \begin{itemize}
170 |     \item Each level is a topic model.
171 |     \item Next level is learned with \textbf{specific regulariser} to find
172 | parent topics from previous level.
173 |   \end{itemize}
174 |   \vspace{5mm}
175 |   Check out \cite{vorontsov2014additive, vorontsov2014tutorial}.
176 | \end{frame}
177 | 
178 | \begin{frame}{Topic hierarchies.}
179 |   \begin{itemize}
180 |   \item \textbf{Learned} parent level: topics $a \in A$ with $\Phi' \in \mathbb{R}^{|W| \times |A|} $ and $\Theta' \in \mathbb{R}^{|A| \times |D|} $.
181 |   \item \textbf{To learn:} \\
182 |       \quad New level with topics $t \in T$ and $\Phi \in \mathbb{R}^{|W| \times |T|} $ and $\Theta \in \mathbb{R}^{|T| \times |D|} $.\\
183 |       \quad Parent-child relations $\Psi_{ta}$  -- $t$ is a child of $a$.
184 |   \pause
185 |   \item \textbf{Assumption:} parent topic is a mixture of children's: \\[2mm]
186 |   \qquad\qquad
187 |   $\displaystyle
188 |       p(w \mid a) \approx \sum_{t \in T} \; p(w \mid t) p(t \mid a)
189 |   $
190 |   \qquad or just \qquad
191 |   $
192 |     \Phi' \approx  \Phi \Psi
193 |   $
194 |   \pause
195 |   \item We can just add $|A|$ pseudo documents with $n_{wa}$ counters
196 |   \pause
197 |   \item The same point with $\Theta$ regularisation.
198 |   $
199 |   \Theta' \approx \tilde \Psi \Theta
200 |   $
201 |   It is like adding a new modality with tokens corresponding to $a \in A$.
202 |   \end{itemize}
203 | 
204 | \end{frame}
205 | 
206 | \begin{frame}{Hierarchy sparsing}
207 |   \textbf{The goal:}\quad Topics should have a small number of parents. \\[5mm]
208 | 
209 |   $p(a \mid t)$ should be sparse.
210 |   
211 |   Similar to LDA regulariser:
212 |   $$
213 |       R(\Psi) 
214 |         = \dfrac{1}{|A|} \sum_a \sum_t \ln p(a \mid t)
215 |         = \dfrac{1}{|A|} \sum_a \sum_t \ln 
216 |             \dfrac{\psi_{ta} \; p(a)}{\sum_{a'} \psi_{ta'} \; p(a')}
217 |   $$
218 | 
219 |   To apply it, we just need to update the M-step of the EM-algorithm.
220 | 
221 |   The same approach for $\Theta$ regularisation.
222 | \end{frame}
223 | 
224 | \begin{frame}{Hierarchical clustering approach}
225 |   Scheme
226 |   \begin{itemize}
227 |     \item Get a codebase of library usage
228 |     \item \alert<2>{Somehow get document representations in $\mathbb{R}^{d}$}
229 |     \item Build a hierarchical clusterization
230 |     \item Show it for user API query
231 |     \item ???
232 |     \item PROFIT!
233 |   \end{itemize}
234 | \end{frame}
235 | 
236 | \begin{frame}{DocNADE}
237 |   \begin{columns}[T,onlytextwidth]
238 |     \column{0.7\textwidth}
239 |       \textbf{NADE} -- Neural Autoregressive Distribution Estimator \cite{larochelle2011neural}.\\[2mm]
240 | 
241 |       Based on the fact that \qquad
242 |       $ \displaystyle
243 |         p(v) = 
244 |           \prod_{d=1}^D p(v_d \mid v_{<d})
245 |       $ \\[3mm]
246 |       We need to \textbf{parametrise} $p(v_d \mid v_{<d})$.\\[-3.5mm]
247 |       \pause
248 |       $$
249 |         p(v_d \mid v_{<d}) = \mathrm{sigm}(b_d + V_{d,:}h_d)
250 |       $$
251 |       $$
252 |         h_d = \mathrm{sigm}(c + W_{:, <d}v_{<d}).
253 |       $$
254 | 
255 |       $W, V, b, c$ -- parameters learned by MLE.
256 |       \pause
257 |       Softmax is used for vectors modeling:
258 |       $$
259 |         p(v_d \mid v_{<d}) = \dfrac{\exp(b_{w_d} + V_{w_d, :}h_d)}{\sum_w\exp(b_{w} + V_{w, :}h_d)}
260 |       $$
261 |       \pause
262 |       Trains on random permutations of the words in a document.
263 | 
264 |     \column{0.4\textwidth}
265 |       \vspace{7mm}
266 |       \quad\includegraphics[width=4.2cm]{./imgs/nade.png}
267 |   \end{columns}
268 |   Document representation is $h_T$ at the final timestep $T$.
269 | \end{frame}
270 | 
271 | \begin{frame}{Deep learning way}
272 |   \begin{itemize}
273 |     \item  \textbf{Aim:} Generate API sequences for a natural language query \cite{gu2016deepAPILearning}.
274 |     \item  \textbf{Method:} RNN encoder-decoder model for API learning.
275 |     \item  \textbf{Data:} annotated code snippets collected from GitHub.
276 |   \end{itemize}
277 |   \centering\includegraphics[width=12cm]{./imgs/rnn-encoder-decoder.png}
278 | \end{frame}
279 | 
280 | \begin{frame}{Deep learning way}
281 |   \textbf{Details:} 
282 |   \begin{itemize}
283 |     \item Run on sequences of API methods only.
284 |     \item RNN is \textbf{GRU}, Encoder is bidirectional with attention, 1000 hidden units, 120 dimension of word embeddings.
285 |     \item Beam search is used to generate several candidate API sequences to choose from.
286 |     \pause
287 |     \item IDF-based weights for API as a penalty term in \textbf{loss}:
288 |     $$
289 |       \mathrm{loss}_{it} = - \log p_\theta (y_{it} \mid x_i) - \lambda \log(\dfrac{N}{n_{t}})
290 |     $$
291 |     where\\
292 |     \quad $i$ is $i$-th train instance,\\
293 |     \quad $t$ is $t$-th target word in instance i,\\
294 |     \quad $N$ is the total number of API sequences,\\
295 |     \quad $n_t$ is the number of sequences where the API $t$ appears.\\
296 | 
297 |   \end{itemize}
298 | \end{frame}
299 | 
300 | \begin{frame}{Probabilistic way. Interesting Sequence Mining}
301 |   \begin{columns}[T,onlytextwidth]
302 |   \column{0.55\textwidth}
303 |       \textbf{Task:} get meaningful API patterns $\mathcal{I}$ \cite{fowkes2016ProbabilisticAPIMining, fowkes2016subsequenceMining}.\\[2mm]
304 | 
305 |       \textbf{Idea:} Use API patterns $\mathcal{I}$ to define a code probability in database $X$.\\[2mm]
306 | 
307 |       A pattern is an interesting code \textbf{subsequence}.\\[2mm]
308 |       \pause
309 |       Simplified model:
310 |       $$
311 |           p(X, z \mid \mathcal{I}) \sim \prod_{i \in \mathcal{I}\cap X} p_i^{z_i} (1 - p_i)^{1-z_i}
312 |       $$
313 | 
314 |       \vspace{3mm}
315 | 
316 |       {\small
317 |       $X$ -- code database,
318 | 
319 |       $\mathcal{I}$ -- set of API patterns,
320 | 
321 |       $p_i$ -- API pattern $i \in \mathcal{I}$ probability,
322 | 
323 |       $z_i$ -- indicator of including pattern into code (hidden).
324 |       }
325 |       \pause
326 |   \column{0.03\textwidth}
327 |   \column{0.03\textwidth}
328 |   Example:\\[2mm]
329 |   \column{0.35\textwidth}
330 |   \vspace{3mm}
331 | 
332 |     \setlength{\tabcolsep}{2pt}
333 |     \begin{tabular}{llllllll}
334 |                &   &   &   &   &   &    &     \\
335 |       $X =$ \{ & d & b & c & e & d & f  & f;   \\
336 |                & e & e & d & f & f & f; &     \\
337 |                & d & f & d & e & f & f; & \}  
338 |     \end{tabular}
339 |     
340 |     \vspace{5mm}
341 | 
342 |     \begin{tabular}{lccccc}
343 |       $\mathcal{I} =$ \{ & [ b c e ] & [ d f ] & [ d f ] & [ e f ] &\}\\[2mm]
344 |                          &     1     &    1    &    1    &    0    &  \\
345 |             $z:$         &     0     &    1    &    0    &    1    &  \\
346 |                          &     0     &    1    &    1    &    1    &  \\[2mm] 
347 |             $p_i:$       &    0.33   &    1    &   0.66  &   0.66  &  \\
348 | 
349 |     \end{tabular}
350 |   \end{columns}
351 | \end{frame}
352 | 
353 | \begin{frame}{Probabilistic way. Interesting Sequence Mining}
354 |   \begin{columns}[T,onlytextwidth]
355 |   \column{0.55\textwidth}
356 |    \textbf{Solver:} EM-algorithm.
357 | 
358 |    Iterate:
359 |    \begin{enumerate}
360 |       \item Structural-EM ($\mathcal{I}$ update)
361 |       \begin{enumerate}
362 |         \item Somehow generate candidate $S'$ 
363 |         \item See if quality increases
364 |       \end{enumerate} 
365 |       \item Hard-EM ($z$ and $p$ update)
366 |         \begin{enumerate}
367 |           \item Find patterns from $\mathcal{I}$ that were used to sample $X$ with greedy search.
368 |           $$
369 |             z = \arg\max_z \log p(z \mid p, \mathcal{I}; X)
370 |           $$ 
371 |           \item Update $p_i$ by averaging $z$.
372 |         \end{enumerate}
373 |   \end{enumerate}
374 |   \column{0.03\textwidth}
375 |   \column{0.03\textwidth}
376 |   Example:\\[2mm]
377 |   \column{0.35\textwidth}
378 |   \vspace{3mm}
379 | 
380 |     \setlength{\tabcolsep}{2pt}
381 |     \begin{tabular}{llllllll}
382 |                &   &   &   &   &   &    &     \\
383 |       $X =$ \{ & d & b & c & e & d & f  & f;   \\
384 |                & e & e & d & f & f & f; &     \\
385 |                & d & f & d & e & f & f; & \}  
386 |     \end{tabular}
387 |     
388 |     \vspace{5mm}
389 | 
390 |     \begin{tabular}{lccccc}
391 |       $\mathcal{I} =$ \{ & [ b c e ] & [ d f ] & [ d f ] & [ e f ] &\}\\[2mm]
392 |                          &     1     &    1    &    1    &    0    &  \\
393 |             $z:$         &     0     &    1    &    0    &    1    &  \\
394 |                          &     0     &    1    &    1    &    1    &  \\[2mm] 
395 |             $p_i:$       &     0.33  &    1    &   0.66  &   0.66  &  \\
396 | 
397 |     \end{tabular}
398 | \end{columns}
399 | \end{frame}
400 | 
401 | \begin{frame}{References. Links}
402 |   \begin{enumerate}
403 |     \item \href{http://www.machinelearning.ru/wiki/images/d/dc/2.Chirkova.pdf}{Hierarchical Multimodal Topic Modeling presentation. N. A. Chirkova and K. V. Vorontsov}
404 |     \item \href{http://bigartm.org}{BigARTM for Topic Modeling}
405 |     \item \href{http://blog.aylien.com/tensorflow-implementation-neural-autoregressive-topic-model-docnade/}{Post about DocNADE with implementation}
406 |     \item \href{https://github.com/mast-group/api-mining}{Probabilistic API Mining code}
407 | 
408 | 
409 |   \end{enumerate}
410 | 
411 | \end{frame}
412 | 
413 | \begin{frame}[allowframebreaks]{References. Articles}
414 | 
415 |   \setbeamertemplate{bibliography item}{\insertbiblabel}
416 |   \bibliography{bibl.bib}
417 |   \bibliographystyle{abbrv}
418 | 
419 | \end{frame}
420 | 
421 | \end{document}
422 | 


--------------------------------------------------------------------------------
/presentation/bibl.bib:
--------------------------------------------------------------------------------
 1 | @inproceedings{starke2009searching,
 2 |   title={Searching and skimming: An exploratory study},
 3 |   author={Starke, Jamie and Luce, Chris and Sillito, Jonathan},
 4 |   booktitle={Software Maintenance, 2009. ICSM 2009. IEEE International Conference on},
 5 |   pages={157--166},
 6 |   year={2009},
 7 |   organization={IEEE}
 8 | }
 9 | 
10 | @inproceedings{vorontsov2014tutorial,
11 |   title={Tutorial on probabilistic topic modeling: Additive regularization for stochastic matrix factorization},
12 |   author={Vorontsov, Konstantin and Potapenko, Anna},
13 |   booktitle={International Conference on Analysis of Images, Social Networks and Texts},
14 |   pages={29--46},
15 |   year={2014},
16 |   organization={Springer}
17 | }
18 | 
19 | @inproceedings{vorontsov2014additive,
20 |   title={Additive regularization for topic models of text collections},
21 |   author={Vorontsov, KV},
22 |   booktitle={Doklady Mathematics},
23 |   volume={89},
24 |   number={3},
25 |   pages={301--304},
26 |   year={2014},
27 |   organization={Springer}
28 | }
29 | 
30 | @inproceedings{larochelle2011neural,
31 |   title={The neural autoregressive distribution estimator},
32 |   author={Larochelle, Hugo and Murray, Iain},
33 |   booktitle={Proceedings of the Fourteenth International Conference on Artificial Intelligence and Statistics},
34 |   pages={29--37},
35 |   year={2011}
36 | }
37 | 
38 | 
39 | @inproceedings{gu2016deepAPILearning,
40 |   title={Deep API learning},
41 |   author={Gu, Xiaodong and Zhang, Hongyu and Zhang, Dongmei and Kim, Sunghun},
42 |   booktitle={Proceedings of the 2016 24th ACM SIGSOFT International Symposium on Foundations of Software Engineering},
43 |   pages={631--642},
44 |   year={2016},
45 |   organization={ACM}
46 | }
47 | 
48 | @inproceedings{fowkes2016ProbabilisticAPIMining,
49 |   title={Parameter-free probabilistic API mining across GitHub},
50 |   author={Fowkes, Jaroslav and Sutton, Charles},
51 |   booktitle={Proceedings of the 2016 24th ACM SIGSOFT International Symposium on Foundations of Software Engineering},
52 |   pages={254--265},
53 |   year={2016},
54 |   organization={ACM}
55 | }
56 | 
57 | @article{fowkes2016subsequenceMining,
58 |   title={A subsequence interleaving model for sequential pattern mining},
59 |   author={Fowkes, Jaroslav and Sutton, Charles},
60 |   journal={arXiv preprint arXiv:1602.05012},
61 |   year={2016}
62 | }
63 | 
64 | @inproceedings{wang2011code,
65 |   title={Code search via topic-enriched dependence graph matching},
66 |   author={Wang, Shaowei and Lo, David and Jiang, Lingxiao},
67 |   booktitle={Reverse Engineering (WCRE), 2011 18th Working Conference on},
68 |   pages={119--123},
69 |   year={2011},
70 |   organization={IEEE}
71 | }


--------------------------------------------------------------------------------
/presentation/imgs/nade black.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/src-d/snippet-ranger/06247e0492d59b859fe48dea0428171b252770ef/presentation/imgs/nade black.png


--------------------------------------------------------------------------------
/presentation/imgs/nade.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/src-d/snippet-ranger/06247e0492d59b859fe48dea0428171b252770ef/presentation/imgs/nade.png


--------------------------------------------------------------------------------
/presentation/imgs/rnn-encoder-decoder white.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/src-d/snippet-ranger/06247e0492d59b859fe48dea0428171b252770ef/presentation/imgs/rnn-encoder-decoder white.png


--------------------------------------------------------------------------------
/presentation/imgs/rnn-encoder-decoder.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/src-d/snippet-ranger/06247e0492d59b859fe48dea0428171b252770ef/presentation/imgs/rnn-encoder-decoder.png


--------------------------------------------------------------------------------
/requirements.txt:
--------------------------------------------------------------------------------
1 | pandas>=0.20
2 | ast2vec[tf]>=0.2.6-alpha
3 | 


--------------------------------------------------------------------------------
/setup.py:
--------------------------------------------------------------------------------
 1 | import sys
 2 | from setuptools import setup, find_packages
 3 | 
 4 | if sys.version_info < (3, 5, 0):
 5 |     typing = ["typing"]
 6 | else:
 7 |     typing = []
 8 | 
 9 | setup(
10 |     name="snippet_ranger",
11 |     description="Part of source{d}'s stack for machine learning on source code. Provides API and "
12 |                 "tools to train and use models for ecosystem exploratory snippet mining. "
13 |                 "It can help you to learn new libraries faster and speed up coding speed. "
14 |                 "The module allows you to train and use hierarchical topic model on top of "
15 |                 "babelfish UAST for any library you want.",
16 |     version="0.0.1-alpha",
17 |     license="Apache 2.0",
18 |     author="source{d}",
19 |     author_email="machine-learning@sourced.tech",
20 |     url="https://github.com/src-d/snippet-ranger",
21 |     download_url="https://github.com/src-d/snippet-ranger",
22 |     packages=find_packages(exclude=("snippet_ranger.tests",)),
23 |     keywords=["machine learning on source code", "github", "topic modeling",
24 |               "hierarchical topic modeling", "exploratory code search"],
25 |     entry_points={
26 |         "console_scripts": ["snippet_ranger=snippet_ranger.__main__:main"],
27 |     },
28 |     install_requires=["pandas>=0.20",
29 |                       "ast2vec>=0.2.6-alpha"] + typing,
30 |     package_data={"": ["LICENSE", "README.md"]},
31 |     classifiers=[
32 |         "Development Status :: 3 - Alpha",
33 |         "Environment :: Console",
34 |         "Intended Audience :: Developers",
35 |         "License :: OSI Approved :: Apache Software License",
36 |         "Operating System :: POSIX",
37 |         "Programming Language :: Python :: 3.4",
38 |         "Programming Language :: Python :: 3.5",
39 |         "Programming Language :: Python :: 3.6",
40 |         "Topic :: Software Development :: Libraries"
41 |     ]
42 | )
43 | 


--------------------------------------------------------------------------------
/snippet_ranger/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/src-d/snippet-ranger/06247e0492d59b859fe48dea0428171b252770ef/snippet_ranger/__init__.py


--------------------------------------------------------------------------------
/snippet_ranger/__main__.py:
--------------------------------------------------------------------------------
  1 | import argparse
  2 | import logging
  3 | import multiprocessing
  4 | import sys
  5 | 
  6 | from modelforge.logs import setup_logging
  7 | from ast2vec.__main__ import one_arg_parser
  8 | from ast2vec.repo2.base import DEFAULT_BBLFSH_TIMEOUT, DEFAULT_BBLFSH_ENDPOINTS
  9 | 
 10 | from snippet_ranger.model2.source2func import source2func_entry
 11 | from snippet_ranger.librariesio_fetcher import dependent_reps_entry, LibrariesIOFetcher
 12 | from snippet_ranger.model2.snippet2df import snippet2df_entry, snippet2fc_df_entry
 13 | from snippet_ranger.model2.snippet2bow import snippet2bow_entry, snippet2fc_bow_entry
 14 | from snippet_ranger.pylib2uast import pylib2uast_entry
 15 | 
 16 | 
 17 | def get_parser() -> argparse.ArgumentParser:
 18 |     """
 19 |     Create main parser.
 20 | 
 21 |     :return: Parser
 22 |     """
 23 |     parser = argparse.ArgumentParser()
 24 |     parser.add_argument("--log-level", default="INFO",
 25 |                         choices=logging._nameToLevel,
 26 |                         help="Logging verbosity.")
 27 | 
 28 |     # Create all common arguments
 29 | 
 30 |     model2input_arg = one_arg_parser(
 31 |         "input", help="Directory to scan recursively for asdf files.")
 32 | 
 33 |     process_arg = one_arg_parser(
 34 |         "-p", "--processes", type=int, default=0,
 35 |         help="Number of processes to use. 0 means CPU count.")
 36 | 
 37 |     filter_arg = one_arg_parser(
 38 |         "--filter", default="**/*.asdf", help="File name glob selector.")
 39 | 
 40 |     library_name_arg = one_arg_parser(
 41 |         "--library_name", help="Provide the name of the library.")
 42 | 
 43 |     library_uast_arg = one_arg_parser(
 44 |         "--library_uast", help="Provide the UAST model of the library. "
 45 |                                "You can build it via ast2vec repo2uast call.")
 46 | 
 47 |     tmpdir_arg = one_arg_parser(
 48 |         "--tmpdir", help="Store intermediate files in this directory instead of /tmp.")
 49 | 
 50 |     df_arg = one_arg_parser(
 51 |         "-d", "--df", dest="docfreq", help="URL or path to the document frequencies.")
 52 | 
 53 |     disable_overwrite_arg = one_arg_parser(
 54 |         "--disable-overwrite", action="store_false", default=True,
 55 |         dest="overwrite_existing",
 56 |         help="Specify if you want to disable overiting of existing models")
 57 | 
 58 |     vocabulary_size_arg = one_arg_parser(
 59 |         "-v", "--vocabulary-size", required=True, type=int,
 60 |         help="Vocabulary size: the tokens with the highest document frequencies will be picked.")
 61 | 
 62 |     bblfsh_args = argparse.ArgumentParser(add_help=False)
 63 |     bblfsh_args.add_argument(
 64 |         "--bblfsh", dest="bblfsh_endpoint",
 65 |         help="Babelfish server's endpoint, e.g. 0.0.0.0:9432. "
 66 |              "You can specify it directly or with BBLFSH_ENDPOINT environment variable. Otherwise "
 67 |              "default will be used (default: %s)" % DEFAULT_BBLFSH_ENDPOINTS)
 68 |     bblfsh_args.add_argument(
 69 |         "--timeout", type=int,
 70 |         help="Babelfish timeout - longer requests are dropped. "
 71 |              "You can specify it directly or with BBLFSH_TIMEOUT environment variable. Otherwise "
 72 |              "default will be used (default: %d sec)" % DEFAULT_BBLFSH_TIMEOUT)
 73 | 
 74 |     linguist_arg = one_arg_parser(
 75 |         "--linguist", help="Path to src-d/enry executable.")
 76 | 
 77 |     output_dir_arg_asdf = one_arg_parser(
 78 |         "-o", "--output", required=True, help="Output path where the .asdf will be stored.")
 79 | 
 80 |     process_1_2_arg = one_arg_parser(
 81 |         "-p", "--processes", type=int, default=2, dest="num_processes",
 82 |         help="Number of parallel processes to run. Since every process "
 83 |              "spawns the number of threads equal to the number of CPU cores "
 84 |              "it is better to set this to 1 or 2.")
 85 |     threads_arg = one_arg_parser(
 86 |         "-t", "--threads", type=int, default=multiprocessing.cpu_count(),
 87 |         help="Number of threads in the UASTs extraction process.")
 88 | 
 89 |     # Create and construct subparsers
 90 | 
 91 |     subparsers = parser.add_subparsers(help="Commands", dest="command")
 92 | 
 93 |     source2func_parser = subparsers.add_parser(
 94 |         "source2func",
 95 |         help="Decompose source model to functions were specified library is used. It makes model "
 96 |              "entry from each function that uses library and produce one Function model from one "
 97 |              "Source model, but it has more entries because of decomposition.",
 98 |         parents=[model2input_arg, filter_arg, process_arg, library_name_arg, library_uast_arg,
 99 |                  disable_overwrite_arg])
100 |     source2func_parser.set_defaults(handler=source2func_entry)
101 | 
102 |     source2func_parser.add_argument("-o", "--output", help="Where to write decomposed models.")
103 | 
104 |     dependent_reps_parser = subparsers.add_parser(
105 |         "dependent_reps",
106 |         help="Create a list of repositories, that are dependent from some specified libraries "
107 |              "using libraries.io dataset.")
108 |     dependent_reps_parser.set_defaults(handler=dependent_reps_entry)
109 |     group = dependent_reps_parser.add_argument_group("libraries")
110 |     group_ex = group.add_mutually_exclusive_group(required=True)
111 |     group_ex.add_argument(
112 |         "--libraries_json",
113 |         help="Provide the input file in json format. It should represent dictionary of library "
114 |              "name, url pairs. You can specify empty url if you are not sure. "
115 |              "Excludes --libraries flag.")
116 |     group_ex.add_argument(
117 |         "--libraries", nargs="+",
118 |         help="The name-url pair of the library in format <library name>:<library url>. You can "
119 |              "specify empty url if you are not sure. Excludes --libraries_json flag.")
120 |     dependent_reps_parser.add_argument(
121 |         "-o", "--output", required=True,
122 |         help="Where to write the list of dependent repos links. Save location for urls. "
123 |              "Specify folder if you have several libraries. Then urls will be stored in the file "
124 |              "<library name>.txt . You can specify file, then all urls will be saved in one file.")
125 |     dependent_reps_parser.add_argument(
126 |         "--librariesio_data", required=True,
127 |         help="Provide the path to libraries.io (v1.0.0) dataset. "
128 |              "You can download it from https://libraries.io/data.")
129 |     dependent_reps_parser.add_argument(
130 |         "--platform", default=LibrariesIOFetcher.DEFAULT_PLATFORM,
131 |         help="The name of package manager.")
132 | 
133 |     snippet2df_parser = subparsers.add_parser(
134 |         "snippet2df", help="Calculate identifier document frequencies from uasts for snippets. "
135 |                            "It counts each snippet separately.",
136 |         parents=[model2input_arg, filter_arg, tmpdir_arg, process_arg, disable_overwrite_arg])
137 |     snippet2df_parser.set_defaults(handler=snippet2df_entry)
138 |     snippet2df_parser.add_argument("output", help="Where to write document frequencies.")
139 | 
140 |     snippet2df_parser = subparsers.add_parser(
141 |         "snippet2fc_df", help="Calculate document frequencies from Function Calls in extracted "
142 |                               "snippets. It counts each snippet separately.",
143 |         parents=[model2input_arg, filter_arg, tmpdir_arg, process_arg, disable_overwrite_arg,
144 |                  library_name_arg, library_uast_arg])
145 |     snippet2df_parser.set_defaults(handler=snippet2fc_df_entry)
146 |     snippet2df_parser.add_argument("output", help="Where to write document frequencies.")
147 | 
148 |     snippet2bow_parser = subparsers.add_parser(
149 |         "snippet2bow", help="Calculate bag of words from Simple Identifiers in extracted uasts.",
150 |         parents=[model2input_arg, filter_arg, process_arg, df_arg, disable_overwrite_arg,
151 |                  vocabulary_size_arg])
152 |     snippet2bow_parser.set_defaults(handler=snippet2bow_entry)
153 |     snippet2bow_parser.add_argument(
154 |         "output", help="Where to write the merged nBOW.")
155 | 
156 |     snippet2fc_bow_parser = subparsers.add_parser(
157 |         "snippet2fc_bow", help="Calculate bag of words from Function Calls in extracted uasts.",
158 |         parents=[model2input_arg, filter_arg, process_arg, df_arg, disable_overwrite_arg,
159 |                  vocabulary_size_arg])
160 |     snippet2fc_bow_parser.set_defaults(handler=snippet2fc_bow_entry)
161 |     snippet2fc_bow_parser.add_argument(
162 |         "output", help="Where to write the merged nBOW.")
163 | 
164 |     snippet2fc_bow_parser = subparsers.add_parser(
165 |         "pylib2uast", help="Converts installed python library to UAST model.",
166 |         parents=[linguist_arg, output_dir_arg_asdf, bblfsh_args, process_1_2_arg,
167 |                  threads_arg, disable_overwrite_arg])
168 |     snippet2fc_bow_parser.set_defaults(handler=pylib2uast_entry)
169 |     snippet2fc_bow_parser.add_argument(
170 |         "input", nargs='+', help="library names.")
171 | 
172 |     return parser
173 | 
174 | 
def main():
    """
    Entry point of the command line interface.

    Builds the argument parser, parses the command line, replaces the log level name with its
    numeric value, configures logging and finally dispatches to the handler which the chosen
    subcommand registered through set_defaults(). When the parsed arguments carry no handler
    the usage message is printed instead.

    :return: Whatever the dispatched handler returns; None when only the usage is printed.
    """
    cli = get_parser()
    namespace = cli.parse_args()
    # Store the numeric level back on the namespace so that the handler sees the same value
    # which is passed to setup_logging().
    numeric_level = logging._nameToLevel[namespace.log_level]
    namespace.log_level = numeric_level
    setup_logging(numeric_level)
    if hasattr(namespace, "handler"):
        return namespace.handler(namespace)
    # No handler was set - there is nothing to run, so just show how to call the tool.
    cli.print_usage()
    return None
194 | 
if __name__ == "__main__":
    # Use the value returned by main() as the exit status of the process.
    raise SystemExit(main())
197 | 


--------------------------------------------------------------------------------
/snippet_ranger/data/tensorflow_dependent_reps.txt:
--------------------------------------------------------------------------------
   1 | https://github.com/jostep/tfmesos
   2 | https://github.com/Aufban/DeepLearning
   3 | https://github.com/williamleif/mgcn
   4 | https://github.com/mayoyamasaki/yanert
   5 | https://github.com/ttrine/speed
   6 | https://github.com/chernv/DeepSpeech
   7 | https://github.com/dominiek/transferflow
   8 | https://github.com/gvanhorn38/inception
   9 | https://github.com/Lab41/altair
  10 | https://github.com/au9ustine/nd009
  11 | https://github.com/jstnstwrt/tensor-flow-investigation
  12 | https://github.com/Libardo1/edward
  13 | https://github.com/softgearko/tensorflow-lstm-regression
  14 | https://github.com/joyhuang-machine-learning/VisualSearchServer
  15 | https://github.com/zsdonghao/TLayer
  16 | https://github.com/Ilyes-Hammadi/mnist-tensorflow
  17 | https://github.com/nicolas-ivanov/tf_seq2seq_chatbot
  18 | https://github.com/von8/Coursera-ML-AndrewNg
  19 | https://github.com/wacabanga/reverseflow
  20 | https://github.com/lev-kusanagi/cs224n
  21 | https://github.com/BuaaLearn/tensorflow-socher-ntn
  22 | https://github.com/waybarrios/nd101_project3
  23 | https://github.com/powernet-project/powernet
  24 | https://github.com/axeltidemann/propeller
  25 | https://github.com/everpeace/learn-tf
  26 | https://github.com/bienseo/tf-stanford-tutorials
  27 | https://github.com/lethehaiau/BiDAF
  28 | https://github.com/amitanalyste/aurelienGeron
  29 | https://github.com/sosoho/tensorflow-101
  30 | https://github.com/dhaneshr/tensorflow_cookbook
  31 | https://github.com/HubBucket-Team/tensorflow_cookbook
  32 | https://github.com/lingochamp/tensorflow-dkt
  33 | https://github.com/zenna/reverseflow
  34 | https://github.com/mikebarile/script-generator
  35 | https://github.com/mouradmourafiq/openrating
  36 | https://github.com/abhay1/tf_rundown
  37 | https://github.com/cleeea/nutracker
  38 | https://github.com/ClimbsRocks/auto_ml
  39 | https://github.com/sauloal/tf
  40 | https://github.com/VerdigrisTech/lambda-tensorflow-example
  41 | https://github.com/ardamavi/Digit-Classifier
  42 | https://github.com/mfigurnov/sact
  43 | https://github.com/cjackie/CRBM
  44 | https://github.com/nukui-s/supervisednmf
  45 | https://github.com/hzue/KDD-2017
  46 | https://github.com/lsshawn/handson-ml
  47 | https://github.com/rrozewsk/OurProject
  48 | https://github.com/Congo-Collaborations/synthesis-database-public
  49 | https://github.com/EdCo95/scientific-paper-summarisation
  50 | https://github.com/ericlavigne/CarND-Behavioral-Cloning
  51 | https://github.com/HubBucket-Team/deep-learning
  52 | https://github.com/AndrewLouw/NOC-S17-2-Intelligence-Learning
  53 | https://github.com/danlegion/ml-tv-script-generation
  54 | https://github.com/jrios6/AIND-Image-Classification
  55 | https://github.com/befelix/Safe-RL-Benchmark
  56 | https://github.com/chaoshangcs/ORGAN
  57 | https://github.com/TensorVision/TensorVision
  58 | https://github.com/Lewuathe/TensorFlow-StyleTransfer
  59 | https://github.com/tims/tensorflow-assay
  60 | https://github.com/keplr-io/quiver
  61 | https://github.com/RobColeman/data_science_and_engineering_ipython_notebooks
  62 | https://github.com/Thalidomide-d/handson-ml
  63 | https://github.com/ppwwyyxx/tensorpack
  64 | https://github.com/SavchenkoValeriy/rooster
  65 | https://github.com/hnarayanan/artistic-style-transfer
  66 | https://github.com/mailmevj/handson-ml
  67 | https://github.com/lywen52/segmentation_keras
  68 | https://github.com/karthickj25/deep-learning
  69 | https://github.com/rasmusbergpalm/normalization
  70 | https://github.com/pritansh/gunshot_detection
  71 | https://github.com/HimmelStein/neuronet
  72 | https://github.com/lihe1991/gcForest
  73 | https://github.com/BotBounty/tensorflow_cookbook
  74 | https://github.com/babky/deep-learning
  75 | https://github.com/seominjoon/vqa-binary
  76 | https://github.com/NYU-MLL/multiNLI
  77 | https://github.com/salceson/iwium
  78 | https://github.com/imindrajit/Udacity-DLND
  79 | https://github.com/YunLi1988/cs224n-SQuAD
  80 | https://github.com/JamesBrofos/Thor
  81 | https://github.com/gongyanchao/dog-project
  82 | https://github.com/flamoedo/TV-Script-Generation
  83 | https://github.com/jmmanso/deepseries
  84 | https://github.com/nelson-liu/bi-att-flow
  85 | https://github.com/voicy-ai/DialogStateTracking
  86 | https://github.com/Aqueelmiq/PredictUs
  87 | https://github.com/blackbetty/tensorflow-tut
  88 | https://github.com/hunkim/ReinforcementZeroToAll
  89 | https://github.com/armadill-odyssey/DeepDSP
  90 | https://github.com/PaddyT/waveform-asr
  91 | https://github.com/tifoit/bi-attention-flow
  92 | https://github.com/goldenberg/mnistified
  93 | https://github.com/cjxh/SeqGAN
  94 | https://github.com/suriyadeepan/n2n_dialog_system
  95 | https://github.com/iver56/image-regression
  96 | https://github.com/m-anish/autonomio
  97 | https://github.com/niilante/ReinforcementZeroToAll
  98 | https://github.com/Kindpire/machine-learning-final
  99 | https://github.com/Aetf/tensorflow-tbcnn
 100 | https://github.com/sosoho/BossSensor
 101 | https://github.com/ghostviper/handson-ml
 102 | https://github.com/Westermann/master_thesis
 103 | https://github.com/juliakreutzer/neural-slack-bot
 104 | https://github.com/SaeedNajafi/tf_chatbot_seq2seq_antilm
 105 | https://github.com/avinj/RNN
 106 | https://github.com/shintotm/tv-script-generation
 107 | https://github.com/hensden/Music-Genre-Classification
 108 | https://github.com/andhus/deep-dynamic-graphs
 109 | https://github.com/wishingwei/tensorlayer
 110 | https://github.com/nishant-jain-94/lstm-word-prediction
 111 | https://github.com/Ujjwal-9/DeepLearning-Challenges
 112 | https://github.com/Vincent-Ricardo/tensorlayer
 113 | https://github.com/yinnonsanders/talmudgenerator
 114 | https://github.com/tobiajo/yarntf
 115 | https://github.com/chrisburr/tensorprob
 116 | https://github.com/zabing/srez
 117 | https://github.com/tspannhw/tf-stanford-tutorials
 118 | https://github.com/timtwotoes/tv-script-generation
 119 | https://github.com/yoeo/guesslang
 120 | https://github.com/dennybritz/sentiment-analysis
 121 | https://github.com/313-Ventures/edward
 122 | https://github.com/maxbarkhausen/sparseflow
 123 | https://github.com/pcuellar/Deep-Learning-TensorFlow
 124 | https://github.com/vyraun/chatbot-MemN2N-tensorflow
 125 | https://github.com/dmcguckin/handson-ml
 126 | https://github.com/civisanalytics/muffnn
 127 | https://github.com/gulsunde/predict_stock_py
 128 | https://github.com/jshin49/cnn-cats-vs-dogs
 129 | https://github.com/Cyberfreakier/uda_tv_script_generator
 130 | https://github.com/fdalvi/cat-detector
 131 | https://github.com/astriker/DeepLearningZeroToAll
 132 | https://github.com/salathegroup/deep-height
 133 | https://github.com/korepwx/madoka
 134 | https://github.com/Scitator/rstools
 135 | https://github.com/nithishdivakar/Talks-and-Tutorials
 136 | https://github.com/fral92/TF_main_loop
 137 | https://github.com/OSSDC/pygta5
 138 | https://github.com/metaflow-ai/hive
 139 | https://github.com/jakebian/quiver
 140 | https://github.com/suntzualex/deep-learning
 141 | https://github.com/AlexFridman/visits-detector
 142 | https://github.com/pdwyys20/deep-learning
 143 | https://github.com/eklitzke/dnn-fastai-project
 144 | https://github.com/ml-lab/magenta_session
 145 | https://github.com/fonsecapeter/mnist
 146 | https://github.com/henriblancke/neural-chat
 147 | https://github.com/m516825/ADL2016
 148 | https://github.com/RamaneekGill/dicom-batch-loader
 149 | https://github.com/LqNoob/tensorflow_cookbook
 150 | https://github.com/apolloodilo/lisa-node
 151 | https://github.com/yebrahim/pydatalab
 152 | https://github.com/stompchicken/charpathy
 153 | https://github.com/jambobjambo/Firefly
 154 | https://github.com/ramshank/deep-learning
 155 | https://github.com/LKH-1/DeepLearningZeroToAll
 156 | https://github.com/sperazza/RnnTvScriptGeneration
 157 | https://github.com/paulhendricks/edward
 158 | https://github.com/allenai/bi-att-flow
 159 | https://github.com/mluszczyk/ml1617-mnist
 160 | https://github.com/LuWao/tf_unet
 161 | https://github.com/Liberus/MlHomework2
 162 | https://github.com/yaochengji/srez
 163 | https://github.com/formath/deep_recommend_system
 164 | https://github.com/LoveShun/Machine_Learning_Practice
 165 | https://github.com/dlohith/tf_seq2seq_chatbot
 166 | https://github.com/ilhamadun/skripsi-har
 167 | https://github.com/shaharelisha/music-generator
 168 | https://github.com/teffland/Relation-Extraction
 169 | https://github.com/Kensuke-Mitsuzawa/keras-codes
 170 | https://github.com/lukejduncan/tfimgtools
 171 | https://github.com/nihitx/tv-script-generation
 172 | https://github.com/wemakefocus/retrievalBasedModel
 173 | https://github.com/Slaski/Deep-Learning-Nanodegree---Generate-TV-Scripts
 174 | https://github.com/OSSDC/SimGAN
 175 | https://github.com/arnocandel/cvxflow
 176 | https://github.com/krish5989/google-sample-code
 177 | https://github.com/CarlSouthall/TFCS
 178 | https://github.com/ericzhao28/8thLightApp
 179 | https://github.com/ml-lab/deeppose_tf
 180 | https://github.com/hackliff/stacks
 181 | https://github.com/MarcoForte/AutoPortraitMatting
 182 | https://github.com/Liwmo/tv-script-generation
 183 | https://github.com/adrianjrandall/hyperledger-test
 184 | https://github.com/akaitsuki-ii/CS224n
 185 | https://github.com/rsanchezavalos/compranet
 186 | https://github.com/daoliker/deep_recommend_system
 187 | https://github.com/957805875/tensorlayer
 188 | https://github.com/clems4ever/tensorflow-wavenet
 189 | https://github.com/thiippal/tankbuster
 190 | https://github.com/exe1023/VIN-snake
 191 | https://github.com/alexfridlyand/SimGAN
 192 | https://github.com/samithaj/cs224n-1
 193 | https://github.com/zhuqiannan/tensorflow-socher-ntn
 194 | https://github.com/miku/nntour
 195 | https://github.com/ikhlestov/vision_networks
 196 | https://github.com/ml-lab/MuGo
 197 | https://github.com/luismayta/examples-tensorflow
 198 | https://github.com/waprin/cloudml-samples
 199 | https://github.com/Ujjwal-9/reinforcement-learning
 200 | https://github.com/handoolki/DeepLearningZeroToAll
 201 | https://github.com/Caffeinism/goodluck-tensor
 202 | https://github.com/apacha/MusicScoreClassifier
 203 | https://github.com/zentechthaingo/tf-stanford-tutorials
 204 | https://github.com/captify-alazorenko/RL_prod
 205 | https://github.com/kaiquewdev/palindromic_model
 206 | https://github.com/ligechina/bi-att-flow
 207 | https://github.com/KrUciFieR-Jr/Digit-Recognition-Using-TensorFlow
 208 | https://github.com/RajPratim21/thirdEye
 209 | https://github.com/dhaneshr/tf_unet
 210 | https://github.com/BenderV/self_driving_car
 211 | https://github.com/Gabriele91/DENN
 212 | https://github.com/DidelotK/deep_learning_vm_keras
 213 | https://github.com/munky69rock/mnist-demo
 214 | https://github.com/twiecki/edward
 215 | https://github.com/tkipf/gcn
 216 | https://github.com/fartashf/cleverhans
 217 | https://github.com/rizkiarm/LipNet
 218 | https://github.com/koreyoshi-mln/simple_captcha_inference_logon_demo_malina
 219 | https://github.com/cmondorf/tv-script-generation
 220 | https://github.com/steelcolosus/generate.tv.scripts
 221 | https://github.com/hammerlab/mhcflurry
 222 | https://github.com/DOsinga/reverse_image_search
 223 | https://github.com/wtmenten/oscars
 224 | https://github.com/nickjalbert/nickj-tensorflow-tutorial
 225 | https://github.com/gmlove/tf-stanford-tutorials
 226 | https://github.com/ic/gits
 227 | https://github.com/waybarrios/meetup_pythonbq_deeplearning
 228 | https://github.com/feynmanliang/bachbot
 229 | https://github.com/LinDong123a/2017-2018-
 230 | https://github.com/nyk510/bayesian_nn
 231 | https://github.com/tgsmith61591/smrt
 232 | https://github.com/BenGoBlue05/tv_script_generation
 233 | https://github.com/thiagoqd/udacity-deep-learning-foundations
 234 | https://github.com/ml-lab/kaggle-dstl
 235 | https://github.com/yiweishe/cs224n
 236 | https://github.com/menxia/udacity-deep-learning
 237 | https://github.com/jakesnell/myshkin
 238 | https://github.com/JianxiangFENG/Udacity_project
 239 | https://github.com/pratimaupadhyay02/thirdEye
 240 | https://gitlab.com/dm4562/hand_movement
 241 | https://github.com/efoley/deep-learning
 242 | https://github.com/jmcx/troll-api
 243 | https://github.com/smccumsey/poco-waggle-classroom
 244 | https://github.com/brannondorsey/midi-rnn
 245 | https://github.com/knathanieltucker/tf229
 246 | https://github.com/zxzhijia/pygta5
 247 | https://github.com/infpsyndrome/tf-stanford-tutorials
 248 | https://github.com/Josecamilo94/ImageTag
 249 | https://github.com/recnet/model
 250 | https://github.com/ml-lab/tensorflow-speech-recognition
 251 | https://github.com/geoffreysteven/aind2-cnn
 252 | https://github.com/googlecodelabs/nest-tensorflow
 253 | https://github.com/peterwilli/NameAI
 254 | https://github.com/technologiclee/tensorflow-socher-ntn
 255 | https://github.com/barty777/deep_humor
 256 | https://github.com/mgurdal/tensorflow-dersleri
 257 | https://github.com/daniele-sartiano/deepbets
 258 | https://github.com/ruoccoma/semsearch
 259 | https://github.com/saurabhmathur96/happy-and-you-know-it
 260 | https://github.com/zhanghaoyu1993/attention-sum-reader
 261 | https://github.com/kirtanechiron/etherbot
 262 | https://github.com/Arya-ai/braid
 263 | https://github.com/safer41/aKountable
 264 | https://github.com/niilante/DeepLearningZeroToAll
 265 | https://github.com/AlexRobson/GenAdvNetworks_MNIST
 266 | https://github.com/Kyate/text-to-image
 267 | https://github.com/ErickDiaz/TensorFlow_Lab
 268 | https://github.com/LulingHan/Diagnose-Transformer-DBN
 269 | https://github.com/jtoy/Email-Responder
 270 | https://github.com/aldopareja/deeprl-hw3
 271 | https://github.com/BotBounty/tf-stanford-tutorials
 272 | https://github.com/mxl1990/tensorflow-101
 273 | https://github.com/nwhidden/ND101-Deep-Learning
 274 | https://github.com/ibab/tensorprob
 275 | https://github.com/3D-CONV/tensorflow-101
 276 | https://github.com/mharrend/NNFlow
 277 | https://github.com/shareactorIO/source.ml
 278 | https://github.com/samithaj/lda2vec-tf
 279 | https://github.com/gelsto/SpeakEasy
 280 | https://github.com/mathur/voyager
 281 | https://github.com/hrishikeshvganu/clipper
 282 | https://github.com/dharness/sqwak
 283 | https://github.com/lopuhin/sensefreq
 284 | https://github.com/rkargon/Scene-Labeling
 285 | https://github.com/sgaurav/Seq2Seq_Upgrade_TensorFlow
 286 | https://github.com/VigneshSrinivasan10/interprettensor
 287 | https://github.com/liuchunhuahua/tensorflow-socher-ntn
 288 | https://github.com/databricks/spark-deep-learning
 289 | https://github.com/tentangdata/crane
 290 | https://github.com/linjian93/tensorflow_vo_new
 291 | https://github.com/Coder-Yu/deep_recommend_system
 292 | https://github.com/quangvu0702/TensorFlow-Tutorials
 293 | https://bitbucket.org/Sabeeka/conversation-tensorflow-generative-model
 294 | https://github.com/grahamaloo/oscars
 295 | https://github.com/elfklx/ner
 296 | https://github.com/yogurito/dlnd-intro-to-rnn
 297 | https://github.com/ontouchstart/binder-tensorflow
 298 | https://github.com/dask/dask-tensorflow
 299 | https://github.com/sunny8k/HelloWorld
 300 | https://github.com/hartikainen/cs224n
 301 | https://github.com/benkamphaus/keras-to-cortex
 302 | https://github.com/bigchange/cs224u
 303 | https://github.com/rdadolf/fathom
 304 | https://github.com/taki0112/DeepLearningZeroToAll
 305 | https://github.com/anhelus/convnet_tflow
 306 | https://github.com/dataPipelineAU/learningtensorflow_lessons
 307 | https://github.com/anuragmishracse/caption_generator
 308 | https://github.com/Satyaki0924/project_3_udacity
 309 | https://github.com/mainyaa/tensorflow_mnist_cloudml
 310 | https://github.com/eltonlaw/impyute
 311 | https://github.com/chusine/dlnd
 312 | https://github.com/yankov/netron
 313 | https://github.com/Andrew-Jiang/handson-ml
 314 | https://github.com/AasthaGupta/Fun-Lyrics
 315 | https://github.com/mariocespindola/FirstTensorFlowAdventure
 316 | https://github.com/perezmunoz/tianchiclassification
 317 | https://github.com/cangermueller/deepcpg
 318 | https://github.com/GeekLiB/facenet
 319 | https://github.com/miku/tensorflow_cookbook
 320 | https://github.com/jgensler8/my-tensorflow-journey
 321 | https://github.com/Mersaul4/project1
 322 | https://github.com/sugyan/tf-embedding-visualization-demo
 323 | https://github.com/Tesla7D/ATT_Demo
 324 | https://github.com/takahashik/docker-python-ml
 325 | https://github.com/datasart/BossSensor
 326 | https://github.com/mike121/nsynth-convert
 327 | https://github.com/webarmor/python-docs-samples
 328 | https://github.com/ml-lab/facenet
 329 | https://github.com/ml-lab/WaterNet
 330 | https://github.com/priyankakukreja267/scanner
 331 | https://github.com/ai2160/cs224u
 332 | https://github.com/dwgoon/deepfit
 333 | https://github.com/MarkDaoust/tfutils
 334 | https://github.com/ycguo028/zhusuan
 335 | https://github.com/zhwhong/awesome-deep-learning
 336 | https://github.com/askerry/dotfiles
 337 | https://github.com/ml-lab/seq2seq-2
 338 | https://github.com/DanburyAI/AUG2016-TensorFlow-Presentation-by-Andrew-Rib
 339 | https://github.com/GokuMohandas/Attentional-Interfaces-O-Reilly
 340 | https://github.com/jsmits/keras-inception-service
 341 | https://github.com/Vunb/tf_seq2seq_chatbot
 342 | https://github.com/ALISCIFP/Segmentation
 343 | https://github.com/Aaussh/Anna-KaRNNa
 344 | https://github.com/zabarnes/RattLe
 345 | https://github.com/Appsilon/hakathon-120416
 346 | https://github.com/yesup/tensorflow-serving-client-python
 347 | https://github.com/CNUPiedPiper/Recording
 348 | https://github.com/vyse8/neuralvqa3
 349 | https://github.com/elm200/recognize-dogs-and-cats
 350 | https://github.com/AshishBora/csgm
 351 | https://github.com/PMBio/deepcpg
 352 | https://github.com/alexklibisz/isbi-2012
 353 | https://github.com/andychisholm/mimo
 354 | https://github.com/peterlau123/facenet
 355 | https://github.com/gcmsrc/UDACITY-DLND-Text-LSTM
 356 | https://github.com/BotBounty/chatbot-retrieval
 357 | https://github.com/JarvisFei/my-first-neural-network
 358 | https://github.com/ankeshanand/neural-cryptography-tensorflow
 359 | https://github.com/raphael-sch/PythonPathLSTM
 360 | https://github.com/cuijianzhu/tinier-nn
 361 | https://github.com/dadaromeo/recsys-hpf
 362 | https://github.com/torsknod/python-keras-matplotlib-numpy-pyfftw-soundfile-theano-youtube_dl-docker
 363 | https://github.com/abhi1092/RNN_langauge_model_jokes_corpus
 364 | https://github.com/ml-lab/handson-ml
 365 | https://github.com/Kcrong/League-of-Fortuneteller
 366 | https://github.com/saitai0802/style-transfer-lstm
 367 | https://github.com/samuelzhouhe/mnist-cnn
 368 | https://github.com/chrisvmiller/analytics
 369 | https://github.com/eleijonmarck/lane-follower
 370 | https://github.com/CSweetBlue/Tensorflow-Music-Generation-ByWaves
 371 | https://github.com/antimon2/tfgraphviz
 372 | https://github.com/sunwillz/kdd2017
 373 | https://github.com/barefoothiker/webChronux
 374 | https://github.com/Semantics3/dist-keras
 375 | https://github.com/datankai/julieta-mi
 376 | https://github.com/ml-lab/sact
 377 | https://github.com/justrypython/captcha_break
 378 | https://github.com/mhbashari/machine-learning-snippets
 379 | https://github.com/Smeb/camino-ml
 380 | https://github.com/seominjoon/qrn
 381 | https://github.com/Amarjyotismruti/iLQR-REINFORCE-DAGGER
 382 | https://github.com/shinsec/deep-pwning
 383 | https://github.com/91Eric/DeepLearning
 384 | https://github.com/MaxDam/FenceIndoor
 385 | https://github.com/joaoalvarenga/namegenderclassifier
 386 | https://github.com/GoooQ/Deep-Learning-TensorFlow
 387 | https://github.com/StenaTransformations/namoline
 388 | https://github.com/LuanaLabs/keras
 389 | https://github.com/tnedev/tf_chatbot_seq2seq_antilm
 390 | https://github.com/SudalaiRajkumar/tf-stanford-tutorials
 391 | https://github.com/ObadaJabassini/arabic-text-to-speech
 392 | https://github.com/guillaume-chevalier/Hyperopt-Keras-CNN-CIFAR-100
 393 | https://github.com/sharadmv/deepx
 394 | https://github.com/seokjunbing/cs75
 395 | https://github.com/mkustermann/cs224n
 396 | https://github.com/random-forests/handson-ml
 397 | https://github.com/slsfcteam/kaggle-slsfc
 398 | https://github.com/yyao007/real-estate-analysis
 399 | https://github.com/ataber/Email-Responder
 400 | https://github.com/codekansas/seqgan-text-tensorflow
 401 | https://github.com/Yoctol/yoctol-keras-layer-zoo
 402 | https://github.com/liusiqi43/txt2calories
 403 | https://github.com/pika11/neural-network-tv-script-generation
 404 | https://github.com/UOADataScience/auckland-ai-meetup-x-triage
 405 | https://github.com/pnpnpn/keras-attic
 406 | https://github.com/brilee/MuGo
 407 | https://github.com/mtoo020/Medicai
 408 | https://github.com/elsclarysse/dlnd-tv-script-generation
 409 | https://github.com/sujithv28/Behavioral-Cloning-Hacktorial
 410 | https://github.com/vwms/Dockerfile-1
 411 | https://github.com/Arun-Singh-Chauhan-09/Chatbot_Retrival
 412 | https://github.com/dmitrime/convolutional-kanji
 413 | https://github.com/ml-lab/tensorflow_qrnn
 414 | https://github.com/RedSquadron544/rnn-classifier
 415 | https://github.com/GeekLiB/tensorflow-wavenet
 416 | https://github.com/marionleborgne/lstm-talk
 417 | https://github.com/KittenCN/pyBossSensor
 418 | https://github.com/zentechthaingo/facenet
 419 | https://github.com/ehfo0/artistic-style-transfer
 420 | https://github.com/hzue/kkbox-interview
 421 | https://github.com/Corey-Zumar/clipper-db-queries
 422 | https://github.com/Peanets/rl
 423 | https://github.com/frankgu/3d-DenseNet
 424 | https://github.com/mzp/arisu-in-fact
 425 | https://github.com/patwie-stuff/DeepSpeech
 426 | https://github.com/Libardo1/dask-tensorflow
 427 | https://github.com/dzorlu/parsecontent
 428 | https://github.com/vunb/tf_chatbot_seq2seq_antilm
 429 | https://github.com/JGrzybowski/vindinium-curses_ui
 430 | https://github.com/udacity/aind2-cnn
 431 | https://github.com/dolokov/SimGAN
 432 | https://github.com/kkuchar2/MgrAIC
 433 | https://github.com/khshim/tflemon
 434 | https://github.com/jshin49/Kaggle-Cat-vs-Dog-Tensorflow-CNN
 435 | https://github.com/shaunstanislaus/edward
 436 | https://github.com/AlgoDerm-dev/AlgoDerm-backend
 437 | https://github.com/nanounanue/rita-pipeline
 438 | https://github.com/MitPandya/Human-Action-Recognition-and-Video-Classification-using-SVM-and-Deep-CNN-
 439 | https://github.com/HubBuckets/handson-ml
 440 | https://github.com/welschma/NNFlow
 441 | https://github.com/RobSalzwedel/tf-stanford-tutorials
 442 | https://github.com/thanhson1085/Hello-AI
 443 | https://github.com/zhanghaoyu1993/RC-experiments
 444 | https://github.com/azavea/quiver
 445 | https://github.com/fundsan/classify
 446 | https://github.com/MichaelFeng87/Defect-Detection-in-Nanofibers-by-Image-Classification
 447 | https://github.com/FragLegs/nativeness
 448 | https://github.com/mzp/EagleJumpSystem
 449 | https://github.com/ZeroPage/machine-learning
 450 | https://github.com/yesup/tensorflow-exported-model-reader
 451 | https://github.com/taose-deeplearning/prediction_engine
 452 | https://github.com/ikhlestov/rbm_based_autoencoders_with_tensorflow
 453 | https://github.com/openai/baselines
 454 | https://github.com/pbalapra/sandbox
 455 | https://github.com/shotastage/prism
 456 | https://github.com/Joey-Liu/cs224n-2017-assignments
 457 | https://github.com/ReDeiPirati/tf-stanford-tutorials
 458 | https://gitlab.com/thanhngvpt/tensorflowlearning
 459 | https://github.com/danlegion/intro-to-tensorflow
 460 | https://github.com/vincentadam87/MFVI
 461 | https://github.com/artBoffin/GooeyBrain
 462 | https://github.com/jimfleming/LAPGAN
 463 | https://github.com/aajrami/DLND-TV-Script-Generation
 464 | https://github.com/hpssjellis/char-rnn-tensorflow-music-3dprinting
 465 | https://github.com/betterenvi/QA-rankit
 466 | https://github.com/ml-ai-nlp-ir/cvxflow
 467 | https://github.com/nengo/nengo_dl
 468 | https://github.com/Yum1ng/DCGAN-Image-Super-Resolution
 469 | https://github.com/BenJamesbabala/bachbot
 470 | https://github.com/rjpower/meridian
 471 | https://github.com/FragLegs/embedor
 472 | https://github.com/tongda/tf-stanford-tutorials
 473 | https://github.com/hunkim/DeepLearningZeroToAll
 474 | https://github.com/3D-CONV/DeepLearningZeroToAll
 475 | https://github.com/samjabrahams/taqtoe
 476 | https://github.com/Higgins2718/promethea2
 477 | https://github.com/tunamonster/CS224n_2017
 478 | https://github.com/tobegit3hub/deep_recommend_system
 479 | https://github.com/1heart/nnmf
 480 | https://github.com/iamsteveng/AIND-DogProject
 481 | https://github.com/Xanther/PyVison
 482 | https://github.com/shapeace/DeepLearningZeroToAll
 483 | https://github.com/danielshiferaw/Deep-Learning-Question-Answering-on-SQuAD
 484 | https://github.com/melindadevins/deep-learning
 485 | https://github.com/pandeydivesh15/AVSR-Deep-Speech
 486 | https://github.com/jdanbrown/pydatalab
 487 | https://github.com/fvisin/main_loop_tf
 488 | https://github.com/autonomio/full
 489 | https://github.com/gan3sh500/keras-lsgan
 490 | https://gitlab.com/hohohahalala/kkbox-interview
 491 | https://github.com/dmonllao/moodleinspire-python-backend
 492 | https://github.com/sandz-in/BICapstoneProject
 493 | https://github.com/ml-lab/twpca
 494 | https://github.com/iver56/cnn-clock
 495 | https://github.com/n-kats/tf-gogh
 496 | https://github.com/Panaetius/IP5
 497 | https://github.com/307509256/chatbot-retrieval
 498 | https://github.com/selimyoussry/datadriven-blood
 499 | https://github.com/nanfengpo/crack_captcha
 500 | https://github.com/MahdiNazemi/edward
 501 | https://github.com/eou-mrm/pipeline
 502 | https://github.com/rupanroy6/handson-ml
 503 | https://github.com/ml-lab/dlbench
 504 | https://github.com/Mvrm/deep-learning-workshop
 505 | https://github.com/eklitzke/tf-slice
 506 | https://github.com/andrewwilson/mlnd_capstone
 507 | https://github.com/tomasgarzon/webinar-machine-learning
 508 | https://github.com/dhaneshr/handson-ml
 509 | https://github.com/tattn/tensorflow-chatbot-jp
 510 | https://github.com/jacobperricone/cs224n
 511 | https://github.com/ShobhitMaheshwari/psl
 512 | https://github.com/bogdan-kulynych/textfool
 513 | https://github.com/yuhui-lin/web_page_classification
 514 | https://github.com/brianmhiggins/cs224-assign3
 515 | https://github.com/hduongtrong/lstmroots
 516 | https://github.com/cahya-wirawan/opentc
 517 | https://github.com/dailysoap/cs224n
 518 | https://github.com/overkillen/PitE-Forecast-Currency
 519 | https://github.com/msankar/convolutionNeuralNetworkProject
 520 | https://github.com/Praveen-Gupta/handson-ml
 521 | https://github.com/utsavgarg/IDE
 522 | https://github.com/apolloswisdom/BossSensor
 523 | https://github.com/gvoysey/DeepSpeech
 524 | https://github.com/llSourcell/tensorflow_speech_recognition_demo
 525 | https://github.com/CodeLeague/neural_complete
 526 | https://github.com/yarikos/pygta5
 527 | https://github.com/chenjun0210/deep_recommend_system
 528 | https://github.com/HaraldoFilho/DLND-transfer-learning
 529 | https://github.com/RedSunCMX/tensorflow-101
 530 | https://github.com/lucywi/artistic-style-transfer
 531 | https://github.com/kimoktm/U-Net
 532 | https://github.com/ragundez/data-science-summit-2016
 533 | https://github.com/philipperemy/tensorflow-ctc-speech-recognition
 534 | https://github.com/TokyoIndex/dog_project
 535 | https://github.com/petrux/dket
 536 | https://github.com/daimrod/opinion-sentence-annotator
 537 | https://github.com/yungbyun/DeepLearningZeroToAll
 538 | https://github.com/gretchenriggs/Nature...Or-Not-
 539 | https://github.com/MarvinTeichmann/Tensorflow-Segmentation-Toolkit
 540 | https://github.com/bfortuner/deephacks
 541 | https://github.com/deekshithmarla/braid
 542 | https://github.com/scne/svhn_classifier
 543 | https://github.com/udacity/dog-project
 544 | https://github.com/lene/nn-wtf
 545 | https://github.com/paarthneekhara/text-to-image
 546 | https://github.com/icoxfog417/DialogueBreakdownDetection2016
 547 | https://github.com/xymeow/BossSensor
 548 | https://github.com/nnbuilder/nnbuilder
 549 | https://github.com/keonkim/reinforcement-learning
 550 | https://github.com/zsdonghao/tensorlayer
 551 | https://gitlab.com/Hyogen/MesCulturalAlicanteKeras
 552 | https://github.com/douglaseck/aiexperiments-ai-duet
 553 | https://github.com/shivam-kotwalia/mnist
 554 | https://github.com/soodoku/ethnicolr
 555 | https://github.com/achillesrasquinha/Fabrik
 556 | https://github.com/philipperemy/tensorflow-cnn-time-series
 557 | https://github.com/goodasa/data_school_at_gachon
 558 | https://github.com/leotouroul/network_game_theory
 559 | https://github.com/MichaelObi/SimpleBot
 560 | https://github.com/mouradmourafiq/tensorflow-lstm-regression
 561 | https://github.com/fluxcapacitor/source.ml
 562 | https://github.com/sg-kim/DeepLearningZeroToAll
 563 | https://github.com/johnpineda4/tensorflow_speech_recognition_demo
 564 | https://github.com/luisguiserrano/AIND-DL
 565 | https://github.com/jimmyzzu/libsdae-autoencoder-tensorflow
 566 | https://github.com/rmdort/tensorflow_cookbook
 567 | https://github.com/nazar-ivantsiv/bee-brood-counter
 568 | https://github.com/tansey/sdp
 569 | https://github.com/Shaggy2606/Api_DBMSProject
 570 | https://github.com/dhruvramani/RecipeNet
 571 | https://github.com/mgka/notebook
 572 | https://github.com/zakonsx/chatbot-retrieval
 573 | https://github.com/jwzinser/proyecto
 574 | https://github.com/oeuf/on-the-dl
 575 | https://github.com/davidjurgens/equilid
 576 | https://github.com/ml-lab/dfi-tensorflow
 577 | https://github.com/MichaelFeng87/facenet
 578 | https://github.com/xiexingzhu/aces
 579 | https://github.com/brianmhiggins/cs_294w_senior_project
 580 | https://github.com/onpoeet/text-to-image
 581 | https://github.com/2018sjain/CartPolev0-DNN
 582 | https://github.com/cc13ny/tensorlayer
 583 | https://github.com/kartikT007/Udacity
 584 | https://github.com/EmmaBYPeng/Tensorflow-DeconvNet-Segmentation
 585 | https://github.com/xcwill/my_chatbot
 586 | https://github.com/rising-turtle/DeepLearning_study
 587 | https://github.com/nanounanue/jitomate
 588 | https://github.com/viswavi/languageid
 589 | https://github.com/lucasvieirademiranda/tv-script-generation
 590 | https://github.com/slaclab/psmlearn
 591 | https://github.com/Crashthatch/tensorflow-lstm-regression
 592 | https://github.com/thisisjl/KerasMNIST_tutorial
 593 | https://github.com/icoxfog417/magenta_session
 594 | https://github.com/llSourcell/artistic-style-transfer
 595 | https://github.com/aredhatgopi/BML
 596 | https://github.com/kenstars/chatbot-retrieval
 597 | https://github.com/shkr/tensorflow_examples
 598 | https://github.com/amirj/neural-relevance-model
 599 | https://github.com/LHHIGHTECH/tensorflow_speech_recognition_demo
 600 | https://github.com/leovetter/youtube8m
 601 | https://github.com/distagon/DeepLearningZeroToAll
 602 | https://github.com/Ggoals/DeepLearningZeroToAll
 603 | https://github.com/brangerbriz/midai
 604 | https://github.com/thrillerist/TensorFlow-Tutorials
 605 | https://github.com/Shetty4L/malware-classification
 606 | https://github.com/llSourcell/tf_seq2seq_chatbot
 607 | https://github.com/larahronn/TFLearn_projects
 608 | https://github.com/shrjain/query-embeddings
 609 | https://github.com/xmartlabs/benderthon
 610 | https://github.com/dimorinny/tensorflow-image-classificator
 611 | https://github.com/pacocp/Defect-Detection-in-Nanofibers-by-Image-Classification
 612 | https://github.com/jottenlips/DeepDSP
 613 | https://github.com/qiuwch/tensorpack
 614 | https://github.com/FlowSea/BossSensor
 615 | https://github.com/masinogns/fefe
 616 | https://github.com/atveit/keras2ios
 617 | https://github.com/quangvu0702/sku_2_vec
 618 | https://github.com/brendansudol/hello-tensorflow
 619 | https://github.com/nilwyh/alitrade
 620 | https://github.com/DangerousDoughnuts/DoughnutCalendar
 621 | https://bitbucket.org/Eternal_Stranger/boss-sensor
 622 | https://github.com/fanderegg/wikipedia_classification
 623 | https://github.com/jthurst3/MemeCaptcha
 624 | https://github.com/djahng/p3-tv-script-generation
 625 | https://github.com/ajvani/cardr-public
 626 | https://github.com/icoxfog417/tying-wv-and-wc
 627 | https://github.com/jvlmdr/simple-rl
 628 | https://github.com/robott12/didactic_lda
 629 | https://github.com/pminervini/neural-walker
 630 | https://github.com/kingfengji/gcForest
 631 | https://github.com/omarbenzekri/test
 632 | https://github.com/hiroyuki827/tensorflow_workdir
 633 | https://github.com/banu-prakash/DNN
 634 | https://github.com/elenduuche/tf-stanford-tutorials
 635 | https://github.com/jiegzhan/TensorFlow-Tutorials
 636 | https://github.com/ruimashita/dnn
 637 | https://github.com/G10DRAS/g2p-seq2seq
 638 | https://github.com/etkirsch/autoambience
 639 | https://github.com/sytjyjj/Math624Project
 640 | https://github.com/Omranic/DeepLearningZeroToAll
 641 | https://github.com/WenchenLi/chatbot-UDC-dual-encoder-lstm
 642 | https://github.com/jimmec/tensorflow-demo
 643 | https://github.com/stephenhky/MoguNumerics
 644 | https://github.com/shahaf-sameach/noya
 645 | https://github.com/tempbottle/tensorflow_cookbook
 646 | https://github.com/AjayTalati/tinier-nn
 647 | https://github.com/raktimmondol/deep-belief-network
 648 | https://github.com/GzuPark/tv_script_generation
 649 | https://github.com/CVML/tensorflow_cookbook
 650 | https://github.com/TheBottleSeller/butter
 651 | https://github.com/Zer0101/colorize--nn3gen
 652 | https://github.com/tony36486/Machine-Learning
 653 | https://github.com/bcmertz/Frame-Python
 654 | https://github.com/fastai/word-embeddings-workshop
 655 | https://github.com/lessons-of-k4zzk/lessons-flask
 656 | https://github.com/lnicalo/tensorflow_cookbook
 657 | https://github.com/mitchelljeff/modelf
 658 | https://github.com/ganguli-lab/twpca
 659 | https://github.com/yidiz9404/image_captioning
 660 | https://github.com/uiureo/ossan-filter
 661 | https://github.com/ErickDiaz/word2vec_embeddings
 662 | https://github.com/chenmingxiang110/cs224_reconstruction
 663 | https://github.com/alifanov/pix2code-reimplement
 664 | https://github.com/nsbradford/CS525-DeepNeuralNetworks
 665 | https://github.com/lzgahbb/facenet
 666 | https://github.com/calvinschmdt/EasyTensorflow
 667 | https://github.com/roshanatl/heroku-basic-flask
 668 | https://github.com/tensorprob/tensorprob
 669 | https://github.com/Libardo1/deep_recommend_system
 670 | https://github.com/chrisloy/transcribe
 671 | https://github.com/mentix02/ManAI
 672 | https://github.com/aimeida/ner
 673 | https://github.com/ErickDiaz/TFLearn_sentiment_analysis
 674 | https://github.com/devilhtc/cs224-assign3
 675 | https://github.com/LepiorzDaniel/test2
 676 | https://github.com/danaoira/Miscellaneous
 677 | https://github.com/JulianYG/224nfinalproject
 678 | https://github.com/HvyD/AIND2-Dog_Project
 679 | https://github.com/ivan-liljeqvist/MachineLearningFun
 680 | https://github.com/inspur-iop/zhusuan
 681 | https://github.com/bentocin/dlnd_project3_tv_script_generation
 682 | https://github.com/danielyinanc/desktop
 683 | https://github.com/markusodenthal/intro-to-rnn
 684 | https://github.com/watrool/dog_breed_dectetor
 685 | https://github.com/nirgn975/DLND
 686 | https://github.com/ml-lab/deep-pwning
 687 | https://github.com/JosephCatrambone/ImageFab
 688 | https://github.com/ykl7/image-ns
 689 | https://github.com/dfgit/cdsw-short
 690 | https://github.com/0xcaff/nos-stock
 691 | https://github.com/meinternational/tensorflow_udacity
 692 | https://github.com/jmeakin/courses
 693 | https://github.com/mandalsaroj/q-categorizer
 694 | https://github.com/franciscovargas/AT-THack
 695 | https://github.com/pedrohserrano/jitomate
 696 | https://github.com/fhennecker/meta-rl-acrobot
 697 | https://github.com/sightlabs/dist-keras
 698 | https://github.com/guziks/dlnd-tv-script-generation
 699 | https://github.com/YuriyGuts/snake-ai-reinforcement
 700 | https://github.com/bogdan-kulynych/denoising-cnn
 701 | https://github.com/cchio/deep-pwning
 702 | https://github.com/joancarles-upv/OSVOS-TensorFlow
 703 | https://github.com/Sasha-P/Whats-cooking
 704 | https://github.com/jolohan/ML4
 705 | https://github.com/sleepokay/mnist-flask-app
 706 | https://github.com/ltrottier/keras-object-recognition
 707 | https://github.com/bluedot951/PennApps2016
 708 | https://github.com/daniel-muthukrishna/DASH
 709 | https://github.com/Glitch-is/ARTI-NOAH
 710 | https://github.com/timpetri/CS525_Project
 711 | https://github.com/jzbjyb/DSSA
 712 | https://github.com/aniketshukla/AudioSentiment
 713 | https://github.com/ami-GS/ngraph
 714 | https://github.com/tayrelgrin/BossSensor
 715 | https://github.com/smrjan/machine-learning
 716 | https://github.com/cache-me-outside/odark
 717 | https://github.com/jrios6/DLND-TV-Script-Generation
 718 | https://github.com/yfpeng/cs224n
 719 | https://github.com/ageron/tensorflow-safari-course
 720 | https://github.com/ml-ai-nlp-ir/EasyTensorflow
 721 | https://github.com/KatsuyaKawabe/traffic_predict
 722 | https://github.com/morganw/Scene-Labeling
 723 | https://github.com/thunn/tensorflow_tutorials
 724 | https://github.com/JGuillaumin/deepingen
 725 | https://github.com/mdda/deep-learning-workshop
 726 | https://github.com/minhoolee/Synopsys-Project-2017
 727 | https://github.com/stefanwebb/tensorflow-models
 728 | https://github.com/PlanetExp/ca-rnn
 729 | https://github.com/RuiShu/kaos
 730 | https://github.com/Vasuji/deep-learning
 731 | https://github.com/laozhuang727/DeepLearning-SirajologyChallenges
 732 | https://github.com/ram978/Coursera-ML-AndrewNg
 733 | https://github.com/fastforwardlabs/vae-tf
 734 | https://github.com/valohai/tensorflow-example
 735 | https://github.com/gxlzj/CS224nProj_src
 736 | https://github.com/yj20586/deep_recommend_system
 737 | https://github.com/jotterbach/dstk
 738 | https://github.com/BenjaVR/delay-genie
 739 | https://github.com/ForkedReposBak/tensorflow-101
 740 | https://github.com/PythonWorkshop/intro-to-tensorflow
 741 | https://github.com/matheuslrsouza/deep-learning
 742 | https://github.com/boerjames/leuko-tf
 743 | https://github.com/imagef/tensorlayer
 744 | https://github.com/hanna216/RIN
 745 | https://github.com/tperol/ConvNetQuake
 746 | https://github.com/RohanVardhan/House-Price-Prediction-Analysis
 747 | https://github.com/robeceiro/aind2-dog-project
 748 | https://github.com/perchrib/masters_thesis
 749 | https://github.com/marsma/deep_recommend_system
 750 | https://github.com/kornilova-l/tensorflow-pokemon
 751 | https://github.com/adrianlyjak/harry_potter_machine
 752 | https://github.com/chenbiaolong/tfmesos
 753 | https://github.com/ebigelow/detect-relationships
 754 | https://github.com/ml-ai-nlp-ir/tf-stanford-tutorials
 755 | https://github.com/playgood111/gcForest-1
 756 | https://github.com/mrdougwright/DLND-rnn-tv-script
 757 | https://github.com/petrux/LiTeFlow
 758 | https://github.com/vykanton/kokako
 759 | https://github.com/zixia/python-facenet
 760 | https://github.com/xmfbit/tf-stanford-tutorials
 761 | https://github.com/seanchen11/Keras
 762 | https://github.com/shoeffner/ann3depth
 763 | https://github.com/Aggrathon/GANTextureGenerator
 764 | https://github.com/fomorians/tfstage
 765 | https://github.com/vunb/tf-stanford-tutorials
 766 | https://github.com/inessus/Deep-Learning-TensorFlow
 767 | https://github.com/Vasuji/DLND-tf-stanford-tutorials-sequence-to-sequence
 768 | https://github.com/zhangrao1990/CS224N
 769 | https://github.com/shamazharikh/BRATZZ_ZEGMENTATION
 770 | https://github.com/aschampion/diluvian
 771 | https://github.com/rajat1994/TensorFlow_Flask_MNIST_Heroku
 772 | https://github.com/wavelets/pydata-amazon-products
 773 | https://github.com/otaviogood/carputer
 774 | https://github.com/Shmuma/rl
 775 | https://github.com/h4nyu/deep-trader
 776 | https://github.com/takemikami/imas_hack-20170517
 777 | https://github.com/tokestermw/text-gan-tensorflow
 778 | https://github.com/Blusea/tf-stanford-tutorials
 779 | https://github.com/juanka1331/VAN-applied-to-Nifti-images
 780 | https://github.com/nelson-liu/paraphrase-id-tensorflow
 781 | https://github.com/zentechthaingo/EasyTensorflow
 782 | https://github.com/tcrossland/time_series_prediction
 783 | https://github.com/Libardo1/Deep-Learning-TensorFlow
 784 | https://github.com/llSourcell/How-to-Generate-Art-Demo
 785 | https://github.com/dennybritz/chatbot-retrieval
 786 | https://github.com/tf-learning/tf-mnist
 787 | https://github.com/knathanieltucker/tf-keras-tutorial
 788 | https://github.com/seominjoon/dqa-net
 789 | https://github.com/dddoss/tensorflow-socher-ntn
 790 | https://github.com/peixuanx/ChatBot
 791 | https://github.com/ximen120/dataAnalysis
 792 | https://github.com/shorxp/tensorlayer
 793 | https://github.com/webb04/NetflixPauser
 794 | https://github.com/lean-poker-bob/poker-player-smiling-duck-ai-test
 795 | https://github.com/kabina/tf_seq2seq_chatbot
 796 | https://github.com/yandexdataschool/neurohack-2016-starterkit
 797 | https://github.com/Avsecz/concise
 798 | https://github.com/Amber819/awesome-embedding-models
 799 | https://github.com/dajiu/BossSensor
 800 | https://github.com/NeverDoubtTheWorm/Deep-Learning-Nanodegree-nd101
 801 | https://github.com/cerndb/dist-keras
 802 | https://github.com/codelab-tf-got/code
 803 | https://github.com/quietcoolwu/tf-stanford-tutorials
 804 | https://github.com/lnchpd/udacity_dl
 805 | https://github.com/nkundiushuti/pydata2017bcn
 806 | https://github.com/nandakishorkoka/deep-learning-nd
 807 | https://github.com/ml-lab/lda2vec-tf
 808 | https://github.com/tjacobs/baselines
 809 | https://github.com/kairen/tensorflow-workshop
 810 | https://github.com/Vunb/SpeakEasy
 811 | https://github.com/meranaamjoker/deep-learning
 812 | https://github.com/ADGEfficiency/energy_py
 813 | https://github.com/rajat1994/WebApp-for-breast-cancer-detection
 814 | https://github.com/dharness/sqwak-api
 815 | https://github.com/yesray0216/pygta5
 816 | https://github.com/liuzard/Deep-Learning-TensorFlow
 817 | https://github.com/akset8/skynet
 818 | https://github.com/lopuhin/kaggle-dstl
 819 | https://github.com/markiett/deep-learning
 820 | https://github.com/gaoxuesong/DeepSpeech
 821 | https://github.com/keevol/BossSensor
 822 | https://github.com/miyamotok0105/ai_chatbot
 823 | https://github.com/Tornadoman/captcha-break
 824 | https://github.com/625673575/PyGTA
 825 | https://github.com/hershal/tensorflow-testing
 826 | https://github.com/Adamits/arapaho_library
 827 | https://github.com/vssouza/multilayer-perceptron-tf
 828 | https://github.com/aprice2704/dlnd-project3
 829 | https://github.com/wagamamaz/tensorlayer
 830 | https://github.com/zekearneodo/tf_spectral
 831 | https://github.com/hongj77/DeepLearningGameAI
 832 | https://github.com/jbencook/zappa-tensorflow-poc
 833 | https://github.com/jessejlt/cifar10
 834 | https://github.com/kensk8er/langdist
 835 | https://github.com/galaxysd/BossSensor
 836 | https://github.com/chiphuyen/tf_oreilly
 837 | https://github.com/CV-IP/Scene-Labeling
 838 | https://github.com/suriyadeepan/hcn
 839 | https://github.com/daniel-shimon/char-rnn-tensorflow
 840 | https://github.com/CachesToCaches/tensorflow_tutorials
 841 | https://github.com/seher0/mt
 842 | https://github.com/damienstanton/ai-training
 843 | https://gitlab.com/yogeshc/edward
 844 | https://github.com/pedroabg/dlnd
 845 | https://github.com/petrbel/sds
 846 | https://github.com/justmeshishir/orchestrate-ai
 847 | https://github.com/Swig-DPI/udacity-p3
 848 | https://github.com/HCTsai/OpenIC
 849 | https://github.com/mouradmourafiq/philo2vec
 850 | https://github.com/Yoctol/SeqGAN
 851 | https://github.com/koyo922/deep-learning
 852 | https://github.com/ybai62868/tensorlayer
 853 | https://github.com/elenduuche/tensorflow_cookbook
 854 | https://github.com/bsuper/biomet
 855 | https://github.com/DavieHR/BossSensor
 856 | https://github.com/akkefa/facefinder
 857 | https://github.com/DannyGsGit/GTC_2017_Experiments
 858 | https://github.com/fhennecker/meta-reinforcement-learning
 859 | https://github.com/GeekLiB/tensorflow_speech_recognition_demo
 860 | https://github.com/pannous/DeepSpeech
 861 | https://github.com/kevin28520/tensorflow_cookbook
 862 | https://github.com/OrkoHunter/MLinProduction
 863 | https://github.com/jt6211/deep-learning
 864 | https://github.com/vssouza/handwritten-recognition-tflearn
 865 | https://github.com/bio-ontology-research-group/rulemin
 866 | https://github.com/shareactorIO/pipeline
 867 | https://github.com/linxinzhe/deep-learning
 868 | https://github.com/scharoun/DeepSpeech
 869 | https://github.com/SudhakarReddyPeddinti/tensorflow-cnn-web
 870 | https://github.com/ExtraYin/Measure_Relationship_Strength
 871 | https://github.com/junmyung/Tensorflow-DeconvNet-Segmentation
 872 | https://github.com/kanalasumant/artistic-style-transfer
 873 | https://github.com/aurelius23/deep-learning
 874 | https://github.com/Pholey/Pathfinder
 875 | https://github.com/dragonabyss/DeepLearningZeroToAll
 876 | https://github.com/icrtiou/Coursera-ML-AndrewNg
 877 | https://github.com/slinjhu/LearnTensorflow
 878 | https://github.com/matthewzar/UdacityProject3ScriptGenerator
 879 | https://github.com/AuroraLHT/face-generator
 880 | https://github.com/noootown/Forex-DQN
 881 | https://github.com/pligor/msd-music-genre-classification
 882 | https://github.com/smashingboxes/ML_Experiments
 883 | https://github.com/lsls01/Udacity_Deep_Learning_Foundation_Projects
 884 | https://github.com/bio-ontology-research-group/deepgoweb
 885 | https://github.com/ml-ai-nlp-ir/seq2seq-1
 886 | https://github.com/KirovVerst/tensorflow
 887 | https://github.com/erfannoury/qrn
 888 | https://github.com/comzyh/python-grpc-async-server-example
 889 | https://github.com/michalpelka/How-to-Generate-Art-Demo
 890 | https://github.com/aiUIUC/pyAIUtils
 891 | https://github.com/apurveyajnik/DeepLearning-stuff
 892 | https://github.com/andykamath/Caption-Generator
 893 | https://github.com/MandyZChen/srez
 894 | https://github.com/jay-dee7/handson-ml
 895 | https://github.com/arabiaweather/athena
 896 | https://github.com/GeekLiB/BossSensor
 897 | https://github.com/BenjaminBossan/mink
 898 | https://github.com/ProofByConstruction/texture-networks
 899 | https://github.com/doradora2017/project3-tv-script-generation
 900 | https://github.com/krinkels/sketch-recognition
 901 | https://github.com/xymeow/neural-style-visualizer
 902 | https://github.com/151706061/tensorlayer-chinese
 903 | https://github.com/ImperialAlphaLab/pygreg
 904 | https://github.com/hughhan1/artwork
 905 | https://github.com/bradyz/geometry_processing
 906 | https://github.com/random-forests/tf-stanford-tutorials
 907 | https://github.com/lcoulet/srez
 908 | https://github.com/jkahn/samyro
 909 | https://github.com/LeeKyungMoon/Judging-a-Book-by-its-Cover
 910 | https://github.com/davidbernat/hello-planet
 911 | https://github.com/dkatz24/DLND
 912 | https://github.com/mding5692/MLForHackers
 913 | https://github.com/jjz/intro-to-tensorflow
 914 | https://github.com/winpraneeth/tv-script-generation
 915 | https://github.com/brangerbriz/midi-rnn
 916 | https://github.com/kootenpv/deep_eye2mouse
 917 | https://github.com/ml-lab/unrolled_gan
 918 | https://github.com/weissercn/MLTools
 919 | https://github.com/toc14C/bioisosteres
 920 | https://github.com/dkarmon/keras_hyperparams_optimizer
 921 | https://github.com/alexgarciac/TensorFlow-Tutorials
 922 | https://github.com/pratos/tflaskapi
 923 | https://bitbucket.org/rscapplications/chemlistem
 924 | https://github.com/coopie/speech_ml
 925 | https://github.com/ctmakro/canton
 926 | https://github.com/cmebionic/TensorFlow-Tutorials
 927 | https://github.com/nelhage/tf-experiments
 928 | https://github.com/chuckcho/coursera-ML
 929 | https://github.com/Libardo1/quiver
 930 | https://github.com/Ram81/IDE
 931 | https://github.com/Parsonswlu/dog-project
 932 | https://github.com/ElchinValiyev/tf-embedding-visualization-demo
 933 | https://github.com/animate-object/r-prime
 934 | https://github.com/tfboyd/dlbench
 935 | https://github.com/Bakuutin/lstm_text_generator
 936 | https://github.com/rjw57/yoshi-tf-example
 937 | https://github.com/polyaxon/polyaxon
 938 | https://github.com/nicolashennetier/questions_answering
 939 | https://github.com/sunq-run/test
 940 | https://github.com/nicolas-ivanov/seq2seq-1
 941 | https://github.com/Kiri23/image_recognition_web_app
 942 | https://github.com/goldservice2017/Face-Detection
 943 | https://github.com/braingineer/opentc
 944 | https://github.com/alexgurrola/ai-reference
 945 | https://github.com/fernandomarins/tv-script-generation-dlnd
 946 | https://github.com/hopshadoop/hops-tensorflow
 947 | https://github.com/shmsw25/bi-att-flow
 948 | https://github.com/derui/painter-tensorflow
 949 | https://github.com/meereeum/vANNilla-tf
 950 | https://github.com/MaybeS/face-detection
 951 | https://github.com/trung-gm/deep-learning
 952 | https://github.com/AvijitGhosh82/SMA_InterIIT_2017
 953 | https://github.com/ALISCIFP/Tensorflow-Segmentation-Toolkit
 954 | https://github.com/SooluThomas/Auro
 955 | https://github.com/datalogue/keras-attention
 956 | https://github.com/janvdvegt/KernelMixtureNetwork
 957 | https://github.com/NiloofarAzizi/PredictionSegmentation
 958 | https://github.com/ndeepesh/Udacity-DLND
 959 | https://github.com/Large-Scale-Tensor-Decomposition/tensorD
 960 | https://github.com/JKKorea/DeepLearningZeroToAll
 961 | https://github.com/SolessChong/qunzhume-ai
 962 | https://github.com/icareon/tv-script-generation
 963 | https://github.com/HuoShan-Corleone/Udacity_DLND_P3_Master
 964 | https://github.com/Dakurels/beta-gomoku
 965 | https://github.com/melfm/dukecone
 966 | https://github.com/paulperry/kaggle
 967 | https://github.com/meereeum/lda2vec-tf
 968 | https://github.com/m-heerde/wheat-beer_with_banana-juice
 969 | https://github.com/ml-lab/ImageRetrieval-tf
 970 | https://github.com/kootenpv/neural_complete
 971 | https://github.com/awjuliani/dfp
 972 | https://github.com/hershedtilak/CS224N
 973 | https://github.com/davidbernat/for-viewing
 974 | https://github.com/ChengjinLi/machine_learning
 975 | https://github.com/WoundMetrics/facenet
 976 | https://github.com/JamesDaniel/tensorflow-transform-images
 977 | https://github.com/ml-lab/aiexperiments-ai-duet
 978 | https://github.com/dashan-emr/GPflow
 979 | https://github.com/gongyanchao/aind2-rnn
 980 | https://github.com/cwwwu/udacity-dlnd-projects
 981 | https://github.com/vladbataev/ctc_tensorflow
 982 | https://github.com/ajayunagar/DeepLearningZeroToAll
 983 | https://github.com/jimmcgaw/tensor
 984 | https://github.com/gakarak/BTBDB_ImageAnalysisSubPortal
 985 | https://github.com/DiamonJoy/tensorlayer
 986 | https://github.com/ALISCIFP/TensorVision
 987 | https://github.com/dplewa/ml-letters-2017
 988 | https://github.com/DivyanshBhatia/DeepLearning-tv-script-generator
 989 | https://github.com/pdwyys20/cn-deep-learning
 990 | https://github.com/jiamings/markov-chain-gan
 991 | https://github.com/shivam-kotwalia/vgg16_heroku
 992 | https://github.com/ralphatobe/CS224NHW3
 993 | https://github.com/LanJosh/TheAITimes
 994 | https://github.com/blackecho/Deep-Learning-TensorFlow
 995 | https://github.com/SDupZ/mlsdupz
 996 | https://github.com/swhh/deepqlearning
 997 | https://github.com/jbrubaker/ml_tests
 998 | https://github.com/faroit/nsynth-convert
 999 | https://github.com/shuvanon/Biryani-or-Not-Biryani
1000 | https://github.com/hdasappinc/chatbot-retrieval
1001 | https://github.com/eglassman/MLforPrograms
1002 | https://github.com/jaquim/MediaUnderstandingAPI
1003 | https://github.com/tucanae47/tensorpeers
1004 | https://github.com/freaad/srez
1005 | https://github.com/gfyoung/logofinder
1006 | https://github.com/apolanco3225/Generate-Simpsons-TV-Scripts-using-RNNs
1007 | https://github.com/cgc/rnd
1008 | https://github.com/arhik/nupic.research
1009 | https://github.com/anjishnu/surreal
1010 | https://github.com/JasonNK/tv-script-generation
1011 | https://github.com/appcoreopc/kaggleCompete
1012 | https://github.com/melindadevins/How-to-Generate-Art-Demo
1013 | https://github.com/vanyaland/deep-learning-foundation
1014 | https://github.com/TalkingData/edward
1015 | https://github.com/faisal-w/chatbot-retrieval
1016 | https://github.com/taweechoke/Project
1017 | https://github.com/ZhaoJ9014/One-Hundred-Layers-Tiramisu
1018 | https://github.com/xebia-france/magritte
1019 | https://github.com/ml-lab/Seq2Seq_Upgrade_TensorFlow
1020 | https://github.com/reinforceio/tensorforce
1021 | https://github.com/haolang9527/SeniblityClassfiction_zh
1022 | https://github.com/brotherhuang/tensorflow_cookbook
1023 | https://github.com/kod3r/Project_RNN_Enhancement
1024 | https://github.com/AndreaSuckro/CANN
1025 | https://github.com/w821881341/gcforest
1026 | https://github.com/ml-lab/csgm
1027 | https://github.com/RowlandOti-Student/TensorFlow-Tutorials
1028 | https://github.com/lolkids/chatbot-retrieval
1029 | https://github.com/chatappcodepath/tf_seq2seq_chatbot
1030 | https://github.com/pangjiuzala/deeplearning
1031 | https://github.com/freaad/BossSensor
1032 | https://github.com/Congo-Collaborations/ntds_2016
1033 | https://github.com/ThomasChen94/Authorship-Identification
1034 | https://github.com/stefanwebb/tensorflow-datasets
1035 | https://github.com/YRustt/Course-work
1036 | https://github.com/kensk8er/chicksexer
1037 | https://github.com/nicolas-ivanov/Seq2Seq_Upgrade_TensorFlow
1038 | https://github.com/Rperry2174/neural-net-digit-converter
1039 | https://github.com/Fematich/conceptnetwork
1040 | https://github.com/rafaelnovello/mnist-demo
1041 | https://github.com/lucasdavid/connoisseur
1042 | https://github.com/JeremyCHN/DLND-tv-script-generation
1043 | https://github.com/mattberjon/image-classification
1044 | https://github.com/Jakobovski/alt_backprop
1045 | https://github.com/gorefbitim/NN
1046 | https://github.com/gxie20/tv-script-generation
1047 | https://github.com/Rob-M-F/transfer-learning
1048 | https://github.com/apacha/MusicSymbolClassifier
1049 | https://github.com/samuelzhouhe/CIFAR10
1050 | https://github.com/parkerzf/nowinteract
1051 | https://github.com/kashim-zcxk/clasificador-mascota
1052 | https://github.com/sheuan/deep-learning
1053 | https://github.com/nyhkwon/ClassifyingDriverBehavior
1054 | https://github.com/danieljl/aind-dog-project
1055 | https://github.com/nitro-code/inception-api
1056 | https://github.com/vickydasta/tf-stanford-tutorials
1057 | https://github.com/mKaloer/ArcadeReinforcementLearning
1058 | https://github.com/bgfurfeature/Deep-Learning-TensorFlow
1059 | https://github.com/quickresolve/accel.ai
1060 | https://github.com/alshedivat/edward
1061 | https://github.com/benmathes/tensorflow
1062 | https://github.com/winnerineast/tensorflow_cookbook
1063 | https://github.com/copotron/SDC-P5
1064 | https://github.com/joshcai/aDi-music
1065 | https://github.com/361512/cs224u
1066 | https://github.com/sohcalvin/ref
1067 | https://github.com/webeng/bi-att-flow
1068 | https://github.com/lucawint/html_ner_keras
1069 | https://github.com/dem-esgal/Deep-Learning-TensorFlow
1070 | https://github.com/ejconlon/digits
1071 | https://github.com/nanoporetech/medaka
1072 | https://github.com/tbornt/UCDIG_tensorflow
1073 | 


--------------------------------------------------------------------------------
/snippet_ranger/data/tqdm_dependent_reps.txt:
--------------------------------------------------------------------------------
   1 | https://github.com/dtorrejo/py-nlp
   2 | https://github.com/pranavlathigara/FreeWifi
   3 | https://github.com/TariqAHassan/BioVida
   4 | https://github.com/austinhartzheim/nothing-to-hide
   5 | https://github.com/rusenask/hoverfly-example-readthedocs
   6 | https://github.com/matthewfl/nlp-entity-convnet
   7 | https://github.com/autojazari/sdc-lab1-notmnist
   8 | https://github.com/nikhilkumarsingh/content-downloader
   9 | https://github.com/shaunstanislaus/statuspage
  10 | https://github.com/guardian/data-projector
  11 | https://github.com/umitunal/MLAlgorithms
  12 | https://github.com/billvsme/videoSpider
  13 | https://github.com/nirizr/timewatch
  14 | https://github.com/TurfMedia/statuspage
  15 | https://github.com/ruaruagerry/tenhou-python-bot
  16 | https://github.com/rocity/dj-instagram
  17 | https://github.com/gbhrdt/instabot
  18 | https://github.com/luiscruz/ghsearch-python
  19 | https://github.com/iAnanich/gismeteo-news-scraping
  20 | https://github.com/atlab/attorch
  21 | https://github.com/rushter/MLAlgorithms
  22 | https://bitbucket.org/medtechdiagnostics/video2dcm
  23 | https://github.com/Ghadjeres/DeepBach
  24 | https://github.com/nisace/gan-lib
  25 | https://github.com/pjthepooh/BigBoldBets
  26 | https://github.com/ag-gipp/imageplag
  27 | https://github.com/growbots/dataproc-config
  28 | https://github.com/brainix/pottery
  29 | https://github.com/fmoliveira/statuspage
  30 | https://github.com/kingtaurus/cs231n
  31 | https://github.com/SunDwarf/Spacemail
  32 | https://github.com/verkaufer/RandomPokemonAlexa
  33 | https://github.com/Mavrx-inc/sentinelsat
  34 | https://github.com/miumiu0917/LifeGame
  35 | https://github.com/biocommons/biocommons.seqrepo
  36 | https://github.com/ToniCreswell/piGAN
  37 | https://github.com/bryant1410/readmesfix
  38 | https://github.com/pmlandwehr/cf_maintainer_bot
  39 | https://github.com/sefakilic/cgb
  40 | https://github.com/agj60/face_generation
  41 | https://github.com/blue-yonder/tsfresh
  42 | https://github.com/Miserlou/serverless-imagehost
  43 | https://github.com/m09/examples
  44 | https://github.com/Sherwoodwt/TaskManager
  45 | https://github.com/lethehaiau/BiDAF
  46 | https://github.com/njross/dc-law-tools
  47 | https://github.com/thias15/dl-nd-project2
  48 | https://github.com/XENON1T/hax
  49 | https://github.com/valgur/sentinelsat
  50 | https://github.com/theref/Axelrod
  51 | https://github.com/totalgood/pugnlp
  52 | https://github.com/scriptotek/lokar
  53 | https://github.com/sacreman/dlcli
  54 | https://github.com/thriveministry/statuspage
  55 | https://github.com/NikitaKoshelev/uragan
  56 | https://github.com/yamakira/datasploit
  57 | https://github.com/bobcolner/pgrap
  58 | https://github.com/oryonatan/tv23_site
  59 | https://github.com/rh-marketingops/mlsm
  60 | https://github.com/tkw1536/TrainIsLate
  61 | https://github.com/masasin/resume
  62 | https://github.com/melindadevins/five-video-classification-methods
  63 | https://github.com/bparafina/robobadger
  64 | https://github.com/antiboredom/stocktalk
  65 | https://github.com/kitanata/fantasy-sports-data-analysis
  66 | https://github.com/SBUtltmedia/postreq-python-peoplesoft
  67 | https://github.com/coltyharrison/throne-facts-alexa-skill
  68 | https://github.com/jnazaren/CS105-DataProject
  69 | https://github.com/nav97/Twitter-Profile-Analytics
  70 | https://github.com/AlexandreDecan/ecos-emse
  71 | https://github.com/sarahannnicholson/FNC
  72 | https://github.com/xjdr/pbs
  73 | https://github.com/prasadsawant5/image-classification
  74 | https://github.com/rolando-contrib/TeamHG-Memex-Formasaurus
  75 | https://github.com/sethlivingston/django-mississippi
  76 | https://gitlab.com/cimenx/post-processing-OCR
  77 | https://github.com/texastribune/tx_lobbying
  78 | https://github.com/HubBucket-Team/deep-learning
  79 | https://github.com/jrios6/AIND-Image-Classification
  80 | https://github.com/Antidote1911/cryptoshop
  81 | https://github.com/fhennecker/deepdoom
  82 | https://github.com/adlius/ROSIEBot
  83 | https://github.com/HypothesisWorks/hypothesis-python
  84 | https://github.com/pombredanne/Zappa
  85 | https://github.com/sc4brain/swc2vtk
  86 | https://github.com/naggie/dsblog
  87 | https://github.com/a-rank/avaandmed
  88 | https://gitlab.com/theSage21/malayalam-OCR
  89 | https://github.com/Libardo1/MLAlgorithms
  90 | https://github.com/ppca/DLND-project2
  91 | https://github.com/StepicOrg/django-cities
  92 | https://github.com/eea/eea.corpus
  93 | https://gitlab.com/abassi/ponchoSimon
  94 | https://github.com/ppwwyyxx/tensorpack
  95 | https://github.com/nishworks/Flask-starter
  96 | https://github.com/makokal/funzo
  97 | https://github.com/cdg46/statuspage
  98 | https://github.com/Wavesflag/neupy
  99 | https://github.com/saketkc/moca
 100 | https://github.com/mtahirtariq/instagram-scraper
 101 | https://github.com/karthickj25/deep-learning
 102 | https://github.com/serverdensity/performance-dashboard
 103 | https://github.com/saasgasques/deep-learning
 104 | https://github.com/cauebs/serenata-de-amor
 105 | https://github.com/perimeterofwisdom/statuspage
 106 | https://github.com/ivanychev/pygram
 107 | https://github.com/hulatang/manim
 108 | https://github.com/thulinh12a1/ML_Algorithms
 109 | https://github.com/hmishfaq/pymc3
 110 | https://github.com/WeareJoker/sniff_sender
 111 | https://github.com/knjcode/imgtile
 112 | https://github.com/imindrajit/Udacity-DLND
 113 | https://github.com/YunLi1988/cs224n-SQuAD
 114 | https://github.com/serkanh/Zappa
 115 | https://github.com/orf/spam
 116 | https://github.com/seoweon/narajangteo
 117 | https://github.com/taozi/incubator-singa
 118 | https://github.com/midamo/pylinac
 119 | https://github.com/vyomshm/GAN_face_generation
 120 | https://github.com/500646/Feigong
 121 | https://github.com/eFrane/treemeta
 122 | https://github.com/gongyanchao/dog-project
 123 | https://github.com/NetEaseGame/AutomatorX
 124 | https://github.com/RowlandOti/GenerativeAdversarialNeuralNetwork-FaceGeneration
 125 | https://github.com/barentsen/k2flix
 126 | https://github.com/nelson-liu/bi-att-flow
 127 | https://github.com/traVaulta/another-drop
 128 | https://github.com/cwonrails/statuspage
 129 | https://github.com/melyamri/woa
 130 | https://github.com/Markin/memex-pinterest
 131 | https://github.com/gtamazian/evolspace
 132 | https://github.com/rjames86/slogger2
 133 | https://github.com/tifoit/bi-attention-flow
 134 | https://github.com/bckim92/DQN_gym
 135 | https://github.com/luiscruz/greenbenchmark
 136 | https://github.com/dynamomobile/django-cities
 137 | https://github.com/bschreck/lil-neuron
 138 | https://github.com/achillesrasquinha/trump2cash
 139 | https://github.com/omergunal/hackerbot
 140 | https://github.com/michaelluk/Zappa
 141 | https://github.com/gravitee-io/gravitee-docker
 142 | https://github.com/MetaMetricsInc/Zappa
 143 | https://github.com/jacobmarshall-etc/statuspage
 144 | https://github.com/jayanthkoushik/semantic-scene-search
 145 | https://github.com/jparrent/sne
 146 | https://github.com/matfleaydaly/mpstatus
 147 | https://github.com/ogrisel/thinc
 148 | https://github.com/jt-wang/instagram-scraper
 149 | https://github.com/Brok-Bucholtz/P5-Beta
 150 | https://github.com/energee/panda
 151 | https://github.com/HackTheStacks/TeamDarWin-darwin-cluster
 152 | https://github.com/kimjoseph95/python-fluent-samples
 153 | https://github.com/edx/django-config-models
 154 | https://github.com/bemonolit/datasploit
 155 | https://github.com/Salamek/ddrescue-ffile
 156 | https://github.com/TinaMor/bc-15-twitter-sentiment-analysis-cli
 157 | https://github.com/a1ip/statuspage
 158 | https://github.com/hemulin/airvpn_toggler
 159 | https://github.com/KeplerGO/k2-quality-control
 160 | https://github.com/hc-BLISTR/BLISTR-main
 161 | https://github.com/federicosan/deep-learning
 162 | https://github.com/blangwallner/Udacity---Deep-Learning-ND-Project-5
 163 | https://github.com/pcuellar/Deep-Learning-TensorFlow
 164 | https://github.com/kootenpv/whereami
 165 | https://github.com/criecm/iocage
 166 | https://github.com/el98006/sandbox
 167 | https://github.com/greytip/data-science-utils
 168 | https://github.com/chuckbasstan123/pyTorch_project
 169 | https://github.com/kiat/MLAlgorithms
 170 | https://github.com/hammerlab/cohorts
 171 | https://github.com/firstjob/displaCy-server
 172 | https://github.com/ciancica/instabot
 173 | https://github.com/tiandiao123/Variational-Autoencoder
 174 | https://github.com/zhuhongweiyi/FaceTracker
 175 | https://github.com/sharadmv/trees
 176 | https://github.com/ramon-oliveira/aorun
 177 | https://github.com/jshin49/cnn-cats-vs-dogs
 178 | https://github.com/ConfidentCannabis/Zappa
 179 | https://github.com/FatihZor/datasploit
 180 | https://github.com/DCgov/poirot
 181 | https://github.com/Miserlou/django-zappa
 182 | https://github.com/codeforberlin/treemeta
 183 | https://github.com/PacktPublishing/Learning-Python-for-Forensics
 184 | https://github.com/kod3r/neupy
 185 | https://github.com/noruna/statuspage
 186 | https://github.com/Dgo-list/django-page-cms
 187 | https://github.com/defrex/spendwell
 188 | https://github.com/fral92/TF_main_loop
 189 | https://github.com/nithishdivakar/Talks-and-Tutorials
 190 | https://github.com/workforce-data-initiative/skills-api
 191 | https://github.com/masterminddevteam/alborghetti
 192 | https://github.com/mer163/AutomatorX
 193 | https://github.com/suntzualex/deep-learning
 194 | https://github.com/pln-fing-udelar/false-friends
 195 | https://github.com/pdwyys20/deep-learning
 196 | https://github.com/bmallin/SeqInfo
 197 | https://github.com/m-k-S/MLAlgorithms
 198 | https://github.com/codefortulsa/OpenTulsaDataTools
 199 | https://github.com/khrigo/instragram-follow
 200 | https://github.com/henriblancke/neural-chat
 201 | https://github.com/m516825/ADL2016
 202 | https://github.com/DigiCred/Zappa
 203 | https://github.com/ndronen/spelling
 204 | https://github.com/patrickmesana/conditional-image-generation
 205 | https://github.com/huntwelch/MongoBot
 206 | https://github.com/ramshank/deep-learning
 207 | https://github.com/geodesignhub/LanduseAllocationModel
 208 | https://github.com/jubayerarefin/django-cities
 209 | https://github.com/allenai/bi-att-flow
 210 | https://github.com/starakaj/wikisonnet
 211 | https://github.com/instagrambot/instabot
 212 | https://github.com/Chan9390/datasploit
 213 | https://github.com/bluetouch/kur
 214 | https://github.com/HubBucket-Team/tsfresh
 215 | https://github.com/tigerlero/amazonur8
 216 | https://github.com/WyldPhyr/whereami
 217 | https://github.com/ghackebeil/PyORAM
 218 | https://github.com/materialsproject/fireworks
 219 | https://github.com/faroit/pyCFM
 220 | https://github.com/martinkersner/BeaverDam
 221 | https://github.com/MikeDacre/dbSNP
 222 | https://github.com/willyb321/zeroclickinfo-fathead
 223 | https://github.com/dssg/sanergy-public
 224 | https://github.com/shaharelisha/music-generator
 225 | https://github.com/KingEdwardI/pyxm
 226 | https://github.com/bstriner/keras-tqdm
 227 | https://github.com/clcarwin/examples
 228 | https://github.com/elmarhaussmann/saliency-salgan-2017
 229 | https://github.com/sheuan/tensorpack
 230 | https://github.com/davedoesdev/dtuf
 231 | https://github.com/harvard-lil/ftl-sandbox
 232 | https://github.com/vmoll/moba_quiz
 233 | https://github.com/paulhendricks/neupy
 234 | https://github.com/1462326016/MLAlgorithms
 235 | https://github.com/buriburisuri/sugartensor
 236 | https://github.com/mkoconnor/manim
 237 | https://github.com/omerbenamram/pyzap
 238 | https://github.com/pedvide/simetuc
 239 | https://github.com/barentsen/k2mosaic
 240 | https://github.com/ollie314/MLAlgorithms
 241 | https://github.com/ericzhao28/8thLightApp
 242 | https://github.com/soundsilence/examples
 243 | https://github.com/ml-lab/deeppose_tf
 244 | https://github.com/matt-hayden/screencap
 245 | https://github.com/wangjiezhe/FetchNovels
 246 | https://github.com/stitchfix/fauxtograph
 247 | https://github.com/BlastLibrary/statuspage
 248 | https://github.com/akaitsuki-ii/CS224n
 249 | https://github.com/tdeboissiere/FaceTracker
 250 | https://github.com/BertrandBordage/django-tree
 251 | https://github.com/bede/kindel
 252 | https://github.com/jmrf/lstm_pos_tagger
 253 | https://github.com/quietcoolwu/example-code
 254 | https://github.com/astrocatalogs/cne-external
 255 | https://github.com/XENON1T/laidbax
 256 | https://github.com/ioanmoldovan/zeroclickinfo-fathead
 257 | https://github.com/fdayoub/MLAlgorithms
 258 | https://github.com/thesby/barrista
 259 | https://github.com/sjakthol/dedup-simulator
 260 | https://github.com/vm/nba
 261 | https://github.com/SWTPAIN/dlnd-project-image-classificaiton
 262 | https://github.com/gaeun/MLAlgorithms
 263 | https://github.com/albalu/atomate
 264 | https://github.com/reyreaud-l/unsplashdownloader
 265 | https://github.com/oroszgy/cookiecutter-ml-flask
 266 | https://github.com/ganguli-lab/deepchaos
 267 | https://github.com/bozzmob/udacity-deep-learning-nanodegree
 268 | https://github.com/Corvince/mesa
 269 | https://github.com/condnsdmatters/twirps
 270 | https://github.com/desecho/django-tqdm
 271 | https://github.com/arcestia/Belati
 272 | https://github.com/dtorrejo/py-nlp
 273 | https://github.com/ChristianBagley/unsubscribe
 274 | https://github.com/DatapuntAmsterdam/panorama
 275 | https://github.com/sappy5678/freepacktbook
 276 | https://github.com/Lucidyan/goto
 277 | https://github.com/ligechina/bi-att-flow
 278 | https://github.com/Detry322/remember-app
 279 | https://github.com/jllan/comment_sentiment_analysis
 280 | https://github.com/caasted/face-generation
 281 | https://github.com/Gabriele91/DENN
 282 | https://github.com/shaypal5/pdpipe
 283 | https://github.com/dialoguemd/menhir
 284 | https://github.com/XENON1T/emo
 285 | https://github.com/sdobz/pyfftviz
 286 | https://github.com/iammrhelo/ISCR
 287 | https://github.com/jrkerns/pylinac
 288 | https://github.com/gasgas4/MLAlgorithms
 289 | https://github.com/zrichardson8039/TopTrader
 290 | https://github.com/ThomasHSmith/PhosphoProTools
 291 | https://github.com/nishworks/python-starter
 292 | https://github.com/ssfg/nnvis
 293 | https://github.com/naver/devcenter-open-project-migration
 294 | https://github.com/dveselov/dialog2017
 295 | https://github.com/nbkm8y5/nlp
 296 | https://github.com/nyk510/bayesian_nn
 297 | https://github.com/sllecks/deep_learning
 298 | https://github.com/Lidaguo/MLAlgorithms
 299 | https://github.com/elliottcarlson/MongoBot
 300 | https://github.com/thiagoqd/udacity-deep-learning-foundations
 301 | https://github.com/weng-lab/iocage
 302 | https://github.com/ml-lab/kaggle-dstl
 303 | https://github.com/nschloe/perfplot
 304 | https://github.com/bjd2385/kadenza
 305 | https://github.com/stkerr/railbaron
 306 | https://github.com/lipov3cz3k/waste-transportation-manager
 307 | https://github.com/mdbconsulting/deep-learning
 308 | https://github.com/Ziewvater/YoutubeGiffer
 309 | https://github.com/JelleAalbers/blipflip
 310 | https://github.com/sshleifer/ml_6867
 311 | https://github.com/EN10/STT
 312 | https://github.com/homm/cachecleaner
 313 | https://github.com/muxuezi/lianjia
 314 | https://github.com/ml-lab/kur
 315 | https://github.com/lemiwinks/imageClassification
 316 | https://github.com/Illedran/DL-HEP
 317 | https://github.com/efoley/deep-learning
 318 | https://github.com/sturoscy-personal/react_meetup
 319 | https://github.com/barronalex/Tacotron
 320 | https://github.com/ryanpdwyer/1605-phasekick
 321 | https://github.com/wkentaro/pytorch-fcn
 322 | https://github.com/patwie-stuff/tensorpack
 323 | https://github.com/mynameisfiber/fakenewschallenge
 324 | https://github.com/GapData/tpot
 325 | https://github.com/andrewliao11/Tensorflow-Multi-Threading-Classifier
 326 | https://github.com/jvalansi/HelloDjango
 327 | https://github.com/security-geeks/IPTV
 328 | https://github.com/nueverest/vue_flask
 329 | https://github.com/ytworks/Udacity_Project5
 330 | https://github.com/geoffreysteven/aind2-cnn
 331 | https://github.com/narfman0/mobile_backend
 332 | https://github.com/pzp1997/Alexa-Sefaria
 333 | https://github.com/mothsART/linkmanager
 334 | https://github.com/kevinmel2000/Formasaurus
 335 | https://github.com/chakki-works/chazutsu
 336 | https://github.com/hopsmdev/playground
 337 | https://github.com/Sliding-Mapping/tensorpack
 338 | https://github.com/TUT-ARG/DCASE2017-baseline-system
 339 | https://github.com/edawine/sugartensor
 340 | https://github.com/StarCYing/tag_sapphire
 341 | https://github.com/Libardo1/speech-to-text-wavenet
 342 | https://github.com/saurabhmathur96/happy-and-you-know-it
 343 | https://gitlab.com/iAmMrinal0/resume
 344 | https://github.com/DatapuntAmsterdam/atlas_panorama
 345 | https://github.com/Miserlou/Zappa
 346 | https://github.com/janga1997/Axelrod
 347 | https://github.com/hh2010/malware_classify
 348 | https://github.com/mkowoods/deep-learning
 349 | https://github.com/ayushgoyal1830/image-classification
 350 | https://github.com/cnpy/pythoner.org
 351 | https://github.com/GjjvdBurg/HugoPhotoSwipe
 352 | https://github.com/TeamHG-Memex/undercrawler
 353 | https://github.com/bespoke-digital/spendwell
 354 | https://github.com/ypwalter/Hasal
 355 | https://github.com/ErickDiaz/TensorFlow_Lab
 356 | https://github.com/damasktb/NewsGraph
 357 | https://github.com/akram-mohammed/candis
 358 | https://github.com/Empia/kur
 359 | https://github.com/fluentpython/example-code
 360 | https://github.com/diandianhanbin/AutomatorX
 361 | https://github.com/notnami/autoframenet
 362 | https://github.com/cwonrails/Zappa
 363 | https://github.com/SkyTreasure/Image-Classification
 364 | https://github.com/unibg-seclab/shuffleindex
 365 | https://github.com/rogern7/statuspage
 366 | https://github.com/jperl/stock2vec
 367 | https://github.com/omaralbeik/dlnd_face_generation
 368 | https://github.com/veltzer/pytsv
 369 | https://github.com/jarek/electric2go
 370 | https://github.com/nwhidden/ND101-Deep-Learning
 371 | https://github.com/chenliangomc/biocommons.seqrepo
 372 | https://github.com/antiboredom/videogrep
 373 | https://github.com/Backblaze/B2_Command_Line_Tool
 374 | https://github.com/bestwpw/MLAlgorithms
 375 | https://github.com/SomaticLabs/fetch-datasheet
 376 | https://github.com/shlomihod/cerca
 377 | https://gitlab.com/Mathsoum/abelujo
 378 | https://github.com/NikosVlagoidis/videomaker
 379 | https://github.com/OCHA-DAP/hdx-data-freshness
 380 | https://github.com/PhoenixAlx/VideoNames
 381 | https://github.com/audiolion/das-profiles
 382 | https://github.com/martinyelland/rjvstatus
 383 | https://github.com/Trietptm-on-Security/security-scripts
 384 | https://github.com/nflszyy/tigercinema
 385 | https://github.com/kevjue/reading_comprehension_deep_learning
 386 | https://github.com/Leeps-Lab/otree-core
 387 | https://github.com/coding-blocks/content-downloader
 388 | https://github.com/oliverbhull/dingdongdash
 389 | https://github.com/bayeshack2016/sysj
 390 | https://github.com/ankitPagalGuy/image-classification
 391 | https://github.com/AcamTech/statuspage
 392 | https://github.com/opentargets/phewascatalog_parser
 393 | https://github.com/swaption2009/dlnd_face_generation
 394 | https://github.com/quiltdata/quilt
 395 | https://github.com/yashwanthbabu/whereami
 396 | https://github.com/aseyboldt/dync
 397 | https://github.com/KyleMarMc/social_media_comparison
 398 | https://github.com/BUYMERCIER/instagram-scraper
 399 | https://github.com/amamaenko/defl
 400 | https://github.com/Sudhar287/incubator-singa
 401 | https://github.com/rh-marketingops/dwm
 402 | https://github.com/shaunstanislaus/datasploit
 403 | https://github.com/sschnug/pyannote-video
 404 | https://github.com/MordFee/OCR
 405 | https://github.com/kylerjohnston/dnc-emails
 406 | https://github.com/Miserlou/flask-zappa
 407 | https://github.com/eReuse/workbench
 408 | https://github.com/chamm1028/TwitterTrader
 409 | https://github.com/lacava/few
 410 | https://github.com/ppleskov/instabot
 411 | https://github.com/TadLeonard/tfatool
 412 | https://github.com/iammarvelous/examples
 413 | https://github.com/Teichlab/SpatialDE
 414 | https://github.com/matt-hayden/faceswap
 415 | https://github.com/mfussenegger/cr8
 416 | https://github.com/matt-hayden/VideoClipSplitter
 417 | https://github.com/InnocuousAchilles/misc
 418 | https://github.com/SivyerLab/pyStim
 419 | https://github.com/Sharathnasa/DeepLearningNanoDegreeImageClassification
 420 | https://github.com/awesome-python/Zappa
 421 | https://github.com/antingshen/BeaverDam
 422 | https://github.com/blee-mapr/changeString
 423 | https://github.com/Antman261/Gigger-Webserver
 424 | https://github.com/tellybug/Zappa
 425 | https://github.com/chusine/dlnd
 426 | https://github.com/XENON1T/pax
 427 | https://github.com/jayfk/Zappa
 428 | https://github.com/18F/acquisitions.18f.gov
 429 | https://github.com/ralic/Memo-Utils
 430 | https://github.com/safdark/DL-5-face-generation
 431 | https://github.com/tylerlaberge/Jasper
 432 | https://github.com/interrogator/pollux
 433 | https://github.com/janeen666/mi-instrument
 434 | https://github.com/gwillem/magento-downloader
 435 | https://github.com/buinyi/image-classification-with-CNN
 436 | https://github.com/jason-neal/companion_simulations
 437 | https://github.com/htoyryla/wavenet
 438 | https://github.com/zhwhong/awesome-deep-learning
 439 | https://github.com/mr-ravin/GAN-Face-Generation
 440 | https://github.com/invinst/CPDBv2_backend
 441 | https://github.com/GokuMohandas/Attentional-Interfaces-O-Reilly
 442 | https://github.com/emencia/django-postgrefts
 443 | https://github.com/jekbradbury/examples
 444 | https://github.com/rizafahmi/zappa_playground
 445 | https://github.com/python-dirbtuves/akl.lt
 446 | https://github.com/nromashchenko/amquery
 447 | https://github.com/COMBINE-lab/GRASS
 448 | https://github.com/DiNAi/neon
 449 | https://github.com/pydo/vlc-gif-creator
 450 | https://github.com/aliutkus/commonfate
 451 | https://github.com/OutloudTeam/statuspage
 452 | https://github.com/abrasumente233/manim
 453 | https://github.com/ratson/track-them-all
 454 | https://github.com/Licenser/iocage
 455 | https://github.com/cstatz/desolvex
 456 | https://github.com/TeamHG-Memex/Formasaurus
 457 | https://github.com/dmonn/GAN-face-generator
 458 | https://github.com/dylanthomas/tensorpack
 459 | https://github.com/JarvisFei/my-first-neural-network
 460 | https://github.com/Eudie/Udacity-Deep_Learning_Foundation
 461 | https://github.com/saikatkumardey/MLAlgorithms
 462 | https://github.com/BigBrotherTrade/dashboard
 463 | https://github.com/GIS-FCU/sdi-converter
 464 | https://github.com/mordred-descriptor/mordred
 465 | https://github.com/c0nn3r/jabberwocky
 466 | https://github.com/m3wolf/scimap
 467 | https://github.com/darkarraylord/dlnd_project2_image_classification
 468 | https://github.com/BhargavaRamM/kur
 469 | https://github.com/innovationcolab/statuspage
 470 | https://github.com/Exploit-install/datasploit
 471 | https://github.com/gpantelis/moviepy
 472 | https://github.com/ErillLab/CGB
 473 | https://github.com/MihailoIsakov/love-for-sandwiches
 474 | https://github.com/sdobz/FractalWednesday
 475 | https://github.com/nbigot/rss-scrapper
 476 | https://github.com/julianarhee/morph-pov
 477 | https://github.com/matt-hayden/tagxon
 478 | https://github.com/woshikangfei/image-classification
 479 | https://github.com/Smeb/camino-ml
 480 | https://github.com/shuyl105/2015Spring_InteractivePrototyping_assignment
 481 | https://github.com/phiendp/udacity-face-generation
 482 | https://github.com/mlasy/Machine-Learning-Nanodegree-Udacity
 483 | https://github.com/metrasynth/sunvox-dll-python
 484 | https://github.com/PranavKrishnan/Zappa
 485 | https://github.com/jdcourcol/NeuroM
 486 | https://github.com/MerlinTechnology/lmdo
 487 | https://github.com/GoooQ/Deep-Learning-TensorFlow
 488 | https://github.com/ranjinidas/Axelrod
 489 | https://github.com/kpj/SeqPipe
 490 | https://github.com/MinhwanYu/ED-fakeTextGenerator
 491 | https://github.com/jorgergb/image-classification
 492 | https://github.com/mishin/statuspage
 493 | https://github.com/CCharlieLi/funny_tool
 494 | https://github.com/dhaval17/DS_Store
 495 | https://github.com/gregorynicholas/moviepy
 496 | https://github.com/VEVO/pymaptools
 497 | https://github.com/cameronmaske/Zappa
 498 | https://github.com/pika11/neural-network-face-generation
 499 | https://github.com/yyao007/real-estate-analysis
 500 | https://github.com/urandomio/instagram_auto_accept
 501 | https://github.com/mithron/mgt-routes
 502 | https://github.com/WarrenGreen/Udacity-DL-ImageClassification
 503 | https://github.com/ChangLabUcsf/img_pipe
 504 | https://github.com/indodutch/sim-city-client
 505 | https://github.com/Swarchal/morar
 506 | https://github.com/Elishanto/VK-Word-Cloud
 507 | https://github.com/zivelai/deep-learning
 508 | https://github.com/Kyubyong/speech-to-text-wavenet
 509 | https://github.com/Niklas9/testvibe
 510 | https://github.com/dreness/scrap
 511 | https://github.com/shaunstanislaus/Zappa
 512 | https://github.com/falgore88/grafana-metrics
 513 | https://github.com/kn16h7/PhishingKitHunter
 514 | https://github.com/Trietptm-on-Security/zentral
 515 | https://github.com/davidnuon/moviepy-talk
 516 | https://github.com/ryanfox/retread
 517 | https://github.com/whereskenneth/AssayInterchange
 518 | https://github.com/fluquid/html-to-etree
 519 | https://github.com/oscarbranson/cbsyst
 520 | https://github.com/shaunstanislaus/videogrep
 521 | https://github.com/striblab/instagram_scraper
 522 | https://github.com/projectmesa/mesa
 523 | https://github.com/udacity/aind2-cnn
 524 | https://github.com/ml-lab/DeepLearningImplementations
 525 | https://github.com/yk/tensorpack
 526 | https://github.com/lcbb/pyDAEDALUS
 527 | https://github.com/jshin49/Kaggle-Cat-vs-Dog-Tensorflow-CNN
 528 | https://github.com/Vizzuality/dockerized_jupyters
 529 | https://github.com/ml-lab/attention-transfer
 530 | https://github.com/itmib/memex-pinterest
 531 | https://github.com/tboudreaux/astroSynth
 532 | https://github.com/josephcslater/harmonic_balance
 533 | https://github.com/kevinmel2000/memex-pinterest
 534 | https://github.com/subutai/nupic.research
 535 | https://github.com/ChangLabUcsf/electrode_grid
 536 | https://github.com/sashgorokhov/gmusicsync
 537 | https://github.com/totalgood/nlpia
 538 | https://github.com/juliustip/statuspage
 539 | https://github.com/kmike/morphine
 540 | https://github.com/yurri92/MPLS-inventory-management
 541 | https://github.com/oscarlevin/manim
 542 | https://github.com/ISVWorld/undercrawler
 543 | https://github.com/ve-interactive/Pynexus
 544 | https://github.com/Scitator/TF-seq2seq
 545 | https://github.com/Key-Zone/pyannote-video
 546 | https://github.com/ElaineBao/imagenet
 547 | https://github.com/eldos-dl/Zappa
 548 | https://github.com/fernandezcuesta/t4Monitor
 549 | https://github.com/SANBI-SA/combat_tb_model
 550 | https://github.com/ikhlestov/rbm_based_autoencoders_with_tensorflow
 551 | https://github.com/Anatoly-vivaki1986/ML-Algorithms
 552 | https://github.com/jake-b/icloud_photos_downloader
 553 | https://github.com/pyannote/pyannote-video
 554 | https://github.com/MordFee/Elasticsearch
 555 | https://github.com/ala-aboudib/dlnd_face_generation_proj
 556 | https://github.com/popookitty/IPTV
 557 | https://github.com/openai/baselines
 558 | https://github.com/timofurrer/leaked
 559 | https://github.com/AlexandreDecan/ecos-wea2016
 560 | https://github.com/romovpa/ecmlpkdd2016-otp-bank-upselling
 561 | https://github.com/volans-/cumin
 562 | https://github.com/ChrisYang/pyannote-video
 563 | https://github.com/FakeNewsChallenge/fnc-1-baseline
 564 | https://github.com/DarkVinci/cifar10
 565 | https://github.com/armory-io/winnaker
 566 | https://github.com/mapillary/mapillary_vistas
 567 | https://github.com/blondegeek/MatMethods
 568 | https://github.com/danlegion/intro-to-tensorflow
 569 | https://github.com/kcavagnolo/docker_opt
 570 | https://github.com/JNingWei/Image-Filter
 571 | https://github.com/vcashk/Project5_Face_Recognition
 572 | https://github.com/security-geeks/tweets_analyzer
 573 | https://github.com/limix/glimix-core
 574 | https://github.com/betterenvi/QA-rankit
 575 | https://github.com/EmanAbbas/cdf
 576 | https://github.com/bede/tictax
 577 | https://github.com/sayanarijit/activity
 578 | https://github.com/JaoMarcos/cifar-image-classification
 579 | https://github.com/mariusmagureanu/AutomatorX
 580 | https://github.com/gzlixiaochao/AutomatorX
 581 | https://github.com/jtemporal/jessie
 582 | https://github.com/robertcsapo/cisco-meraki-fw-ap-rules-api
 583 | https://github.com/roebius/deeplearning1_keras2
 584 | https://github.com/futurice/whereareyou
 585 | https://github.com/carlosb1/MLAlgorithms
 586 | https://github.com/erwinfeser/django-cities
 587 | https://github.com/the-winter/spaceapps2017_matches
 588 | https://github.com/my-iPad-air-2/incubator-singa
 589 | https://github.com/Higgins2718/promethea2
 590 | https://github.com/ml-lab/resnet_cnn_mri_adni
 591 | https://github.com/schwa/punic
 592 | https://github.com/yolandawww/QASystem
 593 | https://github.com/EnterStudios/Zappa
 594 | https://github.com/thiagoricieri/image-classification
 595 | https://github.com/iamsteveng/AIND-DogProject
 596 | https://github.com/danielshiferaw/Deep-Learning-Question-Answering-on-SQuAD
 597 | https://github.com/melindadevins/deep-learning
 598 | https://github.com/CryptoConsultants/statuspage
 599 | https://github.com/kuralabs/mivotico-tse2sql
 600 | https://github.com/martinprojectco/statuspage
 601 | https://github.com/whereskenneth/Dwarfsquad
 602 | https://github.com/target/winnaker
 603 | https://github.com/fvisin/main_loop_tf
 604 | https://github.com/dc-geobr/serenata-de-amor
 605 | https://github.com/awesome-python/kur
 606 | https://github.com/jayfk/statuspage
 607 | https://github.com/tsalo/pliers
 608 | https://github.com/mansweet/sklearn-crfsuite
 609 | https://github.com/kratsg/optimization
 610 | https://github.com/JRCSTU/CO2MPAS-TA
 611 | https://github.com/JoostJM/pyradiomics_OLD
 612 | https://github.com/ml-lab/twpca
 613 | https://github.com/tp7309/TTPassGen
 614 | https://github.com/veltzer/pyawskit
 615 | https://github.com/choldgraf/methods_encoding_model
 616 | https://github.com/waseem18/Hacks
 617 | https://github.com/programmingtips/statuspage
 618 | https://github.com/knowsuchagency/nationalinsecurityagency
 619 | https://github.com/ddepaoli3/snapshot-ec2-lambda
 620 | https://github.com/vatlab/SOS
 621 | https://github.com/dvopsway/datasploit
 622 | https://github.com/mgharbi/demosaicnet
 623 | https://github.com/dvu4/DLND-image-classification
 624 | https://gitlab.com/cloudrave/gitlab-project-mover
 625 | https://github.com/rohitit09/collabix2
 626 | https://github.com/softwaremechanic/data-science-utils
 627 | https://github.com/jonathanhfriedman/pymc3
 628 | https://github.com/DroidSky/FreeWifi
 629 | https://github.com/BestSonny/examples
 630 | https://github.com/choltz95/political-scraper
 631 | https://github.com/ukgovdatascience/classifyintents
 632 | https://github.com/courtneysmithcft/Wifi
 633 | https://github.com/bogdan-kulynych/textfool
 634 | https://github.com/smrjan/deep-learning
 635 | https://github.com/raccoongang/edx-analytics-data-api
 636 | https://github.com/eriche2016/pytorch_projects_misc
 637 | https://github.com/zodman/nyaa_indexer
 638 | https://github.com/dferrante/waze
 639 | https://github.com/dailysoap/cs224n
 640 | https://github.com/msankar/convolutionNeuralNetworkProject
 641 | https://github.com/caplincapture/GAN-mnist-celeb
 642 | https://github.com/zhuruihe/generate_face
 643 | https://github.com/VEVO/hidi
 644 | https://github.com/fastforwardlabs/tweetratio
 645 | https://github.com/open-ods/open-ods
 646 | https://github.com/if-then-fund/if.then.fund
 647 | https://github.com/ramalho/tudo-agora
 648 | https://github.com/rafidrm/invo
 649 | https://github.com/davidhsv/deep-learning
 650 | https://github.com/HaraldoFilho/DLND-transfer-learning
 651 | https://github.com/log0ymxm/corgi
 652 | https://github.com/dem-esgal/Deep-Learning-TensorFlow
 653 | https://github.com/TokyoIndex/dog_project
 654 | https://github.com/vnbot2/UdacityCourse
 655 | https://github.com/electronick1/stepist
 656 | https://github.com/TellinaTool/awesome_nmt
 657 | https://github.com/manolo-rocks/django-manolo
 658 | https://github.com/oceanobservatories/mi-instrument
 659 | https://github.com/nkoshell/iss-positioner
 660 | https://github.com/invinst/CPDB
 661 | https://github.com/omaralbeik/dlnd_image_classification
 662 | https://github.com/AAbercrombie0492/satellite_imagery_feature_detection
 663 | https://github.com/bogdal/calibre-books
 664 | https://github.com/lucaskolstad/MLAlgorithms
 665 | https://github.com/udacity/dog-project
 666 | https://github.com/condnsdmatters/archipelago
 667 | https://github.com/jujiGu/Image-Filter
 668 | https://github.com/twocs/kur
 669 | https://github.com/theSage21/rlagents
 670 | https://github.com/MinaRe/DeepLearningImplementations
 671 | https://github.com/Miserlou/django-helloworld
 672 | https://github.com/basveeling/wavenet
 673 | https://github.com/mr-karan/kiteHistory
 674 | https://github.com/sirex/ubuntu.lt
 675 | https://github.com/Jaemu/sound-finder
 676 | https://github.com/4Quant/fauxtograph
 677 | https://github.com/dizcza/GesturesSpeech
 678 | https://github.com/ml-lab/saliency-salgan-2017
 679 | https://github.com/fifthecho/zappa-sanic
 680 | https://github.com/fabiofumarola/face_generator
 681 | https://github.com/JelleAalbers/blueice
 682 | https://github.com/GjjvdBurg/abed
 683 | https://github.com/kallimachos/cookbook
 684 | https://github.com/goaheadxyy/cs224n_2017_final_project
 685 | https://github.com/GapData/MLAlgorithms
 686 | https://github.com/interrogator/tucan
 687 | https://github.com/dssg/pgdedupe
 688 | https://github.com/luisguiserrano/AIND-DL
 689 | https://github.com/t4d/PhishingKitHunter
 690 | https://github.com/cookieshake/daum-news-crawler
 691 | https://github.com/dreadworks/college-cv
 692 | https://github.com/Kazanz/easy-etl
 693 | https://github.com/mo-san/niconico-tools
 694 | https://github.com/ml-lab/dfi-tensorflow
 695 | https://github.com/chuckoy/Zappa-1
 696 | https://github.com/abearman/cs224n-project
 697 | https://github.com/coderdj/emo
 698 | https://github.com/Miserlou/zappa-slack-inviter
 699 | https://github.com/kzjnet/MomentumBackgrounds
 700 | https://github.com/materialsproject/MPContribs
 701 | https://github.com/titouanc/ld2-gpu
 702 | https://github.com/inancgumus/MLAlgorithms
 703 | https://github.com/lukedoolittle/isvcdownloader
 704 | https://github.com/marcusrehm/serenata-de-amor
 705 | https://github.com/kartikT007/Udacity
 706 | https://github.com/rising-turtle/DeepLearning_study
 707 | https://github.com/seecsos/lms
 708 | https://github.com/larahronn/image_classification
 709 | https://github.com/idrdex/star-django
 710 | https://github.com/woaichipinngguo/neupy
 711 | https://github.com/aaront/sunglasses
 712 | https://github.com/MetroTenants/squared_away_reporter
 713 | https://github.com/chrinide/MLAlgorithms
 714 | https://github.com/a19641sk/Twitter-GIF-extractor
 715 | https://github.com/sdandia/implementation-dash
 716 | https://github.com/tinaher522/FakeNewsChallenge
 717 | https://github.com/TeamHG-Memex/memex-pinterest
 718 | https://github.com/Ingener74/Small-Screwdriver
 719 | https://github.com/bogdal/intercity-tickets
 720 | https://github.com/abilian/abilian-core
 721 | https://github.com/blag/django-world-languages
 722 | https://github.com/gazay/mlbootcamp
 723 | https://github.com/freaad/notebooks
 724 | https://github.com/evandrone/Zappa
 725 | https://github.com/huanle543/python2_projects
 726 | https://github.com/ldotlopez/arroyo
 727 | https://github.com/TeechLTD/twitter-bot
 728 | https://github.com/stevenjkern/pymc3
 729 | https://github.com/chanwooyang/Udacity-Deep-Learning
 730 | https://github.com/beelives/Feigong
 731 | https://github.com/johanssk/hpib-dmm-data-logger
 732 | https://github.com/DatapuntAmsterdam/metadata
 733 | https://github.com/mdbloice/Augmentor
 734 | https://github.com/NasaAppChallenge/birdseye-server
 735 | https://bitbucket.org/iskur/vg
 736 | https://github.com/xiaohan2012/snpp
 737 | https://github.com/ogrergo/Summarization
 738 | https://github.com/mohanaravind/Project-5-Face-Generation
 739 | https://github.com/pmlandwehr/cf-farrier
 740 | https://github.com/qiuwch/tensorpack
 741 | https://github.com/rodjun/general_selfdriving_ai
 742 | https://github.com/barentsen/k2-quality-control
 743 | https://github.com/kmike/pymorphy2-dicts
 744 | https://github.com/metrasynth/radiant-voices
 745 | https://github.com/GracelynNewhouse/Udacity-Deep-Learning
 746 | https://github.com/Dispersive-Hydrodynamics-Lab/PACE
 747 | https://github.com/semio/ddf_utils
 748 | https://github.com/MicroServiceProvider/Zappa
 749 | https://github.com/caxenie/MLAlgorithms
 750 | https://github.com/astrocatalogs/astrocats
 751 | https://github.com/hsharrison/tweetstash
 752 | https://github.com/foozzi/linux.org.ru-gallery
 753 | https://github.com/rlnsanz/delft
 754 | https://github.com/B1zzy1/PYoutube
 755 | https://github.com/hiorws/sominer
 756 | https://github.com/vzhong/embeddings
 757 | https://github.com/rayykim/kolibri
 758 | https://github.com/mquezada/ams
 759 | https://github.com/JohnDevitt/cloud_3.0
 760 | https://github.com/pennomi/brimstone-rpg
 761 | https://github.com/therebelbeta/datasploit
 762 | https://github.com/TeamHG-Memex/soft404
 763 | https://github.com/0adbylad/IPTV
 764 | https://github.com/ricardosbarbosa/image-classification
 765 | https://github.com/paulhendricks/example-code
 766 | https://github.com/MingL1989/Image-Filter
 767 | https://github.com/gamealerts/statuspage
 768 | https://github.com/iammrhelo/toneanalyser
 769 | https://github.com/teonite/convnet-filter
 770 | https://github.com/victoriaaoka/bc-16-Twitter-Sentiment-Analysis-
 771 | https://github.com/JelleAalbers/plunc
 772 | https://github.com/Datalker/DLND-Udacity
 773 | https://github.com/DatapuntAmsterdam/nap_meetbouten
 774 | https://github.com/deepgram/kur
 775 | https://github.com/Netherdrake/steemtools
 776 | https://github.com/immersinn/ncga
 777 | https://github.com/jadebayo/deep-learning-foundations
 778 | https://github.com/HenryGessau/HgUtils
 779 | https://github.com/edgarriba/examples
 780 | https://github.com/mlesfield/biorep-etl
 781 | https://github.com/Cloud-CV/visual-chatbot
 782 | https://github.com/lishouguang/MLAlgorithms
 783 | https://github.com/ConsenSys/pycaptureth
 784 | https://github.com/mynameisfiber/lpocolypse
 785 | https://github.com/fluentpython/notebooks
 786 | https://github.com/NervanaSystems/ngraph
 787 | https://github.com/theotheo/couchsurfing-scraper
 788 | https://github.com/jcode89/DataDotPy
 789 | https://github.com/antiboredom/popcorn-exporter
 790 | https://github.com/Higgins2718/promethea5
 791 | https://github.com/dnlcrl/PyFunt
 792 | https://github.com/Netflix/repokid
 793 | https://github.com/GeorgeWang1994/PiperMarkdown
 794 | https://github.com/EdwardBetts/undercrawler
 795 | https://github.com/SBRG/ssbio
 796 | https://github.com/PythonForensics/Learning-Python-for-Forensics
 797 | https://github.com/thrabchak/Udacity-Data-Analysis
 798 | https://github.com/torrance/sorcerer
 799 | https://github.com/mikethebeer/cr8
 800 | https://github.com/pmlandwehr/tick-my-feedstocks
 801 | https://github.com/vkhokhla/pymc3
 802 | https://github.com/russon77/off-the-beaten-path-backend
 803 | https://github.com/charx0r/formasaurus
 804 | https://github.com/SidHeg/practice
 805 | https://github.com/HackTheDinos/Pyard-Bone-Scripts
 806 | https://github.com/veltzer/pycmdtools
 807 | https://github.com/ganguli-lab/twpca
 808 | https://github.com/ErickDiaz/word2vec_embeddings
 809 | https://github.com/chenmingxiang110/cs224_reconstruction
 810 | https://github.com/dennisjay/dlnd-face-generation
 811 | https://github.com/ilogik/s3du
 812 | https://github.com/otterlogic/dj-stripe
 813 | https://github.com/Code4HR/NN-city-scraper
 814 | https://github.com/ungarj/mapchete
 815 | https://github.com/tttthomasssss/wort
 816 | https://github.com/dhiana/pretty_tsne
 817 | https://github.com/dssg/johnson-county-ddj-public
 818 | https://github.com/richiverse/Zappa
 819 | https://github.com/cthorey/AGU_Data
 820 | https://github.com/casperdcl/simple-customized-crawler
 821 | https://github.com/tonal/bottle-pymysql
 822 | https://github.com/HongSeokHwan/salt
 823 | https://github.com/coursera/courseraresearchexports
 824 | https://github.com/chenyuntc/examples
 825 | https://github.com/mikesj-public/dcgan-autoencoder
 826 | https://github.com/cphyc/adsquery
 827 | https://github.com/chaoxxxu/AutomatorX
 828 | https://github.com/nclouds/pager-reports
 829 | https://github.com/JulianKahnert/classification
 830 | https://github.com/JulianYG/224nfinalproject
 831 | https://github.com/jedie/PyHardLinkBackup
 832 | https://github.com/MrSaad/signet
 833 | https://github.com/JasonAHeron/RedditBot
 834 | https://github.com/YukiSakai1209/tpot
 835 | https://github.com/NORCatUofC/zappa_watson_wrapper
 836 | https://github.com/rhiever/tpot
 837 | https://github.com/silky/videogrep
 838 | https://github.com/watrool/dog_breed_dectetor
 839 | https://github.com/ashoeb81/DLND-Project-5-Solution
 840 | https://github.com/fact-project/darkspot
 841 | https://github.com/Qbitus/serverless-imagehost
 842 | https://github.com/ChangLabUcsf/intonatang
 843 | https://github.com/xibinyue/examples
 844 | https://github.com/cmward/text-scene
 845 | https://github.com/purrcat259/twitch-statistics
 846 | https://github.com/mynameisfiber/word2vec_debias
 847 | https://github.com/ludwiktrammer/deep-learning
 848 | https://github.com/ankitmathur3193/song-cli
 849 | https://github.com/iammrhelo/edgar-10k-sa
 850 | https://github.com/futurever/MLAlgorithms
 851 | https://github.com/MontrealCorpusTools/Montreal-Forced-Aligner
 852 | https://github.com/ChunfangWang/TravisCaffeTest
 853 | https://github.com/Pirate-Crew/IPTV
 854 | https://github.com/renjithsraj/whereami
 855 | https://github.com/BlueBrain/NeuroM
 856 | https://github.com/peterspackman/hstools
 857 | https://github.com/farukrahmet/vikipedia
 858 | https://github.com/wengole/eveonline-assistant
 859 | https://github.com/NeverDoubtTheWorm/Face-Generation-nd101
 860 | https://github.com/virantha/photokeeper
 861 | https://github.com/nitarshan/variational-autoencoder
 862 | https://github.com/johannesgiorgis/deep_learning
 863 | https://github.com/stefanfoulis/timelapse-manager
 864 | https://github.com/Miiha/FilmAnalyzerKit
 865 | https://github.com/jensfinnas/ktweb-scraper
 866 | https://github.com/limix/optimix
 867 | https://github.com/ami-GS/ngraph
 868 | https://github.com/davedoesdev/dxf
 869 | https://github.com/smrjan/machine-learning
 870 | https://github.com/nprapps/mapturner
 871 | https://github.com/dhruvraj-singh-rawat/face-generation
 872 | https://github.com/physion/osl-delivery
 873 | https://github.com/GlaciumVulpes/face_generation
 874 | https://github.com/blezek/pyradiomics
 875 | https://github.com/lukeyeager/pytorch-examples
 876 | https://github.com/nims11/animemon
 877 | https://github.com/VonStruddle/PyHunter
 878 | https://github.com/emanuelfeld/poirot
 879 | https://github.com/minhoolee/Synopsys-Project-2017
 880 | https://github.com/psobot/SampleScanner
 881 | https://github.com/Vasuji/deep-learning
 882 | https://gitlab.com/virtualtam/abelujo
 883 | https://github.com/jind11/SQuAD-QA-System
 884 | https://github.com/followloda/example-code
 885 | https://github.com/JanVan01/sentinel1_s3_ingestor
 886 | https://github.com/aldilaff/reversegifsbot
 887 | https://github.com/ltfschoen/content-downloader
 888 | https://github.com/sentinelsat/sentinelsat
 889 | https://github.com/TrinityComputers/Formasaurus
 890 | https://github.com/PuchatekwSzortach/printed_characters_net
 891 | https://github.com/lepisma/mpm
 892 | https://github.com/aboucaud/adcf
 893 | https://github.com/beaukams/content-downloader
 894 | https://github.com/matheuslrsouza/deep-learning
 895 | https://github.com/paulhendricks/notebooks
 896 | https://github.com/tperol/ConvNetQuake
 897 | https://github.com/robeceiro/aind2-dog-project
 898 | https://github.com/AlexandreDecan/ecos-SANER2017
 899 | https://github.com/Statflo/statuspage
 900 | https://github.com/RustyHoff/CGC-Bookmark-Downloader
 901 | https://github.com/cmarkello/toil-scripts
 902 | https://github.com/ebigelow/detect-relationships
 903 | https://github.com/samm81/ut-nutrition
 904 | https://github.com/Cranial-XIX/VAE-for-Image-Completion
 905 | https://github.com/tyler-romero/squad-reading-comprehension
 906 | https://github.com/ml-lab/BeaverDam
 907 | https://github.com/mrMarcosss/comarket
 908 | https://github.com/pabloazevedo/DeepBach
 909 | https://github.com/esuteau/gan_face_generation
 910 | https://github.com/margaret/seam-carver
 911 | https://github.com/digris/openbroadcast.org
 912 | https://github.com/QuincyLarson/FreeWifi
 913 | https://github.com/pymc-devs/pymc3
 914 | https://github.com/nagappankv/dlnd-project2
 915 | https://github.com/regeirk/pycwt
 916 | https://github.com/rolando-archive/undercrawler
 917 | https://github.com/chenwardT/lol_stats2
 918 | https://github.com/SeMeKh/sharif_cn_pa_evaluator
 919 | https://github.com/KevBrewt/Geospatial-Vision-and-Visualization
 920 | https://github.com/luivilella/simpleminer
 921 | https://github.com/Shmuma/rl
 922 | https://github.com/aschampion/diluvian
 923 | https://github.com/SANBI-SA/tb2neo
 924 | https://github.com/DatapuntAmsterdam/bbga
 925 | https://github.com/Armax/IPTV
 926 | https://github.com/tokestermw/text-gan-tensorflow
 927 | https://github.com/attributedata/quilt
 928 | https://github.com/knowledgewarrior/zeroclickinfo-fathead
 929 | https://github.com/nelson-liu/paraphrase-id-tensorflow
 930 | https://github.com/jkarimi91/cliggle
 931 | https://github.com/rladeira/mltils
 932 | https://github.com/nschloe/betterbib
 933 | https://github.com/sarath-hotspot/udacity-project-5-face-generation
 934 | https://github.com/AlexisEidelman/tpot
 935 | https://github.com/pypa/twine
 936 | https://github.com/jocephus/datasploit
 937 | https://github.com/beshrkayali/gifbook
 938 | https://github.com/WesleyDevLab/videoSpider
 939 | https://github.com/zhangxulong/baseZhang
 940 | https://github.com/lukashh7/ids-network-simulator
 941 | https://github.com/Zulko/moviepy
 942 | https://github.com/datadesk/congress-headshots-lambda
 943 | https://github.com/PlamenStilyianov/Python3
 944 | https://github.com/dezede/dezede
 945 | https://github.com/kotarohara/SidewalkMask
 946 | https://github.com/achim1/pyevsel
 947 | https://github.com/Cyberfreakier/uda_image_classification
 948 | https://github.com/ml-lab/fauxtograph
 949 | https://github.com/uwdb/istc_oceanography
 950 | https://github.com/sasha42/Mailchimp-utility
 951 | https://github.com/devendrasr/MLAlgorithms
 952 | https://github.com/pfultz2/shake-pm
 953 | https://github.com/NeverDoubtTheWorm/Deep-Learning-Nanodegree-nd101
 954 | https://github.com/kwameboame/speech-to-text-wavenet
 955 | https://github.com/Teichlab/readquant
 956 | https://github.com/rasbt/MLAlgorithms
 957 | https://github.com/xeroc/uptick
 958 | https://github.com/nandakishorkoka/deep-learning-nd
 959 | https://github.com/lnchpd/udacity_dl
 960 | https://github.com/slippers/py-flask-jsontools
 961 | https://github.com/ShiftCtrlGroup/tweets_analyzer
 962 | https://github.com/tjacobs/baselines
 963 | https://github.com/qbicsoftware/dync
 964 | https://github.com/geggiot/IPTV
 965 | https://github.com/ropable/prs
 966 | https://github.com/meranaamjoker/deep-learning
 967 | https://github.com/crate/crate
 968 | https://github.com/finzellt/novae
 969 | https://github.com/CasAndreu/rlda
 970 | https://github.com/MichaelFeng87/deconvfaces
 971 | https://github.com/AjayTalati/piGAN
 972 | https://github.com/liuzard/Deep-Learning-TensorFlow
 973 | https://github.com/modsim/mycelyso
 974 | https://github.com/VonRosenchild/tsfresh
 975 | https://github.com/nackjicholson/ergast-python
 976 | https://github.com/jni/skan
 977 | https://github.com/lopuhin/kaggle-dstl
 978 | https://github.com/markiett/deep-learning
 979 | https://github.com/stradigilabs/fnc-1
 980 | https://github.com/Samurais/DeepQA2
 981 | https://github.com/amaiasalvador/imcap_keras
 982 | https://github.com/rfzabick/datasploit
 983 | https://github.com/pycomlink/pycomlink
 984 | https://github.com/kklw/example-code
 985 | https://github.com/TAMU-CPT/galaxy-workflows
 986 | https://github.com/Sardhendu/pymc3
 987 | https://github.com/ojengwa/statuspage
 988 | https://github.com/sanghack81/pyKCIPT
 989 | https://github.com/Hironsan/natural-language-preprocessings
 990 | https://github.com/liqd/django_zbp
 991 | https://github.com/rolando/databrewer
 992 | https://github.com/ktosiu/python-pool-performance
 993 | https://github.com/hongj77/DeepLearningGameAI
 994 | https://github.com/kounoike/comskip_to_html
 995 | https://github.com/qntcat/tensorpack
 996 | https://github.com/elebumm/HowItsMadeBot
 997 | https://github.com/wanjinchang/PyFunt
 998 | https://github.com/carlosdanielcsantos/visire
 999 | https://github.com/sbartek/tf-image-classification
1000 | https://github.com/scitran/python-client
1001 | https://github.com/gabrielStanovsky/unified-factuality
1002 | https://github.com/eddieantonio/judging-commits
1003 | https://github.com/pratimaupadhyay02/serverless-slack-bot
1004 | https://github.com/pedroabg/dlnd
1005 | https://github.com/craigcabrey/academify
1006 | https://github.com/fusioneng/gif2html5-app
1007 | https://github.com/justmeshishir/orchestrate-ai
1008 | https://github.com/patrickvossler18/cglp_project
1009 | https://github.com/ml-ai-nlp-ir/keras-tqdm
1010 | https://gitlab.com/holyox/malayalam-OCR
1011 | https://github.com/erictzeng/adda
1012 | https://github.com/koyo922/deep-learning
1013 | https://github.com/phdkiran/deeplearning-floyd
1014 | https://github.com/mikebarile/image-classifier
1015 | https://github.com/andresriancho/pico-string-compare-local
1016 | https://github.com/techorilla/tradlytics-backend
1017 | https://github.com/ErmiyaEskandary/instabot
1018 | https://github.com/ojosdegris/Zappa
1019 | https://github.com/MohanL/MLAlgorithms
1020 | https://github.com/littlezz/island-backup
1021 | https://github.com/themantalope/maakclusterutils
1022 | https://github.com/sailist/manim
1023 | https://github.com/maplewizard/examples
1024 | https://github.com/SenorPez/project-cars-replay-enhancer
1025 | https://github.com/jt6211/deep-learning
1026 | https://github.com/eerwitt/tensorflow-csv-to-api
1027 | https://github.com/monfera/ecogtools
1028 | https://github.com/LewisMM/django-zappa
1029 | https://github.com/trivago/Protector
1030 | https://github.com/martyni/boop
1031 | https://github.com/anuragaryan/tweets_analyzer
1032 | https://github.com/justin8/video_utils
1033 | https://github.com/linxinzhe/deep-learning
1034 | https://github.com/a568066242/MLAlgorithms
1035 | https://github.com/Trietptm-on-Security/tweets_analyzer
1036 | https://github.com/psaintlaurent/MongoBot
1037 | https://github.com/pathcl/example-code
1038 | https://github.com/scottquiring/Udacity_Deeplearning
1039 | https://github.com/notnami/annotate
1040 | https://github.com/alajara/Axelrod
1041 | https://github.com/GapData/pymc3
1042 | https://github.com/aurelius23/deep-learning
1043 | https://github.com/jacebrowning/yorm
1044 | https://github.com/WebarchivCZ/WA-KAT
1045 | https://github.com/intelradoux/gravitee-docker
1046 | https://github.com/egidijukas/udacity-nanodegree-deeplearing
1047 | https://github.com/emabishi/bc-7-Quiz-Application
1048 | https://github.com/LaurentDumont/eve_skillbook_trading
1049 | https://github.com/mc706/webmon
1050 | https://github.com/fw1121/whereami
1051 | https://github.com/vsumanbabu/DeepLearning-ImageClassification
1052 | https://github.com/openEduConnect/eduextractor
1053 | https://github.com/pyupio/github-requirements
1054 | https://github.com/syphon7/Zappa
1055 | https://github.com/sdy8181/AutomatorX
1056 | https://github.com/Chadys/Axelrod
1057 | https://github.com/AlbericC/comics-downloader
1058 | https://github.com/yunify/qsctl
1059 | https://github.com/maplet/pyMap
1060 | https://github.com/4Quant/pyradiomics
1061 | https://github.com/noootown/Forex-DQN
1062 | https://gitlab.com/arkingupta/kolibri
1063 | https://github.com/changbindu/rufeng-finance
1064 | https://github.com/marketmuse/word2vec-api
1065 | https://github.com/EnriqueCornejo/rasdatools
1066 | https://github.com/dpshelio/busfactor
1067 | https://github.com/sharsque/code-mixing-social-media
1068 | https://github.com/lsls01/Udacity_Deep_Learning_Foundation_Projects
1069 | https://github.com/IS-ENES-Data/esgf-prepare
1070 | https://github.com/welchbj/tt
1071 | https://github.com/pkumusic/E-DRL
1072 | https://github.com/ternaus/kaggle_dstl_submission
1073 | https://github.com/markusodenthal/image_classification
1074 | https://github.com/xeng1/ytdl
1075 | https://github.com/thenewinquiry/conspiracy
1076 | https://github.com/msttyy/AutomatorX
1077 | https://github.com/mbrner/taco_salad
1078 | https://github.com/sdtm1016/rbtools
1079 | https://github.com/DatapuntAmsterdam/atlas_milieuthemas
1080 | https://github.com/nkpanda/datasploit
1081 | https://github.com/lirantal/statuspage
1082 | https://github.com/rarcega/instagram-scraper
1083 | https://github.com/amarder/fuzz
1084 | https://github.com/austinvernsonger/statuspage
1085 | https://github.com/pirate/whereami
1086 | https://github.com/SonyCSL-Paris/DeepBach
1087 | https://github.com/Data-Mechanics/geoql
1088 | https://github.com/nuncjo/comicthief
1089 | https://github.com/freedomofpress/fingerprint-securedrop
1090 | https://github.com/imankulov/pyconru2014
1091 | https://gitlab.com/MarSoft/ebayhistory
1092 | https://github.com/SANBI-SA/tree2neo
1093 | https://github.com/ypwhs/CarND-TensorFlow-L2
1094 | https://github.com/ALISCIFP/tensorpack
1095 | https://github.com/ColCarroll/email_fetcher
1096 | https://github.com/18F/acqstackdb
1097 | https://github.com/sethlivingston/django-amptags
1098 | https://github.com/sirex/databot
1099 | https://github.com/18965050/fluent-python
1100 | https://github.com/beeftornado/duplicate-image-finder
1101 | https://github.com/wkentaro/fcn
1102 | https://github.com/sautumn/HealthScoreScraper
1103 | https://github.com/LeeKyungMoon/Judging-a-Book-by-its-Cover
1104 | https://github.com/xeroc/bitshares-pricefeed
1105 | https://github.com/iCHAIT/moviemon
1106 | https://github.com/codeforberlin/trees-api
1107 | https://github.com/dkatz24/DLND
1108 | https://github.com/Plushkin/instabot
1109 | https://github.com/dantasse/nghd_scraper
1110 | https://github.com/trenton3983/Fluent_Python
1111 | https://github.com/mateuszmrozewski/nd101_project_5
1112 | https://github.com/Data-Mechanics/bps-simulated-data
1113 | https://bitbucket.org/bgframework/bgparsers
1114 | https://github.com/ml-lab/unrolled_gan
1115 | https://github.com/Smerity/examples
1116 | https://github.com/tomzhang/gransk
1117 | https://github.com/subodh-malgonde/serverless-slack-bot
1118 | https://github.com/coopie/speech_ml
1119 | https://github.com/agileronin/skills-api
1120 | https://github.com/AlexEntersis/Grabber
1121 | https://github.com/fossasia/parliament-scaper
1122 | https://github.com/welchr/swiss
1123 | https://github.com/m3brown/giffer
1124 | https://github.com/synapsemx/statuspage
1125 | https://github.com/SCORE42/django-page-cms
1126 | https://github.com/DjedStudios/robobadger
1127 | https://github.com/jiasir/playback
1128 | https://github.com/gcarq/keras-timeseries-prediction
1129 | https://github.com/CiwPython/Ciw
1130 | https://github.com/sirsleepy93/DeepLearningProject5
1131 | https://github.com/Parsonswlu/dog-project
1132 | https://github.com/icoxfog417/mlimages
1133 | https://github.com/thaihust/MLAlgorithms
1134 | https://github.com/TeamHG-Memex/sklearn-crfsuite
1135 | https://github.com/hackingmaterials/atomate
1136 | https://github.com/AllenDowney/fluent-python-notebooks
1137 | https://github.com/tessazglue/whereami
1138 | https://github.com/tranquilo12/kli
1139 | https://github.com/pathcl/notebooks-1
1140 | https://github.com/mrpau-eduard/kolibri
1141 | https://github.com/brandonxiang/pyMap
1142 | https://github.com/natoromano/nupic.research
1143 | https://github.com/cbaziotis/ekphrasis
1144 | https://github.com/abilian/abilian-crm-core
1145 | https://github.com/algo-holic/MLAlgorithms
1146 | https://github.com/pratyakshs/reading-comprehension
1147 | https://github.com/CrazyFork/MLAlgorithms
1148 | https://github.com/bogdal/freepacktbook
1149 | https://github.com/andymarthin/facebook-page-album-downloader
1150 | https://github.com/tudo-astroparticlephysics/pydisteval
1151 | https://github.com/Nozdi/masters
1152 | https://github.com/shmsw25/bi-att-flow
1153 | https://gitlab.com/willzfarmer/scribe
1154 | https://github.com/Nikoleta-v3/Axelrod
1155 | https://github.com/trung-gm/deep-learning
1156 | https://github.com/PorscheLauren/tweets_analyzer
1157 | https://github.com/SooluThomas/Auro
1158 | https://github.com/winpraneeth/image-classification
1159 | https://github.com/harikishen/whereami
1160 | https://github.com/ndeepesh/Udacity-DLND
1161 | https://github.com/MikeDacre/LDDirection
1162 | https://github.com/justin8/tv_report
1163 | https://gitlab.com/aseyfarth/intervallic
1164 | https://github.com/regata/ml-experiments
1165 | https://github.com/lukevs/dtm
1166 | https://github.com/CMPUT404-Fall2016/cmput404-project
1167 | https://github.com/Macielyoung/MLAlgorithms
1168 | https://github.com/yiweishe/cs224n
1169 | https://github.com/10eTechnology/Zappa
1170 | https://github.com/sdux/UDACITY_AI_FOUNDATIONS_DCGAN
1171 | https://github.com/tunnell/wimpstat
1172 | https://github.com/AnthonyBloomer/daftlistings
1173 | https://github.com/c22/smart-api-translator
1174 | https://github.com/Netflix-Skunkworks/aardvark
1175 | https://github.com/DCCouncil/dc-law-tools
1176 | https://github.com/bjmayor/Zappa
1177 | https://github.com/willzfarmer/Python-LSA
1178 | https://github.com/zhenghuangcheng/ML_Algorithms
1179 | https://github.com/tanakatsu/udacity-dlnd-project5-face-generation
1180 | https://github.com/hershedtilak/CS224N
1181 | https://github.com/CyberScions/enumXFF
1182 | https://github.com/explosion/thinc
1183 | https://github.com/dieterich-lab/rp-bp
1184 | https://github.com/jiekebo/housing
1185 | https://github.com/JohnStarich/python-pool-performance
1186 | https://github.com/gerberlab/mitre
1187 | https://github.com/ralph-group/mucloud
1188 | https://github.com/faroit/dsdtools
1189 | https://github.com/mennthor/dotfiles
1190 | https://github.com/cwwwu/udacity-dlnd-projects
1191 | https://github.com/UW-Macrostrat/stromatolites_demo
1192 | https://github.com/localhuman/django-page-cms
1193 | https://github.com/opengridcc/opengrid
1194 | https://github.com/hack-c/cartoonsearch
1195 | https://github.com/jotes/ohtravis
1196 | https://github.com/alexrudy/ClapBot
1197 | https://github.com/tombosc/dict_based_learning
1198 | https://github.com/pdwyys20/cn-deep-learning
1199 | https://github.com/changun/miso_crawldb
1200 | https://github.com/romkof/face_generation
1201 | https://github.com/CloudNuts/Zappa
1202 | https://github.com/TechnicalBro/minecraft-plugin-resolver
1203 | https://github.com/ChezTone/gravitee-docker
1204 | https://github.com/linboqiao/MLAlgorithms
1205 | https://github.com/nickcannariato/tx_lobbying
1206 | https://github.com/datoszs/the-constitutional-court-
1207 | https://github.com/kingmray/franz_mosaic
1208 | https://github.com/astronautskaspars/videogrep
1209 | https://github.com/thisiskeithkwan/image-classification
1210 | https://github.com/No9/iocage
1211 | https://github.com/bgirardeau/securepair
1212 | https://github.com/kz26/dottorrent
1213 | https://github.com/etherealmachine/otree-core
1214 | https://github.com/xysense/BeaverDam
1215 | https://github.com/cgc/rnd
1216 | https://github.com/sheroze1123/ppm
1217 | https://github.com/project-fifo/iocage
1218 | https://github.com/arhik/nupic.research
1219 | https://github.com/sigma-geosistemas/django-cities
1220 | https://github.com/interpretation-experiment/seeds
1221 | https://github.com/nicolehe/the-best-art
1222 | https://github.com/hiteshvaidya/dcgan-autoencoder
1223 | https://github.com/ZhaoJ9014/One-Hundred-Layers-Tiramisu
1224 | https://github.com/mcrowson/rickastley
1225 | https://github.com/JackMc/xkcdscrape
1226 | https://github.com/neocsr/vehicle-detection
1227 | https://github.com/DataSploit/datasploit
1228 | https://github.com/mmmdamin/MIR-crawler
1229 | https://github.com/danielballan/photomosaic
1230 | https://github.com/pallamidessi/pinyin-subtitle
1231 | https://github.com/dmadan86/MLAlgorithms
1232 | https://github.com/sxfmol/example-code
1233 | https://github.com/statgen/pheweb
1234 | https://github.com/MIREL-UNC/echr_dataset
1235 | https://github.com/diogocp/stacktrends
1236 | https://github.com/infosec-au/enumXFF
1237 | https://github.com/pookie9/224NProj
1238 | https://github.com/FordyceLab/geppetto-cli
1239 | https://github.com/hackingmaterials/matminer
1240 | https://github.com/olety/FBD
1241 | https://github.com/kirtanechiron/faceGAN
1242 | https://github.com/mynameisfiber/contribution_votes
1243 | https://github.com/macarthur-lab/gnomad_browser
1244 | https://github.com/HvyD/AIND2-Dog_Project
1245 | https://github.com/narfman0/cookiecutter-mobile-backend
1246 | https://github.com/gamenet/redis-memory-analyzer
1247 | https://github.com/Laurian/popcorn-exporter
1248 | https://github.com/forallsystems/hipc_ccol_sms
1249 | https://github.com/rosenbrockc/fortpy
1250 | https://github.com/southwestjiaotongunivercity/example-code
1251 | https://github.com/314Tech/image-classification
1252 | https://github.com/coderholic/django-cities
1253 | https://github.com/batiste/django-page-cms
1254 | https://github.com/mattberjon/image-classification
1255 | https://github.com/indirectlylit/kolibri
1256 | https://github.com/mesutcan/MLAlgorithms
1257 | https://github.com/bobbyesh/readable
1258 | https://github.com/tybulewicz/illacceptanything
1259 | https://github.com/putmantime/wikigenomes_version2
1260 | https://github.com/Rob-M-F/transfer-learning
1261 | https://github.com/staticor/MLAlgorithms
1262 | https://github.com/yangtuocn/TweetAdventure
1263 | https://github.com/PsyBorgs/redditanalyser
1264 | https://github.com/zackchase/beermind
1265 | https://github.com/pereval-team/datasploit
1266 | https://github.com/sheuan/deep-learning
1267 | https://github.com/learningsociety/deepmodels
1268 | https://github.com/danieljl/aind-dog-project
1269 | https://github.com/SBUtltmedia/postreq-python-scrape
1270 | https://github.com/systemtrader/pymc3
1271 | https://github.com/dan0712/skills-api
1272 | https://github.com/copotron/SDC-P5
1273 | https://github.com/simeks/homo-horreum
1274 | https://github.com/dizballanze/do-latency
1275 | https://github.com/webeng/bi-att-flow
1276 | https://github.com/mikeliturbe/bizkaiko-etxeak
1277 | https://github.com/crakama/tweetAnalysis
1278 | https://github.com/hdatteln/neural_networks
1279 | https://github.com/nestauk/gtr_analysis
1280 | https://github.com/Miserlou/zappa-website
1281 | https://github.com/philip-bl/libcrap
1282 | https://github.com/vishnumani2009/fnc-1-baseline
1283 | https://github.com/FordyceLab/ChIPShOT
1284 | 


--------------------------------------------------------------------------------
/snippet_ranger/librariesio_fetcher.py:
--------------------------------------------------------------------------------
  1 | import json
  2 | import logging
  3 | import os
  4 | 
  5 | import pandas as pd
  6 | 
  7 | from ast2vec.pickleable_logger import PickleableLogger
  8 | from modelforge.progress_bar import progress_bar
  9 | 
# File names of the Libraries.io dump tables; they are joined with the dataset folder path.
# Repository dependencies table, read chunk by chunk in LibrariesIOFetcher.get_dependent_reps.
dependencies_filename = "repository_dependencies-1.0.0-2017-06-15.csv"
# NOTE(review): not referenced in the visible part of this module - confirm it is used elsewhere.
repos_filename = "repositories-1.0.0-2017-06-15.csv"
# Projects (libraries) table, read chunk by chunk in LibrariesIOFetcher.get_lib_info.
projects_filename = "projects-1.0.0-2017-06-15.csv"
 13 | 
 14 | 
 15 | class LibrariesIOFetcher(PickleableLogger):
 16 |     """
 17 |     Class to get useful information from Libraries.io dataset.
 18 | 
 19 |     It is used to get list of repositories which use specified libraries.
 20 |     It runs following pipeline (get_dependent_rep_urls function).
 21 |     1. Get information about libraries.
 22 |     2. Get information about repositories that depend on libraries.
 23 |     3. Create and save links to this repositories.
 24 |     """
 25 | 
 26 |     DEFAULT_PLATFORM = "Pypi"
 27 |     CHUNKSIZE = 1000000
 28 |     HOST2LINK = {"GitHub": "github.com/",
 29 |                  "GitLab": "gitlab.com/",
 30 |                  "Bitbucket": "bitbucket.org/"}
 31 | 
 32 |     def __init__(self, librariesio_path, log_level=logging.INFO):
 33 |         """
 34 |         :param librariesio_path: Path to a folder where librariesio dataset is stored.
 35 |         :param log_level: log level of current class.
 36 |         """
 37 |         super(LibrariesIOFetcher, self).__init__(log_level=log_level)
 38 |         self._librariesio_path = librariesio_path
 39 | 
 40 |     def get_lib_info(self, libraries, platform, save_to=None):
 41 |         """
 42 |         Creates pandas dataframe with information about libraries from specified platform
 43 |         from Libraries.io.
 44 | 
 45 |         :param libraries: Dict of names and urls to repo or homepage. You can use empty url if \
 46 |             you are not sure about the link.
 47 |         :param platform: Package platform where the library is published. You can use empty \
 48 |             platform if you are not sure about a link.
 49 |         :param save_to: Path to save pandas dataframe with all information about libraries
 50 |         :return: Pandas dataframe with all information about libraries.
 51 |         """
 52 | 
 53 |         libs_info = pd.DataFrame()
 54 |         projects_path = os.path.join(self._librariesio_path, projects_filename)
 55 |         self._log.info("Looking for libraries info...")
 56 |         for chunk in pd.read_csv(projects_path, chunksize=LibrariesIOFetcher.CHUNKSIZE,
 57 |                                  index_col=False, dtype=object):
 58 |             for lib_name in libraries:
 59 |                 indexes = (chunk["Name"] == lib_name)
 60 |                 if platform != "":
 61 |                     indexes = indexes & (chunk["Platform"] == platform)
 62 |                 if libraries[lib_name] != "":
 63 |                     indexes = indexes & ((chunk["Repository URL"] == libraries[lib_name]) |
 64 |                                          pd.isnull(chunk["Repository URL"]))
 65 |                     res = chunk[indexes]
 66 |                     if len(res) > 0:
 67 |                         self._log.info("%s library entry is found!", lib_name)
 68 |                     libs_info = pd.concat([libs_info, res])
 69 |                     if save_to:
 70 |                         libs_info.to_csv(save_to, index=False)
 71 | 
 72 |         return libs_info
 73 | 
 74 |     def get_dependent_reps(self, libs_info, save_to=None):
 75 |         """
 76 |         Creates pandas dataframe with all information about dependent repositories from libraries.
 77 | 
 78 |         :param libs_info: Pandas dataframe with all information about libraries.
 79 |         :param save_to: Path to save pandas dataframe with all information about libraries if you \
 80 |             want to save it.
 81 |         :return: Pandas dataframe with all information about dependent repositories.
 82 |         """
 83 |         self._log.info("Creating list of dependent repos...")
 84 |         if hasattr(libs_info["ID"], "tolist"):
 85 |             lib_id2name = dict(zip(libs_info["ID"].tolist(), libs_info["Name"].tolist()))
 86 |         else:
 87 |             lib_id2name = {libs_info["ID"]: libs_info["Name"]}
 88 |         pd_result = []
 89 |         dependencies_path = os.path.join(self._librariesio_path, dependencies_filename)
 90 |         for chunk in progress_bar(pd.read_csv(dependencies_path,
 91 |                                               chunksize=LibrariesIOFetcher.CHUNKSIZE,
 92 |                                               index_col=False), self._log, expected_size=100):
 93 |             for lib_id in lib_id2name:
 94 |                 res = chunk[chunk["Dependency Project ID"] == int(lib_id)]
 95 |                 if len(res) > 0:
 96 |                     pd_result.append(res)
 97 | 
 98 |         pd_result = pd.concat(pd_result)
 99 |         pd_result["url"] = "https://" + \
100 |                            pd_result["Host Type"].map(LibrariesIOFetcher.HOST2LINK) + \
101 |                            pd_result["Repository Name with Owner"]
102 |         if save_to:
103 |             pd_result.to_csv(save_to, index=False)
104 | 
105 |         return pd_result
106 | 
107 |     def save_urls_only(self, dependent_reps, libs_info, save_to):
108 |         """
109 |         Create urls for repositories from dependent_reps for libraries from libs_info.
110 | 
111 |         :param dependent_reps: Pandas dataframe with information about dependent repositories \
112 |             from libraries in libs_info dataframe.
113 |         :param libs_info: Pandas dataframe with all information about libraries.
114 |         :param save_to: Save location for urls. Specify folder if you have several libraries. \
115 |             Then urls will be stored in the file <library name>.txt . You can specify file, then
116 |             all urls will be saved in one file.
117 |         """
118 |         if not os.path.isdir(save_to) and os.path.exists(save_to):
119 |             os.remove(save_to)
120 |         for i, lib in libs_info.iterrows():
121 |             lib_id = int(lib["ID"])
122 |             lib_name = lib["Name"]
123 |             cur_dependent_reps = dependent_reps[dependent_reps["Dependency Project ID"] == lib_id]
124 |             res = cur_dependent_reps["url"].tolist()
125 |             res = list(set(res))
126 | 
127 |             if os.path.isdir(save_to):
128 |                 save_path = os.path.join(save_to, lib_name + ".txt")
129 |             else:
130 |                 save_path = save_to
131 | 
132 |             with open(save_path, "a") as f:
133 |                 for line in res:
134 |                     f.write(line + "\n")
135 | 
136 |     def get_dependent_rep_urls(self, libraries, platform, output):
137 |         """
138 |         Extract and save dependent urls of dependent repositories.
139 | 
140 |         :param libraries: Dict of names and urls to repo or homepage. You can use empty url if \
141 |             you are not sure about the link.
142 |         :param platform: Package platform where the library is published. You can use empty
143 |         platform if you are not sure about a link.
144 |         :param output: Save location for urls. Specify folder if you have several libraries. \
145 |             Then urls will be stored in the file <library name>.txt . You can specify file, then
146 |             all urls will be saved in one file.
147 |         :return:
148 |         """
149 |         libraries_info = self.get_lib_info(libraries, platform)
150 |         dependent_reps = self.get_dependent_reps(libraries_info)
151 |         self.save_urls_only(dependent_reps, libraries_info, save_to=output)
152 | 
    def _get_log_name(self):
        """
        Return the constant name "LibrariesIOFetcher".

        NOTE(review): presumably this is the logger name picked up by the base class - confirm.
        """
        return "LibrariesIOFetcher"
155 | 
156 | 
def dependent_reps_entry(args):
    """
    Command line entry point: save the urls of repositories that depend on given libraries.

    :param args: Parsed arguments. The attributes read are `libraries` (list of \
        "<name>:<url>" strings; the url part may be empty or omitted), `libraries_json` (path \
        to a JSON file with the name -> url mapping, used when `libraries` is empty), \
        `librariesio_data`, `log_level`, `platform` and `output`.
    """
    if args.libraries:
        libraries = {}
        for lib in args.libraries:
            # Split on the first ":" only, urls contain colons themselves. An entry without
            # any ":" is accepted as a library name with an empty url.
            name, _, url = lib.partition(":")
            libraries[name] = url
    else:
        # The context manager closes the JSON file instead of leaking the handle.
        with open(args.libraries_json) as fin:
            libraries = json.load(fin)

    libio = LibrariesIOFetcher(args.librariesio_data, args.log_level)
    libio.get_dependent_rep_urls(libraries, args.platform, args.output)
165 | 


--------------------------------------------------------------------------------
/snippet_ranger/model2/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/src-d/snippet-ranger/06247e0492d59b859fe48dea0428171b252770ef/snippet_ranger/model2/__init__.py


--------------------------------------------------------------------------------
/snippet_ranger/model2/base_split.py:
--------------------------------------------------------------------------------
 1 | from typing import Iterable
 2 | 
 3 | from modelforge import Model
 4 | from ast2vec import Model2Base
 5 | 
 6 | 
 7 | class Model2BaseSplit(Model2Base):
 8 |     """
 9 |     Class to split the model content and save it in a new model.
10 |     `Model2Base.MODEL_FROM` should be iterable and iterator returns will be called model objects.
11 |     For example, one can split objects of :class:`ast2vec.Source` to functions parts and store it
12 |     as :class:`snippet_ranger.Snippet` model (see :class:`snippet_ranger.Source2Func` class).
13 | 
14 |     This class the next pipeline:
15 |     1. Filter unrelated objects in the input Model with `input_model_object_criteria` function.
16 |     2. Split one model object into several objects of new model with `split_model_object` function.
17 |     3. Discard some new objects appeared on step 2 with `output_model_object_criteria` function.
18 |     4. Save new model with all remaining object.
19 | 
20 |     Produce exactly one model from one.
21 |     """
22 |     def __init__(self, *args, **kwargs):
23 |         super(Model2BaseSplit, self).__init__(*args, **kwargs)
24 | 
25 |     def filter_input_model_content(self, model) -> Iterable:
26 |         """
27 |         Filter object of input model by criteria in input_model_object_criteria
28 |         :return: Remaining objects.
29 |         """
30 |         return filter(self.input_model_object_criteria, model)
31 | 
32 |     def input_model_object_criteria(self, model_object):
33 |         """
34 |         Criteria for input model filtering.
35 |         No filtration by default.
36 |         :param model_object: Model object.
37 |         :return:
38 |         """
39 |         return True
40 | 
41 |     def filter_output_model_object(self, model_object) -> Iterable:
42 |         """
43 |         Filter object of output model by criteria in output_model_object_criteria
44 |         :return:
45 |         """
46 |         return filter(self.output_model_object_criteria, model_object)
47 | 
48 |     def output_model_object_criteria(self, model_object):
49 |         """
50 |         Criteria for output objects filtering.
51 |         No filtration by default.
52 |         :param model_object: Model object.
53 |         :return: Remaining objects.
54 |         """
55 |         return True
56 | 
57 |     def convert_model(self, model_from: Model) -> Model:
58 |         result = []
59 |         for model_object in self.filter_input_model_content(iter(model_from)):
60 |             out_model_part = self.split_model_object(model_from, model_object)
61 |             for out_model_object in self.filter_output_model_object(out_model_part):
62 |                 result.append(out_model_object)
63 |         if result:
64 |             out_model = self.construct(model_from, result)
65 |         else:
66 |             raise ValueError("All functions are filtered and you get empty model.")
67 |         return out_model
68 | 
69 |     def split_model_object(self, model_from: Model, model_object) -> Iterable:
70 |         """
71 |         This function must be implemented in the child classes.
72 | 
73 |         :param model_from: The full input model instance.
74 |         :param model_object: The current model object instance to split.
75 |         :return: List or tuple of parameters for output model objects initialization.
76 |         """
77 |         raise NotImplementedError
78 | 
79 |     def construct(self, model_from: Model, result: list) -> Model:
80 |         """
81 |         Construct out model from objects.
82 |         This function must be implemented in the child classes.
83 | 
84 |         :param model_from: The full input model instance.
85 |         :param result: objects from `split_model_object`
86 |         :return: Output model.
87 |         """
88 |         raise NotImplementedError
89 | 


--------------------------------------------------------------------------------
/snippet_ranger/model2/snippet2bow.py:
--------------------------------------------------------------------------------
  1 | import os
  2 | from collections import defaultdict
  3 | import logging
  4 | import math
  5 | 
  6 | from ast2vec.bow import BOW
  7 | from ast2vec.model2.source2bow import UastModel2BOW, Uasts2BOW
  8 | from ast2vec.df import DocumentFrequencies
  9 | from ast2vec.token_parser import NoTokenParser
 10 | from ast2vec.uast_ids_to_bag import UastIds2Bag
 11 | from ast2vec.bblfsh_roles import SIMPLE_IDENTIFIER, CALL_CALLEE
 12 | import numpy
 13 | from scipy.sparse import csr_matrix
 14 | 
 15 | from snippet_ranger.models.snippet import Snippet
 16 | 
 17 | 
 18 | class Snippet2BOW(Uasts2BOW):
 19 |     def __init__(self, vocabulary: dict, docfreq: DocumentFrequencies,
 20 |                  getter: callable, token_parser=None, role=SIMPLE_IDENTIFIER):
 21 |         super().__init__(vocabulary, docfreq, getter)
 22 |         if token_parser is not None:
 23 |             self._uast2bag = UastIds2Bag(vocabulary, token_parser)
 24 |         self.role = role
 25 | 
 26 |     def __call__(self, file_uast):
 27 |         freqs = defaultdict(int)
 28 |         bag = self._uast2bag.uast_to_bag(self._getter(file_uast), self.role)
 29 |         for key, freq in bag.items():
 30 |             freqs[key] += freq
 31 |         missing = []
 32 |         for key, val in freqs.items():
 33 |             try:
 34 |                 freqs[key] = math.log(1 + val) * math.log(
 35 |                     self._docfreq.docs / self._docfreq[self._reverse_vocabulary[key]])
 36 |             except KeyError:
 37 |                 missing.append(key)
 38 |         for key in missing:
 39 |             del freqs[key]
 40 |         return dict(freqs)
 41 | 
 42 | 
 43 | class SnippetModel2BOW(UastModel2BOW):
 44 |     MODEL_FROM_CLASS = Snippet
 45 | 
 46 |     def __init__(self, topn, docfreq, *args, **kwargs):
 47 |         super().__init__(topn, docfreq, *args, **kwargs)
 48 |         vocabulary = {t: i for i, t in enumerate(self._tokens)}
 49 |         self._uasts2bow = Snippet2BOW(vocabulary, docfreq, lambda x: x)
 50 | 
 51 |     def convert_model(self, model: Snippet) -> BOW:
 52 |         bags = [self._uasts2bow(uast) for uast in model.uasts]
 53 |         data = list(zip(*[(bag_[x], i, x) for i, bag_ in enumerate(bags) for x in bag_]))
 54 |         matrix = csr_matrix((data[0], (data[1], data[2])),
 55 |                             shape=(len(bags), len(self._uasts2bow.vocabulary)),
 56 |                             dtype=numpy.float32)
 57 |         bow = BOW(log_level=logging.WARNING)
 58 |         bow.construct(repos=model.names, matrix=matrix, tokens=self._tokens)
 59 |         bow.meta["dependencies"] = [self._uasts2bow.docfreq]
 60 |         return bow
 61 | 
 62 | 
 63 | class SnippetModel2FuncCallsBOW(UastModel2BOW):
 64 |     # TODO(zurk): docstring
 65 | 
 66 |     MODEL_FROM_CLASS = Snippet
 67 | 
 68 |     def __init__(self, topn, docfreq, *args, **kwargs):
 69 |         super().__init__(topn, docfreq, *args, **kwargs)
 70 |         vocabulary = {t: i for i, t in enumerate(self._tokens)}
 71 |         self._uasts2bow = Snippet2BOW(vocabulary, docfreq, lambda x: x, NoTokenParser(),
 72 |                                       CALL_CALLEE)
 73 | 
 74 |     def convert_model(self, model: Snippet) -> BOW:
 75 |         bags = [self._uasts2bow(uast) for uast in model.uasts]
 76 |         data = list(zip(*[(bag_[x], i, x) for i, bag_ in enumerate(bags) for x in bag_]))
 77 |         matrix = csr_matrix((data[0], (data[1], data[2])),
 78 |                             shape=(len(bags), len(self._uasts2bow.vocabulary)),
 79 |                             dtype=numpy.float32)
 80 |         bow = BOW(log_level=logging.WARNING)
 81 |         bow.construct(repos=model.names, matrix=matrix, tokens=self._tokens)
 82 |         bow.meta["dependencies"] = [self._uasts2bow.docfreq]
 83 |         return bow
 84 | 
 85 | 
 86 | def snippet2bow_entry(args):
 87 |     df = DocumentFrequencies().load(args.docfreq)
 88 |     os.makedirs(args.output, exist_ok=True)
 89 |     converter = SnippetModel2BOW(args.vocabulary_size, df, num_processes=args.processes,
 90 |                                  overwrite_existing=args.overwrite_existing)
 91 |     converter.convert(args.input, args.output, pattern=args.filter)
 92 | 
 93 | 
 94 | def snippet2fc_bow_entry(args):
 95 |     df = DocumentFrequencies().load(args.docfreq)
 96 |     os.makedirs(args.output, exist_ok=True)
 97 |     converter = SnippetModel2FuncCallsBOW(args.vocabulary_size, df, num_processes=args.processes,
 98 |                                           overwrite_existing=args.overwrite_existing)
 99 |     converter.convert(args.input, args.output, pattern=args.filter)
100 | 


--------------------------------------------------------------------------------
/snippet_ranger/model2/snippet2df.py:
--------------------------------------------------------------------------------
 1 | import tempfile
 2 | from typing import Union
 3 | 
 4 | from ast2vec.model2.source2df import Uast2DocFreq, MergeDocFreq
 5 | from ast2vec.df import DocumentFrequencies
 6 | from ast2vec.bblfsh_roles import SIMPLE_IDENTIFIER, CALL_CALLEE
 7 | from ast2vec.source import UASTModel
 8 | from ast2vec.uast_ids_to_bag import UastIds2Bag
 9 | from snippet_ranger.utils import get_func_names_bow
10 | from snippet_ranger.model2.source2func import process_lib_functions
11 | 
12 | from modelforge import Model
13 | 
14 | from snippet_ranger.models.snippet import Snippet
15 | 
16 | 
class FilterVocabulary:
    """
    Identity "vocabulary" restricted to a fixed collection of allowed items.

    Indexing returns the item itself when it belongs to `filter_set` and raises KeyError
    otherwise.
    """
    def __init__(self, filter_set):
        """
        :param filter_set: Container of the allowed items; only `in` checks are performed.
        """
        self.filter_set = filter_set

    def __getitem__(self, item):
        """
        :param item: Item to look up.
        :return: `item` itself if it is allowed.
        :raise KeyError: if `item` is not in `filter_set`; the exception carries the item.
        """
        if item in self.filter_set:
            return item
        # Report which key is missing, as the built-in mappings do.
        raise KeyError(item)
25 | 
26 | 
class Snippet2DocFreq(Uast2DocFreq):
    """
    Accumulates the document frequencies of a Snippet model: every snippet is one document.
    """
    MODEL_FROM_CLASS = Snippet
    MODEL_TO_CLASS = DocumentFrequencies

    def __init__(self, role: int=SIMPLE_IDENTIFIER, filter_set: set =None, *args, **kwargs):
        """
        :param role: UAST role of the nodes which are counted.
        :param filter_set: Optional set of allowed keys. A non-empty set is wrapped into \
            :class:`FilterVocabulary`; otherwise no vocabulary is passed to the bag extractor.
        :param args: positional arguments to pass to :class:`Uast2DocFreq`.
        :param kwargs: key arguments to pass to :class:`Uast2DocFreq`.
        """
        super().__init__(*args, **kwargs)
        vocabulary = FilterVocabulary(filter_set) if filter_set else None
        self._uast2bag = UastIds2Bag(vocabulary)
        self.role = role

    def convert_model(self, model: Model) -> Union[Model, None]:
        """
        Update the accumulated counters with every snippet of the model.

        :param model: Model which provides the `uasts` sequence.
        :return: None, only `self._df` and `self._docs` are updated.
        """
        for uast in model.uasts:
            bag = self._uast2bag.uast_to_bag(uast, role=self.role)
            # Every key is counted once per snippet regardless of its frequency inside it.
            contained = {key for key in bag}
            for word in contained:
                self._df[word] += 1
            self._docs += 1
44 | 
45 | 
def snippet2df_entry(args):
    """
    Command line entry point: calculate document frequencies over Snippet models.

    The per-model results are written to a temporary directory and then merged into
    `args.output`.

    :param args: Parsed arguments. The attributes read are `processes`, \
        `overwrite_existing`, `tmpdir`, `input`, `filter` and `output`.
    """
    converter = Snippet2DocFreq(
        num_processes=args.processes,
        overwrite_existing=args.overwrite_existing,
    )
    with tempfile.TemporaryDirectory(dir=args.tmpdir, prefix="snippet2df") as tmpdir:
        converter.convert(args.input, tmpdir, pattern=args.filter)
        merge_pattern = "%s*.asdf" % DocumentFrequencies.NAME
        MergeDocFreq(num_processes=1).convert(tmpdir, args.output, pattern=merge_pattern)
54 | 
55 | 
def snippet2fc_df_entry(args):
    """
    Command line entry point: calculate document frequencies of library function calls.

    Only the callee names found in the library UAST model (after `process_lib_functions`)
    are counted. The per-model results are written to a temporary directory and then merged
    into `args.output`.

    :param args: Parsed arguments. The attributes read are `library_uast`, `processes`, \
        `overwrite_existing`, `tmpdir`, `input`, `filter` and `output`.
    """
    library_functions = process_lib_functions(
        get_func_names_bow(UASTModel().load(args.library_uast)))

    converter = Snippet2DocFreq(
        num_processes=args.processes,
        overwrite_existing=args.overwrite_existing,
        role=CALL_CALLEE,
        filter_set=library_functions,
    )
    with tempfile.TemporaryDirectory(dir=args.tmpdir, prefix="snippet2df") as tmpdir:
        converter.convert(args.input, tmpdir, pattern=args.filter)
        merge_pattern = "%s*.asdf" % DocumentFrequencies.NAME
        MergeDocFreq(num_processes=1).convert(tmpdir, args.output, pattern=merge_pattern)
69 | 


--------------------------------------------------------------------------------
/snippet_ranger/model2/source2func.py:
--------------------------------------------------------------------------------
  1 | import logging
  2 | 
  3 | from ast2vec.uast import UASTModel
  4 | from ast2vec.source import Source
  5 | from ast2vec.bblfsh_roles import CALL, CALL_CALLEE, FUNCTION_DECLARATION
  6 | from snippet_ranger.model2.base_split import Model2BaseSplit
  7 | from snippet_ranger.models.snippet import Snippet
  8 | from snippet_ranger.utils import uast_role_nodes, has_import, uast_to_bag, get_func_names_bow
  9 | 
 10 | 
 11 | class Source2Func(Model2BaseSplit):
 12 |     """
 13 |     This class splits files in source model to functions.
 14 |     It makes snippet from each function that satisfies the rule in `output_model_object_criteria`
 15 |     for every file that satisfies the rule in `input_model_object_criteria`.
 16 |     """
 17 |     MODEL_FROM_CLASS = Source
 18 |     MODEL_TO_CLASS = Snippet
 19 | 
 20 |     def __init__(self, libname, lib_funcs_bow=None, *args, **kwargs):
 21 |         """
 22 |         :param libname: Name of the library. All files without library usage are not handled.
 23 |         :param lib_funcs_bow: dictionary of function names (bag of words) which can be used from \
 24 |             the library. You can use just all function names or preprocess it somehow. For \
 25 |             example, remove functions that are common for language or internal functions.
 26 |         :param args: positional arguments to pass to :class:`Model2BaseSplit`.
 27 |         :param kwargs: key arguments to pass to :class:`Model2BaseSplit`.
 28 |         """
 29 |         super(Source2Func, self).__init__(*args, **kwargs)
 30 |         self.libname = libname
 31 |         self.lib_funcs_bow = lib_funcs_bow
 32 |         self.lib_funcs_bow_set = set(lib_funcs_bow)
 33 | 
 34 |         self._log.debug("lib_funcs_bow for {} lib is {}".format(libname, lib_funcs_bow))
 35 |         self.threshold = 0
 36 | 
 37 |     def input_model_object_criteria(self, model_object):
 38 |         """
 39 |         Filtration criteria for input model. Filter all files that are not use specified library.
 40 | 
 41 |         :param model_object: Object of Source model.
 42 |         :return: Library usage indicator.
 43 |         """
 44 |         filename, uast, source = model_object
 45 |         res = has_import(self.libname, uast)
 46 |         return res
 47 | 
 48 |     def split_model_object(self, model_from, model_object):
 49 |         """
 50 |         Parameters iterator for Function models initialisation.
 51 |         This models are split from
 52 | 
 53 |         :param model_from: Full Source model.
 54 |         :param model_object: Current Source model object.
 55 |         :return: parameters for :class:`Snippet` model __init__.
 56 |         """
 57 |         filename, uast, source = model_object
 58 |         have_funcs = False
 59 |         func_nodes = uast_role_nodes(uast, FUNCTION_DECLARATION)
 60 |         for func_node in func_nodes:
 61 |             have_funcs = True
 62 |             pos_start, pos_end = func_node.start_position.line-1, func_node.end_position.line
 63 |             func_source = "\n".join(source.splitlines()[pos_start:pos_end])
 64 |             yield filename, func_node, func_source, pos_start, pos_end
 65 |         if not have_funcs:
 66 |             yield filename, uast, source, 0, source.count("\n")
 67 | 
 68 |     def output_model_object_criteria(self, model_object):
 69 |         """
 70 |         Output model object filter criteria. Filter all :class:`Snippet` model entries that has
 71 |         no calls from the library bag of words are not use the library.
 72 | 
 73 |         :param model_object: Source model object.
 74 |         :return: Library functions usage indicator.
 75 |         """
 76 |         func_node = model_object[1]
 77 |         func_names = uast_to_bag(func_node, role=CALL_CALLEE)
 78 | 
 79 |         common = self.lib_funcs_bow_set & func_names.keys()
 80 |         if common == 0 and self._log.isEnabledFor(logging.DEBUG):
 81 |             self._log.DEBUG("There is no common functions in func_{}-{}_{}".format(
 82 |                 model_object[4], model_object[5], model_object[0]))
 83 |             for key in func_names:
 84 |                 if key in model_object[2]:
 85 |                     self._log.DEBUG("But I can find {} in source!".format(key))
 86 |                     self._log.error("Something strange. "
 87 |                                     "Here is the source code file:\n{}".format(model_object[2]))
 88 |                     break
 89 |         if len(common) > self.threshold:
 90 |             return True
 91 |         return False
 92 | 
 93 |     def construct(self, model_from, result):
 94 |         return Source2Func.MODEL_TO_CLASS().construct(model_from.repository, *zip(*result))
 95 | 
 96 | 
 97 | def process_lib_functions(functions_bow):
 98 |     """
 99 |     Remove bad function names from function bag of words. Specific for Python.
100 |     Removes internal functions and test functions.
101 |     """
102 |     bad_prefixes = ["_", "test"]
103 |     clear_functions_bow = {}
104 |     for k, v in functions_bow.items():
105 |         for bad_prefix in bad_prefixes:
106 |             if k.startswith(bad_prefix):
107 |                 break
108 |         else:
109 |             clear_functions_bow[k] = v
110 | 
111 |     return clear_functions_bow
112 | 
113 | 
def source2func_entry(args):
    """
    Command line entry point: split Source models into function snippets which use a library.

    :param args: Parsed arguments. The attributes read are `library_uast`, `library_name`, \
        `log_level`, `processes`, `overwrite_existing`, `input`, `output` and `filter`.
    """
    library_functions = process_lib_functions(
        get_func_names_bow(UASTModel().load(args.library_uast)))

    Source2Func(
        args.library_name, library_functions,
        log_level=args.log_level,
        num_processes=args.processes,
        overwrite_existing=args.overwrite_existing,
    ).convert(args.input, args.output, pattern=args.filter)
123 | 


--------------------------------------------------------------------------------
/snippet_ranger/models/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/src-d/snippet-ranger/06247e0492d59b859fe48dea0428171b252770ef/snippet_ranger/models/__init__.py


--------------------------------------------------------------------------------
/snippet_ranger/models/snippet.py:
--------------------------------------------------------------------------------
 1 | from ast2vec import Source
 2 | import numpy as np
 3 | 
 4 | 
 5 | class Snippet(Source):
 6 |     """
 7 |     This model can store code snippets. In general, code snippet is any part of source code file.
 8 |     For example, function declaration is a code snippet. So, this class is the same as source model
 9 |     but have start and end line positions of snippet location in file.
10 |     You can use :class:`Source2Function` transformer to create function snippets from source model.
11 |     """
12 | 
13 |     NAME = "snippet"
14 | 
15 |     def construct(self, repository, filenames, uasts, sources,
16 |                   positions_start=None, positions_end=None, positions=None):
17 |         super(Snippet, self).construct(repository=repository, filenames=filenames,
18 |                                        sources=sources, uasts=uasts)
19 |         if ((positions_start is None) ^ (positions_end is None)) or \
20 |                 ((positions_start is None) ^ (positions is not None)):
21 |             raise ValueError("You should specify both positions_start and positions_end or "
22 |                              "only a positions")
23 |         if positions is None:
24 |             if len(positions_start) != len(positions_end):
25 |                 raise ValueError("Length of positions_start ({}) and positions_end ({}) "
26 |                                  "are not equal".format(len(positions_start), len(positions_end)))
27 |             self._positions = np.array(list(zip(positions_start, positions_end)))
28 |         else:
29 |             self._positions = positions
30 |         return self
31 | 
32 |     @property
33 |     def names(self) -> list:
34 |         """
35 |         Creates the list of names for snippets in the model.
36 |         Usually names are needed for topic modeling to represent different snippets as different
37 |         documents. See `SnippetModel2BOW` transformer.
38 |         """
39 |         return ["{}/{}_{}_{}".format(self._repository, name, st, end).
40 |                 replace(":", "").replace(" ", "_")
41 |                 for name, (st, end) in zip(self._filenames, self._positions)]
42 | 
43 |     @property
44 |     def positions(self):
45 |         """
46 |         Return start and end line positions of snippets.
47 |         """
48 |         return self._positions
49 | 
50 |     @property
51 |     def positions_start(self):
52 |         """
53 |         Return start line position of snippets.
54 |         """
55 |         return self._positions[:, 0].T
56 | 
57 |     @property
58 |     def positions_end(self):
59 |         """
60 |         Return end line position of snippets.
61 |         """
62 |         return self._positions[:, 1].T
63 | 
64 |     def __iter__(self):
65 |         """
66 |         Iterator over the items.
67 |         """
68 |         return zip(self._filenames, self._uasts, self._sources, self._positions)
69 | 
70 |     def __getitem__(self, item):
71 |         """
72 |         Returns file name, uast, source code and positions for the given snippet index.
73 | 
74 |         :param item: Snippet index.
75 |         :return: file name, source code, uast, positions, where positions[0] is start and \
76 |             positions[1] is end.
77 |         """
78 |         return super(Snippet, self).__getitem__(item) + (self._positions[item], )
79 | 
80 |     def _load_tree_kwargs(self, tree):
81 |         tree_kwargs = super(Snippet, self)._load_tree_kwargs(tree)
82 |         tree_kwargs["positions"] = np.array(tree["positions"])
83 |         return tree_kwargs
84 | 
85 |     def _to_dict_to_save(self):
86 |         save_dict = super(Snippet, self)._to_dict_to_save()
87 |         save_dict["positions"] = self._positions
88 |         return save_dict
89 | 


--------------------------------------------------------------------------------
/snippet_ranger/pylib2uast.py:
--------------------------------------------------------------------------------
 1 | import os
 2 | import logging
 3 | from ast2vec.repo2.uast import repos2uast_entry
 4 | from ast2vec.enry import install_enry
 5 | 
 6 | 
 7 | def pylib2uast_entry(args):
 8 |     log = logging.getLogger("pylib2uast")
 9 |     module_names = args.input
10 |     module_dirs = []
11 |     for lib_name in args.input:
12 |         try:
13 |             module = __import__(lib_name)
14 |             module_dir = os.path.abspath(os.path.dirname(module.__file__))
15 |             module_dirs.append(module_dir)
16 |         except ModuleNotFoundError as e:
17 |             log.error("No module named '%s'. Skipping.")
18 | 
19 |     args.input = module_dirs
20 | 
21 |     install_enry()
22 |     repos2uast_entry(args)
23 |     for file in os.listdir(args.output):
24 |         for name in module_names:
25 |             if name in file:
26 |                 break
27 |         os.rename(os.path.join(args.output, file), os.path.join(args.output, name + '.asdf'))
28 | 


--------------------------------------------------------------------------------
/snippet_ranger/tests/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/src-d/snippet-ranger/06247e0492d59b859fe48dea0428171b252770ef/snippet_ranger/tests/__init__.py


--------------------------------------------------------------------------------
/snippet_ranger/tests/data/snippet_test_repo.asdf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/src-d/snippet-ranger/06247e0492d59b859fe48dea0428171b252770ef/snippet_ranger/tests/data/snippet_test_repo.asdf


--------------------------------------------------------------------------------
/snippet_ranger/tests/data/source_test_repo.asdf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/src-d/snippet-ranger/06247e0492d59b859fe48dea0428171b252770ef/snippet_ranger/tests/data/source_test_repo.asdf


--------------------------------------------------------------------------------
/snippet_ranger/tests/data/test_lib.asdf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/src-d/snippet-ranger/06247e0492d59b859fe48dea0428171b252770ef/snippet_ranger/tests/data/test_lib.asdf


--------------------------------------------------------------------------------
/snippet_ranger/tests/data/test_lib/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/src-d/snippet-ranger/06247e0492d59b859fe48dea0428171b252770ef/snippet_ranger/tests/data/test_lib/__init__.py


--------------------------------------------------------------------------------
/snippet_ranger/tests/data/test_lib/example.py:
--------------------------------------------------------------------------------
def f1():  # Fixture library function with an empty body.
    pass
 3 | 
 4 | 
def f2():  # Fixture library function with an empty body.
    pass
 7 | 
 8 | 
def f3():  # Fixture library function which only declares a nested function.
    def f35():  # Nested function; it is defined but never called.
        pass
12 | 


--------------------------------------------------------------------------------
/snippet_ranger/tests/data/test_librariesio_data/projects-1.0.0-2017-06-15.csv:
--------------------------------------------------------------------------------
1 | ID,Platform,Name,Created Timestamp,Updated Timestamp,Description,Keywords,Homepage URL,Licenses,Repository URL,Versions Count,SourceRank,Latest Release Publish Timestamp,Latest Release Number,Package Manager ID,Dependent Projects Count,Language,Status,Last synced Timestamp,Dependent Repositories Count,Repository ID
2 | 1,Platform1,lib1,2015-01-11 23:56:18 UTC,2017-06-14 01:03:14 UTC,"A starting point for stripped down, structured and nib-less iOS applications including support for CocoaPods and Uncrustify.","",lib1.url,"",lib1.url,0,2,2017-06-14 01:03:05 UTC,,,0,Objective-C,,2017-06-14 01:03:10 UTC,0,3945
3 | 2,Platform2,lib2,2015-01-11 23:56:18 UTC,2017-06-14 01:03:10 UTC,Synchronize code snippets with a git repository.,"",lib2.url,MIT,lib2.url,0,11,2014-03-13 18:40:38 UTC,0.0.4,,0,Objective-C,,2017-06-14 01:03:07 UTC,0,3943


--------------------------------------------------------------------------------
/snippet_ranger/tests/data/test_librariesio_data/repository_dependencies-1.0.0-2017-06-15.csv:
--------------------------------------------------------------------------------
1 | ID,Host Type,Repository Name with Owner,Repository ID,Manifest Platform,Manifest Filepath,Git branch,Manifest kind,Optional,Dependency Project Name,Dependency Requirements,Dependency Kind,Dependency Project ID
2 | 48593218,GitHub,repo1/repo1,1,Bower,bower.json,,manifest,,lib1,~3.2.0,development,1
3 | 48593223,GitHub,repo1/repo1,1,Bower,bower.json,,manifest,,lib2,~2.1.1,development,2
4 | 48593228,GitHub,repo2/repo2,2,Bower,bower.json,,manifest,,lib2,~0.5.0,development,2


--------------------------------------------------------------------------------
/snippet_ranger/tests/data/test_repo/example.py:
--------------------------------------------------------------------------------
 1 | import test_lib
 2 | from test_lib import f1
 3 | 
 4 | 
def f():  # Fixture function: calls f2 twice, f3 three times and f1 once.
    f2()
    f2()
    f3()
    f1()
    f3()
    f3()
12 | 
13 | 
def f3():  # Fixture function defined in this file; its only call is to f.
    f()
16 | 


--------------------------------------------------------------------------------
/snippet_ranger/tests/models.py:
--------------------------------------------------------------------------------
1 | import os
2 | 
# Name of the fixture library.
LIB_NAME = "test_lib"
# Directory with the test fixtures, located next to this module.
DATA_DIR = os.path.join(os.path.dirname(__file__), "data/")
# Paths of the .asdf fixture files inside DATA_DIR.
TEST_LIB = os.path.join(DATA_DIR, "test_lib.asdf")
TEST_REPO = os.path.join(DATA_DIR, "source_test_repo.asdf")
SNIPPET = os.path.join(DATA_DIR, "snippet_test_repo.asdf")
8 | 


--------------------------------------------------------------------------------
/snippet_ranger/tests/test_librariesio_fetcher.py:
--------------------------------------------------------------------------------
 1 | import os
 2 | 
 3 | import unittest
 4 | import tempfile
 5 | 
 6 | from snippet_ranger.librariesio_fetcher import LibrariesIOFetcher
 7 | from snippet_ranger.tests.models import DATA_DIR
 8 | 
 9 | 
class LibrariesIOFetcherTests(unittest.TestCase):
    """
    Tests of :class:`LibrariesIOFetcher` on the small libraries.io dump from the test data.
    """
    LIBRARIES_IO_DATA_PATH = os.path.join(DATA_DIR, "test_librariesio_data/")

    def setUp(self):
        self.libio = LibrariesIOFetcher(LibrariesIOFetcherTests.LIBRARIES_IO_DATA_PATH)

    def get_url_str(self, lib, platform):
        """
        Save the dependent urls into a temporary file and return them as a set of lines.
        """
        with tempfile.NamedTemporaryFile() as tmp_file:
            self.libio.get_dependent_rep_urls(lib, platform, tmp_file.name)
            with open(tmp_file.name) as urls_file:
                content = urls_file.read()
        # The content ends with a newline, so the last split item is dropped.
        lines = content.split("\n")
        return set(lines[:-1])

    def test_get_dependent_rep_urls(self):
        repo1 = {"https://github.com/repo1/repo1"}
        repo2 = {"https://github.com/repo2/repo2"}
        both_libs = {"lib1": "lib1.url", "lib2": "lib2.url"}

        # One library, any platform.
        self.assertEqual(self.get_url_str({"lib1": "lib1.url"}, ""), repo1)

        # One library, explicit platform.
        self.assertEqual(self.get_url_str({"lib2": "lib2.url"}, "Platform2"), repo1 | repo2)
        with self.assertRaises(ValueError):
            self.get_url_str({"lib2": "lib2.url"}, "wrong_platform")

        # Several libraries saved into a single file.
        self.assertEqual(self.get_url_str(both_libs, ""), repo1 | repo2)

        # Several libraries saved into a folder: one file per library.
        with tempfile.TemporaryDirectory() as tmpdir:
            self.libio.get_dependent_rep_urls(both_libs, "", tmpdir)

            for file_name, expected in (("lib1.txt", repo1), ("lib2.txt", repo1 | repo2)):
                with open(os.path.join(tmpdir, file_name)) as urls_file:
                    content = urls_file.read()
                self.assertEqual(set(content.split("\n")[:-1]), expected)
49 | 
50 | if __name__ == "__main__":
51 |     unittest.main()
52 | 


--------------------------------------------------------------------------------
/snippet_ranger/tests/test_main.py:
--------------------------------------------------------------------------------
 1 | import argparse
 2 | from contextlib import contextmanager
 3 | from io import StringIO
 4 | import sys
 5 | import unittest
 6 | import logging
 7 | 
 8 | import snippet_ranger.__main__ as main
 9 | 
10 | 
@contextmanager
def captured_output():
    """
    Temporarily capture ``sys.stdout``, ``sys.stderr`` and root logger output in buffers.

    While the context is active both standard streams are replaced with ``StringIO``
    objects and an extra ``logging.StreamHandler`` is attached to the root logger.
    Everything is restored on exit, even if the body raises.

    :return: context manager yielding (stdout buffer, stderr buffer, log buffer).
    """
    out_buffer, err_buffer, log_buffer = StringIO(), StringIO(), StringIO()
    root_logger = logging.getLogger()
    buffer_handler = logging.StreamHandler(log_buffer)
    root_logger.addHandler(buffer_handler)
    saved_streams = (sys.stdout, sys.stderr)
    try:
        sys.stdout = out_buffer
        sys.stderr = err_buffer
        yield sys.stdout, sys.stderr, log_buffer
    finally:
        sys.stdout, sys.stderr = saved_streams
        root_logger.removeHandler(buffer_handler)
24 | 
25 | 
class MainTests(unittest.TestCase):
    """Tests of the command line dispatch done by ``snippet_ranger.__main__``."""

    def test_handlers(self):
        """
        Check that the parser's subcommands match the expected ones and that running
        each subcommand calls its ``*_entry`` handler exactly once.
        """
        action2handler = {
            "source2func": "source2func_entry",
            "dependent_reps": "dependent_reps_entry",
            "snippet2df": "snippet2df_entry",
            "snippet2bow": "snippet2bow_entry",
            "snippet2fc_bow": "snippet2fc_bow_entry",
            "snippet2fc_df": "snippet2fc_df_entry",
            "pylib2uast": "pylib2uast_entry"

        }
        parser = main.get_parser()
        # NOTE: this reaches into argparse private attributes to list the subcommands.
        choices = parser._subparsers._actions[2]._choices_actions
        subcommands = {choice.dest for choice in choices}
        expected = set(action2handler)

        untested = subcommands - expected
        self.assertFalse(len(untested),
                         "You forgot to add to this test {} subcommand(s) check".format(
                             untested))

        unknown = expected - subcommands
        self.assertFalse(len(unknown),
                         "You cover unexpected subcommand(s) {}".format(
                             unknown))

        called_actions = []
        saved_argv = sys.argv
        saved_error = argparse.ArgumentParser.error
        try:
            # Silence argparse errors: subcommands are run without their required arguments.
            argparse.ArgumentParser.error = lambda self, message: None

            for action, handler in action2handler.items():
                # The closure is invoked within the same iteration, so `action` is current.
                def record_call(*args, **kwargs):
                    called_actions.append(action)

                original_handler = getattr(main, handler)
                try:
                    setattr(main, handler, record_call)
                    sys.argv = [main.__file__, action]
                    main.main()
                finally:
                    setattr(main, handler, original_handler)
        finally:
            sys.argv = saved_argv
            argparse.ArgumentParser.error = saved_error

        unique_called = set(called_actions)
        self.assertEqual(unique_called, set(action2handler))
        # No handler may have been called more than once.
        self.assertEqual(len(unique_called), len(called_actions))

    def test_empty(self):
        """Running without a subcommand must print the usage text to stdout."""
        saved_argv = sys.argv
        saved_error = argparse.ArgumentParser.error
        try:
            argparse.ArgumentParser.error = lambda self, message: None

            sys.argv = [main.__file__]
            with captured_output() as (stdout, _, _):
                main.main()
        finally:
            sys.argv = saved_argv
            argparse.ArgumentParser.error = saved_error
        self.assertIn("usage:", stdout.getvalue())
88 | 
89 | 
90 | if __name__ == "__main__":
91 |     unittest.main()
92 | 


--------------------------------------------------------------------------------
/snippet_ranger/tests/test_snippet.py:
--------------------------------------------------------------------------------
 1 | import unittest
 2 | 
 3 | import asdf
 4 | import numpy as np
 5 | from ast2vec.bblfsh_roles import Node
 6 | 
 7 | from modelforge import split_strings
 8 | from snippet_ranger.models.snippet import Snippet
 9 | from snippet_ranger.tests import models
10 | 
11 | 
def validate_asdf_file(obj, filename):
    """
    Assert that `filename` holds a serialized "snippet" model with the expected layout.

    :param obj: `unittest.TestCase` instance whose assert methods are used.
    :param filename: path to the ASDF file to validate.
    """
    # Use the context manager so that the file handle is released: callers may validate
    # a file inside a temporary directory that is deleted right after this call.
    with asdf.open(filename) as data:
        tree = data.tree
        for key in ("meta", "filenames", "sources", "uasts", "repository", "positions"):
            obj.assertIn(key, tree)
        # The first serialized UAST must be parseable as a Node.
        Node.FromString(split_strings(tree["uasts"])[0])
        # There must be exactly one UAST per source.
        obj.assertEqual(tree["sources"]["lengths"].shape[0],
                        tree["uasts"]["lengths"].shape[0])
        obj.assertEqual(0, len(tree["meta"]["dependencies"]))
        obj.assertEqual(tree["meta"]["model"], "snippet")
25 | 
26 | 
class TestSnippet(unittest.TestCase):
    """Tests of the ``Snippet`` model loaded from the pre-built fixture file."""

    def setUp(self):
        self.model = Snippet().load(source=models.SNIPPET)

    def assert_np_arrays(self, arr1, arr2):
        """Assert that both arguments are exactly ``np.ndarray`` and element-wise equal."""
        for arr in (arr1, arr2):
            self.assertEqual(type(arr), np.ndarray)
        self.assertTrue(np.all(arr1 == arr2))

    def _check_item(self, model_item):
        """Check one model record: (filename, uast, source, position)."""
        expected_source = "\n".join(
            ["def f():", "    f2()", "    f2()", "    f3()", "    f1()", "    f3()", "    f3()"])
        self.assertEqual(len(model_item), 4)
        self.assertEqual(model_item[0], "example.py")
        self.assertEqual(type(model_item[1]), Node)
        self.assertEqual(model_item[2], expected_source)
        self.assert_np_arrays(model_item[3], np.array([4, 11]))

    def test_names(self):
        expected_names = [
            "./snippet_ranger/snippet_ranger/tests/data/test_repo/example.py_4_11"]
        self.assertEqual(self.model.names, expected_names)

    def test_item(self):
        self._check_item(self.model[0])

    def test_iter(self):
        for model_item in self.model:
            self._check_item(model_item)

    def test_positions_start(self):
        self.assert_np_arrays(self.model.positions_start, np.array([4]))

    def test_positions_end(self):
        self.assert_np_arrays(self.model.positions_end, np.array([11]))

    def test_positions(self):
        self.assert_np_arrays(self.model.positions, np.array([[4, 11]]))

    def test_bad_construct(self):
        """`construct` must reject missing, redundant or mismatched position arguments."""
        base_args = ("repo_name", ["file"], [""], [Node()])
        positions = np.array([[1, 2], [3, 4]])
        pos_start = [1, 3]
        pos_end = [2, 4]

        # (extra positional arguments, extra keyword arguments) of every invalid call.
        bad_calls = [
            ((), {}),
            ((pos_start, pos_end, positions), {}),
            ((), {"positions_start": pos_start, "positions": positions}),
            ((), {"positions_end": pos_end, "positions": positions}),
            ((), {"positions_start": pos_start, "positions_end": [0]}),
        ]
        for extra_args, extra_kwargs in bad_calls:
            with self.assertRaises(ValueError):
                Snippet().construct(*(base_args + extra_args), **extra_kwargs)

        # Valid calls: either start and end positions, or the combined positions array.
        Snippet().construct(*(base_args + (pos_start, pos_end)))
        Snippet().construct(*base_args, positions=positions)
94 | 
95 | 
96 | if __name__ == "__main__":
97 |     unittest.main()
98 | 


--------------------------------------------------------------------------------
/snippet_ranger/tests/test_source2func.py:
--------------------------------------------------------------------------------
 1 | import argparse
 2 | import logging
 3 | import os
 4 | import unittest
 5 | import tempfile
 6 | 
 7 | import asdf
 8 | from ast2vec import Source
 9 | from ast2vec.bblfsh_roles import Node
10 | from modelforge import split_strings
11 | 
12 | from snippet_ranger.model2.source2func import Source2Func
13 | from snippet_ranger.model2.source2func import process_lib_functions, source2func_entry
14 | from snippet_ranger.models.snippet import Snippet
15 | from snippet_ranger.tests import models
16 | from snippet_ranger.utils import get_func_names_bow
17 | from snippet_ranger.tests.test_snippet import validate_asdf_file
18 | 
19 | 
class Source2FuncTests(unittest.TestCase):
    """Tests of the source2func conversion and of its command line entry point."""

    def test_get_func_names_bow(self):
        """`process_lib_functions` is expected to drop "_"- and "test_"-prefixed names."""
        names = ("_xxx", "xxx", "_yyy", "yyy", "test_x", "test_y")
        in_bow = {name: 1 for name in names}
        self.assertEqual(process_lib_functions(in_bow), {"xxx": 1, "yyy": 1})

    def test_convert_model(self):
        lib_model = Source().load(models.TEST_LIB)
        functions_bow = process_lib_functions(get_func_names_bow(lib_model))
        self.assertEqual(functions_bow, {"f1": 1, "f2": 1, "f3": 1, "f35": 1})

        repo_model = Source().load(models.TEST_REPO)
        converter = Source2Func(models.LIB_NAME, functions_bow)
        functions = converter.convert_model(repo_model)

        # Exactly one function of the fixture repository is expected to be extracted.
        self.assertEqual(len(functions), 1)
        filename, uast, source, position = functions[0][:4]
        self.assertEqual(filename, "example.py")
        self.assertEqual(type(uast), Node)
        self.assertEqual(source,
                         "def f():\n    f2()\n    f2()\n    f3()\n    f1()\n    f3()\n    f3()")
        self.assertEqual(position[0], 4)
        self.assertEqual(position[1], 11)

    def test_source2func_object(self):
        with tempfile.TemporaryDirectory() as tmpdir:
            options = {
                "library_uast": models.TEST_LIB,
                "library_name": models.LIB_NAME,
                "input": models.DATA_DIR,
                "output": tmpdir,
                "filter": "**/*.asdf",
                "log_level": logging.INFO,
                "processes": 1,
                "overwrite_existing": True,
            }
            source2func_entry(argparse.Namespace(**options))
            result_path = os.path.join(tmpdir, "source_test_repo.asdf")
            validate_asdf_file(self, result_path)
67 | 
68 | 
69 | if __name__ == "__main__":
70 |     unittest.main()
71 | 


--------------------------------------------------------------------------------
/snippet_ranger/tests/test_utils.py:
--------------------------------------------------------------------------------
 1 | import unittest
 2 | 
 3 | from ast2vec import Source
 4 | from ast2vec import bblfsh_roles
 5 | 
 6 | from snippet_ranger import utils
 7 | from snippet_ranger.tests import models
 8 | 
 9 | 
class UtilsTests(unittest.TestCase):
    """Tests of the UAST helpers in ``snippet_ranger.utils`` on the fixture models."""

    def test_get_func_names_bow(self):
        lib_source = Source().load(models.TEST_LIB)
        expected_bow = dict(f1=1, f2=1, f3=1, f35=1)
        self.assertEqual(utils.get_func_names_bow(lib_source), expected_bow)

    def test_uast_to_bag(self):
        repo_uast = Source().load(models.TEST_REPO).uasts[0]
        expected_bag = dict(test_lib=2, f=2, f1=2, f2=2, f3=4)
        self.assertEqual(utils.uast_to_bag(repo_uast), expected_bag)

    def test_get_imports(self):
        # The fixture repository imports the library and one of its functions.
        repo_uast = Source().load(models.TEST_REPO).uasts[0]
        self.assertEqual(utils.get_imports(repo_uast), {"f1", "test_lib"})

        # The fixture library itself has no imports.
        lib_uast = Source().load(models.TEST_LIB).uasts[0]
        self.assertEqual(utils.get_imports(lib_uast), set())

    def test_has_import(self):
        repo_source = Source().load(models.TEST_REPO)
        for name in ("f1", "test_lib"):
            self.assertTrue(utils.has_import(name, repo_source.uasts[0]))

        lib_source = Source().load(models.TEST_LIB)
        for name in ("f1", "test_lib"):
            self.assertFalse(utils.has_import(name, lib_source.uasts[0]))
54 | 
55 | if __name__ == "__main__":
56 |     unittest.main()
57 | 


--------------------------------------------------------------------------------
/snippet_ranger/utils.py:
--------------------------------------------------------------------------------
 1 | from collections import defaultdict
 2 | 
 3 | from ast2vec import Source
 4 | from ast2vec import UASTModel
 5 | from ast2vec import bblfsh_roles
 6 | 
 7 | 
 8 | def uast_to_bag(uast, bag=None, role=bblfsh_roles.SIMPLE_IDENTIFIER):
 9 |     """
10 |     Convert UAST to bag of words for certain role.
11 | 
12 |     :param uast: Uast to process.
13 |     :param bag: Specify existing bag of words if you want to update it.
14 |     :param role: Role or list of roles to get from uast and convert to bag of words.
15 |     :return: bag of words for tokens of nodes.
16 |     """
17 |     if bag is None:
18 |         bag = defaultdict(int)
19 |     # TODO(zurk): Can be optimised if we need. uast_role_nodes make a list from one role.
20 |     for node in uast_role_nodes(uast, roles=role):
21 |         if node.token != "":
22 |             bag[node.token] += 1
23 |     return bag
24 | 
25 | 
def uast_role_nodes(uast, roles=None) -> iter:
    """
    Filter UAST by the provided roles and iterate through the matching nodes.
    It is a generator. Nodes are visited breadth-first, starting from `uast` itself.

    :param uast: root node; every node must expose `roles` and `children`.
    :param roles: a single role (int) or a list of roles to filter by. \
                  None means [bblfsh_roles.SIMPLE_IDENTIFIER].
    :return: iterator through the nodes which have at least one of `roles`.
    :raise TypeError: if `roles` is not None, an int or a list. As this is a generator, \
                      the error is raised on the first iteration step, not on the call.
    """
    # Function-scope import: the module imports only defaultdict from collections.
    from collections import deque

    if roles is None:
        roles = [bblfsh_roles.SIMPLE_IDENTIFIER]
    elif isinstance(roles, int):
        roles = [roles]
    elif not isinstance(roles, list):
        raise TypeError("roles must be None, an int or a list of ints, got %s"
                        % type(roles).__name__)

    # A deque pops from the left in O(1); list.pop(0) costs O(n) for every visited node.
    queue = deque([uast])
    while queue:
        node = queue.popleft()
        # Yield a node once, no matter how many of the requested roles it has.
        if any(role_id in node.roles for role_id in roles):
            yield node
        queue.extend(node.children)
50 | 
51 | 
def _iter_imports(uast):
    """
    Internal helper: yield every dot-separated part of the tokens of the uast nodes
    which have the IMPORT_PATH or IMPORT_ALIAS role.
    """
    import_roles = [bblfsh_roles.IMPORT_PATH, bblfsh_roles.IMPORT_ALIAS]
    for import_node in uast_role_nodes(uast, import_roles):
        yield from import_node.token.split(".")
59 | 
60 | 
def get_imports(uast):
    """
    Collect the names of all module imports found in the uast.
    It is specific for Python because import paths are split by dot.

    :param uast: UAST to inspect.
    :return: set of import names
    """
    import_names = set()
    import_names.update(_iter_imports(uast))
    return import_names
70 | 
71 | 
def has_import(libname, uast) -> bool:
    """
    Tell whether `libname` is among the import names of the uast.

    :param libname: name of library to check
    :param uast: UAST to inspect.
    :return: True if some dot-separated part of an import equals `libname`, else False.
    """
    return any(import_name == libname for import_name in _iter_imports(uast))
84 | 
85 | 
def get_func_names_bow(uast_model: UASTModel) -> dict:
    """
    Returns bag of words for the function declaration names in the whole model.

    :param uast_model: UAST model; the second element of each of its records is \
                       processed as the UAST.
    :return: dictionary with words as keys and their number of occurrences as values. \
             It is empty if the model has no records.
    """
    # Start from an empty bag instead of None so that a model without records yields
    # an empty dictionary, as the return annotation promises.
    func_class_names = defaultdict(int)
    for record in uast_model:
        func_class_names = uast_to_bag(record[1], func_class_names,
                                       bblfsh_roles.FUNCTION_DECLARATION_NAME)
    return func_class_names
98 | 


--------------------------------------------------------------------------------