├── README.md ├── capstone-project ├── How can we increase revenue from Catch the Pink Flamingo?.pdf ├── Technical Appendix.pdf ├── graph-analytics.cypher ├── pyspark-mllib-clustering.ipynb └── week1-data-exploration.md ├── graph-analytics ├── adding-to-and-modifying-a-graph.cypher ├── basic-graph-operations-with-cypher.cypher ├── building-a-degree-histogram.scala ├── building-a-graph.scala ├── connectivity-analytics-with-cypher.cypher ├── getting-started-with-neo4j.cypher ├── importing_data_into_neo4j.cypher ├── joining-graph-datasets.scala ├── network-connectedness-and-clustering-components.scala ├── path-analytics-with-cypher.cypher └── plot-the-degree-histogram.scala ├── integration-and-processing ├── exploring-sparksql-and-spark-dataframes.py ├── exporting-data-from-mongodb-to-a-csv-file.md ├── querying-and-exporting-from-mongodb.md ├── querying-data-quiz.py ├── querying-data-quiz.sql ├── querying-doc-mongodb.sh ├── soccer-tweet-analysis.ipynb ├── spark-streaming.ipynb └── spark-wordcount.ipynb ├── introduction ├── HadoopMapReduceQuiz.md └── homework-MapReduce.pdf └── machine-learning ├── classification-in-spark.ipynb ├── clustering.ipynb ├── data-exploration-in-spark-quiz.py ├── data-exploration-in-spark.ipynb ├── handling-missing-values.ipynb └── model-evaluation.ipynb /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/README.md -------------------------------------------------------------------------------- /capstone-project/How can we increase revenue from Catch the Pink Flamingo?.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/capstone-project/How can we increase revenue from Catch the Pink Flamingo?.pdf -------------------------------------------------------------------------------- /capstone-project/Technical Appendix.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/capstone-project/Technical Appendix.pdf -------------------------------------------------------------------------------- /capstone-project/graph-analytics.cypher: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/capstone-project/graph-analytics.cypher -------------------------------------------------------------------------------- /capstone-project/pyspark-mllib-clustering.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/capstone-project/pyspark-mllib-clustering.ipynb -------------------------------------------------------------------------------- /capstone-project/week1-data-exploration.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/capstone-project/week1-data-exploration.md -------------------------------------------------------------------------------- /graph-analytics/adding-to-and-modifying-a-graph.cypher: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/graph-analytics/adding-to-and-modifying-a-graph.cypher -------------------------------------------------------------------------------- /graph-analytics/basic-graph-operations-with-cypher.cypher: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/graph-analytics/basic-graph-operations-with-cypher.cypher -------------------------------------------------------------------------------- /graph-analytics/building-a-degree-histogram.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/graph-analytics/building-a-degree-histogram.scala -------------------------------------------------------------------------------- /graph-analytics/building-a-graph.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/graph-analytics/building-a-graph.scala -------------------------------------------------------------------------------- /graph-analytics/connectivity-analytics-with-cypher.cypher: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/graph-analytics/connectivity-analytics-with-cypher.cypher -------------------------------------------------------------------------------- /graph-analytics/getting-started-with-neo4j.cypher: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/graph-analytics/getting-started-with-neo4j.cypher -------------------------------------------------------------------------------- /graph-analytics/importing_data_into_neo4j.cypher: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/graph-analytics/importing_data_into_neo4j.cypher -------------------------------------------------------------------------------- /graph-analytics/joining-graph-datasets.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/graph-analytics/joining-graph-datasets.scala -------------------------------------------------------------------------------- /graph-analytics/network-connectedness-and-clustering-components.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/graph-analytics/network-connectedness-and-clustering-components.scala -------------------------------------------------------------------------------- /graph-analytics/path-analytics-with-cypher.cypher: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/graph-analytics/path-analytics-with-cypher.cypher -------------------------------------------------------------------------------- /graph-analytics/plot-the-degree-histogram.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/graph-analytics/plot-the-degree-histogram.scala -------------------------------------------------------------------------------- /integration-and-processing/exploring-sparksql-and-spark-dataframes.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/integration-and-processing/exploring-sparksql-and-spark-dataframes.py -------------------------------------------------------------------------------- /integration-and-processing/exporting-data-from-mongodb-to-a-csv-file.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/integration-and-processing/exporting-data-from-mongodb-to-a-csv-file.md -------------------------------------------------------------------------------- /integration-and-processing/querying-and-exporting-from-mongodb.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/integration-and-processing/querying-and-exporting-from-mongodb.md -------------------------------------------------------------------------------- /integration-and-processing/querying-data-quiz.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/integration-and-processing/querying-data-quiz.py -------------------------------------------------------------------------------- /integration-and-processing/querying-data-quiz.sql: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/integration-and-processing/querying-data-quiz.sql -------------------------------------------------------------------------------- /integration-and-processing/querying-doc-mongodb.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/integration-and-processing/querying-doc-mongodb.sh -------------------------------------------------------------------------------- /integration-and-processing/soccer-tweet-analysis.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/integration-and-processing/soccer-tweet-analysis.ipynb -------------------------------------------------------------------------------- /integration-and-processing/spark-streaming.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/integration-and-processing/spark-streaming.ipynb -------------------------------------------------------------------------------- /integration-and-processing/spark-wordcount.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/integration-and-processing/spark-wordcount.ipynb -------------------------------------------------------------------------------- /introduction/HadoopMapReduceQuiz.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/introduction/HadoopMapReduceQuiz.md -------------------------------------------------------------------------------- /introduction/homework-MapReduce.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/introduction/homework-MapReduce.pdf -------------------------------------------------------------------------------- /machine-learning/classification-in-spark.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/machine-learning/classification-in-spark.ipynb -------------------------------------------------------------------------------- /machine-learning/clustering.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/machine-learning/clustering.ipynb -------------------------------------------------------------------------------- /machine-learning/data-exploration-in-spark-quiz.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/machine-learning/data-exploration-in-spark-quiz.py -------------------------------------------------------------------------------- /machine-learning/data-exploration-in-spark.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/machine-learning/data-exploration-in-spark.ipynb -------------------------------------------------------------------------------- /machine-learning/handling-missing-values.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/machine-learning/handling-missing-values.ipynb -------------------------------------------------------------------------------- /machine-learning/model-evaluation.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/jingwen-z/bigdata-ucsd/HEAD/machine-learning/model-evaluation.ipynb --------------------------------------------------------------------------------