├── .gitignore ├── .travis.yml ├── DESCRIPTION ├── LICENSE.md ├── README.md ├── bin ├── datagen.cmd ├── fakelogs.cmd └── fakelogs.sh ├── files ├── call_signs2.txt ├── callsign_tbl ├── callsign_tbl_sorted ├── callsigns ├── cqlsh_setup ├── fake_logs │ ├── log1.log │ └── log2.log ├── favourite_animals.csv ├── flumeconf.cfg ├── ham.txt ├── happypandas ├── int_string.csv ├── pandainfo.json ├── spam.txt └── testweet.json ├── mini-complete-example ├── README.md ├── build.sbt ├── pom.xml ├── project │ └── plugins.sbt ├── sbt │ └── sbt └── src │ └── main │ ├── java │ └── com │ │ └── oreilly │ │ └── learningsparkexamples │ │ └── mini │ │ └── java │ │ ├── BasicMap.java │ │ └── WordCount.java │ └── scala │ └── com │ └── oreilly │ └── learningsparkexamples │ └── mini │ └── scala │ ├── BasicMap.scala │ └── WordCount.scala ├── pom.xml ├── project └── plugins.sbt ├── run-all-examples ├── sbt └── sbt ├── setup-project └── src ├── R └── finddistance.R ├── main ├── java │ └── com │ │ └── oreilly │ │ └── learningsparkexamples │ │ └── java │ │ ├── BasicAvg.java │ │ ├── BasicAvgMapPartitions.java │ │ ├── BasicAvgWithKryo.java │ │ ├── BasicFlatMap.java │ │ ├── BasicJoinCsv.java │ │ ├── BasicLoadJson.java │ │ ├── BasicLoadSequenceFile.java │ │ ├── BasicLoadWholeCsv.java │ │ ├── BasicMap.java │ │ ├── BasicMapPartitions.java │ │ ├── BasicMapThenFilter.java │ │ ├── BasicMapToDouble.java │ │ ├── BasicQueryCassandra.java │ │ ├── BasicSaveSequenceFile.java │ │ ├── BasicSum.java │ │ ├── CallLog.java │ │ ├── ChapterSixExample.java │ │ ├── HappyPerson.java │ │ ├── IntersectByKey.java │ │ ├── KafkaInput.java │ │ ├── KeyValueMapFilter.java │ │ ├── LoadHive.java │ │ ├── LoadJsonWithSparkSQL.java │ │ ├── MLlib.java │ │ ├── PerKeyAvg.java │ │ ├── RemoveOutliers.java │ │ ├── SparkSQLTwitter.java │ │ ├── StreamingLogInput.java │ │ ├── WordCount.java │ │ └── logs │ │ ├── ApacheAccessLog.java │ │ ├── Flags.java │ │ ├── Functions.java │ │ ├── LogAnalyzerAppMain.java │ │ ├── LogAnalyzerTotal.java │ │ ├── LogAnalyzerWindowed.java │ │ ├── LogStatistics.java │ │ ├── ReadTransferStats.java │ │ └── Renderer.java ├── protobuf │ ├── address_book.proto │ └── places.proto └── scala │ └── com │ └── oreilly │ └── learningsparkexamples │ └── scala │ ├── BasicAvg.scala │ ├── BasicAvgFromFile.scala │ ├── BasicAvgFromFiles.scala │ ├── BasicAvgMapPartitions.scala │ ├── BasicAvgWithKryo.scala │ ├── BasicFilterUnionCombo.scala │ ├── BasicIntersectByKey.scala │ ├── BasicLoadNums.scala │ ├── BasicLoadSequenceFile.scala │ ├── BasicLoadTextFromFTP.scala │ ├── BasicMap.scala │ ├── BasicMapNoCache.scala │ ├── BasicMapPartitions.scala │ ├── BasicMapThenFilter.scala │ ├── BasicParseCsv.scala │ ├── BasicParseJson.scala │ ├── BasicParseJsonWithJackson.scala │ ├── BasicParseWholeFileCsv.scala │ ├── BasicQueryCassandra.scala │ ├── BasicSaveProtoBuf.scala │ ├── BasicSaveSequenceFile.scala │ ├── BasicStreamingExample.scala │ ├── BasicSum.scala │ ├── ChapterSixExample.scala │ ├── FlumeInput.scala │ ├── KafkaInput.scala │ ├── LoadHive.scala │ ├── LoadJsonWithElephantBird.scala │ ├── LoadJsonWithSparkSQL.scala │ ├── LoadKeyValueTextInput.scala │ ├── LoadSimpleJdbc.scala │ ├── MLlib.scala │ ├── MLlibPipeline.disabled_until_111 │ ├── PerKeyAvg.scala │ ├── PipeExample.scala │ ├── RemoveOutliers.scala │ ├── SparkSQLTwitter.scala │ ├── StreamingLogInput.scala │ ├── WordCount.scala │ ├── WriteSimpleDB.scala │ └── logs │ ├── LogAnalyzerAppMain.scala │ ├── LogAnalyzerTotal.scala │ ├── LogAnalyzerWindowed.scala │ └── ReadTransferStats.scala ├── perl └── splitwords.pl └── python ├── AvgMapPartitions.py ├── BasicAvg.py ├── BasicFilterMap.py ├── BasicKeyValueMapFilter.py ├── BasicMap.py ├── BasicMapPartitions.py ├── BasicSum.py ├── ChapterSixExample.py ├── IntersectByKey.py ├── LoadCsv.py ├── LoadHive.py ├── LoadJson.py ├── MLlib.py ├── MakeHiveTable.py ├── MakeParquetFile.py ├── PerKeyAvg.py ├── QueryParquetFile.py ├── QueryParuetFile.py ├── RemoveOutliers.py ├── SparkSQLTwitter.py └── WordCount.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/.gitignore -------------------------------------------------------------------------------- /.travis.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/.travis.yml -------------------------------------------------------------------------------- /DESCRIPTION: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/DESCRIPTION -------------------------------------------------------------------------------- /LICENSE.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/LICENSE.md -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/README.md -------------------------------------------------------------------------------- /bin/datagen.cmd: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/bin/datagen.cmd -------------------------------------------------------------------------------- /bin/fakelogs.cmd: -------------------------------------------------------------------------------- 1 | ncat -l 7777 -k -c datagen.cmd -------------------------------------------------------------------------------- /bin/fakelogs.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/bin/fakelogs.sh -------------------------------------------------------------------------------- /files/call_signs2.txt: -------------------------------------------------------------------------------- 1 | KK6JKQ 2 | -------------------------------------------------------------------------------- /files/callsign_tbl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/files/callsign_tbl -------------------------------------------------------------------------------- /files/callsign_tbl_sorted: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/files/callsign_tbl_sorted -------------------------------------------------------------------------------- /files/callsigns: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/files/callsigns -------------------------------------------------------------------------------- /files/cqlsh_setup: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/files/cqlsh_setup -------------------------------------------------------------------------------- /files/fake_logs/log1.log: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/files/fake_logs/log1.log -------------------------------------------------------------------------------- /files/fake_logs/log2.log: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/files/fake_logs/log2.log -------------------------------------------------------------------------------- /files/favourite_animals.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/files/favourite_animals.csv -------------------------------------------------------------------------------- /files/flumeconf.cfg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/files/flumeconf.cfg -------------------------------------------------------------------------------- /files/ham.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/files/ham.txt -------------------------------------------------------------------------------- /files/happypandas: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/files/happypandas -------------------------------------------------------------------------------- /files/int_string.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/files/int_string.csv -------------------------------------------------------------------------------- /files/pandainfo.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/files/pandainfo.json -------------------------------------------------------------------------------- /files/spam.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/files/spam.txt -------------------------------------------------------------------------------- /files/testweet.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/files/testweet.json -------------------------------------------------------------------------------- /mini-complete-example/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/mini-complete-example/README.md -------------------------------------------------------------------------------- /mini-complete-example/build.sbt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/mini-complete-example/build.sbt -------------------------------------------------------------------------------- /mini-complete-example/pom.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/mini-complete-example/pom.xml -------------------------------------------------------------------------------- /mini-complete-example/project/plugins.sbt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /mini-complete-example/sbt/sbt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/mini-complete-example/sbt/sbt -------------------------------------------------------------------------------- /mini-complete-example/src/main/java/com/oreilly/learningsparkexamples/mini/java/BasicMap.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/mini-complete-example/src/main/java/com/oreilly/learningsparkexamples/mini/java/BasicMap.java -------------------------------------------------------------------------------- /mini-complete-example/src/main/java/com/oreilly/learningsparkexamples/mini/java/WordCount.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/mini-complete-example/src/main/java/com/oreilly/learningsparkexamples/mini/java/WordCount.java -------------------------------------------------------------------------------- /mini-complete-example/src/main/scala/com/oreilly/learningsparkexamples/mini/scala/BasicMap.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/mini-complete-example/src/main/scala/com/oreilly/learningsparkexamples/mini/scala/BasicMap.scala -------------------------------------------------------------------------------- /mini-complete-example/src/main/scala/com/oreilly/learningsparkexamples/mini/scala/WordCount.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/mini-complete-example/src/main/scala/com/oreilly/learningsparkexamples/mini/scala/WordCount.scala -------------------------------------------------------------------------------- /pom.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/pom.xml -------------------------------------------------------------------------------- /project/plugins.sbt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/project/plugins.sbt -------------------------------------------------------------------------------- /run-all-examples: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/run-all-examples -------------------------------------------------------------------------------- /sbt/sbt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/sbt/sbt -------------------------------------------------------------------------------- /setup-project: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/setup-project -------------------------------------------------------------------------------- /src/R/finddistance.R: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/R/finddistance.R -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/BasicAvg.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/BasicAvg.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/BasicAvgMapPartitions.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/BasicAvgMapPartitions.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/BasicAvgWithKryo.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/BasicAvgWithKryo.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/BasicFlatMap.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/BasicFlatMap.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/BasicJoinCsv.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/BasicJoinCsv.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/BasicLoadJson.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/BasicLoadJson.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/BasicLoadSequenceFile.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/BasicLoadSequenceFile.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/BasicLoadWholeCsv.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/BasicLoadWholeCsv.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/BasicMap.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/BasicMap.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/BasicMapPartitions.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/BasicMapPartitions.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/BasicMapThenFilter.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/BasicMapThenFilter.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/BasicMapToDouble.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/BasicMapToDouble.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/BasicQueryCassandra.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/BasicQueryCassandra.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/BasicSaveSequenceFile.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/BasicSaveSequenceFile.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/BasicSum.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/BasicSum.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/CallLog.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/CallLog.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/ChapterSixExample.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/ChapterSixExample.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/HappyPerson.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/HappyPerson.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/IntersectByKey.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/IntersectByKey.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/KafkaInput.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/KafkaInput.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/KeyValueMapFilter.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/KeyValueMapFilter.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/LoadHive.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/LoadHive.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/LoadJsonWithSparkSQL.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/LoadJsonWithSparkSQL.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/MLlib.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/MLlib.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/PerKeyAvg.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/PerKeyAvg.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/RemoveOutliers.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/RemoveOutliers.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/SparkSQLTwitter.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/SparkSQLTwitter.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/StreamingLogInput.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/StreamingLogInput.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/WordCount.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/WordCount.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/logs/ApacheAccessLog.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/logs/ApacheAccessLog.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/logs/Flags.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/logs/Flags.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/logs/Functions.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/logs/Functions.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/logs/LogAnalyzerAppMain.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/logs/LogAnalyzerAppMain.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/logs/LogAnalyzerTotal.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/logs/LogAnalyzerTotal.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/logs/LogAnalyzerWindowed.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/logs/LogAnalyzerWindowed.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/logs/LogStatistics.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/logs/LogStatistics.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/logs/ReadTransferStats.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/logs/ReadTransferStats.java -------------------------------------------------------------------------------- /src/main/java/com/oreilly/learningsparkexamples/java/logs/Renderer.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/java/com/oreilly/learningsparkexamples/java/logs/Renderer.java -------------------------------------------------------------------------------- /src/main/protobuf/address_book.proto: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/protobuf/address_book.proto -------------------------------------------------------------------------------- /src/main/protobuf/places.proto: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/protobuf/places.proto -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicAvg.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicAvg.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicAvgFromFile.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicAvgFromFile.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicAvgFromFiles.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicAvgFromFiles.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicAvgMapPartitions.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicAvgMapPartitions.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicAvgWithKryo.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicAvgWithKryo.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicFilterUnionCombo.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicFilterUnionCombo.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicIntersectByKey.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicIntersectByKey.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicLoadNums.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicLoadNums.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicLoadSequenceFile.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicLoadSequenceFile.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicLoadTextFromFTP.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicLoadTextFromFTP.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicMap.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicMap.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicMapNoCache.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicMapNoCache.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicMapPartitions.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicMapPartitions.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicMapThenFilter.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicMapThenFilter.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicParseCsv.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicParseCsv.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicParseJson.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicParseJson.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicParseJsonWithJackson.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicParseJsonWithJackson.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicParseWholeFileCsv.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicParseWholeFileCsv.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicQueryCassandra.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicQueryCassandra.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicSaveProtoBuf.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicSaveProtoBuf.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicSaveSequenceFile.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicSaveSequenceFile.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicStreamingExample.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicStreamingExample.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/BasicSum.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/BasicSum.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/ChapterSixExample.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/ChapterSixExample.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/FlumeInput.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/FlumeInput.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/KafkaInput.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/KafkaInput.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/LoadHive.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/LoadHive.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/LoadJsonWithElephantBird.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/LoadJsonWithElephantBird.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/LoadJsonWithSparkSQL.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/LoadJsonWithSparkSQL.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/LoadKeyValueTextInput.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/LoadKeyValueTextInput.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/LoadSimpleJdbc.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/LoadSimpleJdbc.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/MLlib.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/MLlib.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/MLlibPipeline.disabled_until_111: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/MLlibPipeline.disabled_until_111 -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/PerKeyAvg.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/PerKeyAvg.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/PipeExample.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/PipeExample.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/RemoveOutliers.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/RemoveOutliers.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/SparkSQLTwitter.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/SparkSQLTwitter.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/StreamingLogInput.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/StreamingLogInput.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/WordCount.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/WordCount.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/WriteSimpleDB.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/WriteSimpleDB.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/logs/LogAnalyzerAppMain.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/logs/LogAnalyzerAppMain.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/logs/LogAnalyzerTotal.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/logs/LogAnalyzerTotal.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/logs/LogAnalyzerWindowed.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/logs/LogAnalyzerWindowed.scala -------------------------------------------------------------------------------- /src/main/scala/com/oreilly/learningsparkexamples/scala/logs/ReadTransferStats.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/main/scala/com/oreilly/learningsparkexamples/scala/logs/ReadTransferStats.scala -------------------------------------------------------------------------------- /src/perl/splitwords.pl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/perl/splitwords.pl -------------------------------------------------------------------------------- /src/python/AvgMapPartitions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/python/AvgMapPartitions.py -------------------------------------------------------------------------------- /src/python/BasicAvg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/python/BasicAvg.py -------------------------------------------------------------------------------- /src/python/BasicFilterMap.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/python/BasicFilterMap.py -------------------------------------------------------------------------------- /src/python/BasicKeyValueMapFilter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/python/BasicKeyValueMapFilter.py -------------------------------------------------------------------------------- /src/python/BasicMap.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/python/BasicMap.py -------------------------------------------------------------------------------- /src/python/BasicMapPartitions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/python/BasicMapPartitions.py -------------------------------------------------------------------------------- /src/python/BasicSum.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/python/BasicSum.py -------------------------------------------------------------------------------- /src/python/ChapterSixExample.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/python/ChapterSixExample.py -------------------------------------------------------------------------------- /src/python/IntersectByKey.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/python/IntersectByKey.py -------------------------------------------------------------------------------- /src/python/LoadCsv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/python/LoadCsv.py -------------------------------------------------------------------------------- /src/python/LoadHive.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/python/LoadHive.py -------------------------------------------------------------------------------- /src/python/LoadJson.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/python/LoadJson.py -------------------------------------------------------------------------------- /src/python/MLlib.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/python/MLlib.py -------------------------------------------------------------------------------- /src/python/MakeHiveTable.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/python/MakeHiveTable.py -------------------------------------------------------------------------------- /src/python/MakeParquetFile.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/python/MakeParquetFile.py -------------------------------------------------------------------------------- /src/python/PerKeyAvg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/python/PerKeyAvg.py -------------------------------------------------------------------------------- /src/python/QueryParquetFile.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/python/QueryParquetFile.py -------------------------------------------------------------------------------- /src/python/QueryParuetFile.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/python/QueryParuetFile.py -------------------------------------------------------------------------------- /src/python/RemoveOutliers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/python/RemoveOutliers.py -------------------------------------------------------------------------------- /src/python/SparkSQLTwitter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/python/SparkSQLTwitter.py -------------------------------------------------------------------------------- /src/python/WordCount.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/holdenk/learning-spark-examples/HEAD/src/python/WordCount.py --------------------------------------------------------------------------------