├── KafkaProducer ├── .gitignore ├── Readme.md ├── build.sbt ├── data │ ├── 26GB │ │ ├── scatter_plot_1.png │ │ ├── scatter_plot_2.png │ │ ├── scatter_plot_4.png │ │ ├── scatter_plot_5.png │ │ ├── t11_jmap-histo │ │ └── t11_jstat │ ├── 5GB │ │ ├── jmap_output.txt │ │ ├── jstat_output.txt │ │ ├── scatter_plot1.png │ │ └── scatter_plot2.png │ ├── jmap_output.txt │ ├── jstat_output.txt │ ├── scatter_plot1.png │ └── scatter_plot2.png ├── project │ ├── build.properties │ └── plugins.sbt ├── sbt └── src │ └── main │ └── scala │ └── com │ └── github │ └── scrapcodes │ └── kafka │ ├── BenchmarkingProducer.scala │ ├── LowLatencyKafkaTest.scala │ └── SparkSQLKafkaConsumer.scala ├── MapReduceJobs ├── .classpath ├── .project ├── LICENSE ├── Readme.md ├── build.xml ├── lib │ ├── commoncrawl-0.1.jar │ ├── hadoop-core.jar │ ├── jets3t-0.8.1.jar │ └── jsoup-1.6.1.jar └── src │ └── com │ └── imaginea │ └── mapreducejobs │ ├── CountURLMapper.java │ ├── InverseWCJob.java │ ├── InverseWordCountMapper.java │ ├── StopWords.java │ └── URLAggregateJob.java ├── README.md ├── deep-dive-with-spark-streamingtathagata-dasspark-meetup2013-06-17-130623151510-phpapp02.pptx └── spark-news-master.zip /KafkaProducer/.gitignore: -------------------------------------------------------------------------------- 1 | target/ 2 | .idea/ 3 | *iml 4 | -------------------------------------------------------------------------------- /KafkaProducer/Readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/KafkaProducer/Readme.md -------------------------------------------------------------------------------- /KafkaProducer/build.sbt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/KafkaProducer/build.sbt -------------------------------------------------------------------------------- /KafkaProducer/data/26GB/scatter_plot_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/KafkaProducer/data/26GB/scatter_plot_1.png -------------------------------------------------------------------------------- /KafkaProducer/data/26GB/scatter_plot_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/KafkaProducer/data/26GB/scatter_plot_2.png -------------------------------------------------------------------------------- /KafkaProducer/data/26GB/scatter_plot_4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/KafkaProducer/data/26GB/scatter_plot_4.png -------------------------------------------------------------------------------- /KafkaProducer/data/26GB/scatter_plot_5.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/KafkaProducer/data/26GB/scatter_plot_5.png -------------------------------------------------------------------------------- /KafkaProducer/data/26GB/t11_jmap-histo: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/KafkaProducer/data/26GB/t11_jmap-histo -------------------------------------------------------------------------------- /KafkaProducer/data/26GB/t11_jstat: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/KafkaProducer/data/26GB/t11_jstat -------------------------------------------------------------------------------- /KafkaProducer/data/5GB/jmap_output.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/KafkaProducer/data/5GB/jmap_output.txt -------------------------------------------------------------------------------- /KafkaProducer/data/5GB/jstat_output.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/KafkaProducer/data/5GB/jstat_output.txt -------------------------------------------------------------------------------- /KafkaProducer/data/5GB/scatter_plot1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/KafkaProducer/data/5GB/scatter_plot1.png -------------------------------------------------------------------------------- /KafkaProducer/data/5GB/scatter_plot2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/KafkaProducer/data/5GB/scatter_plot2.png -------------------------------------------------------------------------------- /KafkaProducer/data/jmap_output.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/KafkaProducer/data/jmap_output.txt -------------------------------------------------------------------------------- /KafkaProducer/data/jstat_output.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/KafkaProducer/data/jstat_output.txt -------------------------------------------------------------------------------- /KafkaProducer/data/scatter_plot1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/KafkaProducer/data/scatter_plot1.png -------------------------------------------------------------------------------- /KafkaProducer/data/scatter_plot2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/KafkaProducer/data/scatter_plot2.png -------------------------------------------------------------------------------- /KafkaProducer/project/build.properties: -------------------------------------------------------------------------------- 1 | sbt.version = 0.13.8 -------------------------------------------------------------------------------- /KafkaProducer/project/plugins.sbt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/KafkaProducer/project/plugins.sbt -------------------------------------------------------------------------------- /KafkaProducer/sbt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/KafkaProducer/sbt -------------------------------------------------------------------------------- /KafkaProducer/src/main/scala/com/github/scrapcodes/kafka/BenchmarkingProducer.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/KafkaProducer/src/main/scala/com/github/scrapcodes/kafka/BenchmarkingProducer.scala -------------------------------------------------------------------------------- /KafkaProducer/src/main/scala/com/github/scrapcodes/kafka/LowLatencyKafkaTest.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/KafkaProducer/src/main/scala/com/github/scrapcodes/kafka/LowLatencyKafkaTest.scala -------------------------------------------------------------------------------- /KafkaProducer/src/main/scala/com/github/scrapcodes/kafka/SparkSQLKafkaConsumer.scala: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/KafkaProducer/src/main/scala/com/github/scrapcodes/kafka/SparkSQLKafkaConsumer.scala -------------------------------------------------------------------------------- /MapReduceJobs/.classpath: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/MapReduceJobs/.classpath -------------------------------------------------------------------------------- /MapReduceJobs/.project: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/MapReduceJobs/.project -------------------------------------------------------------------------------- /MapReduceJobs/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/MapReduceJobs/LICENSE -------------------------------------------------------------------------------- /MapReduceJobs/Readme.md: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /MapReduceJobs/build.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/MapReduceJobs/build.xml -------------------------------------------------------------------------------- /MapReduceJobs/lib/commoncrawl-0.1.jar: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/MapReduceJobs/lib/commoncrawl-0.1.jar -------------------------------------------------------------------------------- /MapReduceJobs/lib/hadoop-core.jar: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/MapReduceJobs/lib/hadoop-core.jar -------------------------------------------------------------------------------- /MapReduceJobs/lib/jets3t-0.8.1.jar: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/MapReduceJobs/lib/jets3t-0.8.1.jar -------------------------------------------------------------------------------- /MapReduceJobs/lib/jsoup-1.6.1.jar: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/MapReduceJobs/lib/jsoup-1.6.1.jar -------------------------------------------------------------------------------- /MapReduceJobs/src/com/imaginea/mapreducejobs/CountURLMapper.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/MapReduceJobs/src/com/imaginea/mapreducejobs/CountURLMapper.java -------------------------------------------------------------------------------- /MapReduceJobs/src/com/imaginea/mapreducejobs/InverseWCJob.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/MapReduceJobs/src/com/imaginea/mapreducejobs/InverseWCJob.java -------------------------------------------------------------------------------- /MapReduceJobs/src/com/imaginea/mapreducejobs/InverseWordCountMapper.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/MapReduceJobs/src/com/imaginea/mapreducejobs/InverseWordCountMapper.java -------------------------------------------------------------------------------- /MapReduceJobs/src/com/imaginea/mapreducejobs/StopWords.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/MapReduceJobs/src/com/imaginea/mapreducejobs/StopWords.java -------------------------------------------------------------------------------- /MapReduceJobs/src/com/imaginea/mapreducejobs/URLAggregateJob.java: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/MapReduceJobs/src/com/imaginea/mapreducejobs/URLAggregateJob.java -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/README.md -------------------------------------------------------------------------------- /deep-dive-with-spark-streamingtathagata-dasspark-meetup2013-06-17-130623151510-phpapp02.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/deep-dive-with-spark-streamingtathagata-dasspark-meetup2013-06-17-130623151510-phpapp02.pptx -------------------------------------------------------------------------------- /spark-news-master.zip: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/vaquarkhan/Apache-Kafka-poc-and-notes/HEAD/spark-news-master.zip --------------------------------------------------------------------------------