├── .env.spark ├── .gitignore ├── .isort.cfg ├── .pre-commit-config.yaml ├── .pydocstyle ├── .pylintrc ├── .relint.yml ├── Dockerfile ├── Dockerfile-yarn ├── LICENSE ├── Makefile ├── Readme.md ├── book_data ├── 2019-01-01.csv ├── BroadcastLogs_2018_Q3_M8-SAMPLE.csv ├── Periodic_Table_Of_Elements.csv ├── ReferenceTables │ ├── BroadcastProducers.csv │ ├── CD_AirLanguage.csv │ ├── CD_AudienceTargetAge.csv │ ├── CD_AudienceTargetEthnic.csv │ ├── CD_BroadcastOriginPoint.csv │ ├── CD_Category.csv │ ├── CD_ClosedCaption.csv │ ├── CD_Composition.csv │ ├── CD_CountryOfOrigin.csv │ ├── CD_DubDramaCredit.csv │ ├── CD_EthnicProgram.csv │ ├── CD_Exhibition.csv │ ├── CD_FilmClassification.csv │ ├── CD_NetworkAffiliation.csv │ ├── CD_ProductionSource.csv │ ├── CD_ProgramClass.csv │ ├── CD_SpecialAttention.csv │ ├── Call_Signs.csv │ └── LogIdentifier.csv ├── pokedex.dsv ├── pride-and-prejudice.txt ├── sample.csv ├── sample_frame.csv ├── shows-breaking-bad.json ├── shows-silicon-valley.json └── shows-the-golden-girls.json ├── conf └── spark-defaults.conf ├── docker-compose.yarn.yml ├── docker-compose.yml ├── entrypoint-yarn.sh ├── entrypoint.sh ├── requirements ├── requirements.in └── requirements.txt ├── spark_apps └── data_analysis_book │ ├── chapter02 │ ├── ex2.py │ └── word_non_null.py │ ├── chapter03 │ ├── ex3_3.py │ ├── ex3_4.py │ ├── ex3_5.py │ ├── ex3_5_2.py │ ├── word_non_null.py │ ├── word_non_null_short.py │ └── word_non_null_short_multiple_files.py │ ├── chapter04 │ ├── broadcast_logs.py │ ├── broadcast_logs_new_column.py │ ├── broadcast_logs_stats.py │ ├── broadcast_logs_tidy.py │ ├── broadcast_logs_unpacking.py │ ├── ex4_1.py │ ├── ex4_3.py │ ├── ex4_4.py │ └── tabular_data.py │ ├── chapter05 │ ├── broadcast_logs.py │ ├── broadcast_logs_naming.py │ ├── ex5.py │ ├── ex5_5.py │ ├── ex5_6.py │ └── ex5_7.py │ ├── chapter06 │ ├── defining_schema.py │ ├── defining_schema_json.py │ ├── ex6.py │ ├── ex6_6.py │ ├── ex6_7.py │ ├── ex6_8.py │ ├── reading_json.py │ ├── reading_json_explode_collect.py │ └── reading_json_struct.py │ └── chapter07 │ ├── backblaze.py │ ├── blending_sql_python.py │ ├── creating_view.py │ ├── download_backblaze_data.py │ ├── ex7_2.py │ ├── ex7_3.py │ ├── ex7_4.py │ ├── ex7_5.py │ ├── periodic_table.py │ ├── spark_catalog.py │ ├── sql_querying.py │ └── subquery_cte.py ├── ssh_config └── yarn ├── capacity-scheduler.xml ├── core-site.xml ├── hdfs-site.xml ├── mapred-site.xml ├── spark-defaults.conf └── yarn-site.xml /.env.spark: -------------------------------------------------------------------------------- 1 | SPARK_NO_DAEMONIZE=true 2 | -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/.gitignore -------------------------------------------------------------------------------- /.isort.cfg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/.isort.cfg -------------------------------------------------------------------------------- /.pre-commit-config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/.pre-commit-config.yaml -------------------------------------------------------------------------------- /.pydocstyle: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/.pydocstyle -------------------------------------------------------------------------------- /.pylintrc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/.pylintrc -------------------------------------------------------------------------------- /.relint.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/.relint.yml -------------------------------------------------------------------------------- /Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/Dockerfile -------------------------------------------------------------------------------- /Dockerfile-yarn: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/Dockerfile-yarn -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/LICENSE -------------------------------------------------------------------------------- /Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/Makefile -------------------------------------------------------------------------------- /Readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/Readme.md -------------------------------------------------------------------------------- /book_data/2019-01-01.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/2019-01-01.csv -------------------------------------------------------------------------------- /book_data/BroadcastLogs_2018_Q3_M8-SAMPLE.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/BroadcastLogs_2018_Q3_M8-SAMPLE.csv -------------------------------------------------------------------------------- /book_data/Periodic_Table_Of_Elements.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/Periodic_Table_Of_Elements.csv -------------------------------------------------------------------------------- /book_data/ReferenceTables/BroadcastProducers.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/ReferenceTables/BroadcastProducers.csv -------------------------------------------------------------------------------- /book_data/ReferenceTables/CD_AirLanguage.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/ReferenceTables/CD_AirLanguage.csv -------------------------------------------------------------------------------- /book_data/ReferenceTables/CD_AudienceTargetAge.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/ReferenceTables/CD_AudienceTargetAge.csv -------------------------------------------------------------------------------- /book_data/ReferenceTables/CD_AudienceTargetEthnic.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/ReferenceTables/CD_AudienceTargetEthnic.csv -------------------------------------------------------------------------------- /book_data/ReferenceTables/CD_BroadcastOriginPoint.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/ReferenceTables/CD_BroadcastOriginPoint.csv -------------------------------------------------------------------------------- /book_data/ReferenceTables/CD_Category.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/ReferenceTables/CD_Category.csv -------------------------------------------------------------------------------- /book_data/ReferenceTables/CD_ClosedCaption.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/ReferenceTables/CD_ClosedCaption.csv -------------------------------------------------------------------------------- /book_data/ReferenceTables/CD_Composition.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/ReferenceTables/CD_Composition.csv -------------------------------------------------------------------------------- /book_data/ReferenceTables/CD_CountryOfOrigin.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/ReferenceTables/CD_CountryOfOrigin.csv -------------------------------------------------------------------------------- /book_data/ReferenceTables/CD_DubDramaCredit.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/ReferenceTables/CD_DubDramaCredit.csv -------------------------------------------------------------------------------- /book_data/ReferenceTables/CD_EthnicProgram.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/ReferenceTables/CD_EthnicProgram.csv -------------------------------------------------------------------------------- /book_data/ReferenceTables/CD_Exhibition.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/ReferenceTables/CD_Exhibition.csv -------------------------------------------------------------------------------- /book_data/ReferenceTables/CD_FilmClassification.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/ReferenceTables/CD_FilmClassification.csv -------------------------------------------------------------------------------- /book_data/ReferenceTables/CD_NetworkAffiliation.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/ReferenceTables/CD_NetworkAffiliation.csv -------------------------------------------------------------------------------- /book_data/ReferenceTables/CD_ProductionSource.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/ReferenceTables/CD_ProductionSource.csv -------------------------------------------------------------------------------- /book_data/ReferenceTables/CD_ProgramClass.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/ReferenceTables/CD_ProgramClass.csv -------------------------------------------------------------------------------- /book_data/ReferenceTables/CD_SpecialAttention.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/ReferenceTables/CD_SpecialAttention.csv -------------------------------------------------------------------------------- /book_data/ReferenceTables/Call_Signs.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/ReferenceTables/Call_Signs.csv -------------------------------------------------------------------------------- /book_data/ReferenceTables/LogIdentifier.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/ReferenceTables/LogIdentifier.csv -------------------------------------------------------------------------------- /book_data/pokedex.dsv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/pokedex.dsv -------------------------------------------------------------------------------- /book_data/pride-and-prejudice.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/pride-and-prejudice.txt -------------------------------------------------------------------------------- /book_data/sample.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/sample.csv -------------------------------------------------------------------------------- /book_data/sample_frame.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/sample_frame.csv -------------------------------------------------------------------------------- /book_data/shows-breaking-bad.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/shows-breaking-bad.json -------------------------------------------------------------------------------- /book_data/shows-silicon-valley.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/shows-silicon-valley.json -------------------------------------------------------------------------------- /book_data/shows-the-golden-girls.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/book_data/shows-the-golden-girls.json -------------------------------------------------------------------------------- /conf/spark-defaults.conf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/conf/spark-defaults.conf -------------------------------------------------------------------------------- /docker-compose.yarn.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/docker-compose.yarn.yml -------------------------------------------------------------------------------- /docker-compose.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/docker-compose.yml -------------------------------------------------------------------------------- /entrypoint-yarn.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/entrypoint-yarn.sh -------------------------------------------------------------------------------- /entrypoint.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/entrypoint.sh -------------------------------------------------------------------------------- /requirements/requirements.in: -------------------------------------------------------------------------------- 1 | ipython 2 | pandas 3 | pyarrow 4 | numpy 5 | pyspark 6 | -------------------------------------------------------------------------------- /requirements/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/requirements/requirements.txt -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter02/ex2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter02/ex2.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter02/word_non_null.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter02/word_non_null.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter03/ex3_3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter03/ex3_3.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter03/ex3_4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter03/ex3_4.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter03/ex3_5.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter03/ex3_5.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter03/ex3_5_2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter03/ex3_5_2.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter03/word_non_null.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter03/word_non_null.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter03/word_non_null_short.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter03/word_non_null_short.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter03/word_non_null_short_multiple_files.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter03/word_non_null_short_multiple_files.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter04/broadcast_logs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter04/broadcast_logs.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter04/broadcast_logs_new_column.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter04/broadcast_logs_new_column.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter04/broadcast_logs_stats.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter04/broadcast_logs_stats.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter04/broadcast_logs_tidy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter04/broadcast_logs_tidy.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter04/broadcast_logs_unpacking.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter04/broadcast_logs_unpacking.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter04/ex4_1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter04/ex4_1.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter04/ex4_3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter04/ex4_3.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter04/ex4_4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter04/ex4_4.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter04/tabular_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter04/tabular_data.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter05/broadcast_logs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter05/broadcast_logs.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter05/broadcast_logs_naming.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter05/broadcast_logs_naming.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter05/ex5.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter05/ex5.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter05/ex5_5.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter05/ex5_5.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter05/ex5_6.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter05/ex5_6.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter05/ex5_7.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter05/ex5_7.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter06/defining_schema.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter06/defining_schema.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter06/defining_schema_json.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter06/defining_schema_json.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter06/ex6.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter06/ex6.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter06/ex6_6.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter06/ex6_6.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter06/ex6_7.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter06/ex6_7.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter06/ex6_8.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter06/ex6_8.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter06/reading_json.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter06/reading_json.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter06/reading_json_explode_collect.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter06/reading_json_explode_collect.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter06/reading_json_struct.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter06/reading_json_struct.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter07/backblaze.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter07/backblaze.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter07/blending_sql_python.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter07/blending_sql_python.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter07/creating_view.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter07/creating_view.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter07/download_backblaze_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter07/download_backblaze_data.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter07/ex7_2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter07/ex7_2.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter07/ex7_3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter07/ex7_3.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter07/ex7_4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter07/ex7_4.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter07/ex7_5.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter07/ex7_5.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter07/periodic_table.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter07/periodic_table.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter07/spark_catalog.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter07/spark_catalog.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter07/sql_querying.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter07/sql_querying.py -------------------------------------------------------------------------------- /spark_apps/data_analysis_book/chapter07/subquery_cte.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/spark_apps/data_analysis_book/chapter07/subquery_cte.py -------------------------------------------------------------------------------- /ssh_config: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/ssh_config -------------------------------------------------------------------------------- /yarn/capacity-scheduler.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/yarn/capacity-scheduler.xml -------------------------------------------------------------------------------- /yarn/core-site.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/yarn/core-site.xml -------------------------------------------------------------------------------- /yarn/hdfs-site.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/yarn/hdfs-site.xml -------------------------------------------------------------------------------- /yarn/mapred-site.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/yarn/mapred-site.xml -------------------------------------------------------------------------------- /yarn/spark-defaults.conf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/yarn/spark-defaults.conf -------------------------------------------------------------------------------- /yarn/yarn-site.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/mrn-aglic/pyspark-playground/HEAD/yarn/yarn-site.xml --------------------------------------------------------------------------------