├── .gitattributes ├── .gitignore ├── LICENSE ├── README.md ├── Week1 ├── ClickHouse │ └── docker-compose.yml ├── Postgres │ ├── container-data │ │ └── postgres │ │ │ └── init.sql │ └── docker-compose.yaml ├── employee.png ├── help.txt └── practice.sql ├── Week2 ├── docker-hadoop │ ├── docker-compose.yml │ ├── hadoop.env │ ├── init4win7.bat │ └── tmp │ │ ├── data │ │ ├── checkdata.txt │ │ ├── checkdata2.txt │ │ ├── checkdata3.txt │ │ ├── checkdata4.txt │ │ └── checkdata5.txt │ │ ├── init │ │ └── init.sh │ │ ├── input │ │ ├── input1.txt │ │ └── input2.txt │ │ └── job │ │ └── mr-wordcount.jar └── help.txt ├── Week3 ├── Jupyter │ ├── docker-compose.yaml │ └── notebooks │ │ ├── .ipynb_checkpoints │ │ └── PySparkTasksTemplate-checkpoint.ipynb │ │ ├── PySparkTasksTemplate.ipynb │ │ ├── taxi_cars_data.parquet │ │ └── taxi_data.parquet ├── Project │ ├── PySparkJob.py │ └── clickstream.parquet ├── help.txt ├── spark-practice │ ├── PySpark.ipynb │ ├── PySparkTitanikJob.ipynb │ └── train.csv └── spark-tasks │ ├── PySparkTasksTemplate.ipynb │ ├── taxi_cars_data.parquet │ └── taxi_data.parquet ├── Week4 ├── Airflow │ ├── container-data │ │ └── airflow │ │ │ └── dags │ │ │ ├── calculate_dag.py │ │ │ ├── calculate_parallel_dag.py │ │ │ ├── dummy_dag.py │ │ │ └── hello_dag.py │ └── docker-compose.yaml └── help.txt ├── Week5 ├── SparkML │ ├── Project │ │ ├── PySparkMLFit.py │ │ ├── PySparkMLPredict.py │ │ ├── test.parquet │ │ └── train.parquet │ ├── spark-practice │ │ ├── TitanikSparkML.ipynb │ │ ├── cat_dog │ │ │ ├── PySparkMLDL.ipynb │ │ │ ├── cat_dog.zip │ │ │ ├── scala-logging_2.11-3.9.2.jar │ │ │ └── tensorframes-0.6.0-s_2.11.jar │ │ └── train.csv │ └── spark-tasks │ │ ├── SparkMLTemplate.ipynb │ │ ├── iris.parquet │ │ ├── linear_regression.parquet │ │ └── wine.parquet └── help.txt ├── Week6 ├── Superset │ ├── .env │ ├── config │ │ └── superset_config.py │ └── docker-compose.yaml └── help.txt └── workshops ├── 1. DB_Hadoop ├── CAP-Theorem.png ├── docker-hadoop │ ├── docker-compose.yml │ ├── hadoop.env │ ├── init4win.bat │ └── tmp │ │ ├── data │ │ ├── checkdata.txt │ │ ├── checkdata2.txt │ │ ├── checkdata3.txt │ │ ├── checkdata4.txt │ │ └── checkdata5.txt │ │ ├── init │ │ └── init.sh │ │ └── input │ │ └── input.txt └── hadoop-with-hive │ ├── README.md │ ├── data │ ├── create.sql │ ├── init.sh │ ├── users_20210501.csv │ └── users_20210502.csv │ ├── docker-compose.yml │ └── hadoop.env ├── 2. Spark ├── PySparkShow.ipynb ├── Spark │ ├── PySparkJob.py │ ├── docker-compose.yml │ └── help.txt ├── Streaming │ ├── WordStream │ │ ├── WordStream.py │ │ └── commands.txt │ └── docker-compose.yml └── taxi_data.parquet ├── 3. Airflow ├── container-data │ └── airflow │ │ └── dags │ │ ├── calculate_dag.py │ │ ├── calculate_parallel_dag.py │ │ ├── dummy_dag.py │ │ ├── hello_dag.py │ │ └── test_dag.py └── docker-compose.yaml └── 4. Spark ML ├── TitanikSparkML.ipynb ├── test.csv └── train.csv /.gitattributes: -------------------------------------------------------------------------------- 1 | *.sql linguist-detectable=false -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/README.md -------------------------------------------------------------------------------- /Week1/ClickHouse/docker-compose.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week1/ClickHouse/docker-compose.yml -------------------------------------------------------------------------------- /Week1/Postgres/container-data/postgres/init.sql: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week1/Postgres/container-data/postgres/init.sql -------------------------------------------------------------------------------- /Week1/Postgres/docker-compose.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week1/Postgres/docker-compose.yaml -------------------------------------------------------------------------------- /Week1/employee.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week1/employee.png -------------------------------------------------------------------------------- /Week1/help.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week1/help.txt -------------------------------------------------------------------------------- /Week1/practice.sql: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week1/practice.sql -------------------------------------------------------------------------------- /Week2/docker-hadoop/docker-compose.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week2/docker-hadoop/docker-compose.yml -------------------------------------------------------------------------------- /Week2/docker-hadoop/hadoop.env: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week2/docker-hadoop/hadoop.env -------------------------------------------------------------------------------- /Week2/docker-hadoop/init4win7.bat: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week2/docker-hadoop/init4win7.bat -------------------------------------------------------------------------------- /Week2/docker-hadoop/tmp/data/checkdata.txt: -------------------------------------------------------------------------------- 1 | Big Data = Big Issues 2 | -------------------------------------------------------------------------------- /Week2/docker-hadoop/tmp/data/checkdata2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week2/docker-hadoop/tmp/data/checkdata2.txt -------------------------------------------------------------------------------- /Week2/docker-hadoop/tmp/data/checkdata3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week2/docker-hadoop/tmp/data/checkdata3.txt -------------------------------------------------------------------------------- /Week2/docker-hadoop/tmp/data/checkdata4.txt: -------------------------------------------------------------------------------- 1 | Data4 2 | 3 | -------------------------------------------------------------------------------- /Week2/docker-hadoop/tmp/data/checkdata5.txt: -------------------------------------------------------------------------------- 1 | Data5 2 | 3 | -------------------------------------------------------------------------------- /Week2/docker-hadoop/tmp/init/init.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week2/docker-hadoop/tmp/init/init.sh -------------------------------------------------------------------------------- /Week2/docker-hadoop/tmp/input/input1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week2/docker-hadoop/tmp/input/input1.txt -------------------------------------------------------------------------------- /Week2/docker-hadoop/tmp/input/input2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week2/docker-hadoop/tmp/input/input2.txt -------------------------------------------------------------------------------- /Week2/docker-hadoop/tmp/job/mr-wordcount.jar: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week2/docker-hadoop/tmp/job/mr-wordcount.jar -------------------------------------------------------------------------------- /Week2/help.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week2/help.txt -------------------------------------------------------------------------------- /Week3/Jupyter/docker-compose.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week3/Jupyter/docker-compose.yaml -------------------------------------------------------------------------------- /Week3/Jupyter/notebooks/.ipynb_checkpoints/PySparkTasksTemplate-checkpoint.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week3/Jupyter/notebooks/.ipynb_checkpoints/PySparkTasksTemplate-checkpoint.ipynb -------------------------------------------------------------------------------- /Week3/Jupyter/notebooks/PySparkTasksTemplate.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week3/Jupyter/notebooks/PySparkTasksTemplate.ipynb -------------------------------------------------------------------------------- /Week3/Jupyter/notebooks/taxi_cars_data.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week3/Jupyter/notebooks/taxi_cars_data.parquet -------------------------------------------------------------------------------- /Week3/Jupyter/notebooks/taxi_data.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week3/Jupyter/notebooks/taxi_data.parquet -------------------------------------------------------------------------------- /Week3/Project/PySparkJob.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week3/Project/PySparkJob.py -------------------------------------------------------------------------------- /Week3/Project/clickstream.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week3/Project/clickstream.parquet -------------------------------------------------------------------------------- /Week3/help.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week3/help.txt -------------------------------------------------------------------------------- /Week3/spark-practice/PySpark.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week3/spark-practice/PySpark.ipynb -------------------------------------------------------------------------------- /Week3/spark-practice/PySparkTitanikJob.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week3/spark-practice/PySparkTitanikJob.ipynb -------------------------------------------------------------------------------- /Week3/spark-practice/train.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week3/spark-practice/train.csv -------------------------------------------------------------------------------- /Week3/spark-tasks/PySparkTasksTemplate.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week3/spark-tasks/PySparkTasksTemplate.ipynb -------------------------------------------------------------------------------- /Week3/spark-tasks/taxi_cars_data.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week3/spark-tasks/taxi_cars_data.parquet -------------------------------------------------------------------------------- /Week3/spark-tasks/taxi_data.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week3/spark-tasks/taxi_data.parquet -------------------------------------------------------------------------------- /Week4/Airflow/container-data/airflow/dags/calculate_dag.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week4/Airflow/container-data/airflow/dags/calculate_dag.py -------------------------------------------------------------------------------- /Week4/Airflow/container-data/airflow/dags/calculate_parallel_dag.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week4/Airflow/container-data/airflow/dags/calculate_parallel_dag.py -------------------------------------------------------------------------------- /Week4/Airflow/container-data/airflow/dags/dummy_dag.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week4/Airflow/container-data/airflow/dags/dummy_dag.py -------------------------------------------------------------------------------- /Week4/Airflow/container-data/airflow/dags/hello_dag.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week4/Airflow/container-data/airflow/dags/hello_dag.py -------------------------------------------------------------------------------- /Week4/Airflow/docker-compose.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week4/Airflow/docker-compose.yaml -------------------------------------------------------------------------------- /Week4/help.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week4/help.txt -------------------------------------------------------------------------------- /Week5/SparkML/Project/PySparkMLFit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week5/SparkML/Project/PySparkMLFit.py -------------------------------------------------------------------------------- /Week5/SparkML/Project/PySparkMLPredict.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week5/SparkML/Project/PySparkMLPredict.py -------------------------------------------------------------------------------- /Week5/SparkML/Project/test.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week5/SparkML/Project/test.parquet -------------------------------------------------------------------------------- /Week5/SparkML/Project/train.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week5/SparkML/Project/train.parquet -------------------------------------------------------------------------------- /Week5/SparkML/spark-practice/TitanikSparkML.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week5/SparkML/spark-practice/TitanikSparkML.ipynb -------------------------------------------------------------------------------- /Week5/SparkML/spark-practice/cat_dog/PySparkMLDL.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week5/SparkML/spark-practice/cat_dog/PySparkMLDL.ipynb -------------------------------------------------------------------------------- /Week5/SparkML/spark-practice/cat_dog/cat_dog.zip: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week5/SparkML/spark-practice/cat_dog/cat_dog.zip -------------------------------------------------------------------------------- /Week5/SparkML/spark-practice/cat_dog/scala-logging_2.11-3.9.2.jar: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week5/SparkML/spark-practice/cat_dog/scala-logging_2.11-3.9.2.jar -------------------------------------------------------------------------------- /Week5/SparkML/spark-practice/cat_dog/tensorframes-0.6.0-s_2.11.jar: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week5/SparkML/spark-practice/cat_dog/tensorframes-0.6.0-s_2.11.jar -------------------------------------------------------------------------------- /Week5/SparkML/spark-practice/train.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week5/SparkML/spark-practice/train.csv -------------------------------------------------------------------------------- /Week5/SparkML/spark-tasks/SparkMLTemplate.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week5/SparkML/spark-tasks/SparkMLTemplate.ipynb -------------------------------------------------------------------------------- /Week5/SparkML/spark-tasks/iris.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week5/SparkML/spark-tasks/iris.parquet -------------------------------------------------------------------------------- /Week5/SparkML/spark-tasks/linear_regression.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week5/SparkML/spark-tasks/linear_regression.parquet -------------------------------------------------------------------------------- /Week5/SparkML/spark-tasks/wine.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week5/SparkML/spark-tasks/wine.parquet -------------------------------------------------------------------------------- /Week5/help.txt: -------------------------------------------------------------------------------- 1 | Для работы необходимы: 2 | 1) Python 3.X+ 3 | 2) Jupyter Notebook 4 | 3) PySpark 5 | pip install pyspark -------------------------------------------------------------------------------- /Week6/Superset/.env: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week6/Superset/.env -------------------------------------------------------------------------------- /Week6/Superset/config/superset_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week6/Superset/config/superset_config.py -------------------------------------------------------------------------------- /Week6/Superset/docker-compose.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week6/Superset/docker-compose.yaml -------------------------------------------------------------------------------- /Week6/help.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/Week6/help.txt -------------------------------------------------------------------------------- /workshops/1. DB_Hadoop/CAP-Theorem.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/1. DB_Hadoop/CAP-Theorem.png -------------------------------------------------------------------------------- /workshops/1. DB_Hadoop/docker-hadoop/docker-compose.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/1. DB_Hadoop/docker-hadoop/docker-compose.yml -------------------------------------------------------------------------------- /workshops/1. DB_Hadoop/docker-hadoop/hadoop.env: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/1. DB_Hadoop/docker-hadoop/hadoop.env -------------------------------------------------------------------------------- /workshops/1. DB_Hadoop/docker-hadoop/init4win.bat: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/1. DB_Hadoop/docker-hadoop/init4win.bat -------------------------------------------------------------------------------- /workshops/1. DB_Hadoop/docker-hadoop/tmp/data/checkdata.txt: -------------------------------------------------------------------------------- 1 | Some data 2 | -------------------------------------------------------------------------------- /workshops/1. DB_Hadoop/docker-hadoop/tmp/data/checkdata2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/1. DB_Hadoop/docker-hadoop/tmp/data/checkdata2.txt -------------------------------------------------------------------------------- /workshops/1. DB_Hadoop/docker-hadoop/tmp/data/checkdata3.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/1. DB_Hadoop/docker-hadoop/tmp/data/checkdata3.txt -------------------------------------------------------------------------------- /workshops/1. DB_Hadoop/docker-hadoop/tmp/data/checkdata4.txt: -------------------------------------------------------------------------------- 1 | Data4 2 | 3 | -------------------------------------------------------------------------------- /workshops/1. DB_Hadoop/docker-hadoop/tmp/data/checkdata5.txt: -------------------------------------------------------------------------------- 1 | Data5 2 | 3 | -------------------------------------------------------------------------------- /workshops/1. DB_Hadoop/docker-hadoop/tmp/init/init.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/1. DB_Hadoop/docker-hadoop/tmp/init/init.sh -------------------------------------------------------------------------------- /workshops/1. DB_Hadoop/docker-hadoop/tmp/input/input.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/1. DB_Hadoop/docker-hadoop/tmp/input/input.txt -------------------------------------------------------------------------------- /workshops/1. DB_Hadoop/hadoop-with-hive/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/1. DB_Hadoop/hadoop-with-hive/README.md -------------------------------------------------------------------------------- /workshops/1. DB_Hadoop/hadoop-with-hive/data/create.sql: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/1. DB_Hadoop/hadoop-with-hive/data/create.sql -------------------------------------------------------------------------------- /workshops/1. DB_Hadoop/hadoop-with-hive/data/init.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/1. DB_Hadoop/hadoop-with-hive/data/init.sh -------------------------------------------------------------------------------- /workshops/1. DB_Hadoop/hadoop-with-hive/data/users_20210501.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/1. DB_Hadoop/hadoop-with-hive/data/users_20210501.csv -------------------------------------------------------------------------------- /workshops/1. DB_Hadoop/hadoop-with-hive/data/users_20210502.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/1. DB_Hadoop/hadoop-with-hive/data/users_20210502.csv -------------------------------------------------------------------------------- /workshops/1. DB_Hadoop/hadoop-with-hive/docker-compose.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/1. DB_Hadoop/hadoop-with-hive/docker-compose.yml -------------------------------------------------------------------------------- /workshops/1. DB_Hadoop/hadoop-with-hive/hadoop.env: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/1. DB_Hadoop/hadoop-with-hive/hadoop.env -------------------------------------------------------------------------------- /workshops/2. Spark/PySparkShow.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/2. Spark/PySparkShow.ipynb -------------------------------------------------------------------------------- /workshops/2. Spark/Spark/PySparkJob.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/2. Spark/Spark/PySparkJob.py -------------------------------------------------------------------------------- /workshops/2. Spark/Spark/docker-compose.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/2. Spark/Spark/docker-compose.yml -------------------------------------------------------------------------------- /workshops/2. Spark/Spark/help.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/2. Spark/Spark/help.txt -------------------------------------------------------------------------------- /workshops/2. Spark/Streaming/WordStream/WordStream.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/2. Spark/Streaming/WordStream/WordStream.py -------------------------------------------------------------------------------- /workshops/2. Spark/Streaming/WordStream/commands.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/2. Spark/Streaming/WordStream/commands.txt -------------------------------------------------------------------------------- /workshops/2. Spark/Streaming/docker-compose.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/2. Spark/Streaming/docker-compose.yml -------------------------------------------------------------------------------- /workshops/2. Spark/taxi_data.parquet: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/2. Spark/taxi_data.parquet -------------------------------------------------------------------------------- /workshops/3. Airflow/container-data/airflow/dags/calculate_dag.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/3. Airflow/container-data/airflow/dags/calculate_dag.py -------------------------------------------------------------------------------- /workshops/3. Airflow/container-data/airflow/dags/calculate_parallel_dag.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/3. Airflow/container-data/airflow/dags/calculate_parallel_dag.py -------------------------------------------------------------------------------- /workshops/3. Airflow/container-data/airflow/dags/dummy_dag.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/3. Airflow/container-data/airflow/dags/dummy_dag.py -------------------------------------------------------------------------------- /workshops/3. Airflow/container-data/airflow/dags/hello_dag.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/3. Airflow/container-data/airflow/dags/hello_dag.py -------------------------------------------------------------------------------- /workshops/3. Airflow/container-data/airflow/dags/test_dag.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/3. Airflow/container-data/airflow/dags/test_dag.py -------------------------------------------------------------------------------- /workshops/3. Airflow/docker-compose.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/3. Airflow/docker-compose.yaml -------------------------------------------------------------------------------- /workshops/4. Spark ML/TitanikSparkML.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/4. Spark ML/TitanikSparkML.ipynb -------------------------------------------------------------------------------- /workshops/4. Spark ML/test.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/4. Spark ML/test.csv -------------------------------------------------------------------------------- /workshops/4. Spark ML/train.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/AlexKbit/stepik-ds-course/HEAD/workshops/4. Spark ML/train.csv --------------------------------------------------------------------------------