├── .gitignore ├── .travis.yml ├── AUTHORS ├── Dockerfile ├── Dockerfile-gpu ├── LICENSE ├── README.md ├── bin ├── flux └── test_example ├── deploy ├── docker │ ├── docker_build.sh │ ├── docker_build_gpu.sh │ ├── docker_build_hdfs.sh │ ├── docker_build_ros.sh │ ├── docker_build_ros_gpu.sh │ ├── flux │ │ ├── Dockerfile │ │ ├── Dockerfile-gpu │ │ ├── README.md │ │ ├── jupyterhub_config.py │ │ ├── lib │ │ │ ├── protobuf-java-3.3.0.jar │ │ │ ├── rosbaginputformat.jar │ │ │ ├── rosbaginputformat_2.11-0.9.8.jar │ │ │ └── scala-library-2.11.8.jar │ │ └── spark-ex-kubernetes.sh │ ├── hdfs4k8s │ │ ├── Dockerfile-datanode │ │ ├── Dockerfile-namenode │ │ ├── run-dn.sh │ │ └── run-nn.sh │ └── ros_base │ │ ├── Dockerfile │ │ ├── Dockerfile-gpu │ │ ├── README.txt │ │ └── ros_entrypoint.sh └── kubernetes │ ├── distributed │ ├── README.md │ ├── flux │ ├── flux-init │ ├── hdfs-flux │ │ ├── .helmignore │ │ ├── Chart.yaml │ │ ├── templates │ │ │ ├── NOTES.txt │ │ │ ├── _helpers.tpl │ │ │ ├── dn-ds.yaml │ │ │ ├── hdfs-cm.yaml │ │ │ ├── nn-pod.yaml │ │ │ └── nn-svc.yaml │ │ └── values.yaml │ ├── hdfs-pv │ │ ├── .helmignore │ │ ├── Chart.yaml │ │ ├── templates │ │ │ ├── NOTES.txt │ │ │ ├── _helpers.tpl │ │ │ ├── dn-pv.yaml │ │ │ └── nn-pv.yaml │ │ └── values.yaml │ └── hdfs-pvc │ │ ├── Chart.yaml │ │ ├── templates │ │ ├── _helpers.tpl │ │ ├── dn-pvc.yaml │ │ └── nn-pvc.yaml │ │ └── values.yaml │ ├── flux-ros-hadoop-deployment.yml │ ├── flux-ros-hadoop-gpu-deployment.yml │ ├── flux-ros-hadoop-gpu-service.yml │ └── flux-ros-hadoop-service.yml ├── examples ├── Tutorial.ipynb ├── concept.png ├── data-exploration.ipynb ├── drive-obj-detect.mp4 ├── drive-stats.mp4 ├── header.png ├── lane_detector.py ├── line.py ├── map.png ├── object_detection_model.py ├── object_detector.py ├── rosbag-larger-than-2-GB.ipynb ├── sample-use-cases.ipynb └── utils.py └── images ├── flux_cloud.png ├── flux_overview.png ├── login_notebook.png └── sample_notebook.png /.gitignore: 
-------------------------------------------------------------------------------- 1 | .DS_Store 2 | .ipynb_checkpoints/ 3 | metastore_db/ 4 | target/ 5 | derby.log 6 | *bag 7 | dist/ 8 | -------------------------------------------------------------------------------- /.travis.yml: -------------------------------------------------------------------------------- 1 | sudo: required 2 | 3 | language: python 4 | 5 | env: 6 | - CHANGE_MINIKUBE_NONE_USER=true 7 | 8 | services: 9 | - docker 10 | 11 | before_script: 12 | # install minikube 13 | - curl -Lo kubectl https://storage.googleapis.com/kubernetes-release/release/v1.9.0/bin/linux/amd64/kubectl && chmod +x kubectl && sudo mv kubectl /usr/local/bin/ 14 | - curl -Lo minikube https://storage.googleapis.com/minikube/releases/v0.25.2/minikube-linux-amd64 && chmod +x minikube && sudo mv minikube /usr/local/bin/ 15 | - minikube config set WantReportErrorPrompt false 16 | - sudo minikube start --vm-driver=none --kubernetes-version=v1.9.0 17 | - minikube update-context 18 | - JSONPATH='{range .items[*]}{@.metadata.name}:{range @.status.conditions[*]}{@.type}={@.status};{end}{end}'; until kubectl get nodes -o jsonpath="$JSONPATH" 2>&1 | grep -q "Ready=True"; do sleep 1; done 19 | - kubectl cluster-info 20 | - curl https://raw.githubusercontent.com/kubernetes/helm/master/scripts/get > get_helm.sh 21 | - chmod 700 get_helm.sh 22 | - sudo ./get_helm.sh 23 | - helm init 24 | 25 | script: 26 | - ./bin/flux build 27 | # - ./deploy/docker/docker_build_ros_gpu.sh 28 | # - ./deploy/docker/docker_build_gpu.sh 29 | - ./bin/flux start 30 | - sleep 10 # TODO: avoid sleep 31 | - ./bin/flux ps 32 | # TODO: activate once working - (cd examples && find . 
-name '*.ipynb') | xargs ./bin/test_example 33 | - ./bin/flux stop 34 | - ./bin/flux purge 35 | -------------------------------------------------------------------------------- /AUTHORS: -------------------------------------------------------------------------------- 1 | # This is the official list of Flux authors for copyright purposes. 2 | # This file is distinct from the CONTRIBUTORS files. 3 | # See the latter for an explanation. 4 | 5 | # Names should be added to this file as: 6 | # Name or Organization 7 | # The email address is not required for organizations. 8 | 9 | Jan Wiegelmann git@wiegelmann.net 10 | Adrian Achihăei vasco@consultant.com 11 | Seunghan Han hanseunghan@gmail.com 12 | Karthikeya Sampa Subbarao karthikeya108@gmail.com 13 | -------------------------------------------------------------------------------- /Dockerfile: -------------------------------------------------------------------------------- 1 | FROM fluxproject/flux 2 | 3 | COPY examples/* /opt/ros_hadoop/latest/doc/ 4 | RUN chmod -R 777 /opt/ros_hadoop/latest/doc 5 | -------------------------------------------------------------------------------- /Dockerfile-gpu: -------------------------------------------------------------------------------- 1 | FROM fluxproject/flux_gpu 2 | 3 | COPY examples/* /opt/ros_hadoop/latest/doc/ 4 | RUN chmod -R 777 /opt/ros_hadoop/latest/doc 5 | -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | Apache License 2 | Version 2.0, January 2004 3 | http://www.apache.org/licenses/ 4 | 5 | TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION 6 | 7 | 1. Definitions. 8 | 9 | "License" shall mean the terms and conditions for use, reproduction, 10 | and distribution as defined by Sections 1 through 9 of this document. 
11 | 12 | "Licensor" shall mean the copyright owner or entity authorized by 13 | the copyright owner that is granting the License. 14 | 15 | "Legal Entity" shall mean the union of the acting entity and all 16 | other entities that control, are controlled by, or are under common 17 | control with that entity. For the purposes of this definition, 18 | "control" means (i) the power, direct or indirect, to cause the 19 | direction or management of such entity, whether by contract or 20 | otherwise, or (ii) ownership of fifty percent (50%) or more of the 21 | outstanding shares, or (iii) beneficial ownership of such entity. 22 | 23 | "You" (or "Your") shall mean an individual or Legal Entity 24 | exercising permissions granted by this License. 25 | 26 | "Source" form shall mean the preferred form for making modifications, 27 | including but not limited to software source code, documentation 28 | source, and configuration files. 29 | 30 | "Object" form shall mean any form resulting from mechanical 31 | transformation or translation of a Source form, including but 32 | not limited to compiled object code, generated documentation, 33 | and conversions to other media types. 34 | 35 | "Work" shall mean the work of authorship, whether in Source or 36 | Object form, made available under the License, as indicated by a 37 | copyright notice that is included in or attached to the work 38 | (an example is provided in the Appendix below). 39 | 40 | "Derivative Works" shall mean any work, whether in Source or Object 41 | form, that is based on (or derived from) the Work and for which the 42 | editorial revisions, annotations, elaborations, or other modifications 43 | represent, as a whole, an original work of authorship. For the purposes 44 | of this License, Derivative Works shall not include works that remain 45 | separable from, or merely link (or bind by name) to the interfaces of, 46 | the Work and Derivative Works thereof. 
47 | 48 | "Contribution" shall mean any work of authorship, including 49 | the original version of the Work and any modifications or additions 50 | to that Work or Derivative Works thereof, that is intentionally 51 | submitted to Licensor for inclusion in the Work by the copyright owner 52 | or by an individual or Legal Entity authorized to submit on behalf of 53 | the copyright owner. For the purposes of this definition, "submitted" 54 | means any form of electronic, verbal, or written communication sent 55 | to the Licensor or its representatives, including but not limited to 56 | communication on electronic mailing lists, source code control systems, 57 | and issue tracking systems that are managed by, or on behalf of, the 58 | Licensor for the purpose of discussing and improving the Work, but 59 | excluding communication that is conspicuously marked or otherwise 60 | designated in writing by the copyright owner as "Not a Contribution." 61 | 62 | "Contributor" shall mean Licensor and any individual or Legal Entity 63 | on behalf of whom a Contribution has been received by Licensor and 64 | subsequently incorporated within the Work. 65 | 66 | 2. Grant of Copyright License. Subject to the terms and conditions of 67 | this License, each Contributor hereby grants to You a perpetual, 68 | worldwide, non-exclusive, no-charge, royalty-free, irrevocable 69 | copyright license to reproduce, prepare Derivative Works of, 70 | publicly display, publicly perform, sublicense, and distribute the 71 | Work and such Derivative Works in Source or Object form. 72 | 73 | 3. Grant of Patent License. 
Subject to the terms and conditions of 74 | this License, each Contributor hereby grants to You a perpetual, 75 | worldwide, non-exclusive, no-charge, royalty-free, irrevocable 76 | (except as stated in this section) patent license to make, have made, 77 | use, offer to sell, sell, import, and otherwise transfer the Work, 78 | where such license applies only to those patent claims licensable 79 | by such Contributor that are necessarily infringed by their 80 | Contribution(s) alone or by combination of their Contribution(s) 81 | with the Work to which such Contribution(s) was submitted. If You 82 | institute patent litigation against any entity (including a 83 | cross-claim or counterclaim in a lawsuit) alleging that the Work 84 | or a Contribution incorporated within the Work constitutes direct 85 | or contributory patent infringement, then any patent licenses 86 | granted to You under this License for that Work shall terminate 87 | as of the date such litigation is filed. 88 | 89 | 4. Redistribution. 
You may reproduce and distribute copies of the 90 | Work or Derivative Works thereof in any medium, with or without 91 | modifications, and in Source or Object form, provided that You 92 | meet the following conditions: 93 | 94 | (a) You must give any other recipients of the Work or 95 | Derivative Works a copy of this License; and 96 | 97 | (b) You must cause any modified files to carry prominent notices 98 | stating that You changed the files; and 99 | 100 | (c) You must retain, in the Source form of any Derivative Works 101 | that You distribute, all copyright, patent, trademark, and 102 | attribution notices from the Source form of the Work, 103 | excluding those notices that do not pertain to any part of 104 | the Derivative Works; and 105 | 106 | (d) If the Work includes a "NOTICE" text file as part of its 107 | distribution, then any Derivative Works that You distribute must 108 | include a readable copy of the attribution notices contained 109 | within such NOTICE file, excluding those notices that do not 110 | pertain to any part of the Derivative Works, in at least one 111 | of the following places: within a NOTICE text file distributed 112 | as part of the Derivative Works; within the Source form or 113 | documentation, if provided along with the Derivative Works; or, 114 | within a display generated by the Derivative Works, if and 115 | wherever such third-party notices normally appear. The contents 116 | of the NOTICE file are for informational purposes only and 117 | do not modify the License. You may add Your own attribution 118 | notices within Derivative Works that You distribute, alongside 119 | or as an addendum to the NOTICE text from the Work, provided 120 | that such additional attribution notices cannot be construed 121 | as modifying the License. 
122 | 123 | You may add Your own copyright statement to Your modifications and 124 | may provide additional or different license terms and conditions 125 | for use, reproduction, or distribution of Your modifications, or 126 | for any such Derivative Works as a whole, provided Your use, 127 | reproduction, and distribution of the Work otherwise complies with 128 | the conditions stated in this License. 129 | 130 | 5. Submission of Contributions. Unless You explicitly state otherwise, 131 | any Contribution intentionally submitted for inclusion in the Work 132 | by You to the Licensor shall be under the terms and conditions of 133 | this License, without any additional terms or conditions. 134 | Notwithstanding the above, nothing herein shall supersede or modify 135 | the terms of any separate license agreement you may have executed 136 | with Licensor regarding such Contributions. 137 | 138 | 6. Trademarks. This License does not grant permission to use the trade 139 | names, trademarks, service marks, or product names of the Licensor, 140 | except as required for reasonable and customary use in describing the 141 | origin of the Work and reproducing the content of the NOTICE file. 142 | 143 | 7. Disclaimer of Warranty. Unless required by applicable law or 144 | agreed to in writing, Licensor provides the Work (and each 145 | Contributor provides its Contributions) on an "AS IS" BASIS, 146 | WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or 147 | implied, including, without limitation, any warranties or conditions 148 | of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A 149 | PARTICULAR PURPOSE. You are solely responsible for determining the 150 | appropriateness of using or redistributing the Work and assume any 151 | risks associated with Your exercise of permissions under this License. 152 | 153 | 8. Limitation of Liability. 
In no event and under no legal theory, 154 | whether in tort (including negligence), contract, or otherwise, 155 | unless required by applicable law (such as deliberate and grossly 156 | negligent acts) or agreed to in writing, shall any Contributor be 157 | liable to You for damages, including any direct, indirect, special, 158 | incidental, or consequential damages of any character arising as a 159 | result of this License or out of the use or inability to use the 160 | Work (including but not limited to damages for loss of goodwill, 161 | work stoppage, computer failure or malfunction, or any and all 162 | other commercial damages or losses), even if such Contributor 163 | has been advised of the possibility of such damages. 164 | 165 | 9. Accepting Warranty or Additional Liability. While redistributing 166 | the Work or Derivative Works thereof, You may choose to offer, 167 | and charge a fee for, acceptance of support, warranty, indemnity, 168 | or other liability obligations and/or rights consistent with this 169 | License. However, in accepting such obligations, You may act only 170 | on Your own behalf and on Your sole responsibility, not on behalf 171 | of any other Contributor, and only if You agree to indemnify, 172 | defend, and hold each Contributor harmless for any liability 173 | incurred by, or claims asserted against, such Contributor by reason 174 | of your accepting any such warranty or additional liability. 175 | 176 | END OF TERMS AND CONDITIONS 177 | 178 | APPENDIX: How to apply the Apache License to your work. 179 | 180 | To apply the Apache License to your work, attach the following 181 | boilerplate notice, with the fields enclosed by brackets "[]" 182 | replaced with your own identifying information. (Don't include 183 | the brackets!) The text should be enclosed in the appropriate 184 | comment syntax for the file format. 
We also recommend that a 185 | file or class name and description of purpose be included on the 186 | same "printed page" as the copyright notice for easier 187 | identification within third-party archives. 188 | 189 | Copyright [yyyy] [name of copyright owner] 190 | 191 | Licensed under the Apache License, Version 2.0 (the "License"); 192 | you may not use this file except in compliance with the License. 193 | You may obtain a copy of the License at 194 | 195 | http://www.apache.org/licenses/LICENSE-2.0 196 | 197 | Unless required by applicable law or agreed to in writing, software 198 | distributed under the License is distributed on an "AS IS" BASIS, 199 | WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 200 | See the License for the specific language governing permissions and 201 | limitations under the License. 202 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | [![Build Status](https://travis-ci.org/flux-project/flux.svg?branch=master)](https://travis-ci.org/flux-project/flux) 2 | [![Docker Automation](https://img.shields.io/docker/automated/fluxproject/flux.svg)](https://hub.docker.com/r/fluxproject/flux/) 3 | [![Docker Build Status](https://img.shields.io/docker/build/fluxproject/flux.svg)](https://hub.docker.com/r/fluxproject/flux/) 4 | 5 | # Flux Project 6 | 7 | Autodeploy a complete end-to-end machine/deep learning pipeline on Kubernetes using tools like Spark, TensorFlow, HDFS, etc. - it requires a running Kubernetes (K8s) cluster in the cloud or on-premise. 
8 | 9 | Please visit the [website for updates.](http://flux-project.org/ "Flux Project") 10 | 11 | 12 | 13 | ### Prerequisites 14 | Before installing the components, make sure you have installed: 15 | * [Docker](https://www.docker.com/get-docker) 16 | The Edge version of Docker Community Edition comes with a Kubernetes option. 17 | * [Kubernetes](https://kubernetes.io/) 18 | * [Helm](https://helm.sh/) 19 | The package manager for Kubernetes. 20 | 21 | ### Deploy on nodes 22 | 23 | `./bin/flux` will check for GPU availability and make use of it if it can find a GPU. 24 | 25 | 1. Build the images 26 | ```bash 27 | ./bin/flux build 28 | ``` 29 | Note that the images need to be deployed to your nodes or pushed to your Docker registry. 30 | 31 | 1. Create the deployment and the service with Kubernetes 32 | ```bash 33 | ./bin/flux start 34 | ``` 35 | 36 | 1. Check that all components are running 37 | ```bash 38 | ./bin/flux ps 39 | ``` 40 | 41 | ### Accessing the sample notebooks: 42 | 43 | ```bash 44 | ./bin/flux notebook 45 | ``` 46 | A browser window opens. You can log in there using `flux/flux`. 47 | 48 | 49 | 50 | After login, an IPython notebook playground with examples will open. 
51 | 52 | 53 | 54 | ### Cloud deployment 55 | 56 | 57 | -------------------------------------------------------------------------------- /bin/flux: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | # Usage 4 | # ===== 5 | # 6 | # flux build 7 | # flux start - determine cloud vendor / OS and start 8 | # flux stop - stops 9 | # flux purge - delete everything 10 | # flux pull - pulls latest version 11 | # flux notebook - open browser on notebook start page 12 | # flux ps - list all processes 13 | # flux stats - print resource utilization 14 | # 15 | # Later: 16 | # flux scale / add-host / add-node 17 | # flux update 18 | 19 | function require { 20 | which $1 &>/dev/null || { echo "$1 is not installed, but required!"; exit 1; } 21 | } 22 | 23 | function displayUsage { 24 | grep '^#' $0 | grep -v '#!' | sed 's/^# *//' 25 | } 26 | 27 | function checkForGPU { 28 | true # TODO [ -n `docker volume ls -q -f driver=nvidia-docker` ] 29 | } 30 | 31 | hasGPU=$(checkForGPU) 32 | 33 | set -eo pipefail 34 | 35 | require 'docker' 36 | require 'kubectl' 37 | require 'helm' 38 | 39 | 40 | command=$1 41 | 42 | case "$command" in 43 | "build") 44 | GPU=${hasGPU} || echo '-_gpu' 45 | 46 | echo "suffix: ${GPU}" 47 | 48 | ./deploy/docker/docker_build_ros${GPU}.sh 49 | ./deploy/docker/docker_build${GPU}.sh 50 | docker build -t fluxproject/examples${GPU} . 51 | ;; 52 | "start") 53 | kubectl create -f deploy/kubernetes/flux-ros-hadoop-deployment.yml 54 | kubectl create -f deploy/kubernetes/flux-ros-hadoop-service.yml 55 | ;; 56 | # TODO: poll and block until it is really started? 
57 | "purge") 58 | kubectl delete -f deploy/kubernetes/flux-ros-hadoop-service.yml 59 | kubectl delete -f deploy/kubernetes/flux-ros-hadoop-deployment.yml 60 | ;; 61 | "stop") 62 | # TODO: wait for helm install helm delete --purge hdfs 63 | ;; 64 | "ps") 65 | kubectl get all --all-namespaces 66 | ;; 67 | "stats") 68 | echo "TODO: implement me" 69 | exit 1 70 | ;; 71 | "notebook") 72 | #PORT= 73 | open "http://localhost:$(kubectl get service flux-ros-hadoop --template='{{(index .spec.ports 0).nodePort}}')" 74 | ;; 75 | "pull") 76 | docker pull fluxproject/flux:latest 77 | docker pull fluxproject/examples:latest 78 | ;; 79 | 80 | # TODO: need flux init? 81 | # TODO: need flux check to check if everything is running 82 | *) 83 | displayUsage 84 | exit 1 85 | ;; 86 | esac 87 | -------------------------------------------------------------------------------- /bin/test_example: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | POD=$(kubectl get pods --output='go-template={{(index .items 0).metadata.name}}') 3 | 4 | kubectl exec -ti ${POD} -- jupyter nbconvert --execute $1 5 | -------------------------------------------------------------------------------- /deploy/docker/docker_build.sh: -------------------------------------------------------------------------------- 1 | docker build -t fluxproject/flux -f deploy/docker/flux/Dockerfile deploy/docker/flux 2 | -------------------------------------------------------------------------------- /deploy/docker/docker_build_gpu.sh: -------------------------------------------------------------------------------- 1 | docker build -t fluxproject/flux_gpu -f deploy/docker/flux/Dockerfile-gpu deploy/docker/flux 2 | -------------------------------------------------------------------------------- /deploy/docker/docker_build_hdfs.sh: -------------------------------------------------------------------------------- 1 | docker build -t fluxproject/hdfs-nn-4k8s:0.1 -f 
deploy/docker/hdfs4k8s/Dockerfile-namenode . 2 | docker build -t fluxproject/hdfs-dn-4k8s:0.1 -f deploy/docker/hdfs4k8s/Dockerfile-datanode . 3 | -------------------------------------------------------------------------------- /deploy/docker/docker_build_ros.sh: -------------------------------------------------------------------------------- 1 | docker build -t fluxproject/ros_base -f deploy/docker/ros_base/Dockerfile deploy/docker/ros_base 2 | -------------------------------------------------------------------------------- /deploy/docker/docker_build_ros_gpu.sh: -------------------------------------------------------------------------------- 1 | docker build -t fluxproject/ros_base_gpu -f deploy/docker/ros_base/Dockerfile-gpu deploy/docker/ros_base 2 | -------------------------------------------------------------------------------- /deploy/docker/flux/Dockerfile: -------------------------------------------------------------------------------- 1 | FROM fluxproject/ros_base 2 | 3 | RUN apt-get update && apt-get install -y --no-install-recommends \ 4 | locales bzip2 tree unzip xz-utils curl wget iproute2 sudo \ 5 | python-pip python3-pip python-setuptools python3-setuptools \ 6 | openjdk-8-jdk-headless nodejs npm nodejs-legacy \ 7 | iputils-ping net-tools iproute knot-dnsutils vim \ 8 | ffmpeg \ 9 | && rm -rf /var/lib/apt/lists/* 10 | 11 | # Jupyterhub setting 12 | RUN mkdir -p /etc/jupyterhub 13 | COPY jupyterhub_config.py /etc/jupyterhub/ 14 | 15 | # Introduce flux user # TODO: link 16 | RUN npm install -g configurable-http-proxy 17 | RUN useradd -u 11111 -m -s /bin/bash flux 18 | RUN usermod -aG sudo flux 19 | RUN bash -c " echo flux:flux | chpasswd " 20 | 21 | # Flux user setting # TODO: link 22 | COPY spark-ex-kubernetes.sh /home/flux/ 23 | 24 | RUN python2 -m pip install --upgrade --user pip && \ 25 | python3 -m pip install --upgrade --user pip && \ 26 | python3 -m pip install --no-cache-dir --upgrade jupyter jupyterhub jupyterlab && \ 27 | python2 -m pip 
install --no-cache-dir --upgrade pyspark matplotlib pandas tensorflow keras Pillow && \ 28 | python2 -m pip install --no-cache-dir --upgrade --force-reinstall requests imageio moviepy seaborn gmaps && \ 29 | python2 -m pip install ipykernel && \ 30 | python2 -m ipykernel install && \ 31 | python3 -m pip install ipykernel && \ 32 | python3 -m ipykernel install 33 | 34 | RUN apt-key adv --keyserver keyserver.ubuntu.com --recv-keys 66F84AE1EB71A8AC108087DCAF677210FF6D3CDA && \ 35 | bash -c 'echo "deb [ arch=amd64 ] http://packages.dataspeedinc.com/ros/ubuntu $(lsb_release -sc) main" > /etc/apt/sources.list.d/ros-dataspeed-public.list' && \ 36 | apt-get update 37 | 38 | RUN bash -c 'echo "yaml http://packages.dataspeedinc.com/ros/ros-public-'$ROS_DISTRO'.yaml '$ROS_DISTRO'" > /etc/ros/rosdep/sources.list.d/30-dataspeed-public-'$ROS_DISTRO'.list' && \ 39 | rosdep update 2>/dev/null && apt-get install -y --no-install-recommends \ 40 | ros-$ROS_DISTRO-dbw-mkz ros-$ROS_DISTRO-mobility-base ros-$ROS_DISTRO-baxter-sdk ros-$ROS_DISTRO-velodyne && \ 41 | rm -rf /var/lib/apt/lists/* 42 | 43 | 44 | # Default to UTF-8 45 | RUN locale-gen en_US.UTF-8 46 | ENV LANG en_US.UTF-8 47 | ENV JAVA_HOME /usr/lib/jvm/java-8-openjdk-amd64 48 | ENV PATH $PATH:/opt/apache/hadoop/bin 49 | ENV ROSIF_JAR /opt/ros_hadoop/master/lib/rosbaginputformat.jar 50 | 51 | RUN mkdir -p /opt/ros_hadoop/master/dist/ 52 | RUN mkdir -p /opt/apache/ 53 | RUN mkdir -p /opt/ros_spark/dist/ 54 | COPY . /opt/ros_hadoop/master/ 55 | 56 | # TODO: ENV ROS_HADOOP='0.9.11' 57 | # RUN \ 58 | # curl -s "https://codeload.github.com/valtech/ros_hadoop/tar.gz/v${ROS_HADOOP}" | \ 59 | # tar -C /opt/ros_hadoop -xvzf - && \ 60 | # mv /opt/ros_hadoop/ros_hadoop-${ROS_HADOOP} /opt/ros_hadoop/latest 61 | RUN \ 62 | curl -s "https://codeload.github.com/valtech/ros_hadoop/tar.gz/master" | \ 63 | tar -C /opt/ros_hadoop -xvzf - && \ 64 | mv /opt/ros_hadoop/ros_hadoop-master /opt/ros_hadoop/latest 65 | 66 | RUN bash -c "if [ ! 
-f /opt/ros_hadoop/master/dist/hadoop-3.0.0.tar.gz ] ; then wget --no-check-certificate -O /opt/ros_hadoop/master/dist/hadoop-3.1.1.tar.gz -q https://www.eu.apache.org/dist/hadoop/common/hadoop-3.1.1/hadoop-3.1.1.tar.gz ; fi" 67 | RUN tar -xzf /opt/ros_hadoop/master/dist/hadoop-3.1.1.tar.gz -C /opt/apache && rm /opt/ros_hadoop/master/dist/hadoop-3.1.1.tar.gz 68 | RUN ln -s /opt/apache/hadoop-3.1.1 /opt/apache/hadoop 69 | RUN bash -c "if [ ! -f /opt/ros_hadoop/latest/lib/rosbaginputformat.jar ] ; then ln -s /opt/ros_hadoop/master/lib/rosbaginputformat.jar /opt/ros_hadoop/latest/lib/rosbaginputformat.jar ; fi" 70 | 71 | ## for spark example tests 72 | RUN bash -c "if [ ! -f /opt/ros_spark/dist/spark-2.3.1-bin-hadoop2.7.tgz ] ; then wget --quiet -O /opt/ros_spark/dist/spark-2.3.1-bin-hadoop2.7.tgz http://apache.lauf-forum.at/spark/spark-2.3.1/spark-2.3.1-bin-hadoop2.7.tgz ; fi" 73 | RUN tar -xzf /opt/ros_spark/dist/spark-2.3.1-bin-hadoop2.7.tgz -C /opt/apache && rm /opt/ros_spark/dist/spark-2.3.1-bin-hadoop2.7.tgz 74 | 75 | RUN printf "\n\n\nfs.defaultFS\nhdfs://localhost:9000\n\n" > /opt/apache/hadoop/etc/hadoop/core-site.xml && \ 76 | printf "\n\ndfs.replication\n1\n\n" > /opt/apache/hadoop/etc/hadoop/hdfs-site.xml && \ 77 | bash -c "/opt/apache/hadoop/bin/hdfs namenode -format 2>/dev/null" && \ 78 | printf "#! /bin/bash\n/opt/apache/hadoop/bin/hdfs --daemon stop datanode\n/opt/apache/hadoop/bin/hdfs --daemon stop namenode\n/opt/apache/hadoop/bin/hdfs --daemon start namenode\n/opt/apache/hadoop/bin/hdfs --daemon start datanode\nexec \"\$@\"\n" > /start_hadoop.sh && \ 79 | chmod a+x /start_hadoop.sh 80 | 81 | RUN printf "#! /bin/bash\nset -e\nsource \"/opt/ros/$ROS_DISTRO/setup.bash\"\n/start_hadoop.sh\nexec \"\$@\"\n" > /ros_hadoop.sh && \ 82 | chmod a+x /ros_hadoop.sh 83 | 84 | RUN bash -c "if [ ! 
-f /opt/ros_hadoop/master/dist/HMB_4.bag ] ; then wget --quiet -O /opt/ros_hadoop/master/dist/HMB_4.bag https://xfiles.valtech.io/f/c494d168522045e3bcc0/?dl=1 ; fi" && \ 85 | java -jar "$ROSIF_JAR" -f /opt/ros_hadoop/master/dist/HMB_4.bag 86 | 87 | RUN bash -c "/start_hadoop.sh" && \ 88 | until /opt/apache/hadoop/bin/hdfs dfsadmin -safemode wait; do sleep 1s; done && \ 89 | until /opt/apache/hadoop/bin/hdfs dfsadmin -report; do sleep 1s; done && \ 90 | until /opt/apache/hadoop/bin/hdfs dfs -mkdir /user; do sleep 1s; done && \ 91 | /opt/apache/hadoop/bin/hdfs dfs -mkdir /user/root && \ 92 | /opt/apache/hadoop/bin/hdfs dfs -mkdir /user/flux && \ 93 | /opt/apache/hadoop/bin/hdfs dfs -put /opt/ros_hadoop/master/dist/HMB_4.bag && \ 94 | /opt/apache/hadoop/bin/hdfs --daemon stop datanode && \ 95 | /opt/apache/hadoop/bin/hdfs --daemon stop namenode 96 | 97 | RUN \ 98 | mkdir -p /ope/ros_hadoop/latest/doc && \ 99 | chmod -R 777 /opt/ros_hadoop 100 | 101 | WORKDIR /opt/ros_hadoop/latest/doc/ 102 | ENTRYPOINT ["/ros_hadoop.sh"] 103 | 104 | CMD ["jupyterhub", "-f", "/etc/jupyterhub/jupyterhub_config.py"] 105 | -------------------------------------------------------------------------------- /deploy/docker/flux/Dockerfile-gpu: -------------------------------------------------------------------------------- 1 | FROM fluxproject/ros_base_gpu 2 | 3 | RUN apt-get update && apt-get install -y --no-install-recommends \ 4 | locales bzip2 tree unzip xz-utils curl wget iproute2 sudo \ 5 | python-pip python3-pip python-setuptools python3-setuptools \ 6 | openjdk-8-jdk-headless nodejs npm nodejs-legacy \ 7 | iputils-ping net-tools iproute knot-dnsutils vim \ 8 | ffmpeg \ 9 | && rm -rf /var/lib/apt/lists/* 10 | 11 | # Jupyterhub setting 12 | RUN mkdir -p /etc/jupyterhub 13 | COPY jupyterhub_config.py /etc/jupyterhub/ 14 | 15 | # Introduce flux user 16 | RUN npm install -g configurable-http-proxy 17 | RUN useradd -u 11111 -m -s /bin/bash flux 18 | RUN usermod -aG sudo flux 19 | RUN bash -c 
" echo flux:flux | chpasswd " 20 | 21 | # Flux user setting # TODO: link 22 | COPY spark-ex-kubernetes.sh /home/flux/ 23 | 24 | RUN python2 -m pip install --upgrade --user pip && \ 25 | python3 -m pip install --upgrade --user pip && \ 26 | python3 -m pip install --no-cache-dir --upgrade jupyter jupyterhub jupyterlab && \ 27 | python2 -m pip install --no-cache-dir --upgrade pyspark matplotlib pandas tensorflow-gpu keras Pillow && \ 28 | python2 -m pip install --no-cache-dir --upgrade --force-reinstall requests imageio moviepy seaborn gmaps && \ 29 | python2 -m pip install ipykernel && \ 30 | python2 -m ipykernel install && \ 31 | python3 -m pip install ipykernel && \ 32 | python3 -m ipykernel install 33 | 34 | RUN apt-key adv --keyserver keyserver.ubuntu.com --recv-keys 66F84AE1EB71A8AC108087DCAF677210FF6D3CDA && \ 35 | bash -c 'echo "deb [ arch=amd64 ] http://packages.dataspeedinc.com/ros/ubuntu $(lsb_release -sc) main" > /etc/apt/sources.list.d/ros-dataspeed-public.list' && \ 36 | apt-get update 37 | 38 | RUN bash -c 'echo "yaml http://packages.dataspeedinc.com/ros/ros-public-'$ROS_DISTRO'.yaml '$ROS_DISTRO'" > /etc/ros/rosdep/sources.list.d/30-dataspeed-public-'$ROS_DISTRO'.list' && \ 39 | rosdep update 2>/dev/null && apt-get install -y --no-install-recommends \ 40 | ros-$ROS_DISTRO-dbw-mkz ros-$ROS_DISTRO-mobility-base ros-$ROS_DISTRO-baxter-sdk ros-$ROS_DISTRO-velodyne && \ 41 | rm -rf /var/lib/apt/lists/* 42 | 43 | # Default to UTF-8 44 | RUN locale-gen en_US.UTF-8 45 | ENV LANG en_US.UTF-8 46 | ENV JAVA_HOME /usr/lib/jvm/java-8-openjdk-amd64 47 | ENV PATH $PATH:/opt/apache/hadoop/bin 48 | ENV ROSIF_JAR /opt/ros_hadoop/master/lib/rosbaginputformat.jar 49 | 50 | RUN mkdir -p /opt/ros_hadoop/latest 51 | RUN mkdir -p /opt/ros_hadoop/master/dist/ 52 | RUN mkdir -p /opt/apache/ 53 | RUN mkdir -p /opt/ros_spark/dist/ 54 | COPY . 
/opt/ros_hadoop/master/ 55 | RUN bash -c "curl -s https://api.github.com/repos/valtech/ros_hadoop/releases/latest | egrep -io 'https://api.github.com/repos/valtech/ros_hadoop/tarball/[^\"]*' | xargs wget --quiet -O /opt/ros_hadoop/latest.tgz" 56 | RUN bash -c "if [ ! -f /opt/ros_hadoop/master/dist/hadoop-3.0.0.tar.gz ] ; then wget --no-check-certificate -O /opt/ros_hadoop/master/dist/hadoop-3.1.1.tar.gz -q https://www.eu.apache.org/dist/hadoop/common/hadoop-3.1.1/hadoop-3.1.1.tar.gz ; fi" 57 | RUN tar -xzf /opt/ros_hadoop/latest.tgz -C /opt/ros_hadoop/latest --strip-components=1 && rm /opt/ros_hadoop/latest.tgz 58 | RUN tar -xzf /opt/ros_hadoop/master/dist/hadoop-3.1.1.tar.gz -C /opt/apache && rm /opt/ros_hadoop/master/dist/hadoop-3.1.1.tar.gz 59 | RUN ln -s /opt/apache/hadoop-3.1.1 /opt/apache/hadoop 60 | RUN bash -c "if [ ! -f /opt/ros_hadoop/latest/lib/rosbaginputformat.jar ] ; then ln -s /opt/ros_hadoop/master/lib/rosbaginputformat.jar /opt/ros_hadoop/latest/lib/rosbaginputformat.jar ; fi" 61 | 62 | ## for spark example tests 63 | RUN bash -c "if [ ! -f /opt/ros_spark/dist/spark-2.3.1-bin-hadoop2.7.tgz ] ; then wget --quiet -O /opt/ros_spark/dist/spark-2.3.1-bin-hadoop2.7.tgz http://apache.lauf-forum.at/spark/spark-2.3.1/spark-2.3.1-bin-hadoop2.7.tgz ; fi" 64 | RUN tar -xzf /opt/ros_spark/dist/spark-2.3.1-bin-hadoop2.7.tgz -C /opt/apache && rm /opt/ros_spark/dist/spark-2.3.1-bin-hadoop2.7.tgz 65 | 66 | RUN printf "\n\n\nfs.defaultFS\nhdfs://localhost:9000\n\n" > /opt/apache/hadoop/etc/hadoop/core-site.xml && \ 67 | printf "\n\ndfs.replication\n1\n\n" > /opt/apache/hadoop/etc/hadoop/hdfs-site.xml && \ 68 | bash -c "/opt/apache/hadoop/bin/hdfs namenode -format 2>/dev/null" && \ 69 | printf "#! 
/bin/bash\n/opt/apache/hadoop/bin/hdfs --daemon stop datanode\n/opt/apache/hadoop/bin/hdfs --daemon stop namenode\n/opt/apache/hadoop/bin/hdfs --daemon start namenode\n/opt/apache/hadoop/bin/hdfs --daemon start datanode\nexec \"\$@\"\n" > /start_hadoop.sh && \ 70 | chmod a+x /start_hadoop.sh 71 | 72 | RUN printf "#! /bin/bash\nset -e\nsource \"/opt/ros/$ROS_DISTRO/setup.bash\"\n/start_hadoop.sh\nexec \"\$@\"\n" > /ros_hadoop.sh && \ 73 | chmod a+x /ros_hadoop.sh 74 | 75 | RUN bash -c "if [ ! -f /opt/ros_hadoop/master/dist/HMB_4.bag ] ; then wget --quiet -O /opt/ros_hadoop/master/dist/HMB_4.bag https://xfiles.valtech.io/f/c494d168522045e3bcc0/?dl=1 ; fi" && \ 76 | java -jar "$ROSIF_JAR" -f /opt/ros_hadoop/master/dist/HMB_4.bag 77 | 78 | RUN bash -c "/start_hadoop.sh" && \ 79 | /opt/apache/hadoop/bin/hdfs dfsadmin -safemode wait && \ 80 | /opt/apache/hadoop/bin/hdfs dfsadmin -report && \ 81 | /opt/apache/hadoop/bin/hdfs dfs -mkdir /user && \ 82 | /opt/apache/hadoop/bin/hdfs dfs -mkdir /user/root && \ 83 | /opt/apache/hadoop/bin/hdfs dfs -mkdir /user/flux && \ 84 | /opt/apache/hadoop/bin/hdfs dfs -put /opt/ros_hadoop/master/dist/HMB_4.bag && \ 85 | /opt/apache/hadoop/bin/hdfs --daemon stop datanode && \ 86 | /opt/apache/hadoop/bin/hdfs --daemon stop namenode 87 | 88 | RUN \ 89 | mkdir -p /opt/ros_hadoop/latest/doc && \ 90 | chmod -R 777 /opt/ros_hadoop 91 | 92 | WORKDIR /opt/ros_hadoop/latest/doc/ 93 | ENTRYPOINT ["/ros_hadoop.sh"] 94 | 95 | CMD ["jupyterhub", "-f", "/etc/jupyterhub/jupyterhub_config.py"] 96 | -------------------------------------------------------------------------------- /deploy/docker/flux/README.md: -------------------------------------------------------------------------------- 1 | # **RosbagInputFormat** 2 | RosbagInputFormat is an open source **splittable** Hadoop InputFormat for the ROS bag file format.
3 | 4 | The complete source code is available in the src/ folder and the jar file is generated using SBT (see build.sbt). 5 | 6 | For an example of a rosbag file larger than 2 GB see doc/Rosbag larger than 2 GB.ipynb. It solves issue #6 (https://github.com/valtech/ros_hadoop/issues/6). The issue was due to ByteBuffer being limited by the JVM Integer size and has nothing to do with Spark or how the RosbagMapInputFormat works within Spark. It was only problematic to extract the conf index with the jar. 7 | 8 | # Usage 9 | 10 | 1. Download latest release jar file and put it in classpath 11 | 2. Extract the index configuration of your ROS bag file. **The extracted index is a very very small configuration** file containing a protobuf array that will be given in the job configuration. **Note that the operation will not process and it will not parse** the whole bag file, but will simply seek to the required offset. e.g. 12 | ```bash 13 | java -jar lib/rosbaginputformat.jar -f /opt/ros_hadoop/master/dist/HMB_4.bag 14 | # will create an idx.bin config file /opt/ros_hadoop/master/dist/HMB_4.bag.idx.bin 15 | ``` 16 | 3. Put the ROS bag file in HDFS e.g. 17 | ```bash 18 | hdfs dfs -put 19 | ``` 20 | 4. Use it in your Spark jobs e.g. 21 | ```python 22 | sc.newAPIHadoopFile( 23 | path = "hdfs://127.0.0.1:9000/user/spark/HMB_4.bag", 24 | inputFormatClass = "de.valtech.foss.RosbagMapInputFormat", 25 | keyClass = "org.apache.hadoop.io.LongWritable", 26 | valueClass = "org.apache.hadoop.io.MapWritable", 27 | conf = {"RosbagInputFormat.chunkIdx":"/opt/ros_hadoop/master/dist/HMB_4.bag.idx.bin"}) 28 | ``` 29 | 30 | Example data can be found for instance at https://github.com/udacity/self-driving-car/tree/master/datasets published under MIT License. 31 | 32 | # Documentation 33 | The [doc/](doc/) folder contains a jupyter notebook with a few basic usage examples. 34 | 35 |

36 |

37 | 38 | # Tutorial 39 | 40 | ## To test locally use the Dockerfile 41 | 42 | To build an image using the Dockerfile run the following in the shell. 43 | Please note that it will download Hadoop and Spark from the URL source. The generated image is therefore relatively large ~5G. 44 | ```bash 45 | docker build -t ros_hadoop:latest -f Dockerfile . 46 | ``` 47 | 48 | To start a container use the following shell command **in the ros_hadoop folder.** 49 | ```bash 50 | # $(pwd) will point to the ros_hadoop git clone folder 51 | docker run -it -v $(pwd):/root/ros_hadoop -p 8888:8888 ros_hadoop 52 | ``` 53 | The container has a configured HDFS as well as Spark and the RosInputFormat jar. 54 | It leaves the user in a bash shell. 55 | 56 | Point your browser to the local [URL](http://localhost:8888/) and enjoy the tutorial. The access token is printed in the docker container console. 57 | 58 | ### Usage from Spark (pyspark) 59 | 60 | Example data can be found for instance at https://github.com/udacity/self-driving-car/tree/master/datasets published under MIT License. 61 | 62 | Check that the Rosbag file version is V2.0 63 | 64 | ```bash 65 | java -jar lib/rosbaginputformat.jar --version -f /opt/ros_hadoop/master/dist/HMB_4.bag 66 | ``` 67 | 68 | ### Extract the index as configuration 69 | 70 | The index is a very very small configuration file containing a protobuf array that will be given in the job configuration. 71 | Note that the operation will not process and it will not parse the whole bag file, but will simply seek to the required offset. 72 | 73 | ```bash 74 | # assuming you start the notebook in the doc/ folder 75 | java -jar ../lib/rosbaginputformat.jar \ 76 | -f /opt/ros_hadoop/master/dist/HMB_4.bag 77 | 78 | hdfs dfs -ls 79 | ``` 80 | 81 | This will generate a very small file named HMB_4.bag.idx.bin in the same folder. 82 | 83 | ### Copy the bag file in HDFS 84 | 85 | Using your favorite tool put the bag file in your working HDFS folder. 
86 | 87 | ***Note***: keep the index file as configuration to your jobs, ***do not*** put small files in HDFS. 88 | For convenience we already provide an example file (/opt/ros_hadoop/master/dist/HMB_4.bag) in the HDFS under /user/root/ 89 | 90 | ```bash 91 | hdfs dfs -put /opt/ros_hadoop/master/dist/HMB_4.bag 92 | hdfs dfs -ls 93 | ``` 94 |

95 |

96 | 97 | + Hadoop InputFormat and Record Reader for Rosbag 98 | + Process Rosbag with Spark, Yarn, MapReduce, Hadoop Streaming API, … 99 | + Spark RDD are cached and optimised for analysis 100 | 101 | ### Process the ROS bag file in Spark using the RosbagInputFormat 102 | 103 | ***Note***: your HDFS address might differ. 104 | ```python 105 | fin = sc.newAPIHadoopFile( 106 | path = "hdfs://127.0.0.1:9000/user/root/HMB_4.bag", 107 | inputFormatClass = "de.valtech.foss.RosbagMapInputFormat", 108 | keyClass = "org.apache.hadoop.io.LongWritable", 109 | valueClass = "org.apache.hadoop.io.MapWritable", 110 | conf = {"RosbagInputFormat.chunkIdx":"/opt/ros_hadoop/master/dist/HMB_4.bag.idx.bin"}) 111 | ``` 112 | 113 | ### Interpret the Messages 114 | 115 | To interpret the messages we need the connections. 116 | We could get the connections as configuration as well. At the moment we decided to collect the connections into Spark driver in a dictionary and use it in the subsequent RDD actions. 117 | 118 | Collect the connections from all Spark partitions of the bag file into the Spark driver 119 | ```python 120 | conn_a = fin.filter( 121 | lambda r: r[1]['header']['op'] == 7 122 | ).map( 123 | lambda r: r[1] 124 | ).collect() 125 | conn_d = {str(k['header']['topic']):k for k in conn_a} 126 | 127 | # see topic names 128 | conn_d.keys() 129 | ``` 130 | 131 | From all ROS bag splits we collect into Spark driver the connection messages (op=7 in header) where the ROS definitions are stored. This operation happens in parallel of course. 132 | 133 | ### Load the python map functions from src/main/python/functions.py 134 | ```bash 135 | %run -i ../src/main/python/functions.py 136 | ``` 137 | At the moment the file contains a single mapper function named msg_map. 138 | 139 | ### Use of msg_map to apply a function on all messages 140 | 141 | Python rosbag.bag needs to be installed on all Spark workers.
The msg_map function (from src/main/python/functions.py) takes three arguments: 142 | 1. r = the message or RDD record Tuple 143 | 2. func = a function (default str) to apply to the ROS message 144 | 3. conn = a connection to specify what topic to process 145 | 146 | ```python 147 | %matplotlib nbagg 148 | # use %matplotlib notebook in python3 149 | from functools import partial 150 | import pandas as pd 151 | import numpy as np 152 | 153 | 154 | # Take messages from '/imu/data' topic using default str func 155 | rdd = fin.flatMap( 156 | partial(msg_map, conn=conn_d['/imu/data']) 157 | ) 158 | ``` 159 | 160 | The connection dictionary is sent over the closure to the workers, which use it in msg_map. 161 | 162 |

163 | 164 | ```python 165 | print(rdd.take(1)[0]) 166 | ``` 167 | 168 | ``` 169 | header: 170 | seq: 1701626 171 | stamp: 172 | secs: 1479425728 173 | nsecs: 747487068 174 | frame_id: /imu 175 | orientation: 176 | x: -0.0251433756238 177 | y: 0.0284643176884 178 | z: -0.0936542998233 179 | w: 0.994880191333 180 | orientation_covariance: [0.017453292519943295, 0.0, 0.0, 0.0, 0.017453292519943295, 0.0, 0.0, 0.0, 0.15707963267948966] 181 | angular_velocity: 182 | x: 0.0 183 | y: 0.0 184 | z: 0.0 185 | angular_velocity_covariance: [-1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0, -1.0] 186 | linear_acceleration: 187 | x: 1.16041922569 188 | y: 0.595418334007 189 | z: 10.7565326691 190 | linear_acceleration_covariance: [0.0004, 0.0, 0.0, 0.0, 0.0004, 0.0, 0.0, 0.0, 0.0004] 191 | ``` 192 | 193 | 194 | ### Image data from camera messages 195 | 196 | An example of taking messages using a func other than default str. 197 | In our case we apply a lambda to messages from the '/center_camera/image_color/compressed' topic. As usual with Spark the operation will happen in parallel on all workers. 198 | 199 | ```python 200 | from PIL import Image 201 | from io import BytesIO 202 | 203 | res = fin.flatMap( 204 | partial(msg_map, func=lambda r: r.data, conn=conn_d['/center_camera/image_color/compressed']) 205 | ).take(50) 206 | 207 | Image.open(BytesIO(res[48])) 208 | ``` 209 | 210 |

211 | 212 | 213 | ### Plot fuel level 214 | 215 | The topic /vehicle/fuel_level_report contains 2215 ROS messages. Let us plot the header.stamp in seconds vs. fuel_level using a pandas dataframe. 216 | 217 | ```python 218 | def f(msg): 219 | return (msg.header.stamp.secs, msg.fuel_level) 220 | 221 | d = fin.flatMap( 222 | partial(msg_map, func=f, conn=conn_d['/vehicle/fuel_level_report']) 223 | ).toDF().toPandas() 224 | 225 | d.set_index('_1').plot() 226 | ``` 227 |

228 | 229 | ### Machine Learning models on Spark workers 230 | 231 | A dot product Keras "model" for each message from a topic. We will compare it with the one computed with numpy. 232 | 233 | ***Note*** that the imports happen in the workers and not in driver. On the other hand the connection dictionary is sent over the closure. 234 | 235 | ```python 236 | def f(msg): 237 | from keras.layers import dot, Dot, Input 238 | from keras.models import Model 239 | 240 | linear_acceleration = { 241 | 'x': msg.linear_acceleration.x, 242 | 'y': msg.linear_acceleration.y, 243 | 'z': msg.linear_acceleration.z, 244 | } 245 | 246 | linear_acceleration_covariance = np.array(msg.linear_acceleration_covariance) 247 | 248 | i1 = Input(shape=(3,)) 249 | i2 = Input(shape=(3,)) 250 | o = dot([i1,i2], axes=1) 251 | 252 | model = Model([i1,i2], o) 253 | 254 | # return a tuple with (numpy dot product, keras dot "predict") 255 | return ( 256 | np.dot(linear_acceleration_covariance.reshape(3,3), 257 | [linear_acceleration['x'], linear_acceleration['y'], linear_acceleration['z']]), 258 | model.predict([ 259 | np.array([[ linear_acceleration['x'], linear_acceleration['y'], linear_acceleration['z'] ]]), 260 | linear_acceleration_covariance.reshape((3,3))]) 261 | ) 262 | 263 | fin.flatMap(partial(msg_map, func=f, conn=conn_d['/vehicle/imu/data_raw'])).take(5) 264 | 265 | # tuple with (numpy dot product, keras dot “predict”) 266 | ``` 267 | One can sample of course and collect the data in the driver to train a model on one single machine. 268 | Note that the msg is the most granular unit but you could replace the flatMap with a mapPartitions to apply such a Keras function to a whole split. 269 | 270 | Another option would be to have a map.reduceByKey before the flatMap so that the function argument would be a whole interval instead of a msg. The idea is to key on time. 271 | 272 | We hope that the RosbagInputFormat would be useful to you. 
273 | 274 | ## Please do not forget to send us your [feedback](AUTHORS). 275 | ![doc/images/browse-tutorial.png](doc/images/browse-tutorial.png) 276 | -------------------------------------------------------------------------------- /deploy/docker/flux/jupyterhub_config.py: -------------------------------------------------------------------------------- 1 | # Configuration file for jupyterhub. 2 | 3 | #------------------------------------------------------------------------------ 4 | # Application(SingletonConfigurable) configuration 5 | #------------------------------------------------------------------------------ 6 | 7 | ## This is an application. 8 | 9 | ## The date format used by logging formatters for %(asctime)s 10 | #c.Application.log_datefmt = '%Y-%m-%d %H:%M:%S' 11 | 12 | ## The Logging format template 13 | #c.Application.log_format = '[%(name)s]%(highlevel)s %(message)s' 14 | 15 | ## Set the log level by value or name. 16 | #c.Application.log_level = 30 17 | 18 | #------------------------------------------------------------------------------ 19 | # JupyterHub(Application) configuration 20 | #------------------------------------------------------------------------------ 21 | 22 | ## An Application for starting a Multi-User Jupyter Notebook server. 23 | 24 | ## Maximum number of concurrent servers that can be active at a time. 25 | # 26 | # Setting this can limit the total resources your users can consume. 27 | # 28 | # An active server is any server that's not fully stopped. It is considered 29 | # active from the time it has been requested until the time that it has 30 | # completely stopped. 31 | # 32 | # If this many user servers are active, users will not be able to launch new 33 | # servers until a server is shutdown. Spawn requests will be rejected with a 429 34 | # error asking them to try again. 35 | # 36 | # If set to 0, no limit is enforced. 
37 | #c.JupyterHub.active_server_limit = 0 38 | 39 | ## Grant admin users permission to access single-user servers. 40 | # 41 | # Users should be properly informed if this is enabled. 42 | #c.JupyterHub.admin_access = False 43 | 44 | ## DEPRECATED since version 0.7.2, use Authenticator.admin_users instead. 45 | #c.JupyterHub.admin_users = set() 46 | 47 | ## Allow named single-user servers per user 48 | #c.JupyterHub.allow_named_servers = False 49 | 50 | ## Answer yes to any questions (e.g. confirm overwrite) 51 | #c.JupyterHub.answer_yes = False 52 | 53 | ## PENDING DEPRECATION: consider using service_tokens 54 | # 55 | # Dict of token:username to be loaded into the database. 56 | # 57 | # Allows ahead-of-time generation of API tokens for use by externally managed 58 | # services, which authenticate as JupyterHub users. 59 | # 60 | # Consider using service_tokens for general services that talk to the JupyterHub 61 | # API. 62 | #c.JupyterHub.api_tokens = {} 63 | 64 | ## Class for authenticating users. 65 | # 66 | # This should be a class with the following form: 67 | # 68 | # - constructor takes one kwarg: `config`, the IPython config object. 69 | # 70 | # - is a tornado.gen.coroutine 71 | # - returns username on success, None on failure 72 | # - takes two arguments: (handler, data), 73 | # where `handler` is the calling web.RequestHandler, 74 | # and `data` is the POST form data from the login page. 75 | #c.JupyterHub.authenticator_class = 'jupyterhub.auth.PAMAuthenticator' 76 | 77 | ## The base URL of the entire application 78 | #c.JupyterHub.base_url = '/' 79 | 80 | ## Whether to shutdown the proxy when the Hub shuts down. 81 | # 82 | # Disable if you want to be able to teardown the Hub while leaving the proxy 83 | # running. 84 | # 85 | # Only valid if the proxy was starting by the Hub process. 86 | # 87 | # If both this and cleanup_servers are False, sending SIGINT to the Hub will 88 | # only shutdown the Hub, leaving everything else running. 
89 | # 90 | # The Hub should be able to resume from database state. 91 | #c.JupyterHub.cleanup_proxy = True 92 | 93 | ## Whether to shutdown single-user servers when the Hub shuts down. 94 | # 95 | # Disable if you want to be able to teardown the Hub while leaving the single- 96 | # user servers running. 97 | # 98 | # If both this and cleanup_proxy are False, sending SIGINT to the Hub will only 99 | # shutdown the Hub, leaving everything else running. 100 | # 101 | # The Hub should be able to resume from database state. 102 | #c.JupyterHub.cleanup_servers = True 103 | 104 | ## Maximum number of concurrent users that can be spawning at a time. 105 | # 106 | # Spawning lots of servers at the same time can cause performance problems for 107 | # the Hub or the underlying spawning system. Set this limit to prevent bursts of 108 | # logins from attempting to spawn too many servers at the same time. 109 | # 110 | # This does not limit the number of total running servers. See 111 | # active_server_limit for that. 112 | # 113 | # If more than this many users attempt to spawn at a time, their requests will 114 | # be rejected with a 429 error asking them to try again. Users will have to wait 115 | # for some of the spawning services to finish starting before they can start 116 | # their own. 117 | # 118 | # If set to 0, no limit is enforced. 119 | #c.JupyterHub.concurrent_spawn_limit = 100 120 | 121 | ## The config file to load 122 | #c.JupyterHub.config_file = 'jupyterhub_config.py' 123 | 124 | ## DEPRECATED: does nothing 125 | #c.JupyterHub.confirm_no_ssl = False 126 | 127 | ## Number of days for a login cookie to be valid. Default is two weeks. 128 | #c.JupyterHub.cookie_max_age_days = 14 129 | 130 | ## The cookie secret to use to encrypt cookies. 131 | # 132 | # Loaded from the JPY_COOKIE_SECRET env variable by default. 133 | # 134 | # Should be exactly 256 bits (32 bytes). 135 | #c.JupyterHub.cookie_secret = b'' 136 | 137 | ## File in which to store the cookie secret. 
138 | #c.JupyterHub.cookie_secret_file = 'jupyterhub_cookie_secret' 139 | 140 | ## The location of jupyterhub data files (e.g. /usr/local/share/jupyter/hub) 141 | #c.JupyterHub.data_files_path = '/usr/local/share/jupyter/hub' 142 | 143 | ## Include any kwargs to pass to the database connection. See 144 | # sqlalchemy.create_engine for details. 145 | #c.JupyterHub.db_kwargs = {} 146 | 147 | ## url for the database. e.g. `sqlite:///jupyterhub.sqlite` 148 | #c.JupyterHub.db_url = 'sqlite:///jupyterhub.sqlite' 149 | 150 | ## log all database transactions. This has A LOT of output 151 | #c.JupyterHub.debug_db = False 152 | 153 | ## DEPRECATED since version 0.8: Use ConfigurableHTTPProxy.debug 154 | #c.JupyterHub.debug_proxy = False 155 | 156 | ## Send JupyterHub's logs to this file. 157 | # 158 | # This will *only* include the logs of the Hub itself, not the logs of the proxy 159 | # or any single-user servers. 160 | #c.JupyterHub.extra_log_file = '' 161 | 162 | ## Extra log handlers to set on JupyterHub logger 163 | #c.JupyterHub.extra_log_handlers = [] 164 | 165 | ## Generate default config file 166 | #c.JupyterHub.generate_config = False 167 | 168 | ## The ip or hostname for proxies and spawners to use for connecting to the Hub. 169 | # 170 | # Use when the bind address (`hub_ip`) is 0.0.0.0 or otherwise different from 171 | # the connect address. 172 | # 173 | # Default: when `hub_ip` is 0.0.0.0, use `socket.gethostname()`, otherwise use 174 | # `hub_ip`. 175 | # 176 | # .. versionadded:: 0.8 177 | #c.JupyterHub.hub_connect_ip = '' 178 | 179 | ## The port for proxies & spawners to connect to the hub on. 180 | # 181 | # Used alongside `hub_connect_ip` 182 | # 183 | # .. versionadded:: 0.8 184 | #c.JupyterHub.hub_connect_port = 0 185 | 186 | ## The ip address for the Hub process to *bind* to. 187 | # 188 | # See `hub_connect_ip` for cases where the bind and connect address should 189 | # differ. 
190 | #c.JupyterHub.hub_ip = '127.0.0.1' 191 | 192 | ## The port for the Hub process 193 | #c.JupyterHub.hub_port = 8081 194 | 195 | ## The public facing ip of the whole application (the proxy) 196 | #c.JupyterHub.ip = '' 197 | 198 | ## Supply extra arguments that will be passed to Jinja environment. 199 | #c.JupyterHub.jinja_environment_options = {} 200 | 201 | ## Interval (in seconds) at which to update last-activity timestamps. 202 | #c.JupyterHub.last_activity_interval = 300 203 | 204 | ## Dict of 'group': ['usernames'] to load at startup. 205 | # 206 | # This strictly *adds* groups and users to groups. 207 | # 208 | # Loading one set of groups, then starting JupyterHub again with a different set 209 | # will not remove users or groups from previous launches. That must be done 210 | # through the API. 211 | #c.JupyterHub.load_groups = {} 212 | 213 | ## Specify path to a logo image to override the Jupyter logo in the banner. 214 | #c.JupyterHub.logo_file = '' 215 | 216 | ## File to write PID Useful for daemonizing jupyterhub. 217 | #c.JupyterHub.pid_file = '' 218 | 219 | ## The public facing port of the proxy 220 | #c.JupyterHub.port = 8000 221 | 222 | ## DEPRECATED since version 0.8 : Use ConfigurableHTTPProxy.api_url 223 | #c.JupyterHub.proxy_api_ip = '' 224 | 225 | ## DEPRECATED since version 0.8 : Use ConfigurableHTTPProxy.api_url 226 | #c.JupyterHub.proxy_api_port = 0 227 | 228 | ## DEPRECATED since version 0.8: Use ConfigurableHTTPProxy.auth_token 229 | #c.JupyterHub.proxy_auth_token = '' 230 | 231 | ## Interval (in seconds) at which to check if the proxy is running. 232 | #c.JupyterHub.proxy_check_interval = 30 233 | 234 | ## Select the Proxy API implementation. 235 | #c.JupyterHub.proxy_class = 'jupyterhub.proxy.ConfigurableHTTPProxy' 236 | 237 | ## DEPRECATED since version 0.8. Use ConfigurableHTTPProxy.command 238 | #c.JupyterHub.proxy_cmd = [] 239 | 240 | ## Purge and reset the database. 
241 | #c.JupyterHub.reset_db = False 242 | 243 | ## Interval (in seconds) at which to check connectivity of services with web 244 | # endpoints. 245 | #c.JupyterHub.service_check_interval = 60 246 | 247 | ## Dict of token:servicename to be loaded into the database. 248 | # 249 | # Allows ahead-of-time generation of API tokens for use by externally managed 250 | # services. 251 | #c.JupyterHub.service_tokens = {} 252 | 253 | ## List of service specification dictionaries. 254 | # 255 | # A service 256 | # 257 | # For instance:: 258 | # 259 | # services = [ 260 | # { 261 | # 'name': 'cull_idle', 262 | # 'command': ['/path/to/cull_idle_servers.py'], 263 | # }, 264 | # { 265 | # 'name': 'formgrader', 266 | # 'url': 'http://127.0.0.1:1234', 267 | # 'api_token': 'super-secret', 268 | # 'environment': 269 | # } 270 | # ] 271 | #c.JupyterHub.services = [] 272 | 273 | ## The class to use for spawning single-user servers. 274 | # 275 | # Should be a subclass of Spawner. 276 | #c.JupyterHub.spawner_class = 'jupyterhub.spawner.LocalProcessSpawner' 277 | 278 | ## Path to SSL certificate file for the public facing interface of the proxy 279 | # 280 | # When setting this, you should also set ssl_key 281 | #c.JupyterHub.ssl_cert = '' 282 | 283 | ## Path to SSL key file for the public facing interface of the proxy 284 | # 285 | # When setting this, you should also set ssl_cert 286 | #c.JupyterHub.ssl_key = '' 287 | 288 | ## Host to send statsd metrics to 289 | #c.JupyterHub.statsd_host = '' 290 | 291 | ## Port on which to send statsd metrics about the hub 292 | #c.JupyterHub.statsd_port = 8125 293 | 294 | ## Prefix to use for all metrics sent by jupyterhub to statsd 295 | #c.JupyterHub.statsd_prefix = 'jupyterhub' 296 | 297 | ## Run single-user servers on subdomains of this host. 298 | # 299 | # This should be the full `https://hub.domain.tld[:port]`. 300 | # 301 | # Provides additional cross-site protections for javascript served by single- 302 | # user servers. 
303 | # 304 | # Requires `.hub.domain.tld` to resolve to the same host as 305 | # `hub.domain.tld`. 306 | # 307 | # In general, this is most easily achieved with wildcard DNS. 308 | # 309 | # When using SSL (i.e. always) this also requires a wildcard SSL certificate. 310 | #c.JupyterHub.subdomain_host = '' 311 | 312 | ## Paths to search for jinja templates. 313 | #c.JupyterHub.template_paths = [] 314 | 315 | ## Extra settings overrides to pass to the tornado application. 316 | #c.JupyterHub.tornado_settings = {} 317 | 318 | ## Trust user-provided tokens (via JupyterHub.service_tokens) to have good 319 | # entropy. 320 | # 321 | # If you are not inserting additional tokens via configuration file, this flag 322 | # has no effect. 323 | # 324 | # In JupyterHub 0.8, internally generated tokens do not pass through additional 325 | # hashing because the hashing is costly and does not increase the entropy of 326 | # already-good UUIDs. 327 | # 328 | # User-provided tokens, on the other hand, are not trusted to have good entropy 329 | # by default, and are passed through many rounds of hashing to stretch the 330 | # entropy of the key (i.e. user-provided tokens are treated as passwords instead 331 | # of random keys). These keys are more costly to check. 332 | # 333 | # If your inserted tokens are generated by a good-quality mechanism, e.g. 334 | # `openssl rand -hex 32`, then you can set this flag to True to reduce the cost 335 | # of checking authentication tokens. 336 | #c.JupyterHub.trust_user_provided_tokens = False 337 | 338 | ## Upgrade the database automatically on start. 339 | # 340 | # Only safe if database is regularly backed up. Only SQLite databases will be 341 | # backed up to a local file automatically. 
342 | #c.JupyterHub.upgrade_db = False 343 | 344 | #------------------------------------------------------------------------------ 345 | # Spawner(LoggingConfigurable) configuration 346 | #------------------------------------------------------------------------------ 347 | 348 | ## Base class for spawning single-user notebook servers. 349 | # 350 | # Subclass this, and override the following methods: 351 | # 352 | # - load_state - get_state - start - stop - poll 353 | # 354 | # As JupyterHub supports multiple users, an instance of the Spawner subclass is 355 | # created for each user. If there are 20 JupyterHub users, there will be 20 356 | # instances of the subclass. 357 | 358 | ## Extra arguments to be passed to the single-user server. 359 | # 360 | # Some spawners allow shell-style expansion here, allowing you to use 361 | # environment variables here. Most, including the default, do not. Consult the 362 | # documentation for your spawner to verify! 363 | #c.Spawner.args = [] 364 | 365 | ## The command used for starting the single-user server. 366 | # 367 | # Provide either a string or a list containing the path to the startup script 368 | # command. Extra arguments, other than this path, should be provided via `args`. 369 | # 370 | # This is usually set if you want to start the single-user server in a different 371 | # python environment (with virtualenv/conda) than JupyterHub itself. 372 | # 373 | # Some spawners allow shell-style expansion here, allowing you to use 374 | # environment variables. Most, including the default, do not. Consult the 375 | # documentation for your spawner to verify! 376 | #c.Spawner.cmd = ['jupyterhub-singleuser'] 377 | 378 | ## Minimum number of cpu-cores a single-user notebook server is guaranteed to 379 | # have available. 380 | # 381 | # If this value is set to 0.5, allows use of 50% of one CPU. If this value is 382 | # set to 2, allows use of up to 2 CPUs. 
383 | # 384 | # Note that this needs to be supported by your spawner for it to work. 385 | #c.Spawner.cpu_guarantee = None 386 | 387 | ## Maximum number of cpu-cores a single-user notebook server is allowed to use. 388 | # 389 | # If this value is set to 0.5, allows use of 50% of one CPU. If this value is 390 | # set to 2, allows use of up to 2 CPUs. 391 | # 392 | # The single-user notebook server will never be scheduled by the kernel to use 393 | # more cpu-cores than this. There is no guarantee that it can access this many 394 | # cpu-cores. 395 | # 396 | # This needs to be supported by your spawner for it to work. 397 | #c.Spawner.cpu_limit = None 398 | 399 | ## Enable debug-logging of the single-user server 400 | #c.Spawner.debug = False 401 | 402 | ## The URL the single-user server should start in. 403 | # 404 | # `{username}` will be expanded to the user's username 405 | # 406 | # Example uses: 407 | # 408 | # - You can set `notebook_dir` to `/` and `default_url` to `/tree/home/{username}` to allow people to 409 | # navigate the whole filesystem from their notebook server, but still start in their home directory. 410 | # - Start with `/notebooks` instead of `/tree` if `default_url` points to a notebook instead of a directory. 411 | # - You can set this to `/lab` to have JupyterLab start by default, rather than Jupyter Notebook. 412 | c.Spawner.default_url = '/lab' 413 | 414 | ## Disable per-user configuration of single-user servers. 415 | # 416 | # When starting the user's single-user server, any config file found in the 417 | # user's $HOME directory will be ignored. 418 | # 419 | # Note: a user could circumvent this if the user modifies their Python 420 | # environment, such as when they have their own conda environments / virtualenvs 421 | # / containers. 422 | #c.Spawner.disable_user_config = False 423 | 424 | ## Whitelist of environment variables for the single-user server to inherit from 425 | # the JupyterHub process. 
426 | # 427 | # This whitelist is used to ensure that sensitive information in the JupyterHub 428 | # process's environment (such as `CONFIGPROXY_AUTH_TOKEN`) is not passed to the 429 | # single-user server's process. 430 | #c.Spawner.env_keep = ['PATH', 'PYTHONPATH', 'CONDA_ROOT', 'CONDA_DEFAULT_ENV', 'VIRTUAL_ENV', 'LANG', 'LC_ALL'] 431 | c.Spawner.env_keep = ['PATH', 'PYTHONPATH', 'LANG', 'LC_ALL', 'JAVA_HOME', 'ROSIF_JAR', 'HOSTNAME', 'TERM', 'ROS_DISTRO'] 432 | 433 | ## Extra environment variables to set for the single-user server's process. 434 | # 435 | # Environment variables that end up in the single-user server's process come from 3 sources: 436 | # - This `environment` configurable 437 | # - The JupyterHub process' environment variables that are whitelisted in `env_keep` 438 | # - Variables to establish contact between the single-user notebook and the hub (such as JUPYTERHUB_API_TOKEN) 439 | # 440 | # The `environment` configurable should be set by JupyterHub administrators to 441 | # add installation specific environment variables. It is a dict where the key is 442 | # the name of the environment variable, and the value can be a string or a 443 | # callable. If it is a callable, it will be called with one parameter (the 444 | # spawner instance), and should return a string fairly quickly (no blocking 445 | # operations please!). 446 | # 447 | # Note that the spawner class' interface is not guaranteed to be exactly the same 448 | # across upgrades, so if you are using the callable take care to verify it 449 | # continues to work after upgrades! 450 | #c.Spawner.environment = {} 451 | 452 | ## Timeout (in seconds) before giving up on a spawned HTTP server 453 | # 454 | # Once a server has successfully been spawned, this is the amount of time we 455 | # wait before assuming that the server is unable to accept connections. 456 | #c.Spawner.http_timeout = 30 457 | 458 | ## The IP address (or hostname) the single-user server should listen on.
459 | # 460 | # The JupyterHub proxy implementation should be able to send packets to this 461 | # interface. 462 | #c.Spawner.ip = '' 463 | 464 | ## Minimum number of bytes a single-user notebook server is guaranteed to have 465 | # available. 466 | # 467 | # Allows the following suffixes: 468 | # - K -> Kilobytes 469 | # - M -> Megabytes 470 | # - G -> Gigabytes 471 | # - T -> Terabytes 472 | # 473 | # This needs to be supported by your spawner for it to work. 474 | #c.Spawner.mem_guarantee = None 475 | 476 | ## Maximum number of bytes a single-user notebook server is allowed to use. 477 | # 478 | # Allows the following suffixes: 479 | # - K -> Kilobytes 480 | # - M -> Megabytes 481 | # - G -> Gigabytes 482 | # - T -> Terabytes 483 | # 484 | # If the single user server tries to allocate more memory than this, it will 485 | # fail. There is no guarantee that the single-user notebook server will be able 486 | # to allocate this much memory - only that it can not allocate more than this. 487 | # 488 | # This needs to be supported by your spawner for it to work. 489 | #c.Spawner.mem_limit = None 490 | 491 | ## Path to the notebook directory for the single-user server. 492 | # 493 | # The user sees a file listing of this directory when the notebook interface is 494 | # started. The current interface does not easily allow browsing beyond the 495 | # subdirectories in this directory's tree. 496 | # 497 | # `~` will be expanded to the home directory of the user, and {username} will be 498 | # replaced with the name of the user. 499 | # 500 | # Note that this does *not* prevent users from accessing files outside of this 501 | # path! They can do so with many other means. 502 | c.Spawner.notebook_dir = '/opt/ros_hadoop/latest/doc/' 503 | 504 | ## An HTML form for options a user can specify on launching their server. 505 | # 506 | # The surrounding `
` element and the submit button are already provided. 507 | # 508 | # For example: 509 | # 510 | # .. code:: html 511 | # 512 | # Set your key: 513 | # 514 | #
515 | # Choose a letter: 516 | # 520 | # 521 | # The data from this form submission will be passed on to your spawner in 522 | # `self.user_options` 523 | #c.Spawner.options_form = '' 524 | 525 | ## Interval (in seconds) on which to poll the spawner for single-user server's 526 | # status. 527 | # 528 | # At every poll interval, each spawner's `.poll` method is called, which checks 529 | # if the single-user server is still running. If it isn't running, then 530 | # JupyterHub modifies its own state accordingly and removes appropriate routes 531 | # from the configurable proxy. 532 | #c.Spawner.poll_interval = 30 533 | 534 | ## The port for single-user servers to listen on. 535 | # 536 | # Defaults to `0`, which uses a randomly allocated port number each time. 537 | # 538 | # If set to a non-zero value, all Spawners will use the same port, which only 539 | # makes sense if each server is on a different address, e.g. in containers. 540 | # 541 | # New in version 0.7. 542 | #c.Spawner.port = 0 543 | 544 | ## An optional hook function that you can implement to do some bootstrapping work 545 | # before the spawner starts. For example, create a directory for your user or 546 | # load initial content. 547 | # 548 | # This can be set independent of any concrete spawner implementation. 549 | # 550 | # Example:: 551 | # 552 | # from subprocess import check_call 553 | # def my_hook(spawner): 554 | # username = spawner.user.name 555 | # check_call(['./examples/bootstrap-script/bootstrap.sh', username]) 556 | # 557 | # c.Spawner.pre_spawn_hook = my_hook 558 | #c.Spawner.pre_spawn_hook = None 559 | 560 | ## Timeout (in seconds) before giving up on starting of single-user server. 561 | # 562 | # This is the timeout for start to return, not the timeout for the server to 563 | # respond. Callers of spawner.start will assume that startup has failed if it 564 | # takes longer than this. start should return when the server process is started 565 | # and its location is known. 
566 | #c.Spawner.start_timeout = 60 567 | 568 | #------------------------------------------------------------------------------ 569 | # LocalProcessSpawner(Spawner) configuration 570 | #------------------------------------------------------------------------------ 571 | 572 | ## A Spawner that uses `subprocess.Popen` to start single-user servers as local 573 | # processes. 574 | # 575 | # Requires local UNIX users matching the authenticated users to exist. Does not 576 | # work on Windows. 577 | # 578 | # This is the default spawner for JupyterHub. 579 | 580 | ## Seconds to wait for single-user server process to halt after SIGINT. 581 | # 582 | # If the process has not exited cleanly after this many seconds, a SIGTERM is 583 | # sent. 584 | #c.LocalProcessSpawner.interrupt_timeout = 10 585 | 586 | ## Seconds to wait for process to halt after SIGKILL before giving up. 587 | # 588 | # If the process does not exit cleanly after this many seconds of SIGKILL, it 589 | # becomes a zombie process. The hub process will log a warning and then give up. 590 | #c.LocalProcessSpawner.kill_timeout = 5 591 | 592 | ## Extra keyword arguments to pass to Popen 593 | # 594 | # when spawning single-user servers. 595 | # 596 | # For example:: 597 | # 598 | # popen_kwargs = dict(shell=True) 599 | #c.LocalProcessSpawner.popen_kwargs = {} 600 | 601 | ## Seconds to wait for single-user server process to halt after SIGTERM. 602 | # 603 | # If the process does not exit cleanly after this many seconds of SIGTERM, a 604 | # SIGKILL is sent. 605 | #c.LocalProcessSpawner.term_timeout = 5 606 | 607 | #------------------------------------------------------------------------------ 608 | # Authenticator(LoggingConfigurable) configuration 609 | #------------------------------------------------------------------------------ 610 | 611 | ## Base class for implementing an authentication provider for JupyterHub 612 | 613 | ## Set of users that will have admin rights on this JupyterHub. 
614 | # 615 | # Admin users have extra privileges: 616 | # - Use the admin panel to see the list of users logged in 617 | # - Add / remove users in some authenticators 618 | # - Restart / halt the hub 619 | # - Start / stop users' single-user servers 620 | # - Can access each individual user's single-user server (if configured) 621 | # 622 | # Admin access should be treated the same way root access is. 623 | # 624 | # Defaults to an empty set, in which case no user has admin access. 625 | #c.Authenticator.admin_users = set() 626 | 627 | ## Automatically begin the login process 628 | # 629 | # rather than starting with a "Login with..." link at `/hub/login` 630 | # 631 | # To work, `.login_url()` must give a URL other than the default `/hub/login`, 632 | # such as an oauth handler or another automatic login handler, registered with 633 | # `.get_handlers()`. 634 | # 635 | # .. versionadded:: 0.8 636 | #c.Authenticator.auto_login = False 637 | 638 | ## Enable persisting auth_state (if available). 639 | # 640 | # auth_state will be encrypted and stored in the Hub's database. This can 641 | # include things like authentication tokens, etc. to be passed to Spawners as 642 | # environment variables. 643 | # 644 | # Encrypting auth_state requires the cryptography package. 645 | # 646 | # Additionally, the JUPYTERHUB_CRYPTO_KEY environment variable must contain one 647 | # (or more, separated by ;) 32B encryption keys. These can be either base64 or 648 | # hex-encoded. 649 | # 650 | # If encryption is unavailable, auth_state cannot be persisted. 651 | # 652 | # New in JupyterHub 0.8 653 | #c.Authenticator.enable_auth_state = False 654 | 655 | ## Dictionary mapping authenticator usernames to JupyterHub users. 656 | # 657 | # Primarily used to normalize OAuth user names to local users. 658 | #c.Authenticator.username_map = {} 659 | 660 | ## Regular expression pattern that all valid usernames must match. 
661 | # 662 | # If a username does not match the pattern specified here, authentication will 663 | # not be attempted. 664 | # 665 | # If not set, allow any username. 666 | #c.Authenticator.username_pattern = '' 667 | 668 | ## Whitelist of usernames that are allowed to log in. 669 | # 670 | # Use this with supported authenticators to restrict which users can log in. 671 | # This is an additional whitelist that further restricts users, beyond whatever 672 | # restrictions the authenticator has in place. 673 | # 674 | # If empty, does not perform any additional restriction. 675 | #c.Authenticator.whitelist = set() 676 | 677 | #------------------------------------------------------------------------------ 678 | # LocalAuthenticator(Authenticator) configuration 679 | #------------------------------------------------------------------------------ 680 | 681 | ## Base class for Authenticators that work with local Linux/UNIX users 682 | # 683 | # Checks for local users, and can attempt to create them if they do not exist. 684 | 685 | ## The command to use for creating users as a list of strings 686 | # 687 | # For each element in the list, the string USERNAME will be replaced with the 688 | # user's username. The username will also be appended as the final argument. 689 | # 690 | # For Linux, the default value is: 691 | # 692 | # ['adduser', '-q', '--gecos', '""', '--disabled-password'] 693 | # 694 | # To specify a custom home directory, set this to: 695 | # 696 | # ['adduser', '-q', '--gecos', '""', '--home', '/customhome/USERNAME', 697 | # '--disabled-password'] 698 | # 699 | # This will run the command: 700 | # 701 | # adduser -q --gecos "" --home /customhome/river --disabled-password river 702 | # 703 | # when the user 'river' is created. 704 | #c.LocalAuthenticator.add_user_cmd = [] 705 | 706 | ## If set to True, will attempt to create local system users if they do not exist 707 | # already. 708 | # 709 | # Supports Linux and BSD variants only. 
710 | #c.LocalAuthenticator.create_system_users = False 711 | 712 | ## Whitelist all users from this UNIX group. 713 | # 714 | # This makes the username whitelist ineffective. 715 | #c.LocalAuthenticator.group_whitelist = set() 716 | 717 | #------------------------------------------------------------------------------ 718 | # PAMAuthenticator(LocalAuthenticator) configuration 719 | #------------------------------------------------------------------------------ 720 | 721 | ## Authenticate local UNIX users with PAM 722 | 723 | ## The text encoding to use when communicating with PAM 724 | #c.PAMAuthenticator.encoding = 'utf8' 725 | 726 | ## Whether to open a new PAM session when spawners are started. 727 | # 728 | # This may trigger things like mounting shared filesystems, loading credentials, 729 | # etc. depending on system configuration, but it does not always work. 730 | # 731 | # If any errors are encountered when opening/closing PAM sessions, this is 732 | # automatically set to False. 733 | #c.PAMAuthenticator.open_sessions = True 734 | 735 | ## The name of the PAM service to use for authentication 736 | #c.PAMAuthenticator.service = 'login' 737 | 738 | #------------------------------------------------------------------------------ 739 | # CryptKeeper(SingletonConfigurable) configuration 740 | #------------------------------------------------------------------------------ 741 | 742 | ## Encapsulate encryption configuration 743 | # 744 | # Use via the encryption_config singleton below. 
745 | 746 | ## 747 | #c.CryptKeeper.keys = [] 748 | 749 | ## The number of threads to allocate for encryption 750 | #c.CryptKeeper.n_threads = 4 751 | -------------------------------------------------------------------------------- /deploy/docker/flux/lib/protobuf-java-3.3.0.jar: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/flux-project/flux/0e48aaff31b0ee626e3a2ae507af953658dbcd85/deploy/docker/flux/lib/protobuf-java-3.3.0.jar -------------------------------------------------------------------------------- /deploy/docker/flux/lib/rosbaginputformat.jar: -------------------------------------------------------------------------------- 1 | rosbaginputformat_2.11-0.9.8.jar -------------------------------------------------------------------------------- /deploy/docker/flux/lib/rosbaginputformat_2.11-0.9.8.jar: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/flux-project/flux/0e48aaff31b0ee626e3a2ae507af953658dbcd85/deploy/docker/flux/lib/rosbaginputformat_2.11-0.9.8.jar -------------------------------------------------------------------------------- /deploy/docker/flux/lib/scala-library-2.11.8.jar: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/flux-project/flux/0e48aaff31b0ee626e3a2ae507af953658dbcd85/deploy/docker/flux/lib/scala-library-2.11.8.jar -------------------------------------------------------------------------------- /deploy/docker/flux/spark-ex-kubernetes.sh: -------------------------------------------------------------------------------- 1 | ## 2 | ## 3 | 4 | # Here is the working version on MyMac 5 | 6 | bin/spark-submit \ 7 | --master k8s://https://192.168.1.40:6443 \ 8 | --deploy-mode cluster \ 9 | --name spark-pi \ 10 | --class org.apache.spark.examples.SparkPi \ 11 | --conf spark.executor.instances=1 \ 12 | --conf 
spark.kubernetes.container.image=seunghan/spark_k8s/spark:test_0.1 \ 13 | local:///opt/spark/examples/jars/spark-examples_2.11-2.3.0.jar 14 | 15 | # k8s://https://: 16 | #spark-submit \ 17 | # --master k8s://https://192.168.1.40:6443 \ 18 | # --deploy-mode cluster \ 19 | # --name spark-pi \ 20 | # --class org.apache.spark.examples.SparkPi \ 21 | # --jars https://path/to/dependency1.jar,https://path/to/dependency2.jar 22 | # --files hdfs://host:port/path/to/file1,hdfs://host:port/path/to/file2 23 | # --conf spark.executor.instances=5 \ 24 | # --conf spark.kubernetes.container.image= \ 25 | # https://path/to/examples.jar 26 | 27 | # https://apache-spark-on-k8s.github.io/userdocs/running-on-kubernetes.html 28 | #bin/spark-submit \ 29 | # --deploy-mode cluster \ 30 | # --class org.apache.spark.examples.SparkPi \ 31 | # --master k8s://https://: \ 32 | # --kubernetes-namespace default \ 33 | # --conf spark.executor.instances=5 \ 34 | # --conf spark.app.name=spark-pi \ 35 | # --conf spark.kubernetes.driver.docker.image=kubespark/spark-driver:v2.2.0-kubernetes-0.5.0 \ 36 | # --conf spark.kubernetes.executor.docker.image=kubespark/spark-executor:v2.2.0-kubernetes-0.5.0 \ 37 | # local:///opt/spark/examples/jars/spark-examples_2.11-2.2.0-k8s-0.5.0.jar 38 | 39 | spark-submit \ 40 | --master k8s://https://192.168.1.40:6443 \ 41 | --deploy-mode cluster \ 42 | --name spark-pi \ 43 | --class org.apache.spark.examples.SparkPi \ 44 | --conf spark.executor.instances=5 \ 45 | --conf spark.kubernetes.container.image=anantpukale/spark_app:1.1 \ 46 | local:///home/flux/spark-2.3.0-bin-hadoop2.7/examples/jars/spark-examples_2.11-2.3.0.jar 47 | 48 | 49 | # Directly on mac 50 | # /opt/spark/ 51 | 52 | bin/spark-submit \ 53 | --master k8s://https://192.168.1.40:6443 \ 54 | --deploy-mode cluster \ 55 | --name spark-pi \ 56 | --class org.apache.spark.examples.SparkPi \ 57 | --conf spark.executor.instances=5 \ 58 | --conf 
spark.kubernetes.container.image=kubespark/spark-driver:v2.2.0-kubernetes-0.5.0 \ 59 | local:///opt/spark/examples/jars/spark-examples_2.11-2.3.0.jar 60 | 61 | 62 | 63 | 64 | 65 | ## following commands ... config params doesn't work.. 66 | 67 | spark-submit \ 68 | --master k8s://https://192.168.1.40:6443 \ 69 | --deploy-mode cluster \ 70 | --name spark-pi \ 71 | --class org.apache.spark.examples.SparkPi \ 72 | --conf spark.executor.instances=5 \ 73 | --conf spark.kubernetes.driver.docker.image=kubespark/spark-driver:v2.2.0-kubernetes-0.5.0 \ 74 | --conf spark.kubernetes.executor.docker.image=kubespark/spark-executor:v2.2.0-kubernetes-0.5.0 \ 75 | local:///home/flux/spark-2.3.0-bin-hadoop2.7/examples/jars/spark-examples_2.11-2.3.0.jar 76 | 77 | 78 | bin/spark-submit \ 79 | --deploy-mode cluster \ 80 | --class org.apache.spark.examples.SparkPi \ 81 | --master k8s://https://192.168.1.40:6443 \ 82 | --kubernetes-namespace default \ 83 | --conf spark.executor.instances=5 \ 84 | --conf spark.app.name=spark-pi \ 85 | --conf spark.kubernetes.driver.docker.image=kubespark/spark-driver:v2.2.0-kubernetes-0.5.0 \ 86 | --conf spark.kubernetes.executor.docker.image=kubespark/spark-executor:v2.2.0-kubernetes-0.5.0 \ 87 | local:///opt/spark/examples/jars/spark-examples_2.11-2.2.0-k8s-0.5.0.jar 88 | 89 | 90 | 91 | 92 | bin/spark-submit 93 | --master k8s://https://192.168.1.40:6443 94 | --deploy-mode cluster 95 | --name spark-pi 96 | --class org.apache.spark.examples.SparkPi 97 | --conf spark.executor.instances=5 98 | --conf spark.kubernetes.driver.docker.image=kubespark/spark-driver:v2.2.0-kubernetes-0.5.0 99 | --conf spark.kubernetes.executor.docker.image=kubespark/spark-executor:v2.2.0-kubernetes-0.5.0 100 | local:///opt/spark/examples/jars/spark-examples_2.11-2.3.0.jar 101 | 102 | 103 | 104 | 105 | spark-submit \ 106 | --master k8s://https://192.168.1.40:6443 \ 107 | --deploy-mode cluster \ 108 | --name spark-pi \ 109 | --class org.apache.spark.examples.SparkPi \ 110 | --conf 
spark.executor.instances=1 \ 111 | --conf spark.kubernetes.container.image=seunghan/spark_k8s/spark:test_0.1 \ 112 | local:///home/flux/spark-2.3.0-bin-hadoop2.7/examples/jars/spark-examples_2.11-2.3.0.jar 113 | 114 | 115 | spark-submit \ 116 | --master k8s://https://192.168.1.40:6443 \ 117 | --deploy-mode cluster \ 118 | --name spark-pi \ 119 | --class org.apache.spark.examples.SparkPi \ 120 | --conf spark.executor.instances=1 \ 121 | --conf spark.kubernetes.container.image=seunghan/spark_k8s/spark:test_0.1 \ 122 | local:///opt/apache/spark-2.3.0-bin-hadoop2.7/examples/jars/spark-examples_2.11-2.3.0.jar 123 | -------------------------------------------------------------------------------- /deploy/docker/hdfs4k8s/Dockerfile-datanode: -------------------------------------------------------------------------------- 1 | # Note : Original source of the following dockerfile 2 | # https://github.com/big-data-europe/docker-hadoop/blob/master/datanode/Dockerfile 3 | FROM bde2020/hadoop-base:1.1.0-hadoop2.7.1-java8 4 | 5 | HEALTHCHECK CMD curl -f http://localhost:50075/ || exit 1 6 | 7 | ENV HDFS_CONF_dfs_datanode_data_dir=file:///hadoop/dfs/data 8 | RUN mkdir -p /hadoop/dfs/data 9 | #VOLUME /hadoop/dfs/data 10 | 11 | COPY deploy/docker/hdfs4k8s/run-dn.sh /run.sh 12 | RUN chmod a+x /run.sh 13 | 14 | EXPOSE 50075 15 | 16 | CMD ["/run.sh"] -------------------------------------------------------------------------------- /deploy/docker/hdfs4k8s/Dockerfile-namenode: -------------------------------------------------------------------------------- 1 | # Note : Original source of the following dockerfile 2 | # https://github.com/big-data-europe/docker-hadoop/blob/master/namenode/Dockerfile 3 | FROM bde2020/hadoop-base:1.1.0-hadoop2.7.1-java8 4 | #MAINTAINER Ivan Ermilov 5 | 6 | HEALTHCHECK CMD curl -f http://localhost:50070/ || exit 1 7 | 8 | ENV HDFS_CONF_dfs_namenode_name_dir=file:///hadoop/dfs/name 9 | RUN mkdir -p /hadoop/dfs/name 10 | #VOLUME /hadoop/dfs/name 11 | 12 | COPY 
deploy/docker/hdfs4k8s/run-nn.sh /run.sh 13 | RUN chmod a+x /run.sh 14 | 15 | EXPOSE 50070 16 | 17 | CMD ["/run.sh"] -------------------------------------------------------------------------------- /deploy/docker/hdfs4k8s/run-dn.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | #### 4 | # Original source of the following script 5 | # Source : https://github.com/big-data-europe/docker-hadoop/blob/master/datanode/run.sh 6 | #### 7 | 8 | datadir=`echo $HDFS_CONF_dfs_datanode_data_dir | perl -pe 's#file://##'` 9 | if [ ! -d $datadir ]; then 10 | echo "Datanode data directory not found: $datadir" 11 | exit 2 12 | fi 13 | 14 | $HADOOP_PREFIX/bin/hdfs --config $HADOOP_CONF_DIR datanode 15 | -------------------------------------------------------------------------------- /deploy/docker/hdfs4k8s/run-nn.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | #### 4 | # Original source of the following script 5 | # Source : https://github.com/big-data-europe/docker-hadoop/tree/master/datanode 6 | #### 7 | namedir=`echo $HDFS_CONF_dfs_namenode_name_dir | perl -pe 's#file://##'` 8 | if [ ! 
-d $namedir ]; then 9 | echo "Namenode name directory not found: $namedir" 10 | exit 2 11 | fi 12 | 13 | if [ -z "$CLUSTER_NAME" ]; then 14 | echo "Cluster name not specified" 15 | exit 2 16 | fi 17 | 18 | if [ "`ls -A $namedir`" == "" ]; then 19 | echo "Formatting namenode name directory: $namedir" 20 | $HADOOP_PREFIX/bin/hdfs --config $HADOOP_CONF_DIR namenode -format $CLUSTER_NAME 21 | fi 22 | 23 | $HADOOP_PREFIX/bin/hdfs --config $HADOOP_CONF_DIR namenode 24 | -------------------------------------------------------------------------------- /deploy/docker/ros_base/Dockerfile: -------------------------------------------------------------------------------- 1 | # This is an auto generated Dockerfile for ros:ros-core 2 | # generated from docker_images/create_ros_core_image.Dockerfile.em 3 | FROM ubuntu:xenial 4 | #FROM nvidia/cuda:9.0-cudnn7-devel-ubuntu16.04 5 | #FROM nvidia/cuda:9.0-cudnn7-runtime-ubuntu16.04 6 | 7 | # install packages 8 | RUN apt-get update && apt-get install -y --no-install-recommends \ 9 | dirmngr \ 10 | gnupg2 \ 11 | && rm -rf /var/lib/apt/lists/* 12 | 13 | # setup keys 14 | RUN apt-key adv --keyserver hkp://keyserver.ubuntu.com:80 --recv-keys 421C365BD9FF1F717815A3895523BAEEB01FA116 15 | 16 | # setup sources.list 17 | RUN echo "deb http://packages.ros.org/ros/ubuntu xenial main" > /etc/apt/sources.list.d/ros-latest.list 18 | 19 | # install bootstrap tools 20 | RUN apt-get update && apt-get install --no-install-recommends -y \ 21 | python-rosdep \ 22 | python-rosinstall \ 23 | python-vcstools \ 24 | && rm -rf /var/lib/apt/lists/* 25 | 26 | # setup environment 27 | ENV LANG C.UTF-8 28 | ENV LC_ALL C.UTF-8 29 | 30 | # bootstrap rosdep 31 | RUN rosdep init \ 32 | && rosdep update 33 | 34 | # install ros packages 35 | ENV ROS_DISTRO kinetic 36 | RUN apt-get update && apt-get install -y \ 37 | ros-kinetic-ros-core=1.3.2-0* \ 38 | && rm -rf /var/lib/apt/lists/* 39 | 40 | # setup entrypoint 41 | COPY ros_entrypoint.sh / 42 | 43 | ENTRYPOINT 
["/ros_entrypoint.sh"] 44 | CMD ["bash"] 45 | -------------------------------------------------------------------------------- /deploy/docker/ros_base/Dockerfile-gpu: -------------------------------------------------------------------------------- 1 | # This is an auto generated Dockerfile for ros:ros-core 2 | # generated from docker_images/create_ros_core_image.Dockerfile.em 3 | #FROM ubuntu:xenial 4 | #FROM nvidia/cuda:9.0-cudnn7-devel-ubuntu16.04 5 | FROM nvidia/cuda:9.0-cudnn7-runtime-ubuntu16.04 6 | 7 | # install packages 8 | RUN apt-get update && apt-get install -y --no-install-recommends \ 9 | dirmngr \ 10 | gnupg2 \ 11 | && rm -rf /var/lib/apt/lists/* 12 | 13 | # setup keys 14 | RUN apt-key adv --keyserver hkp://keyserver.ubuntu.com:80 --recv-keys 421C365BD9FF1F717815A3895523BAEEB01FA116 15 | 16 | # setup sources.list 17 | RUN echo "deb http://packages.ros.org/ros/ubuntu xenial main" > /etc/apt/sources.list.d/ros-latest.list 18 | 19 | # install bootstrap tools 20 | RUN apt-get update && apt-get install --no-install-recommends -y \ 21 | python-rosdep \ 22 | python-rosinstall \ 23 | python-vcstools \ 24 | && rm -rf /var/lib/apt/lists/* 25 | 26 | # setup environment 27 | ENV LANG C.UTF-8 28 | ENV LC_ALL C.UTF-8 29 | 30 | # bootstrap rosdep 31 | RUN rosdep init \ 32 | && rosdep update 33 | 34 | # install ros packages 35 | ENV ROS_DISTRO kinetic 36 | RUN apt-get update && apt-get install -y \ 37 | ros-kinetic-ros-core=1.3.2-0* \ 38 | && rm -rf /var/lib/apt/lists/* 39 | 40 | # setup entrypoint 41 | COPY ros_entrypoint.sh / 42 | 43 | ENTRYPOINT ["/ros_entrypoint.sh"] 44 | CMD ["bash"] 45 | -------------------------------------------------------------------------------- /deploy/docker/ros_base/README.txt: -------------------------------------------------------------------------------- 1 | 2 | ## ROS Dockerfile source 3 | 4 | https://github.com/osrf/docker_images/blob/f2b13092747c0f60cf7608369b57ea89bc01e22d/ros/kinetic/ubuntu/xenial/ros-core/Dockerfile 5 | 6 | 7 | 
-------------------------------------------------------------------------------- /deploy/docker/ros_base/ros_entrypoint.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | set -e 3 | 4 | # setup ros environment 5 | source "/opt/ros/$ROS_DISTRO/setup.bash" 6 | exec "$@" 7 | -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/README.md: -------------------------------------------------------------------------------- 1 | # Distributed multi-node HDFS set up on kubernetes 2 | 3 | ### Helm package 4 | To package the kubernetes components with helm one needs only the helm client. 5 | If you do not have helm already, download it and run ```helm init -c``` once (just ```helm init``` if tiller is not already installed); this creates a .helm folder structure in your $HOME 6 | 7 | Note: On a cluster using Ubuntu OS run the following 8 | ```bash 9 | kubectl patch deploy --namespace kube-system tiller-deploy -p '{"spec":{"template":{"spec":{"serviceAccount":"tiller"}}}}' 10 | ``` 11 | 12 | Lint the helm packages 13 | ```bash 14 | helm lint $(./flux) hdfs-pvc/ 15 | helm lint $(./flux) hdfs-flux/ 16 | ``` 17 | 18 | Package the helm charts as follows 19 | ```bash 20 | helm package hdfs-pvc/ 21 | helm package hdfs-flux/ 22 | ``` 23 | 24 | ### Flux namespace 25 | 26 | All components assume a kubernetes namespace flux. 27 | ```bash 28 | kubectl create namespace flux 29 | ``` 30 | 31 | ### Install HDFS 32 | 33 | Label one kubernetes node as hdfs-namenode 34 | ```bash 35 | kubectl label no <node-name> hdfs-namenode-selector=hdfs-namenode 36 | ``` 37 | Label a list of kubernetes nodes as hdfs-datanode 38 | ```bash 39 | kubectl label no <node-name> hdfs-datanode-selector=hdfs-datanode 40 | # ... 41 | ``` 42 | 43 | NOTE: If you need to specify a persistent volume manually, install the `hdfs-pv` helm package. (By default namenode and datanode will use `/tmp/name` and `/tmp/data` on host machines. 
You can customize the path as shown in the `install` command below.) 44 | 45 | ```bash 46 | helm lint $(./flux) hdfs-pv/ 47 | helm package hdfs-pv/ 48 | helm install --name hdfs-pv $(./flux) --set flux.datanode_host_path="/path/to/storage/dn" --set flux.namenode_host_path="/path/to/storage/nn" hdfs-pv-0.2.0.tgz 49 | ``` 50 | 51 | Install the helm packages 52 | ```bash 53 | helm install --name=hdfs-pvc $(./flux) hdfs-pvc-0.2.0.tgz 54 | helm install --name=hdfs $(./flux) ./hdfs-flux-0.2.0.tgz 55 | ``` 56 | 57 | Connect to a datanode and create the HDFS directories 58 | ```bash 59 | kubectl exec -it -n flux datanode-0 -- hdfs dfs -mkdir -p /user/flux 60 | ``` 61 | 62 | Delete the hdfs pods and services 63 | ```bash 64 | helm delete --purge hdfs 65 | ``` 66 | 67 | Delete the hdfs PersistentVolumeClaim 68 | ```bash 69 | helm delete --purge hdfs-pvc 70 | ``` 71 | 72 | Delete the hdfs PersistentVolume 73 | ```bash 74 | helm delete --purge hdfs-pv 75 | ``` 76 | -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/flux: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env bash 2 | 3 | NODES=$(kubectl get nodes -o jsonpath='{.items..metadata.name}') 4 | NODES_CNT=$(echo "${NODES}" | tr ' ' '\n' | wc -l | xargs echo -n) 5 | NAMENODES=$(kubectl get nodes -o jsonpath="{.items[?(@.metadata.labels['hdfs-namenode-selector'])]..metadata.name}" | tr ' ' ',') 6 | NAMENODES_CNT=$(echo "${NAMENODES}" | tr ',' '\n' | wc -l | xargs echo -n) 7 | DATANODES=$(kubectl get nodes -o jsonpath="{.items[?(@.metadata.labels['hdfs-datanode-selector'])]..metadata.name}" | tr ' ' ',') 8 | DATANODES_CNT=$(echo "${DATANODES}" | tr ',' '\n' | wc -l | xargs echo -n) 9 | NAMENODE_HOST_PATH='/tmp' 10 | DATANODE_HOST_PATH='/tmp' 11 | #echo "Nodes: ${NODES}" 12 | #echo "Namenodes: ${NAMENODES}" 13 | #echo "DataNodes: ${DATANODES}" 14 | #echo "Namenodes hostpath: ${NAMENODE_HOST_PATH}" 15 | #echo 
"Datanodes hostpath: ${DATANODE_HOST_PATH}" 16 | echo -n "--set flux.datanodes_cnt=${DATANODES_CNT} --set flux.datanodes={${DATANODES}} --set flux.namenodes={${NAMENODES}} " 17 | #--set flux.datanode.host_path=${DATANODE_HOST_PATH} --set flux.namenode_host_path=${NAMENODE_HOST_PATH} " 18 | -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/flux-init: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env bash 2 | kubectl create ns flux 3 | -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/hdfs-flux/.helmignore: -------------------------------------------------------------------------------- 1 | # Patterns to ignore when building packages. 2 | # This supports shell glob matching, relative path matching, and 3 | # negation (prefixed with !). Only one pattern per line. 4 | .DS_Store 5 | # Common VCS dirs 6 | .git/ 7 | .gitignore 8 | .bzr/ 9 | .bzrignore 10 | .hg/ 11 | .hgignore 12 | .svn/ 13 | # Common backup files 14 | *.swp 15 | *.bak 16 | *.tmp 17 | *~ 18 | # Various IDEs 19 | .project 20 | .idea/ 21 | *.tmproj 22 | -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/hdfs-flux/Chart.yaml: -------------------------------------------------------------------------------- 1 | apiVersion: v1 2 | appVersion: "1.0" 3 | description: HDFS Helm chart for Kubernetes 4 | name: hdfs-flux 5 | version: 0.2.0 6 | home: https://hadoop.apache.org/ 7 | sources: 8 | - https://github.com/apache/hadoop 9 | icon: http://hadoop.apache.org/images/hadoop-logo.jpg 10 | -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/hdfs-flux/templates/NOTES.txt: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/flux-project/flux/0e48aaff31b0ee626e3a2ae507af953658dbcd85/deploy/kubernetes/distributed/hdfs-flux/templates/NOTES.txt -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/hdfs-flux/templates/_helpers.tpl: -------------------------------------------------------------------------------- 1 | {{/* vim: set filetype=mustache: */}} 2 | {{/* 3 | Expand the name of the chart. 4 | */}} 5 | {{- define "hdfs-flux.name" -}} 6 | {{- default .Chart.Name .Values.nameOverride | trunc 63 | trimSuffix "-" -}} 7 | {{- end -}} 8 | 9 | {{/* 10 | Create a default fully qualified app name. 11 | We truncate at 63 chars because some Kubernetes name fields are limited to this (by the DNS naming spec). 12 | If release name contains chart name it will be used as a full name. 13 | */}} 14 | {{- define "hdfs-flux.fullname" -}} 15 | {{- if .Values.fullnameOverride -}} 16 | {{- .Values.fullnameOverride | trunc 63 | trimSuffix "-" -}} 17 | {{- else -}} 18 | {{- $name := default .Chart.Name .Values.nameOverride -}} 19 | {{- if contains $name .Release.Name -}} 20 | {{- .Release.Name | trunc 63 | trimSuffix "-" -}} 21 | {{- else -}} 22 | {{- printf "%s-%s" .Release.Name $name | trunc 63 | trimSuffix "-" -}} 23 | {{- end -}} 24 | {{- end -}} 25 | {{- end -}} 26 | 27 | {{/* 28 | Create chart name and version as used by the chart label. 
29 | */}} 30 | {{- define "hdfs-flux.chart" -}} 31 | {{- printf "%s-%s" .Chart.Name .Chart.Version | replace "+" "_" | trunc 63 | trimSuffix "-" -}} 32 | {{- end -}} 33 | -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/hdfs-flux/templates/dn-ds.yaml: -------------------------------------------------------------------------------- 1 | apiVersion: v1 2 | kind: Service 3 | metadata: 4 | name: datanode 5 | namespace: flux 6 | spec: 7 | ports: 8 | - name: dfs 9 | port: 50020 10 | protocol: TCP 11 | - name: datatransfer 12 | port: 50010 13 | protocol: TCP 14 | - name: webhdfs 15 | port: 50075 16 | clusterIP: None 17 | selector: 18 | name: datanode 19 | app: flux-dn 20 | 21 | --- 22 | apiVersion: apps/v1 23 | kind: StatefulSet 24 | metadata: 25 | name: datanode 26 | namespace: flux 27 | spec: 28 | selector: 29 | matchLabels: 30 | name: datanode 31 | app: flux-dn 32 | serviceName: datanode 33 | replicas: {{ .Values.flux.datanodes_cnt }} 34 | template: 35 | metadata: 36 | labels: 37 | name: datanode 38 | app: flux-dn 39 | spec: 40 | dnsPolicy: ClusterFirstWithHostNet 41 | containers: 42 | - name: datanode 43 | image: {{ .Values.image.datanode }} 44 | hostname: datanode 45 | ports: 46 | - containerPort: 50075 47 | - containerPort: 50010 48 | - containerPort: 50020 49 | envFrom: 50 | - configMapRef: 51 | name: hadoop-cm 52 | volumeMounts: 53 | - name: datanode-volume 54 | mountPath: /hadoop/dfs 55 | nodeSelector: 56 | hdfs-datanode-selector: hdfs-datanode 57 | volumeClaimTemplates: 58 | - metadata: 59 | name: datanode-volume 60 | spec: 61 | accessModes: 62 | - ReadWriteOnce 63 | selector: 64 | matchLabels: 65 | datanode-pv-label: pvc-hdfs-dn 66 | 67 | -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/hdfs-flux/templates/hdfs-cm.yaml: -------------------------------------------------------------------------------- 1 | apiVersion: v1 2 | data: 3 | 
CORE_CONF_fs_defaultFS: hdfs://namenode:8020 4 | CORE_CONF_hadoop_http_staticuser_user: root 5 | CORE_CONF_hadoop_proxyuser_hue_groups: '*' 6 | CORE_CONF_hadoop_proxyuser_hue_hosts: '*' 7 | HDFS_CONF_dfs_permissions_enabled: "false" 8 | HDFS_CONF_dfs_webhdfs_enabled: "true" 9 | HDFS_CONF_dfs_namenode_datanode_registration_ip___hostname___check: "false" 10 | kind: ConfigMap 11 | metadata: 12 | name: hadoop-cm 13 | namespace: flux 14 | 15 | -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/hdfs-flux/templates/nn-pod.yaml: -------------------------------------------------------------------------------- 1 | apiVersion: v1 2 | kind: Pod 3 | metadata: 4 | name: namenode 5 | namespace: flux 6 | labels: 7 | app: flux-nn 8 | chart: {{ .Chart.Name }}-{{ .Chart.Version | replace "+" "_"}} 9 | release: {{ .Release.Name }} 10 | heritage: {{ .Release.Service }} 11 | spec: 12 | hostNetwork: false 13 | hostPID: true 14 | dnsPolicy: ClusterFirstWithHostNet 15 | containers: 16 | - name: namenode 17 | replicas: 1 18 | image: {{ .Values.image.namenode }} 19 | hostname: namenode 20 | ports: 21 | - containerPort: 50070 22 | - containerPort: 8020 23 | env: 24 | - name: CLUSTER_NAME 25 | value: flux-cluster 26 | envFrom: 27 | - configMapRef: 28 | name: hadoop-cm 29 | volumeMounts: 30 | - name: namenode-volume 31 | mountPath: /hadoop/dfs 32 | volumes: 33 | - name: namenode-volume 34 | persistentVolumeClaim: 35 | claimName: namenode-volume-namenode-0 36 | nodeSelector: 37 | hdfs-namenode-selector: hdfs-namenode 38 | 39 | -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/hdfs-flux/templates/nn-svc.yaml: -------------------------------------------------------------------------------- 1 | apiVersion: v1 2 | kind: Service 3 | metadata: 4 | name: namenode 5 | namespace: flux 6 | labels: 7 | app: flux-nn 8 | chart: {{ .Chart.Name }}-{{ .Chart.Version | replace "+" "_"}} 9 | 
release: {{ .Release.Name }} 10 | heritage: {{ .Release.Service }} 11 | spec: 12 | ports: 13 | - protocol: TCP 14 | port: 8020 15 | name: namenode-port 16 | - protocol: TCP 17 | port: 50070 18 | name: namenode-port-ui 19 | clusterIP: None 20 | selector: 21 | app: flux-nn 22 | release: {{ .Release.Name }} 23 | -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/hdfs-flux/values.yaml: -------------------------------------------------------------------------------- 1 | # Default values for hdfs-flux. 2 | # This is a YAML-formatted file. 3 | # Declare variables to be passed into your templates. 4 | 5 | replicaCount: 1 6 | 7 | image: 8 | datanode: bde2020/hadoop-datanode:1.1.0-hadoop2.8-java8 9 | namenode: bde2020/hadoop-namenode:1.1.0-hadoop2.8-java8 10 | 11 | persistence: 12 | datanode: 13 | accessMode: ReadWriteOnce 14 | size: 10Gi 15 | namenode: 16 | accessMode: ReadWriteOnce 17 | size: 10Gi 18 | 19 | -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/hdfs-pv/.helmignore: -------------------------------------------------------------------------------- 1 | # Patterns to ignore when building packages. 2 | # This supports shell glob matching, relative path matching, and 3 | # negation (prefixed with !). Only one pattern per line. 
4 | .DS_Store 5 | # Common VCS dirs 6 | .git/ 7 | .gitignore 8 | .bzr/ 9 | .bzrignore 10 | .hg/ 11 | .hgignore 12 | .svn/ 13 | # Common backup files 14 | *.swp 15 | *.bak 16 | *.tmp 17 | *~ 18 | # Various IDEs 19 | .project 20 | .idea/ 21 | *.tmproj 22 | -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/hdfs-pv/Chart.yaml: -------------------------------------------------------------------------------- 1 | apiVersion: v1 2 | appVersion: "1.0" 3 | description: HDFS PV Helm chart for Kubernetes 4 | name: hdfs-pv 5 | version: 0.2.0 6 | home: https://github.com/flux-project/flux 7 | sources: 8 | - https://github.com/flux-project/flux 9 | icon: http://hadoop.apache.org/images/hadoop-logo.jpg 10 | -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/hdfs-pv/templates/NOTES.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/flux-project/flux/0e48aaff31b0ee626e3a2ae507af953658dbcd85/deploy/kubernetes/distributed/hdfs-pv/templates/NOTES.txt -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/hdfs-pv/templates/_helpers.tpl: -------------------------------------------------------------------------------- 1 | {{/* vim: set filetype=mustache: */}} 2 | {{/* 3 | Expand the name of the chart. 4 | */}} 5 | {{- define "hdfs-pv.name" -}} 6 | {{- default .Chart.Name .Values.nameOverride | trunc 63 | trimSuffix "-" -}} 7 | {{- end -}} 8 | 9 | {{/* 10 | Create a default fully qualified app name. 11 | We truncate at 63 chars because some Kubernetes name fields are limited to this (by the DNS naming spec). 12 | If release name contains chart name it will be used as a full name. 
13 | */}} 14 | {{- define "hdfs-pv.fullname" -}} 15 | {{- if .Values.fullnameOverride -}} 16 | {{- .Values.fullnameOverride | trunc 63 | trimSuffix "-" -}} 17 | {{- else -}} 18 | {{- $name := default .Chart.Name .Values.nameOverride -}} 19 | {{- if contains $name .Release.Name -}} 20 | {{- .Release.Name | trunc 63 | trimSuffix "-" -}} 21 | {{- else -}} 22 | {{- printf "%s-%s" .Release.Name $name | trunc 63 | trimSuffix "-" -}} 23 | {{- end -}} 24 | {{- end -}} 25 | {{- end -}} 26 | 27 | {{/* 28 | Create chart name and version as used by the chart label. 29 | */}} 30 | {{- define "hdfs-pv.chart" -}} 31 | {{- printf "%s-%s" .Chart.Name .Chart.Version | replace "+" "_" | trunc 63 | trimSuffix "-" -}} 32 | {{- end -}} 33 | -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/hdfs-pv/templates/dn-pv.yaml: -------------------------------------------------------------------------------- 1 | {{- range $i,$dn := .Values.flux.datanodes }} 2 | --- 3 | kind: PersistentVolume 4 | apiVersion: v1 5 | metadata: 6 | name: datanode-volume-datanode-{{ $i }} 7 | labels: 8 | type: local 9 | spec: 10 | capacity: 11 | storage: {{ $.Values.persistence.datanode.size |quote }} 12 | accessModes: 13 | - {{ $.Values.persistence.datanode.accessMode | quote }} 14 | hostPath: 15 | path: {{ $.Values.flux.datanode_host_path | default "/tmp/data" | quote }} 16 | {{- end}} 17 | -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/hdfs-pv/templates/nn-pv.yaml: -------------------------------------------------------------------------------- 1 | kind: PersistentVolume 2 | apiVersion: v1 3 | metadata: 4 | name: namenode-volume-namenode-0 5 | labels: 6 | type: local 7 | spec: 8 | capacity: 9 | storage: {{ .Values.persistence.namenode.size |quote }} 10 | accessModes: 11 | - {{ .Values.persistence.namenode.accessMode | quote }} 12 | hostPath: 13 | path: {{ .Values.flux.namenode_host_path | 
default "/tmp/name" | quote }} 14 | 15 | 16 | -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/hdfs-pv/values.yaml: -------------------------------------------------------------------------------- 1 | # Default values for hdfs-pv flux. 2 | # This is a YAML-formatted file. 3 | # Declare variables to be passed into your templates. 4 | 5 | replicaCount: 1 6 | 7 | persistence: 8 | datanode: 9 | accessMode: ReadWriteOnce 10 | size: 10Gi 11 | namenode: 12 | accessMode: ReadWriteOnce 13 | size: 10Gi 14 | 15 | -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/hdfs-pvc/Chart.yaml: -------------------------------------------------------------------------------- 1 | apiVersion: v1 2 | appVersion: "1.0" 3 | description: HDFS Helm chart for Kubernetes 4 | name: hdfs-pvc 5 | version: 0.2.0 6 | home: https://github.com/flux-project/ 7 | sources: 8 | - https://github.com/flux-project/ 9 | icon: http://hadoop.apache.org/images/hadoop-logo.jpg 10 | -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/hdfs-pvc/templates/_helpers.tpl: -------------------------------------------------------------------------------- 1 | {{/* vim: set filetype=mustache: */}} 2 | {{/* 3 | Expand the name of the chart. 4 | */}} 5 | {{- define "hdfs-flux.name" -}} 6 | {{- default .Chart.Name .Values.nameOverride | trunc 63 | trimSuffix "-" -}} 7 | {{- end -}} 8 | 9 | {{/* 10 | Create a default fully qualified app name. 11 | We truncate at 63 chars because some Kubernetes name fields are limited to this (by the DNS naming spec). 12 | If release name contains chart name it will be used as a full name. 
13 | */}} 14 | {{- define "hdfs-flux.fullname" -}} 15 | {{- if .Values.fullnameOverride -}} 16 | {{- .Values.fullnameOverride | trunc 63 | trimSuffix "-" -}} 17 | {{- else -}} 18 | {{- $name := default .Chart.Name .Values.nameOverride -}} 19 | {{- if contains $name .Release.Name -}} 20 | {{- .Release.Name | trunc 63 | trimSuffix "-" -}} 21 | {{- else -}} 22 | {{- printf "%s-%s" .Release.Name $name | trunc 63 | trimSuffix "-" -}} 23 | {{- end -}} 24 | {{- end -}} 25 | {{- end -}} 26 | 27 | {{/* 28 | Create chart name and version as used by the chart label. 29 | */}} 30 | {{- define "hdfs-flux.chart" -}} 31 | {{- printf "%s-%s" .Chart.Name .Chart.Version | replace "+" "_" | trunc 63 | trimSuffix "-" -}} 32 | {{- end -}} 33 | -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/hdfs-pvc/templates/dn-pvc.yaml: -------------------------------------------------------------------------------- 1 | {{- range $i,$dn := .Values.flux.datanodes }} 2 | --- 3 | apiVersion: v1 4 | kind: PersistentVolumeClaim 5 | metadata: 6 | name: datanode-volume-datanode-{{ $i }} 7 | namespace: flux 8 | labels: 9 | datanode-pv-label: pvc-hdfs-dn 10 | app: flux-dn-pvc 11 | chart: {{ $.Chart.Name }}-{{ $.Chart.Version | replace "+" "_"}} 12 | release: {{ $.Release.Name }} 13 | heritage: {{ $.Release.Service }} 14 | spec: 15 | accessModes: 16 | - {{ $.Values.persistence.datanode.accessMode | quote }} 17 | resources: 18 | requests: 19 | storage: {{ $.Values.persistence.datanode.size |quote }} 20 | {{- end }} 21 | -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/hdfs-pvc/templates/nn-pvc.yaml: -------------------------------------------------------------------------------- 1 | apiVersion: v1 2 | kind: PersistentVolumeClaim 3 | metadata: 4 | name: namenode-volume-namenode-0 5 | namespace: flux 6 | labels: 7 | app: flux-nn 8 | chart: {{ .Chart.Name }}-{{ .Chart.Version | replace "+" 
"_"}} 9 | release: {{ .Release.Name }} 10 | heritage: {{ .Release.Service }} 11 | spec: 12 | accessModes: 13 | - {{ .Values.persistence.namenode.accessMode | quote }} 14 | resources: 15 | requests: 16 | storage: {{ .Values.persistence.namenode.size |quote }} 17 | 18 | -------------------------------------------------------------------------------- /deploy/kubernetes/distributed/hdfs-pvc/values.yaml: -------------------------------------------------------------------------------- 1 | # Default values for hdfs-pvc. 2 | # This is a YAML-formatted file. 3 | # Declare variables to be passed into your templates. 4 | 5 | replicaCount: 1 6 | 7 | image: 8 | datanode: fluxproject/hdfs-dn-4k8s:0.1 9 | namenode: fluxproject/hdfs-nn-4k8s:0.1 10 | 11 | persistence: 12 | datanode: 13 | accessMode: ReadWriteOnce 14 | size: 10Gi 15 | namenode: 16 | accessMode: ReadWriteOnce 17 | size: 10Gi 18 | 19 | -------------------------------------------------------------------------------- /deploy/kubernetes/flux-ros-hadoop-deployment.yml: -------------------------------------------------------------------------------- 1 | apiVersion: extensions/v1beta1 2 | kind: Deployment 3 | metadata: 4 | annotations: 5 | deployment.kubernetes.io/revision: "1" 6 | creationTimestamp: null 7 | generation: 1 8 | labels: 9 | run: flux-ros-hadoop 10 | name: flux-ros-hadoop 11 | selfLink: /apis/extensions/v1beta1/namespaces/default/deployments/flux-ros-hadoop 12 | spec: 13 | replicas: 1 14 | selector: 15 | matchLabels: 16 | run: flux-ros-hadoop 17 | strategy: 18 | rollingUpdate: 19 | maxSurge: 1 20 | maxUnavailable: 1 21 | type: RollingUpdate 22 | template: 23 | metadata: 24 | creationTimestamp: null 25 | labels: 26 | run: flux-ros-hadoop 27 | spec: 28 | containers: 29 | - image: fluxproject/examples 30 | imagePullPolicy: IfNotPresent 31 | name: flux-ros-hadoop 32 | ports: 33 | - containerPort: 8000 34 | protocol: TCP 35 | terminationMessagePath: /dev/termination-log 36 | terminationMessagePolicy: File 37 | 
dnsPolicy: ClusterFirst 38 | restartPolicy: Always 39 | schedulerName: default-scheduler 40 | securityContext: {} 41 | terminationGracePeriodSeconds: 30 42 | status: {} 43 | -------------------------------------------------------------------------------- /deploy/kubernetes/flux-ros-hadoop-gpu-deployment.yml: -------------------------------------------------------------------------------- 1 | apiVersion: extensions/v1beta1 2 | kind: Deployment 3 | metadata: 4 | annotations: 5 | deployment.kubernetes.io/revision: "1" 6 | creationTimestamp: null 7 | generation: 1 8 | labels: 9 | run: flux-ros-hadoop-gpu 10 | name: flux-ros-hadoop-gpu 11 | selfLink: /apis/extensions/v1beta1/namespaces/default/deployments/flux-ros-hadoop-gpu 12 | spec: 13 | replicas: 1 14 | selector: 15 | matchLabels: 16 | run: flux-ros-hadoop-gpu 17 | strategy: 18 | rollingUpdate: 19 | maxSurge: 1 20 | maxUnavailable: 1 21 | type: RollingUpdate 22 | template: 23 | metadata: 24 | creationTimestamp: null 25 | labels: 26 | run: flux-ros-hadoop-gpu 27 | spec: 28 | containers: 29 | - image: fluxproject/examples_gpu 30 | imagePullPolicy: IfNotPresent 31 | name: flux-ros-hadoop-gpu 32 | ports: 33 | - containerPort: 8000 34 | protocol: TCP 35 | resources: 36 | limits: 37 | nvidia.com/gpu: 1 38 | requests: 39 | nvidia.com/gpu: 1 40 | terminationMessagePath: /dev/termination-log 41 | terminationMessagePolicy: File 42 | dnsPolicy: ClusterFirst 43 | restartPolicy: Always 44 | schedulerName: default-scheduler 45 | securityContext: {} 46 | terminationGracePeriodSeconds: 30 47 | status: {} 48 | -------------------------------------------------------------------------------- /deploy/kubernetes/flux-ros-hadoop-gpu-service.yml: -------------------------------------------------------------------------------- 1 | apiVersion: v1 2 | kind: Service 3 | metadata: 4 | creationTimestamp: null 5 | labels: 6 | run: flux-ros-hadoop-gpu 7 | name: flux-ros-hadoop-gpu 8 | selfLink: 
/api/v1/namespaces/default/services/flux-ros-hadoop-gpu 9 | spec: 10 | externalTrafficPolicy: Cluster 11 | ports: 12 | - port: 8000 13 | protocol: TCP 14 | targetPort: 8000 15 | selector: 16 | run: flux-ros-hadoop-gpu 17 | sessionAffinity: None 18 | type: NodePort 19 | status: 20 | loadBalancer: {} 21 | -------------------------------------------------------------------------------- /deploy/kubernetes/flux-ros-hadoop-service.yml: -------------------------------------------------------------------------------- 1 | apiVersion: v1 2 | kind: Service 3 | metadata: 4 | creationTimestamp: null 5 | labels: 6 | run: flux-ros-hadoop 7 | name: flux-ros-hadoop 8 | selfLink: /api/v1/namespaces/default/services/flux-ros-hadoop 9 | spec: 10 | externalTrafficPolicy: Cluster 11 | ports: 12 | - port: 8000 13 | protocol: TCP 14 | targetPort: 8000 15 | selector: 16 | run: flux-ros-hadoop 17 | sessionAffinity: None 18 | type: NodePort 19 | status: 20 | loadBalancer: {} 21 | -------------------------------------------------------------------------------- /examples/concept.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/flux-project/flux/0e48aaff31b0ee626e3a2ae507af953658dbcd85/examples/concept.png -------------------------------------------------------------------------------- /examples/drive-obj-detect.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/flux-project/flux/0e48aaff31b0ee626e3a2ae507af953658dbcd85/examples/drive-obj-detect.mp4 -------------------------------------------------------------------------------- /examples/drive-stats.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/flux-project/flux/0e48aaff31b0ee626e3a2ae507af953658dbcd85/examples/drive-stats.mp4 -------------------------------------------------------------------------------- /examples/header.png: 
class LaneDetector:
    """Find the driving lane in camera frames and paint it onto the image.

    Construction calibrates the camera from chessboard pictures, derives a
    perspective transform from one sample frame and sets the sliding-window
    search parameters.  ``detect_lane`` then processes one frame at a time and
    stores the per-lane results on ``left_lane`` / ``right_lane``.
    """

    def __init__(self, sample_img_path):
        """Calibrate the camera and prepare the perspective transform.

        Args:
            sample_img_path: Path of a representative frame.  Its size is used
                as the output size of every warped image produced later.

        Raises:
            IOError: If the sample image cannot be read.
        """
        # Chessboard grid passed to cv2.findChessboardCorners.
        self.nx, self.ny = 9, 6
        self.sample_img = cv2.imread(sample_img_path)
        if self.sample_img is None:
            # cv2.imread signals failure by returning None rather than raising.
            raise IOError("Could not read sample image: {}".format(sample_img_path))
        self.img_size = self.sample_img.shape[1::-1]  # (width, height)
        self.mtx, self.dist = self.calibrate_camera()
        self.s_thresh = (170, 255)
        self.sx_thresh = (20, 100)
        (self.img_src_points, self.warped_img,
         self.perspective_M, self.Minv) = self.corners_unwarp(self.sample_img, self.mtx, self.dist)
        self.ploty = np.linspace(0, self.sample_img.shape[0] - 1, num=self.sample_img.shape[0])
        self.y_eval = np.max(self.ploty)
        # window settings
        self.window_width = 50
        self.window_height = 80  # Break image into 9 vertical layers since image height is 720
        self.margin = 100
        # Scale factors applied to pixel coordinates before the curvature fit
        # (presumably metres per pixel -- confirm).  The float literal keeps
        # the division from truncating to 0 under Python 2.
        self.ym_per_pix = 30.0 / 720
        self.xm_per_pix = 3.7 / 700
        self.left_lane = Line()
        self.right_lane = Line()
        # Number of past frames averaged into best_fit / bestx.
        self.last_n_frames = 1

    def calibrate_camera(self, cal_images_path="./camera_cal/*jpg",
                         reference_image_path="camera_cal/calibration1.jpg"):
        """Compute the camera matrix and distortion coefficients.

        Args:
            cal_images_path: Glob pattern of the chessboard calibration images.
            reference_image_path: Image whose size is handed to
                ``cv2.calibrateCamera``.  If it cannot be read, the size of the
                first usable calibration image is used instead.

        Returns:
            Tuple ``(mtx, dist)`` as returned by ``cv2.calibrateCamera``.

        Raises:
            RuntimeError: If no chessboard was detected in any image.
        """
        # One (x, y, 0) object point per chessboard corner, shared by all views.
        objp = np.zeros((self.ny * self.nx, 3), np.float32)
        objp[:, :2] = np.mgrid[0:self.nx, 0:self.ny].T.reshape(-1, 2)

        objpoints = []
        imgpoints = []
        fallback_size = None

        for fname in glob.glob(cal_images_path):
            img = cv2.imread(fname)
            if img is None:
                # Unreadable file: skip it instead of crashing in cvtColor.
                continue
            gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)

            # Find the chessboard corners
            found, corners = cv2.findChessboardCorners(gray, (self.nx, self.ny), None)

            # If found, add object points, image points
            if found:
                objpoints.append(objp)
                imgpoints.append(corners)
                if fallback_size is None:
                    fallback_size = img.shape[1::-1]

        if not objpoints:
            raise RuntimeError(
                "No chessboard corners found in images matching {!r}".format(cal_images_path))

        cal_img = cv2.imread(reference_image_path)
        cal_img_size = cal_img.shape[1::-1] if cal_img is not None else fallback_size
        ret, mtx, dist, rvecs, tvecs = cv2.calibrateCamera(
            objpoints, imgpoints, cal_img_size, None, None)

        return mtx, dist

    def thresholding_pipeline(self, img, s_thresh=(170, 255), sx_thresh=(20, 100)):
        """Build binary masks from the saturation channel and the x gradient.

        Args:
            img: BGR image (it is converted with ``COLOR_BGR2HLS`` /
                ``COLOR_BGR2GRAY``).
            s_thresh: Inclusive ``(low, high)`` range kept on the S channel.
            sx_thresh: Inclusive ``(low, high)`` range kept on the scaled
                absolute Sobel-x response.

        Returns:
            Tuple ``(color_binary, combined_binary)``: a 3-channel image with
            the gradient mask and the saturation mask in channels 1 and 2
            (scaled to 255), and a single-channel 0/1 mask that is set where
            either mask is set.
        """
        img = np.copy(img)
        # Convert to HLS color space; only the saturation channel is used.
        hls = cv2.cvtColor(img, cv2.COLOR_BGR2HLS)
        s_channel = hls[:, :, 2]

        gray = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
        # Sobel x
        sobelx = cv2.Sobel(gray, cv2.CV_64F, 1, 0)  # Take the derivative in x
        abs_sobelx = np.absolute(sobelx)  # Absolute x derivative to accentuate lines away from horizontal
        max_gradient = np.max(abs_sobelx)
        if max_gradient > 0:
            scaled_sobel = np.uint8(255 * abs_sobelx / max_gradient)
        else:
            # A uniform image has no gradient; avoid dividing by zero.
            scaled_sobel = np.zeros(abs_sobelx.shape, np.uint8)

        # Threshold x gradient
        sxbinary = np.zeros_like(scaled_sobel)
        sxbinary[(scaled_sobel >= sx_thresh[0]) & (scaled_sobel <= sx_thresh[1])] = 1

        # Threshold color channel
        s_binary = np.zeros_like(s_channel)
        s_binary[(s_channel >= s_thresh[0]) & (s_channel <= s_thresh[1])] = 1
        # Stack each channel
        color_binary = np.dstack((np.zeros_like(sxbinary), sxbinary, s_binary)) * 255

        combined_binary = np.zeros_like(sxbinary)
        combined_binary[(s_binary == 1) | (sxbinary == 1)] = 1

        return color_binary, combined_binary

    def corners_unwarp(self, img, mtx, dist):
        """Compute the perspective transform and warp the sample image.

        Args:
            img: Input image; it is not modified.
            mtx: Camera matrix.
            dist: Distortion coefficients.

        Returns:
            Tuple ``(annotated, warped, M, Minv)``: a copy of ``img`` with the
            source quadrilateral drawn on it, the undistorted image warped by
            ``M`` with the destination quadrilateral drawn on it, the forward
            transform and its inverse.
        """
        undist = cv2.undistort(img, mtx, dist, None, mtx)
        img_size = undist.shape[1::-1]
        # NOTE(review): the corner coordinates below are hard-coded and appear
        # to assume 1280x720 frames -- confirm before using other resolutions.
        src = np.float32([[600, 450], [685, 450],
                          [1100, 720], [200, 720]])

        dst = np.float32([[300, 0], [980, 0],
                          [980, 720], [300, 720]])

        M = cv2.getPerspectiveTransform(src, dst)
        Minv = cv2.getPerspectiveTransform(dst, src)
        # Warp the undistorted image, matching what detect_lane does per frame.
        warped = cv2.warpPerspective(undist, M, img_size, flags=cv2.INTER_LINEAR)

        # Draw on a copy so the caller's image is left untouched.
        annotated = img.copy()
        cv2.polylines(annotated, np.int32([src]), True, (255, 0, 0), thickness=3)
        cv2.polylines(warped, np.int32([dst]), True, (255, 0, 0), thickness=3)

        return annotated, warped, M, Minv

    def window_mask(self, width, height, img_ref, center, level):
        """Return an array shaped like ``img_ref`` that is 1 inside one window.

        The window is ``height`` rows tall, sits ``level`` windows above the
        bottom edge and spans ``width`` columns around ``center`` (clipped to
        the image).
        """
        output = np.zeros_like(img_ref)
        top = int(img_ref.shape[0] - (level + 1) * height)
        bottom = int(img_ref.shape[0] - level * height)
        left = max(0, int(center - width / 2))
        right = min(int(center + width / 2), img_ref.shape[1])
        output[top:bottom, left:right] = 1
        return output

    def find_window_centroids(self, image, window_width, window_height, margin):
        """Locate the left and right window centre for every horizontal layer.

        Args:
            image: 2-D binary image.
            window_width: Width of the convolution window in pixels.
            window_height: Height of one layer in pixels.
            margin: Maximum horizontal distance searched around the previous
                layer's centre.

        Returns:
            List of ``(l_center, r_center)`` tuples, bottom layer first.
        """
        window_centroids = []  # Store the (left,right) window centroid positions per level
        window = np.ones(window_width)  # Create our window template that we will use for convolutions

        # First find the two starting positions for the left and right lane by using np.sum to get the vertical image slice
        # and then np.convolve the vertical image slice with the window template

        # Sum quarter bottom of image to get slice, could use a different ratio
        half_width = int(image.shape[1] / 2)
        bottom_start = int(3 * image.shape[0] / 4)
        l_sum = np.sum(image[bottom_start:, :half_width], axis=0)
        l_center = np.argmax(np.convolve(window, l_sum)) - window_width / 2
        r_sum = np.sum(image[bottom_start:, half_width:], axis=0)
        r_center = np.argmax(np.convolve(window, r_sum)) - window_width / 2 + half_width

        # Add what we found for the first layer
        window_centroids.append((l_center, r_center))

        # Use window_width/2 as offset because convolution signal reference is at right side of window, not center of window
        offset = window_width / 2

        # Go through each layer looking for max pixel locations
        for level in range(1, int(image.shape[0] / window_height)):
            # convolve the window into the vertical slice of the image
            layer_top = int(image.shape[0] - (level + 1) * window_height)
            layer_bottom = int(image.shape[0] - level * window_height)
            image_layer = np.sum(image[layer_top:layer_bottom, :], axis=0)
            conv_signal = np.convolve(window, image_layer)
            # Find the best left centroid by using past left center as a reference
            l_min_index = int(max(l_center + offset - margin, 0))
            l_max_index = int(min(l_center + offset + margin, image.shape[1]))
            l_center = np.argmax(conv_signal[l_min_index:l_max_index]) + l_min_index - offset
            # Find the best right centroid by using past right center as a reference
            r_min_index = int(max(r_center + offset - margin, 0))
            r_max_index = int(min(r_center + offset + margin, image.shape[1]))
            r_center = np.argmax(conv_signal[r_min_index:r_max_index]) + r_min_index - offset
            # Add what we found for that layer
            window_centroids.append((l_center, r_center))

        return window_centroids

    def _window_points(self, binary_warped, window_centroids):
        """Return ``(l_points, r_points)``: arrays set to 255 inside every window."""
        l_points = np.zeros_like(binary_warped)
        r_points = np.zeros_like(binary_warped)
        for level, (l_center, r_center) in enumerate(window_centroids):
            l_mask = self.window_mask(self.window_width, self.window_height, binary_warped, l_center, level)
            r_mask = self.window_mask(self.window_width, self.window_height, binary_warped, r_center, level)
            l_points[l_mask == 1] = 255
            r_points[r_mask == 1] = 255
        return l_points, r_points

    def _remember(self, history, item):
        """Append ``item`` to ``history``, evicting the oldest entries first.

        After the call ``history`` holds at most ``last_n_frames`` entries
        (and always at least the new one).
        """
        while history and len(history) >= self.last_n_frames:
            history.pop(0)
        history.append(item)

    def detect_lane_pixles(self, binary_warped):
        """Run the sliding-window search and render it for inspection.

        Args:
            binary_warped: 2-D binary bird's-eye image.

        Returns:
            Tuple ``(output, l_points, r_points)``: a 3-channel image with the
            search windows overlaid in green, and the left / right window
            arrays (255 inside a window, 0 elsewhere).
        """
        window_centroids = self.find_window_centroids(
            binary_warped, self.window_width, self.window_height, self.margin)

        # Built up front so both branches below can return them.
        l_points, r_points = self._window_points(binary_warped, window_centroids)

        # If we found any window centers
        if window_centroids:
            # Draw the results
            template = np.array(r_points + l_points, np.uint8)  # add both left and right window pixels together
            zero_channel = np.zeros_like(template)  # create a zero color channel
            template = np.array(cv2.merge((zero_channel, template, zero_channel)), np.uint8)  # make window pixels green
            warpage = np.dstack((binary_warped, binary_warped, binary_warped)) * 255  # making the original road pixels 3 color channels
            output = cv2.addWeighted(warpage, 1, template, 0.5, 0.0)  # overlay the original road image with window results
        # If no window centers found, just display original road image
        else:
            output = np.array(cv2.merge((binary_warped, binary_warped, binary_warped)), np.uint8)

        return output, l_points, r_points

    def get_lane_features(self, binary_warped):
        """Fit both lane lines and update ``left_lane`` / ``right_lane``.

        Sets ``detected``, ``allx``, ``ally``, ``current_fit``, ``best_fit``,
        ``recent_xfitted``, ``bestx`` and ``radius_of_curvature`` on both
        ``Line`` objects.  Returns ``None``.

        Args:
            binary_warped: 2-D binary bird's-eye image.
        """
        # Only the window arrays are needed here, so the debug overlay built
        # by detect_lane_pixles is not rendered.
        window_centroids = self.find_window_centroids(
            binary_warped, self.window_width, self.window_height, self.margin)
        l_points, r_points = self._window_points(binary_warped, window_centroids)

        # NOTE(review): the fit uses every pixel inside the search windows,
        # not only the lit pixels of binary_warped -- confirm this is intended.
        left_lane_pixels = np.nonzero(l_points)
        right_lane_pixels = np.nonzero(r_points)

        self.left_lane.detected = True
        self.right_lane.detected = True

        self.left_lane.allx = left_lane_pixels[1]
        self.left_lane.ally = left_lane_pixels[0]
        self.right_lane.allx = right_lane_pixels[1]
        self.right_lane.ally = right_lane_pixels[0]

        # Second-order polynomial x = f(y) for each line.
        left_fit = np.polyfit(self.left_lane.ally, self.left_lane.allx, 2)
        right_fit = np.polyfit(self.right_lane.ally, self.right_lane.allx, 2)

        self._remember(self.left_lane.current_fit, left_fit)
        self._remember(self.right_lane.current_fit, right_fit)

        self.left_lane.best_fit = np.mean(self.left_lane.current_fit, axis=0)
        self.right_lane.best_fit = np.mean(self.right_lane.current_fit, axis=0)

        left_x_fitted = left_fit[0] * self.ploty**2 + left_fit[1] * self.ploty + left_fit[2]
        right_x_fitted = right_fit[0] * self.ploty**2 + right_fit[1] * self.ploty + right_fit[2]

        # Where the lines are more than 706 px apart, pull the left line to
        # 700 px left of the right one.
        too_wide = (right_x_fitted - left_x_fitted) > 706
        left_x_fitted = np.where(too_wide, right_x_fitted - 700, left_x_fitted)

        self._remember(self.left_lane.recent_xfitted, left_x_fitted)
        self._remember(self.right_lane.recent_xfitted, right_x_fitted)

        self.left_lane.bestx = np.mean(self.left_lane.recent_xfitted, axis=0)
        self.right_lane.bestx = np.mean(self.right_lane.recent_xfitted, axis=0)

        left_fit_cr = np.polyfit(self.ploty * self.ym_per_pix, self.left_lane.bestx * self.xm_per_pix, 2)
        right_fit_cr = np.polyfit(self.ploty * self.ym_per_pix, self.right_lane.bestx * self.xm_per_pix, 2)
        # Calculate the new radii of curvature
        # (a perfectly straight line has a zero quadratic term, giving inf).
        self.left_lane.radius_of_curvature = (
            (1 + (2 * left_fit_cr[0] * self.y_eval * self.ym_per_pix + left_fit_cr[1])**2)**1.5
        ) / np.absolute(2 * left_fit_cr[0])
        self.right_lane.radius_of_curvature = (
            (1 + (2 * right_fit_cr[0] * self.y_eval * self.ym_per_pix + right_fit_cr[1])**2)**1.5
        ) / np.absolute(2 * right_fit_cr[0])

        return

    def draw_lane_path(self, binary, undist):
        """Paint the area between the two fitted lines onto ``undist``.

        Args:
            binary: 2-D bird's-eye image; only its shape is used.
            undist: Undistorted camera frame to draw on.

        Returns:
            ``undist`` blended with a green polygon covering the lane.
        """
        warp_zero = np.zeros_like(binary).astype(np.uint8)
        color_warp = np.dstack((warp_zero, warp_zero, warp_zero))

        # Recast the x and y points into usable format for cv2.fillPoly()
        pts_left = np.array([np.transpose(np.vstack([self.left_lane.bestx, self.ploty]))])
        pts_right = np.array([np.flipud(np.transpose(np.vstack([self.right_lane.bestx, self.ploty])))])
        pts = np.hstack((pts_left, pts_right))

        # Draw the lane onto the warped blank image
        cv2.fillPoly(color_warp, np.int_([pts]), (0, 255, 0))

        # Warp the blank back to original image space using inverse perspective matrix (Minv)
        newwarp = cv2.warpPerspective(color_warp, self.Minv, (undist.shape[1], undist.shape[0]))
        # Combine the result with the original image
        result = cv2.addWeighted(undist, 1, newwarp, 0.3, 0)

        return result

    def detect_lane(self, img):
        """Process one frame and return it with the detected lane overlaid.

        Args:
            img: Camera frame; it is converted with ``COLOR_RGB2BGR`` before
                any other processing.

        Returns:
            The undistorted frame blended with the lane polygon.
        """
        img = cv2.cvtColor(img, cv2.COLOR_RGB2BGR)
        undist = cv2.undistort(img, self.mtx, self.dist, None, self.mtx)
        color_binary, combined_binary = self.thresholding_pipeline(undist, self.s_thresh, self.sx_thresh)
        binary_warped = cv2.warpPerspective(
            combined_binary, self.perspective_M, self.img_size, flags=cv2.INTER_LINEAR)
        self.get_lane_features(binary_warped)
        out = self.draw_lane_path(binary_warped, undist)

        return out
class YOLO2MODEL:
    """Hyper-parameters and Keras graph definition of the YOLO2 detector."""

    def __init__(self):
        """Set the label list, grid geometry, anchors and loss/training constants."""
        # Class names; their count defines CLASSES below.
        self.LABELS = [
            'person', 'bicycle', 'car', 'motorcycle', 'airplane', 'bus', 'train', 'truck',
            'boat', 'traffic light', 'fire hydrant', 'stop sign', 'parking meter', 'bench',
            'bird', 'cat', 'dog', 'horse', 'sheep', 'cow', 'elephant', 'bear', 'zebra',
            'giraffe', 'backpack', 'umbrella', 'handbag', 'tie', 'suitcase', 'frisbee',
            'skis', 'snowboard', 'sports ball', 'kite', 'baseball bat', 'baseball glove',
            'skateboard', 'surfboard', 'tennis racket', 'bottle', 'wine glass', 'cup',
            'fork', 'knife', 'spoon', 'bowl', 'banana', 'apple', 'sandwich', 'orange',
            'broccoli', 'carrot', 'hot dog', 'pizza', 'donut', 'cake', 'chair', 'couch',
            'potted plant', 'bed', 'dining table', 'toilet', 'tv', 'laptop', 'mouse',
            'remote', 'keyboard', 'cell phone', 'microwave', 'oven', 'toaster', 'sink',
            'refrigerator', 'book', 'clock', 'vase', 'scissors', 'teddy bear',
            'hair drier', 'toothbrush',
        ]

        # Network input size and output grid size.
        self.IMAGE_H = 416
        self.IMAGE_W = 416
        self.GRID_H = 13
        self.GRID_W = 13
        self.BOX = 5
        self.CLASSES = len(self.LABELS)
        self.CLASS_WEIGHTS = np.ones(self.CLASSES, dtype='float32')
        self.OBJ_THRESHOLD = 0.3
        self.NMS_THRESHOLD = 0.3
        self.ANCHORS = [0.57273, 0.677385, 1.87446, 2.06253, 3.33843,
                        5.47434, 7.88282, 3.52778, 9.77052, 9.16828]

        self.NO_OBJECT_SCALE = 1.0
        self.OBJECT_SCALE = 5.0
        self.COORD_SCALE = 1.0
        self.CLASS_SCALE = 1.0

        self.BATCH_SIZE = 16
        self.WARM_UP_BATCHES = 0
        self.TRUE_BOX_BUFFER = 50

    def space_to_depth_x2(self, x):
        """Apply ``tf.space_to_depth`` with a block size of 2 to ``x``."""
        return tf.space_to_depth(x, block_size=2)

    def build(self):
        """Assemble the network and return it as a Keras ``Model``.

        The model takes two inputs, the image and a ``true_boxes`` tensor, and
        outputs a tensor reshaped to
        ``(GRID_H, GRID_W, BOX, 4 + 1 + CLASSES)``.
        """

        def conv_bn_leaky(tensor, index, filters, kernel_size):
            # Bias-free convolution -> batch norm -> LeakyReLU, named by layer index.
            tensor = Conv2D(filters, (kernel_size, kernel_size), strides=(1, 1), padding='same',
                            name='conv_%d' % index, use_bias=False)(tensor)
            tensor = BatchNormalization(name='norm_%d' % index)(tensor)
            return LeakyReLU(alpha=0.1)(tensor)

        image_in = Input(shape=(self.IMAGE_H, self.IMAGE_W, 3))
        boxes_in = Input(shape=(1, 1, 1, self.TRUE_BOX_BUFFER, 4))

        # Layers 1-13: (layer index, filters, kernel size, max-pool afterwards)
        front_layers = (
            (1, 32, 3, True),
            (2, 64, 3, True),
            (3, 128, 3, False),
            (4, 64, 1, False),
            (5, 128, 3, True),
            (6, 256, 3, False),
            (7, 128, 1, False),
            (8, 256, 3, True),
            (9, 512, 3, False),
            (10, 256, 1, False),
            (11, 512, 3, False),
            (12, 256, 1, False),
            (13, 512, 3, False),
        )
        net = image_in
        for index, filters, kernel_size, pooled in front_layers:
            net = conv_bn_leaky(net, index, filters, kernel_size)
            if pooled:
                net = MaxPooling2D(pool_size=(2, 2))(net)

        # Keep the layer-13 output for the skip connection merged in below.
        passthrough = net

        net = MaxPooling2D(pool_size=(2, 2))(net)

        # Layers 14-20: (layer index, filters, kernel size)
        back_layers = (
            (14, 1024, 3),
            (15, 512, 1),
            (16, 1024, 3),
            (17, 512, 1),
            (18, 1024, 3),
            (19, 1024, 3),
            (20, 1024, 3),
        )
        for index, filters, kernel_size in back_layers:
            net = conv_bn_leaky(net, index, filters, kernel_size)

        # Layer 21: squeeze the skip branch, then rearrange it with space_to_depth
        passthrough = conv_bn_leaky(passthrough, 21, 64, 1)
        passthrough = Lambda(self.space_to_depth_x2)(passthrough)

        net = concatenate([passthrough, net])

        # Layer 22
        net = conv_bn_leaky(net, 22, 1024, 3)

        # Layer 23: prediction layer (keeps its bias, no normalisation/activation)
        net = Conv2D(self.BOX * (4 + 1 + self.CLASSES), (1, 1), strides=(1, 1),
                     padding='same', name='conv_23')(net)
        prediction = Reshape((self.GRID_H, self.GRID_W, self.BOX, 4 + 1 + self.CLASSES))(net)

        # small hack to allow true_boxes to be registered when Keras build the model
        # for more information: https://github.com/fchollet/keras/issues/2790
        prediction = Lambda(lambda args: args[0])([prediction, boxes_in])

        return Model([image_in, boxes_in], prediction)
class ObjectDetector:
    """Builds the YOLO2MODEL network, loads its weights and annotates images."""

    def __init__(self, weights_path):
        """Build the model and immediately load weights from ``weights_path``."""
        self.wt_path = weights_path
        self.yoloModelObj = YOLO2MODEL()
        self.model = self.yoloModelObj.build()
        self.load_model_weights()

    def load_model_weights(self):
        """Copy the flat weight file into layers ``conv_1`` .. ``conv_23``.

        For every layer except the last, four batch-norm vectors are read
        first (file order beta, gamma, mean, var) and handed to Keras as
        ``[gamma, beta, mean, var]``. A bias, when the conv layer has one,
        is read before the kernel.
        """
        weight_reader = WeightReader(self.wt_path)
        nb_conv = 23

        for i in range(1, nb_conv + 1):
            conv_layer = self.model.get_layer('conv_' + str(i))

            # The final convolution has no batch-norm companion.
            if i < nb_conv:
                norm_layer = self.model.get_layer('norm_' + str(i))

                size = np.prod(norm_layer.get_weights()[0].shape)

                beta = weight_reader.read_bytes(size)
                gamma = weight_reader.read_bytes(size)
                mean = weight_reader.read_bytes(size)
                var = weight_reader.read_bytes(size)

                norm_layer.set_weights([gamma, beta, mean, var])

            # get_weights() copies every array, so fetch it once per layer.
            conv_weights = conv_layer.get_weights()
            kernel_shape = conv_weights[0].shape
            has_bias = len(conv_weights) > 1

            if has_bias:
                bias = weight_reader.read_bytes(np.prod(conv_weights[1].shape))

            # The file stores the kernel with the axes in reverse order of the
            # Keras kernel shape; reshape to that layout, then permute back.
            kernel = weight_reader.read_bytes(np.prod(kernel_shape))
            kernel = kernel.reshape(list(reversed(kernel_shape)))
            kernel = kernel.transpose([2, 3, 1, 0])

            if has_bias:
                conv_layer.set_weights([kernel, bias])
            else:
                conv_layer.set_weights([kernel])

    def detect_obj(self, image):
        """Run detection on ``image`` and return it with boxes drawn on it.

        ``image`` is passed to ``draw_boxes`` as-is, so the returned array is
        the caller's array with the annotations drawn onto it.
        """
        yolo = self.yoloModelObj

        # The model's second input only exists for graph construction; feed zeros.
        dummy_array = np.zeros((1, 1, 1, 1, yolo.TRUE_BOX_BUFFER, 4))

        # cv2.resize takes the target size as (width, height).
        input_image = cv2.resize(image, (yolo.IMAGE_W, yolo.IMAGE_H))
        input_image = input_image / 255.
        input_image = input_image[:, :, ::-1]  # reverse the channel axis
        input_image = np.expand_dims(input_image, 0)

        netout = self.model.predict([input_image, dummy_array])

        boxes = decode_netout(netout[0],
                              obj_threshold=yolo.OBJ_THRESHOLD,
                              nms_threshold=yolo.NMS_THRESHOLD,
                              anchors=yolo.ANCHORS,
                              nb_class=yolo.CLASSES)

        image = draw_boxes(image, boxes, labels=yolo.LABELS)

        return image
11 | ] 12 | }, 13 | { 14 | "cell_type": "code", 15 | "execution_count": 1, 16 | "metadata": {}, 17 | "outputs": [ 18 | { 19 | "name": "stdout", 20 | "output_type": "stream", 21 | "text": [ 22 | "-rw-r--r-- 1 root root 20G Mar 7 15:16 /root/project/doc/el_camino_north.bag\n" 23 | ] 24 | } 25 | ], 26 | "source": [ 27 | "%%bash\n", 28 | "\n", 29 | "ls -tralFh /root/project/doc/el_camino_north.bag" 30 | ] 31 | }, 32 | { 33 | "cell_type": "code", 34 | "execution_count": 2, 35 | "metadata": {}, 36 | "outputs": [ 37 | { 38 | "name": "stdout", 39 | "output_type": "stream", 40 | "text": [ 41 | "Found 2 items\n", 42 | "-rw-r--r-- 1 root supergroup 331.6 M 2018-03-06 20:50 HMB_4.bag\n", 43 | "-rw-r--r-- 1 root supergroup 19.7 G 2018-03-07 15:28 el_camino_north.bag\n" 44 | ] 45 | } 46 | ], 47 | "source": [ 48 | "%%bash\n", 49 | "\n", 50 | "# same size, no worries, just the -h (human) formatting differs in rounding \n", 51 | "hdfs dfs -ls -h" 52 | ] 53 | }, 54 | { 55 | "cell_type": "markdown", 56 | "metadata": {}, 57 | "source": [ 58 | "# Show that we can read the index\n", 59 | "\n", 60 | "Solved the issue https://github.com/valtech/ros_hadoop/issues/6 \n", 61 | "\n", 62 | "The issue was due to ByteBuffer being limited by the JVM Integer size and has nothing to do with Spark or how the RosbagMapInputFormat works within Spark. It was only problematic to extract the conf index with the jar.\n", 63 | "\n", 64 | "Integer.MAX_VALUE bytes is 2 GB !!" 
65 | ] 66 | }, 67 | { 68 | "cell_type": "code", 69 | "execution_count": 3, 70 | "metadata": {}, 71 | "outputs": [ 72 | { 73 | "name": "stdout", 74 | "output_type": "stream", 75 | "text": [ 76 | "CPU times: user 10 ms, sys: 0 ns, total: 10 ms\n", 77 | "Wall time: 1.18 s\n" 78 | ] 79 | } 80 | ], 81 | "source": [ 82 | "%%time\n", 83 | "\n", 84 | "out = !java -jar ../lib/rosbaginputformat.jar -f /root/project/doc/el_camino_north.bag" 85 | ] 86 | }, 87 | { 88 | "cell_type": "code", 89 | "execution_count": 4, 90 | "metadata": {}, 91 | "outputs": [ 92 | { 93 | "name": "stdout", 94 | "output_type": "stream", 95 | "text": [ 96 | "-rw-r--r-- 1 root root 20G Mar 7 15:16 /root/project/doc/el_camino_north.bag\n", 97 | "-rw-r--r-- 1 root root 62K Mar 7 15:41 /root/project/doc/el_camino_north.bag.idx.bin\n" 98 | ] 99 | } 100 | ], 101 | "source": [ 102 | "%%bash\n", 103 | "ls -tralFh /root/project/doc/el_camino_north.bag*" 104 | ] 105 | }, 106 | { 107 | "cell_type": "markdown", 108 | "metadata": {}, 109 | "source": [ 110 | "# Create the Spark Session or get an existing one" 111 | ] 112 | }, 113 | { 114 | "cell_type": "code", 115 | "execution_count": 5, 116 | "metadata": {}, 117 | "outputs": [], 118 | "source": [ 119 | "from pyspark import SparkContext, SparkConf\n", 120 | "from pyspark.sql import SparkSession\n", 121 | "\n", 122 | "sparkConf = SparkConf()\n", 123 | "sparkConf.setMaster(\"local[*]\")\n", 124 | "sparkConf.setAppName(\"ros_hadoop\")\n", 125 | "sparkConf.set(\"spark.jars\", \"../lib/protobuf-java-3.3.0.jar,../lib/rosbaginputformat.jar,../lib/scala-library-2.11.8.jar\")\n", 126 | "\n", 127 | "spark = SparkSession.builder.config(conf=sparkConf).getOrCreate()\n", 128 | "sc = spark.sparkContext" 129 | ] 130 | }, 131 | { 132 | "cell_type": "markdown", 133 | "metadata": {}, 134 | "source": [ 135 | "## Create an RDD from the Rosbag file\n", 136 | "**Note:** your HDFS address might differ." 
137 | ] 138 | }, 139 | { 140 | "cell_type": "code", 141 | "execution_count": 6, 142 | "metadata": {}, 143 | "outputs": [], 144 | "source": [ 145 | "fin = sc.newAPIHadoopFile(\n", 146 | " path = \"hdfs://127.0.0.1:9000/user/root/el_camino_north.bag\",\n", 147 | " inputFormatClass = \"de.valtech.foss.RosbagMapInputFormat\",\n", 148 | " keyClass = \"org.apache.hadoop.io.LongWritable\",\n", 149 | " valueClass = \"org.apache.hadoop.io.MapWritable\",\n", 150 | " conf = {\"RosbagInputFormat.chunkIdx\":\"/root/project/doc/el_camino_north.bag.idx.bin\"})" 151 | ] 152 | }, 153 | { 154 | "cell_type": "code", 155 | "execution_count": 14, 156 | "metadata": {}, 157 | "outputs": [ 158 | { 159 | "data": { 160 | "text/plain": [ 161 | "MapPartitionsRDD[2] at mapPartitions at SerDeUtil.scala:244" 162 | ] 163 | }, 164 | "execution_count": 14, 165 | "metadata": {}, 166 | "output_type": "execute_result" 167 | } 168 | ], 169 | "source": [ 170 | "fin" 171 | ] 172 | }, 173 | { 174 | "attachments": { 175 | "image.png": { 176 | "image/png": "" 177 | } 178 | }, 179 | "cell_type": "markdown", 180 | "metadata": {}, 181 | "source": [ 182 | "### On a laptop it will take some time. So please run it on a real cluster.\n", 183 | "\n", 184 | "![image.png](attachment:image.png)\n", 185 | "\n", 186 | "# Have Fun!" 
class BoundBox:
    """Axis-aligned box with an objectness value and per-class scores.

    ``label`` and ``score`` are computed lazily from ``classes`` on first
    access and cached; ``-1`` marks "not computed yet".
    """

    def __init__(self, xmin, ymin, xmax, ymax, c = None, classes = None):
        self.xmin = xmin
        self.ymin = ymin
        self.xmax = xmax
        self.ymax = ymax

        self.c = c
        self.classes = classes

        self.label = -1
        self.score = -1

    def get_label(self):
        """Return the index of the highest entry in ``classes`` (cached)."""
        if self.label == -1:
            self.label = np.argmax(self.classes)

        return self.label

    def get_score(self):
        """Return ``classes[get_label()]`` (cached)."""
        if self.score == -1:
            self.score = self.classes[self.get_label()]

        return self.score


class WeightReader:
    """Sequential reader over a flat float32 weight file."""

    def __init__(self, weight_file):
        # The first 4 float32-sized values are skipped
        # (presumably the file header -- confirm against the weight format).
        self.offset = 4
        self.all_weights = np.fromfile(weight_file, dtype='float32')

    def read_bytes(self, size):
        """Return the next ``size`` float32 values and advance the cursor.

        Despite the name, ``size`` counts array elements, not bytes. Reading
        past the end yields a shorter (possibly empty) array, as NumPy
        slicing does.
        """
        self.offset = self.offset + size
        return self.all_weights[self.offset-size:self.offset]

    def reset(self):
        """Rewind the cursor to just after the skipped leading values."""
        self.offset = 4


def bbox_iou(box1, box2):
    """Return intersection-over-union of two boxes (``xmin/ymin/xmax/ymax``).

    Returns 0.0 when the union area is not positive (e.g. two zero-area
    boxes) instead of dividing by zero.
    """
    intersect_w = _interval_overlap([box1.xmin, box1.xmax], [box2.xmin, box2.xmax])
    intersect_h = _interval_overlap([box1.ymin, box1.ymax], [box2.ymin, box2.ymax])

    intersect = intersect_w * intersect_h

    w1, h1 = box1.xmax-box1.xmin, box1.ymax-box1.ymin
    w2, h2 = box2.xmax-box2.xmin, box2.ymax-box2.ymin

    union = w1*h1 + w2*h2 - intersect

    if union <= 0:
        return 0.0

    # float() keeps this a true division under Python 2 as well.
    return float(intersect) / union


def draw_boxes(image, boxes, labels):
    """Draw each box and its "<label> <score>" caption onto ``image``; return it.

    Box coordinates are multiplied by the image width/height before drawing.
    """
    image_h, image_w, _ = image.shape

    for box in boxes:
        xmin = int(box.xmin*image_w)
        ymin = int(box.ymin*image_h)
        xmax = int(box.xmax*image_w)
        ymax = int(box.ymax*image_h)

        cv2.rectangle(image, (xmin,ymin), (xmax,ymax), (0,255,0), 3)
        cv2.putText(image,
                    labels[box.get_label()] + ' ' + str(box.get_score()),
                    (xmin, ymin - 13),
                    cv2.FONT_HERSHEY_SIMPLEX,
                    1e-3 * image_h,
                    (0,255,0), 2)

    return image


def decode_netout(netout, anchors, nb_class, obj_threshold=0.3, nms_threshold=0.3):
    """Turn one raw network output into a list of ``BoundBox`` objects.

    ``netout`` has shape ``(grid_h, grid_w, nb_box, 5 + nb_class)``: the last
    axis holds x, y, w, h, objectness and the class logits. ``anchors`` is a
    flat sequence read as ``(anchors[2*b], anchors[2*b + 1])`` for box ``b``.

    The input array is left untouched; decoding happens on a private copy,
    so calling this twice on the same array gives the same result.
    """
    # Work on a copy: the steps below (and the suppression pass, through the
    # per-box class views) write into the array.
    netout = netout.copy()

    grid_h, grid_w, nb_box = netout.shape[:3]

    boxes = []

    # decode the output by the network
    netout[..., 4] = _sigmoid(netout[..., 4])
    netout[..., 5:] = netout[..., 4][..., np.newaxis] * _softmax(netout[..., 5:])
    netout[..., 5:] *= netout[..., 5:] > obj_threshold

    for row in range(grid_h):
        for col in range(grid_w):
            for b in range(nb_box):
                # elements from index 5 onwards are the class scores
                classes = netout[row,col,b,5:]

                if np.sum(classes) > 0:
                    # first 4 elements are x, y, w, and h
                    x, y, w, h = netout[row,col,b,:4]

                    x = (col + _sigmoid(x)) / grid_w # center position, unit: image width
                    y = (row + _sigmoid(y)) / grid_h # center position, unit: image height
                    w = anchors[2 * b + 0] * np.exp(w) / grid_w # unit: image width
                    h = anchors[2 * b + 1] * np.exp(h) / grid_h # unit: image height
                    confidence = netout[row,col,b,4]

                    box = BoundBox(x-w/2, y-h/2, x+w/2, y+h/2, confidence, classes)

                    boxes.append(box)

    # suppress non-maximal boxes, one class at a time
    for c in range(nb_class):
        sorted_indices = list(reversed(np.argsort([box.classes[c] for box in boxes])))

        for i, index_i in enumerate(sorted_indices):
            if boxes[index_i].classes[c] == 0:
                continue

            for index_j in sorted_indices[i+1:]:
                if bbox_iou(boxes[index_i], boxes[index_j]) >= nms_threshold:
                    boxes[index_j].classes[c] = 0

    # remove the boxes which are less likely than obj_threshold
    boxes = [box for box in boxes if box.get_score() > obj_threshold]

    return boxes


def compute_overlap(a, b):
    """
    Code originally from https://github.com/rbgirshick/py-faster-rcnn.
    Parameters
    ----------
    a: (N, 4) ndarray of float
    b: (K, 4) ndarray of float
    Returns
    -------
    overlaps: (N, K) ndarray of overlap between boxes and query_boxes
    """
    area = (b[:, 2] - b[:, 0]) * (b[:, 3] - b[:, 1])

    iw = np.minimum(np.expand_dims(a[:, 2], axis=1), b[:, 2]) - np.maximum(np.expand_dims(a[:, 0], 1), b[:, 0])
    ih = np.minimum(np.expand_dims(a[:, 3], axis=1), b[:, 3]) - np.maximum(np.expand_dims(a[:, 1], 1), b[:, 1])

    iw = np.maximum(iw, 0)
    ih = np.maximum(ih, 0)

    ua = np.expand_dims((a[:, 2] - a[:, 0]) * (a[:, 3] - a[:, 1]), axis=1) + area - iw * ih

    # guard against division by zero for degenerate boxes
    ua = np.maximum(ua, np.finfo(float).eps)

    intersection = iw * ih

    return intersection / ua


def compute_ap(recall, precision):
    """ Compute the average precision, given the recall and precision curves.
    Code originally from https://github.com/rbgirshick/py-faster-rcnn.

    # Arguments
        recall:    The recall curve (list).
        precision: The precision curve (list).
    # Returns
        The average precision as computed in py-faster-rcnn.
    """
    # correct AP calculation
    # first add sentinel values at both ends
    mrec = np.concatenate(([0.], recall, [1.]))
    mpre = np.concatenate(([0.], precision, [0.]))

    # compute the precision envelope
    for i in range(mpre.size - 1, 0, -1):
        mpre[i - 1] = np.maximum(mpre[i - 1], mpre[i])

    # to calculate area under PR curve, look for points
    # where X axis (recall) changes value
    i = np.where(mrec[1:] != mrec[:-1])[0]

    # and sum (\Delta recall) * prec
    ap = np.sum((mrec[i + 1] - mrec[i]) * mpre[i + 1])
    return ap


def _interval_overlap(interval_a, interval_b):
    """Return the length of the overlap of two ``[lo, hi]`` intervals (>= 0)."""
    x1, x2 = interval_a
    x3, x4 = interval_b

    return max(0, min(x2, x4) - max(x1, x3))


def _sigmoid(x):
    """Element-wise logistic function."""
    return 1. / (1. + np.exp(-x))


def _softmax(x, axis=-1, t=-100.):
    """Softmax along ``axis`` with a range clamp.

    The maximum over the WHOLE array is subtracted first; if the resulting
    minimum is below ``t`` the array is rescaled so that its minimum equals
    ``t``.
    NOTE(review): that rescale changes the distribution when it triggers
    (it acts like a temperature); kept as-is to preserve existing outputs.
    """
    x = x - np.max(x)

    if np.min(x) < t:
        x = x/np.min(x)*t

    e_x = np.exp(x)

    return e_x / e_x.sum(axis, keepdims=True)
https://raw.githubusercontent.com/flux-project/flux/0e48aaff31b0ee626e3a2ae507af953658dbcd85/images/login_notebook.png -------------------------------------------------------------------------------- /images/sample_notebook.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/flux-project/flux/0e48aaff31b0ee626e3a2ae507af953658dbcd85/images/sample_notebook.png --------------------------------------------------------------------------------