├── .gitattributes
├── .github
│   └── FUNDING.yml
├── .gitignore
├── README.md
├── build.gradle
├── collect-stream-logs
│   ├── README.md
│   ├── collect-stream-logs-flow.xml
│   ├── dashboard
│   │   ├── draw.html
│   │   ├── log.html
│   │   ├── reqscanvas.js
│   │   └── testEB.html
│   ├── data
│   │   ├── in
│   │   │   └── example.log
│   │   └── out
│   │       └── .gitkeep
│   ├── log-generator
│   │   ├── build.gradle
│   │   └── src
│   │       └── main
│   │           ├── groovy
│   │           │   └── com.crossbusiness.loggen
│   │           │       ├── AccessLogGenerator.groovy
│   │           │       └── AppLogGenerator.groovy
│   │           ├── java
│   │           │   └── .gitkeep
│   │           └── resources
│   │               ├── example.log
│   │               ├── logback-access.xml
│   │               └── logback.xml
│   ├── logs-demo.png
│   └── logs-flow.png
├── csv-to-json
│   ├── README.md
│   └── csv-to-json-flow.xml
├── decompression
│   ├── README.md
│   └── decompression-circular-flow.xml
├── gradle.properties
├── gradle
│   └── wrapper
│       ├── gradle-wrapper.jar
│       └── gradle-wrapper.properties
├── gradlew
├── gradlew.bat
├── http-get-route
│   ├── README.md
│   └── simple-httpget-route-flow.xml
├── invoke-http-route
│   ├── README.md
│   └── invokeHttp-and-route-original-on-status-flow.xml
├── iot-activity-tracker
│   ├── README.md
│   ├── dashboard
│   │   └── heartrate.html
│   ├── iot-demo.png
│   ├── iot-flow.png
│   └── iot-flow.xml
├── oltp-cdc-olap
│   ├── Dockerfile
│   ├── README.md
│   ├── cdc-architecture.jpg
│   ├── cdc-flow.png
│   ├── cdc-flow.xml
│   ├── kafka
│   │   ├── README.md
│   │   ├── kafka
│   │   │   └── .gitignore
│   │   ├── server.properties
│   │   ├── zookeeper.properties
│   │   └── zookeeper
│   │       └── .gitignore
│   ├── maxwell
│   │   ├── .gitignore
│   │   └── config.properties
│   └── mysql
│       ├── README.md
│       ├── data
│       │   └── .gitignore
│       └── my.cnf
├── retry
│   ├── README.md
│   └── retry-count-loop.xml
├── settings.gradle
├── split-route
│   ├── README.md
│   ├── data
│   │   ├── in
│   │   │   └── sample-input.txt
│   │   └── out
│   │       └── .gitkeep
│   └── split-route-merge-flow.xml
├── twitter-garden-hose
│   ├── README.md
│   └── pull-from-twitter-garden-hose-flow.xml
└── twitter-solr
    ├── README.md
    └── twitter-solr-flow.xml

/.gitattributes:
--------------------------------------------------------------------------------
* text=auto
CONTRIBUTING.md export-ignore

/.github/FUNDING.yml:
--------------------------------------------------------------------------------
# These are supported funding model platforms

github: [xmlking]
open_collective: xmlking

/.gitignore:
--------------------------------------------------------------------------------
# Created by https://www.gitignore.io/api/gradle,osx,windows

## App ##
logs
*.log
NOTES.md

### Gradle ###
.gradle
build/

# Ignore Gradle GUI config
gradle-app.setting

# Avoid ignoring Gradle wrapper jar file (.jar files are usually ignored)
!gradle-wrapper.jar


### Intellij ###
# Covers JetBrains IDEs: IntelliJ, RubyMine, PhpStorm, AppCode, PyCharm, CLion, Android Studio

*.iml

## Directory-based project format:
.idea/
# if you remove the above rule, at least ignore the following:

# User-specific stuff:
# .idea/workspace.xml
# .idea/tasks.xml
# .idea/dictionaries

# Sensitive or high-churn files:
# .idea/dataSources.ids
# .idea/dataSources.xml
# .idea/sqlDataSources.xml
# .idea/dynamic.xml
# .idea/uiDesigner.xml

# Gradle:
# .idea/gradle.xml
# .idea/libraries

# Mongo Explorer plugin:
# .idea/mongoSettings.xml

## File-based project format:
*.ipr
*.iws

## Plugin-specific files:

# IntelliJ
/out/

# mpeltonen/sbt-idea plugin
.idea_modules/

# JIRA plugin
atlassian-ide-plugin.xml

# Crashlytics plugin (for Android Studio and IntelliJ)
com_crashlytics_export_strings.xml
crashlytics.properties
crashlytics-build.properties


### OSX ###
.DS_Store
.AppleDouble
.LSOverride

# Icon must end with two \r
Icon

# Thumbnails
._*

# Files that might appear in the root of a volume
.DocumentRevisions-V100
.fseventsd
.Spotlight-V100
.TemporaryItems
.Trashes
.VolumeIcon.icns

# Directories potentially created on remote AFP share
.AppleDB
.AppleDesktop
Network Trash Folder
Temporary Items
.apdisk


### Windows ###
# Windows image file caches
Thumbs.db
ehthumbs.db

# Folder config file
Desktop.ini

# Recycle Bin used on file shares
$RECYCLE.BIN/

# Windows Installer files
*.cab
*.msi
*.msm
*.msp

# Windows shortcuts
*.lnk

/README.md:
--------------------------------------------------------------------------------
NiFi Examples
=================

Apache NiFi example flows.

#### collect-stream-logs

This [flow](./collect-stream-logs/) shows a workflow for log collection, aggregation, storage, and display.

1. Ingest logs from folders.
2. Listen for syslogs on a UDP port (a quick smoke test is sketched below).
3. Merge syslogs and drop-in logs, and persist the merged logs to Solr for historical search.
4. Dashboard: stream real-time log events to a dashboard and enable cross-filter search on historical log data.
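The UDP listener in item 2 can be smoke-tested without a real syslog source by pushing a hand-crafted syslog line at it from the command line. A minimal sketch, assuming the flow's ListenSyslog/ListenUDP processor is bound to localhost:514; adjust host and port to whatever the flow is actually configured with:

```bash
# Send one RFC 3164-style syslog message over UDP (host and port are assumptions)
echo "<34>Oct 11 22:14:15 myhost app: test log event" | nc -u -w1 localhost 514
```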
#### iot-activity-tracker

This [flow](./iot-activity-tracker/) shows how to bring IoT data into the enterprise.

1. Ingest IoT data over WebSocket and HTTP.
2. Store all data to Hadoop (HDFS) and summary data to NoSQL (MarkLogic) for historical data search.
3. Route data based on pre-set thresholds (vital signs like `pulse rate` and `blood pressure`) to alert users and physicians.
4. Inactivity reporting.


#### oltp-cdc-olap

A low-latency *Change Data Capture* [flow](./oltp-cdc-olap/) to continuously replicate data from OLTP (MySQL) to OLAP (NoSQL) systems with no impact on the source.

1. Multi-tenant: can contain data from many different databases and supports multiple consumers.
2. Flexible CDC: capture changes from many data sources and types.
    1. Source consistency preservation; no impact on the source.
    2. Both DML (INSERT/UPDATE/DELETE) and DDL (ALTER/CREATE/DROP) are captured non-invasively.
    3. Produces Logical Change Records (LCRs) in JSON format.
    4. Commits at the source are grouped by transaction.
3. Flexible consumer dataflows: consumers can be implemented in Apache NiFi, Flink, Spark, or Apex.
    1. Parallel data filtering, transformation, and loading.
4. Flexible databus: store LCRs in **Kafka** streams for durability and pub-sub semantics (a consumer sketch follows this list).
    1. Use *only* Kafka as the input for all consumer dataflows.
        1. Feed data to many client types (real-time, slow/catch-up, full bootstrap).
        2. Consumption from an arbitrary time point in the change stream, including full bootstrap of the entire data set.
        3. Guaranteed in-commit-order and at-least-once delivery.
        4. Partitioned consumption (data partitioned to different Kafka topics by database name, table, or any field of the LCR).
        5. Both batch and near-real-time delivery.
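Because the LCRs land in Kafka as plain JSON, the console consumer that ships with Kafka is enough to watch the change stream. A sketch, assuming a local ZooKeeper/Kafka (matching the bundled `zookeeper.properties`/`server.properties`) and Maxwell's default `maxwell` topic; the sample record reflects Maxwell's general output shape, not actual data from this flow:

```bash
# Tail the change stream (broker address and topic name are assumptions)
kafka-console-consumer.sh --zookeeper localhost:2181 --topic maxwell

# An INSERT arrives as one JSON document per changed row, roughly:
# {"database":"shop","table":"orders","type":"insert","ts":1449786310,
#  "xid":940752,"commit":true,"data":{"id":7,"status":"NEW"}}
```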
#### csv-to-json

This [flow](./csv-to-json/) shows how to convert a CSV entry to a JSON document using ExtractText and ReplaceText (see the sketch below).
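The conversion hinges on two processor settings: a dynamic property on ExtractText whose regex capture groups become FlowFile attributes, and a ReplaceText replacement value that rebuilds the content as JSON from those attributes. A minimal sketch for a three-field line; the property name, field names, and regex here are illustrative, not the exact values in the flow XML:

```
# ExtractText: add a dynamic property (attribute prefix -> regex)
#   csv = (.+),(.+),(.+)
# capture groups land in attributes csv.1, csv.2, csv.3

# ReplaceText: Replacement Value (NiFi Expression Language)
#   {"first":"${csv.1}","second":"${csv.2}","third":"${csv.3}"}
```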
#### decompression

This [flow](./decompression/) demonstrates taking an archive created with several levels of compression and decompressing it in a loop until the original file is fully extracted.

#### http-get-route

This [flow](./http-get-route/) pulls from a web service (the example is NiFi itself), extracts text from a specific section, makes a routing decision on that extracted value, and prepares to write to disk using PutFile.

#### invoke-http-route

This [flow](./invoke-http-route/) demonstrates how to call an HTTP service based on an incoming FlowFile and route the original FlowFile based on the status code returned from the invocation. In this example, a FlowFile is produced every 30 seconds, an attribute that sets q=nifi is added to it, google.com is invoked for that FlowFile, and any response with a 200 status is routed to a relationship called 200.

#### retry-count-loop

This [process group](./retry/) can be used to maintain a count of how many times a FlowFile passes through it. If the count reaches a configured threshold, the FlowFile is routed to a 'Limit Exceeded' relationship; otherwise it is routed to 'retry'. Great for processes that you only want to run X times before giving up.

#### split-route

This [flow](./split-route/) demonstrates splitting a file on line boundaries, routing the splits based on a regex in the content, merging the less important files together for storage somewhere, and sending the higher-priority files down another path for immediate action.

#### twitter-garden-hose

This [flow](./twitter-garden-hose/) pulls from Twitter using the garden hose setting; it pulls some basic attributes out of the JSON and then routes only those items that are actually tweets.

#### twitter-solr

This [flow](./twitter-solr/) shows how to index tweets with Solr using NiFi. Prerequisites for this flow are NiFi 0.3.0 or later, the creation of a Twitter application, and a running instance of Solr 5.1 or later with a `tweets` collection (a creation sketch follows).
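One plausible way to stand up that collection with Solr 5.x's bundled scripts is sketched below; the configset choice is an assumption, and only the collection name `tweets` is dictated by the flow:

```bash
# Start Solr in SolrCloud mode, then create the tweets collection (Solr 5.x)
bin/solr start -c
bin/solr create_collection -c tweets -d data_driven_schema_configs
```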
### Install NiFi
1. Manual: download the [Apache NiFi](https://nifi.apache.org/download.html) binaries and unpack them to a folder.
2. On Mac: `brew install nifi`

### Run NiFi
```bash
cd /Developer/Applications/nifi
./bin/nifi.sh start
./bin/nifi.sh stop
```
On Mac
```bash
# nifi start|stop|run|restart|status|dump|install
nifi start
nifi status
nifi stop
# Working Directory: /usr/local/Cellar/nifi/0.3.0/libexec
```

/build.gradle:
--------------------------------------------------------------------------------
allprojects {
    repositories {
        mavenCentral()
    }
    version = rootVersion
}

subprojects {

}

task wrapper(type: Wrapper) {
    description = 'Generates gradlew[.bat] scripts'
    gradleVersion = '2.7'
}

/collect-stream-logs/README.md:
--------------------------------------------------------------------------------
collect-stream-logs
===================

1. Ingest logs from folders.
2. Listen for syslogs on a UDP port.
3. Merge syslogs and drop-in logs, and persist the merged logs to Solr for historical search.
4. Dashboard: stream real-time log events to a dashboard and enable cross-filter search on historical log data.

Note: this flow depends on the **nifi-websocket** module; download the [nar](https://github.com/xmlking/nifi-websocket/releases/download/0.1.0/nifi-websocket-0.1.0-SNAPSHOT.nar) and copy it to `$NIFI_HOME/lib`.

### Run log generator
```bash
gradle :collect-stream-logs:log-generator:run
```

### Flow
![Flow](./logs-flow.png)

### Demo
![Demo](./logs-demo.png)

### Reference
1. [Collecting Logs with Apache NiFi](http://bryanbende.com/development/2015/05/17/collecting-logs-with-apache-nifi/)

/collect-stream-logs/dashboard/draw.html:
--------------------------------------------------------------------------------
(file contents not captured in this listing)