├── .gitignore ├── LICENSE ├── README.md ├── ch01-missing-data-imputation ├── Recipe-01-Removing-observations-with-missing-data.ipynb ├── Recipe-02-Performing-mean-or-median-imputation.ipynb ├── Recipe-03-Imputing-categorical-variables.ipynb ├── Recipe-04-Replacing-missing-values-with-an-arbitrary-number.ipynb ├── Recipe-05-Finding-extreme-values-for-imputation.ipynb ├── Recipe-06-Marking-imputed-values.ipynb ├── Recipe-07-Performing-multivariate-imputation-by-chained-equations.ipynb ├── Recipe-08-Estimating-missing-data-with-K-nearest-neighbours.ipynb └── donwload-prepare-store-credit-approval-dataset.ipynb ├── ch02-categorical-encoding ├── Recipe-01-One-hot-encoding.ipynb ├── Recipe-02-One-hot-encoding-frequent-categories.ipynb ├── Recipe-03-Replacing-categories-by-counts-frequency.ipynb ├── Recipe-04-Ordinal-encoding.ipynb ├── Recipe-05-Ordered-ordinal-encoding.ipynb ├── Recipe-06-Target-mean-encoding.ipynb ├── Recipe-07-Weight-of-evidence.ipynb ├── Recipe-08-Grouping-rare-categories.ipynb ├── Recipe-09-Binary-Encoding.ipynb └── donwload-prepare-store-credit-approval-dataset.ipynb ├── ch03-variable-transformation ├── Recipe-1-logarithmic-transformation.ipynb ├── Recipe-2-reciprocal-transformation.ipynb ├── Recipe-3-square-root-transformation.ipynb ├── Recipe-4-power-transformation.ipynb ├── Recipe-5-Box-Cox-transformation.ipynb └── Recipe-6-Yeo-Johnson-transformation.ipynb ├── ch04-discretization ├── Recipe-1-Equal-width-discretization.ipynb ├── Recipe-2-Equal-frequency-discretisation.ipynb ├── Recipe-3-User-defined-interval-discretization.ipynb ├── Recipe-4-Discretization-k-means.ipynb ├── Recipe-5-Binarization.ipynb ├── Recipe-6-Discretization-with-decision-trees.ipynb └── donwload-prepare-store-enron-data.ipynb ├── ch05-outliers ├── Recipe-1-Visualizing-outliers-with-boxplots.ipynb ├── Recipe-2-Finding-outliers-with-mean-and-std.ipynb ├── Recipe-3-Finding-outliers-with-the-IQR.ipynb ├── Recipe-4-Removing-outliers.ipynb ├── Recipe-5-Capping-outliers.ipynb └── Recipe-6-Capping-outliers-with-quantiles.ipynb ├── ch06-datetime ├── Recipe-1-Extracting-features-from-dates-with-pandas.ipynb ├── Recipe-2-Extracting-features-from-time-with-pandas.ipynb ├── Recipe-3-Capturing-elapsed-time-between-2-variables.ipynb ├── Recipe-4-Working-with-different-time-zones.ipynb └── Recipe-5-Automating-datetime-features-with-Feature-engine.ipynb ├── ch07-scaling ├── Recipe-1-standardization.ipynb ├── Recipe-2-min-max-scaling.ipynb ├── Recipe-3-robust-scaling.ipynb ├── Recipe-4-mean-normalization.ipynb ├── Recipe-5-maximum-absolute-scaling.ipynb └── Recipe-6-scaling-to-unit-length.ipynb ├── ch08-creation ├── Cyclical-features-figures.ipynb ├── Recipe1-Combine-features-with-functions.ipynb ├── Recipe2-Comparing-features-to-reference-variable.ipynb ├── Recipe3-PolynomialExpansion.ipynb ├── Recipe4-Combining-features-with-trees.ipynb ├── Recipe5-Periodic-features.ipynb ├── Recipe6-Spline-features.ipynb ├── Spline-features-figures.ipynb └── polynomial_features_figures.ipynb ├── ch09-featuretools ├── Recipe1-Setting-up-an-entitity-set.ipynb ├── Recipe2-Creating-features-with-cumulative-primitives.ipynb ├── Recipe3-Combining-numerical-features.ipynb ├── Recipe4-Creating-features-from-datetime.ipynb ├── Recipe5-Extracting-features-from-text.ipynb ├── Recipe6-Creating-features-with-aggregation-primitives.ipynb └── prepare-retail-dataset.ipynb ├── ch10-tsfresh ├── Recipe1-extract-features-automatically-with-tsfresh.ipynb ├── Recipe2-extract-relevant-features-with-tsfresh.ipynb ├── Recipe3-extract-specific-features-with-tsfresh.ipynb ├── Recipe4-extract-features-after-feature-selection.ipynb ├── Recipe5-extract-features-automatically-within-pipeline.ipynb └── prepare-occupancy-dataset.ipynb ├── ch11-text ├── Recipe1-Capturing-text-complexity-in-features.ipynb ├── Recipe2-Sentence-tokenization.ipynb ├── Recipe3-bag-of-words.ipynb ├── Recipe4-TFIDF.ipynb └── Recipe5-cleaning-text.ipynb └── requirements.txt /.gitignore: -------------------------------------------------------------------------------- 1 | .ipynb_checkpoints 2 | *.csv 3 | *.data 4 | *.txt 5 | *.gz -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | MIT License 2 | 3 | Copyright (c) 2022 Packt 4 | 5 | Permission is hereby granted, free of charge, to any person obtaining a copy 6 | of this software and associated documentation files (the "Software"), to deal 7 | in the Software without restriction, including without limitation the rights 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 9 | copies of the Software, and to permit persons to whom the Software is 10 | furnished to do so, subject to the following conditions: 11 | 12 | The above copyright notice and this permission notice shall be included in all 13 | copies or substantial portions of the Software. 14 | 15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 21 | SOFTWARE. 22 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | 2 | ### [Packt Conference : Put Generative AI to work on Oct 11-13 (Virtual)](https://packt.link/JGIEY) 3 | 4 |
[](https://packt.link/JGIEY)
5 | 3 Days, 20+ AI Experts, 25+ Workshops and Power Talks 6 | 7 | Code: USD75OFF 8 | 9 | 10 | 11 | 12 | # Python Feature Engineering Cookbook-Second Edition 13 | 14 |\n", 60 | " | A1 | \n", 61 | "A2 | \n", 62 | "A3 | \n", 63 | "A4 | \n", 64 | "A5 | \n", 65 | "A6 | \n", 66 | "A7 | \n", 67 | "A8 | \n", 68 | "A9 | \n", 69 | "A10 | \n", 70 | "A11 | \n", 71 | "A12 | \n", 72 | "A13 | \n", 73 | "A14 | \n", 74 | "A15 | \n", 75 | "target | \n", 76 | "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", 81 | "b | \n", 82 | "30.83 | \n", 83 | "0.000 | \n", 84 | "u | \n", 85 | "g | \n", 86 | "w | \n", 87 | "v | \n", 88 | "1.25 | \n", 89 | "t | \n", 90 | "t | \n", 91 | "1 | \n", 92 | "f | \n", 93 | "g | \n", 94 | "202.0 | \n", 95 | "0 | \n", 96 | "1 | \n", 97 | "
1 | \n", 100 | "a | \n", 101 | "58.67 | \n", 102 | "4.460 | \n", 103 | "u | \n", 104 | "g | \n", 105 | "q | \n", 106 | "h | \n", 107 | "3.04 | \n", 108 | "t | \n", 109 | "t | \n", 110 | "6 | \n", 111 | "f | \n", 112 | "g | \n", 113 | "43.0 | \n", 114 | "560 | \n", 115 | "1 | \n", 116 | "
2 | \n", 119 | "a | \n", 120 | "24.50 | \n", 121 | "NaN | \n", 122 | "u | \n", 123 | "g | \n", 124 | "q | \n", 125 | "h | \n", 126 | "NaN | \n", 127 | "NaN | \n", 128 | "NaN | \n", 129 | "0 | \n", 130 | "f | \n", 131 | "g | \n", 132 | "280.0 | \n", 133 | "824 | \n", 134 | "1 | \n", 135 | "
3 | \n", 138 | "b | \n", 139 | "27.83 | \n", 140 | "1.540 | \n", 141 | "u | \n", 142 | "g | \n", 143 | "w | \n", 144 | "v | \n", 145 | "3.75 | \n", 146 | "t | \n", 147 | "t | \n", 148 | "5 | \n", 149 | "t | \n", 150 | "g | \n", 151 | "100.0 | \n", 152 | "3 | \n", 153 | "1 | \n", 154 | "
4 | \n", 157 | "b | \n", 158 | "20.17 | \n", 159 | "5.625 | \n", 160 | "u | \n", 161 | "g | \n", 162 | "w | \n", 163 | "v | \n", 164 | "1.71 | \n", 165 | "t | \n", 166 | "f | \n", 167 | "0 | \n", 168 | "f | \n", 169 | "s | \n", 170 | "120.0 | \n", 171 | "0 | \n", 172 | "1 | \n", 173 | "
\n", 58 | " | A2 | \n", 59 | "A3 | \n", 60 | "A8 | \n", 61 | "A11 | \n", 62 | "A14 | \n", 63 | "A15 | \n", 64 | "target | \n", 65 | "
---|---|---|---|---|---|---|---|
0 | \n", 70 | "30.83 | \n", 71 | "0.000 | \n", 72 | "1.25 | \n", 73 | "1 | \n", 74 | "202.0 | \n", 75 | "0 | \n", 76 | "1 | \n", 77 | "
1 | \n", 80 | "58.67 | \n", 81 | "4.460 | \n", 82 | "3.04 | \n", 83 | "6 | \n", 84 | "43.0 | \n", 85 | "560 | \n", 86 | "1 | \n", 87 | "
2 | \n", 90 | "24.50 | \n", 91 | "NaN | \n", 92 | "NaN | \n", 93 | "0 | \n", 94 | "280.0 | \n", 95 | "824 | \n", 96 | "1 | \n", 97 | "
3 | \n", 100 | "27.83 | \n", 101 | "1.540 | \n", 102 | "3.75 | \n", 103 | "5 | \n", 104 | "100.0 | \n", 105 | "3 | \n", 106 | "1 | \n", 107 | "
4 | \n", 110 | "20.17 | \n", 111 | "5.625 | \n", 112 | "1.71 | \n", 113 | "0 | \n", 114 | "120.0 | \n", 115 | "0 | \n", 116 | "1 | \n", 117 | "
\n", 63 | " | A1 | \n", 64 | "A2 | \n", 65 | "A3 | \n", 66 | "A4 | \n", 67 | "A5 | \n", 68 | "A6 | \n", 69 | "A7 | \n", 70 | "A8 | \n", 71 | "A9 | \n", 72 | "A10 | \n", 73 | "A11 | \n", 74 | "A12 | \n", 75 | "A13 | \n", 76 | "A14 | \n", 77 | "A15 | \n", 78 | "target | \n", 79 | "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", 84 | "b | \n", 85 | "30.83 | \n", 86 | "0.000 | \n", 87 | "u | \n", 88 | "g | \n", 89 | "w | \n", 90 | "v | \n", 91 | "1.25 | \n", 92 | "t | \n", 93 | "t | \n", 94 | "1 | \n", 95 | "f | \n", 96 | "g | \n", 97 | "202.0 | \n", 98 | "0 | \n", 99 | "1 | \n", 100 | "
1 | \n", 103 | "a | \n", 104 | "58.67 | \n", 105 | "4.460 | \n", 106 | "u | \n", 107 | "g | \n", 108 | "q | \n", 109 | "h | \n", 110 | "3.04 | \n", 111 | "t | \n", 112 | "t | \n", 113 | "6 | \n", 114 | "f | \n", 115 | "g | \n", 116 | "43.0 | \n", 117 | "560 | \n", 118 | "1 | \n", 119 | "
2 | \n", 122 | "a | \n", 123 | "24.50 | \n", 124 | "0.500 | \n", 125 | "u | \n", 126 | "g | \n", 127 | "q | \n", 128 | "h | \n", 129 | "1.50 | \n", 130 | "t | \n", 131 | "f | \n", 132 | "0 | \n", 133 | "f | \n", 134 | "g | \n", 135 | "280.0 | \n", 136 | "824 | \n", 137 | "1 | \n", 138 | "
3 | \n", 141 | "b | \n", 142 | "27.83 | \n", 143 | "1.540 | \n", 144 | "u | \n", 145 | "g | \n", 146 | "w | \n", 147 | "v | \n", 148 | "3.75 | \n", 149 | "t | \n", 150 | "t | \n", 151 | "5 | \n", 152 | "t | \n", 153 | "g | \n", 154 | "100.0 | \n", 155 | "3 | \n", 156 | "1 | \n", 157 | "
4 | \n", 160 | "b | \n", 161 | "20.17 | \n", 162 | "5.625 | \n", 163 | "u | \n", 164 | "g | \n", 165 | "w | \n", 166 | "v | \n", 167 | "1.71 | \n", 168 | "t | \n", 169 | "f | \n", 170 | "0 | \n", 171 | "f | \n", 172 | "s | \n", 173 | "120.0 | \n", 174 | "0 | \n", 175 | "1 | \n", 176 | "
\n", 62 | " | A1 | \n", 63 | "A2 | \n", 64 | "A3 | \n", 65 | "A4 | \n", 66 | "A5 | \n", 67 | "A6 | \n", 68 | "A7 | \n", 69 | "A8 | \n", 70 | "A9 | \n", 71 | "A10 | \n", 72 | "A11 | \n", 73 | "A12 | \n", 74 | "A13 | \n", 75 | "A14 | \n", 76 | "A15 | \n", 77 | "target | \n", 78 | "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", 83 | "b | \n", 84 | "30.83 | \n", 85 | "0.000 | \n", 86 | "u | \n", 87 | "g | \n", 88 | "w | \n", 89 | "v | \n", 90 | "1.25 | \n", 91 | "t | \n", 92 | "t | \n", 93 | "1 | \n", 94 | "f | \n", 95 | "g | \n", 96 | "202.0 | \n", 97 | "0 | \n", 98 | "1 | \n", 99 | "
1 | \n", 102 | "a | \n", 103 | "58.67 | \n", 104 | "4.460 | \n", 105 | "u | \n", 106 | "g | \n", 107 | "q | \n", 108 | "h | \n", 109 | "3.04 | \n", 110 | "t | \n", 111 | "t | \n", 112 | "6 | \n", 113 | "f | \n", 114 | "g | \n", 115 | "43.0 | \n", 116 | "560 | \n", 117 | "1 | \n", 118 | "
2 | \n", 121 | "a | \n", 122 | "24.50 | \n", 123 | "0.500 | \n", 124 | "u | \n", 125 | "g | \n", 126 | "q | \n", 127 | "h | \n", 128 | "1.50 | \n", 129 | "t | \n", 130 | "f | \n", 131 | "0 | \n", 132 | "f | \n", 133 | "g | \n", 134 | "280.0 | \n", 135 | "824 | \n", 136 | "1 | \n", 137 | "
3 | \n", 140 | "b | \n", 141 | "27.83 | \n", 142 | "1.540 | \n", 143 | "u | \n", 144 | "g | \n", 145 | "w | \n", 146 | "v | \n", 147 | "3.75 | \n", 148 | "t | \n", 149 | "t | \n", 150 | "5 | \n", 151 | "t | \n", 152 | "g | \n", 153 | "100.0 | \n", 154 | "3 | \n", 155 | "1 | \n", 156 | "
4 | \n", 159 | "b | \n", 160 | "20.17 | \n", 161 | "5.625 | \n", 162 | "u | \n", 163 | "g | \n", 164 | "w | \n", 165 | "v | \n", 166 | "1.71 | \n", 167 | "t | \n", 168 | "f | \n", 169 | "0 | \n", 170 | "f | \n", 171 | "s | \n", 172 | "120.0 | \n", 173 | "0 | \n", 174 | "1 | \n", 175 | "
\n", 60 | " | docID | \n", 61 | "wordID | \n", 62 | "count | \n", 63 | "
---|---|---|---|
0 | \n", 68 | "1 | \n", 69 | "118 | \n", 70 | "1 | \n", 71 | "
1 | \n", 74 | "1 | \n", 75 | "285 | \n", 76 | "1 | \n", 77 | "
2 | \n", 80 | "1 | \n", 81 | "1229 | \n", 82 | "1 | \n", 83 | "
3 | \n", 86 | "1 | \n", 87 | "1688 | \n", 88 | "1 | \n", 89 | "
4 | \n", 92 | "1 | \n", 93 | "2068 | \n", 94 | "1 | \n", 95 | "
\n", 149 | " | words | \n", 150 | "
---|---|
0 | \n", 155 | "aaa | \n", 156 | "
1 | \n", 159 | "aaas | \n", 160 | "
2 | \n", 163 | "aactive | \n", 164 | "
3 | \n", 167 | "aadvantage | \n", 168 | "
4 | \n", 171 | "aaker | \n", 172 | "
\n", 226 | " | words | \n", 227 | "
---|---|
8704 | \n", 232 | "eurobond | \n", 233 | "
13618 | \n", 236 | "keen | \n", 237 | "
11114 | \n", 240 | "halligan | \n", 241 | "
19968 | \n", 244 | "pvr | \n", 245 | "
23327 | \n", 248 | "soda | \n", 249 | "
20714 | \n", 252 | "refundable | \n", 253 | "
390 | \n", 256 | "advice | \n", 257 | "
6257 | \n", 260 | "decker | \n", 261 | "
8680 | \n", 264 | "etis | \n", 265 | "
3370 | \n", 268 | "cab | \n", 269 | "
\n", 327 | " | words | \n", 328 | "docID | \n", 329 | "wordID | \n", 330 | "count | \n", 331 | "
---|---|---|---|---|
137715 | \n", 336 | "eurobond | \n", 337 | "2021 | \n", 338 | "8704 | \n", 339 | "2 | \n", 340 | "
140167 | \n", 343 | "eurobond | \n", 344 | "2050 | \n", 345 | "8704 | \n", 346 | "11 | \n", 347 | "
151530 | \n", 350 | "eurobond | \n", 351 | "2269 | \n", 352 | "8704 | \n", 353 | "2 | \n", 354 | "
155066 | \n", 357 | "eurobond | \n", 358 | "2352 | \n", 359 | "8704 | \n", 360 | "2 | \n", 361 | "
156247 | \n", 364 | "eurobond | \n", 365 | "2375 | \n", 366 | "8704 | \n", 367 | "2 | \n", 368 | "
words | \n", 444 | "advice | \n", 445 | "cab | \n", 446 | "decker | \n", 447 | "etis | \n", 448 | "eurobond | \n", 449 | "halligan | \n", 450 | "keen | \n", 451 | "pvr | \n", 452 | "refundable | \n", 453 | "soda | \n", 454 | "
---|---|---|---|---|---|---|---|---|---|---|
0 | \n", 459 | "0.0 | \n", 460 | "0.0 | \n", 461 | "2.0 | \n", 462 | "0.0 | \n", 463 | "0.0 | \n", 464 | "0.0 | \n", 465 | "0.0 | \n", 466 | "0.0 | \n", 467 | "0.0 | \n", 468 | "0.0 | \n", 469 | "
1 | \n", 472 | "0.0 | \n", 473 | "0.0 | \n", 474 | "2.0 | \n", 475 | "0.0 | \n", 476 | "0.0 | \n", 477 | "0.0 | \n", 478 | "0.0 | \n", 479 | "0.0 | \n", 480 | "0.0 | \n", 481 | "0.0 | \n", 482 | "
2 | \n", 485 | "1.0 | \n", 486 | "0.0 | \n", 487 | "0.0 | \n", 488 | "0.0 | \n", 489 | "0.0 | \n", 490 | "0.0 | \n", 491 | "0.0 | \n", 492 | "0.0 | \n", 493 | "0.0 | \n", 494 | "0.0 | \n", 495 | "
3 | \n", 498 | "0.0 | \n", 499 | "0.0 | \n", 500 | "0.0 | \n", 501 | "0.0 | \n", 502 | "0.0 | \n", 503 | "0.0 | \n", 504 | "0.0 | \n", 505 | "0.0 | \n", 506 | "1.0 | \n", 507 | "0.0 | \n", 508 | "
4 | \n", 511 | "0.0 | \n", 512 | "0.0 | \n", 513 | "2.0 | \n", 514 | "0.0 | \n", 515 | "0.0 | \n", 516 | "0.0 | \n", 517 | "0.0 | \n", 518 | "0.0 | \n", 519 | "0.0 | \n", 520 | "0.0 | \n", 521 | "
\n", 49 | " | mean radius | \n", 50 | "mean texture | \n", 51 | "mean perimeter | \n", 52 | "mean area | \n", 53 | "mean smoothness | \n", 54 | "mean compactness | \n", 55 | "mean concavity | \n", 56 | "mean concave points | \n", 57 | "mean symmetry | \n", 58 | "mean fractal dimension | \n", 59 | "... | \n", 60 | "worst radius | \n", 61 | "worst texture | \n", 62 | "worst perimeter | \n", 63 | "worst area | \n", 64 | "worst smoothness | \n", 65 | "worst compactness | \n", 66 | "worst concavity | \n", 67 | "worst concave points | \n", 68 | "worst symmetry | \n", 69 | "worst fractal dimension | \n", 70 | "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", 75 | "17.99 | \n", 76 | "10.38 | \n", 77 | "122.80 | \n", 78 | "1001.0 | \n", 79 | "0.11840 | \n", 80 | "0.27760 | \n", 81 | "0.3001 | \n", 82 | "0.14710 | \n", 83 | "0.2419 | \n", 84 | "0.07871 | \n", 85 | "... | \n", 86 | "25.38 | \n", 87 | "17.33 | \n", 88 | "184.60 | \n", 89 | "2019.0 | \n", 90 | "0.1622 | \n", 91 | "0.6656 | \n", 92 | "0.7119 | \n", 93 | "0.2654 | \n", 94 | "0.4601 | \n", 95 | "0.11890 | \n", 96 | "
1 | \n", 99 | "20.57 | \n", 100 | "17.77 | \n", 101 | "132.90 | \n", 102 | "1326.0 | \n", 103 | "0.08474 | \n", 104 | "0.07864 | \n", 105 | "0.0869 | \n", 106 | "0.07017 | \n", 107 | "0.1812 | \n", 108 | "0.05667 | \n", 109 | "... | \n", 110 | "24.99 | \n", 111 | "23.41 | \n", 112 | "158.80 | \n", 113 | "1956.0 | \n", 114 | "0.1238 | \n", 115 | "0.1866 | \n", 116 | "0.2416 | \n", 117 | "0.1860 | \n", 118 | "0.2750 | \n", 119 | "0.08902 | \n", 120 | "
2 | \n", 123 | "19.69 | \n", 124 | "21.25 | \n", 125 | "130.00 | \n", 126 | "1203.0 | \n", 127 | "0.10960 | \n", 128 | "0.15990 | \n", 129 | "0.1974 | \n", 130 | "0.12790 | \n", 131 | "0.2069 | \n", 132 | "0.05999 | \n", 133 | "... | \n", 134 | "23.57 | \n", 135 | "25.53 | \n", 136 | "152.50 | \n", 137 | "1709.0 | \n", 138 | "0.1444 | \n", 139 | "0.4245 | \n", 140 | "0.4504 | \n", 141 | "0.2430 | \n", 142 | "0.3613 | \n", 143 | "0.08758 | \n", 144 | "
3 | \n", 147 | "11.42 | \n", 148 | "20.38 | \n", 149 | "77.58 | \n", 150 | "386.1 | \n", 151 | "0.14250 | \n", 152 | "0.28390 | \n", 153 | "0.2414 | \n", 154 | "0.10520 | \n", 155 | "0.2597 | \n", 156 | "0.09744 | \n", 157 | "... | \n", 158 | "14.91 | \n", 159 | "26.50 | \n", 160 | "98.87 | \n", 161 | "567.7 | \n", 162 | "0.2098 | \n", 163 | "0.8663 | \n", 164 | "0.6869 | \n", 165 | "0.2575 | \n", 166 | "0.6638 | \n", 167 | "0.17300 | \n", 168 | "
4 | \n", 171 | "20.29 | \n", 172 | "14.34 | \n", 173 | "135.10 | \n", 174 | "1297.0 | \n", 175 | "0.10030 | \n", 176 | "0.13280 | \n", 177 | "0.1980 | \n", 178 | "0.10430 | \n", 179 | "0.1809 | \n", 180 | "0.05883 | \n", 181 | "... | \n", 182 | "22.54 | \n", 183 | "16.67 | \n", 184 | "152.20 | \n", 185 | "1575.0 | \n", 186 | "0.1374 | \n", 187 | "0.2050 | \n", 188 | "0.4000 | \n", 189 | "0.1625 | \n", 190 | "0.2364 | \n", 191 | "0.07678 | \n", 192 | "
5 rows × 30 columns
\n", 196 | "\n", 49 | " | MedInc | \n", 50 | "HouseAge | \n", 51 | "AveRooms | \n", 52 | "AveBedrms | \n", 53 | "Population | \n", 54 | "AveOccup | \n", 55 | "Latitude | \n", 56 | "Longitude | \n", 57 | "
---|---|---|---|---|---|---|---|---|
0 | \n", 62 | "8.3252 | \n", 63 | "41.0 | \n", 64 | "6.984127 | \n", 65 | "1.023810 | \n", 66 | "322.0 | \n", 67 | "2.555556 | \n", 68 | "37.88 | \n", 69 | "-122.23 | \n", 70 | "
1 | \n", 73 | "8.3014 | \n", 74 | "21.0 | \n", 75 | "6.238137 | \n", 76 | "0.971880 | \n", 77 | "2401.0 | \n", 78 | "2.109842 | \n", 79 | "37.86 | \n", 80 | "-122.22 | \n", 81 | "
2 | \n", 84 | "7.2574 | \n", 85 | "52.0 | \n", 86 | "8.288136 | \n", 87 | "1.073446 | \n", 88 | "496.0 | \n", 89 | "2.802260 | \n", 90 | "37.85 | \n", 91 | "-122.24 | \n", 92 | "
3 | \n", 95 | "5.6431 | \n", 96 | "52.0 | \n", 97 | "5.817352 | \n", 98 | "1.073059 | \n", 99 | "558.0 | \n", 100 | "2.547945 | \n", 101 | "37.85 | \n", 102 | "-122.25 | \n", 103 | "
4 | \n", 106 | "3.8462 | \n", 107 | "52.0 | \n", 108 | "6.281853 | \n", 109 | "1.081081 | \n", 110 | "565.0 | \n", 111 | "2.181467 | \n", 112 | "37.85 | \n", 113 | "-122.25 | \n", 114 | "
\n", 81 | " | MedInc | \n", 82 | "HouseAge | \n", 83 | "AveRooms | \n", 84 | "AveBedrms | \n", 85 | "Population | \n", 86 | "AveOccup | \n", 87 | "Latitude | \n", 88 | "Longitude | \n", 89 | "
---|---|---|---|---|---|---|---|---|
1989 | \n", 94 | "1.9750 | \n", 95 | "52.0 | \n", 96 | "2.800000 | \n", 97 | "0.700000 | \n", 98 | "193.0 | \n", 99 | "4.825000 | \n", 100 | "36.73 | \n", 101 | "-119.79 | \n", 102 | "
256 | \n", 105 | "2.2604 | \n", 106 | "43.0 | \n", 107 | "3.671480 | \n", 108 | "1.184116 | \n", 109 | "836.0 | \n", 110 | "3.018051 | \n", 111 | "37.77 | \n", 112 | "-122.21 | \n", 113 | "
7887 | \n", 116 | "6.2990 | \n", 117 | "17.0 | \n", 118 | "6.478022 | \n", 119 | "1.087912 | \n", 120 | "1387.0 | \n", 121 | "3.810440 | \n", 122 | "33.87 | \n", 123 | "-118.04 | \n", 124 | "
4581 | \n", 127 | "1.7199 | \n", 128 | "17.0 | \n", 129 | "2.518000 | \n", 130 | "1.196000 | \n", 131 | "3051.0 | \n", 132 | "3.051000 | \n", 133 | "34.06 | \n", 134 | "-118.28 | \n", 135 | "
1993 | \n", 138 | "2.2206 | \n", 139 | "50.0 | \n", 140 | "4.622754 | \n", 141 | "1.161677 | \n", 142 | "606.0 | \n", 143 | "3.628743 | \n", 144 | "36.73 | \n", 145 | "-119.81 | \n", 146 | "
OutlierTrimmer(capping_method='iqr', fold=1.5, tail='both',\n", 290 | " variables=['MedInc', 'HouseAge', 'Population'])In a Jupyter environment, please rerun this cell to show the HTML representation or trust the notebook.
OutlierTrimmer(capping_method='iqr', fold=1.5, tail='both',\n", 291 | " variables=['MedInc', 'HouseAge', 'Population'])
\n", 46 | " | date | \n", 47 | "
---|---|
0 | \n", 52 | "2019-03-05 00:00:00 | \n", 53 | "
1 | \n", 56 | "2019-03-05 01:15:10 | \n", 57 | "
2 | \n", 60 | "2019-03-05 02:30:20 | \n", 61 | "
3 | \n", 64 | "2019-03-05 03:45:30 | \n", 65 | "
4 | \n", 68 | "2019-03-05 05:00:40 | \n", 69 | "
\n", 122 | " | date | \n", 123 | "hour | \n", 124 | "min | \n", 125 | "sec | \n", 126 | "
---|---|---|---|---|
0 | \n", 131 | "2019-03-05 00:00:00 | \n", 132 | "0 | \n", 133 | "0 | \n", 134 | "0 | \n", 135 | "
1 | \n", 138 | "2019-03-05 01:15:10 | \n", 139 | "1 | \n", 140 | "15 | \n", 141 | "10 | \n", 142 | "
2 | \n", 145 | "2019-03-05 02:30:20 | \n", 146 | "2 | \n", 147 | "30 | \n", 148 | "20 | \n", 149 | "
3 | \n", 152 | "2019-03-05 03:45:30 | \n", 153 | "3 | \n", 154 | "45 | \n", 155 | "30 | \n", 156 | "
4 | \n", 159 | "2019-03-05 05:00:40 | \n", 160 | "5 | \n", 161 | "0 | \n", 162 | "40 | \n", 163 | "
\n", 218 | " | date | \n", 219 | "hour | \n", 220 | "min | \n", 221 | "sec | \n", 222 | "h | \n", 223 | "m | \n", 224 | "s | \n", 225 | "
---|---|---|---|---|---|---|---|
0 | \n", 230 | "2019-03-05 00:00:00 | \n", 231 | "0 | \n", 232 | "0 | \n", 233 | "0 | \n", 234 | "0 | \n", 235 | "0 | \n", 236 | "0 | \n", 237 | "
1 | \n", 240 | "2019-03-05 01:15:10 | \n", 241 | "1 | \n", 242 | "15 | \n", 243 | "10 | \n", 244 | "1 | \n", 245 | "15 | \n", 246 | "10 | \n", 247 | "
2 | \n", 250 | "2019-03-05 02:30:20 | \n", 251 | "2 | \n", 252 | "30 | \n", 253 | "20 | \n", 254 | "2 | \n", 255 | "30 | \n", 256 | "20 | \n", 257 | "
3 | \n", 260 | "2019-03-05 03:45:30 | \n", 261 | "3 | \n", 262 | "45 | \n", 263 | "30 | \n", 264 | "3 | \n", 265 | "45 | \n", 266 | "30 | \n", 267 | "
4 | \n", 270 | "2019-03-05 05:00:40 | \n", 271 | "5 | \n", 272 | "0 | \n", 273 | "40 | \n", 274 | "5 | \n", 275 | "0 | \n", 276 | "40 | \n", 277 | "
\n", 351 | " | date | \n", 352 | "hour | \n", 353 | "min | \n", 354 | "sec | \n", 355 | "h | \n", 356 | "m | \n", 357 | "s | \n", 358 | "is_morning | \n", 359 | "
---|---|---|---|---|---|---|---|---|
0 | \n", 364 | "2019-03-05 00:00:00 | \n", 365 | "0 | \n", 366 | "0 | \n", 367 | "0 | \n", 368 | "0 | \n", 369 | "0 | \n", 370 | "0 | \n", 371 | "0 | \n", 372 | "
1 | \n", 375 | "2019-03-05 01:15:10 | \n", 376 | "1 | \n", 377 | "15 | \n", 378 | "10 | \n", 379 | "1 | \n", 380 | "15 | \n", 381 | "10 | \n", 382 | "0 | \n", 383 | "
2 | \n", 386 | "2019-03-05 02:30:20 | \n", 387 | "2 | \n", 388 | "30 | \n", 389 | "20 | \n", 390 | "2 | \n", 391 | "30 | \n", 392 | "20 | \n", 393 | "0 | \n", 394 | "
3 | \n", 397 | "2019-03-05 03:45:30 | \n", 398 | "3 | \n", 399 | "45 | \n", 400 | "30 | \n", 401 | "3 | \n", 402 | "45 | \n", 403 | "30 | \n", 404 | "0 | \n", 405 | "
4 | \n", 408 | "2019-03-05 05:00:40 | \n", 409 | "5 | \n", 410 | "0 | \n", 411 | "40 | \n", 412 | "5 | \n", 413 | "0 | \n", 414 | "40 | \n", 415 | "0 | \n", 416 | "
\n", 47 | " | date1 | \n", 48 | "date2 | \n", 49 | "
---|---|---|
0 | \n", 54 | "2019-03-05 00:00:00 | \n", 55 | "2019-03-31 | \n", 56 | "
1 | \n", 59 | "2019-03-05 01:00:00 | \n", 60 | "2019-04-30 | \n", 61 | "
2 | \n", 64 | "2019-03-05 02:00:00 | \n", 65 | "2019-05-31 | \n", 66 | "
3 | \n", 69 | "2019-03-05 03:00:00 | \n", 70 | "2019-06-30 | \n", 71 | "
4 | \n", 74 | "2019-03-05 04:00:00 | \n", 75 | "2019-07-31 | \n", 76 | "
\n", 131 | " | date1 | \n", 132 | "date2 | \n", 133 | "elapsed_days | \n", 134 | "
---|---|---|---|
0 | \n", 139 | "2019-03-05 00:00:00 | \n", 140 | "2019-03-31 | \n", 141 | "26 | \n", 142 | "
1 | \n", 145 | "2019-03-05 01:00:00 | \n", 146 | "2019-04-30 | \n", 147 | "55 | \n", 148 | "
2 | \n", 151 | "2019-03-05 02:00:00 | \n", 152 | "2019-05-31 | \n", 153 | "86 | \n", 154 | "
3 | \n", 157 | "2019-03-05 03:00:00 | \n", 158 | "2019-06-30 | \n", 159 | "116 | \n", 160 | "
4 | \n", 163 | "2019-03-05 04:00:00 | \n", 164 | "2019-07-31 | \n", 165 | "147 | \n", 166 | "
\n", 219 | " | date1 | \n", 220 | "date2 | \n", 221 | "elapsed_days | \n", 222 | "months_passed | \n", 223 | "
---|---|---|---|---|
0 | \n", 228 | "2019-03-05 00:00:00 | \n", 229 | "2019-03-31 | \n", 230 | "26 | \n", 231 | "1.0 | \n", 232 | "
1 | \n", 235 | "2019-03-05 01:00:00 | \n", 236 | "2019-04-30 | \n", 237 | "55 | \n", 238 | "2.0 | \n", 239 | "
2 | \n", 242 | "2019-03-05 02:00:00 | \n", 243 | "2019-05-31 | \n", 244 | "86 | \n", 245 | "3.0 | \n", 246 | "
3 | \n", 249 | "2019-03-05 03:00:00 | \n", 250 | "2019-06-30 | \n", 251 | "116 | \n", 252 | "4.0 | \n", 253 | "
4 | \n", 256 | "2019-03-05 04:00:00 | \n", 257 | "2019-07-31 | \n", 258 | "147 | \n", 259 | "5.0 | \n", 260 | "
\n", 314 | " | date1 | \n", 315 | "date2 | \n", 316 | "elapsed_days | \n", 317 | "months_passed | \n", 318 | "diff_seconds | \n", 319 | "diff_minutes | \n", 320 | "
---|---|---|---|---|---|---|
0 | \n", 325 | "2019-03-05 00:00:00 | \n", 326 | "2019-03-31 | \n", 327 | "26 | \n", 328 | "1.0 | \n", 329 | "2246400.0 | \n", 330 | "37440.0 | \n", 331 | "
1 | \n", 334 | "2019-03-05 01:00:00 | \n", 335 | "2019-04-30 | \n", 336 | "55 | \n", 337 | "2.0 | \n", 338 | "4834800.0 | \n", 339 | "80580.0 | \n", 340 | "
2 | \n", 343 | "2019-03-05 02:00:00 | \n", 344 | "2019-05-31 | \n", 345 | "86 | \n", 346 | "3.0 | \n", 347 | "7509600.0 | \n", 348 | "125160.0 | \n", 349 | "
3 | \n", 352 | "2019-03-05 03:00:00 | \n", 353 | "2019-06-30 | \n", 354 | "116 | \n", 355 | "4.0 | \n", 356 | "10098000.0 | \n", 357 | "168300.0 | \n", 358 | "
4 | \n", 361 | "2019-03-05 04:00:00 | \n", 362 | "2019-07-31 | \n", 363 | "147 | \n", 364 | "5.0 | \n", 365 | "12772800.0 | \n", 366 | "212880.0 | \n", 367 | "
\n", 428 | " | date1 | \n", 429 | "date2 | \n", 430 | "elapsed_days | \n", 431 | "months_passed | \n", 432 | "diff_seconds | \n", 433 | "diff_minutes | \n", 434 | "to_today | \n", 435 | "
---|---|---|---|---|---|---|---|
0 | \n", 440 | "2019-03-05 00:00:00 | \n", 441 | "2019-03-31 | \n", 442 | "26 | \n", 443 | "1.0 | \n", 444 | "2246400.0 | \n", 445 | "37440.0 | \n", 446 | "1265 days 11:41:24.651022 | \n", 447 | "
1 | \n", 450 | "2019-03-05 01:00:00 | \n", 451 | "2019-04-30 | \n", 452 | "55 | \n", 453 | "2.0 | \n", 454 | "4834800.0 | \n", 455 | "80580.0 | \n", 456 | "1265 days 10:41:24.651022 | \n", 457 | "
2 | \n", 460 | "2019-03-05 02:00:00 | \n", 461 | "2019-05-31 | \n", 462 | "86 | \n", 463 | "3.0 | \n", 464 | "7509600.0 | \n", 465 | "125160.0 | \n", 466 | "1265 days 09:41:24.651022 | \n", 467 | "
3 | \n", 470 | "2019-03-05 03:00:00 | \n", 471 | "2019-06-30 | \n", 472 | "116 | \n", 473 | "4.0 | \n", 474 | "10098000.0 | \n", 475 | "168300.0 | \n", 476 | "1265 days 08:41:24.651022 | \n", 477 | "
4 | \n", 480 | "2019-03-05 04:00:00 | \n", 481 | "2019-07-31 | \n", 482 | "147 | \n", 483 | "5.0 | \n", 484 | "12772800.0 | \n", 485 | "212880.0 | \n", 486 | "1265 days 07:41:24.651022 | \n", 487 | "
\n", 45 | " | time1 | \n", 46 | "
---|---|
0 | \n", 51 | "2015-06-10 09:00:00+02:00 | \n", 52 | "
1 | \n", 55 | "2015-06-10 10:00:00+02:00 | \n", 56 | "
2 | \n", 59 | "2015-06-10 11:00:00+02:00 | \n", 60 | "
0 | \n", 63 | "2015-09-10 09:00:00-05:00 | \n", 64 | "
1 | \n", 67 | "2015-09-10 10:00:00-05:00 | \n", 68 | "
2 | \n", 71 | "2015-09-10 11:00:00-05:00 | \n", 72 | "
\n", 143 | " | time1 | \n", 144 | "time2 | \n", 145 | "
---|---|---|
0 | \n", 150 | "2015-06-10 09:00:00+02:00 | \n", 151 | "2015-07-01 09:00:00+02:00 | \n", 152 | "
1 | \n", 155 | "2015-06-10 10:00:00+02:00 | \n", 156 | "2015-07-01 10:00:00+02:00 | \n", 157 | "
2 | \n", 160 | "2015-06-10 11:00:00+02:00 | \n", 161 | "2015-07-01 11:00:00+02:00 | \n", 162 | "
0 | \n", 165 | "2015-09-10 09:00:00-05:00 | \n", 166 | "2015-08-01 09:00:00-05:00 | \n", 167 | "
1 | \n", 170 | "2015-09-10 10:00:00-05:00 | \n", 171 | "2015-08-01 10:00:00-05:00 | \n", 172 | "
2 | \n", 175 | "2015-09-10 11:00:00-05:00 | \n", 176 | "2015-08-01 11:00:00-05:00 | \n", 177 | "
\n", 246 | " | time1 | \n", 247 | "time2 | \n", 248 | "time1_utc | \n", 249 | "time2_utc | \n", 250 | "
---|---|---|---|---|
0 | \n", 255 | "2015-06-10 09:00:00+02:00 | \n", 256 | "2015-07-01 09:00:00+02:00 | \n", 257 | "2015-06-10 07:00:00+00:00 | \n", 258 | "2015-07-01 07:00:00+00:00 | \n", 259 | "
1 | \n", 262 | "2015-06-10 10:00:00+02:00 | \n", 263 | "2015-07-01 10:00:00+02:00 | \n", 264 | "2015-06-10 08:00:00+00:00 | \n", 265 | "2015-07-01 08:00:00+00:00 | \n", 266 | "
2 | \n", 269 | "2015-06-10 11:00:00+02:00 | \n", 270 | "2015-07-01 11:00:00+02:00 | \n", 271 | "2015-06-10 09:00:00+00:00 | \n", 272 | "2015-07-01 09:00:00+00:00 | \n", 273 | "
0 | \n", 276 | "2015-09-10 09:00:00-05:00 | \n", 277 | "2015-08-01 09:00:00-05:00 | \n", 278 | "2015-09-10 14:00:00+00:00 | \n", 279 | "2015-08-01 14:00:00+00:00 | \n", 280 | "
1 | \n", 283 | "2015-09-10 10:00:00-05:00 | \n", 284 | "2015-08-01 10:00:00-05:00 | \n", 285 | "2015-09-10 15:00:00+00:00 | \n", 286 | "2015-08-01 15:00:00+00:00 | \n", 287 | "
2 | \n", 290 | "2015-09-10 11:00:00-05:00 | \n", 291 | "2015-08-01 11:00:00-05:00 | \n", 292 | "2015-09-10 16:00:00+00:00 | \n", 293 | "2015-08-01 16:00:00+00:00 | \n", 294 | "
\n", 387 | " | time1_london | \n", 388 | "time2_berlin | \n", 389 | "
---|---|---|
0 | \n", 394 | "2015-06-10 08:00:00+01:00 | \n", 395 | "2015-06-10 09:00:00+02:00 | \n", 396 | "
1 | \n", 399 | "2015-06-10 09:00:00+01:00 | \n", 400 | "2015-06-10 10:00:00+02:00 | \n", 401 | "
2 | \n", 404 | "2015-06-10 10:00:00+01:00 | \n", 405 | "2015-06-10 11:00:00+02:00 | \n", 406 | "
0 | \n", 409 | "2015-09-10 15:00:00+01:00 | \n", 410 | "2015-09-10 16:00:00+02:00 | \n", 411 | "
1 | \n", 414 | "2015-09-10 16:00:00+01:00 | \n", 415 | "2015-09-10 17:00:00+02:00 | \n", 416 | "
2 | \n", 419 | "2015-09-10 17:00:00+01:00 | \n", 420 | "2015-09-10 18:00:00+02:00 | \n", 421 | "
\n", 95 | " | MedInc | \n", 96 | "HouseAge | \n", 97 | "AveRooms | \n", 98 | "AveBedrms | \n", 99 | "Population | \n", 100 | "AveOccup | \n", 101 | "
---|---|---|---|---|---|---|
0 | \n", 106 | "8.3252 | \n", 107 | "41.0 | \n", 108 | "6.984127 | \n", 109 | "1.023810 | \n", 110 | "322.0 | \n", 111 | "2.555556 | \n", 112 | "
1 | \n", 115 | "8.3014 | \n", 116 | "21.0 | \n", 117 | "6.238137 | \n", 118 | "0.971880 | \n", 119 | "2401.0 | \n", 120 | "2.109842 | \n", 121 | "
2 | \n", 124 | "7.2574 | \n", 125 | "52.0 | \n", 126 | "8.288136 | \n", 127 | "1.073446 | \n", 128 | "496.0 | \n", 129 | "2.802260 | \n", 130 | "
3 | \n", 133 | "5.6431 | \n", 134 | "52.0 | \n", 135 | "5.817352 | \n", 136 | "1.073059 | \n", 137 | "558.0 | \n", 138 | "2.547945 | \n", 139 | "
4 | \n", 142 | "3.8462 | \n", 143 | "52.0 | \n", 144 | "6.281853 | \n", 145 | "1.081081 | \n", 146 | "565.0 | \n", 147 | "2.181467 | \n", 148 | "
\n", 160 | " | customer_id | \n", 161 | "invoice | \n", 162 | "stock_code | \n", 163 | "description | \n", 164 | "quantity | \n", 165 | "price | \n", 166 | "price * quantity | \n", 167 | "
---|---|---|---|---|---|---|---|
rows | \n", 170 | "\n", 171 | " | \n", 172 | " | \n", 173 | " | \n", 174 | " | \n", 175 | " | \n", 176 | " | \n", 177 | " |
0 | \n", 182 | "13085.0 | \n", 183 | "489434 | \n", 184 | "85048 | \n", 185 | "15CM CHRISTMAS GLASS BALL 20 LIGHTS | \n", 186 | "12 | \n", 187 | "6.95 | \n", 188 | "83.4 | \n", 189 | "
1 | \n", 192 | "13085.0 | \n", 193 | "489434 | \n", 194 | "79323P | \n", 195 | "PINK CHERRY LIGHTS | \n", 196 | "12 | \n", 197 | "6.75 | \n", 198 | "81.0 | \n", 199 | "
2 | \n", 202 | "13085.0 | \n", 203 | "489434 | \n", 204 | "79323W | \n", 205 | "WHITE CHERRY LIGHTS | \n", 206 | "12 | \n", 207 | "6.75 | \n", 208 | "81.0 | \n", 209 | "
3 | \n", 212 | "13085.0 | \n", 213 | "489434 | \n", 214 | "22041 | \n", 215 | "RECORD FRAME 7\" SINGLE SIZE | \n", 216 | "48 | \n", 217 | "2.10 | \n", 218 | "100.8 | \n", 219 | "
4 | \n", 222 | "13085.0 | \n", 223 | "489434 | \n", 224 | "21232 | \n", 225 | "STRAWBERRY CERAMIC TRINKET BOX | \n", 226 | "24 | \n", 227 | "1.25 | \n", 228 | "30.0 | \n", 229 | "
\n", 294 | " | customer_id | \n", 295 | "invoice | \n", 296 | "invoice_date | \n", 297 | "stock_code | \n", 298 | "description | \n", 299 | "quantity | \n", 300 | "price | \n", 301 | "
---|---|---|---|---|---|---|---|
0 | \n", 306 | "13085.0 | \n", 307 | "489434 | \n", 308 | "2009-12-01 07:45:00 | \n", 309 | "85048 | \n", 310 | "15CM CHRISTMAS GLASS BALL 20 LIGHTS | \n", 311 | "12 | \n", 312 | "6.95 | \n", 313 | "
1 | \n", 316 | "13085.0 | \n", 317 | "489434 | \n", 318 | "2009-12-01 07:45:00 | \n", 319 | "79323P | \n", 320 | "PINK CHERRY LIGHTS | \n", 321 | "12 | \n", 322 | "6.75 | \n", 323 | "
2 | \n", 326 | "13085.0 | \n", 327 | "489434 | \n", 328 | "2009-12-01 07:45:00 | \n", 329 | "79323W | \n", 330 | "WHITE CHERRY LIGHTS | \n", 331 | "12 | \n", 332 | "6.75 | \n", 333 | "
3 | \n", 336 | "13085.0 | \n", 337 | "489434 | \n", 338 | "2009-12-01 07:45:00 | \n", 339 | "22041 | \n", 340 | "RECORD FRAME 7\" SINGLE SIZE | \n", 341 | "48 | \n", 342 | "2.10 | \n", 343 | "
4 | \n", 346 | "13085.0 | \n", 347 | "489434 | \n", 348 | "2009-12-01 07:45:00 | \n", 349 | "21232 | \n", 350 | "STRAWBERRY CERAMIC TRINKET BOX | \n", 351 | "24 | \n", 352 | "1.25 | \n", 353 | "
\n", 413 | " | customer_id | \n", 414 | "invoice | \n", 415 | "invoice_date | \n", 416 | "stock_code | \n", 417 | "description | \n", 418 | "quantity | \n", 419 | "price | \n", 420 | "amount | \n", 421 | "
---|---|---|---|---|---|---|---|---|
0 | \n", 426 | "13085.0 | \n", 427 | "489434 | \n", 428 | "2009-12-01 07:45:00 | \n", 429 | "85048 | \n", 430 | "15CM CHRISTMAS GLASS BALL 20 LIGHTS | \n", 431 | "12 | \n", 432 | "6.95 | \n", 433 | "83.4 | \n", 434 | "
1 | \n", 437 | "13085.0 | \n", 438 | "489434 | \n", 439 | "2009-12-01 07:45:00 | \n", 440 | "79323P | \n", 441 | "PINK CHERRY LIGHTS | \n", 442 | "12 | \n", 443 | "6.75 | \n", 444 | "81.0 | \n", 445 | "
2 | \n", 448 | "13085.0 | \n", 449 | "489434 | \n", 450 | "2009-12-01 07:45:00 | \n", 451 | "79323W | \n", 452 | "WHITE CHERRY LIGHTS | \n", 453 | "12 | \n", 454 | "6.75 | \n", 455 | "81.0 | \n", 456 | "
3 | \n", 459 | "13085.0 | \n", 460 | "489434 | \n", 461 | "2009-12-01 07:45:00 | \n", 462 | "22041 | \n", 463 | "RECORD FRAME 7\" SINGLE SIZE | \n", 464 | "48 | \n", 465 | "2.10 | \n", 466 | "100.8 | \n", 467 | "
4 | \n", 470 | "13085.0 | \n", 471 | "489434 | \n", 472 | "2009-12-01 07:45:00 | \n", 473 | "21232 | \n", 474 | "STRAWBERRY CERAMIC TRINKET BOX | \n", 475 | "24 | \n", 476 | "1.25 | \n", 477 | "30.0 | \n", 478 | "
\n", 92 | " | Invoice | \n", 93 | "StockCode | \n", 94 | "Description | \n", 95 | "Quantity | \n", 96 | "InvoiceDate | \n", 97 | "Price | \n", 98 | "Customer ID | \n", 99 | "Country | \n", 100 | "
---|---|---|---|---|---|---|---|---|
0 | \n", 105 | "489434 | \n", 106 | "85048 | \n", 107 | "15CM CHRISTMAS GLASS BALL 20 LIGHTS | \n", 108 | "12 | \n", 109 | "2009-12-01 07:45:00 | \n", 110 | "6.95 | \n", 111 | "13085.0 | \n", 112 | "United Kingdom | \n", 113 | "
1 | \n", 116 | "489434 | \n", 117 | "79323P | \n", 118 | "PINK CHERRY LIGHTS | \n", 119 | "12 | \n", 120 | "2009-12-01 07:45:00 | \n", 121 | "6.75 | \n", 122 | "13085.0 | \n", 123 | "United Kingdom | \n", 124 | "
2 | \n", 127 | "489434 | \n", 128 | "79323W | \n", 129 | "WHITE CHERRY LIGHTS | \n", 130 | "12 | \n", 131 | "2009-12-01 07:45:00 | \n", 132 | "6.75 | \n", 133 | "13085.0 | \n", 134 | "United Kingdom | \n", 135 | "
3 | \n", 138 | "489434 | \n", 139 | "22041 | \n", 140 | "RECORD FRAME 7\" SINGLE SIZE | \n", 141 | "48 | \n", 142 | "2009-12-01 07:45:00 | \n", 143 | "2.10 | \n", 144 | "13085.0 | \n", 145 | "United Kingdom | \n", 146 | "
4 | \n", 149 | "489434 | \n", 150 | "21232 | \n", 151 | "STRAWBERRY CERAMIC TRINKET BOX | \n", 152 | "24 | \n", 153 | "2009-12-01 07:45:00 | \n", 154 | "1.25 | \n", 155 | "13085.0 | \n", 156 | "United Kingdom | \n", 157 | "
\n", 213 | " | temperature__c3__lag_1 | \n", 214 | "temperature__c3__lag_2 | \n", 215 | "temperature__c3__lag_3 | \n", 216 | "temperature__abs_energy | \n", 217 | "light__sum_of_reoccurring_data_points | \n", 218 | "light__spkt_welch_density__coeff_8 | \n", 219 | "light__variance | \n", 220 | "light__agg_linear_trend__attr_\"slope\"__chunk_len_50__f_agg_\"var\" | \n", 221 | "light__agg_linear_trend__attr_\"intercept\"__chunk_len_10__f_agg_\"var\" | \n", 222 | "co2__spkt_welch_density__coeff_2 | \n", 223 | "co2__variance | \n", 224 | "co2__sum_of_reoccurring_data_points | \n", 225 | "
---|---|---|---|---|---|---|---|---|---|---|---|---|
1 | \n", 230 | "11585.127934 | \n", 231 | "11581.203590 | \n", 232 | "11578.178807 | \n", 233 | "30721.568703 | \n", 234 | "2514.0 | \n", 235 | "332.221295 | \n", 236 | "18086.371875 | \n", 237 | "-21130.3425 | \n", 238 | "19305.1375 | \n", 239 | "1523.529443 | \n", 240 | "756.700664 | \n", 241 | "14124.000000 | \n", 242 | "
2 | \n", 245 | "10751.999610 | \n", 246 | "10752.682508 | \n", 247 | "10753.119812 | \n", 248 | "29225.254374 | \n", 249 | "0.0 | \n", 250 | "0.000000 | \n", 251 | "0.000000 | \n", 252 | "0.0000 | \n", 253 | "0.0000 | \n", 254 | "350.067478 | \n", 255 | "377.280895 | \n", 256 | "13202.000000 | \n", 257 | "
3 | \n", 260 | "10187.865226 | \n", 261 | "10187.206963 | \n", 262 | "10186.284040 | \n", 263 | "28198.139950 | \n", 264 | "0.0 | \n", 265 | "0.000000 | \n", 266 | "0.000000 | \n", 267 | "0.0000 | \n", 268 | "0.0000 | \n", 269 | "91.896894 | \n", 270 | "115.269298 | \n", 271 | "20885.666667 | \n", 272 | "
4 | \n", 275 | "9908.900224 | \n", 276 | "9909.731388 | \n", 277 | "9910.163947 | \n", 278 | "27680.800184 | \n", 279 | "0.0 | \n", 280 | "0.000000 | \n", 281 | "0.000000 | \n", 282 | "0.0000 | \n", 283 | "0.0000 | \n", 284 | "42.394905 | \n", 285 | "35.473216 | \n", 286 | "18285.500000 | \n", 287 | "
5 | \n", 290 | "9705.989789 | \n", 291 | "9706.404551 | \n", 292 | "9706.707963 | \n", 293 | "27299.097469 | \n", 294 | "0.0 | \n", 295 | "0.000000 | \n", 296 | "0.000000 | \n", 297 | "0.0000 | \n", 298 | "0.0000 | \n", 299 | "4.811303 | \n", 300 | "27.539080 | \n", 301 | "17670.500000 | \n", 302 | "