├── README.md
├── 03-datastructures-code.ipynb
├── 01-intro-code.ipynb
├── 02-install-code.ipynb
├── 04-series-code.ipynb
├── 16-dataframe-code.ipynb
└── 33-exporting-code.ipynb


/README.md:
--------------------------------------------------------------------------------
1 | # effective_pandas_book
2 | Errata and code for the Effective Pandas book
3 | 
4 | If you are interested in this book, [consider purchasing a copy](https://store.metasnake.com/effective-pandas-book).
5 | 
6 | Physical version [available on Amazon](https://www.amazon.com/Effective-Pandas-Patterns-Manipulation-Treading/dp/B09MYXXSFM/ref=sr_1_1?keywords=effective+panda&qid=1639521930&sr=8-1).
7 | 


--------------------------------------------------------------------------------
/03-datastructures-code.ipynb:
--------------------------------------------------------------------------------
 1 | {
 2 |  "cells": [
 3 |   {
 4 |    "cell_type": "markdown",
 5 |    "metadata": {},
 6 |    "source": [
 7 |     "#. If you had a spreadsheet with data, which pandas data structure would you use?"
 8 |    ]
 9 |   },
10 |   {
11 |    "cell_type": "markdown",
12 |    "metadata": {
13 |     "lines_to_next_cell": 2
14 |    },
15 |    "source": [
16 |     "#. If you had a database with data, which pandas data structure would you use?"
17 |    ]
18 |   }
19 |  ],
20 |  "metadata": {
21 |   "jupytext": {
22 |    "cell_metadata_filter": "-all",
23 |    "main_language": "python",
24 |    "notebook_metadata_filter": "-all"
25 |   },
26 |   "kernelspec": {
27 |    "display_name": "Python 3",
28 |    "language": "python",
29 |    "name": "python3"
30 |   },
31 |   "language_info": {
32 |    "codemirror_mode": {
33 |     "name": "ipython",
34 |     "version": 3
35 |    },
36 |    "file_extension": ".py",
37 |    "mimetype": "text/x-python",
38 |    "name": "python",
39 |    "nbconvert_exporter": "python",
40 |    "pygments_lexer": "ipython3",
41 |    "version": "3.8.5"
42 |   }
43 |  },
44 |  "nbformat": 4,
45 |  "nbformat_minor": 4
46 | }
47 | 


--------------------------------------------------------------------------------
/01-intro-code.ipynb:
--------------------------------------------------------------------------------
 1 | {
 2 |  "cells": [
 3 |   {
 4 |    "cell_type": "code",
 5 |    "execution_count": null,
 6 |    "metadata": {},
 7 |    "outputs": [],
 8 |    "source": [
 9 |     "import seaborn as sns  # REMOVELINE\n",
10 |     "sns.set_context('paper')  # REMOVELINE\n",
11 |     "sns.set_style('white') # REMOVELINE"
12 |    ]
13 |   },
14 |   {
15 |    "cell_type": "code",
16 |    "execution_count": null,
17 |    "metadata": {},
18 |    "outputs": [],
19 |    "source": []
20 |   }
21 |  ],
22 |  "metadata": {
23 |   "jupytext": {
24 |    "cell_metadata_filter": "-all",
25 |    "main_language": "python",
26 |    "notebook_metadata_filter": "-all"
27 |   },
28 |   "kernelspec": {
29 |    "display_name": "Python 3",
30 |    "language": "python",
31 |    "name": "python3"
32 |   },
33 |   "language_info": {
34 |    "codemirror_mode": {
35 |     "name": "ipython",
36 |     "version": 3
37 |    },
38 |    "file_extension": ".py",
39 |    "mimetype": "text/x-python",
40 |    "name": "python",
41 |    "nbconvert_exporter": "python",
42 |    "pygments_lexer": "ipython3",
43 |    "version": "3.8.5"
44 |   }
45 |  },
46 |  "nbformat": 4,
47 |  "nbformat_minor": 4
48 | }
49 | 


--------------------------------------------------------------------------------
/02-install-code.ipynb:
--------------------------------------------------------------------------------
 1 | {
 2 |  "cells": [
 3 |   {
 4 |    "cell_type": "code",
 5 |    "execution_count": null,
 6 |    "metadata": {
 7 |     "lines_to_next_cell": 2
 8 |    },
 9 |    "outputs": [],
10 |    "source": [
11 |     "import pandas\n",
12 |     "pandas.__version__"
13 |    ]
14 |   },
15 |   {
16 |    "cell_type": "code",
17 |    "execution_count": null,
18 |    "metadata": {
19 |     "lines_to_next_cell": 2
20 |    },
21 |    "outputs": [],
22 |    "source": [
23 |     "import pandas\n",
24 |     "pandas.__version__"
25 |    ]
26 |   },
27 |   {
28 |    "cell_type": "code",
29 |    "execution_count": null,
30 |    "metadata": {
31 |     "lines_to_next_cell": 2
32 |    },
33 |    "outputs": [],
34 |    "source": [
35 |     "import pandas\n",
36 |     "pandas.__version__"
37 |    ]
38 |   },
39 |   {
40 |    "cell_type": "markdown",
41 |    "metadata": {},
42 |    "source": [
43 |     "#. Install pandas on your machine (using Anaconda or pip)."
44 |    ]
45 |   },
46 |   {
47 |    "cell_type": "markdown",
48 |    "metadata": {},
49 |    "source": [
50 |     "#. Install Jupyter on your machine."
51 |    ]
52 |   },
53 |   {
54 |    "cell_type": "markdown",
55 |    "metadata": {
56 |     "lines_to_next_cell": 2
57 |    },
58 |    "source": [
59 |     "#. Launch Jupyter and run the following in a cell:"
60 |    ]
61 |   }
62 |  ],
63 |  "metadata": {
64 |   "jupytext": {
65 |    "cell_metadata_filter": "-all",
66 |    "main_language": "python",
67 |    "notebook_metadata_filter": "-all"
68 |   },
69 |   "kernelspec": {
70 |    "display_name": "Python 3",
71 |    "language": "python",
72 |    "name": "python3"
73 |   },
74 |   "language_info": {
75 |    "codemirror_mode": {
76 |     "name": "ipython",
77 |     "version": 3
78 |    },
79 |    "file_extension": ".py",
80 |    "mimetype": "text/x-python",
81 |    "name": "python",
82 |    "nbconvert_exporter": "python",
83 |    "pygments_lexer": "ipython3",
84 |    "version": "3.8.5"
85 |   }
86 |  },
87 |  "nbformat": 4,
88 |  "nbformat_minor": 4
89 | }
90 | 


--------------------------------------------------------------------------------
/04-series-code.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |  "cells": [
  3 |   {
  4 |    "cell_type": "code",
  5 |    "execution_count": 1,
  6 |    "metadata": {},
  7 |    "outputs": [],
  8 |    "source": [
  9 |     "series = {\n",
 10 |     "  'index':[0, 1, 2, 3],\n",
 11 |     "  'data':[145, 142, 38, 13],\n",
 12 |     "  'name':'songs'\n",
 13 |     "  }"
 14 |    ]
 15 |   },
 16 |   {
 17 |    "cell_type": "code",
 18 |    "execution_count": 2,
 19 |    "metadata": {},
 20 |    "outputs": [],
 21 |    "source": [
 22 |     "def get(series, idx):\n",
 23 |     "    value_idx = series['index'].index(idx)\n",
 24 |     "    return series['data'][value_idx]"
 25 |    ]
 26 |   },
 27 |   {
 28 |    "cell_type": "code",
 29 |    "execution_count": 3,
 30 |    "metadata": {
 31 |     "lines_to_next_cell": 2
 32 |    },
 33 |    "outputs": [
 34 |     {
 35 |      "data": {
 36 |       "text/plain": [
 37 |        "142"
 38 |       ]
 39 |      },
 40 |      "execution_count": 3,
 41 |      "metadata": {},
 42 |      "output_type": "execute_result"
 43 |     }
 44 |    ],
 45 |    "source": [
 46 |     "get(series, 1)"
 47 |    ]
 48 |   },
 49 |   {
 50 |    "cell_type": "code",
 51 |    "execution_count": 4,
 52 |    "metadata": {
 53 |     "lines_to_next_cell": 2
 54 |    },
 55 |    "outputs": [],
 56 |    "source": [
 57 |     "songs = {\n",
 58 |     "  'index':['Paul', 'John', 'George', 'Ringo'],\n",
 59 |     "  'data':[145, 142, 38, 13],\n",
 60 |     "  'name':'counts'\n",
 61 |     "  }"
 62 |    ]
 63 |   },
 64 |   {
 65 |    "cell_type": "code",
 66 |    "execution_count": 5,
 67 |    "metadata": {
 68 |     "lines_to_next_cell": 2
 69 |    },
 70 |    "outputs": [
 71 |     {
 72 |      "data": {
 73 |       "text/plain": [
 74 |        "142"
 75 |       ]
 76 |      },
 77 |      "execution_count": 5,
 78 |      "metadata": {},
 79 |      "output_type": "execute_result"
 80 |     }
 81 |    ],
 82 |    "source": [
 83 |     "get(songs, 'John')"
 84 |    ]
 85 |   },
 86 |   {
 87 |    "cell_type": "code",
 88 |    "execution_count": 6,
 89 |    "metadata": {
 90 |     "lines_to_next_cell": 2
 91 |    },
 92 |    "outputs": [],
 93 |    "source": [
 94 |     "import pandas as pd\n",
 95 |     "songs2 = pd.Series([145, 142, 38, 13],\n",
 96 |     "     name='counts')"
 97 |    ]
 98 |   },
 99 |   {
100 |    "cell_type": "code",
101 |    "execution_count": 7,
102 |    "metadata": {
103 |     "lines_to_next_cell": 2
104 |    },
105 |    "outputs": [
106 |     {
107 |      "data": {
108 |       "text/plain": [
109 |        "0    145\n",
110 |        "1    142\n",
111 |        "2     38\n",
112 |        "3     13\n",
113 |        "Name: counts, dtype: int64"
114 |       ]
115 |      },
116 |      "execution_count": 7,
117 |      "metadata": {},
118 |      "output_type": "execute_result"
119 |     }
120 |    ],
121 |    "source": [
122 |     "songs2"
123 |    ]
124 |   },
125 |   {
126 |    "cell_type": "code",
127 |    "execution_count": 8,
128 |    "metadata": {
129 |     "lines_to_next_cell": 2
130 |    },
131 |    "outputs": [
132 |     {
133 |      "data": {
134 |       "text/plain": [
135 |        "RangeIndex(start=0, stop=4, step=1)"
136 |       ]
137 |      },
138 |      "execution_count": 8,
139 |      "metadata": {},
140 |      "output_type": "execute_result"
141 |     }
142 |    ],
143 |    "source": [
144 |     "songs2.index"
145 |    ]
146 |   },
147 |   {
148 |    "cell_type": "code",
149 |    "execution_count": 9,
150 |    "metadata": {
151 |     "lines_to_next_cell": 2
152 |    },
153 |    "outputs": [],
154 |    "source": [
155 |     "songs3 = pd.Series([145, 142, 38, 13],\n",
156 |     "     name='counts',\n",
157 |     "     index=['Paul', 'John', 'George', 'Ringo'])"
158 |    ]
159 |   },
160 |   {
161 |    "cell_type": "code",
162 |    "execution_count": 10,
163 |    "metadata": {
164 |     "lines_to_next_cell": 2
165 |    },
166 |    "outputs": [
167 |     {
168 |      "data": {
169 |       "text/plain": [
170 |        "Paul      145\n",
171 |        "John      142\n",
172 |        "George     38\n",
173 |        "Ringo      13\n",
174 |        "Name: counts, dtype: int64"
175 |       ]
176 |      },
177 |      "execution_count": 10,
178 |      "metadata": {},
179 |      "output_type": "execute_result"
180 |     }
181 |    ],
182 |    "source": [
183 |     "songs3"
184 |    ]
185 |   },
186 |   {
187 |    "cell_type": "code",
188 |    "execution_count": 11,
189 |    "metadata": {},
190 |    "outputs": [
191 |     {
192 |      "data": {
193 |       "text/plain": [
194 |        "Index(['Paul', 'John', 'George', 'Ringo'], dtype='object')"
195 |       ]
196 |      },
197 |      "execution_count": 11,
198 |      "metadata": {},
199 |      "output_type": "execute_result"
200 |     }
201 |    ],
202 |    "source": [
203 |     "songs3.index   # doctest: +NORMALIZE_WHITESPACE"
204 |    ]
205 |   },
206 |   {
207 |    "cell_type": "code",
208 |    "execution_count": 12,
209 |    "metadata": {},
210 |    "outputs": [],
211 |    "source": [
212 |     "class Foo:\n",
213 |     "    pass"
214 |    ]
215 |   },
216 |   {
217 |    "cell_type": "code",
218 |    "execution_count": 13,
219 |    "metadata": {
220 |     "lines_to_next_cell": 2
221 |    },
222 |    "outputs": [],
223 |    "source": [
224 |     "ringo = pd.Series(\n",
225 |     "     ['Richard', 'Starkey', 13, Foo()],\n",
226 |     "     name='ringo')"
227 |    ]
228 |   },
229 |   {
230 |    "cell_type": "code",
231 |    "execution_count": 14,
232 |    "metadata": {
233 |     "lines_to_next_cell": 2
234 |    },
235 |    "outputs": [
236 |     {
237 |      "data": {
238 |       "text/plain": [
239 |        "0                                    Richard\n",
240 |        "1                                    Starkey\n",
241 |        "2                                         13\n",
242 |        "3    <__main__.Foo object at 0x7f125dd9b190>\n",
243 |        "Name: ringo, dtype: object"
244 |       ]
245 |      },
246 |      "execution_count": 14,
247 |      "metadata": {},
248 |      "output_type": "execute_result"
249 |     }
250 |    ],
251 |    "source": [
252 |     "ringo  # doctest: +SKIP +NORMALIZE_WHITESPACE"
253 |    ]
254 |   },
255 |   {
256 |    "cell_type": "code",
257 |    "execution_count": 15,
258 |    "metadata": {
259 |     "lines_to_next_cell": 2
260 |    },
261 |    "outputs": [
262 |     {
263 |      "data": {
264 |       "text/plain": [
265 |        "Ono        2.0\n",
266 |        "Clapton    NaN\n",
267 |        "dtype: float64"
268 |       ]
269 |      },
270 |      "execution_count": 15,
271 |      "metadata": {},
272 |      "output_type": "execute_result"
273 |     }
274 |    ],
275 |    "source": [
276 |     "import numpy as np\n",
277 |     "nan_series = pd.Series([2, np.nan],\n",
278 |     "   index=['Ono', 'Clapton'])\n",
279 |     "nan_series"
280 |    ]
281 |   },
282 |   {
283 |    "cell_type": "code",
284 |    "execution_count": 16,
285 |    "metadata": {
286 |     "lines_to_next_cell": 2
287 |    },
288 |    "outputs": [
289 |     {
290 |      "data": {
291 |       "text/plain": [
292 |        "1"
293 |       ]
294 |      },
295 |      "execution_count": 16,
296 |      "metadata": {},
297 |      "output_type": "execute_result"
298 |     }
299 |    ],
300 |    "source": [
301 |     "nan_series.count()"
302 |    ]
303 |   },
304 |   {
305 |    "cell_type": "code",
306 |    "execution_count": 17,
307 |    "metadata": {
308 |     "lines_to_next_cell": 2
309 |    },
310 |    "outputs": [
311 |     {
312 |      "data": {
313 |       "text/plain": [
314 |        "2"
315 |       ]
316 |      },
317 |      "execution_count": 17,
318 |      "metadata": {},
319 |      "output_type": "execute_result"
320 |     }
321 |    ],
322 |    "source": [
323 |     "nan_series.size"
324 |    ]
325 |   },
326 |   {
327 |    "cell_type": "code",
328 |    "execution_count": 18,
329 |    "metadata": {
330 |     "lines_to_next_cell": 2
331 |    },
332 |    "outputs": [
333 |     {
334 |      "data": {
335 |       "text/plain": [
336 |        "Ono           2\n",
337 |        "Clapton    <NA>\n",
338 |        "dtype: Int64"
339 |       ]
340 |      },
341 |      "execution_count": 18,
342 |      "metadata": {},
343 |      "output_type": "execute_result"
344 |     }
345 |    ],
346 |    "source": [
347 |     "nan_series2 = pd.Series([2, None],\n",
348 |     "   index=['Ono', 'Clapton'],\n",
349 |     "   dtype='Int64')\n",
350 |     "nan_series2"
351 |    ]
352 |   },
353 |   {
354 |    "cell_type": "code",
355 |    "execution_count": 19,
356 |    "metadata": {
357 |     "lines_to_next_cell": 2
358 |    },
359 |    "outputs": [
360 |     {
361 |      "data": {
362 |       "text/plain": [
363 |        "1"
364 |       ]
365 |      },
366 |      "execution_count": 19,
367 |      "metadata": {},
368 |      "output_type": "execute_result"
369 |     }
370 |    ],
371 |    "source": [
372 |     "nan_series2.count()"
373 |    ]
374 |   },
375 |   {
376 |    "cell_type": "code",
377 |    "execution_count": 20,
378 |    "metadata": {
379 |     "lines_to_next_cell": 2
380 |    },
381 |    "outputs": [
382 |     {
383 |      "data": {
384 |       "text/plain": [
385 |        "Ono           2\n",
386 |        "Clapton    <NA>\n",
387 |        "dtype: Int64"
388 |       ]
389 |      },
390 |      "execution_count": 20,
391 |      "metadata": {},
392 |      "output_type": "execute_result"
393 |     }
394 |    ],
395 |    "source": [
396 |     "nan_series.astype('Int64')"
397 |    ]
398 |   },
399 |   {
400 |    "cell_type": "code",
401 |    "execution_count": 21,
402 |    "metadata": {
403 |     "lines_to_next_cell": 2
404 |    },
405 |    "outputs": [
406 |     {
407 |      "data": {
408 |       "text/plain": [
409 |        "142"
410 |       ]
411 |      },
412 |      "execution_count": 21,
413 |      "metadata": {},
414 |      "output_type": "execute_result"
415 |     }
416 |    ],
417 |    "source": [
418 |     "import numpy as np\n",
419 |     "numpy_ser = np.array([145, 142, 38, 13])\n",
420 |     "songs3[1]"
421 |    ]
422 |   },
423 |   {
424 |    "cell_type": "code",
425 |    "execution_count": 22,
426 |    "metadata": {
427 |     "lines_to_next_cell": 2
428 |    },
429 |    "outputs": [
430 |     {
431 |      "data": {
432 |       "text/plain": [
433 |        "142"
434 |       ]
435 |      },
436 |      "execution_count": 22,
437 |      "metadata": {},
438 |      "output_type": "execute_result"
439 |     }
440 |    ],
441 |    "source": [
442 |     "numpy_ser[1]"
443 |    ]
444 |   },
445 |   {
446 |    "cell_type": "code",
447 |    "execution_count": 23,
448 |    "metadata": {
449 |     "lines_to_next_cell": 2
450 |    },
451 |    "outputs": [
452 |     {
453 |      "data": {
454 |       "text/plain": [
455 |        "84.5"
456 |       ]
457 |      },
458 |      "execution_count": 23,
459 |      "metadata": {},
460 |      "output_type": "execute_result"
461 |     }
462 |    ],
463 |    "source": [
464 |     "songs3.mean()"
465 |    ]
466 |   },
467 |   {
468 |    "cell_type": "code",
469 |    "execution_count": 24,
470 |    "metadata": {
471 |     "lines_to_next_cell": 2
472 |    },
473 |    "outputs": [
474 |     {
475 |      "data": {
476 |       "text/plain": [
477 |        "84.5"
478 |       ]
479 |      },
480 |      "execution_count": 24,
481 |      "metadata": {},
482 |      "output_type": "execute_result"
483 |     }
484 |    ],
485 |    "source": [
486 |     "numpy_ser.mean()"
487 |    ]
488 |   },
489 |   {
490 |    "cell_type": "code",
491 |    "execution_count": 25,
492 |    "metadata": {
493 |     "lines_to_next_cell": 2
494 |    },
495 |    "outputs": [],
496 |    "source": [
497 |     "mask = songs3 > songs3.median()  # boolean array"
498 |    ]
499 |   },
500 |   {
501 |    "cell_type": "code",
502 |    "execution_count": 26,
503 |    "metadata": {
504 |     "lines_to_next_cell": 2
505 |    },
506 |    "outputs": [
507 |     {
508 |      "data": {
509 |       "text/plain": [
510 |        "Paul       True\n",
511 |        "John       True\n",
512 |        "George    False\n",
513 |        "Ringo     False\n",
514 |        "Name: counts, dtype: bool"
515 |       ]
516 |      },
517 |      "execution_count": 26,
518 |      "metadata": {},
519 |      "output_type": "execute_result"
520 |     }
521 |    ],
522 |    "source": [
523 |     "mask"
524 |    ]
525 |   },
526 |   {
527 |    "cell_type": "code",
528 |    "execution_count": 27,
529 |    "metadata": {
530 |     "lines_to_next_cell": 2
531 |    },
532 |    "outputs": [
533 |     {
534 |      "data": {
535 |       "text/plain": [
536 |        "Paul    145\n",
537 |        "John    142\n",
538 |        "Name: counts, dtype: int64"
539 |       ]
540 |      },
541 |      "execution_count": 27,
542 |      "metadata": {},
543 |      "output_type": "execute_result"
544 |     }
545 |    ],
546 |    "source": [
547 |     "songs3[mask]"
548 |    ]
549 |   },
550 |   {
551 |    "cell_type": "code",
552 |    "execution_count": 28,
553 |    "metadata": {
554 |     "lines_to_next_cell": 2
555 |    },
556 |    "outputs": [
557 |     {
558 |      "data": {
559 |       "text/plain": [
560 |        "array([145, 142])"
561 |       ]
562 |      },
563 |      "execution_count": 28,
564 |      "metadata": {},
565 |      "output_type": "execute_result"
566 |     }
567 |    ],
568 |    "source": [
569 |     "numpy_ser[numpy_ser > np.median(numpy_ser)]"
570 |    ]
571 |   },
572 |   {
573 |    "cell_type": "code",
574 |    "execution_count": 29,
575 |    "metadata": {
576 |     "lines_to_next_cell": 2
577 |    },
578 |    "outputs": [],
579 |    "source": [
580 |     "import pandas as pd\n",
581 |     "import numpy as np"
582 |    ]
583 |   },
584 |   {
585 |    "cell_type": "code",
586 |    "execution_count": 30,
587 |    "metadata": {
588 |     "lines_to_next_cell": 2
589 |    },
590 |    "outputs": [],
591 |    "source": [
592 |     "from pandas import *"
593 |    ]
594 |   },
595 |   {
596 |    "cell_type": "code",
597 |    "execution_count": 31,
598 |    "metadata": {
599 |     "lines_to_next_cell": 2
600 |    },
601 |    "outputs": [
602 |     {
603 |      "data": {
604 |       "text/plain": [
605 |        "0     m\n",
606 |        "1     l\n",
607 |        "2    xs\n",
608 |        "3     s\n",
609 |        "4    xl\n",
610 |        "dtype: category\n",
611 |        "Categories (5, object): ['l', 'm', 's', 'xl', 'xs']"
612 |       ]
613 |      },
614 |      "execution_count": 31,
615 |      "metadata": {},
616 |      "output_type": "execute_result"
617 |     }
618 |    ],
619 |    "source": [
620 |     "s = pd.Series(['m', 'l', 'xs', 's', 'xl'], dtype='category')\n",
621 |     "s"
622 |    ]
623 |   },
624 |   {
625 |    "cell_type": "code",
626 |    "execution_count": 32,
627 |    "metadata": {
628 |     "lines_to_next_cell": 2
629 |    },
630 |    "outputs": [
631 |     {
632 |      "data": {
633 |       "text/plain": [
634 |        "False"
635 |       ]
636 |      },
637 |      "execution_count": 32,
638 |      "metadata": {},
639 |      "output_type": "execute_result"
640 |     }
641 |    ],
642 |    "source": [
643 |     "s.cat.ordered"
644 |    ]
645 |   },
646 |   {
647 |    "cell_type": "code",
648 |    "execution_count": 33,
649 |    "metadata": {
650 |     "lines_to_next_cell": 2
651 |    },
652 |    "outputs": [],
653 |    "source": [
654 |     "s2 = pd.Series(['m', 'l', 'xs', 's', 'xl'])\n",
655 |     "size_type = pd.api.types.CategoricalDtype(\n",
656 |     "    categories=['s','m','l'], ordered=True)\n",
657 |     "s3 = s2.astype(size_type)"
658 |    ]
659 |   },
660 |   {
661 |    "cell_type": "code",
662 |    "execution_count": 34,
663 |    "metadata": {
664 |     "lines_to_next_cell": 2
665 |    },
666 |    "outputs": [
667 |     {
668 |      "data": {
669 |       "text/plain": [
670 |        "0      m\n",
671 |        "1      l\n",
672 |        "2    NaN\n",
673 |        "3      s\n",
674 |        "4    NaN\n",
675 |        "dtype: category\n",
676 |        "Categories (3, object): ['s' < 'm' < 'l']"
677 |       ]
678 |      },
679 |      "execution_count": 34,
680 |      "metadata": {},
681 |      "output_type": "execute_result"
682 |     }
683 |    ],
684 |    "source": [
685 |     "s3"
686 |    ]
687 |   },
688 |   {
689 |    "cell_type": "code",
690 |    "execution_count": 35,
691 |    "metadata": {
692 |     "lines_to_next_cell": 2
693 |    },
694 |    "outputs": [
695 |     {
696 |      "data": {
697 |       "text/plain": [
698 |        "0     True\n",
699 |        "1     True\n",
700 |        "2    False\n",
701 |        "3    False\n",
702 |        "4    False\n",
703 |        "dtype: bool"
704 |       ]
705 |      },
706 |      "execution_count": 35,
707 |      "metadata": {},
708 |      "output_type": "execute_result"
709 |     }
710 |    ],
711 |    "source": [
712 |     "s3 > 's'"
713 |    ]
714 |   },
715 |   {
716 |    "cell_type": "code",
717 |    "execution_count": 36,
718 |    "metadata": {
719 |     "lines_to_next_cell": 2
720 |    },
721 |    "outputs": [
722 |     {
723 |      "data": {
724 |       "text/plain": [
725 |        "0     m\n",
726 |        "1     l\n",
727 |        "2    xs\n",
728 |        "3     s\n",
729 |        "4    xl\n",
730 |        "dtype: category\n",
731 |        "Categories (5, object): ['xs' < 's' < 'm' < 'l' < 'xl']"
732 |       ]
733 |      },
734 |      "execution_count": 36,
735 |      "metadata": {},
736 |      "output_type": "execute_result"
737 |     }
738 |    ],
739 |    "source": [
740 |     "s.cat.reorder_categories(['xs','s','m','l', 'xl'],\n",
741 |     "                         ordered=True)"
742 |    ]
743 |   },
744 |   {
745 |    "cell_type": "code",
746 |    "execution_count": 37,
747 |    "metadata": {
748 |     "lines_to_next_cell": 2,
749 |     "scrolled": true
750 |    },
751 |    "outputs": [
752 |     {
753 |      "data": {
754 |       "text/plain": [
755 |        "0      M\n",
756 |        "1      L\n",
757 |        "2    NaN\n",
758 |        "3      S\n",
759 |        "4    NaN\n",
760 |        "dtype: object"
761 |       ]
762 |      },
763 |      "execution_count": 37,
764 |      "metadata": {},
765 |      "output_type": "execute_result"
766 |     }
767 |    ],
768 |    "source": [
769 |     "s3.str.upper()"
770 |    ]
771 |   }
772 |  ],
773 |  "metadata": {
774 |   "jupytext": {
775 |    "cell_metadata_filter": "-all",
776 |    "main_language": "python",
777 |    "notebook_metadata_filter": "-all"
778 |   },
779 |   "kernelspec": {
780 |    "display_name": "Python 3",
781 |    "language": "python",
782 |    "name": "python3"
783 |   },
784 |   "language_info": {
785 |    "codemirror_mode": {
786 |     "name": "ipython",
787 |     "version": 3
788 |    },
789 |    "file_extension": ".py",
790 |    "mimetype": "text/x-python",
791 |    "name": "python",
792 |    "nbconvert_exporter": "python",
793 |    "pygments_lexer": "ipython3",
794 |    "version": "3.8.5"
795 |   }
796 |  },
797 |  "nbformat": 4,
798 |  "nbformat_minor": 4
799 | }
800 | 


--------------------------------------------------------------------------------
/16-dataframe-code.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |  "cells": [
  3 |   {
  4 |    "cell_type": "code",
  5 |    "execution_count": 1,
  6 |    "metadata": {},
  7 |    "outputs": [],
  8 |    "source": [
  9 |     "df = {\n",
 10 |     "  'index':[0,1,2],\n",
 11 |     "  'cols': [\n",
 12 |     "    { 'name':'growth',\n",
 13 |     "      'data':[.5, .7, 1.2] },\n",
 14 |     "    { 'name':'Name',\n",
 15 |     "      'data':['Paul', 'George', 'Ringo'] },\n",
 16 |     "  ]\n",
 17 |     "}"
 18 |    ]
 19 |   },
 20 |   {
 21 |    "cell_type": "code",
 22 |    "execution_count": 2,
 23 |    "metadata": {},
 24 |    "outputs": [],
 25 |    "source": [
 26 |     "def get_row(df, idx):\n",
 27 |     "    results = []\n",
 28 |     "    value_idx = df['index'].index(idx)\n",
 29 |     "    for col in df['cols']:\n",
 30 |     "        results.append(col['data'][value_idx])\n",
 31 |     "    return results"
 32 |    ]
 33 |   },
 34 |   {
 35 |    "cell_type": "code",
 36 |    "execution_count": 3,
 37 |    "metadata": {},
 38 |    "outputs": [
 39 |     {
 40 |      "data": {
 41 |       "text/plain": [
 42 |        "[0.7, 'George']"
 43 |       ]
 44 |      },
 45 |      "execution_count": 3,
 46 |      "metadata": {},
 47 |      "output_type": "execute_result"
 48 |     }
 49 |    ],
 50 |    "source": [
 51 |     "get_row(df, 1)"
 52 |    ]
 53 |   },
 54 |   {
 55 |    "cell_type": "code",
 56 |    "execution_count": 4,
 57 |    "metadata": {},
 58 |    "outputs": [],
 59 |    "source": [
 60 |     "def get_col(df, name):\n",
 61 |     "    for col in df['cols']:\n",
 62 |     "        if col['name'] == name:\n",
 63 |     "            return col['data']"
 64 |    ]
 65 |   },
 66 |   {
 67 |    "cell_type": "code",
 68 |    "execution_count": 5,
 69 |    "metadata": {
 70 |     "lines_to_next_cell": 2
 71 |    },
 72 |    "outputs": [
 73 |     {
 74 |      "data": {
 75 |       "text/plain": [
 76 |        "['Paul', 'George', 'Ringo']"
 77 |       ]
 78 |      },
 79 |      "execution_count": 5,
 80 |      "metadata": {},
 81 |      "output_type": "execute_result"
 82 |     }
 83 |    ],
 84 |    "source": [
 85 |     "get_col(df, 'Name')"
 86 |    ]
 87 |   },
 88 |   {
 89 |    "cell_type": "code",
 90 |    "execution_count": 6,
 91 |    "metadata": {
 92 |     "lines_to_next_cell": 2
 93 |    },
 94 |    "outputs": [],
 95 |    "source": [
 96 |     "import pandas as pd\n",
 97 |     "df = pd.DataFrame({\n",
 98 |     "  'growth':[.5, .7, 1.2],\n",
 99 |     "  'Name':['Paul', 'George', 'Ringo'] })"
100 |    ]
101 |   },
102 |   {
103 |    "cell_type": "code",
104 |    "execution_count": 7,
105 |    "metadata": {
106 |     "lines_to_next_cell": 2
107 |    },
108 |    "outputs": [
109 |     {
110 |      "data": {
111 |       "text/html": [
112 |        "<div>\n",
113 |        "<style scoped>\n",
114 |        "    .dataframe tbody tr th:only-of-type {\n",
115 |        "        vertical-align: middle;\n",
116 |        "    }\n",
117 |        "\n",
118 |        "    .dataframe tbody tr th {\n",
119 |        "        vertical-align: top;\n",
120 |        "    }\n",
121 |        "\n",
122 |        "    .dataframe thead th {\n",
123 |        "        text-align: right;\n",
124 |        "    }\n",
125 |        "</style>\n",
126 |        "<table border=\"1\" class=\"dataframe\">\n",
127 |        "  <thead>\n",
128 |        "    <tr style=\"text-align: right;\">\n",
129 |        "      <th></th>\n",
130 |        "      <th>growth</th>\n",
131 |        "      <th>Name</th>\n",
132 |        "    </tr>\n",
133 |        "  </thead>\n",
134 |        "  <tbody>\n",
135 |        "    <tr>\n",
136 |        "      <th>0</th>\n",
137 |        "      <td>0.5</td>\n",
138 |        "      <td>Paul</td>\n",
139 |        "    </tr>\n",
140 |        "    <tr>\n",
141 |        "      <th>1</th>\n",
142 |        "      <td>0.7</td>\n",
143 |        "      <td>George</td>\n",
144 |        "    </tr>\n",
145 |        "    <tr>\n",
146 |        "      <th>2</th>\n",
147 |        "      <td>1.2</td>\n",
148 |        "      <td>Ringo</td>\n",
149 |        "    </tr>\n",
150 |        "  </tbody>\n",
151 |        "</table>\n",
152 |        "</div>"
153 |       ],
154 |       "text/plain": [
155 |        "   growth    Name\n",
156 |        "0     0.5    Paul\n",
157 |        "1     0.7  George\n",
158 |        "2     1.2   Ringo"
159 |       ]
160 |      },
161 |      "execution_count": 7,
162 |      "metadata": {},
163 |      "output_type": "execute_result"
164 |     }
165 |    ],
166 |    "source": [
167 |     "df"
168 |    ]
169 |   },
170 |   {
171 |    "cell_type": "code",
172 |    "execution_count": 8,
173 |    "metadata": {
174 |     "lines_to_next_cell": 2
175 |    },
176 |    "outputs": [
177 |     {
178 |      "data": {
179 |       "text/plain": [
180 |        "growth      1.2\n",
181 |        "Name      Ringo\n",
182 |        "Name: 2, dtype: object"
183 |       ]
184 |      },
185 |      "execution_count": 8,
186 |      "metadata": {},
187 |      "output_type": "execute_result"
188 |     }
189 |    ],
190 |    "source": [
191 |     "df.iloc[2]"
192 |    ]
193 |   },
194 |   {
195 |    "cell_type": "code",
196 |    "execution_count": 9,
197 |    "metadata": {
198 |     "lines_to_next_cell": 2
199 |    },
200 |    "outputs": [
201 |     {
202 |      "data": {
203 |       "text/plain": [
204 |        "0      Paul\n",
205 |        "1    George\n",
206 |        "2     Ringo\n",
207 |        "Name: Name, dtype: object"
208 |       ]
209 |      },
210 |      "execution_count": 9,
211 |      "metadata": {},
212 |      "output_type": "execute_result"
213 |     }
214 |    ],
215 |    "source": [
216 |     "df['Name']"
217 |    ]
218 |   },
219 |   {
220 |    "cell_type": "code",
221 |    "execution_count": 10,
222 |    "metadata": {
223 |     "lines_to_next_cell": 2
224 |    },
225 |    "outputs": [
226 |     {
227 |      "data": {
228 |       "text/plain": [
229 |        "pandas.core.series.Series"
230 |       ]
231 |      },
232 |      "execution_count": 10,
233 |      "metadata": {},
234 |      "output_type": "execute_result"
235 |     }
236 |    ],
237 |    "source": [
238 |     "type(df['Name'])"
239 |    ]
240 |   },
241 |   {
242 |    "cell_type": "code",
243 |    "execution_count": 11,
244 |    "metadata": {
245 |     "lines_to_next_cell": 2
246 |    },
247 |    "outputs": [
248 |     {
249 |      "data": {
250 |       "text/plain": [
251 |        "0      paul\n",
252 |        "1    george\n",
253 |        "2     ringo\n",
254 |        "Name: Name, dtype: object"
255 |       ]
256 |      },
257 |      "execution_count": 11,
258 |      "metadata": {},
259 |      "output_type": "execute_result"
260 |     }
261 |    ],
262 |    "source": [
263 |     "df['Name'].str.lower()"
264 |    ]
265 |   },
266 |   {
267 |    "cell_type": "code",
268 |    "execution_count": 12,
269 |    "metadata": {
270 |     "lines_to_next_cell": 2
271 |    },
272 |    "outputs": [
273 |     {
274 |      "data": {
275 |       "text/plain": [
276 |        "0      Paul\n",
277 |        "1    George\n",
278 |        "2     Ringo\n",
279 |        "Name: Name, dtype: object"
280 |       ]
281 |      },
282 |      "execution_count": 12,
283 |      "metadata": {},
284 |      "output_type": "execute_result"
285 |     }
286 |    ],
287 |    "source": [
288 |     "df.Name"
289 |    ]
290 |   },
291 |   {
292 |    "cell_type": "code",
293 |    "execution_count": 13,
294 |    "metadata": {
295 |     "lines_to_next_cell": 2
296 |    },
297 |    "outputs": [
298 |     {
299 |      "data": {
300 |       "text/html": [
301 |        "<div>\n",
302 |        "<style scoped>\n",
303 |        "    .dataframe tbody tr th:only-of-type {\n",
304 |        "        vertical-align: middle;\n",
305 |        "    }\n",
306 |        "\n",
307 |        "    .dataframe tbody tr th {\n",
308 |        "        vertical-align: top;\n",
309 |        "    }\n",
310 |        "\n",
311 |        "    .dataframe thead th {\n",
312 |        "        text-align: right;\n",
313 |        "    }\n",
314 |        "</style>\n",
315 |        "<table border=\"1\" class=\"dataframe\">\n",
316 |        "  <thead>\n",
317 |        "    <tr style=\"text-align: right;\">\n",
318 |        "      <th></th>\n",
319 |        "      <th>growth</th>\n",
320 |        "      <th>Name</th>\n",
321 |        "    </tr>\n",
322 |        "  </thead>\n",
323 |        "  <tbody>\n",
324 |        "    <tr>\n",
325 |        "      <th>0</th>\n",
326 |        "      <td>0.5</td>\n",
327 |        "      <td>Paul</td>\n",
328 |        "    </tr>\n",
329 |        "    <tr>\n",
330 |        "      <th>1</th>\n",
331 |        "      <td>0.7</td>\n",
332 |        "      <td>George</td>\n",
333 |        "    </tr>\n",
334 |        "    <tr>\n",
335 |        "      <th>2</th>\n",
336 |        "      <td>1.2</td>\n",
337 |        "      <td>Ringo</td>\n",
338 |        "    </tr>\n",
339 |        "  </tbody>\n",
340 |        "</table>\n",
341 |        "</div>"
342 |       ],
343 |       "text/plain": [
344 |        "   growth    Name\n",
345 |        "0     0.5    Paul\n",
346 |        "1     0.7  George\n",
347 |        "2     1.2   Ringo"
348 |       ]
349 |      },
350 |      "execution_count": 13,
351 |      "metadata": {},
352 |      "output_type": "execute_result"
353 |     }
354 |    ],
355 |    "source": [
356 |     "pd.DataFrame([\n",
357 |     "  {'growth':.5, 'Name':'Paul'},\n",
358 |     "  {'growth':.7, 'Name':'George'},\n",
359 |     "  {'growth':1.2, 'Name':'Ringo'}])"
360 |    ]
361 |   },
362 |   {
363 |    "cell_type": "code",
364 |    "execution_count": 14,
365 |    "metadata": {
366 |     "lines_to_next_cell": 2
367 |    },
368 |    "outputs": [],
369 |    "source": [
370 |     "from io import StringIO\n",
371 |     "csv_file = StringIO(\"\"\"growth,Name\n",
372 |     ".5,Paul\n",
373 |     ".7,George\n",
374 |     "1.2,Ringo\"\"\")"
375 |    ]
376 |   },
377 |   {
378 |    "cell_type": "code",
379 |    "execution_count": 15,
380 |    "metadata": {
381 |     "lines_to_next_cell": 2
382 |    },
383 |    "outputs": [
384 |     {
385 |      "data": {
386 |       "text/html": [
387 |        "<div>\n",
388 |        "<style scoped>\n",
389 |        "    .dataframe tbody tr th:only-of-type {\n",
390 |        "        vertical-align: middle;\n",
391 |        "    }\n",
392 |        "\n",
393 |        "    .dataframe tbody tr th {\n",
394 |        "        vertical-align: top;\n",
395 |        "    }\n",
396 |        "\n",
397 |        "    .dataframe thead th {\n",
398 |        "        text-align: right;\n",
399 |        "    }\n",
400 |        "</style>\n",
401 |        "<table border=\"1\" class=\"dataframe\">\n",
402 |        "  <thead>\n",
403 |        "    <tr style=\"text-align: right;\">\n",
404 |        "      <th></th>\n",
405 |        "      <th>growth</th>\n",
406 |        "      <th>Name</th>\n",
407 |        "    </tr>\n",
408 |        "  </thead>\n",
409 |        "  <tbody>\n",
410 |        "    <tr>\n",
411 |        "      <th>0</th>\n",
412 |        "      <td>0.5</td>\n",
413 |        "      <td>Paul</td>\n",
414 |        "    </tr>\n",
415 |        "    <tr>\n",
416 |        "      <th>1</th>\n",
417 |        "      <td>0.7</td>\n",
418 |        "      <td>George</td>\n",
419 |        "    </tr>\n",
420 |        "    <tr>\n",
421 |        "      <th>2</th>\n",
422 |        "      <td>1.2</td>\n",
423 |        "      <td>Ringo</td>\n",
424 |        "    </tr>\n",
425 |        "  </tbody>\n",
426 |        "</table>\n",
427 |        "</div>"
428 |       ],
429 |       "text/plain": [
430 |        "   growth    Name\n",
431 |        "0     0.5    Paul\n",
432 |        "1     0.7  George\n",
433 |        "2     1.2   Ringo"
434 |       ]
435 |      },
436 |      "execution_count": 15,
437 |      "metadata": {},
438 |      "output_type": "execute_result"
439 |     }
440 |    ],
441 |    "source": [
442 |     "pd.read_csv(csv_file)"
443 |    ]
444 |   },
445 |   {
446 |    "cell_type": "code",
447 |    "execution_count": 16,
448 |    "metadata": {
449 |     "lines_to_next_cell": 2
450 |    },
451 |    "outputs": [
452 |     {
453 |      "data": {
454 |       "text/html": [
455 |        "<div>\n",
456 |        "<style scoped>\n",
457 |        "    .dataframe tbody tr th:only-of-type {\n",
458 |        "        vertical-align: middle;\n",
459 |        "    }\n",
460 |        "\n",
461 |        "    .dataframe tbody tr th {\n",
462 |        "        vertical-align: top;\n",
463 |        "    }\n",
464 |        "\n",
465 |        "    .dataframe thead th {\n",
466 |        "        text-align: right;\n",
467 |        "    }\n",
468 |        "</style>\n",
469 |        "<table border=\"1\" class=\"dataframe\">\n",
470 |        "  <thead>\n",
471 |        "    <tr style=\"text-align: right;\">\n",
472 |        "      <th></th>\n",
473 |        "      <th>a</th>\n",
474 |        "      <th>b</th>\n",
475 |        "      <th>c</th>\n",
476 |        "    </tr>\n",
477 |        "  </thead>\n",
478 |        "  <tbody>\n",
479 |        "    <tr>\n",
480 |        "      <th>0</th>\n",
481 |        "      <td>0.496714</td>\n",
482 |        "      <td>-0.138264</td>\n",
483 |        "      <td>0.647689</td>\n",
484 |        "    </tr>\n",
485 |        "    <tr>\n",
486 |        "      <th>1</th>\n",
487 |        "      <td>1.523030</td>\n",
488 |        "      <td>-0.234153</td>\n",
489 |        "      <td>-0.234137</td>\n",
490 |        "    </tr>\n",
491 |        "    <tr>\n",
492 |        "      <th>2</th>\n",
493 |        "      <td>1.579213</td>\n",
494 |        "      <td>0.767435</td>\n",
495 |        "      <td>-0.469474</td>\n",
496 |        "    </tr>\n",
497 |        "    <tr>\n",
498 |        "      <th>3</th>\n",
499 |        "      <td>0.542560</td>\n",
500 |        "      <td>-0.463418</td>\n",
501 |        "      <td>-0.465730</td>\n",
502 |        "    </tr>\n",
503 |        "    <tr>\n",
504 |        "      <th>4</th>\n",
505 |        "      <td>0.241962</td>\n",
506 |        "      <td>-1.913280</td>\n",
507 |        "      <td>-1.724918</td>\n",
508 |        "    </tr>\n",
509 |        "    <tr>\n",
510 |        "      <th>5</th>\n",
511 |        "      <td>-0.562288</td>\n",
512 |        "      <td>-1.012831</td>\n",
513 |        "      <td>0.314247</td>\n",
514 |        "    </tr>\n",
515 |        "    <tr>\n",
516 |        "      <th>6</th>\n",
517 |        "      <td>-0.908024</td>\n",
518 |        "      <td>-1.412304</td>\n",
519 |        "      <td>1.465649</td>\n",
520 |        "    </tr>\n",
521 |        "    <tr>\n",
522 |        "      <th>7</th>\n",
523 |        "      <td>-0.225776</td>\n",
524 |        "      <td>0.067528</td>\n",
525 |        "      <td>-1.424748</td>\n",
526 |        "    </tr>\n",
527 |        "    <tr>\n",
528 |        "      <th>8</th>\n",
529 |        "      <td>-0.544383</td>\n",
530 |        "      <td>0.110923</td>\n",
531 |        "      <td>-1.150994</td>\n",
532 |        "    </tr>\n",
533 |        "    <tr>\n",
534 |        "      <th>9</th>\n",
535 |        "      <td>0.375698</td>\n",
536 |        "      <td>-0.600639</td>\n",
537 |        "      <td>-0.291694</td>\n",
538 |        "    </tr>\n",
539 |        "  </tbody>\n",
540 |        "</table>\n",
541 |        "</div>"
542 |       ],
543 |       "text/plain": [
544 |        "          a         b         c\n",
545 |        "0  0.496714 -0.138264  0.647689\n",
546 |        "1  1.523030 -0.234153 -0.234137\n",
547 |        "2  1.579213  0.767435 -0.469474\n",
548 |        "3  0.542560 -0.463418 -0.465730\n",
549 |        "4  0.241962 -1.913280 -1.724918\n",
550 |        "5 -0.562288 -1.012831  0.314247\n",
551 |        "6 -0.908024 -1.412304  1.465649\n",
552 |        "7 -0.225776  0.067528 -1.424748\n",
553 |        "8 -0.544383  0.110923 -1.150994\n",
554 |        "9  0.375698 -0.600639 -0.291694"
555 |       ]
556 |      },
557 |      "execution_count": 16,
558 |      "metadata": {},
559 |      "output_type": "execute_result"
560 |     }
561 |    ],
562 |    "source": [
563 |     "import numpy as np\n",
564 |     "np.random.seed(42)\n",
565 |     "pd.DataFrame(np.random.randn(10,3),\n",
566 |     "    columns=['a', 'b', 'c'])"
567 |    ]
568 |   },
569 |   {
570 |    "cell_type": "code",
571 |    "execution_count": 17,
572 |    "metadata": {
573 |     "lines_to_next_cell": 2
574 |    },
575 |    "outputs": [
576 |     {
577 |      "data": {
578 |       "text/plain": [
579 |        "[RangeIndex(start=0, stop=3, step=1),\n",
580 |        " Index(['growth', 'Name'], dtype='object')]"
581 |       ]
582 |      },
583 |      "execution_count": 17,
584 |      "metadata": {},
585 |      "output_type": "execute_result"
586 |     }
587 |    ],
588 |    "source": [
589 |     "df.axes  # doctest: +NORMALIZE_WHITESPACE"
590 |    ]
591 |   },
592 |   {
593 |    "cell_type": "code",
594 |    "execution_count": 18,
595 |    "metadata": {
596 |     "lines_to_next_cell": 2
597 |    },
598 |    "outputs": [
599 |     {
600 |      "data": {
601 |       "text/plain": [
602 |        "growth                2.4\n",
603 |        "Name      PaulGeorgeRingo\n",
604 |        "dtype: object"
605 |       ]
606 |      },
607 |      "execution_count": 18,
608 |      "metadata": {},
609 |      "output_type": "execute_result"
610 |     }
611 |    ],
612 |    "source": [
613 |     "df.sum(axis=0)"
614 |    ]
615 |   },
616 |   {
617 |    "cell_type": "code",
618 |    "execution_count": 19,
619 |    "metadata": {
620 |     "lines_to_next_cell": 2
621 |    },
622 |    "outputs": [
623 |     {
624 |      "name": "stderr",
625 |      "output_type": "stream",
626 |      "text": [
627 |       "<ipython-input-19-f6cc363c055e>:1: FutureWarning: Dropping of nuisance columns in DataFrame reductions (with 'numeric_only=None') is deprecated; in a future version this will raise TypeError.  Select only valid columns before calling the reduction.\n",
628 |       "  df.sum(axis=1)\n"
629 |      ]
630 |     },
631 |     {
632 |      "data": {
633 |       "text/plain": [
634 |        "0    0.5\n",
635 |        "1    0.7\n",
636 |        "2    1.2\n",
637 |        "dtype: float64"
638 |       ]
639 |      },
640 |      "execution_count": 19,
641 |      "metadata": {},
642 |      "output_type": "execute_result"
643 |     }
644 |    ],
645 |    "source": [
646 |     "df.sum(axis=1)"
647 |    ]
648 |   },
649 |   {
650 |    "cell_type": "code",
651 |    "execution_count": 20,
652 |    "metadata": {
653 |     "lines_to_next_cell": 2
654 |    },
655 |    "outputs": [
656 |     {
657 |      "data": {
658 |       "text/plain": [
659 |        "growth                2.4\n",
660 |        "Name      PaulGeorgeRingo\n",
661 |        "dtype: object"
662 |       ]
663 |      },
664 |      "execution_count": 20,
665 |      "metadata": {},
666 |      "output_type": "execute_result"
667 |     }
668 |    ],
669 |    "source": [
670 |     "df.sum(axis='index')"
671 |    ]
672 |   },
673 |   {
674 |    "cell_type": "code",
675 |    "execution_count": 21,
676 |    "metadata": {
677 |     "lines_to_next_cell": 2
678 |    },
679 |    "outputs": [
680 |     {
681 |      "name": "stderr",
682 |      "output_type": "stream",
683 |      "text": [
684 |       "<ipython-input-21-43bb752878cf>:1: FutureWarning: Dropping of nuisance columns in DataFrame reductions (with 'numeric_only=None') is deprecated; in a future version this will raise TypeError.  Select only valid columns before calling the reduction.\n",
685 |       "  df.sum(axis='columns')\n"
686 |      ]
687 |     },
688 |     {
689 |      "data": {
690 |       "text/plain": [
691 |        "0    0.5\n",
692 |        "1    0.7\n",
693 |        "2    1.2\n",
694 |        "dtype: float64"
695 |       ]
696 |      },
697 |      "execution_count": 21,
698 |      "metadata": {},
699 |      "output_type": "execute_result"
700 |     }
701 |    ],
702 |    "source": [
703 |     "df.sum(axis='columns')"
704 |    ]
705 |   },
706 |   {
707 |    "cell_type": "code",
708 |    "execution_count": 22,
709 |    "metadata": {
710 |     "lines_to_next_cell": 2
711 |    },
712 |    "outputs": [
713 |     {
714 |      "data": {
715 |       "text/plain": [
716 |        "RangeIndex(start=0, stop=3, step=1)"
717 |       ]
718 |      },
719 |      "execution_count": 22,
720 |      "metadata": {},
721 |      "output_type": "execute_result"
722 |     }
723 |    ],
724 |    "source": [
725 |     "df.axes[0]"
726 |    ]
727 |   },
728 |   {
729 |    "cell_type": "code",
730 |    "execution_count": 23,
731 |    "metadata": {
732 |     "lines_to_next_cell": 2
733 |    },
734 |    "outputs": [
735 |     {
736 |      "data": {
737 |       "text/plain": [
738 |        "Index(['growth', 'Name'], dtype='object')"
739 |       ]
740 |      },
741 |      "execution_count": 23,
742 |      "metadata": {},
743 |      "output_type": "execute_result"
744 |     }
745 |    ],
746 |    "source": [
747 |     "df.axes[1]"
748 |    ]
749 |   },
750 |   {
751 |    "cell_type": "code",
752 |    "execution_count": 24,
753 |    "metadata": {
754 |     "lines_to_next_cell": 2
755 |    },
756 |    "outputs": [
757 |     {
758 |      "data": {
759 |       "text/html": [
760 |        "<div>\n",
761 |        "<style scoped>\n",
762 |        "    .dataframe tbody tr th:only-of-type {\n",
763 |        "        vertical-align: middle;\n",
764 |        "    }\n",
765 |        "\n",
766 |        "    .dataframe tbody tr th {\n",
767 |        "        vertical-align: top;\n",
768 |        "    }\n",
769 |        "\n",
770 |        "    .dataframe thead th {\n",
771 |        "        text-align: right;\n",
772 |        "    }\n",
773 |        "</style>\n",
774 |        "<table border=\"1\" class=\"dataframe\">\n",
775 |        "  <thead>\n",
776 |        "    <tr style=\"text-align: right;\">\n",
777 |        "      <th></th>\n",
778 |        "      <th>Score1</th>\n",
779 |        "      <th>Score2</th>\n",
780 |        "    </tr>\n",
781 |        "  </thead>\n",
782 |        "  <tbody>\n",
783 |        "    <tr>\n",
784 |        "      <th>0</th>\n",
785 |        "      <td>None</td>\n",
786 |        "      <td>85</td>\n",
787 |        "    </tr>\n",
788 |        "    <tr>\n",
789 |        "      <th>1</th>\n",
790 |        "      <td>None</td>\n",
791 |        "      <td>90</td>\n",
792 |        "    </tr>\n",
793 |        "  </tbody>\n",
794 |        "</table>\n",
795 |        "</div>"
796 |       ],
797 |       "text/plain": [
798 |        "  Score1  Score2\n",
799 |        "0   None      85\n",
800 |        "1   None      90"
801 |       ]
802 |      },
803 |      "execution_count": 24,
804 |      "metadata": {},
805 |      "output_type": "execute_result"
806 |     }
807 |    ],
808 |    "source": [
809 |     "df = pd.DataFrame({'Score1': [None, None],\n",
810 |     "                   'Score2': [85, 90]})\n",
811 |     "df"
812 |    ]
813 |   },
814 |   {
815 |    "cell_type": "code",
816 |    "execution_count": 25,
817 |    "metadata": {
818 |     "lines_to_next_cell": 2
819 |    },
820 |    "outputs": [
821 |     {
822 |      "data": {
823 |       "text/plain": [
824 |        "Score1      0\n",
825 |        "Score2    175\n",
826 |        "dtype: int64"
827 |       ]
828 |      },
829 |      "execution_count": 25,
830 |      "metadata": {},
831 |      "output_type": "execute_result"
832 |     }
833 |    ],
834 |    "source": [
835 |     "df.apply(np.sum, axis=0)"
836 |    ]
837 |   },
838 |   {
839 |    "cell_type": "code",
840 |    "execution_count": 26,
841 |    "metadata": {
842 |     "lines_to_next_cell": 2
843 |    },
844 |    "outputs": [
845 |     {
846 |      "data": {
847 |       "text/plain": [
848 |        "0    85\n",
849 |        "1    90\n",
850 |        "dtype: int64"
851 |       ]
852 |      },
853 |      "execution_count": 26,
854 |      "metadata": {},
855 |      "output_type": "execute_result"
856 |     }
857 |    ],
858 |    "source": [
859 |     "df.apply(np.sum, axis=1)"
860 |    ]
861 |   }
862 |  ],
863 |  "metadata": {
864 |   "jupytext": {
865 |    "cell_metadata_filter": "-all",
866 |    "main_language": "python",
867 |    "notebook_metadata_filter": "-all"
868 |   },
869 |   "kernelspec": {
870 |    "display_name": "Python 3",
871 |    "language": "python",
872 |    "name": "python3"
873 |   },
874 |   "language_info": {
875 |    "codemirror_mode": {
876 |     "name": "ipython",
877 |     "version": 3
878 |    },
879 |    "file_extension": ".py",
880 |    "mimetype": "text/x-python",
881 |    "name": "python",
882 |    "nbconvert_exporter": "python",
883 |    "pygments_lexer": "ipython3",
884 |    "version": "3.8.5"
885 |   }
886 |  },
887 |  "nbformat": 4,
888 |  "nbformat_minor": 4
889 | }
890 | 


--------------------------------------------------------------------------------
/33-exporting-code.ipynb:
--------------------------------------------------------------------------------
   1 | {
   2 |  "cells": [
   3 |   {
   4 |    "cell_type": "code",
   5 |    "execution_count": 1,
   6 |    "metadata": {},
   7 |    "outputs": [
   8 |     {
   9 |      "name": "stderr",
  10 |      "output_type": "stream",
  11 |      "text": [
  12 |       "/home/matt/envs/menv/lib/python3.8/site-packages/IPython/core/interactiveshell.py:3418: DtypeWarning: Columns (7) have mixed types.Specify dtype option on import or set low_memory=False.\n",
  13 |       "  exec(code_obj, self.user_global_ns, self.user_ns)\n"
  14 |      ]
  15 |     }
  16 |    ],
  17 |    "source": [
  18 |     "import pandas as pd\n",
  19 |     "url = 'https://github.com/mattharrison/datasets/raw/master'\\\n",
  20 |     "      '/data/dirtydevil.txt'\n",
  21 |     "df = pd.read_csv(url, skiprows=lambda num: num <34 or num == 35,\n",
  22 |     "                 sep='\\t')\n",
  23 |     "def to_denver_time(df_, time_col, tz_col):\n",
  24 |     "    \"\"\"Parse time_col per tz_col group and convert it to America/Denver.\"\"\"\n",
  25 |     "    zones = df_[tz_col].replace('MDT', 'MST7MDT')\n",
  26 |     "    def _localize(times):  # times.name is handed to tz_localize as the zone\n",
  27 |     "        parsed = pd.to_datetime(times)\n",
  28 |     "        local = parsed.dt.tz_localize(times.name, ambiguous=True)\n",
  29 |     "        return local.dt.tz_convert('America/Denver')\n",
  30 |     "    by_zone = df_.assign(**{tz_col: zones}).groupby(tz_col)\n",
  31 |     "    return by_zone[time_col].transform(_localize)"
  32 |    ]
  33 |   },
  34 |   {
  35 |    "cell_type": "code",
  36 |    "execution_count": 2,
  37 |    "metadata": {},
  38 |    "outputs": [],
  39 |    "source": [
  40 |     "def tweak_river(df_):\n",
  41 |     "    \"\"\"Set the converted 'datetime' as index and rename the two coded columns.\"\"\"\n",
  42 |     "    new_names = {'144166_00060': 'cfs',\n",
  43 |     "                 '144167_00065': 'gage_height'}\n",
  44 |     "    denver_time = to_denver_time(df_, 'datetime', 'tz_cd')\n",
  45 |     "    renamed = df_.assign(datetime=denver_time).rename(columns=new_names)\n",
  46 |     "    return renamed.set_index('datetime')"
  47 |    ]
  48 |   },
  49 |   {
  50 |    "cell_type": "code",
  51 |    "execution_count": 3,
  52 |    "metadata": {
  53 |     "lines_to_next_cell": 2
  54 |    },
  55 |    "outputs": [
  56 |     {
  57 |      "data": {
  58 |       "text/html": [
  59 |        "<div>\n",
  60 |        "<style scoped>\n",
  61 |        "    .dataframe tbody tr th:only-of-type {\n",
  62 |        "        vertical-align: middle;\n",
  63 |        "    }\n",
  64 |        "\n",
  65 |        "    .dataframe tbody tr th {\n",
  66 |        "        vertical-align: top;\n",
  67 |        "    }\n",
  68 |        "\n",
  69 |        "    .dataframe thead th {\n",
  70 |        "        text-align: right;\n",
  71 |        "    }\n",
  72 |        "</style>\n",
  73 |        "<table border=\"1\" class=\"dataframe\">\n",
  74 |        "  <thead>\n",
  75 |        "    <tr style=\"text-align: right;\">\n",
  76 |        "      <th></th>\n",
  77 |        "      <th>agency_cd</th>\n",
  78 |        "      <th>site_no</th>\n",
  79 |        "      <th>tz_cd</th>\n",
  80 |        "      <th>cfs</th>\n",
  81 |        "      <th>144166_00060_cd</th>\n",
  82 |        "      <th>gage_height</th>\n",
  83 |        "      <th>144167_00065_cd</th>\n",
  84 |        "    </tr>\n",
  85 |        "    <tr>\n",
  86 |        "      <th>datetime</th>\n",
  87 |        "      <th></th>\n",
  88 |        "      <th></th>\n",
  89 |        "      <th></th>\n",
  90 |        "      <th></th>\n",
  91 |        "      <th></th>\n",
  92 |        "      <th></th>\n",
  93 |        "      <th></th>\n",
  94 |        "    </tr>\n",
  95 |        "  </thead>\n",
  96 |        "  <tbody>\n",
  97 |        "    <tr>\n",
  98 |        "      <th>2001-05-07 01:00:00-06:00</th>\n",
  99 |        "      <td>USGS</td>\n",
 100 |        "      <td>9333500</td>\n",
 101 |        "      <td>MDT</td>\n",
 102 |        "      <td>71.00</td>\n",
 103 |        "      <td>A:[91]</td>\n",
 104 |        "      <td>NaN</td>\n",
 105 |        "      <td>NaN</td>\n",
 106 |        "    </tr>\n",
 107 |        "    <tr>\n",
 108 |        "      <th>2001-05-07 01:15:00-06:00</th>\n",
 109 |        "      <td>USGS</td>\n",
 110 |        "      <td>9333500</td>\n",
 111 |        "      <td>MDT</td>\n",
 112 |        "      <td>71.00</td>\n",
 113 |        "      <td>A:[91]</td>\n",
 114 |        "      <td>NaN</td>\n",
 115 |        "      <td>NaN</td>\n",
 116 |        "    </tr>\n",
 117 |        "    <tr>\n",
 118 |        "      <th>2001-05-07 01:30:00-06:00</th>\n",
 119 |        "      <td>USGS</td>\n",
 120 |        "      <td>9333500</td>\n",
 121 |        "      <td>MDT</td>\n",
 122 |        "      <td>71.00</td>\n",
 123 |        "      <td>A:[91]</td>\n",
 124 |        "      <td>NaN</td>\n",
 125 |        "      <td>NaN</td>\n",
 126 |        "    </tr>\n",
 127 |        "    <tr>\n",
 128 |        "      <th>2001-05-07 01:45:00-06:00</th>\n",
 129 |        "      <td>USGS</td>\n",
 130 |        "      <td>9333500</td>\n",
 131 |        "      <td>MDT</td>\n",
 132 |        "      <td>70.00</td>\n",
 133 |        "      <td>A:[91]</td>\n",
 134 |        "      <td>NaN</td>\n",
 135 |        "      <td>NaN</td>\n",
 136 |        "    </tr>\n",
 137 |        "    <tr>\n",
 138 |        "      <th>2001-05-07 02:00:00-06:00</th>\n",
 139 |        "      <td>USGS</td>\n",
 140 |        "      <td>9333500</td>\n",
 141 |        "      <td>MDT</td>\n",
 142 |        "      <td>70.00</td>\n",
 143 |        "      <td>A:[91]</td>\n",
 144 |        "      <td>NaN</td>\n",
 145 |        "      <td>NaN</td>\n",
 146 |        "    </tr>\n",
 147 |        "    <tr>\n",
 148 |        "      <th>...</th>\n",
 149 |        "      <td>...</td>\n",
 150 |        "      <td>...</td>\n",
 151 |        "      <td>...</td>\n",
 152 |        "      <td>...</td>\n",
 153 |        "      <td>...</td>\n",
 154 |        "      <td>...</td>\n",
 155 |        "      <td>...</td>\n",
 156 |        "    </tr>\n",
 157 |        "    <tr>\n",
 158 |        "      <th>2020-09-28 08:30:00-06:00</th>\n",
 159 |        "      <td>USGS</td>\n",
 160 |        "      <td>9333500</td>\n",
 161 |        "      <td>MDT</td>\n",
 162 |        "      <td>9.53</td>\n",
 163 |        "      <td>P</td>\n",
 164 |        "      <td>6.16</td>\n",
 165 |        "      <td>P</td>\n",
 166 |        "    </tr>\n",
 167 |        "    <tr>\n",
 168 |        "      <th>2020-09-28 08:45:00-06:00</th>\n",
 169 |        "      <td>USGS</td>\n",
 170 |        "      <td>9333500</td>\n",
 171 |        "      <td>MDT</td>\n",
 172 |        "      <td>9.20</td>\n",
 173 |        "      <td>P</td>\n",
 174 |        "      <td>6.15</td>\n",
 175 |        "      <td>P</td>\n",
 176 |        "    </tr>\n",
 177 |        "    <tr>\n",
 178 |        "      <th>2020-09-28 09:00:00-06:00</th>\n",
 179 |        "      <td>USGS</td>\n",
 180 |        "      <td>9333500</td>\n",
 181 |        "      <td>MDT</td>\n",
 182 |        "      <td>9.20</td>\n",
 183 |        "      <td>P</td>\n",
 184 |        "      <td>6.15</td>\n",
 185 |        "      <td>P</td>\n",
 186 |        "    </tr>\n",
 187 |        "    <tr>\n",
 188 |        "      <th>2020-09-28 09:15:00-06:00</th>\n",
 189 |        "      <td>USGS</td>\n",
 190 |        "      <td>9333500</td>\n",
 191 |        "      <td>MDT</td>\n",
 192 |        "      <td>9.20</td>\n",
 193 |        "      <td>P</td>\n",
 194 |        "      <td>6.15</td>\n",
 195 |        "      <td>P</td>\n",
 196 |        "    </tr>\n",
 197 |        "    <tr>\n",
 198 |        "      <th>2020-09-28 09:30:00-06:00</th>\n",
 199 |        "      <td>USGS</td>\n",
 200 |        "      <td>9333500</td>\n",
 201 |        "      <td>MDT</td>\n",
 202 |        "      <td>9.20</td>\n",
 203 |        "      <td>P</td>\n",
 204 |        "      <td>6.15</td>\n",
 205 |        "      <td>P</td>\n",
 206 |        "    </tr>\n",
 207 |        "  </tbody>\n",
 208 |        "</table>\n",
 209 |        "<p>539305 rows × 7 columns</p>\n",
 210 |        "</div>"
 211 |       ],
 212 |       "text/plain": [
 213 |        "                          agency_cd  site_no tz_cd    cfs 144166_00060_cd  \\\n",
 214 |        "datetime                                                                    \n",
 215 |        "2001-05-07 01:00:00-06:00      USGS  9333500   MDT  71.00          A:[91]   \n",
 216 |        "2001-05-07 01:15:00-06:00      USGS  9333500   MDT  71.00          A:[91]   \n",
 217 |        "2001-05-07 01:30:00-06:00      USGS  9333500   MDT  71.00          A:[91]   \n",
 218 |        "2001-05-07 01:45:00-06:00      USGS  9333500   MDT  70.00          A:[91]   \n",
 219 |        "2001-05-07 02:00:00-06:00      USGS  9333500   MDT  70.00          A:[91]   \n",
 220 |        "...                             ...      ...   ...    ...             ...   \n",
 221 |        "2020-09-28 08:30:00-06:00      USGS  9333500   MDT   9.53               P   \n",
 222 |        "2020-09-28 08:45:00-06:00      USGS  9333500   MDT   9.20               P   \n",
 223 |        "2020-09-28 09:00:00-06:00      USGS  9333500   MDT   9.20               P   \n",
 224 |        "2020-09-28 09:15:00-06:00      USGS  9333500   MDT   9.20               P   \n",
 225 |        "2020-09-28 09:30:00-06:00      USGS  9333500   MDT   9.20               P   \n",
 226 |        "\n",
 227 |        "                           gage_height 144167_00065_cd  \n",
 228 |        "datetime                                                \n",
 229 |        "2001-05-07 01:00:00-06:00          NaN             NaN  \n",
 230 |        "2001-05-07 01:15:00-06:00          NaN             NaN  \n",
 231 |        "2001-05-07 01:30:00-06:00          NaN             NaN  \n",
 232 |        "2001-05-07 01:45:00-06:00          NaN             NaN  \n",
 233 |        "2001-05-07 02:00:00-06:00          NaN             NaN  \n",
 234 |        "...                                ...             ...  \n",
 235 |        "2020-09-28 08:30:00-06:00         6.16               P  \n",
 236 |        "2020-09-28 08:45:00-06:00         6.15               P  \n",
 237 |        "2020-09-28 09:00:00-06:00         6.15               P  \n",
 238 |        "2020-09-28 09:15:00-06:00         6.15               P  \n",
 239 |        "2020-09-28 09:30:00-06:00         6.15               P  \n",
 240 |        "\n",
 241 |        "[539305 rows x 7 columns]"
 242 |       ]
 243 |      },
 244 |      "execution_count": 3,
 245 |      "metadata": {},
 246 |      "output_type": "execute_result"
 247 |     }
 248 |    ],
 249 |    "source": [
 250 |     "dd = tweak_river(df)\n",
 251 |     "dd"
 252 |    ]
 253 |   },
 254 |   {
 255 |    "cell_type": "code",
 256 |    "execution_count": 4,
 257 |    "metadata": {
 258 |     "lines_to_next_cell": 2
 259 |    },
 260 |    "outputs": [],
 261 |    "source": [
 262 |     "dd.to_csv('/tmp/dd.csv')  # doctest: +SKIP"
 263 |    ]
 264 |   },
 265 |   {
 266 |    "cell_type": "code",
 267 |    "execution_count": 5,
 268 |    "metadata": {
 269 |     "lines_to_next_cell": 2
 270 |    },
 271 |    "outputs": [
 272 |     {
 273 |      "name": "stdout",
 274 |      "output_type": "stream",
 275 |      "text": [
 276 |       "datetime,agency_cd,site_no,tz_cd,cfs,144166_00060_cd,gage_height,144167_00065_cd\n",
 277 |       "2001-05-07 01:00:00-06:00,USGS,9333500,MDT,71.0,A:[91],,\n",
 278 |       "2001-05-07 01:15:00-06:00,USGS,9333500,MDT,71.0,A:[91],,\n",
 279 |       "2001-05-07 01:30:00-06:00,USGS,9333500,MDT,71.0,A:[91],,\n",
 280 |       "2001-05-07 01:45:00-06:00,USGS,9333500,MDT,70.0,A:[91],,\n",
 281 |       "2001-05-07 02:00:00-06:00,USGS,9333500,MDT,70.0,A:[91],,\n",
 282 |       "\n"
 283 |      ]
 284 |     }
 285 |    ],
 286 |    "source": [
 287 |     "print(dd.head(5).to_csv())"
 288 |    ]
 289 |   },
 290 |   {
 291 |    "cell_type": "code",
 292 |    "execution_count": 6,
 293 |    "metadata": {
 294 |     "lines_to_next_cell": 2
 295 |    },
 296 |    "outputs": [
 297 |     {
 298 |      "name": "stderr",
 299 |      "output_type": "stream",
 300 |      "text": [
 301 |       "/home/matt/envs/menv/lib/python3.8/site-packages/IPython/core/interactiveshell.py:3418: DtypeWarning: Columns (7) have mixed types.Specify dtype option on import or set low_memory=False.\n",
 302 |       "  exec(code_obj, self.user_global_ns, self.user_ns)\n"
 303 |      ]
 304 |     }
 305 |    ],
 306 |    "source": [
 307 |     "dd2 = pd.read_csv('/tmp/dd.csv', index_col='datetime')"
 308 |    ]
 309 |   },
 310 |   {
 311 |    "cell_type": "code",
 312 |    "execution_count": 7,
 313 |    "metadata": {
 314 |     "lines_to_next_cell": 2
 315 |    },
 316 |    "outputs": [
 317 |     {
 318 |      "ename": "ValueError",
 319 |      "evalue": "Excel does not support datetimes with timezones. Please ensure that datetimes are timezone unaware before writing to Excel.",
 320 |      "output_type": "error",
 321 |      "traceback": [
 322 |       "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
 323 |       "\u001b[0;31mValueError\u001b[0m                                Traceback (most recent call last)",
 324 |       "\u001b[0;32m<ipython-input-7-0ac6c2e2e196>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0mdd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mto_excel\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m'/tmp/dd.xlsx'\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m",
 325 |       "\u001b[0;32m~/envs/menv/lib/python3.8/site-packages/pandas/core/generic.py\u001b[0m in \u001b[0;36mto_excel\u001b[0;34m(self, excel_writer, sheet_name, na_rep, float_format, columns, header, index, index_label, startrow, startcol, engine, merge_cells, encoding, inf_rep, verbose, freeze_panes, storage_options)\u001b[0m\n\u001b[1;32m   2282\u001b[0m             \u001b[0minf_rep\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0minf_rep\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m   2283\u001b[0m         )\n\u001b[0;32m-> 2284\u001b[0;31m         formatter.write(\n\u001b[0m\u001b[1;32m   2285\u001b[0m             \u001b[0mexcel_writer\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m   2286\u001b[0m             \u001b[0msheet_name\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0msheet_name\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
 326 |       "\u001b[0;32m~/envs/menv/lib/python3.8/site-packages/pandas/io/formats/excel.py\u001b[0m in \u001b[0;36mwrite\u001b[0;34m(self, writer, sheet_name, startrow, startcol, freeze_panes, engine, storage_options)\u001b[0m\n\u001b[1;32m    838\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    839\u001b[0m         \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 840\u001b[0;31m             writer.write_cells(\n\u001b[0m\u001b[1;32m    841\u001b[0m                 \u001b[0mformatted_cells\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    842\u001b[0m                 \u001b[0msheet_name\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
 327 |       "\u001b[0;32m~/envs/menv/lib/python3.8/site-packages/pandas/io/excel/_xlsxwriter.py\u001b[0m in \u001b[0;36mwrite_cells\u001b[0;34m(self, cells, sheet_name, startrow, startcol, freeze_panes)\u001b[0m\n\u001b[1;32m    225\u001b[0m             \u001b[0mwks\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mfreeze_panes\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mfreeze_panes\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    226\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 227\u001b[0;31m         \u001b[0;32mfor\u001b[0m \u001b[0mcell\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mcells\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    228\u001b[0m             \u001b[0mval\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mfmt\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_value_with_fmt\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mcell\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mval\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    229\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n",
 328 |       "\u001b[0;32m~/envs/menv/lib/python3.8/site-packages/pandas/io/formats/excel.py\u001b[0m in \u001b[0;36mget_formatted_cells\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m    776\u001b[0m     \u001b[0;32mdef\u001b[0m \u001b[0mget_formatted_cells\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;34m->\u001b[0m \u001b[0mIterable\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mExcelCell\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    777\u001b[0m         \u001b[0;32mfor\u001b[0m \u001b[0mcell\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mitertools\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mchain\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_format_header\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_format_body\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 778\u001b[0;31m             \u001b[0mcell\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mval\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_format_value\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mcell\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mval\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    779\u001b[0m             \u001b[0;32myield\u001b[0m \u001b[0mcell\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    780\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n",
 329 |       "\u001b[0;32m~/envs/menv/lib/python3.8/site-packages/pandas/io/formats/excel.py\u001b[0m in \u001b[0;36m_format_value\u001b[0;34m(self, val)\u001b[0m\n\u001b[1;32m    524\u001b[0m                 \u001b[0mval\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mfloat\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mfloat_format\u001b[0m \u001b[0;34m%\u001b[0m \u001b[0mval\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    525\u001b[0m         \u001b[0;32mif\u001b[0m \u001b[0mgetattr\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mval\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m\"tzinfo\"\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 526\u001b[0;31m             raise ValueError(\n\u001b[0m\u001b[1;32m    527\u001b[0m                 \u001b[0;34m\"Excel does not support datetimes with \"\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    528\u001b[0m                 \u001b[0;34m\"timezones. Please ensure that datetimes \"\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
 330 |       "\u001b[0;31mValueError\u001b[0m: Excel does not support datetimes with timezones. Please ensure that datetimes are timezone unaware before writing to Excel."
 331 |      ]
 332 |     }
 333 |    ],
 334 |    "source": [
 335 |     "dd.to_excel('/tmp/dd.xlsx')"
 336 |    ]
 337 |   },
 338 |   {
 339 |    "cell_type": "code",
 340 |    "execution_count": 8,
 341 |    "metadata": {
 342 |     "lines_to_next_cell": 2
 343 |    },
 344 |    "outputs": [],
 345 |    "source": [
 346 |     "(dd  # doctest: +SKIP\n",
 347 |     " .reset_index()\n",
 348 |     " .assign(datetime=lambda df_: df_.datetime.dt.tz_convert(tz=None))\n",
 349 |     " .set_index('datetime')\n",
 350 |     " .to_excel('/tmp/dd.xlsx')\n",
 351 |     ")"
 352 |    ]
 353 |   },
 354 |   {
 355 |    "cell_type": "code",
 356 |    "execution_count": 9,
 357 |    "metadata": {
 358 |     "lines_to_next_cell": 2
 359 |    },
 360 |    "outputs": [],
 361 |    "source": [
 362 |     "dd2 = (dd\n",
 363 |     " .reset_index()\n",
 364 |     " .assign(datetime=lambda df_: df_.datetime.dt.tz_convert(tz=None))\n",
 365 |     " .set_index('datetime')\n",
 366 |     ")\n",
 367 |     "# the context manager saves and closes the workbook when the block exits\n",
 368 |     "with pd.ExcelWriter('/tmp/dd2.xlsx') as writer:  # doctest: +SKIP\n",
 369 |     "    (dd2\n",
 370 |     "     .loc['2010':'2010-12-31']\n",
 371 |     "     .to_excel(writer, sheet_name='2010')\n",
 372 |     "    )\n",
 373 |     "    (dd2\n",
 374 |     "     .loc['2011':'2011-12-31']\n",
 375 |     "     .to_excel(writer, sheet_name='2011')\n",
 376 |     "    )"
 377 |    ]
 378 |   },
 379 |   {
 380 |    "cell_type": "code",
 381 |    "execution_count": 10,
 382 |    "metadata": {
 383 |     "lines_to_next_cell": 2,
 384 |     "scrolled": true
 385 |    },
 386 |    "outputs": [
 387 |     {
 388 |      "ename": "ValueError",
 389 |      "evalue": "feather does not support serializing <class 'pandas.core.indexes.datetimes.DatetimeIndex'> for the index; you can .reset_index() to make the index into column(s)",
 390 |      "output_type": "error",
 391 |      "traceback": [
 392 |       "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
 393 |       "\u001b[0;31mValueError\u001b[0m                                Traceback (most recent call last)",
 394 |       "\u001b[0;32m<ipython-input-10-73127889b6d4>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0mdd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mto_feather\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m'/tmp/dd.fea'\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m",
 395 |       "\u001b[0;32m~/envs/menv/lib/python3.8/site-packages/pandas/util/_decorators.py\u001b[0m in \u001b[0;36mwrapper\u001b[0;34m(*args, **kwargs)\u001b[0m\n\u001b[1;32m    205\u001b[0m                 \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    206\u001b[0m                     \u001b[0mkwargs\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mnew_arg_name\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mnew_arg_value\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 207\u001b[0;31m             \u001b[0;32mreturn\u001b[0m \u001b[0mfunc\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0margs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    208\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    209\u001b[0m         \u001b[0;32mreturn\u001b[0m \u001b[0mcast\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mF\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mwrapper\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
 396 |       "\u001b[0;32m~/envs/menv/lib/python3.8/site-packages/pandas/core/frame.py\u001b[0m in \u001b[0;36mto_feather\u001b[0;34m(self, path, **kwargs)\u001b[0m\n\u001b[1;32m   2517\u001b[0m         \u001b[0;32mfrom\u001b[0m \u001b[0mpandas\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mio\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mfeather_format\u001b[0m \u001b[0;32mimport\u001b[0m \u001b[0mto_feather\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m   2518\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 2519\u001b[0;31m         \u001b[0mto_feather\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mpath\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkwargs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m   2520\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m   2521\u001b[0m     @doc(\n",
 397 |       "\u001b[0;32m~/envs/menv/lib/python3.8/site-packages/pandas/io/feather_format.py\u001b[0m in \u001b[0;36mto_feather\u001b[0;34m(df, path, storage_options, **kwargs)\u001b[0m\n\u001b[1;32m     59\u001b[0m     \u001b[0;32mif\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0misinstance\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mdf\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mindex\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m(\u001b[0m\u001b[0mInt64Index\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mRangeIndex\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     60\u001b[0m         \u001b[0mtyp\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mtype\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mdf\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mindex\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 61\u001b[0;31m         raise ValueError(\n\u001b[0m\u001b[1;32m     62\u001b[0m             \u001b[0;34mf\"feather does not support serializing {typ} \"\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m     63\u001b[0m             \u001b[0;34m\"for the index; you can .reset_index() to make the index into column(s)\"\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
 398 |       "\u001b[0;31mValueError\u001b[0m: feather does not support serializing <class 'pandas.core.indexes.datetimes.DatetimeIndex'> for the index; you can .reset_index() to make the index into column(s)"
 399 |      ]
 400 |     }
 401 |    ],
 402 |    "source": [
 403 |     "dd.to_feather('/tmp/dd.fea')"
 404 |    ]
 405 |   },
 406 |   {
 407 |    "cell_type": "code",
 408 |    "execution_count": 11,
 409 |    "metadata": {
 410 |     "lines_to_next_cell": 2
 411 |    },
 412 |    "outputs": [],
 413 |    "source": [
 414 |     "(dd\n",
 415 |     " .reset_index()\n",
 416 |     " .to_feather('/tmp/dd.fea')\n",
 417 |     ")"
 418 |    ]
 419 |   },
 420 |   {
 421 |    "cell_type": "code",
 422 |    "execution_count": 12,
 423 |    "metadata": {
 424 |     "lines_to_next_cell": 2
 425 |    },
 426 |    "outputs": [
 427 |     {
 428 |      "data": {
 429 |       "text/plain": [
 430 |        "True"
 431 |       ]
 432 |      },
 433 |      "execution_count": 12,
 434 |      "metadata": {},
 435 |      "output_type": "execute_result"
 436 |     }
 437 |    ],
 438 |    "source": [
 439 |     "dd2 = pd.read_feather('/tmp/dd.fea')\n",
 440 |     "dd2.set_index('datetime').equals(dd)"
 441 |    ]
 442 |   },
 443 |   {
 444 |    "cell_type": "code",
 445 |    "execution_count": 13,
 446 |    "metadata": {
 447 |     "lines_to_next_cell": 2
 448 |    },
 449 |    "outputs": [],
 450 |    "source": [
 451 |     "import sqlite3\n",
 452 |     "con = sqlite3.connect('dd.db')\n",
 453 |     "dd.to_sql('dd', con, if_exists='replace')  # doctest: +SKIP"
 454 |    ]
 455 |   },
 456 |   {
 457 |    "cell_type": "code",
 458 |    "execution_count": 14,
 459 |    "metadata": {
 460 |     "lines_to_next_cell": 2
 461 |    },
 462 |    "outputs": [
 463 |     {
 464 |      "data": {
 465 |       "text/plain": [
 466 |        "False"
 467 |       ]
 468 |      },
 469 |      "execution_count": 14,
 470 |      "metadata": {},
 471 |      "output_type": "execute_result"
 472 |     }
 473 |    ],
 474 |    "source": [
 475 |     "import sqlalchemy as sa\n",
 476 |     "eng = sa.create_engine('sqlite:///dd.db')\n",
 477 |     "sa_con = eng.connect()\n",
 478 |     "dd2 = pd.read_sql('dd', sa_con, index_col='datetime')  # doctest: +SKIP\n",
 479 |     "dd2.equals(dd)  # doctest: +SKIP"
 480 |    ]
 481 |   },
 482 |   {
 483 |    "cell_type": "code",
 484 |    "execution_count": 15,
 485 |    "metadata": {
 486 |     "lines_to_next_cell": 2
 487 |    },
 488 |    "outputs": [
 489 |     {
 490 |      "data": {
 491 |       "text/html": [
 492 |        "<div>\n",
 493 |        "<style scoped>\n",
 494 |        "    .dataframe tbody tr th:only-of-type {\n",
 495 |        "        vertical-align: middle;\n",
 496 |        "    }\n",
 497 |        "\n",
 498 |        "    .dataframe tbody tr th {\n",
 499 |        "        vertical-align: top;\n",
 500 |        "    }\n",
 501 |        "\n",
 502 |        "    .dataframe thead th {\n",
 503 |        "        text-align: right;\n",
 504 |        "    }\n",
 505 |        "</style>\n",
 506 |        "<table border=\"1\" class=\"dataframe\">\n",
 507 |        "  <thead>\n",
 508 |        "    <tr style=\"text-align: right;\">\n",
 509 |        "      <th></th>\n",
 510 |        "      <th>agency_cd</th>\n",
 511 |        "      <th>site_no</th>\n",
 512 |        "      <th>tz_cd</th>\n",
 513 |        "      <th>cfs</th>\n",
 514 |        "      <th>144166_00060_cd</th>\n",
 515 |        "      <th>gage_height</th>\n",
 516 |        "      <th>144167_00065_cd</th>\n",
 517 |        "    </tr>\n",
 518 |        "    <tr>\n",
 519 |        "      <th>datetime</th>\n",
 520 |        "      <th></th>\n",
 521 |        "      <th></th>\n",
 522 |        "      <th></th>\n",
 523 |        "      <th></th>\n",
 524 |        "      <th></th>\n",
 525 |        "      <th></th>\n",
 526 |        "      <th></th>\n",
 527 |        "    </tr>\n",
 528 |        "  </thead>\n",
 529 |        "  <tbody>\n",
 530 |        "    <tr>\n",
 531 |        "      <th>2001-05-07 01:00:00</th>\n",
 532 |        "      <td>USGS</td>\n",
 533 |        "      <td>9333500</td>\n",
 534 |        "      <td>MDT</td>\n",
 535 |        "      <td>71.00</td>\n",
 536 |        "      <td>A:[91]</td>\n",
 537 |        "      <td>NaN</td>\n",
 538 |        "      <td>None</td>\n",
 539 |        "    </tr>\n",
 540 |        "    <tr>\n",
 541 |        "      <th>2001-05-07 01:15:00</th>\n",
 542 |        "      <td>USGS</td>\n",
 543 |        "      <td>9333500</td>\n",
 544 |        "      <td>MDT</td>\n",
 545 |        "      <td>71.00</td>\n",
 546 |        "      <td>A:[91]</td>\n",
 547 |        "      <td>NaN</td>\n",
 548 |        "      <td>None</td>\n",
 549 |        "    </tr>\n",
 550 |        "    <tr>\n",
 551 |        "      <th>2001-05-07 01:30:00</th>\n",
 552 |        "      <td>USGS</td>\n",
 553 |        "      <td>9333500</td>\n",
 554 |        "      <td>MDT</td>\n",
 555 |        "      <td>71.00</td>\n",
 556 |        "      <td>A:[91]</td>\n",
 557 |        "      <td>NaN</td>\n",
 558 |        "      <td>None</td>\n",
 559 |        "    </tr>\n",
 560 |        "    <tr>\n",
 561 |        "      <th>2001-05-07 01:45:00</th>\n",
 562 |        "      <td>USGS</td>\n",
 563 |        "      <td>9333500</td>\n",
 564 |        "      <td>MDT</td>\n",
 565 |        "      <td>70.00</td>\n",
 566 |        "      <td>A:[91]</td>\n",
 567 |        "      <td>NaN</td>\n",
 568 |        "      <td>None</td>\n",
 569 |        "    </tr>\n",
 570 |        "    <tr>\n",
 571 |        "      <th>2001-05-07 02:00:00</th>\n",
 572 |        "      <td>USGS</td>\n",
 573 |        "      <td>9333500</td>\n",
 574 |        "      <td>MDT</td>\n",
 575 |        "      <td>70.00</td>\n",
 576 |        "      <td>A:[91]</td>\n",
 577 |        "      <td>NaN</td>\n",
 578 |        "      <td>None</td>\n",
 579 |        "    </tr>\n",
 580 |        "    <tr>\n",
 581 |        "      <th>...</th>\n",
 582 |        "      <td>...</td>\n",
 583 |        "      <td>...</td>\n",
 584 |        "      <td>...</td>\n",
 585 |        "      <td>...</td>\n",
 586 |        "      <td>...</td>\n",
 587 |        "      <td>...</td>\n",
 588 |        "      <td>...</td>\n",
 589 |        "    </tr>\n",
 590 |        "    <tr>\n",
 591 |        "      <th>2020-09-28 08:30:00</th>\n",
 592 |        "      <td>USGS</td>\n",
 593 |        "      <td>9333500</td>\n",
 594 |        "      <td>MDT</td>\n",
 595 |        "      <td>9.53</td>\n",
 596 |        "      <td>P</td>\n",
 597 |        "      <td>6.16</td>\n",
 598 |        "      <td>P</td>\n",
 599 |        "    </tr>\n",
 600 |        "    <tr>\n",
 601 |        "      <th>2020-09-28 08:45:00</th>\n",
 602 |        "      <td>USGS</td>\n",
 603 |        "      <td>9333500</td>\n",
 604 |        "      <td>MDT</td>\n",
 605 |        "      <td>9.20</td>\n",
 606 |        "      <td>P</td>\n",
 607 |        "      <td>6.15</td>\n",
 608 |        "      <td>P</td>\n",
 609 |        "    </tr>\n",
 610 |        "    <tr>\n",
 611 |        "      <th>2020-09-28 09:00:00</th>\n",
 612 |        "      <td>USGS</td>\n",
 613 |        "      <td>9333500</td>\n",
 614 |        "      <td>MDT</td>\n",
 615 |        "      <td>9.20</td>\n",
 616 |        "      <td>P</td>\n",
 617 |        "      <td>6.15</td>\n",
 618 |        "      <td>P</td>\n",
 619 |        "    </tr>\n",
 620 |        "    <tr>\n",
 621 |        "      <th>2020-09-28 09:15:00</th>\n",
 622 |        "      <td>USGS</td>\n",
 623 |        "      <td>9333500</td>\n",
 624 |        "      <td>MDT</td>\n",
 625 |        "      <td>9.20</td>\n",
 626 |        "      <td>P</td>\n",
 627 |        "      <td>6.15</td>\n",
 628 |        "      <td>P</td>\n",
 629 |        "    </tr>\n",
 630 |        "    <tr>\n",
 631 |        "      <th>2020-09-28 09:30:00</th>\n",
 632 |        "      <td>USGS</td>\n",
 633 |        "      <td>9333500</td>\n",
 634 |        "      <td>MDT</td>\n",
 635 |        "      <td>9.20</td>\n",
 636 |        "      <td>P</td>\n",
 637 |        "      <td>6.15</td>\n",
 638 |        "      <td>P</td>\n",
 639 |        "    </tr>\n",
 640 |        "  </tbody>\n",
 641 |        "</table>\n",
 642 |        "<p>539305 rows × 7 columns</p>\n",
 643 |        "</div>"
 644 |       ],
 645 |       "text/plain": [
 646 |        "                    agency_cd  site_no tz_cd    cfs 144166_00060_cd  \\\n",
 647 |        "datetime                                                              \n",
 648 |        "2001-05-07 01:00:00      USGS  9333500   MDT  71.00          A:[91]   \n",
 649 |        "2001-05-07 01:15:00      USGS  9333500   MDT  71.00          A:[91]   \n",
 650 |        "2001-05-07 01:30:00      USGS  9333500   MDT  71.00          A:[91]   \n",
 651 |        "2001-05-07 01:45:00      USGS  9333500   MDT  70.00          A:[91]   \n",
 652 |        "2001-05-07 02:00:00      USGS  9333500   MDT  70.00          A:[91]   \n",
 653 |        "...                       ...      ...   ...    ...             ...   \n",
 654 |        "2020-09-28 08:30:00      USGS  9333500   MDT   9.53               P   \n",
 655 |        "2020-09-28 08:45:00      USGS  9333500   MDT   9.20               P   \n",
 656 |        "2020-09-28 09:00:00      USGS  9333500   MDT   9.20               P   \n",
 657 |        "2020-09-28 09:15:00      USGS  9333500   MDT   9.20               P   \n",
 658 |        "2020-09-28 09:30:00      USGS  9333500   MDT   9.20               P   \n",
 659 |        "\n",
 660 |        "                     gage_height 144167_00065_cd  \n",
 661 |        "datetime                                          \n",
 662 |        "2001-05-07 01:00:00          NaN            None  \n",
 663 |        "2001-05-07 01:15:00          NaN            None  \n",
 664 |        "2001-05-07 01:30:00          NaN            None  \n",
 665 |        "2001-05-07 01:45:00          NaN            None  \n",
 666 |        "2001-05-07 02:00:00          NaN            None  \n",
 667 |        "...                          ...             ...  \n",
 668 |        "2020-09-28 08:30:00         6.16               P  \n",
 669 |        "2020-09-28 08:45:00         6.15               P  \n",
 670 |        "2020-09-28 09:00:00         6.15               P  \n",
 671 |        "2020-09-28 09:15:00         6.15               P  \n",
 672 |        "2020-09-28 09:30:00         6.15               P  \n",
 673 |        "\n",
 674 |        "[539305 rows x 7 columns]"
 675 |       ]
 676 |      },
 677 |      "execution_count": 15,
 678 |      "metadata": {},
 679 |      "output_type": "execute_result"
 680 |     }
 681 |    ],
 682 |    "source": [
 683 |     "dd2"
 684 |    ]
 685 |   },
 686 |   {
 687 |    "cell_type": "code",
 688 |    "execution_count": 16,
 689 |    "metadata": {
 690 |     "lines_to_next_cell": 2
 691 |    },
 692 |    "outputs": [
 693 |     {
 694 |      "data": {
 695 |       "text/plain": [
 696 |        "False"
 697 |       ]
 698 |      },
 699 |      "execution_count": 16,
 700 |      "metadata": {},
 701 |      "output_type": "execute_result"
 702 |     }
 703 |    ],
 704 |    "source": [
 705 |     "(dd2  # doctest: +SKIP\n",
 706 |     " .reset_index()\n",
 707 |     " .assign(datetime=lambda df_: df_.datetime\n",
 708 |     "       .dt.tz_localize('America/Denver', ambiguous=False))\n",
 709 |     " .set_index('datetime')\n",
 710 |     " .equals(dd)\n",
 711 |     ")"
 712 |    ]
 713 |   },
 714 |   {
 715 |    "cell_type": "code",
 716 |    "execution_count": 17,
 717 |    "metadata": {
 718 |     "lines_to_next_cell": 2
 719 |    },
 720 |    "outputs": [],
 721 |    "source": [
 722 |     "obj = dd.to_dict()"
 723 |    ]
 724 |   },
 725 |   {
 726 |    "cell_type": "code",
 727 |    "execution_count": 18,
 728 |    "metadata": {
 729 |     "lines_to_next_cell": 2
 730 |    },
 731 |    "outputs": [
 732 |     {
 733 |      "data": {
 734 |       "text/plain": [
 735 |        "True"
 736 |       ]
 737 |      },
 738 |      "execution_count": 18,
 739 |      "metadata": {},
 740 |      "output_type": "execute_result"
 741 |     }
 742 |    ],
 743 |    "source": [
 744 |     "dd2 = pd.DataFrame.from_dict(obj)\n",
 745 |     "dd.equals(dd2)"
 746 |    ]
 747 |   },
 748 |   {
 749 |    "cell_type": "code",
 750 |    "execution_count": 19,
 751 |    "metadata": {
 752 |     "lines_to_next_cell": 2
 753 |    },
 754 |    "outputs": [
 755 |     {
 756 |      "data": {
 757 |       "text/html": [
 758 |        "<div>\n",
 759 |        "<style scoped>\n",
 760 |        "    .dataframe tbody tr th:only-of-type {\n",
 761 |        "        vertical-align: middle;\n",
 762 |        "    }\n",
 763 |        "\n",
 764 |        "    .dataframe tbody tr th {\n",
 765 |        "        vertical-align: top;\n",
 766 |        "    }\n",
 767 |        "\n",
 768 |        "    .dataframe thead th {\n",
 769 |        "        text-align: right;\n",
 770 |        "    }\n",
 771 |        "</style>\n",
 772 |        "<table border=\"1\" class=\"dataframe\">\n",
 773 |        "  <thead>\n",
 774 |        "    <tr style=\"text-align: right;\">\n",
 775 |        "      <th></th>\n",
 776 |        "      <th>agency_cd</th>\n",
 777 |        "      <th>site_no</th>\n",
 778 |        "      <th>tz_cd</th>\n",
 779 |        "      <th>cfs</th>\n",
 780 |        "      <th>144166_00060_cd</th>\n",
 781 |        "      <th>gage_height</th>\n",
 782 |        "      <th>144167_00065_cd</th>\n",
 783 |        "    </tr>\n",
 784 |        "  </thead>\n",
 785 |        "  <tbody>\n",
 786 |        "    <tr>\n",
 787 |        "      <th>2001-05-07 07:00:00</th>\n",
 788 |        "      <td>USGS</td>\n",
 789 |        "      <td>9333500</td>\n",
 790 |        "      <td>MDT</td>\n",
 791 |        "      <td>71.00</td>\n",
 792 |        "      <td>A:[91]</td>\n",
 793 |        "      <td>NaN</td>\n",
 794 |        "      <td>None</td>\n",
 795 |        "    </tr>\n",
 796 |        "    <tr>\n",
 797 |        "      <th>2001-05-07 07:15:00</th>\n",
 798 |        "      <td>USGS</td>\n",
 799 |        "      <td>9333500</td>\n",
 800 |        "      <td>MDT</td>\n",
 801 |        "      <td>71.00</td>\n",
 802 |        "      <td>A:[91]</td>\n",
 803 |        "      <td>NaN</td>\n",
 804 |        "      <td>None</td>\n",
 805 |        "    </tr>\n",
 806 |        "    <tr>\n",
 807 |        "      <th>2001-05-07 07:30:00</th>\n",
 808 |        "      <td>USGS</td>\n",
 809 |        "      <td>9333500</td>\n",
 810 |        "      <td>MDT</td>\n",
 811 |        "      <td>71.00</td>\n",
 812 |        "      <td>A:[91]</td>\n",
 813 |        "      <td>NaN</td>\n",
 814 |        "      <td>None</td>\n",
 815 |        "    </tr>\n",
 816 |        "    <tr>\n",
 817 |        "      <th>2001-05-07 07:45:00</th>\n",
 818 |        "      <td>USGS</td>\n",
 819 |        "      <td>9333500</td>\n",
 820 |        "      <td>MDT</td>\n",
 821 |        "      <td>70.00</td>\n",
 822 |        "      <td>A:[91]</td>\n",
 823 |        "      <td>NaN</td>\n",
 824 |        "      <td>None</td>\n",
 825 |        "    </tr>\n",
 826 |        "    <tr>\n",
 827 |        "      <th>2001-05-07 08:00:00</th>\n",
 828 |        "      <td>USGS</td>\n",
 829 |        "      <td>9333500</td>\n",
 830 |        "      <td>MDT</td>\n",
 831 |        "      <td>70.00</td>\n",
 832 |        "      <td>A:[91]</td>\n",
 833 |        "      <td>NaN</td>\n",
 834 |        "      <td>None</td>\n",
 835 |        "    </tr>\n",
 836 |        "    <tr>\n",
 837 |        "      <th>...</th>\n",
 838 |        "      <td>...</td>\n",
 839 |        "      <td>...</td>\n",
 840 |        "      <td>...</td>\n",
 841 |        "      <td>...</td>\n",
 842 |        "      <td>...</td>\n",
 843 |        "      <td>...</td>\n",
 844 |        "      <td>...</td>\n",
 845 |        "    </tr>\n",
 846 |        "    <tr>\n",
 847 |        "      <th>2020-09-28 14:30:00</th>\n",
 848 |        "      <td>USGS</td>\n",
 849 |        "      <td>9333500</td>\n",
 850 |        "      <td>MDT</td>\n",
 851 |        "      <td>9.53</td>\n",
 852 |        "      <td>P</td>\n",
 853 |        "      <td>6.16</td>\n",
 854 |        "      <td>P</td>\n",
 855 |        "    </tr>\n",
 856 |        "    <tr>\n",
 857 |        "      <th>2020-09-28 14:45:00</th>\n",
 858 |        "      <td>USGS</td>\n",
 859 |        "      <td>9333500</td>\n",
 860 |        "      <td>MDT</td>\n",
 861 |        "      <td>9.20</td>\n",
 862 |        "      <td>P</td>\n",
 863 |        "      <td>6.15</td>\n",
 864 |        "      <td>P</td>\n",
 865 |        "    </tr>\n",
 866 |        "    <tr>\n",
 867 |        "      <th>2020-09-28 15:00:00</th>\n",
 868 |        "      <td>USGS</td>\n",
 869 |        "      <td>9333500</td>\n",
 870 |        "      <td>MDT</td>\n",
 871 |        "      <td>9.20</td>\n",
 872 |        "      <td>P</td>\n",
 873 |        "      <td>6.15</td>\n",
 874 |        "      <td>P</td>\n",
 875 |        "    </tr>\n",
 876 |        "    <tr>\n",
 877 |        "      <th>2020-09-28 15:15:00</th>\n",
 878 |        "      <td>USGS</td>\n",
 879 |        "      <td>9333500</td>\n",
 880 |        "      <td>MDT</td>\n",
 881 |        "      <td>9.20</td>\n",
 882 |        "      <td>P</td>\n",
 883 |        "      <td>6.15</td>\n",
 884 |        "      <td>P</td>\n",
 885 |        "    </tr>\n",
 886 |        "    <tr>\n",
 887 |        "      <th>2020-09-28 15:30:00</th>\n",
 888 |        "      <td>USGS</td>\n",
 889 |        "      <td>9333500</td>\n",
 890 |        "      <td>MDT</td>\n",
 891 |        "      <td>9.20</td>\n",
 892 |        "      <td>P</td>\n",
 893 |        "      <td>6.15</td>\n",
 894 |        "      <td>P</td>\n",
 895 |        "    </tr>\n",
 896 |        "  </tbody>\n",
 897 |        "</table>\n",
 898 |        "<p>539305 rows × 7 columns</p>\n",
 899 |        "</div>"
 900 |       ],
 901 |       "text/plain": [
 902 |        "                    agency_cd  site_no tz_cd    cfs 144166_00060_cd  \\\n",
 903 |        "2001-05-07 07:00:00      USGS  9333500   MDT  71.00          A:[91]   \n",
 904 |        "2001-05-07 07:15:00      USGS  9333500   MDT  71.00          A:[91]   \n",
 905 |        "2001-05-07 07:30:00      USGS  9333500   MDT  71.00          A:[91]   \n",
 906 |        "2001-05-07 07:45:00      USGS  9333500   MDT  70.00          A:[91]   \n",
 907 |        "2001-05-07 08:00:00      USGS  9333500   MDT  70.00          A:[91]   \n",
 908 |        "...                       ...      ...   ...    ...             ...   \n",
 909 |        "2020-09-28 14:30:00      USGS  9333500   MDT   9.53               P   \n",
 910 |        "2020-09-28 14:45:00      USGS  9333500   MDT   9.20               P   \n",
 911 |        "2020-09-28 15:00:00      USGS  9333500   MDT   9.20               P   \n",
 912 |        "2020-09-28 15:15:00      USGS  9333500   MDT   9.20               P   \n",
 913 |        "2020-09-28 15:30:00      USGS  9333500   MDT   9.20               P   \n",
 914 |        "\n",
 915 |        "                     gage_height 144167_00065_cd  \n",
 916 |        "2001-05-07 07:00:00          NaN            None  \n",
 917 |        "2001-05-07 07:15:00          NaN            None  \n",
 918 |        "2001-05-07 07:30:00          NaN            None  \n",
 919 |        "2001-05-07 07:45:00          NaN            None  \n",
 920 |        "2001-05-07 08:00:00          NaN            None  \n",
 921 |        "...                          ...             ...  \n",
 922 |        "2020-09-28 14:30:00         6.16               P  \n",
 923 |        "2020-09-28 14:45:00         6.15               P  \n",
 924 |        "2020-09-28 15:00:00         6.15               P  \n",
 925 |        "2020-09-28 15:15:00         6.15               P  \n",
 926 |        "2020-09-28 15:30:00         6.15               P  \n",
 927 |        "\n",
 928 |        "[539305 rows x 7 columns]"
 929 |       ]
 930 |      },
 931 |      "execution_count": 19,
 932 |      "metadata": {},
 933 |      "output_type": "execute_result"
 934 |     }
 935 |    ],
 936 |    "source": [
 937 |     "dd.to_json('/tmp/dd.json.gz')\n",
 938 |     "dd2 = pd.read_json('/tmp/dd.json.gz')\n",
 939 |     "dd2"
 940 |    ]
 941 |   },
 942 |   {
 943 |    "cell_type": "code",
 944 |    "execution_count": 20,
 945 |    "metadata": {
 946 |     "lines_to_next_cell": 2
 947 |    },
 948 |    "outputs": [
 949 |     {
 950 |      "data": {
 951 |       "text/plain": [
 952 |        "False"
 953 |       ]
 954 |      },
 955 |      "execution_count": 20,
 956 |      "metadata": {},
 957 |      "output_type": "execute_result"
 958 |     }
 959 |    ],
 960 |    "source": [
 961 |     "dd2.equals(dd)"
 962 |    ]
 963 |   },
 964 |   {
 965 |    "cell_type": "code",
 966 |    "execution_count": 21,
 967 |    "metadata": {
 968 |     "lines_to_next_cell": 2
 969 |    },
 970 |    "outputs": [],
 971 |    "source": [
 972 |     "dd3 = (dd2\n",
 973 |     " .reset_index()\n",
 974 |     " .rename(columns={'index':'datetime'})\n",
 975 |     " .assign(datetime=lambda df_: df_.datetime.dt.tz_localize(tz='UTC')\n",
 976 |     "         .dt.tz_convert('America/Denver'))\n",
 977 |     " .set_index('datetime')\n",
 978 |     ")"
 979 |    ]
 980 |   },
 981 |   {
 982 |    "cell_type": "code",
 983 |    "execution_count": 22,
 984 |    "metadata": {
 985 |     "lines_to_next_cell": 2
 986 |    },
 987 |    "outputs": [
 988 |     {
 989 |      "data": {
 990 |       "text/html": [
 991 |        "<div>\n",
 992 |        "<style scoped>\n",
 993 |        "    .dataframe tbody tr th:only-of-type {\n",
 994 |        "        vertical-align: middle;\n",
 995 |        "    }\n",
 996 |        "\n",
 997 |        "    .dataframe tbody tr th {\n",
 998 |        "        vertical-align: top;\n",
 999 |        "    }\n",
1000 |        "\n",
1001 |        "    .dataframe thead th {\n",
1002 |        "        text-align: right;\n",
1003 |        "    }\n",
1004 |        "</style>\n",
1005 |        "<table border=\"1\" class=\"dataframe\">\n",
1006 |        "  <thead>\n",
1007 |        "    <tr style=\"text-align: right;\">\n",
1008 |        "      <th></th>\n",
1009 |        "      <th>agency_cd</th>\n",
1010 |        "      <th>site_no</th>\n",
1011 |        "      <th>tz_cd</th>\n",
1012 |        "      <th>cfs</th>\n",
1013 |        "      <th>144166_00060_cd</th>\n",
1014 |        "      <th>gage_height</th>\n",
1015 |        "      <th>144167_00065_cd</th>\n",
1016 |        "    </tr>\n",
1017 |        "    <tr>\n",
1018 |        "      <th>datetime</th>\n",
1019 |        "      <th></th>\n",
1020 |        "      <th></th>\n",
1021 |        "      <th></th>\n",
1022 |        "      <th></th>\n",
1023 |        "      <th></th>\n",
1024 |        "      <th></th>\n",
1025 |        "      <th></th>\n",
1026 |        "    </tr>\n",
1027 |        "  </thead>\n",
1028 |        "  <tbody>\n",
1029 |        "    <tr>\n",
1030 |        "      <th>2001-05-07 01:00:00-06:00</th>\n",
1031 |        "      <td>USGS</td>\n",
1032 |        "      <td>9333500</td>\n",
1033 |        "      <td>MDT</td>\n",
1034 |        "      <td>71.00</td>\n",
1035 |        "      <td>A:[91]</td>\n",
1036 |        "      <td>NaN</td>\n",
1037 |        "      <td>None</td>\n",
1038 |        "    </tr>\n",
1039 |        "    <tr>\n",
1040 |        "      <th>2001-05-07 01:15:00-06:00</th>\n",
1041 |        "      <td>USGS</td>\n",
1042 |        "      <td>9333500</td>\n",
1043 |        "      <td>MDT</td>\n",
1044 |        "      <td>71.00</td>\n",
1045 |        "      <td>A:[91]</td>\n",
1046 |        "      <td>NaN</td>\n",
1047 |        "      <td>None</td>\n",
1048 |        "    </tr>\n",
1049 |        "    <tr>\n",
1050 |        "      <th>2001-05-07 01:30:00-06:00</th>\n",
1051 |        "      <td>USGS</td>\n",
1052 |        "      <td>9333500</td>\n",
1053 |        "      <td>MDT</td>\n",
1054 |        "      <td>71.00</td>\n",
1055 |        "      <td>A:[91]</td>\n",
1056 |        "      <td>NaN</td>\n",
1057 |        "      <td>None</td>\n",
1058 |        "    </tr>\n",
1059 |        "    <tr>\n",
1060 |        "      <th>2001-05-07 01:45:00-06:00</th>\n",
1061 |        "      <td>USGS</td>\n",
1062 |        "      <td>9333500</td>\n",
1063 |        "      <td>MDT</td>\n",
1064 |        "      <td>70.00</td>\n",
1065 |        "      <td>A:[91]</td>\n",
1066 |        "      <td>NaN</td>\n",
1067 |        "      <td>None</td>\n",
1068 |        "    </tr>\n",
1069 |        "    <tr>\n",
1070 |        "      <th>2001-05-07 02:00:00-06:00</th>\n",
1071 |        "      <td>USGS</td>\n",
1072 |        "      <td>9333500</td>\n",
1073 |        "      <td>MDT</td>\n",
1074 |        "      <td>70.00</td>\n",
1075 |        "      <td>A:[91]</td>\n",
1076 |        "      <td>NaN</td>\n",
1077 |        "      <td>None</td>\n",
1078 |        "    </tr>\n",
1079 |        "    <tr>\n",
1080 |        "      <th>...</th>\n",
1081 |        "      <td>...</td>\n",
1082 |        "      <td>...</td>\n",
1083 |        "      <td>...</td>\n",
1084 |        "      <td>...</td>\n",
1085 |        "      <td>...</td>\n",
1086 |        "      <td>...</td>\n",
1087 |        "      <td>...</td>\n",
1088 |        "    </tr>\n",
1089 |        "    <tr>\n",
1090 |        "      <th>2020-09-28 08:30:00-06:00</th>\n",
1091 |        "      <td>USGS</td>\n",
1092 |        "      <td>9333500</td>\n",
1093 |        "      <td>MDT</td>\n",
1094 |        "      <td>9.53</td>\n",
1095 |        "      <td>P</td>\n",
1096 |        "      <td>6.16</td>\n",
1097 |        "      <td>P</td>\n",
1098 |        "    </tr>\n",
1099 |        "    <tr>\n",
1100 |        "      <th>2020-09-28 08:45:00-06:00</th>\n",
1101 |        "      <td>USGS</td>\n",
1102 |        "      <td>9333500</td>\n",
1103 |        "      <td>MDT</td>\n",
1104 |        "      <td>9.20</td>\n",
1105 |        "      <td>P</td>\n",
1106 |        "      <td>6.15</td>\n",
1107 |        "      <td>P</td>\n",
1108 |        "    </tr>\n",
1109 |        "    <tr>\n",
1110 |        "      <th>2020-09-28 09:00:00-06:00</th>\n",
1111 |        "      <td>USGS</td>\n",
1112 |        "      <td>9333500</td>\n",
1113 |        "      <td>MDT</td>\n",
1114 |        "      <td>9.20</td>\n",
1115 |        "      <td>P</td>\n",
1116 |        "      <td>6.15</td>\n",
1117 |        "      <td>P</td>\n",
1118 |        "    </tr>\n",
1119 |        "    <tr>\n",
1120 |        "      <th>2020-09-28 09:15:00-06:00</th>\n",
1121 |        "      <td>USGS</td>\n",
1122 |        "      <td>9333500</td>\n",
1123 |        "      <td>MDT</td>\n",
1124 |        "      <td>9.20</td>\n",
1125 |        "      <td>P</td>\n",
1126 |        "      <td>6.15</td>\n",
1127 |        "      <td>P</td>\n",
1128 |        "    </tr>\n",
1129 |        "    <tr>\n",
1130 |        "      <th>2020-09-28 09:30:00-06:00</th>\n",
1131 |        "      <td>USGS</td>\n",
1132 |        "      <td>9333500</td>\n",
1133 |        "      <td>MDT</td>\n",
1134 |        "      <td>9.20</td>\n",
1135 |        "      <td>P</td>\n",
1136 |        "      <td>6.15</td>\n",
1137 |        "      <td>P</td>\n",
1138 |        "    </tr>\n",
1139 |        "  </tbody>\n",
1140 |        "</table>\n",
1141 |        "<p>539305 rows × 7 columns</p>\n",
1142 |        "</div>"
1143 |       ],
1144 |       "text/plain": [
1145 |        "                          agency_cd  site_no tz_cd    cfs 144166_00060_cd  \\\n",
1146 |        "datetime                                                                    \n",
1147 |        "2001-05-07 01:00:00-06:00      USGS  9333500   MDT  71.00          A:[91]   \n",
1148 |        "2001-05-07 01:15:00-06:00      USGS  9333500   MDT  71.00          A:[91]   \n",
1149 |        "2001-05-07 01:30:00-06:00      USGS  9333500   MDT  71.00          A:[91]   \n",
1150 |        "2001-05-07 01:45:00-06:00      USGS  9333500   MDT  70.00          A:[91]   \n",
1151 |        "2001-05-07 02:00:00-06:00      USGS  9333500   MDT  70.00          A:[91]   \n",
1152 |        "...                             ...      ...   ...    ...             ...   \n",
1153 |        "2020-09-28 08:30:00-06:00      USGS  9333500   MDT   9.53               P   \n",
1154 |        "2020-09-28 08:45:00-06:00      USGS  9333500   MDT   9.20               P   \n",
1155 |        "2020-09-28 09:00:00-06:00      USGS  9333500   MDT   9.20               P   \n",
1156 |        "2020-09-28 09:15:00-06:00      USGS  9333500   MDT   9.20               P   \n",
1157 |        "2020-09-28 09:30:00-06:00      USGS  9333500   MDT   9.20               P   \n",
1158 |        "\n",
1159 |        "                           gage_height 144167_00065_cd  \n",
1160 |        "datetime                                                \n",
1161 |        "2001-05-07 01:00:00-06:00          NaN            None  \n",
1162 |        "2001-05-07 01:15:00-06:00          NaN            None  \n",
1163 |        "2001-05-07 01:30:00-06:00          NaN            None  \n",
1164 |        "2001-05-07 01:45:00-06:00          NaN            None  \n",
1165 |        "2001-05-07 02:00:00-06:00          NaN            None  \n",
1166 |        "...                                ...             ...  \n",
1167 |        "2020-09-28 08:30:00-06:00         6.16               P  \n",
1168 |        "2020-09-28 08:45:00-06:00         6.15               P  \n",
1169 |        "2020-09-28 09:00:00-06:00         6.15               P  \n",
1170 |        "2020-09-28 09:15:00-06:00         6.15               P  \n",
1171 |        "2020-09-28 09:30:00-06:00         6.15               P  \n",
1172 |        "\n",
1173 |        "[539305 rows x 7 columns]"
1174 |       ]
1175 |      },
1176 |      "execution_count": 22,
1177 |      "metadata": {},
1178 |      "output_type": "execute_result"
1179 |     }
1180 |    ],
1181 |    "source": [
1182 |     "dd3"
1183 |    ]
1184 |   },
1185 |   {
1186 |    "cell_type": "code",
1187 |    "execution_count": 23,
1188 |    "metadata": {
1189 |     "lines_to_next_cell": 2
1190 |    },
1191 |    "outputs": [
1192 |     {
1193 |      "data": {
1194 |       "text/plain": [
1195 |        "False"
1196 |       ]
1197 |      },
1198 |      "execution_count": 23,
1199 |      "metadata": {},
1200 |      "output_type": "execute_result"
1201 |     }
1202 |    ],
1203 |    "source": [
1204 |     "dd3.equals(dd)"
1205 |    ]
1206 |   },
1207 |   {
1208 |    "cell_type": "code",
1209 |    "execution_count": 24,
1210 |    "metadata": {
1211 |     "lines_to_next_cell": 2
1212 |    },
1213 |    "outputs": [
1214 |     {
1215 |      "data": {
1216 |       "text/plain": [
1217 |        "True"
1218 |       ]
1219 |      },
1220 |      "execution_count": 24,
1221 |      "metadata": {},
1222 |      "output_type": "execute_result"
1223 |     }
1224 |    ],
1225 |    "source": [
1226 |     "dd3.round(3).equals(dd)"
1227 |    ]
1228 |   },
1229 |   {
1230 |    "cell_type": "code",
1231 |    "execution_count": 25,
1232 |    "metadata": {
1233 |     "lines_to_next_cell": 2
1234 |    },
1235 |    "outputs": [
1236 |     {
1237 |      "data": {
1238 |       "text/html": [
1239 |        "<div>\n",
1240 |        "<style scoped>\n",
1241 |        "    .dataframe tbody tr th:only-of-type {\n",
1242 |        "        vertical-align: middle;\n",
1243 |        "    }\n",
1244 |        "\n",
1245 |        "    .dataframe tbody tr th {\n",
1246 |        "        vertical-align: top;\n",
1247 |        "    }\n",
1248 |        "\n",
1249 |        "    .dataframe thead th {\n",
1250 |        "        text-align: right;\n",
1251 |        "    }\n",
1252 |        "</style>\n",
1253 |        "<table border=\"1\" class=\"dataframe\">\n",
1254 |        "  <thead>\n",
1255 |        "    <tr style=\"text-align: right;\">\n",
1256 |        "      <th></th>\n",
1257 |        "      <th>agency_cd</th>\n",
1258 |        "      <th>site_no</th>\n",
1259 |        "      <th>tz_cd</th>\n",
1260 |        "      <th>cfs</th>\n",
1261 |        "      <th>144166_00060_cd</th>\n",
1262 |        "      <th>gage_height</th>\n",
1263 |        "      <th>144167_00065_cd</th>\n",
1264 |        "    </tr>\n",
1265 |        "    <tr>\n",
1266 |        "      <th>datetime</th>\n",
1267 |        "      <th></th>\n",
1268 |        "      <th></th>\n",
1269 |        "      <th></th>\n",
1270 |        "      <th></th>\n",
1271 |        "      <th></th>\n",
1272 |        "      <th></th>\n",
1273 |        "      <th></th>\n",
1274 |        "    </tr>\n",
1275 |        "  </thead>\n",
1276 |        "  <tbody>\n",
1277 |        "    <tr>\n",
1278 |        "      <th>2001-05-07 01:00:00-06:00</th>\n",
1279 |        "      <td>USGS</td>\n",
1280 |        "      <td>9333500</td>\n",
1281 |        "      <td>MDT</td>\n",
1282 |        "      <td>71.0</td>\n",
1283 |        "      <td>A:[91]</td>\n",
1284 |        "      <td>NaN</td>\n",
1285 |        "      <td>NaN</td>\n",
1286 |        "    </tr>\n",
1287 |        "    <tr>\n",
1288 |        "      <th>2001-05-07 01:15:00-06:00</th>\n",
1289 |        "      <td>USGS</td>\n",
1290 |        "      <td>9333500</td>\n",
1291 |        "      <td>MDT</td>\n",
1292 |        "      <td>71.0</td>\n",
1293 |        "      <td>A:[91]</td>\n",
1294 |        "      <td>NaN</td>\n",
1295 |        "      <td>NaN</td>\n",
1296 |        "    </tr>\n",
1297 |        "    <tr>\n",
1298 |        "      <th>2001-05-07 01:30:00-06:00</th>\n",
1299 |        "      <td>USGS</td>\n",
1300 |        "      <td>9333500</td>\n",
1301 |        "      <td>MDT</td>\n",
1302 |        "      <td>71.0</td>\n",
1303 |        "      <td>A:[91]</td>\n",
1304 |        "      <td>NaN</td>\n",
1305 |        "      <td>NaN</td>\n",
1306 |        "    </tr>\n",
1307 |        "    <tr>\n",
1308 |        "      <th>2001-05-07 01:45:00-06:00</th>\n",
1309 |        "      <td>USGS</td>\n",
1310 |        "      <td>9333500</td>\n",
1311 |        "      <td>MDT</td>\n",
1312 |        "      <td>70.0</td>\n",
1313 |        "      <td>A:[91]</td>\n",
1314 |        "      <td>NaN</td>\n",
1315 |        "      <td>NaN</td>\n",
1316 |        "    </tr>\n",
1317 |        "    <tr>\n",
1318 |        "      <th>2001-05-07 02:00:00-06:00</th>\n",
1319 |        "      <td>USGS</td>\n",
1320 |        "      <td>9333500</td>\n",
1321 |        "      <td>MDT</td>\n",
1322 |        "      <td>70.0</td>\n",
1323 |        "      <td>A:[91]</td>\n",
1324 |        "      <td>NaN</td>\n",
1325 |        "      <td>NaN</td>\n",
1326 |        "    </tr>\n",
1327 |        "  </tbody>\n",
1328 |        "</table>\n",
1329 |        "</div>"
1330 |       ],
1331 |       "text/plain": [
1332 |        "                          agency_cd  site_no tz_cd   cfs 144166_00060_cd  \\\n",
1333 |        "datetime                                                                   \n",
1334 |        "2001-05-07 01:00:00-06:00      USGS  9333500   MDT  71.0          A:[91]   \n",
1335 |        "2001-05-07 01:15:00-06:00      USGS  9333500   MDT  71.0          A:[91]   \n",
1336 |        "2001-05-07 01:30:00-06:00      USGS  9333500   MDT  71.0          A:[91]   \n",
1337 |        "2001-05-07 01:45:00-06:00      USGS  9333500   MDT  70.0          A:[91]   \n",
1338 |        "2001-05-07 02:00:00-06:00      USGS  9333500   MDT  70.0          A:[91]   \n",
1339 |        "\n",
1340 |        "                           gage_height 144167_00065_cd  \n",
1341 |        "datetime                                                \n",
1342 |        "2001-05-07 01:00:00-06:00          NaN             NaN  \n",
1343 |        "2001-05-07 01:15:00-06:00          NaN             NaN  \n",
1344 |        "2001-05-07 01:30:00-06:00          NaN             NaN  \n",
1345 |        "2001-05-07 01:45:00-06:00          NaN             NaN  \n",
1346 |        "2001-05-07 02:00:00-06:00          NaN             NaN  "
1347 |       ]
1348 |      },
1349 |      "execution_count": 25,
1350 |      "metadata": {},
1351 |      "output_type": "execute_result"
1352 |     }
1353 |    ],
1354 |    "source": [
1355 |     "dd.head()"
1356 |    ]
1357 |   },
1358 |   {
1359 |    "cell_type": "code",
1360 |    "execution_count": 26,
1361 |    "metadata": {
1362 |     "lines_to_next_cell": 2
1363 |    },
1364 |    "outputs": [
1365 |     {
1366 |      "data": {
1367 |       "text/plain": [
1368 |        "'{\"agency_cd\":{\"989218800000\":\"USGS\",\"989219700000\":\"USGS\",\"9'"
1369 |       ]
1370 |      },
1371 |      "execution_count": 26,
1372 |      "metadata": {},
1373 |      "output_type": "execute_result"
1374 |     }
1375 |    ],
1376 |    "source": [
1377 |     "dd.head().to_json()[:60]"
1378 |    ]
1379 |   }
1380 |  ],
1381 |  "metadata": {
1382 |   "jupytext": {
1383 |    "cell_metadata_filter": "-all",
1384 |    "main_language": "python",
1385 |    "notebook_metadata_filter": "-all"
1386 |   },
1387 |   "kernelspec": {
1388 |    "display_name": "Python 3",
1389 |    "language": "python",
1390 |    "name": "python3"
1391 |   },
1392 |   "language_info": {
1393 |    "codemirror_mode": {
1394 |     "name": "ipython",
1395 |     "version": 3
1396 |    },
1397 |    "file_extension": ".py",
1398 |    "mimetype": "text/x-python",
1399 |    "name": "python",
1400 |    "nbconvert_exporter": "python",
1401 |    "pygments_lexer": "ipython3",
1402 |    "version": "3.8.5"
1403 |   }
1404 |  },
1405 |  "nbformat": 4,
1406 |  "nbformat_minor": 4
1407 | }
1408 | 


--------------------------------------------------------------------------------