├── 210124_venn.ipynb ├── 210219_Medium_Squarify_Matplotlib.ipynb ├── 210630_Medium_ColabwithR.ipynb ├── 210630_Medium_Exercise_Visualization.ipynb ├── 220219_Medium_PoissonDistribution.ipynb ├── 220220_Medium_ChiSquareDistribution.ipynb ├── 220220_Medium_GeometricDistribution.ipynb ├── 220225_Medium_PDF.ipynb └── README.md /210124_venn.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "nbformat": 4, 3 | "nbformat_minor": 0, 4 | "metadata": { 5 | "colab": { 6 | "name": "Medium_210124Venn.ipynb", 7 | "provenance": [], 8 | "collapsed_sections": [] 9 | }, 10 | "kernelspec": { 11 | "name": "python3", 12 | "display_name": "Python 3" 13 | } 14 | }, 15 | "cells": [ 16 | { 17 | "cell_type": "markdown", 18 | "metadata": { 19 | "id": "m5FstR3BXWxM" 20 | }, 21 | "source": [ 22 | "# Venn Diagrams\r\n", 23 | "\r\n", 24 | "## Kate Wall\r\n", 25 | "## Last Edit: Jan. 24, 2021\r\n", 26 | "## How to easily make Venn Diagrams from pandas DataFrames\r\n" 27 | ] 28 | }, 29 | { 30 | "cell_type": "code", 31 | "metadata": { 32 | "id": "mSJrqTGenhbe" 33 | }, 34 | "source": [ 35 | "from collections import Counter\n", 36 | "from matplotlib_venn import venn2, venn3\n", 37 | "import matplotlib.pyplot as plt\n", 38 | "import pandas as pd\n", 39 | "from IPython.core.display import HTML\n", 40 | "def multi_table(table_list): #for visualizing tables in the same cell\n", 41 | " return HTML(\n", 42 | " '' +\n", 43 | " ''.join(['' for table in table_list]) +\n", 44 | " '
' + table._repr_html_() + '
'\n", 45 | " ) #https://github.com/epmoyer/ipy_table/issues/24" 46 | ], 47 | "execution_count": 1, 48 | "outputs": [] 49 | }, 50 | { 51 | "cell_type": "markdown", 52 | "metadata": { 53 | "id": "zVJb4ddcV9MH" 54 | }, 55 | "source": [ 56 | "# Setup" 57 | ] 58 | }, 59 | { 60 | "cell_type": "code", 61 | "metadata": { 62 | "colab": { 63 | "base_uri": "https://localhost:8080/", 64 | "height": 260 65 | }, 66 | "id": "08njqMO1Vz9r", 67 | "outputId": "11a878f9-0f36-46f5-89d2-3ed9ed7c7f7c" 68 | }, 69 | "source": [ 70 | "groupA = ['person1','person2','person3','person4','person5','person6','person7']\r\n", 71 | "groupB = ['person1','person2','person3', 'person8','person9']\r\n", 72 | "groupC = ['person1','person2', 'person4', 'person9','person10']\r\n", 73 | "dfA = pd.DataFrame(groupA,columns=['A'])\r\n", 74 | "dfB = pd.DataFrame(groupB,columns=['B'])\r\n", 75 | "dfC = pd.DataFrame(groupC,columns=['C'])\r\n", 76 | "multi_table([dfA,dfB,dfC])" 77 | ], 78 | "execution_count": 2, 79 | "outputs": [ 80 | { 81 | "output_type": "execute_result", 82 | "data": { 83 | "text/html": [ 84 | "
\n", 85 | "\n", 98 | "\n", 99 | " \n", 100 | " \n", 101 | " \n", 102 | " \n", 103 | " \n", 104 | " \n", 105 | " \n", 106 | " \n", 107 | " \n", 108 | " \n", 109 | " \n", 110 | " \n", 111 | " \n", 112 | " \n", 113 | " \n", 114 | " \n", 115 | " \n", 116 | " \n", 117 | " \n", 118 | " \n", 119 | " \n", 120 | " \n", 121 | " \n", 122 | " \n", 123 | " \n", 124 | " \n", 125 | " \n", 126 | " \n", 127 | " \n", 128 | " \n", 129 | " \n", 130 | " \n", 131 | " \n", 132 | " \n", 133 | " \n", 134 | " \n", 135 | "
A
0person1
1person2
2person3
3person4
4person5
5person6
6person7
\n", 136 | "
\n", 137 | "\n", 150 | "\n", 151 | " \n", 152 | " \n", 153 | " \n", 154 | " \n", 155 | " \n", 156 | " \n", 157 | " \n", 158 | " \n", 159 | " \n", 160 | " \n", 161 | " \n", 162 | " \n", 163 | " \n", 164 | " \n", 165 | " \n", 166 | " \n", 167 | " \n", 168 | " \n", 169 | " \n", 170 | " \n", 171 | " \n", 172 | " \n", 173 | " \n", 174 | " \n", 175 | " \n", 176 | " \n", 177 | " \n", 178 | " \n", 179 | "
B
0person1
1person2
2person3
3person8
4person9
\n", 180 | "
\n", 181 | "\n", 194 | "\n", 195 | " \n", 196 | " \n", 197 | " \n", 198 | " \n", 199 | " \n", 200 | " \n", 201 | " \n", 202 | " \n", 203 | " \n", 204 | " \n", 205 | " \n", 206 | " \n", 207 | " \n", 208 | " \n", 209 | " \n", 210 | " \n", 211 | " \n", 212 | " \n", 213 | " \n", 214 | " \n", 215 | " \n", 216 | " \n", 217 | " \n", 218 | " \n", 219 | " \n", 220 | " \n", 221 | " \n", 222 | " \n", 223 | "
C
0person1
1person2
2person4
3person9
4person10
\n", 224 | "
" 225 | ], 226 | "text/plain": [ 227 | "" 228 | ] 229 | }, 230 | "metadata": { 231 | "tags": [] 232 | }, 233 | "execution_count": 2 234 | } 235 | ] 236 | }, 237 | { 238 | "cell_type": "code", 239 | "metadata": { 240 | "colab": { 241 | "base_uri": "https://localhost:8080/", 242 | "height": 345 243 | }, 244 | "id": "D3FzGXlItoZh", 245 | "outputId": "0587d28b-82d3-4330-a781-5d7a28ff3c21" 246 | }, 247 | "source": [ 248 | "people = ['person1','person2','person3','person4','person5','person6','person7','person8','person9','person10']\r\n", 249 | "names = ['angela ','nick ','harry ','nicole ','britney','haseem ','anna ','sarah ','taylor ','jim ']\r\n", 250 | "roster = pd.DataFrame(zip(people,names),columns=['people','name'])\r\n", 251 | "roster" 252 | ], 253 | "execution_count": 3, 254 | "outputs": [ 255 | { 256 | "output_type": "execute_result", 257 | "data": { 258 | "text/html": [ 259 | "
\n", 260 | "\n", 273 | "\n", 274 | " \n", 275 | " \n", 276 | " \n", 277 | " \n", 278 | " \n", 279 | " \n", 280 | " \n", 281 | " \n", 282 | " \n", 283 | " \n", 284 | " \n", 285 | " \n", 286 | " \n", 287 | " \n", 288 | " \n", 289 | " \n", 290 | " \n", 291 | " \n", 292 | " \n", 293 | " \n", 294 | " \n", 295 | " \n", 296 | " \n", 297 | " \n", 298 | " \n", 299 | " \n", 300 | " \n", 301 | " \n", 302 | " \n", 303 | " \n", 304 | " \n", 305 | " \n", 306 | " \n", 307 | " \n", 308 | " \n", 309 | " \n", 310 | " \n", 311 | " \n", 312 | " \n", 313 | " \n", 314 | " \n", 315 | " \n", 316 | " \n", 317 | " \n", 318 | " \n", 319 | " \n", 320 | " \n", 321 | " \n", 322 | " \n", 323 | " \n", 324 | " \n", 325 | " \n", 326 | " \n", 327 | " \n", 328 | " \n", 329 | " \n", 330 | " \n", 331 | " \n", 332 | " \n", 333 | "
peoplename
0person1angela
1person2nick
2person3harry
3person4nicole
4person5britney
5person6haseem
6person7anna
7person8sarah
8person9taylor
9person10jim
\n", 334 | "
" 335 | ], 336 | "text/plain": [ 337 | " people name\n", 338 | "0 person1 angela \n", 339 | "1 person2 nick \n", 340 | "2 person3 harry \n", 341 | "3 person4 nicole \n", 342 | "4 person5 britney\n", 343 | "5 person6 haseem \n", 344 | "6 person7 anna \n", 345 | "7 person8 sarah \n", 346 | "8 person9 taylor \n", 347 | "9 person10 jim " 348 | ] 349 | }, 350 | "metadata": { 351 | "tags": [] 352 | }, 353 | "execution_count": 3 354 | } 355 | ] 356 | }, 357 | { 358 | "cell_type": "code", 359 | "metadata": { 360 | "colab": { 361 | "base_uri": "https://localhost:8080/" 362 | }, 363 | "id": "FXD2XRNYvtsB", 364 | "outputId": "a42560d1-2c05-4a51-b07f-93a3bb0c2826" 365 | }, 366 | "source": [ 367 | "mapRoster = roster.set_index('people').squeeze().to_dict()\r\n", 368 | "mapRoster" 369 | ], 370 | "execution_count": 4, 371 | "outputs": [ 372 | { 373 | "output_type": "execute_result", 374 | "data": { 375 | "text/plain": [ 376 | "{'person1': 'angela ',\n", 377 | " 'person10': 'jim ',\n", 378 | " 'person2': 'nick ',\n", 379 | " 'person3': 'harry ',\n", 380 | " 'person4': 'nicole ',\n", 381 | " 'person5': 'britney',\n", 382 | " 'person6': 'haseem ',\n", 383 | " 'person7': 'anna ',\n", 384 | " 'person8': 'sarah ',\n", 385 | " 'person9': 'taylor '}" 386 | ] 387 | }, 388 | "metadata": { 389 | "tags": [] 390 | }, 391 | "execution_count": 4 392 | } 393 | ] 394 | }, 395 | { 396 | "cell_type": "code", 397 | "metadata": { 398 | "colab": { 399 | "base_uri": "https://localhost:8080/", 400 | "height": 260 401 | }, 402 | "id": "6r9XoI2Q32s8", 403 | "outputId": "bb7d358f-2fbc-4d1e-fdf7-2497f6c58446" 404 | }, 405 | "source": [ 406 | "dfA['ANames'] = dfA.A.map(mapRoster)\n", 407 | "dfB['BNames'] = dfB.B.map(mapRoster)\n", 408 | "dfC['CNames'] = dfC.C.map(mapRoster)\n", 409 | "multi_table([dfA,dfB,dfC])" 410 | ], 411 | "execution_count": 5, 412 | "outputs": [ 413 | { 414 | "output_type": "execute_result", 415 | "data": { 416 | "text/html": [ 417 | "
\n", 418 | "\n", 431 | "\n", 432 | " \n", 433 | " \n", 434 | " \n", 435 | " \n", 436 | " \n", 437 | " \n", 438 | " \n", 439 | " \n", 440 | " \n", 441 | " \n", 442 | " \n", 443 | " \n", 444 | " \n", 445 | " \n", 446 | " \n", 447 | " \n", 448 | " \n", 449 | " \n", 450 | " \n", 451 | " \n", 452 | " \n", 453 | " \n", 454 | " \n", 455 | " \n", 456 | " \n", 457 | " \n", 458 | " \n", 459 | " \n", 460 | " \n", 461 | " \n", 462 | " \n", 463 | " \n", 464 | " \n", 465 | " \n", 466 | " \n", 467 | " \n", 468 | " \n", 469 | " \n", 470 | " \n", 471 | " \n", 472 | " \n", 473 | " \n", 474 | " \n", 475 | " \n", 476 | "
AANames
0person1angela
1person2nick
2person3harry
3person4nicole
4person5britney
5person6haseem
6person7anna
\n", 477 | "
\n", 478 | "\n", 491 | "\n", 492 | " \n", 493 | " \n", 494 | " \n", 495 | " \n", 496 | " \n", 497 | " \n", 498 | " \n", 499 | " \n", 500 | " \n", 501 | " \n", 502 | " \n", 503 | " \n", 504 | " \n", 505 | " \n", 506 | " \n", 507 | " \n", 508 | " \n", 509 | " \n", 510 | " \n", 511 | " \n", 512 | " \n", 513 | " \n", 514 | " \n", 515 | " \n", 516 | " \n", 517 | " \n", 518 | " \n", 519 | " \n", 520 | " \n", 521 | " \n", 522 | " \n", 523 | " \n", 524 | " \n", 525 | " \n", 526 | "
BBNames
0person1angela
1person2nick
2person3harry
3person8sarah
4person9taylor
\n", 527 | "
\n", 528 | "\n", 541 | "\n", 542 | " \n", 543 | " \n", 544 | " \n", 545 | " \n", 546 | " \n", 547 | " \n", 548 | " \n", 549 | " \n", 550 | " \n", 551 | " \n", 552 | " \n", 553 | " \n", 554 | " \n", 555 | " \n", 556 | " \n", 557 | " \n", 558 | " \n", 559 | " \n", 560 | " \n", 561 | " \n", 562 | " \n", 563 | " \n", 564 | " \n", 565 | " \n", 566 | " \n", 567 | " \n", 568 | " \n", 569 | " \n", 570 | " \n", 571 | " \n", 572 | " \n", 573 | " \n", 574 | " \n", 575 | " \n", 576 | "
CCNames
0person1angela
1person2nick
2person4nicole
3person9taylor
4person10jim
\n", 577 | "
" 578 | ], 579 | "text/plain": [ 580 | "" 581 | ] 582 | }, 583 | "metadata": { 584 | "tags": [] 585 | }, 586 | "execution_count": 5 587 | } 588 | ] 589 | }, 590 | { 591 | "cell_type": "code", 592 | "metadata": { 593 | "colab": { 594 | "base_uri": "https://localhost:8080/", 595 | "height": 260 596 | }, 597 | "id": "aU_lAO0yDJSC", 598 | "outputId": "79833585-ae71-4bdd-fd66-9020184d3066" 599 | }, 600 | "source": [ 601 | "del dfA['A'],dfB['B'],dfC['C']\r\n", 602 | "multi_table([dfA,dfB,dfC])" 603 | ], 604 | "execution_count": 6, 605 | "outputs": [ 606 | { 607 | "output_type": "execute_result", 608 | "data": { 609 | "text/html": [ 610 | "
\n", 611 | "\n", 624 | "\n", 625 | " \n", 626 | " \n", 627 | " \n", 628 | " \n", 629 | " \n", 630 | " \n", 631 | " \n", 632 | " \n", 633 | " \n", 634 | " \n", 635 | " \n", 636 | " \n", 637 | " \n", 638 | " \n", 639 | " \n", 640 | " \n", 641 | " \n", 642 | " \n", 643 | " \n", 644 | " \n", 645 | " \n", 646 | " \n", 647 | " \n", 648 | " \n", 649 | " \n", 650 | " \n", 651 | " \n", 652 | " \n", 653 | " \n", 654 | " \n", 655 | " \n", 656 | " \n", 657 | " \n", 658 | " \n", 659 | " \n", 660 | " \n", 661 | "
ANames
0angela
1nick
2harry
3nicole
4britney
5haseem
6anna
\n", 662 | "
\n", 663 | "\n", 676 | "\n", 677 | " \n", 678 | " \n", 679 | " \n", 680 | " \n", 681 | " \n", 682 | " \n", 683 | " \n", 684 | " \n", 685 | " \n", 686 | " \n", 687 | " \n", 688 | " \n", 689 | " \n", 690 | " \n", 691 | " \n", 692 | " \n", 693 | " \n", 694 | " \n", 695 | " \n", 696 | " \n", 697 | " \n", 698 | " \n", 699 | " \n", 700 | " \n", 701 | " \n", 702 | " \n", 703 | " \n", 704 | " \n", 705 | "
BNames
0angela
1nick
2harry
3sarah
4taylor
\n", 706 | "
\n", 707 | "\n", 720 | "\n", 721 | " \n", 722 | " \n", 723 | " \n", 724 | " \n", 725 | " \n", 726 | " \n", 727 | " \n", 728 | " \n", 729 | " \n", 730 | " \n", 731 | " \n", 732 | " \n", 733 | " \n", 734 | " \n", 735 | " \n", 736 | " \n", 737 | " \n", 738 | " \n", 739 | " \n", 740 | " \n", 741 | " \n", 742 | " \n", 743 | " \n", 744 | " \n", 745 | " \n", 746 | " \n", 747 | " \n", 748 | " \n", 749 | "
CNames
0angela
1nick
2nicole
3taylor
4jim
\n", 750 | "
" 751 | ], 752 | "text/plain": [ 753 | "" 754 | ] 755 | }, 756 | "metadata": { 757 | "tags": [] 758 | }, 759 | "execution_count": 6 760 | } 761 | ] 762 | }, 763 | { 764 | "cell_type": "markdown", 765 | "metadata": { 766 | "id": "JKdtDSyUja-x" 767 | }, 768 | "source": [ 769 | "# Three-Way Venn Diagram" 770 | ] 771 | }, 772 | { 773 | "cell_type": "code", 774 | "metadata": { 775 | "id": "iLXyA-VJ40kn" 776 | }, 777 | "source": [ 778 | "A = set(dfA.ANames)\r\n", 779 | "B = set(dfB.BNames)\r\n", 780 | "C = set(dfC.CNames)\r\n", 781 | "\r\n", 782 | "AB_overlap = A & B\r\n", 783 | "AC_overlap = A & C\r\n", 784 | "BC_overlap = B & C\r\n", 785 | "ABC_overlap = A & B & C\r\n", 786 | "\r\n", 787 | "A_rest = A - AB_overlap - AC_overlap\r\n", 788 | "B_rest = B - AB_overlap - BC_overlap\r\n", 789 | "C_rest = C - AC_overlap - BC_overlap\r\n", 790 | "\r\n", 791 | "AB_only = AB_overlap - ABC_overlap\r\n", 792 | "AC_only = AC_overlap - ABC_overlap\r\n", 793 | "BC_only = BC_overlap - ABC_overlap" 794 | ], 795 | "execution_count": 7, 796 | "outputs": [] 797 | }, 798 | { 799 | "cell_type": "code", 800 | "metadata": { 801 | "colab": { 802 | "base_uri": "https://localhost:8080/", 803 | "height": 392 804 | }, 805 | "id": "nFixjxK570H0", 806 | "outputId": "c35ac279-c8cc-48ba-bb4e-83fe0c00627c" 807 | }, 808 | "source": [ 809 | "sets = Counter() #set order A, B, C \r\n", 810 | "sets['100'] = len(A_rest) #100 denotes A on, B off, C off\r\n", 811 | "sets['001'] = len(C_rest) #001 denotes A off, B off, C on\r\n", 812 | "sets['010'] = len(B_rest) #010 denotes A off, B on, C off\r\n", 813 | "sets['101'] = len(AC_only) #101 denotes A on, B off, C on\r\n", 814 | "sets['110'] = len(AB_only) #110 denotes A on, B on, C off\r\n", 815 | "sets['011'] = len(BC_only) #011 denotes A off, B on, C on\r\n", 816 | "sets['111'] = len(ABC_overlap) #111 denotes A on, B on, C on\r\n", 817 | "labels = ('Group A', 'Group B', 'Group C')\r\n", 818 | "\r\n", 819 | "plt.figure(figsize=(7,7))\r\n", 820 | "ax = 
plt.gca()\r\n", 821 | "venn3(subsets=sets, set_labels=labels, ax=ax,set_colors=('darkviolet','deepskyblue','blue'),alpha=0.7) \r\n", 822 | "plt.show()" 823 | ], 824 | "execution_count": 8, 825 | "outputs": [ 826 | { 827 | "output_type": "display_data", 828 | "data": { 829 | "image/png": "\n", 830 | "text/plain": [ 831 | "
" 832 | ] 833 | }, 834 | "metadata": { 835 | "tags": [] 836 | } 837 | } 838 | ] 839 | }, 840 | { 841 | "cell_type": "markdown", 842 | "metadata": { 843 | "id": "g01YsUjIMepu" 844 | }, 845 | "source": [ 846 | "## Set the \"set label\" color (e.g. Group A) " 847 | ] 848 | }, 849 | { 850 | "cell_type": "code", 851 | "metadata": { 852 | "colab": { 853 | "base_uri": "https://localhost:8080/", 854 | "height": 392 855 | }, 856 | "id": "sc2Xd8fmJ-z4", 857 | "outputId": "128f303f-2ac7-4dfc-a213-6f63c25f2cce" 858 | }, 859 | "source": [ 860 | "plt.figure(figsize=(7,7))\r\n", 861 | "ax = plt.gca()\r\n", 862 | "colors = ['darkviolet','deepskyblue','blue']\r\n", 863 | "v = venn3(subsets=sets, set_labels=labels, ax=ax,set_colors=('darkviolet','deepskyblue','blue'),alpha=0.7) \r\n", 864 | "i = 0\r\n", 865 | "for text in v.set_labels:\r\n", 866 | " text.set_color(colors[i])\r\n", 867 | " i+=1\r\n", 868 | "plt.show()" 869 | ], 870 | "execution_count": 9, 871 | "outputs": [ 872 | { 873 | "output_type": "display_data", 874 | "data": { 875 | "image/png": "\n", 876 | "text/plain": [ 877 | "
" 878 | ] 879 | }, 880 | "metadata": { 881 | "tags": [] 882 | } 883 | } 884 | ] 885 | }, 886 | { 887 | "cell_type": "markdown", 888 | "metadata": { 889 | "id": "XoX45JzEMp_R" 890 | }, 891 | "source": [ 892 | "## Set the \"subset label\" color (e.g. 1,2,3)" 893 | ] 894 | }, 895 | { 896 | "cell_type": "code", 897 | "metadata": { 898 | "colab": { 899 | "base_uri": "https://localhost:8080/", 900 | "height": 392 901 | }, 902 | "id": "OIIEYLgGL1Ha", 903 | "outputId": "90895949-1bab-40a4-e94c-00e498574833" 904 | }, 905 | "source": [ 906 | "plt.figure(figsize=(7,7))\r\n", 907 | "ax = plt.gca()\r\n", 908 | "colors = ['darkviolet','deepskyblue','blue']\r\n", 909 | "v = venn3(subsets=sets, set_labels=labels, ax=ax,set_colors=('darkviolet','deepskyblue','blue'),alpha=0.7) \r\n", 910 | "i = 0\r\n", 911 | "for text in v.set_labels:\r\n", 912 | " text.set_color(colors[i])\r\n", 913 | " i+=1\r\n", 914 | "\r\n", 915 | "for text in v.subset_labels:\r\n", 916 | " text.set_color('white')\r\n", 917 | " text.set_fontsize(16)\r\n", 918 | " text.set_fontweight('bold')\r\n", 919 | "plt.show()" 920 | ], 921 | "execution_count": 10, 922 | "outputs": [ 923 | { 924 | "output_type": "display_data", 925 | "data": { 926 | "image/png": "\n", 927 | "text/plain": [ 928 | "
" 929 | ] 930 | }, 931 | "metadata": { 932 | "tags": [] 933 | } 934 | } 935 | ] 936 | }, 937 | { 938 | "cell_type": "markdown", 939 | "metadata": { 940 | "id": "p8MzwD3TNM-y" 941 | }, 942 | "source": [ 943 | "## Replace the labels with a legend" 944 | ] 945 | }, 946 | { 947 | "cell_type": "code", 948 | "metadata": { 949 | "colab": { 950 | "base_uri": "https://localhost:8080/", 951 | "height": 408 952 | }, 953 | "id": "zUnC9s3a1CN_", 954 | "outputId": "dcdd09bc-35d6-4e06-b86f-1888d7309740" 955 | }, 956 | "source": [ 957 | "plt.figure(figsize=(7,7))\r\n", 958 | "ax = plt.gca()\r\n", 959 | "v = venn3(subsets=sets, set_labels=('','',''), ax=ax,set_colors=('darkviolet','deepskyblue','blue'),alpha=0.7) \r\n", 960 | "for text in v.subset_labels:\r\n", 961 | " text.set_color('white')\r\n", 962 | " text.set_fontsize(16)\r\n", 963 | " text.set_fontweight('bold')\r\n", 964 | "\r\n", 965 | "h = [] \r\n", 966 | "for i in sets:\r\n", 967 | " h.append(v.get_patch_by_id(i)) #get color patches \r\n", 968 | "l = ['A only','C only','B only','A & C shared','A & B shared','B & C shared','A & B & C shared']\r\n", 969 | "ax.legend(handles=h, labels=l, title=\"Legend\",loc='lower left') #write labels for color patches\r\n", 970 | "plt.title('Membership across Three Groups')\r\n", 971 | "plt.show()" 972 | ], 973 | "execution_count": 11, 974 | "outputs": [ 975 | { 976 | "output_type": "display_data", 977 | "data": { 978 | "image/png": "\n", 979 | "text/plain": [ 980 | "
" 981 | ] 982 | }, 983 | "metadata": { 984 | "tags": [] 985 | } 986 | } 987 | ] 988 | }, 989 | { 990 | "cell_type": "markdown", 991 | "metadata": { 992 | "id": "hrKHhSqWNWI1" 993 | }, 994 | "source": [ 995 | "## Customize the legend contents" 996 | ] 997 | }, 998 | { 999 | "cell_type": "code", 1000 | "metadata": { 1001 | "colab": { 1002 | "base_uri": "https://localhost:8080/", 1003 | "height": 408 1004 | }, 1005 | "id": "gpE1_2oG-8zE", 1006 | "outputId": "3c56b033-478d-40cd-ece5-dabbf236de12" 1007 | }, 1008 | "source": [ 1009 | "plt.figure(figsize=(7,7))\r\n", 1010 | "ax = plt.gca()\r\n", 1011 | "v = venn3(subsets=sets, set_labels=('','',''), ax=ax,set_colors=('darkviolet','deepskyblue','blue'),alpha=0.7)\r\n", 1012 | "for text in v.subset_labels:\r\n", 1013 | " text.set_color('white')\r\n", 1014 | " text.set_fontsize(16)\r\n", 1015 | " text.set_fontweight('bold')\r\n", 1016 | "\r\n", 1017 | "ax.legend(handles=h[0:3], labels=l[0:3], title=\"Legend\",loc='lower left') #create tailored legend from handles and labels \r\n", 1018 | "plt.title('Membership across Three Groups')\r\n", 1019 | "plt.show()" 1020 | ], 1021 | "execution_count": 12, 1022 | "outputs": [ 1023 | { 1024 | "output_type": "display_data", 1025 | "data": { 1026 | "image/png": "\n", 1027 | "text/plain": [ 1028 | "
" 1029 | ] 1030 | }, 1031 | "metadata": { 1032 | "tags": [] 1033 | } 1034 | } 1035 | ] 1036 | }, 1037 | { 1038 | "cell_type": "markdown", 1039 | "metadata": { 1040 | "id": "6KepmYEvAV8X" 1041 | }, 1042 | "source": [ 1043 | "# Two-Way Venn Diagram " 1044 | ] 1045 | }, 1046 | { 1047 | "cell_type": "code", 1048 | "metadata": { 1049 | "colab": { 1050 | "base_uri": "https://localhost:8080/", 1051 | "height": 260 1052 | }, 1053 | "id": "V9WKdqteBn9G", 1054 | "outputId": "e53d79ee-08ff-433a-debb-1b78b19ea41e" 1055 | }, 1056 | "source": [ 1057 | "multi_table([dfA,dfB])" 1058 | ], 1059 | "execution_count": 13, 1060 | "outputs": [ 1061 | { 1062 | "output_type": "execute_result", 1063 | "data": { 1064 | "text/html": [ 1065 | "
\n", 1066 | "\n", 1079 | "\n", 1080 | " \n", 1081 | " \n", 1082 | " \n", 1083 | " \n", 1084 | " \n", 1085 | " \n", 1086 | " \n", 1087 | " \n", 1088 | " \n", 1089 | " \n", 1090 | " \n", 1091 | " \n", 1092 | " \n", 1093 | " \n", 1094 | " \n", 1095 | " \n", 1096 | " \n", 1097 | " \n", 1098 | " \n", 1099 | " \n", 1100 | " \n", 1101 | " \n", 1102 | " \n", 1103 | " \n", 1104 | " \n", 1105 | " \n", 1106 | " \n", 1107 | " \n", 1108 | " \n", 1109 | " \n", 1110 | " \n", 1111 | " \n", 1112 | " \n", 1113 | " \n", 1114 | " \n", 1115 | " \n", 1116 | "
ANames
0angela
1nick
2harry
3nicole
4britney
5haseem
6anna
\n", 1117 | "
\n", 1118 | "\n", 1131 | "\n", 1132 | " \n", 1133 | " \n", 1134 | " \n", 1135 | " \n", 1136 | " \n", 1137 | " \n", 1138 | " \n", 1139 | " \n", 1140 | " \n", 1141 | " \n", 1142 | " \n", 1143 | " \n", 1144 | " \n", 1145 | " \n", 1146 | " \n", 1147 | " \n", 1148 | " \n", 1149 | " \n", 1150 | " \n", 1151 | " \n", 1152 | " \n", 1153 | " \n", 1154 | " \n", 1155 | " \n", 1156 | " \n", 1157 | " \n", 1158 | " \n", 1159 | " \n", 1160 | "
BNames
0angela
1nick
2harry
3sarah
4taylor
\n", 1161 | "
" 1162 | ], 1163 | "text/plain": [ 1164 | "" 1165 | ] 1166 | }, 1167 | "metadata": { 1168 | "tags": [] 1169 | }, 1170 | "execution_count": 13 1171 | } 1172 | ] 1173 | }, 1174 | { 1175 | "cell_type": "code", 1176 | "metadata": { 1177 | "colab": { 1178 | "base_uri": "https://localhost:8080/", 1179 | "height": 362 1180 | }, 1181 | "id": "zGQxYula_xUb", 1182 | "outputId": "2f4972c7-110c-4338-bf92-10cfbae3ca05" 1183 | }, 1184 | "source": [ 1185 | "sets = Counter() #set order A, B \r\n", 1186 | "sets['10'] = len(A-AB_overlap) #10 denotes A on, B off\r\n", 1187 | "sets['01'] = len(B-AB_overlap) #01 denotes A off, B on\r\n", 1188 | "sets['11'] = len(AB_overlap) #11 denotes A on, B on\r\n", 1189 | "labels = ('Group A', 'Group B')\r\n", 1190 | "\r\n", 1191 | "plt.figure(figsize=(7,7))\r\n", 1192 | "ax = plt.gca()\r\n", 1193 | "v= venn2(subsets=sets, set_labels=labels, ax=ax,set_colors=('darkviolet','deepskyblue'),alpha=0.7)\r\n", 1194 | "plt.title('Membership across Two Groups')\r\n", 1195 | "plt.show()" 1196 | ], 1197 | "execution_count": 14, 1198 | "outputs": [ 1199 | { 1200 | "output_type": "display_data", 1201 | "data": { 1202 | "image/png": "\n", 1203 | "text/plain": [ 1204 | "
" 1205 | ] 1206 | }, 1207 | "metadata": { 1208 | "tags": [] 1209 | } 1210 | } 1211 | ] 1212 | } 1213 | ] 1214 | } 1215 | -------------------------------------------------------------------------------- /210630_Medium_ColabwithR.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "nbformat": 4, 3 | "nbformat_minor": 0, 4 | "metadata": { 5 | "colab": { 6 | "name": "Medium_ColabwithR.ipynb", 7 | "provenance": [], 8 | "collapsed_sections": [], 9 | "authorship_tag": "ABX9TyMqsBhxGjsK57FPugbyamcU" 10 | }, 11 | "kernelspec": { 12 | "name": "ir", 13 | "display_name": "R" 14 | } 15 | }, 16 | "cells": [ 17 | { 18 | "cell_type": "markdown", 19 | "metadata": { 20 | "id": "3VcL-Nj-MBVy" 21 | }, 22 | "source": [ 23 | "# I. Initialization" 24 | ] 25 | }, 26 | { 27 | "cell_type": "code", 28 | "metadata": { 29 | "colab": { 30 | "base_uri": "https://localhost:8080/", 31 | "height": 34 32 | }, 33 | "id": "sGEHnVLpgFdV", 34 | "outputId": "d108dabf-f15a-4b47-a1dc-560a626286c4" 35 | }, 36 | "source": [ 37 | "R.version.string" 38 | ], 39 | "execution_count": null, 40 | "outputs": [ 41 | { 42 | "output_type": "display_data", 43 | "data": { 44 | "text/plain": [ 45 | "[1] \"R version 4.1.0 (2021-05-18)\"" 46 | ], 47 | "text/latex": "'R version 4.1.0 (2021-05-18)'", 48 | "text/markdown": "'R version 4.1.0 (2021-05-18)'", 49 | "text/html": [ 50 | "'R version 4.1.0 (2021-05-18)'" 51 | ] 52 | }, 53 | "metadata": { 54 | "tags": [] 55 | } 56 | } 57 | ] 58 | }, 59 | { 60 | "cell_type": "code", 61 | "metadata": { 62 | "id": "VNMyewZ4vRko" 63 | }, 64 | "source": [ 65 | "#https://towardsdatascience.com/how-to-use-r-in-google-colab-b6e02d736497 method 2, runtime is R\n", 66 | "#This should work, but it did not for me. More info at the link below. Did not work in full but got close. 
\n", 67 | "#https://towardsdatascience.com/how-to-use-r-in-google-colab-b6e02d736497\n", 68 | "#install.packages(\"googledrive\")\n", 69 | "#library(\"googledrive\")\n", 70 | "#drive_auth(\n", 71 | "# email = gargle::gargle_oauth_email(),\n", 72 | "# path = NULL,\n", 73 | "# scopes = \"https://www.googleapis.com/auth/drive\",\n", 74 | "# cache = gargle::gargle_oauth_cache(),\n", 75 | "# use_oob = gargle::gargle_oob_default(),\n", 76 | "# token = NULL\n", 77 | "#)" 78 | ], 79 | "execution_count": null, 80 | "outputs": [] 81 | }, 82 | { 83 | "cell_type": "code", 84 | "metadata": { 85 | "colab": { 86 | "base_uri": "https://localhost:8080/" 87 | }, 88 | "id": "y99Ep9_hgx2k", 89 | "outputId": "277d1cc2-65c7-4fcb-a2ef-5773b30610c2" 90 | }, 91 | "source": [ 92 | "install.packages(\"googledrive\") #only need to install occasionally\n", 93 | "install.packages(\"httpuv\")\n", 94 | "library(\"googledrive\")\n", 95 | "library(\"httpuv\")" 96 | ], 97 | "execution_count": null, 98 | "outputs": [ 99 | { 100 | "output_type": "stream", 101 | "text": [ 102 | "Installing package into ‘/usr/local/lib/R/site-library’\n", 103 | "(as ‘lib’ is unspecified)\n", 104 | "\n", 105 | "Installing package into ‘/usr/local/lib/R/site-library’\n", 106 | "(as ‘lib’ is unspecified)\n", 107 | "\n" 108 | ], 109 | "name": "stderr" 110 | } 111 | ] 112 | }, 113 | { 114 | "cell_type": "code", 115 | "metadata": { 116 | "id": "628_cnx5NZe2", 117 | "colab": { 118 | "base_uri": "https://localhost:8080/" 119 | }, 120 | "outputId": "619c7bd9-f465-485b-e34e-ab0e52e3bd2a" 121 | }, 122 | "source": [ 123 | "if (file.exists(\"/usr/local/lib/python3.7/dist-packages/google/colab/_ipython.py\")) { #may need to update python version occasionally\n", 124 | " install.packages(\"R.utils\")\n", 125 | " library(\"R.utils\")\n", 126 | " library(\"httr\")\n", 127 | " my_check <- function() {return(TRUE)}\n", 128 | " reassignInPackage(\"is_interactive\", pkgName = \"httr\", my_check) \n", 129 | " 
options(rlang_interactive=TRUE)\n", 130 | "}" 131 | ], 132 | "execution_count": null, 133 | "outputs": [ 134 | { 135 | "output_type": "stream", 136 | "text": [ 137 | "Installing package into ‘/usr/local/lib/R/site-library’\n", 138 | "(as ‘lib’ is unspecified)\n", 139 | "\n", 140 | "Loading required package: R.oo\n", 141 | "\n", 142 | "Loading required package: R.methodsS3\n", 143 | "\n", 144 | "R.methodsS3 v1.8.1 (2020-08-26 16:20:06 UTC) successfully loaded. See ?R.methodsS3 for help.\n", 145 | "\n", 146 | "R.oo v1.24.0 (2020-08-26 16:11:58 UTC) successfully loaded. See ?R.oo for help.\n", 147 | "\n", 148 | "\n", 149 | "Attaching package: ‘R.oo’\n", 150 | "\n", 151 | "\n", 152 | "The following object is masked from ‘package:R.methodsS3’:\n", 153 | "\n", 154 | " throw\n", 155 | "\n", 156 | "\n", 157 | "The following objects are masked from ‘package:methods’:\n", 158 | "\n", 159 | " getClasses, getMethods\n", 160 | "\n", 161 | "\n", 162 | "The following objects are masked from ‘package:base’:\n", 163 | "\n", 164 | " attach, detach, load, save\n", 165 | "\n", 166 | "\n", 167 | "R.utils v2.10.1 (2020-08-26 22:50:31 UTC) successfully loaded. 
See ?R.utils for help.\n", 168 | "\n", 169 | "\n", 170 | "Attaching package: ‘R.utils’\n", 171 | "\n", 172 | "\n", 173 | "The following object is masked from ‘package:utils’:\n", 174 | "\n", 175 | " timestamp\n", 176 | "\n", 177 | "\n", 178 | "The following objects are masked from ‘package:base’:\n", 179 | "\n", 180 | " cat, commandArgs, getOption, inherits, isOpen, nullfile, parse,\n", 181 | " warnings\n", 182 | "\n", 183 | "\n" 184 | ], 185 | "name": "stderr" 186 | } 187 | ] 188 | }, 189 | { 190 | "cell_type": "code", 191 | "metadata": { 192 | "id": "aKSqnB81a5nH" 193 | }, 194 | "source": [ 195 | "drive_auth(use_oob = TRUE, cache = FALSE)" 196 | ], 197 | "execution_count": null, 198 | "outputs": [] 199 | }, 200 | { 201 | "cell_type": "markdown", 202 | "metadata": { 203 | "id": "5RO6C0OKLTbC" 204 | }, 205 | "source": [ 206 | "# II. Method to Download Direct from Web to Colab Session" 207 | ] 208 | }, 209 | { 210 | "cell_type": "code", 211 | "metadata": { 212 | "colab": { 213 | "base_uri": "https://localhost:8080/", 214 | "height": 34 215 | }, 216 | "id": "tGGCu4Mp56nq", 217 | "outputId": "9d4ce75a-09cf-42d2-fba8-bbdb3a29c4f7" 218 | }, 219 | "source": [ 220 | "getwd()" 221 | ], 222 | "execution_count": null, 223 | "outputs": [ 224 | { 225 | "output_type": "display_data", 226 | "data": { 227 | "text/plain": [ 228 | "[1] \"/content\"" 229 | ], 230 | "text/latex": "'/content'", 231 | "text/markdown": "'/content'", 232 | "text/html": [ 233 | "'/content'" 234 | ] 235 | }, 236 | "metadata": { 237 | "tags": [] 238 | } 239 | } 240 | ] 241 | }, 242 | { 243 | "cell_type": "markdown", 244 | "metadata": { 245 | "id": "RQe3jHzYmMdT" 246 | }, 247 | "source": [ 248 | "That only gets you part of the way there. The next step is to load your file: download it into the session's temporary 'content' folder, and proceed from there." 
249 | ] 250 | }, 251 | { 252 | "cell_type": "code", 253 | "metadata": { 254 | "id": "-45f7m5S3PxM", 255 | "colab": { 256 | "base_uri": "https://localhost:8080/" 257 | }, 258 | "outputId": "a5e07d11-e020-4e93-f6af-8bd87ce930c5" 259 | }, 260 | "source": [ 261 | "download.file('https://data.cdc.gov/api/views/vba9-s8jp/rows.csv?accessType=DOWNLOAD','/content/dnld_direct_from_web.csv')\n", 262 | "unzip(zipfile=\"/content/downloaded.zip\", exdir=\".\") " 263 | ], 264 | "execution_count": null, 265 | "outputs": [ 266 | { 267 | "output_type": "stream", 268 | "text": [ 269 | "Warning message in unzip(zipfile = \"/content/downloaded.zip\", exdir = \".\"):\n", 270 | "“error 1 in extracting from zip file”\n" 271 | ], 272 | "name": "stderr" 273 | } 274 | ] 275 | }, 276 | { 277 | "cell_type": "code", 278 | "metadata": { 279 | "colab": { 280 | "base_uri": "https://localhost:8080/", 281 | "height": 881 282 | }, 283 | "id": "ARXril-X6fXa", 284 | "outputId": "b9969961-d823-40ce-ea31-b2dafc5d10f2" 285 | }, 286 | "source": [ 287 | "library(readr)\n", 288 | "a <- read.csv('/content/dnld_direct_from_web.csv')\n", 289 | "head(a)" 290 | ], 291 | "execution_count": null, 292 | "outputs": [ 293 | { 294 | "output_type": "display_data", 295 | "data": { 296 | "text/plain": [ 297 | " YearStart YearEnd LocationAbbr LocationDesc \n", 298 | "1 2019 2019 AL Alabama \n", 299 | "2 2019 2019 ID Idaho \n", 300 | "3 2019 2019 IA Iowa \n", 301 | "4 2019 2019 LA Louisiana \n", 302 | "5 2019 2019 ME Maine \n", 303 | "6 2019 2019 MA Massachusetts\n", 304 | " Datasource Class \n", 305 | "1 Youth Risk Behavior Surveillance System Sugar Drinks \n", 306 | "2 Youth Risk Behavior Surveillance System Sugar Drinks \n", 307 | "3 Youth Risk Behavior Surveillance System Obesity / Weight Status\n", 308 | "4 Youth Risk Behavior Surveillance System Obesity / Weight Status\n", 309 | "5 Youth Risk Behavior Surveillance System Obesity / Weight Status\n", 310 | "6 Youth Risk Behavior Surveillance System Obesity / Weight 
Status\n", 311 | " Topic \n", 312 | "1 Sugar Drinks - Behavior\n", 313 | "2 Sugar Drinks - Behavior\n", 314 | "3 Obesity / Weight Status\n", 315 | "4 Obesity / Weight Status\n", 316 | "5 Obesity / Weight Status\n", 317 | "6 Obesity / Weight Status\n", 318 | " Question \n", 319 | "1 Percent of students in grades 9-12 who drank regular soda/pop at least one time per day\n", 320 | "2 Percent of students in grades 9-12 who drank regular soda/pop at least one time per day\n", 321 | "3 Percent of students in grades 9-12 who have obesity \n", 322 | "4 Percent of students in grades 9-12 who have obesity \n", 323 | "5 Percent of students in grades 9-12 who have an overweight classification \n", 324 | "6 Percent of students in grades 9-12 who have an overweight classification \n", 325 | " Data_Value_Unit Data_Value_Type ⋯ GeoLocation ClassID\n", 326 | "1 NA Value ⋯ (32.840571122, -86.631860762) SD \n", 327 | "2 NA Value ⋯ (43.682630005, -114.363730042) SD \n", 328 | "3 NA Value ⋯ (42.469400913, -93.816490556) OWS \n", 329 | "4 NA Value ⋯ (31.312660644, -92.445680071) OWS \n", 330 | "5 NA Value ⋯ (45.254228894001, -68.985031336) OWS \n", 331 | "6 NA Value ⋯ (42.27687047, -72.082690675) OWS \n", 332 | " TopicID QuestionID DataValueTypeID LocationID StratificationCategory1\n", 333 | "1 SD1 Q058 VALUE 1 Race/Ethnicity \n", 334 | "2 SD1 Q058 VALUE 16 Race/Ethnicity \n", 335 | "3 OWS1 Q038 VALUE 19 Grade \n", 336 | "4 OWS1 Q038 VALUE 22 Gender \n", 337 | "5 OWS1 Q039 VALUE 23 Race/Ethnicity \n", 338 | "6 OWS1 Q039 VALUE 25 Total \n", 339 | " Stratification1 StratificationCategoryId1 StratificationID1\n", 340 | "1 Hispanic RACE RACEHIS \n", 341 | "2 Hispanic RACE RACEHIS \n", 342 | "3 11th GRADE GRADE11 \n", 343 | "4 Female GEN FEMALE \n", 344 | "5 Hispanic RACE RACEHIS \n", 345 | "6 Total OVR OVERALL " 346 | ], 347 | "text/latex": "A data.frame: 6 × 31\n\\begin{tabular}{r|lllllllllllllllllllll}\n & YearStart & YearEnd & LocationAbbr & LocationDesc & Datasource & Class & Topic & 
Question & Data\\_Value\\_Unit & Data\\_Value\\_Type & ⋯ & GeoLocation & ClassID & TopicID & QuestionID & DataValueTypeID & LocationID & StratificationCategory1 & Stratification1 & StratificationCategoryId1 & StratificationID1\\\\\n & & & & & & & & & & & ⋯ & & & & & & & & & & \\\\\n\\hline\n\t1 & 2019 & 2019 & AL & Alabama & Youth Risk Behavior Surveillance System & Sugar Drinks & Sugar Drinks - Behavior & Percent of students in grades 9-12 who drank regular soda/pop at least one time per day & NA & Value & ⋯ & (32.840571122, -86.631860762) & SD & SD1 & Q058 & VALUE & 1 & Race/Ethnicity & Hispanic & RACE & RACEHIS\\\\\n\t2 & 2019 & 2019 & ID & Idaho & Youth Risk Behavior Surveillance System & Sugar Drinks & Sugar Drinks - Behavior & Percent of students in grades 9-12 who drank regular soda/pop at least one time per day & NA & Value & ⋯ & (43.682630005, -114.363730042) & SD & SD1 & Q058 & VALUE & 16 & Race/Ethnicity & Hispanic & RACE & RACEHIS\\\\\n\t3 & 2019 & 2019 & IA & Iowa & Youth Risk Behavior Surveillance System & Obesity / Weight Status & Obesity / Weight Status & Percent of students in grades 9-12 who have obesity & NA & Value & ⋯ & (42.469400913, -93.816490556) & OWS & OWS1 & Q038 & VALUE & 19 & Grade & 11th & GRADE & GRADE11\\\\\n\t4 & 2019 & 2019 & LA & Louisiana & Youth Risk Behavior Surveillance System & Obesity / Weight Status & Obesity / Weight Status & Percent of students in grades 9-12 who have obesity & NA & Value & ⋯ & (31.312660644, -92.445680071) & OWS & OWS1 & Q038 & VALUE & 22 & Gender & Female & GEN & FEMALE \\\\\n\t5 & 2019 & 2019 & ME & Maine & Youth Risk Behavior Surveillance System & Obesity / Weight Status & Obesity / Weight Status & Percent of students in grades 9-12 who have an overweight classification & NA & Value & ⋯ & (45.254228894001, -68.985031336) & OWS & OWS1 & Q039 & VALUE & 23 & Race/Ethnicity & Hispanic & RACE & RACEHIS\\\\\n\t6 & 2019 & 2019 & MA & Massachusetts & Youth Risk Behavior Surveillance System & Obesity / Weight 
Status & Obesity / Weight Status & Percent of students in grades 9-12 who have an overweight classification & NA & Value & ⋯ & (42.27687047, -72.082690675) & OWS & OWS1 & Q039 & VALUE & 25 & Total & Total & OVR & OVERALL\\\\\n\\end{tabular}\n", 348 | "text/markdown": "\nA data.frame: 6 × 31\n\n| | YearStart <int> | YearEnd <int> | LocationAbbr <chr> | LocationDesc <chr> | Datasource <chr> | Class <chr> | Topic <chr> | Question <chr> | Data_Value_Unit <lgl> | Data_Value_Type <chr> | ⋯ ⋯ | GeoLocation <chr> | ClassID <chr> | TopicID <chr> | QuestionID <chr> | DataValueTypeID <chr> | LocationID <int> | StratificationCategory1 <chr> | Stratification1 <chr> | StratificationCategoryId1 <chr> | StratificationID1 <chr> |\n|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|\n| 1 | 2019 | 2019 | AL | Alabama | Youth Risk Behavior Surveillance System | Sugar Drinks | Sugar Drinks - Behavior | Percent of students in grades 9-12 who drank regular soda/pop at least one time per day | NA | Value | ⋯ | (32.840571122, -86.631860762) | SD | SD1 | Q058 | VALUE | 1 | Race/Ethnicity | Hispanic | RACE | RACEHIS |\n| 2 | 2019 | 2019 | ID | Idaho | Youth Risk Behavior Surveillance System | Sugar Drinks | Sugar Drinks - Behavior | Percent of students in grades 9-12 who drank regular soda/pop at least one time per day | NA | Value | ⋯ | (43.682630005, -114.363730042) | SD | SD1 | Q058 | VALUE | 16 | Race/Ethnicity | Hispanic | RACE | RACEHIS |\n| 3 | 2019 | 2019 | IA | Iowa | Youth Risk Behavior Surveillance System | Obesity / Weight Status | Obesity / Weight Status | Percent of students in grades 9-12 who have obesity | NA | Value | ⋯ | (42.469400913, -93.816490556) | OWS | OWS1 | Q038 | VALUE | 19 | Grade | 11th | GRADE | GRADE11 |\n| 4 | 2019 | 2019 | LA | Louisiana | Youth Risk Behavior Surveillance System | Obesity / Weight Status | Obesity / Weight Status | Percent of students in grades 9-12 who have obesity | NA | Value | ⋯ | (31.312660644, 
-92.445680071) | OWS | OWS1 | Q038 | VALUE | 22 | Gender | Female | GEN | FEMALE |\n| 5 | 2019 | 2019 | ME | Maine | Youth Risk Behavior Surveillance System | Obesity / Weight Status | Obesity / Weight Status | Percent of students in grades 9-12 who have an overweight classification | NA | Value | ⋯ | (45.254228894001, -68.985031336) | OWS | OWS1 | Q039 | VALUE | 23 | Race/Ethnicity | Hispanic | RACE | RACEHIS |\n| 6 | 2019 | 2019 | MA | Massachusetts | Youth Risk Behavior Surveillance System | Obesity / Weight Status | Obesity / Weight Status | Percent of students in grades 9-12 who have an overweight classification | NA | Value | ⋯ | (42.27687047, -72.082690675) | OWS | OWS1 | Q039 | VALUE | 25 | Total | Total | OVR | OVERALL |\n\n", 349 | "text/html": [ 350 | "\n", 351 | "\n", 352 | "\n", 353 | "\t\n", 354 | "\t\n", 355 | "\n", 356 | "\n", 357 | "\t\n", 358 | "\t\n", 359 | "\t\n", 360 | "\t\n", 361 | "\t\n", 362 | "\t\n", 363 | "\n", 364 | "
A data.frame: 6 × 31
YearStartYearEndLocationAbbrLocationDescDatasourceClassTopicQuestionData_Value_UnitData_Value_TypeGeoLocationClassIDTopicIDQuestionIDDataValueTypeIDLocationIDStratificationCategory1Stratification1StratificationCategoryId1StratificationID1
<int><int><chr><chr><chr><chr><chr><chr><lgl><chr><chr><chr><chr><chr><chr><int><chr><chr><chr><chr>
120192019ALAlabama Youth Risk Behavior Surveillance SystemSugar Drinks Sugar Drinks - BehaviorPercent of students in grades 9-12 who drank regular soda/pop at least one time per dayNAValue(32.840571122, -86.631860762) SD SD1 Q058VALUE 1Race/EthnicityHispanicRACE RACEHIS
220192019IDIdaho Youth Risk Behavior Surveillance SystemSugar Drinks Sugar Drinks - BehaviorPercent of students in grades 9-12 who drank regular soda/pop at least one time per dayNAValue(43.682630005, -114.363730042) SD SD1 Q058VALUE16Race/EthnicityHispanicRACE RACEHIS
320192019IAIowa Youth Risk Behavior Surveillance SystemObesity / Weight StatusObesity / Weight StatusPercent of students in grades 9-12 who have obesity NAValue(42.469400913, -93.816490556) OWSOWS1Q038VALUE19Grade 11th GRADEGRADE11
420192019LALouisiana Youth Risk Behavior Surveillance SystemObesity / Weight StatusObesity / Weight StatusPercent of students in grades 9-12 who have obesity NAValue(31.312660644, -92.445680071) OWSOWS1Q038VALUE22Gender Female GEN FEMALE
520192019MEMaine Youth Risk Behavior Surveillance SystemObesity / Weight StatusObesity / Weight StatusPercent of students in grades 9-12 who have an overweight classification NAValue(45.254228894001, -68.985031336)OWSOWS1Q039VALUE23Race/EthnicityHispanicRACE RACEHIS
620192019MAMassachusettsYouth Risk Behavior Surveillance SystemObesity / Weight StatusObesity / Weight StatusPercent of students in grades 9-12 who have an overweight classification NAValue(42.27687047, -72.082690675) OWSOWS1Q039VALUE25Total Total OVR OVERALL
\n" 365 | ] 366 | }, 367 | "metadata": { 368 | "tags": [] 369 | } 370 | } 371 | ] 372 | }, 373 | { 374 | "cell_type": "markdown", 375 | "metadata": { 376 | "id": "YDcXvN4hLlSF" 377 | }, 378 | "source": [ 379 | "# III. Method to Download from Your Google Drive to Colab Session" 380 | ] 381 | }, 382 | { 383 | "cell_type": "code", 384 | "metadata": { 385 | "colab": { 386 | "base_uri": "https://localhost:8080/", 387 | "height": 966 388 | }, 389 | "id": "qecatv0iqCyv", 390 | "outputId": "c480ad68-4c6d-494d-bf7e-cfa0f2debd7f" 391 | }, 392 | "source": [ 393 | "x <- drive_get(\"~/Folder1/Folder2/Nutrition__Physical_Activity__and_Obesity_-_Youth_Risk_Behavior_Surveillance_System.csv\")\n", 394 | "drive_download(x)\n", 395 | "z <- read.csv(\"/content/Nutrition__Physical_Activity__and_Obesity_-_Youth_Risk_Behavior_Surveillance_System.csv\")\n", 396 | "head(z)" 397 | ], 398 | "execution_count": null, 399 | "outputs": [ 400 | { 401 | "output_type": "stream", 402 | "text": [ 403 | "File downloaded:\n", 404 | " * Nutrition__Physical_Activity__and_Obesity_-_Youth_Risk_Behavior_Surveillance_System.csv\n", 405 | "Saved locally as:\n", 406 | " * Nutrition__Physical_Activity__and_Obesity_-_Youth_Risk_Behavior_Surveillance_System.csv\n", 407 | "\n" 408 | ], 409 | "name": "stderr" 410 | }, 411 | { 412 | "output_type": "display_data", 413 | "data": { 414 | "text/plain": [ 415 | " YearStart YearEnd LocationAbbr LocationDesc \n", 416 | "1 2019 2019 AL Alabama \n", 417 | "2 2019 2019 ID Idaho \n", 418 | "3 2019 2019 IA Iowa \n", 419 | "4 2019 2019 LA Louisiana \n", 420 | "5 2019 2019 ME Maine \n", 421 | "6 2019 2019 MA Massachusetts\n", 422 | " Datasource Class \n", 423 | "1 Youth Risk Behavior Surveillance System Sugar Drinks \n", 424 | "2 Youth Risk Behavior Surveillance System Sugar Drinks \n", 425 | "3 Youth Risk Behavior Surveillance System Obesity / Weight Status\n", 426 | "4 Youth Risk Behavior Surveillance System Obesity / Weight Status\n", 427 | "5 Youth Risk Behavior Surveillance 
System Obesity / Weight Status\n", 428 | "6 Youth Risk Behavior Surveillance System Obesity / Weight Status\n", 429 | " Topic \n", 430 | "1 Sugar Drinks - Behavior\n", 431 | "2 Sugar Drinks - Behavior\n", 432 | "3 Obesity / Weight Status\n", 433 | "4 Obesity / Weight Status\n", 434 | "5 Obesity / Weight Status\n", 435 | "6 Obesity / Weight Status\n", 436 | " Question \n", 437 | "1 Percent of students in grades 9-12 who drank regular soda/pop at least one time per day\n", 438 | "2 Percent of students in grades 9-12 who drank regular soda/pop at least one time per day\n", 439 | "3 Percent of students in grades 9-12 who have obesity \n", 440 | "4 Percent of students in grades 9-12 who have obesity \n", 441 | "5 Percent of students in grades 9-12 who have an overweight classification \n", 442 | "6 Percent of students in grades 9-12 who have an overweight classification \n", 443 | " Data_Value_Unit Data_Value_Type ⋯ GeoLocation ClassID\n", 444 | "1 NA Value ⋯ (32.840571122, -86.631860762) SD \n", 445 | "2 NA Value ⋯ (43.682630005, -114.363730042) SD \n", 446 | "3 NA Value ⋯ (42.469400913, -93.816490556) OWS \n", 447 | "4 NA Value ⋯ (31.312660644, -92.445680071) OWS \n", 448 | "5 NA Value ⋯ (45.254228894001, -68.985031336) OWS \n", 449 | "6 NA Value ⋯ (42.27687047, -72.082690675) OWS \n", 450 | " TopicID QuestionID DataValueTypeID LocationID StratificationCategory1\n", 451 | "1 SD1 Q058 VALUE 1 Race/Ethnicity \n", 452 | "2 SD1 Q058 VALUE 16 Race/Ethnicity \n", 453 | "3 OWS1 Q038 VALUE 19 Grade \n", 454 | "4 OWS1 Q038 VALUE 22 Gender \n", 455 | "5 OWS1 Q039 VALUE 23 Race/Ethnicity \n", 456 | "6 OWS1 Q039 VALUE 25 Total \n", 457 | " Stratification1 StratificationCategoryId1 StratificationID1\n", 458 | "1 Hispanic RACE RACEHIS \n", 459 | "2 Hispanic RACE RACEHIS \n", 460 | "3 11th GRADE GRADE11 \n", 461 | "4 Female GEN FEMALE \n", 462 | "5 Hispanic RACE RACEHIS \n", 463 | "6 Total OVR OVERALL " 464 | ], 465 | "text/latex": "A data.frame: 6 × 
31\n\\begin{tabular}{r|lllllllllllllllllllll}\n & YearStart & YearEnd & LocationAbbr & LocationDesc & Datasource & Class & Topic & Question & Data\\_Value\\_Unit & Data\\_Value\\_Type & ⋯ & GeoLocation & ClassID & TopicID & QuestionID & DataValueTypeID & LocationID & StratificationCategory1 & Stratification1 & StratificationCategoryId1 & StratificationID1\\\\\n & & & & & & & & & & & ⋯ & & & & & & & & & & \\\\\n\\hline\n\t1 & 2019 & 2019 & AL & Alabama & Youth Risk Behavior Surveillance System & Sugar Drinks & Sugar Drinks - Behavior & Percent of students in grades 9-12 who drank regular soda/pop at least one time per day & NA & Value & ⋯ & (32.840571122, -86.631860762) & SD & SD1 & Q058 & VALUE & 1 & Race/Ethnicity & Hispanic & RACE & RACEHIS\\\\\n\t2 & 2019 & 2019 & ID & Idaho & Youth Risk Behavior Surveillance System & Sugar Drinks & Sugar Drinks - Behavior & Percent of students in grades 9-12 who drank regular soda/pop at least one time per day & NA & Value & ⋯ & (43.682630005, -114.363730042) & SD & SD1 & Q058 & VALUE & 16 & Race/Ethnicity & Hispanic & RACE & RACEHIS\\\\\n\t3 & 2019 & 2019 & IA & Iowa & Youth Risk Behavior Surveillance System & Obesity / Weight Status & Obesity / Weight Status & Percent of students in grades 9-12 who have obesity & NA & Value & ⋯ & (42.469400913, -93.816490556) & OWS & OWS1 & Q038 & VALUE & 19 & Grade & 11th & GRADE & GRADE11\\\\\n\t4 & 2019 & 2019 & LA & Louisiana & Youth Risk Behavior Surveillance System & Obesity / Weight Status & Obesity / Weight Status & Percent of students in grades 9-12 who have obesity & NA & Value & ⋯ & (31.312660644, -92.445680071) & OWS & OWS1 & Q038 & VALUE & 22 & Gender & Female & GEN & FEMALE \\\\\n\t5 & 2019 & 2019 & ME & Maine & Youth Risk Behavior Surveillance System & Obesity / Weight Status & Obesity / Weight Status & Percent of students in grades 9-12 who have an overweight classification & NA & Value & ⋯ & (45.254228894001, -68.985031336) & OWS & OWS1 & Q039 & VALUE & 23 & Race/Ethnicity & 
Hispanic & RACE & RACEHIS\\\\\n\t6 & 2019 & 2019 & MA & Massachusetts & Youth Risk Behavior Surveillance System & Obesity / Weight Status & Obesity / Weight Status & Percent of students in grades 9-12 who have an overweight classification & NA & Value & ⋯ & (42.27687047, -72.082690675) & OWS & OWS1 & Q039 & VALUE & 25 & Total & Total & OVR & OVERALL\\\\\n\\end{tabular}\n", 466 | "text/markdown": "\nA data.frame: 6 × 31\n\n| | YearStart <int> | YearEnd <int> | LocationAbbr <chr> | LocationDesc <chr> | Datasource <chr> | Class <chr> | Topic <chr> | Question <chr> | Data_Value_Unit <lgl> | Data_Value_Type <chr> | ⋯ ⋯ | GeoLocation <chr> | ClassID <chr> | TopicID <chr> | QuestionID <chr> | DataValueTypeID <chr> | LocationID <int> | StratificationCategory1 <chr> | Stratification1 <chr> | StratificationCategoryId1 <chr> | StratificationID1 <chr> |\n|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|\n| 1 | 2019 | 2019 | AL | Alabama | Youth Risk Behavior Surveillance System | Sugar Drinks | Sugar Drinks - Behavior | Percent of students in grades 9-12 who drank regular soda/pop at least one time per day | NA | Value | ⋯ | (32.840571122, -86.631860762) | SD | SD1 | Q058 | VALUE | 1 | Race/Ethnicity | Hispanic | RACE | RACEHIS |\n| 2 | 2019 | 2019 | ID | Idaho | Youth Risk Behavior Surveillance System | Sugar Drinks | Sugar Drinks - Behavior | Percent of students in grades 9-12 who drank regular soda/pop at least one time per day | NA | Value | ⋯ | (43.682630005, -114.363730042) | SD | SD1 | Q058 | VALUE | 16 | Race/Ethnicity | Hispanic | RACE | RACEHIS |\n| 3 | 2019 | 2019 | IA | Iowa | Youth Risk Behavior Surveillance System | Obesity / Weight Status | Obesity / Weight Status | Percent of students in grades 9-12 who have obesity | NA | Value | ⋯ | (42.469400913, -93.816490556) | OWS | OWS1 | Q038 | VALUE | 19 | Grade | 11th | GRADE | GRADE11 |\n| 4 | 2019 | 2019 | LA | Louisiana | Youth Risk Behavior Surveillance System | Obesity / 
Weight Status | Obesity / Weight Status | Percent of students in grades 9-12 who have obesity | NA | Value | ⋯ | (31.312660644, -92.445680071) | OWS | OWS1 | Q038 | VALUE | 22 | Gender | Female | GEN | FEMALE |\n| 5 | 2019 | 2019 | ME | Maine | Youth Risk Behavior Surveillance System | Obesity / Weight Status | Obesity / Weight Status | Percent of students in grades 9-12 who have an overweight classification | NA | Value | ⋯ | (45.254228894001, -68.985031336) | OWS | OWS1 | Q039 | VALUE | 23 | Race/Ethnicity | Hispanic | RACE | RACEHIS |\n| 6 | 2019 | 2019 | MA | Massachusetts | Youth Risk Behavior Surveillance System | Obesity / Weight Status | Obesity / Weight Status | Percent of students in grades 9-12 who have an overweight classification | NA | Value | ⋯ | (42.27687047, -72.082690675) | OWS | OWS1 | Q039 | VALUE | 25 | Total | Total | OVR | OVERALL |\n\n", 467 | "text/html": [ 468 | "\n", 469 | "\n", 470 | "\n", 471 | "\t\n", 472 | "\t\n", 473 | "\n", 474 | "\n", 475 | "\t\n", 476 | "\t\n", 477 | "\t\n", 478 | "\t\n", 479 | "\t\n", 480 | "\t\n", 481 | "\n", 482 | "
A data.frame: 6 × 31
YearStartYearEndLocationAbbrLocationDescDatasourceClassTopicQuestionData_Value_UnitData_Value_TypeGeoLocationClassIDTopicIDQuestionIDDataValueTypeIDLocationIDStratificationCategory1Stratification1StratificationCategoryId1StratificationID1
<int><int><chr><chr><chr><chr><chr><chr><lgl><chr><chr><chr><chr><chr><chr><int><chr><chr><chr><chr>
120192019ALAlabama Youth Risk Behavior Surveillance SystemSugar Drinks Sugar Drinks - BehaviorPercent of students in grades 9-12 who drank regular soda/pop at least one time per dayNAValue(32.840571122, -86.631860762) SD SD1 Q058VALUE 1Race/EthnicityHispanicRACE RACEHIS
220192019IDIdaho Youth Risk Behavior Surveillance SystemSugar Drinks Sugar Drinks - BehaviorPercent of students in grades 9-12 who drank regular soda/pop at least one time per dayNAValue(43.682630005, -114.363730042) SD SD1 Q058VALUE16Race/EthnicityHispanicRACE RACEHIS
320192019IAIowa Youth Risk Behavior Surveillance SystemObesity / Weight StatusObesity / Weight StatusPercent of students in grades 9-12 who have obesity NAValue(42.469400913, -93.816490556) OWSOWS1Q038VALUE19Grade 11th GRADEGRADE11
420192019LALouisiana Youth Risk Behavior Surveillance SystemObesity / Weight StatusObesity / Weight StatusPercent of students in grades 9-12 who have obesity NAValue(31.312660644, -92.445680071) OWSOWS1Q038VALUE22Gender Female GEN FEMALE
520192019MEMaine Youth Risk Behavior Surveillance SystemObesity / Weight StatusObesity / Weight StatusPercent of students in grades 9-12 who have an overweight classification NAValue(45.254228894001, -68.985031336)OWSOWS1Q039VALUE23Race/EthnicityHispanicRACE RACEHIS
620192019MAMassachusettsYouth Risk Behavior Surveillance SystemObesity / Weight StatusObesity / Weight StatusPercent of students in grades 9-12 who have an overweight classification NAValue(42.27687047, -72.082690675) OWSOWS1Q039VALUE25Total Total OVR OVERALL
\n" 483 | ] 484 | }, 485 | "metadata": { 486 | "tags": [] 487 | } 488 | } 489 | ] 490 | } 491 | ] 492 | } -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | # medium_tutorials 2 | ## Reference files supporting the posts published at https://medium.com/@k8wall 3 | --------------------------------------------------------------------------------