├── .gitignore
├── 01-Loading Data.ipynb
├── 02-DataFrame and Series.ipynb
├── 03-Indexes.ipynb
├── 04-Filtering.ipynb
├── 05-Updating Rows and Columns.ipynb
├── 06-Add Remove Rows and Columns.ipynb
├── 07-Sorting Data.ipynb
├── 08-Grouping and Aggregating.ipynb
├── 09-Cleaning Data.ipynb
├── 10-Working with Dates and Time Series Data.ipynb
├── 11-Reading and Writing Data.ipynb
├── README.md
├── data
    ├── ETH_1h.csv.zip
    ├── README_2019.txt
    ├── so_survey_2019.pdf
    ├── survey_results_public.csv.zip
    ├── survey_results_schema.csv
    └── survey_results_schema.csv.zip
└── requirements.txt


/.gitignore:
--------------------------------------------------------------------------------
  1 | # Byte-compiled / optimized / DLL files
  2 | __pycache__/
  3 | *.py[cod]
  4 | *$py.class
  5 | 
  6 | # C extensions
  7 | *.so
  8 | 
  9 | # Distribution / packaging
 10 | .Python
 11 | build/
 12 | develop-eggs/
 13 | dist/
 14 | downloads/
 15 | eggs/
 16 | .eggs/
 17 | lib/
 18 | lib64/
 19 | parts/
 20 | sdist/
 21 | var/
 22 | wheels/
 23 | share/python-wheels/
 24 | *.egg-info/
 25 | .installed.cfg
 26 | *.egg
 27 | MANIFEST
 28 | 
 29 | # PyInstaller
 30 | #  Usually these files are written by a python script from a template
 31 | #  before PyInstaller builds the exe, so as to inject date/other infos into it.
 32 | *.manifest
 33 | *.spec
 34 | 
 35 | # Installer logs
 36 | pip-log.txt
 37 | pip-delete-this-directory.txt
 38 | 
 39 | # Unit test / coverage reports
 40 | htmlcov/
 41 | .tox/
 42 | .nox/
 43 | .coverage
 44 | .coverage.*
 45 | .cache
 46 | nosetests.xml
 47 | coverage.xml
 48 | *.cover
 49 | *.py,cover
 50 | .hypothesis/
 51 | .pytest_cache/
 52 | cover/
 53 | 
 54 | # Translations
 55 | *.mo
 56 | *.pot
 57 | 
 58 | # Django stuff:
 59 | *.log
 60 | local_settings.py
 61 | db.sqlite3
 62 | db.sqlite3-journal
 63 | 
 64 | # Flask stuff:
 65 | instance/
 66 | .webassets-cache
 67 | 
 68 | # Scrapy stuff:
 69 | .scrapy
 70 | 
 71 | # Sphinx documentation
 72 | docs/_build/
 73 | 
 74 | # PyBuilder
 75 | .pybuilder/
 76 | target/
 77 | 
 78 | # Jupyter Notebook
 79 | .ipynb_checkpoints
 80 | 
 81 | # IPython
 82 | profile_default/
 83 | ipython_config.py
 84 | 
 85 | # pyenv
 86 | #   For a library or package, you might want to ignore these files since the code is
 87 | #   intended to run in multiple environments; otherwise, check them in:
 88 | # .python-version
 89 | 
 90 | # pipenv
 91 | #   According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
 92 | #   However, in case of collaboration, if having platform-specific dependencies or dependencies
 93 | #   having no cross-platform support, pipenv may install dependencies that don't work, or not
 94 | #   install all needed dependencies.
 95 | #Pipfile.lock
 96 | 
 97 | # poetry
 98 | #   Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
 99 | #   This is especially recommended for binary packages to ensure reproducibility, and is more
100 | #   commonly ignored for libraries.
101 | #   https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
102 | #poetry.lock
103 | 
104 | # PEP 582; used by e.g. github.com/David-OConnor/pyflow
105 | __pypackages__/
106 | 
107 | # Celery stuff
108 | celerybeat-schedule
109 | celerybeat.pid
110 | 
111 | # SageMath parsed files
112 | *.sage.py
113 | 
114 | # Environments
115 | .env
116 | .venv
117 | env/
118 | venv/
119 | ENV/
120 | env.bak/
121 | venv.bak/
122 | 
123 | # Spyder project settings
124 | .spyderproject
125 | .spyproject
126 | 
127 | # Rope project settings
128 | .ropeproject
129 | 
130 | # mkdocs documentation
131 | /site
132 | 
133 | # mypy
134 | .mypy_cache/
135 | .dmypy.json
136 | dmypy.json
137 | 
138 | # Pyre type checker
139 | .pyre/
140 | 
141 | # pytype static type analyzer
142 | .pytype/
143 | 
144 | # Cython debug symbols
145 | cython_debug/
146 | 
147 | # PyCharm
148 | #  JetBrains specific template is maintained in a separate JetBrains.gitignore that can
149 | #  be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
150 | #  and can be added to the global gitignore or merged into this file.  For a more nuclear
151 | #  option (not recommended) you can uncomment the following to ignore the entire idea folder.
152 | #.idea/
153 | 
154 | *.csv
155 | *.json
156 | *.tsv
157 | *.xlsx
158 | 
159 | 


--------------------------------------------------------------------------------
/02-DataFrame and Series.ipynb:
--------------------------------------------------------------------------------
   1 | {
   2 |  "cells": [
   3 |   {
   4 |    "cell_type": "markdown",
   5 |    "metadata": {},
   6 |    "source": [
   7 |     "# DataFrame and Series Basics"
   8 |    ]
   9 |   },
  10 |   {
  11 |    "cell_type": "code",
  12 |    "execution_count": 3,
  13 |    "metadata": {},
  14 |    "outputs": [],
  15 |    "source": [
  16 |     "import pandas as pd"
  17 |    ]
  18 |   },
  19 |   {
  20 |    "cell_type": "code",
  21 |    "execution_count": 4,
  22 |    "metadata": {},
  23 |    "outputs": [],
  24 |    "source": [
  25 |     "person = {\n",
  26 |     "    \"first\": \"Phil\",\n",
  27 |     "    \"last\": \"Lembo\",\n",
  28 |     "    \"email\": \"phil.lembo@gmail.com\"\n",
  29 |     "}"
  30 |    ]
  31 |   },
  32 |   {
  33 |    "cell_type": "code",
  34 |    "execution_count": 5,
  35 |    "metadata": {},
  36 |    "outputs": [],
  37 |    "source": [
  38 |     "people = {\n",
  39 |     "    \"first\": [\"Phil\"],\n",
  40 |     "    \"last\": [\"Lembo\"],\n",
  41 |     "    \"email\": [\"phil.lembo@gmail.com\"]\n",
  42 |     "}"
  43 |    ]
  44 |   },
  45 |   {
  46 |    "cell_type": "code",
  47 |    "execution_count": 6,
  48 |    "metadata": {},
  49 |    "outputs": [],
  50 |    "source": [
  51 |     "people = {\n",
  52 |     "    \"first\": [\"Phil\", \"Jane\", \"Rob\"],\n",
  53 |     "    \"last\": [\"Lembo\", \"Doe\", \"Roe\"],\n",
  54 |     "    \"email\": [\"phil.lembo@gmail.com\", \"janedoe@email.com\", \"robroe@email.com\"]\n",
  55 |     "}"
  56 |    ]
  57 |   },
  58 |   {
  59 |    "cell_type": "code",
  60 |    "execution_count": 7,
  61 |    "metadata": {},
  62 |    "outputs": [
  63 |     {
  64 |      "data": {
  65 |       "text/plain": [
  66 |        "['phil.lembo@gmail.com', 'janedoe@email.com', 'robroe@email.com']"
  67 |       ]
  68 |      },
  69 |      "execution_count": 7,
  70 |      "metadata": {},
  71 |      "output_type": "execute_result"
  72 |     }
  73 |    ],
  74 |    "source": [
  75 |     "people[\"email\"]"
  76 |    ]
  77 |   },
  78 |   {
  79 |    "cell_type": "code",
  80 |    "execution_count": 8,
  81 |    "metadata": {},
  82 |    "outputs": [],
  83 |    "source": [
  84 |     "df = pd.DataFrame(people)"
  85 |    ]
  86 |   },
  87 |   {
  88 |    "cell_type": "code",
  89 |    "execution_count": 9,
  90 |    "metadata": {},
  91 |    "outputs": [
  92 |     {
  93 |      "data": {
  94 |       "text/html": [
  95 |        "<div>\n",
  96 |        "<style scoped>\n",
  97 |        "    .dataframe tbody tr th:only-of-type {\n",
  98 |        "        vertical-align: middle;\n",
  99 |        "    }\n",
 100 |        "\n",
 101 |        "    .dataframe tbody tr th {\n",
 102 |        "        vertical-align: top;\n",
 103 |        "    }\n",
 104 |        "\n",
 105 |        "    .dataframe thead th {\n",
 106 |        "        text-align: right;\n",
 107 |        "    }\n",
 108 |        "</style>\n",
 109 |        "<table border=\"1\" class=\"dataframe\">\n",
 110 |        "  <thead>\n",
 111 |        "    <tr style=\"text-align: right;\">\n",
 112 |        "      <th></th>\n",
 113 |        "      <th>first</th>\n",
 114 |        "      <th>last</th>\n",
 115 |        "      <th>email</th>\n",
 116 |        "    </tr>\n",
 117 |        "  </thead>\n",
 118 |        "  <tbody>\n",
 119 |        "    <tr>\n",
 120 |        "      <th>0</th>\n",
 121 |        "      <td>Phil</td>\n",
 122 |        "      <td>Lembo</td>\n",
 123 |        "      <td>phil.lembo@gmail.com</td>\n",
 124 |        "    </tr>\n",
 125 |        "    <tr>\n",
 126 |        "      <th>1</th>\n",
 127 |        "      <td>Jane</td>\n",
 128 |        "      <td>Doe</td>\n",
 129 |        "      <td>janedoe@email.com</td>\n",
 130 |        "    </tr>\n",
 131 |        "    <tr>\n",
 132 |        "      <th>2</th>\n",
 133 |        "      <td>Rob</td>\n",
 134 |        "      <td>Roe</td>\n",
 135 |        "      <td>robroe@email.com</td>\n",
 136 |        "    </tr>\n",
 137 |        "  </tbody>\n",
 138 |        "</table>\n",
 139 |        "</div>"
 140 |       ],
 141 |       "text/plain": [
 142 |        "  first   last                 email\n",
 143 |        "0  Phil  Lembo  phil.lembo@gmail.com\n",
 144 |        "1  Jane    Doe     janedoe@email.com\n",
 145 |        "2   Rob    Roe      robroe@email.com"
 146 |       ]
 147 |      },
 148 |      "execution_count": 9,
 149 |      "metadata": {},
 150 |      "output_type": "execute_result"
 151 |     }
 152 |    ],
 153 |    "source": [
 154 |     "df"
 155 |    ]
 156 |   },
 157 |   {
 158 |    "cell_type": "markdown",
 159 |    "metadata": {},
 160 |    "source": [
 161 |     "There are two major data types in pandas: DataFrames and Series, and df here has the DataFrame data type."
 162 |    ]
 163 |   },
 164 |   {
 165 |    "cell_type": "code",
 166 |    "execution_count": 40,
 167 |    "metadata": {},
 168 |    "outputs": [
 169 |     {
 170 |      "data": {
 171 |       "text/plain": [
 172 |        "pandas.core.frame.DataFrame"
 173 |       ]
 174 |      },
 175 |      "execution_count": 40,
 176 |      "metadata": {},
 177 |      "output_type": "execute_result"
 178 |     }
 179 |    ],
 180 |    "source": [
 181 |     "type(df)"
 182 |    ]
 183 |   },
 184 |   {
 185 |    "cell_type": "code",
 186 |    "execution_count": 10,
 187 |    "metadata": {},
 188 |    "outputs": [
 189 |     {
 190 |      "data": {
 191 |       "text/plain": [
 192 |        "0    phil.lembo@gmail.com\n",
 193 |        "1       janedoe@email.com\n",
 194 |        "2        robroe@email.com\n",
 195 |        "Name: email, dtype: object"
 196 |       ]
 197 |      },
 198 |      "execution_count": 10,
 199 |      "metadata": {},
 200 |      "output_type": "execute_result"
 201 |     }
 202 |    ],
 203 |    "source": [
 204 |     "df['email']"
 205 |    ]
 206 |   },
 207 |   {
 208 |    "cell_type": "markdown",
 209 |    "metadata": {},
 210 |    "source": [
 211 |     "The type of the data stored in email is a pandas Series."
 212 |    ]
 213 |   },
 214 |   {
 215 |    "cell_type": "code",
 216 |    "execution_count": 11,
 217 |    "metadata": {},
 218 |    "outputs": [
 219 |     {
 220 |      "data": {
 221 |       "text/plain": [
 222 |        "pandas.core.series.Series"
 223 |       ]
 224 |      },
 225 |      "execution_count": 11,
 226 |      "metadata": {},
 227 |      "output_type": "execute_result"
 228 |     }
 229 |    ],
 230 |    "source": [
 231 |     "type(df['email'])"
 232 |    ]
 233 |   },
 234 |   {
 235 |    "cell_type": "markdown",
 236 |    "metadata": {},
 237 |    "source": [
 238 |     "Dot notation (df.email) is an alternative way of accessing the email column, but a column whose name matches a DataFrame attribute or method would be shadowed by it, so bracket notation is safer."
 239 |    ]
 240 |   },
 241 |   {
 242 |    "cell_type": "code",
 243 |    "execution_count": 12,
 244 |    "metadata": {},
 245 |    "outputs": [
 246 |     {
 247 |      "data": {
 248 |       "text/plain": [
 249 |        "0    phil.lembo@gmail.com\n",
 250 |        "1       janedoe@email.com\n",
 251 |        "2        robroe@email.com\n",
 252 |        "Name: email, dtype: object"
 253 |       ]
 254 |      },
 255 |      "execution_count": 12,
 256 |      "metadata": {},
 257 |      "output_type": "execute_result"
 258 |     }
 259 |    ],
 260 |    "source": [
 261 |     "df.email"
 262 |    ]
 263 |   },
 264 |   {
 265 |    "cell_type": "markdown",
 266 |    "metadata": {},
 267 |    "source": [
 268 |     "Pass a list of columns using double-bracket notation."
 269 |    ]
 270 |   },
 271 |   {
 272 |    "cell_type": "code",
 273 |    "execution_count": 13,
 274 |    "metadata": {},
 275 |    "outputs": [
 276 |     {
 277 |      "data": {
 278 |       "text/html": [
 279 |        "<div>\n",
 280 |        "<style scoped>\n",
 281 |        "    .dataframe tbody tr th:only-of-type {\n",
 282 |        "        vertical-align: middle;\n",
 283 |        "    }\n",
 284 |        "\n",
 285 |        "    .dataframe tbody tr th {\n",
 286 |        "        vertical-align: top;\n",
 287 |        "    }\n",
 288 |        "\n",
 289 |        "    .dataframe thead th {\n",
 290 |        "        text-align: right;\n",
 291 |        "    }\n",
 292 |        "</style>\n",
 293 |        "<table border=\"1\" class=\"dataframe\">\n",
 294 |        "  <thead>\n",
 295 |        "    <tr style=\"text-align: right;\">\n",
 296 |        "      <th></th>\n",
 297 |        "      <th>last</th>\n",
 298 |        "      <th>email</th>\n",
 299 |        "    </tr>\n",
 300 |        "  </thead>\n",
 301 |        "  <tbody>\n",
 302 |        "    <tr>\n",
 303 |        "      <th>0</th>\n",
 304 |        "      <td>Lembo</td>\n",
 305 |        "      <td>phil.lembo@gmail.com</td>\n",
 306 |        "    </tr>\n",
 307 |        "    <tr>\n",
 308 |        "      <th>1</th>\n",
 309 |        "      <td>Doe</td>\n",
 310 |        "      <td>janedoe@email.com</td>\n",
 311 |        "    </tr>\n",
 312 |        "    <tr>\n",
 313 |        "      <th>2</th>\n",
 314 |        "      <td>Roe</td>\n",
 315 |        "      <td>robroe@email.com</td>\n",
 316 |        "    </tr>\n",
 317 |        "  </tbody>\n",
 318 |        "</table>\n",
 319 |        "</div>"
 320 |       ],
 321 |       "text/plain": [
 322 |        "    last                 email\n",
 323 |        "0  Lembo  phil.lembo@gmail.com\n",
 324 |        "1    Doe     janedoe@email.com\n",
 325 |        "2    Roe      robroe@email.com"
 326 |       ]
 327 |      },
 328 |      "execution_count": 13,
 329 |      "metadata": {},
 330 |      "output_type": "execute_result"
 331 |     }
 332 |    ],
 333 |    "source": [
 334 |     "df[['last', 'email']]"
 335 |    ]
 336 |   },
 337 |   {
 338 |    "cell_type": "markdown",
 339 |    "metadata": {},
 340 |    "source": [
 341 |     "This retrieves a DataFrame."
 342 |    ]
 343 |   },
 344 |   {
 345 |    "cell_type": "code",
 346 |    "execution_count": 14,
 347 |    "metadata": {},
 348 |    "outputs": [
 349 |     {
 350 |      "data": {
 351 |       "text/plain": [
 352 |        "pandas.core.frame.DataFrame"
 353 |       ]
 354 |      },
 355 |      "execution_count": 14,
 356 |      "metadata": {},
 357 |      "output_type": "execute_result"
 358 |     }
 359 |    ],
 360 |    "source": [
 361 |     "type(df[['last', 'email']])"
 362 |    ]
 363 |   },
 364 |   {
 365 |    "cell_type": "markdown",
 366 |    "metadata": {},
 367 |    "source": [
 368 |     "Show columns in dataframe."
 369 |    ]
 370 |   },
 371 |   {
 372 |    "cell_type": "code",
 373 |    "execution_count": 15,
 374 |    "metadata": {},
 375 |    "outputs": [
 376 |     {
 377 |      "data": {
 378 |       "text/plain": [
 379 |        "Index(['first', 'last', 'email'], dtype='object')"
 380 |       ]
 381 |      },
 382 |      "execution_count": 15,
 383 |      "metadata": {},
 384 |      "output_type": "execute_result"
 385 |     }
 386 |    ],
 387 |    "source": [
 388 |     "df.columns"
 389 |    ]
 390 |   },
 391 |   {
 392 |    "cell_type": "markdown",
 393 |    "metadata": {},
 394 |    "source": [
 395 |     "To get rows, use loc and iloc indexers.\n",
 396 |     "\n",
 397 |     "iloc = \"integer location\", search by integer position\n",
 398 |     "\n",
 399 |     "loc = search by label\n"
 400 |    ]
 401 |   },
 402 |   {
 403 |    "cell_type": "code",
 404 |    "execution_count": 16,
 405 |    "metadata": {},
 406 |    "outputs": [
 407 |     {
 408 |      "data": {
 409 |       "text/plain": [
 410 |        "first                    Phil\n",
 411 |        "last                    Lembo\n",
 412 |        "email    phil.lembo@gmail.com\n",
 413 |        "Name: 0, dtype: object"
 414 |       ]
 415 |      },
 416 |      "execution_count": 16,
 417 |      "metadata": {},
 418 |      "output_type": "execute_result"
 419 |     }
 420 |    ],
 421 |    "source": [
 422 |     "df.iloc[0]"
 423 |    ]
 424 |   },
 425 |   {
 426 |    "cell_type": "code",
 427 |    "execution_count": 17,
 428 |    "metadata": {},
 429 |    "outputs": [
 430 |     {
 431 |      "data": {
 432 |       "text/plain": [
 433 |        "pandas.core.series.Series"
 434 |       ]
 435 |      },
 436 |      "execution_count": 17,
 437 |      "metadata": {},
 438 |      "output_type": "execute_result"
 439 |     }
 440 |    ],
 441 |    "source": [
 442 |     "type(df.iloc[0])"
 443 |    ]
 444 |   },
 445 |   {
 446 |    "cell_type": "code",
 447 |    "execution_count": 18,
 448 |    "metadata": {},
 449 |    "outputs": [
 450 |     {
 451 |      "data": {
 452 |       "text/html": [
 453 |        "<div>\n",
 454 |        "<style scoped>\n",
 455 |        "    .dataframe tbody tr th:only-of-type {\n",
 456 |        "        vertical-align: middle;\n",
 457 |        "    }\n",
 458 |        "\n",
 459 |        "    .dataframe tbody tr th {\n",
 460 |        "        vertical-align: top;\n",
 461 |        "    }\n",
 462 |        "\n",
 463 |        "    .dataframe thead th {\n",
 464 |        "        text-align: right;\n",
 465 |        "    }\n",
 466 |        "</style>\n",
 467 |        "<table border=\"1\" class=\"dataframe\">\n",
 468 |        "  <thead>\n",
 469 |        "    <tr style=\"text-align: right;\">\n",
 470 |        "      <th></th>\n",
 471 |        "      <th>first</th>\n",
 472 |        "      <th>last</th>\n",
 473 |        "      <th>email</th>\n",
 474 |        "    </tr>\n",
 475 |        "  </thead>\n",
 476 |        "  <tbody>\n",
 477 |        "    <tr>\n",
 478 |        "      <th>0</th>\n",
 479 |        "      <td>Phil</td>\n",
 480 |        "      <td>Lembo</td>\n",
 481 |        "      <td>phil.lembo@gmail.com</td>\n",
 482 |        "    </tr>\n",
 483 |        "    <tr>\n",
 484 |        "      <th>1</th>\n",
 485 |        "      <td>Jane</td>\n",
 486 |        "      <td>Doe</td>\n",
 487 |        "      <td>janedoe@email.com</td>\n",
 488 |        "    </tr>\n",
 489 |        "  </tbody>\n",
 490 |        "</table>\n",
 491 |        "</div>"
 492 |       ],
 493 |       "text/plain": [
 494 |        "  first   last                 email\n",
 495 |        "0  Phil  Lembo  phil.lembo@gmail.com\n",
 496 |        "1  Jane    Doe     janedoe@email.com"
 497 |       ]
 498 |      },
 499 |      "execution_count": 18,
 500 |      "metadata": {},
 501 |      "output_type": "execute_result"
 502 |     }
 503 |    ],
 504 |    "source": [
 505 |     "df.iloc[[0, 1]]"
 506 |    ]
 507 |   },
 508 |   {
 509 |    "cell_type": "markdown",
 510 |    "metadata": {},
 511 |    "source": [
 512 |     "Grab first two rows of the email column (column 3, index 2)."
 513 |    ]
 514 |   },
 515 |   {
 516 |    "cell_type": "code",
 517 |    "execution_count": 19,
 518 |    "metadata": {},
 519 |    "outputs": [
 520 |     {
 521 |      "data": {
 522 |       "text/plain": [
 523 |        "0    phil.lembo@gmail.com\n",
 524 |        "1       janedoe@email.com\n",
 525 |        "Name: email, dtype: object"
 526 |       ]
 527 |      },
 528 |      "execution_count": 19,
 529 |      "metadata": {},
 530 |      "output_type": "execute_result"
 531 |     }
 532 |    ],
 533 |    "source": [
 534 |     "df.iloc[[0, 1], 2]"
 535 |    ]
 536 |   },
 537 |   {
 538 |    "cell_type": "markdown",
 539 |    "metadata": {},
 540 |    "source": [
 541 |     "Using loc without custom labels looks a lot like iloc, because the default row labels are integers."
 542 |    ]
 543 |   },
 544 |   {
 545 |    "cell_type": "code",
 546 |    "execution_count": 20,
 547 |    "metadata": {},
 548 |    "outputs": [
 549 |     {
 550 |      "data": {
 551 |       "text/plain": [
 552 |        "first                    Phil\n",
 553 |        "last                    Lembo\n",
 554 |        "email    phil.lembo@gmail.com\n",
 555 |        "Name: 0, dtype: object"
 556 |       ]
 557 |      },
 558 |      "execution_count": 20,
 559 |      "metadata": {},
 560 |      "output_type": "execute_result"
 561 |     }
 562 |    ],
 563 |    "source": [
 564 |     "df.loc[0]"
 565 |    ]
 566 |   },
 567 |   {
 568 |    "cell_type": "code",
 569 |    "execution_count": 21,
 570 |    "metadata": {},
 571 |    "outputs": [
 572 |     {
 573 |      "data": {
 574 |       "text/html": [
 575 |        "<div>\n",
 576 |        "<style scoped>\n",
 577 |        "    .dataframe tbody tr th:only-of-type {\n",
 578 |        "        vertical-align: middle;\n",
 579 |        "    }\n",
 580 |        "\n",
 581 |        "    .dataframe tbody tr th {\n",
 582 |        "        vertical-align: top;\n",
 583 |        "    }\n",
 584 |        "\n",
 585 |        "    .dataframe thead th {\n",
 586 |        "        text-align: right;\n",
 587 |        "    }\n",
 588 |        "</style>\n",
 589 |        "<table border=\"1\" class=\"dataframe\">\n",
 590 |        "  <thead>\n",
 591 |        "    <tr style=\"text-align: right;\">\n",
 592 |        "      <th></th>\n",
 593 |        "      <th>first</th>\n",
 594 |        "      <th>last</th>\n",
 595 |        "      <th>email</th>\n",
 596 |        "    </tr>\n",
 597 |        "  </thead>\n",
 598 |        "  <tbody>\n",
 599 |        "    <tr>\n",
 600 |        "      <th>0</th>\n",
 601 |        "      <td>Phil</td>\n",
 602 |        "      <td>Lembo</td>\n",
 603 |        "      <td>phil.lembo@gmail.com</td>\n",
 604 |        "    </tr>\n",
 605 |        "    <tr>\n",
 606 |        "      <th>1</th>\n",
 607 |        "      <td>Jane</td>\n",
 608 |        "      <td>Doe</td>\n",
 609 |        "      <td>janedoe@email.com</td>\n",
 610 |        "    </tr>\n",
 611 |        "  </tbody>\n",
 612 |        "</table>\n",
 613 |        "</div>"
 614 |       ],
 615 |       "text/plain": [
 616 |        "  first   last                 email\n",
 617 |        "0  Phil  Lembo  phil.lembo@gmail.com\n",
 618 |        "1  Jane    Doe     janedoe@email.com"
 619 |       ]
 620 |      },
 621 |      "execution_count": 21,
 622 |      "metadata": {},
 623 |      "output_type": "execute_result"
 624 |     }
 625 |    ],
 626 |    "source": [
 627 |     "df.loc[[0, 1]]"
 628 |    ]
 629 |   },
 630 |   {
 631 |    "cell_type": "markdown",
 632 |    "metadata": {},
 633 |    "source": [
 634 |     "But now we can use a column label."
 635 |    ]
 636 |   },
 637 |   {
 638 |    "cell_type": "code",
 639 |    "execution_count": 22,
 640 |    "metadata": {},
 641 |    "outputs": [
 642 |     {
 643 |      "data": {
 644 |       "text/plain": [
 645 |        "0    phil.lembo@gmail.com\n",
 646 |        "1       janedoe@email.com\n",
 647 |        "Name: email, dtype: object"
 648 |       ]
 649 |      },
 650 |      "execution_count": 22,
 651 |      "metadata": {},
 652 |      "output_type": "execute_result"
 653 |     }
 654 |    ],
 655 |    "source": [
 656 |     "df.loc[[0, 1], 'email']"
 657 |    ]
 658 |   },
 659 |   {
 660 |    "cell_type": "markdown",
 661 |    "metadata": {},
 662 |    "source": [
 663 |     "... or a list of labels!"
 664 |    ]
 665 |   },
 666 |   {
 667 |    "cell_type": "code",
 668 |    "execution_count": 23,
 669 |    "metadata": {},
 670 |    "outputs": [
 671 |     {
 672 |      "data": {
 673 |       "text/html": [
 674 |        "<div>\n",
 675 |        "<style scoped>\n",
 676 |        "    .dataframe tbody tr th:only-of-type {\n",
 677 |        "        vertical-align: middle;\n",
 678 |        "    }\n",
 679 |        "\n",
 680 |        "    .dataframe tbody tr th {\n",
 681 |        "        vertical-align: top;\n",
 682 |        "    }\n",
 683 |        "\n",
 684 |        "    .dataframe thead th {\n",
 685 |        "        text-align: right;\n",
 686 |        "    }\n",
 687 |        "</style>\n",
 688 |        "<table border=\"1\" class=\"dataframe\">\n",
 689 |        "  <thead>\n",
 690 |        "    <tr style=\"text-align: right;\">\n",
 691 |        "      <th></th>\n",
 692 |        "      <th>email</th>\n",
 693 |        "      <th>last</th>\n",
 694 |        "    </tr>\n",
 695 |        "  </thead>\n",
 696 |        "  <tbody>\n",
 697 |        "    <tr>\n",
 698 |        "      <th>0</th>\n",
 699 |        "      <td>phil.lembo@gmail.com</td>\n",
 700 |        "      <td>Lembo</td>\n",
 701 |        "    </tr>\n",
 702 |        "    <tr>\n",
 703 |        "      <th>1</th>\n",
 704 |        "      <td>janedoe@email.com</td>\n",
 705 |        "      <td>Doe</td>\n",
 706 |        "    </tr>\n",
 707 |        "  </tbody>\n",
 708 |        "</table>\n",
 709 |        "</div>"
 710 |       ],
 711 |       "text/plain": [
 712 |        "                  email   last\n",
 713 |        "0  phil.lembo@gmail.com  Lembo\n",
 714 |        "1     janedoe@email.com    Doe"
 715 |       ]
 716 |      },
 717 |      "execution_count": 23,
 718 |      "metadata": {},
 719 |      "output_type": "execute_result"
 720 |     }
 721 |    ],
 722 |    "source": [
 723 |     "df.loc[[0, 1], ['email', 'last']]"
 724 |    ]
 725 |   },
 726 |   {
 727 |    "cell_type": "code",
 728 |    "execution_count": 24,
 729 |    "metadata": {},
 730 |    "outputs": [],
 731 |    "source": [
 732 |     "res_df = pd.read_csv('data/survey_results_public.csv')\n",
 733 |     "schema_df = pd.read_csv('data/survey_results_schema.csv')\n",
 734 |     "pd.set_option('display.max_columns', 85)\n",
 735 |     "pd.set_option('display.max_rows', 85)"
 736 |    ]
 737 |   },
 738 |   {
 739 |    "cell_type": "markdown",
 740 |    "metadata": {},
 741 |    "source": [
 742 |     "Basic characteristics of dataframe (number of rows, number of columns)."
 743 |    ]
 744 |   },
 745 |   {
 746 |    "cell_type": "code",
 747 |    "execution_count": 25,
 748 |    "metadata": {},
 749 |    "outputs": [
 750 |     {
 751 |      "data": {
 752 |       "text/plain": [
 753 |        "(88883, 85)"
 754 |       ]
 755 |      },
 756 |      "execution_count": 25,
 757 |      "metadata": {},
 758 |      "output_type": "execute_result"
 759 |     }
 760 |    ],
 761 |    "source": [
 762 |     "res_df.shape"
 763 |    ]
 764 |   },
 765 |   {
 766 |    "cell_type": "markdown",
 767 |    "metadata": {},
 768 |    "source": [
 769 |     "List all the column labels."
 770 |    ]
 771 |   },
 772 |   {
 773 |    "cell_type": "code",
 774 |    "execution_count": 26,
 775 |    "metadata": {},
 776 |    "outputs": [
 777 |     {
 778 |      "data": {
 779 |       "text/plain": [
 780 |        "Index(['Respondent', 'MainBranch', 'Hobbyist', 'OpenSourcer', 'OpenSource',\n",
 781 |        "       'Employment', 'Country', 'Student', 'EdLevel', 'UndergradMajor',\n",
 782 |        "       'EduOther', 'OrgSize', 'DevType', 'YearsCode', 'Age1stCode',\n",
 783 |        "       'YearsCodePro', 'CareerSat', 'JobSat', 'MgrIdiot', 'MgrMoney',\n",
 784 |        "       'MgrWant', 'JobSeek', 'LastHireDate', 'LastInt', 'FizzBuzz',\n",
 785 |        "       'JobFactors', 'ResumeUpdate', 'CurrencySymbol', 'CurrencyDesc',\n",
 786 |        "       'CompTotal', 'CompFreq', 'ConvertedComp', 'WorkWeekHrs', 'WorkPlan',\n",
 787 |        "       'WorkChallenge', 'WorkRemote', 'WorkLoc', 'ImpSyn', 'CodeRev',\n",
 788 |        "       'CodeRevHrs', 'UnitTests', 'PurchaseHow', 'PurchaseWhat',\n",
 789 |        "       'LanguageWorkedWith', 'LanguageDesireNextYear', 'DatabaseWorkedWith',\n",
 790 |        "       'DatabaseDesireNextYear', 'PlatformWorkedWith',\n",
 791 |        "       'PlatformDesireNextYear', 'WebFrameWorkedWith',\n",
 792 |        "       'WebFrameDesireNextYear', 'MiscTechWorkedWith',\n",
 793 |        "       'MiscTechDesireNextYear', 'DevEnviron', 'OpSys', 'Containers',\n",
 794 |        "       'BlockchainOrg', 'BlockchainIs', 'BetterLife', 'ITperson', 'OffOn',\n",
 795 |        "       'SocialMedia', 'Extraversion', 'ScreenName', 'SOVisit1st',\n",
 796 |        "       'SOVisitFreq', 'SOVisitTo', 'SOFindAnswer', 'SOTimeSaved',\n",
 797 |        "       'SOHowMuchTime', 'SOAccount', 'SOPartFreq', 'SOJobs', 'EntTeams',\n",
 798 |        "       'SOComm', 'WelcomeChange', 'SONewContent', 'Age', 'Gender', 'Trans',\n",
 799 |        "       'Sexuality', 'Ethnicity', 'Dependents', 'SurveyLength', 'SurveyEase'],\n",
 800 |        "      dtype='object')"
 801 |       ]
 802 |      },
 803 |      "execution_count": 26,
 804 |      "metadata": {},
 805 |      "output_type": "execute_result"
 806 |     }
 807 |    ],
 808 |    "source": [
 809 |     "res_df.columns"
 810 |    ]
 811 |   },
 812 |   {
 813 |    "cell_type": "markdown",
 814 |    "metadata": {},
 815 |    "source": [
 816 |     "All responses in the Hobbyist column."
 817 |    ]
 818 |   },
 819 |   {
 820 |    "cell_type": "code",
 821 |    "execution_count": 27,
 822 |    "metadata": {},
 823 |    "outputs": [
 824 |     {
 825 |      "data": {
 826 |       "text/plain": [
 827 |        "0        Yes\n",
 828 |        "1         No\n",
 829 |        "2        Yes\n",
 830 |        "3         No\n",
 831 |        "4        Yes\n",
 832 |        "        ... \n",
 833 |        "88878    Yes\n",
 834 |        "88879     No\n",
 835 |        "88880     No\n",
 836 |        "88881     No\n",
 837 |        "88882    Yes\n",
 838 |        "Name: Hobbyist, Length: 88883, dtype: object"
 839 |       ]
 840 |      },
 841 |      "execution_count": 27,
 842 |      "metadata": {},
 843 |      "output_type": "execute_result"
 844 |     }
 845 |    ],
 846 |    "source": [
 847 |     "res_df['Hobbyist']"
 848 |    ]
 849 |   },
 850 |   {
 851 |    "cell_type": "markdown",
 852 |    "metadata": {},
 853 |    "source": [
 854 |     "Number of each response to question ('Yeses' and 'Nos')."
 855 |    ]
 856 |   },
 857 |   {
 858 |    "cell_type": "code",
 859 |    "execution_count": 28,
 860 |    "metadata": {},
 861 |    "outputs": [
 862 |     {
 863 |      "data": {
 864 |       "text/plain": [
 865 |        "Yes    71257\n",
 866 |        "No     17626\n",
 867 |        "Name: Hobbyist, dtype: int64"
 868 |       ]
 869 |      },
 870 |      "execution_count": 28,
 871 |      "metadata": {},
 872 |      "output_type": "execute_result"
 873 |     }
 874 |    ],
 875 |    "source": [
 876 |     "res_df['Hobbyist'].value_counts()"
 877 |    ]
 878 |   },
 879 |   {
 880 |    "cell_type": "markdown",
 881 |    "metadata": {},
 882 |    "source": [
 883 |     "All responses from first row."
 884 |    ]
 885 |   },
 886 |   {
 887 |    "cell_type": "code",
 888 |    "execution_count": 29,
 889 |    "metadata": {},
 890 |    "outputs": [
 891 |     {
 892 |      "data": {
 893 |       "text/plain": [
 894 |        "Respondent                                                                1\n",
 895 |        "MainBranch                           I am a student who is learning to code\n",
 896 |        "Hobbyist                                                                Yes\n",
 897 |        "OpenSourcer                                                           Never\n",
 898 |        "OpenSource                The quality of OSS and closed source software ...\n",
 899 |        "Employment                           Not employed, and not looking for work\n",
 900 |        "Country                                                      United Kingdom\n",
 901 |        "Student                                                                  No\n",
 902 |        "EdLevel                                           Primary/elementary school\n",
 903 |        "UndergradMajor                                                          NaN\n",
 904 |        "EduOther                  Taught yourself a new language, framework, or ...\n",
 905 |        "OrgSize                                                                 NaN\n",
 906 |        "DevType                                                                 NaN\n",
 907 |        "YearsCode                                                                 4\n",
 908 |        "Age1stCode                                                               10\n",
 909 |        "YearsCodePro                                                            NaN\n",
 910 |        "CareerSat                                                               NaN\n",
 911 |        "JobSat                                                                  NaN\n",
 912 |        "MgrIdiot                                                                NaN\n",
 913 |        "MgrMoney                                                                NaN\n",
 914 |        "MgrWant                                                                 NaN\n",
 915 |        "JobSeek                                                                 NaN\n",
 916 |        "LastHireDate                                                            NaN\n",
 917 |        "LastInt                                                                 NaN\n",
 918 |        "FizzBuzz                                                                NaN\n",
 919 |        "JobFactors                                                              NaN\n",
 920 |        "ResumeUpdate                                                            NaN\n",
 921 |        "CurrencySymbol                                                          NaN\n",
 922 |        "CurrencyDesc                                                            NaN\n",
 923 |        "CompTotal                                                               NaN\n",
 924 |        "CompFreq                                                                NaN\n",
 925 |        "ConvertedComp                                                           NaN\n",
 926 |        "WorkWeekHrs                                                             NaN\n",
 927 |        "WorkPlan                                                                NaN\n",
 928 |        "WorkChallenge                                                           NaN\n",
 929 |        "WorkRemote                                                              NaN\n",
 930 |        "WorkLoc                                                                 NaN\n",
 931 |        "ImpSyn                                                                  NaN\n",
 932 |        "CodeRev                                                                 NaN\n",
 933 |        "CodeRevHrs                                                              NaN\n",
 934 |        "UnitTests                                                               NaN\n",
 935 |        "PurchaseHow                                                             NaN\n",
 936 |        "PurchaseWhat                                                            NaN\n",
 937 |        "LanguageWorkedWith                          HTML/CSS;Java;JavaScript;Python\n",
 938 |        "LanguageDesireNextYear      C;C++;C#;Go;HTML/CSS;Java;JavaScript;Python;SQL\n",
 939 |        "DatabaseWorkedWith                                                   SQLite\n",
 940 |        "DatabaseDesireNextYear                                                MySQL\n",
 941 |        "PlatformWorkedWith                                            MacOS;Windows\n",
 942 |        "PlatformDesireNextYear                              Android;Arduino;Windows\n",
 943 |        "WebFrameWorkedWith                                             Django;Flask\n",
 944 |        "WebFrameDesireNextYear                                         Flask;jQuery\n",
 945 |        "MiscTechWorkedWith                                                  Node.js\n",
 946 |        "MiscTechDesireNextYear                                              Node.js\n",
 947 |        "DevEnviron                                       IntelliJ;Notepad++;PyCharm\n",
 948 |        "OpSys                                                               Windows\n",
 949 |        "Containers                                          I do not use containers\n",
 950 |        "BlockchainOrg                                                           NaN\n",
 951 |        "BlockchainIs                                                            NaN\n",
 952 |        "BetterLife                                                              Yes\n",
 953 |        "ITperson                           Fortunately, someone else has that title\n",
 954 |        "OffOn                                                                   Yes\n",
 955 |        "SocialMedia                                                         Twitter\n",
 956 |        "Extraversion                                                         Online\n",
 957 |        "ScreenName                                                         Username\n",
 958 |        "SOVisit1st                                                             2017\n",
 959 |        "SOVisitFreq                                 A few times per month or weekly\n",
 960 |        "SOVisitTo                 Find answers to specific questions;Learn how t...\n",
 961 |        "SOFindAnswer                                             3-5 times per week\n",
 962 |        "SOTimeSaved                                  Stack Overflow was much faster\n",
 963 |        "SOHowMuchTime                                                 31-60 minutes\n",
 964 |        "SOAccount                                                                No\n",
 965 |        "SOPartFreq                                                              NaN\n",
 966 |        "SOJobs                    No, I didn't know that Stack Overflow had a jo...\n",
 967 |        "EntTeams                                No, and I don't know what those are\n",
 968 |        "SOComm                                                              Neutral\n",
 969 |        "WelcomeChange                       Just as welcome now as I felt last year\n",
 970 |        "SONewContent              Tech articles written by other developers;Indu...\n",
 971 |        "Age                                                                      14\n",
 972 |        "Gender                                                                  Man\n",
 973 |        "Trans                                                                    No\n",
 974 |        "Sexuality                                           Straight / Heterosexual\n",
 975 |        "Ethnicity                                                               NaN\n",
 976 |        "Dependents                                                               No\n",
 977 |        "SurveyLength                                          Appropriate in length\n",
 978 |        "SurveyEase                                       Neither easy nor difficult\n",
 979 |        "Name: 0, dtype: object"
 980 |       ]
 981 |      },
 982 |      "execution_count": 29,
 983 |      "metadata": {},
 984 |      "output_type": "execute_result"
 985 |     }
 986 |    ],
 987 |    "source": [
 988 |     "res_df.loc[0]"
 989 |    ]
 990 |   },
 991 |   {
 992 |    "cell_type": "markdown",
 993 |    "metadata": {},
 994 |    "source": [
 995 |     "Get the responses to the Hobbyist question in the first three rows by passing in a list of row labels."
 996 |    ]
 997 |   },
 998 |   {
 999 |    "cell_type": "code",
1000 |    "execution_count": 30,
1001 |    "metadata": {},
1002 |    "outputs": [
1003 |     {
1004 |      "data": {
1005 |       "text/plain": [
1006 |        "0    Yes\n",
1007 |        "1     No\n",
1008 |        "2    Yes\n",
1009 |        "Name: Hobbyist, dtype: object"
1010 |       ]
1011 |      },
1012 |      "execution_count": 30,
1013 |      "metadata": {},
1014 |      "output_type": "execute_result"
1015 |     }
1016 |    ],
1017 |    "source": [
1018 |     "res_df.loc[[0, 1, 2], 'Hobbyist']"
1019 |    ]
1020 |   },
1021 |   {
1022 |    "cell_type": "markdown",
1023 |    "metadata": {},
1024 |    "source": [
1025 |     "You can also use slice notation to retrieve a range of rows."
1026 |    ]
1027 |   },
1028 |   {
1029 |    "cell_type": "code",
1030 |    "execution_count": 34,
1031 |    "metadata": {},
1032 |    "outputs": [
1033 |     {
1034 |      "data": {
1035 |       "text/html": [
1036 |        "<div>\n",
1037 |        "<style scoped>\n",
1038 |        "    .dataframe tbody tr th:only-of-type {\n",
1039 |        "        vertical-align: middle;\n",
1040 |        "    }\n",
1041 |        "\n",
1042 |        "    .dataframe tbody tr th {\n",
1043 |        "        vertical-align: top;\n",
1044 |        "    }\n",
1045 |        "\n",
1046 |        "    .dataframe thead th {\n",
1047 |        "        text-align: right;\n",
1048 |        "    }\n",
1049 |        "</style>\n",
1050 |        "<table border=\"1\" class=\"dataframe\">\n",
1051 |        "  <thead>\n",
1052 |        "    <tr style=\"text-align: right;\">\n",
1053 |        "      <th></th>\n",
1054 |        "      <th>Respondent</th>\n",
1055 |        "      <th>MainBranch</th>\n",
1056 |        "      <th>Hobbyist</th>\n",
1057 |        "      <th>OpenSourcer</th>\n",
1058 |        "      <th>OpenSource</th>\n",
1059 |        "      <th>Employment</th>\n",
1060 |        "      <th>Country</th>\n",
1061 |        "      <th>Student</th>\n",
1062 |        "      <th>EdLevel</th>\n",
1063 |        "      <th>UndergradMajor</th>\n",
1064 |        "      <th>EduOther</th>\n",
1065 |        "      <th>OrgSize</th>\n",
1066 |        "      <th>DevType</th>\n",
1067 |        "      <th>YearsCode</th>\n",
1068 |        "      <th>Age1stCode</th>\n",
1069 |        "      <th>YearsCodePro</th>\n",
1070 |        "      <th>CareerSat</th>\n",
1071 |        "      <th>JobSat</th>\n",
1072 |        "      <th>MgrIdiot</th>\n",
1073 |        "      <th>MgrMoney</th>\n",
1074 |        "      <th>MgrWant</th>\n",
1075 |        "      <th>JobSeek</th>\n",
1076 |        "      <th>LastHireDate</th>\n",
1077 |        "      <th>LastInt</th>\n",
1078 |        "      <th>FizzBuzz</th>\n",
1079 |        "      <th>JobFactors</th>\n",
1080 |        "      <th>ResumeUpdate</th>\n",
1081 |        "      <th>CurrencySymbol</th>\n",
1082 |        "      <th>CurrencyDesc</th>\n",
1083 |        "      <th>CompTotal</th>\n",
1084 |        "      <th>CompFreq</th>\n",
1085 |        "      <th>ConvertedComp</th>\n",
1086 |        "      <th>WorkWeekHrs</th>\n",
1087 |        "      <th>WorkPlan</th>\n",
1088 |        "      <th>WorkChallenge</th>\n",
1089 |        "      <th>WorkRemote</th>\n",
1090 |        "      <th>WorkLoc</th>\n",
1091 |        "      <th>ImpSyn</th>\n",
1092 |        "      <th>CodeRev</th>\n",
1093 |        "      <th>CodeRevHrs</th>\n",
1094 |        "      <th>UnitTests</th>\n",
1095 |        "      <th>PurchaseHow</th>\n",
1096 |        "      <th>PurchaseWhat</th>\n",
1097 |        "      <th>LanguageWorkedWith</th>\n",
1098 |        "      <th>LanguageDesireNextYear</th>\n",
1099 |        "      <th>DatabaseWorkedWith</th>\n",
1100 |        "      <th>DatabaseDesireNextYear</th>\n",
1101 |        "      <th>PlatformWorkedWith</th>\n",
1102 |        "      <th>PlatformDesireNextYear</th>\n",
1103 |        "      <th>WebFrameWorkedWith</th>\n",
1104 |        "      <th>WebFrameDesireNextYear</th>\n",
1105 |        "      <th>MiscTechWorkedWith</th>\n",
1106 |        "      <th>MiscTechDesireNextYear</th>\n",
1107 |        "      <th>DevEnviron</th>\n",
1108 |        "      <th>OpSys</th>\n",
1109 |        "      <th>Containers</th>\n",
1110 |        "      <th>BlockchainOrg</th>\n",
1111 |        "      <th>BlockchainIs</th>\n",
1112 |        "      <th>BetterLife</th>\n",
1113 |        "      <th>ITperson</th>\n",
1114 |        "      <th>OffOn</th>\n",
1115 |        "      <th>SocialMedia</th>\n",
1116 |        "      <th>Extraversion</th>\n",
1117 |        "      <th>ScreenName</th>\n",
1118 |        "      <th>SOVisit1st</th>\n",
1119 |        "      <th>SOVisitFreq</th>\n",
1120 |        "      <th>SOVisitTo</th>\n",
1121 |        "      <th>SOFindAnswer</th>\n",
1122 |        "      <th>SOTimeSaved</th>\n",
1123 |        "      <th>SOHowMuchTime</th>\n",
1124 |        "      <th>SOAccount</th>\n",
1125 |        "      <th>SOPartFreq</th>\n",
1126 |        "      <th>SOJobs</th>\n",
1127 |        "      <th>EntTeams</th>\n",
1128 |        "      <th>SOComm</th>\n",
1129 |        "      <th>WelcomeChange</th>\n",
1130 |        "      <th>SONewContent</th>\n",
1131 |        "      <th>Age</th>\n",
1132 |        "      <th>Gender</th>\n",
1133 |        "      <th>Trans</th>\n",
1134 |        "      <th>Sexuality</th>\n",
1135 |        "      <th>Ethnicity</th>\n",
1136 |        "      <th>Dependents</th>\n",
1137 |        "      <th>SurveyLength</th>\n",
1138 |        "      <th>SurveyEase</th>\n",
1139 |        "    </tr>\n",
1140 |        "  </thead>\n",
1141 |        "  <tbody>\n",
1142 |        "    <tr>\n",
1143 |        "      <th>0</th>\n",
1144 |        "      <td>1</td>\n",
1145 |        "      <td>I am a student who is learning to code</td>\n",
1146 |        "      <td>Yes</td>\n",
1147 |        "      <td>Never</td>\n",
1148 |        "      <td>The quality of OSS and closed source software ...</td>\n",
1149 |        "      <td>Not employed, and not looking for work</td>\n",
1150 |        "      <td>United Kingdom</td>\n",
1151 |        "      <td>No</td>\n",
1152 |        "      <td>Primary/elementary school</td>\n",
1153 |        "      <td>NaN</td>\n",
1154 |        "      <td>Taught yourself a new language, framework, or ...</td>\n",
1155 |        "      <td>NaN</td>\n",
1156 |        "      <td>NaN</td>\n",
1157 |        "      <td>4</td>\n",
1158 |        "      <td>10</td>\n",
1159 |        "      <td>NaN</td>\n",
1160 |        "      <td>NaN</td>\n",
1161 |        "      <td>NaN</td>\n",
1162 |        "      <td>NaN</td>\n",
1163 |        "      <td>NaN</td>\n",
1164 |        "      <td>NaN</td>\n",
1165 |        "      <td>NaN</td>\n",
1166 |        "      <td>NaN</td>\n",
1167 |        "      <td>NaN</td>\n",
1168 |        "      <td>NaN</td>\n",
1169 |        "      <td>NaN</td>\n",
1170 |        "      <td>NaN</td>\n",
1171 |        "      <td>NaN</td>\n",
1172 |        "      <td>NaN</td>\n",
1173 |        "      <td>NaN</td>\n",
1174 |        "      <td>NaN</td>\n",
1175 |        "      <td>NaN</td>\n",
1176 |        "      <td>NaN</td>\n",
1177 |        "      <td>NaN</td>\n",
1178 |        "      <td>NaN</td>\n",
1179 |        "      <td>NaN</td>\n",
1180 |        "      <td>NaN</td>\n",
1181 |        "      <td>NaN</td>\n",
1182 |        "      <td>NaN</td>\n",
1183 |        "      <td>NaN</td>\n",
1184 |        "      <td>NaN</td>\n",
1185 |        "      <td>NaN</td>\n",
1186 |        "      <td>NaN</td>\n",
1187 |        "      <td>HTML/CSS;Java;JavaScript;Python</td>\n",
1188 |        "      <td>C;C++;C#;Go;HTML/CSS;Java;JavaScript;Python;SQL</td>\n",
1189 |        "      <td>SQLite</td>\n",
1190 |        "      <td>MySQL</td>\n",
1191 |        "      <td>MacOS;Windows</td>\n",
1192 |        "      <td>Android;Arduino;Windows</td>\n",
1193 |        "      <td>Django;Flask</td>\n",
1194 |        "      <td>Flask;jQuery</td>\n",
1195 |        "      <td>Node.js</td>\n",
1196 |        "      <td>Node.js</td>\n",
1197 |        "      <td>IntelliJ;Notepad++;PyCharm</td>\n",
1198 |        "      <td>Windows</td>\n",
1199 |        "      <td>I do not use containers</td>\n",
1200 |        "      <td>NaN</td>\n",
1201 |        "      <td>NaN</td>\n",
1202 |        "      <td>Yes</td>\n",
1203 |        "      <td>Fortunately, someone else has that title</td>\n",
1204 |        "      <td>Yes</td>\n",
1205 |        "      <td>Twitter</td>\n",
1206 |        "      <td>Online</td>\n",
1207 |        "      <td>Username</td>\n",
1208 |        "      <td>2017</td>\n",
1209 |        "      <td>A few times per month or weekly</td>\n",
1210 |        "      <td>Find answers to specific questions;Learn how t...</td>\n",
1211 |        "      <td>3-5 times per week</td>\n",
1212 |        "      <td>Stack Overflow was much faster</td>\n",
1213 |        "      <td>31-60 minutes</td>\n",
1214 |        "      <td>No</td>\n",
1215 |        "      <td>NaN</td>\n",
1216 |        "      <td>No, I didn't know that Stack Overflow had a jo...</td>\n",
1217 |        "      <td>No, and I don't know what those are</td>\n",
1218 |        "      <td>Neutral</td>\n",
1219 |        "      <td>Just as welcome now as I felt last year</td>\n",
1220 |        "      <td>Tech articles written by other developers;Indu...</td>\n",
1221 |        "      <td>14.0</td>\n",
1222 |        "      <td>Man</td>\n",
1223 |        "      <td>No</td>\n",
1224 |        "      <td>Straight / Heterosexual</td>\n",
1225 |        "      <td>NaN</td>\n",
1226 |        "      <td>No</td>\n",
1227 |        "      <td>Appropriate in length</td>\n",
1228 |        "      <td>Neither easy nor difficult</td>\n",
1229 |        "    </tr>\n",
1230 |        "    <tr>\n",
1231 |        "      <th>1</th>\n",
1232 |        "      <td>2</td>\n",
1233 |        "      <td>I am a student who is learning to code</td>\n",
1234 |        "      <td>No</td>\n",
1235 |        "      <td>Less than once per year</td>\n",
1236 |        "      <td>The quality of OSS and closed source software ...</td>\n",
1237 |        "      <td>Not employed, but looking for work</td>\n",
1238 |        "      <td>Bosnia and Herzegovina</td>\n",
1239 |        "      <td>Yes, full-time</td>\n",
1240 |        "      <td>Secondary school (e.g. American high school, G...</td>\n",
1241 |        "      <td>NaN</td>\n",
1242 |        "      <td>Taken an online course in programming or softw...</td>\n",
1243 |        "      <td>NaN</td>\n",
1244 |        "      <td>Developer, desktop or enterprise applications;...</td>\n",
1245 |        "      <td>NaN</td>\n",
1246 |        "      <td>17</td>\n",
1247 |        "      <td>NaN</td>\n",
1248 |        "      <td>NaN</td>\n",
1249 |        "      <td>NaN</td>\n",
1250 |        "      <td>NaN</td>\n",
1251 |        "      <td>NaN</td>\n",
1252 |        "      <td>NaN</td>\n",
1253 |        "      <td>I am actively looking for a job</td>\n",
1254 |        "      <td>I've never had a job</td>\n",
1255 |        "      <td>NaN</td>\n",
1256 |        "      <td>NaN</td>\n",
1257 |        "      <td>Financial performance or funding status of the...</td>\n",
1258 |        "      <td>Something else changed (education, award, medi...</td>\n",
1259 |        "      <td>NaN</td>\n",
1260 |        "      <td>NaN</td>\n",
1261 |        "      <td>NaN</td>\n",
1262 |        "      <td>NaN</td>\n",
1263 |        "      <td>NaN</td>\n",
1264 |        "      <td>NaN</td>\n",
1265 |        "      <td>NaN</td>\n",
1266 |        "      <td>NaN</td>\n",
1267 |        "      <td>NaN</td>\n",
1268 |        "      <td>NaN</td>\n",
1269 |        "      <td>NaN</td>\n",
1270 |        "      <td>NaN</td>\n",
1271 |        "      <td>NaN</td>\n",
1272 |        "      <td>NaN</td>\n",
1273 |        "      <td>NaN</td>\n",
1274 |        "      <td>NaN</td>\n",
1275 |        "      <td>C++;HTML/CSS;Python</td>\n",
1276 |        "      <td>C++;HTML/CSS;JavaScript;SQL</td>\n",
1277 |        "      <td>NaN</td>\n",
1278 |        "      <td>MySQL</td>\n",
1279 |        "      <td>Windows</td>\n",
1280 |        "      <td>Windows</td>\n",
1281 |        "      <td>Django</td>\n",
1282 |        "      <td>Django</td>\n",
1283 |        "      <td>NaN</td>\n",
1284 |        "      <td>NaN</td>\n",
1285 |        "      <td>Atom;PyCharm</td>\n",
1286 |        "      <td>Windows</td>\n",
1287 |        "      <td>I do not use containers</td>\n",
1288 |        "      <td>NaN</td>\n",
1289 |        "      <td>Useful across many domains and could change ma...</td>\n",
1290 |        "      <td>Yes</td>\n",
1291 |        "      <td>Yes</td>\n",
1292 |        "      <td>Yes</td>\n",
1293 |        "      <td>Instagram</td>\n",
1294 |        "      <td>Online</td>\n",
1295 |        "      <td>Username</td>\n",
1296 |        "      <td>2017</td>\n",
1297 |        "      <td>Daily or almost daily</td>\n",
1298 |        "      <td>Find answers to specific questions;Learn how t...</td>\n",
1299 |        "      <td>3-5 times per week</td>\n",
1300 |        "      <td>Stack Overflow was much faster</td>\n",
1301 |        "      <td>11-30 minutes</td>\n",
1302 |        "      <td>Yes</td>\n",
1303 |        "      <td>A few times per month or weekly</td>\n",
1304 |        "      <td>No, I knew that Stack Overflow had a job board...</td>\n",
1305 |        "      <td>No, and I don't know what those are</td>\n",
1306 |        "      <td>Yes, somewhat</td>\n",
1307 |        "      <td>Just as welcome now as I felt last year</td>\n",
1308 |        "      <td>Tech articles written by other developers;Indu...</td>\n",
1309 |        "      <td>19.0</td>\n",
1310 |        "      <td>Man</td>\n",
1311 |        "      <td>No</td>\n",
1312 |        "      <td>Straight / Heterosexual</td>\n",
1313 |        "      <td>NaN</td>\n",
1314 |        "      <td>No</td>\n",
1315 |        "      <td>Appropriate in length</td>\n",
1316 |        "      <td>Neither easy nor difficult</td>\n",
1317 |        "    </tr>\n",
1318 |        "    <tr>\n",
1319 |        "      <th>2</th>\n",
1320 |        "      <td>3</td>\n",
1321 |        "      <td>I am not primarily a developer, but I write co...</td>\n",
1322 |        "      <td>Yes</td>\n",
1323 |        "      <td>Never</td>\n",
1324 |        "      <td>The quality of OSS and closed source software ...</td>\n",
1325 |        "      <td>Employed full-time</td>\n",
1326 |        "      <td>Thailand</td>\n",
1327 |        "      <td>No</td>\n",
1328 |        "      <td>Bachelor’s degree (BA, BS, B.Eng., etc.)</td>\n",
1329 |        "      <td>Web development or web design</td>\n",
1330 |        "      <td>Taught yourself a new language, framework, or ...</td>\n",
1331 |        "      <td>100 to 499 employees</td>\n",
1332 |        "      <td>Designer;Developer, back-end;Developer, front-...</td>\n",
1333 |        "      <td>3</td>\n",
1334 |        "      <td>22</td>\n",
1335 |        "      <td>1</td>\n",
1336 |        "      <td>Slightly satisfied</td>\n",
1337 |        "      <td>Slightly satisfied</td>\n",
1338 |        "      <td>Not at all confident</td>\n",
1339 |        "      <td>Not sure</td>\n",
1340 |        "      <td>Not sure</td>\n",
1341 |        "      <td>I’m not actively looking, but I am open to new...</td>\n",
1342 |        "      <td>1-2 years ago</td>\n",
1343 |        "      <td>Interview with people in peer roles</td>\n",
1344 |        "      <td>No</td>\n",
1345 |        "      <td>Languages, frameworks, and other technologies ...</td>\n",
1346 |        "      <td>I was preparing for a job search</td>\n",
1347 |        "      <td>THB</td>\n",
1348 |        "      <td>Thai baht</td>\n",
1349 |        "      <td>23000.0</td>\n",
1350 |        "      <td>Monthly</td>\n",
1351 |        "      <td>8820.0</td>\n",
1352 |        "      <td>40.0</td>\n",
1353 |        "      <td>There's no schedule or spec; I work on what se...</td>\n",
1354 |        "      <td>Distracting work environment;Inadequate access...</td>\n",
1355 |        "      <td>Less than once per month / Never</td>\n",
1356 |        "      <td>Home</td>\n",
1357 |        "      <td>Average</td>\n",
1358 |        "      <td>No</td>\n",
1359 |        "      <td>NaN</td>\n",
1360 |        "      <td>No, but I think we should</td>\n",
1361 |        "      <td>Not sure</td>\n",
1362 |        "      <td>I have little or no influence</td>\n",
1363 |        "      <td>HTML/CSS</td>\n",
1364 |        "      <td>Elixir;HTML/CSS</td>\n",
1365 |        "      <td>PostgreSQL</td>\n",
1366 |        "      <td>PostgreSQL</td>\n",
1367 |        "      <td>NaN</td>\n",
1368 |        "      <td>NaN</td>\n",
1369 |        "      <td>NaN</td>\n",
1370 |        "      <td>Other(s):</td>\n",
1371 |        "      <td>NaN</td>\n",
1372 |        "      <td>NaN</td>\n",
1373 |        "      <td>Vim;Visual Studio Code</td>\n",
1374 |        "      <td>Linux-based</td>\n",
1375 |        "      <td>I do not use containers</td>\n",
1376 |        "      <td>NaN</td>\n",
1377 |        "      <td>NaN</td>\n",
1378 |        "      <td>Yes</td>\n",
1379 |        "      <td>Yes</td>\n",
1380 |        "      <td>Yes</td>\n",
1381 |        "      <td>Reddit</td>\n",
1382 |        "      <td>In real life (in person)</td>\n",
1383 |        "      <td>Username</td>\n",
1384 |        "      <td>2011</td>\n",
1385 |        "      <td>A few times per week</td>\n",
1386 |        "      <td>Find answers to specific questions;Learn how t...</td>\n",
1387 |        "      <td>6-10 times per week</td>\n",
1388 |        "      <td>They were about the same</td>\n",
1389 |        "      <td>NaN</td>\n",
1390 |        "      <td>Yes</td>\n",
1391 |        "      <td>Less than once per month or monthly</td>\n",
1392 |        "      <td>Yes</td>\n",
1393 |        "      <td>No, I've heard of them, but I am not part of a...</td>\n",
1394 |        "      <td>Neutral</td>\n",
1395 |        "      <td>Just as welcome now as I felt last year</td>\n",
1396 |        "      <td>Tech meetups or events in your area;Courses on...</td>\n",
1397 |        "      <td>28.0</td>\n",
1398 |        "      <td>Man</td>\n",
1399 |        "      <td>No</td>\n",
1400 |        "      <td>Straight / Heterosexual</td>\n",
1401 |        "      <td>NaN</td>\n",
1402 |        "      <td>Yes</td>\n",
1403 |        "      <td>Appropriate in length</td>\n",
1404 |        "      <td>Neither easy nor difficult</td>\n",
1405 |        "    </tr>\n",
1406 |        "  </tbody>\n",
1407 |        "</table>\n",
1408 |        "</div>"
1409 |       ],
1410 |       "text/plain": [
1411 |        "   Respondent                                         MainBranch Hobbyist  \\\n",
1412 |        "0           1             I am a student who is learning to code      Yes   \n",
1413 |        "1           2             I am a student who is learning to code       No   \n",
1414 |        "2           3  I am not primarily a developer, but I write co...      Yes   \n",
1415 |        "\n",
1416 |        "               OpenSourcer                                         OpenSource  \\\n",
1417 |        "0                    Never  The quality of OSS and closed source software ...   \n",
1418 |        "1  Less than once per year  The quality of OSS and closed source software ...   \n",
1419 |        "2                    Never  The quality of OSS and closed source software ...   \n",
1420 |        "\n",
1421 |        "                               Employment                 Country  \\\n",
1422 |        "0  Not employed, and not looking for work          United Kingdom   \n",
1423 |        "1      Not employed, but looking for work  Bosnia and Herzegovina   \n",
1424 |        "2                      Employed full-time                Thailand   \n",
1425 |        "\n",
1426 |        "          Student                                            EdLevel  \\\n",
1427 |        "0              No                          Primary/elementary school   \n",
1428 |        "1  Yes, full-time  Secondary school (e.g. American high school, G...   \n",
1429 |        "2              No           Bachelor’s degree (BA, BS, B.Eng., etc.)   \n",
1430 |        "\n",
1431 |        "                  UndergradMajor  \\\n",
1432 |        "0                            NaN   \n",
1433 |        "1                            NaN   \n",
1434 |        "2  Web development or web design   \n",
1435 |        "\n",
1436 |        "                                            EduOther               OrgSize  \\\n",
1437 |        "0  Taught yourself a new language, framework, or ...                   NaN   \n",
1438 |        "1  Taken an online course in programming or softw...                   NaN   \n",
1439 |        "2  Taught yourself a new language, framework, or ...  100 to 499 employees   \n",
1440 |        "\n",
1441 |        "                                             DevType YearsCode Age1stCode  \\\n",
1442 |        "0                                                NaN         4         10   \n",
1443 |        "1  Developer, desktop or enterprise applications;...       NaN         17   \n",
1444 |        "2  Designer;Developer, back-end;Developer, front-...         3         22   \n",
1445 |        "\n",
1446 |        "  YearsCodePro           CareerSat              JobSat              MgrIdiot  \\\n",
1447 |        "0          NaN                 NaN                 NaN                   NaN   \n",
1448 |        "1          NaN                 NaN                 NaN                   NaN   \n",
1449 |        "2            1  Slightly satisfied  Slightly satisfied  Not at all confident   \n",
1450 |        "\n",
1451 |        "   MgrMoney   MgrWant                                            JobSeek  \\\n",
1452 |        "0       NaN       NaN                                                NaN   \n",
1453 |        "1       NaN       NaN                    I am actively looking for a job   \n",
1454 |        "2  Not sure  Not sure  I’m not actively looking, but I am open to new...   \n",
1455 |        "\n",
1456 |        "           LastHireDate                              LastInt FizzBuzz  \\\n",
1457 |        "0                   NaN                                  NaN      NaN   \n",
1458 |        "1  I've never had a job                                  NaN      NaN   \n",
1459 |        "2         1-2 years ago  Interview with people in peer roles       No   \n",
1460 |        "\n",
1461 |        "                                          JobFactors  \\\n",
1462 |        "0                                                NaN   \n",
1463 |        "1  Financial performance or funding status of the...   \n",
1464 |        "2  Languages, frameworks, and other technologies ...   \n",
1465 |        "\n",
1466 |        "                                        ResumeUpdate CurrencySymbol  \\\n",
1467 |        "0                                                NaN            NaN   \n",
1468 |        "1  Something else changed (education, award, medi...            NaN   \n",
1469 |        "2                   I was preparing for a job search            THB   \n",
1470 |        "\n",
1471 |        "  CurrencyDesc  CompTotal CompFreq  ConvertedComp  WorkWeekHrs  \\\n",
1472 |        "0          NaN        NaN      NaN            NaN          NaN   \n",
1473 |        "1          NaN        NaN      NaN            NaN          NaN   \n",
1474 |        "2    Thai baht    23000.0  Monthly         8820.0         40.0   \n",
1475 |        "\n",
1476 |        "                                            WorkPlan  \\\n",
1477 |        "0                                                NaN   \n",
1478 |        "1                                                NaN   \n",
1479 |        "2  There's no schedule or spec; I work on what se...   \n",
1480 |        "\n",
1481 |        "                                       WorkChallenge  \\\n",
1482 |        "0                                                NaN   \n",
1483 |        "1                                                NaN   \n",
1484 |        "2  Distracting work environment;Inadequate access...   \n",
1485 |        "\n",
1486 |        "                         WorkRemote WorkLoc   ImpSyn CodeRev  CodeRevHrs  \\\n",
1487 |        "0                               NaN     NaN      NaN     NaN         NaN   \n",
1488 |        "1                               NaN     NaN      NaN     NaN         NaN   \n",
1489 |        "2  Less than once per month / Never    Home  Average      No         NaN   \n",
1490 |        "\n",
1491 |        "                   UnitTests PurchaseHow                   PurchaseWhat  \\\n",
1492 |        "0                        NaN         NaN                            NaN   \n",
1493 |        "1                        NaN         NaN                            NaN   \n",
1494 |        "2  No, but I think we should    Not sure  I have little or no influence   \n",
1495 |        "\n",
1496 |        "                LanguageWorkedWith  \\\n",
1497 |        "0  HTML/CSS;Java;JavaScript;Python   \n",
1498 |        "1              C++;HTML/CSS;Python   \n",
1499 |        "2                         HTML/CSS   \n",
1500 |        "\n",
1501 |        "                            LanguageDesireNextYear DatabaseWorkedWith  \\\n",
1502 |        "0  C;C++;C#;Go;HTML/CSS;Java;JavaScript;Python;SQL             SQLite   \n",
1503 |        "1                      C++;HTML/CSS;JavaScript;SQL                NaN   \n",
1504 |        "2                                  Elixir;HTML/CSS         PostgreSQL   \n",
1505 |        "\n",
1506 |        "  DatabaseDesireNextYear PlatformWorkedWith   PlatformDesireNextYear  \\\n",
1507 |        "0                  MySQL      MacOS;Windows  Android;Arduino;Windows   \n",
1508 |        "1                  MySQL            Windows                  Windows   \n",
1509 |        "2             PostgreSQL                NaN                      NaN   \n",
1510 |        "\n",
1511 |        "  WebFrameWorkedWith WebFrameDesireNextYear MiscTechWorkedWith  \\\n",
1512 |        "0       Django;Flask           Flask;jQuery            Node.js   \n",
1513 |        "1             Django                 Django                NaN   \n",
1514 |        "2                NaN              Other(s):                NaN   \n",
1515 |        "\n",
1516 |        "  MiscTechDesireNextYear                  DevEnviron        OpSys  \\\n",
1517 |        "0                Node.js  IntelliJ;Notepad++;PyCharm      Windows   \n",
1518 |        "1                    NaN                Atom;PyCharm      Windows   \n",
1519 |        "2                    NaN      Vim;Visual Studio Code  Linux-based   \n",
1520 |        "\n",
1521 |        "                Containers BlockchainOrg  \\\n",
1522 |        "0  I do not use containers           NaN   \n",
1523 |        "1  I do not use containers           NaN   \n",
1524 |        "2  I do not use containers           NaN   \n",
1525 |        "\n",
1526 |        "                                        BlockchainIs BetterLife  \\\n",
1527 |        "0                                                NaN        Yes   \n",
1528 |        "1  Useful across many domains and could change ma...        Yes   \n",
1529 |        "2                                                NaN        Yes   \n",
1530 |        "\n",
1531 |        "                                   ITperson OffOn SocialMedia  \\\n",
1532 |        "0  Fortunately, someone else has that title   Yes     Twitter   \n",
1533 |        "1                                       Yes   Yes   Instagram   \n",
1534 |        "2                                       Yes   Yes      Reddit   \n",
1535 |        "\n",
1536 |        "               Extraversion ScreenName SOVisit1st  \\\n",
1537 |        "0                    Online   Username       2017   \n",
1538 |        "1                    Online   Username       2017   \n",
1539 |        "2  In real life (in person)   Username       2011   \n",
1540 |        "\n",
1541 |        "                       SOVisitFreq  \\\n",
1542 |        "0  A few times per month or weekly   \n",
1543 |        "1            Daily or almost daily   \n",
1544 |        "2             A few times per week   \n",
1545 |        "\n",
1546 |        "                                           SOVisitTo         SOFindAnswer  \\\n",
1547 |        "0  Find answers to specific questions;Learn how t...   3-5 times per week   \n",
1548 |        "1  Find answers to specific questions;Learn how t...   3-5 times per week   \n",
1549 |        "2  Find answers to specific questions;Learn how t...  6-10 times per week   \n",
1550 |        "\n",
1551 |        "                      SOTimeSaved  SOHowMuchTime SOAccount  \\\n",
1552 |        "0  Stack Overflow was much faster  31-60 minutes        No   \n",
1553 |        "1  Stack Overflow was much faster  11-30 minutes       Yes   \n",
1554 |        "2        They were about the same            NaN       Yes   \n",
1555 |        "\n",
1556 |        "                            SOPartFreq  \\\n",
1557 |        "0                                  NaN   \n",
1558 |        "1      A few times per month or weekly   \n",
1559 |        "2  Less than once per month or monthly   \n",
1560 |        "\n",
1561 |        "                                              SOJobs  \\\n",
1562 |        "0  No, I didn't know that Stack Overflow had a jo...   \n",
1563 |        "1  No, I knew that Stack Overflow had a job board...   \n",
1564 |        "2                                                Yes   \n",
1565 |        "\n",
1566 |        "                                            EntTeams         SOComm  \\\n",
1567 |        "0                No, and I don't know what those are        Neutral   \n",
1568 |        "1                No, and I don't know what those are  Yes, somewhat   \n",
1569 |        "2  No, I've heard of them, but I am not part of a...        Neutral   \n",
1570 |        "\n",
1571 |        "                             WelcomeChange  \\\n",
1572 |        "0  Just as welcome now as I felt last year   \n",
1573 |        "1  Just as welcome now as I felt last year   \n",
1574 |        "2  Just as welcome now as I felt last year   \n",
1575 |        "\n",
1576 |        "                                        SONewContent   Age Gender Trans  \\\n",
1577 |        "0  Tech articles written by other developers;Indu...  14.0    Man    No   \n",
1578 |        "1  Tech articles written by other developers;Indu...  19.0    Man    No   \n",
1579 |        "2  Tech meetups or events in your area;Courses on...  28.0    Man    No   \n",
1580 |        "\n",
1581 |        "                 Sexuality Ethnicity Dependents           SurveyLength  \\\n",
1582 |        "0  Straight / Heterosexual       NaN         No  Appropriate in length   \n",
1583 |        "1  Straight / Heterosexual       NaN         No  Appropriate in length   \n",
1584 |        "2  Straight / Heterosexual       NaN        Yes  Appropriate in length   \n",
1585 |        "\n",
1586 |        "                   SurveyEase  \n",
1587 |        "0  Neither easy nor difficult  \n",
1588 |        "1  Neither easy nor difficult  \n",
1589 |        "2  Neither easy nor difficult  "
1590 |       ]
1591 |      },
1592 |      "execution_count": 34,
1593 |      "metadata": {},
1594 |      "output_type": "execute_result"
1595 |     }
1596 |    ],
1597 |    "source": [
1598 |     "res_df.loc[0:2]"
1599 |    ]
1600 |   },
1601 |   {
1602 |    "cell_type": "markdown",
1603 |    "metadata": {},
1604 |    "source": [
1605 |     "Look up how the first respondent (row 0) answered the Hobbyist question."
1606 |    ]
1607 |   },
1608 |   {
1609 |    "cell_type": "code",
1610 |    "execution_count": 38,
1611 |    "metadata": {},
1612 |    "outputs": [
1613 |     {
1614 |      "data": {
1615 |       "text/plain": [
1616 |        "'Yes'"
1617 |       ]
1618 |      },
1619 |      "execution_count": 38,
1620 |      "metadata": {},
1621 |      "output_type": "execute_result"
1622 |     }
1623 |    ],
1624 |    "source": [
1625 |     "res_df.loc[0, 'Hobbyist']"
1626 |    ]
1627 |   },
1628 |   {
1629 |    "cell_type": "markdown",
1630 |    "metadata": {},
1631 |    "source": [
1632 |     "Note we can drop the brackets when selecting rows _and_ a column together."
1633 |    ]
1634 |   },
1635 |   {
1636 |    "cell_type": "markdown",
1637 |    "metadata": {},
1638 |    "source": [
1639 |     "Get the responses of the first three rows to the Hobbyist question by passing in a slice of rows and the column label."
1640 |    ]
1641 |   },
1642 |   {
1643 |    "cell_type": "code",
1644 |    "execution_count": 37,
1645 |    "metadata": {},
1646 |    "outputs": [
1647 |     {
1648 |      "data": {
1649 |       "text/plain": [
1650 |        "0    Yes\n",
1651 |        "1     No\n",
1652 |        "2    Yes\n",
1653 |        "Name: Hobbyist, dtype: object"
1654 |       ]
1655 |      },
1656 |      "execution_count": 37,
1657 |      "metadata": {},
1658 |      "output_type": "execute_result"
1659 |     }
1660 |    ],
1661 |    "source": [
1662 |     "res_df.loc[0:2, 'Hobbyist']"
1663 |    ]
1664 |   },
1665 |   {
1666 |    "cell_type": "markdown",
1667 |    "metadata": {},
1668 |    "source": [
1669 |     "When selecting a slice of rows or columns, drop the inner brackets: slice notation such as `0:2` is not valid inside a list literal, so writing `[0:2]` would raise a syntax error."
1670 |    ]
1671 |   },
1672 |   {
1673 |    "cell_type": "markdown",
1674 |    "metadata": {},
1675 |    "source": [
1676 |     "Retrieve a slice of rows together with a slice of columns."
1677 |    ]
1678 |   },
1679 |   {
1680 |    "cell_type": "code",
1681 |    "execution_count": 39,
1682 |    "metadata": {},
1683 |    "outputs": [
1684 |     {
1685 |      "data": {
1686 |       "text/html": [
1687 |        "<div>\n",
1688 |        "<style scoped>\n",
1689 |        "    .dataframe tbody tr th:only-of-type {\n",
1690 |        "        vertical-align: middle;\n",
1691 |        "    }\n",
1692 |        "\n",
1693 |        "    .dataframe tbody tr th {\n",
1694 |        "        vertical-align: top;\n",
1695 |        "    }\n",
1696 |        "\n",
1697 |        "    .dataframe thead th {\n",
1698 |        "        text-align: right;\n",
1699 |        "    }\n",
1700 |        "</style>\n",
1701 |        "<table border=\"1\" class=\"dataframe\">\n",
1702 |        "  <thead>\n",
1703 |        "    <tr style=\"text-align: right;\">\n",
1704 |        "      <th></th>\n",
1705 |        "      <th>Hobbyist</th>\n",
1706 |        "      <th>OpenSourcer</th>\n",
1707 |        "      <th>OpenSource</th>\n",
1708 |        "      <th>Employment</th>\n",
1709 |        "    </tr>\n",
1710 |        "  </thead>\n",
1711 |        "  <tbody>\n",
1712 |        "    <tr>\n",
1713 |        "      <th>0</th>\n",
1714 |        "      <td>Yes</td>\n",
1715 |        "      <td>Never</td>\n",
1716 |        "      <td>The quality of OSS and closed source software ...</td>\n",
1717 |        "      <td>Not employed, and not looking for work</td>\n",
1718 |        "    </tr>\n",
1719 |        "    <tr>\n",
1720 |        "      <th>1</th>\n",
1721 |        "      <td>No</td>\n",
1722 |        "      <td>Less than once per year</td>\n",
1723 |        "      <td>The quality of OSS and closed source software ...</td>\n",
1724 |        "      <td>Not employed, but looking for work</td>\n",
1725 |        "    </tr>\n",
1726 |        "    <tr>\n",
1727 |        "      <th>2</th>\n",
1728 |        "      <td>Yes</td>\n",
1729 |        "      <td>Never</td>\n",
1730 |        "      <td>The quality of OSS and closed source software ...</td>\n",
1731 |        "      <td>Employed full-time</td>\n",
1732 |        "    </tr>\n",
1733 |        "  </tbody>\n",
1734 |        "</table>\n",
1735 |        "</div>"
1736 |       ],
1737 |       "text/plain": [
1738 |        "  Hobbyist              OpenSourcer  \\\n",
1739 |        "0      Yes                    Never   \n",
1740 |        "1       No  Less than once per year   \n",
1741 |        "2      Yes                    Never   \n",
1742 |        "\n",
1743 |        "                                          OpenSource  \\\n",
1744 |        "0  The quality of OSS and closed source software ...   \n",
1745 |        "1  The quality of OSS and closed source software ...   \n",
1746 |        "2  The quality of OSS and closed source software ...   \n",
1747 |        "\n",
1748 |        "                               Employment  \n",
1749 |        "0  Not employed, and not looking for work  \n",
1750 |        "1      Not employed, but looking for work  \n",
1751 |        "2                      Employed full-time  "
1752 |       ]
1753 |      },
1754 |      "execution_count": 39,
1755 |      "metadata": {},
1756 |      "output_type": "execute_result"
1757 |     }
1758 |    ],
1759 |    "source": [
1760 |     "res_df.loc[0:2, 'Hobbyist':'Employment']"
1761 |    ]
1762 |   },
1763 |   {
1764 |    "cell_type": "markdown",
1765 |    "metadata": {},
1766 |    "source": [
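1767 |     "Note that label-based slicing with `.loc` includes both endpoints, unlike standard Python slicing: `0:2` returns rows 0, 1 and 2, and `'Hobbyist':'Employment'` includes the Employment column."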
1768 |    ]
1769 |   },
1770 |   {
1771 |    "cell_type": "code",
1772 |    "execution_count": null,
1773 |    "metadata": {},
1774 |    "outputs": [],
1775 |    "source": []
1776 |   }
1777 |  ],
1778 |  "metadata": {
1779 |   "kernelspec": {
1780 |    "display_name": "Python 3",
1781 |    "language": "python",
1782 |    "name": "python3"
1783 |   },
1784 |   "language_info": {
1785 |    "codemirror_mode": {
1786 |     "name": "ipython",
1787 |     "version": 3
1788 |    },
1789 |    "file_extension": ".py",
1790 |    "mimetype": "text/x-python",
1791 |    "name": "python",
1792 |    "nbconvert_exporter": "python",
1793 |    "pygments_lexer": "ipython3",
1794 |    "version": "3.6.9"
1795 |   }
1796 |  },
1797 |  "nbformat": 4,
1798 |  "nbformat_minor": 2
1799 | }
1800 | 


--------------------------------------------------------------------------------
/03-Indexes.ipynb:
--------------------------------------------------------------------------------
  1 | {
  2 |  "cells": [
  3 |   {
  4 |    "cell_type": "markdown",
  5 |    "metadata": {},
  6 |    "source": [
  7 |     "# Indexes: How to Set, Reset and Use Indexes"
  8 |    ]
  9 |   },
 10 |   {
 11 |    "cell_type": "code",
 12 |    "execution_count": 1,
 13 |    "metadata": {},
 14 |    "outputs": [],
 15 |    "source": [
 16 |     "import pandas as pd"
 17 |    ]
 18 |   },
 19 |   {
 20 |    "cell_type": "code",
 21 |    "execution_count": 2,
 22 |    "metadata": {},
 23 |    "outputs": [],
 24 |    "source": [
 25 |     "people = {\n",
 26 |     "    \"first\": [\"Phil\", \"Jane\", \"Rob\"],\n",
 27 |     "    \"last\": [\"Lembo\", \"Doe\", \"Roe\"],\n",
 28 |     "    \"email\": [\"phil.lembo@gmail.com\", \"janedoe@email.com\", \"robroe@email.com\"]\n",
 29 |     "}"
 30 |    ]
 31 |   },
 32 |   {
 33 |    "cell_type": "code",
 34 |    "execution_count": 3,
 35 |    "metadata": {},
 36 |    "outputs": [],
 37 |    "source": [
 38 |     "df = pd.DataFrame(people)"
 39 |    ]
 40 |   },
 41 |   {
 42 |    "cell_type": "code",
 43 |    "execution_count": 4,
 44 |    "metadata": {},
 45 |    "outputs": [
 46 |     {
 47 |      "data": {
 48 |       "text/html": [
 49 |        "<div>\n",
 50 |        "<style scoped>\n",
 51 |        "    .dataframe tbody tr th:only-of-type {\n",
 52 |        "        vertical-align: middle;\n",
 53 |        "    }\n",
 54 |        "\n",
 55 |        "    .dataframe tbody tr th {\n",
 56 |        "        vertical-align: top;\n",
 57 |        "    }\n",
 58 |        "\n",
 59 |        "    .dataframe thead th {\n",
 60 |        "        text-align: right;\n",
 61 |        "    }\n",
 62 |        "</style>\n",
 63 |        "<table border=\"1\" class=\"dataframe\">\n",
 64 |        "  <thead>\n",
 65 |        "    <tr style=\"text-align: right;\">\n",
 66 |        "      <th></th>\n",
 67 |        "      <th>first</th>\n",
 68 |        "      <th>last</th>\n",
 69 |        "      <th>email</th>\n",
 70 |        "    </tr>\n",
 71 |        "  </thead>\n",
 72 |        "  <tbody>\n",
 73 |        "    <tr>\n",
 74 |        "      <th>0</th>\n",
 75 |        "      <td>Phil</td>\n",
 76 |        "      <td>Lembo</td>\n",
 77 |        "      <td>phil.lembo@gmail.com</td>\n",
 78 |        "    </tr>\n",
 79 |        "    <tr>\n",
 80 |        "      <th>1</th>\n",
 81 |        "      <td>Jane</td>\n",
 82 |        "      <td>Doe</td>\n",
 83 |        "      <td>janedoe@email.com</td>\n",
 84 |        "    </tr>\n",
 85 |        "    <tr>\n",
 86 |        "      <th>2</th>\n",
 87 |        "      <td>Rob</td>\n",
 88 |        "      <td>Roe</td>\n",
 89 |        "      <td>robroe@email.com</td>\n",
 90 |        "    </tr>\n",
 91 |        "  </tbody>\n",
 92 |        "</table>\n",
 93 |        "</div>"
 94 |       ],
 95 |       "text/plain": [
 96 |        "  first   last                 email\n",
 97 |        "0  Phil  Lembo  phil.lembo@gmail.com\n",
 98 |        "1  Jane    Doe     janedoe@email.com\n",
 99 |        "2   Rob    Roe      robroe@email.com"
100 |       ]
101 |      },
102 |      "execution_count": 4,
103 |      "metadata": {},
104 |      "output_type": "execute_result"
105 |     }
106 |    ],
107 |    "source": [
108 |     "df"
109 |    ]
110 |   },
111 |   {
112 |    "cell_type": "code",
113 |    "execution_count": 5,
114 |    "metadata": {},
115 |    "outputs": [
116 |     {
117 |      "data": {
118 |       "text/plain": [
119 |        "0    phil.lembo@gmail.com\n",
120 |        "1       janedoe@email.com\n",
121 |        "2        robroe@email.com\n",
122 |        "Name: email, dtype: object"
123 |       ]
124 |      },
125 |      "execution_count": 5,
126 |      "metadata": {},
127 |      "output_type": "execute_result"
128 |     }
129 |    ],
130 |    "source": [
131 |     "df['email']"
132 |    ]
133 |   },
134 |   {
135 |    "cell_type": "code",
136 |    "execution_count": 6,
137 |    "metadata": {},
138 |    "outputs": [
139 |     {
140 |      "data": {
141 |       "text/html": [
142 |        "<div>\n",
143 |        "<style scoped>\n",
144 |        "    .dataframe tbody tr th:only-of-type {\n",
145 |        "        vertical-align: middle;\n",
146 |        "    }\n",
147 |        "\n",
148 |        "    .dataframe tbody tr th {\n",
149 |        "        vertical-align: top;\n",
150 |        "    }\n",
151 |        "\n",
152 |        "    .dataframe thead th {\n",
153 |        "        text-align: right;\n",
154 |        "    }\n",
155 |        "</style>\n",
156 |        "<table border=\"1\" class=\"dataframe\">\n",
157 |        "  <thead>\n",
158 |        "    <tr style=\"text-align: right;\">\n",
159 |        "      <th></th>\n",
160 |        "      <th>first</th>\n",
161 |        "      <th>last</th>\n",
162 |        "    </tr>\n",
163 |        "    <tr>\n",
164 |        "      <th>email</th>\n",
165 |        "      <th></th>\n",
166 |        "      <th></th>\n",
167 |        "    </tr>\n",
168 |        "  </thead>\n",
169 |        "  <tbody>\n",
170 |        "    <tr>\n",
171 |        "      <th>phil.lembo@gmail.com</th>\n",
172 |        "      <td>Phil</td>\n",
173 |        "      <td>Lembo</td>\n",
174 |        "    </tr>\n",
175 |        "    <tr>\n",
176 |        "      <th>janedoe@email.com</th>\n",
177 |        "      <td>Jane</td>\n",
178 |        "      <td>Doe</td>\n",
179 |        "    </tr>\n",
180 |        "    <tr>\n",
181 |        "      <th>robroe@email.com</th>\n",
182 |        "      <td>Rob</td>\n",
183 |        "      <td>Roe</td>\n",
184 |        "    </tr>\n",
185 |        "  </tbody>\n",
186 |        "</table>\n",
187 |        "</div>"
188 |       ],
189 |       "text/plain": [
190 |        "                     first   last\n",
191 |        "email                            \n",
192 |        "phil.lembo@gmail.com  Phil  Lembo\n",
193 |        "janedoe@email.com     Jane    Doe\n",
194 |        "robroe@email.com       Rob    Roe"
195 |       ]
196 |      },
197 |      "execution_count": 6,
198 |      "metadata": {},
199 |      "output_type": "execute_result"
200 |     }
201 |    ],
202 |    "source": [
203 |     "df.set_index('email')"
204 |    ]
205 |   },
206 |   {
207 |    "cell_type": "markdown",
208 |    "metadata": {},
209 |    "source": [
 210 |     "By default, `set_index` returns a new DataFrame and leaves the original DataFrame unchanged."
211 |    ]
212 |   },
213 |   {
214 |    "cell_type": "code",
215 |    "execution_count": 7,
216 |    "metadata": {},
217 |    "outputs": [
218 |     {
219 |      "data": {
220 |       "text/html": [
221 |        "<div>\n",
222 |        "<style scoped>\n",
223 |        "    .dataframe tbody tr th:only-of-type {\n",
224 |        "        vertical-align: middle;\n",
225 |        "    }\n",
226 |        "\n",
227 |        "    .dataframe tbody tr th {\n",
228 |        "        vertical-align: top;\n",
229 |        "    }\n",
230 |        "\n",
231 |        "    .dataframe thead th {\n",
232 |        "        text-align: right;\n",
233 |        "    }\n",
234 |        "</style>\n",
235 |        "<table border=\"1\" class=\"dataframe\">\n",
236 |        "  <thead>\n",
237 |        "    <tr style=\"text-align: right;\">\n",
238 |        "      <th></th>\n",
239 |        "      <th>first</th>\n",
240 |        "      <th>last</th>\n",
241 |        "      <th>email</th>\n",
242 |        "    </tr>\n",
243 |        "  </thead>\n",
244 |        "  <tbody>\n",
245 |        "    <tr>\n",
246 |        "      <th>0</th>\n",
247 |        "      <td>Phil</td>\n",
248 |        "      <td>Lembo</td>\n",
249 |        "      <td>phil.lembo@gmail.com</td>\n",
250 |        "    </tr>\n",
251 |        "    <tr>\n",
252 |        "      <th>1</th>\n",
253 |        "      <td>Jane</td>\n",
254 |        "      <td>Doe</td>\n",
255 |        "      <td>janedoe@email.com</td>\n",
256 |        "    </tr>\n",
257 |        "    <tr>\n",
258 |        "      <th>2</th>\n",
259 |        "      <td>Rob</td>\n",
260 |        "      <td>Roe</td>\n",
261 |        "      <td>robroe@email.com</td>\n",
262 |        "    </tr>\n",
263 |        "  </tbody>\n",
264 |        "</table>\n",
265 |        "</div>"
266 |       ],
267 |       "text/plain": [
268 |        "  first   last                 email\n",
269 |        "0  Phil  Lembo  phil.lembo@gmail.com\n",
270 |        "1  Jane    Doe     janedoe@email.com\n",
271 |        "2   Rob    Roe      robroe@email.com"
272 |       ]
273 |      },
274 |      "execution_count": 7,
275 |      "metadata": {},
276 |      "output_type": "execute_result"
277 |     }
278 |    ],
279 |    "source": [
280 |     "df"
281 |    ]
282 |   },
283 |   {
284 |    "cell_type": "markdown",
285 |    "metadata": {},
286 |    "source": [
 287 |     "To change the index in place, pass the `inplace=True` argument."
288 |    ]
289 |   },
290 |   {
291 |    "cell_type": "code",
292 |    "execution_count": 8,
293 |    "metadata": {},
294 |    "outputs": [],
295 |    "source": [
296 |     "df.set_index('email', inplace=True)"
297 |    ]
298 |   },
299 |   {
300 |    "cell_type": "code",
301 |    "execution_count": 9,
302 |    "metadata": {},
303 |    "outputs": [
304 |     {
305 |      "data": {
306 |       "text/html": [
307 |        "<div>\n",
308 |        "<style scoped>\n",
309 |        "    .dataframe tbody tr th:only-of-type {\n",
310 |        "        vertical-align: middle;\n",
311 |        "    }\n",
312 |        "\n",
313 |        "    .dataframe tbody tr th {\n",
314 |        "        vertical-align: top;\n",
315 |        "    }\n",
316 |        "\n",
317 |        "    .dataframe thead th {\n",
318 |        "        text-align: right;\n",
319 |        "    }\n",
320 |        "</style>\n",
321 |        "<table border=\"1\" class=\"dataframe\">\n",
322 |        "  <thead>\n",
323 |        "    <tr style=\"text-align: right;\">\n",
324 |        "      <th></th>\n",
325 |        "      <th>first</th>\n",
326 |        "      <th>last</th>\n",
327 |        "    </tr>\n",
328 |        "    <tr>\n",
329 |        "      <th>email</th>\n",
330 |        "      <th></th>\n",
331 |        "      <th></th>\n",
332 |        "    </tr>\n",
333 |        "  </thead>\n",
334 |        "  <tbody>\n",
335 |        "    <tr>\n",
336 |        "      <th>phil.lembo@gmail.com</th>\n",
337 |        "      <td>Phil</td>\n",
338 |        "      <td>Lembo</td>\n",
339 |        "    </tr>\n",
340 |        "    <tr>\n",
341 |        "      <th>janedoe@email.com</th>\n",
342 |        "      <td>Jane</td>\n",
343 |        "      <td>Doe</td>\n",
344 |        "    </tr>\n",
345 |        "    <tr>\n",
346 |        "      <th>robroe@email.com</th>\n",
347 |        "      <td>Rob</td>\n",
348 |        "      <td>Roe</td>\n",
349 |        "    </tr>\n",
350 |        "  </tbody>\n",
351 |        "</table>\n",
352 |        "</div>"
353 |       ],
354 |       "text/plain": [
355 |        "                     first   last\n",
356 |        "email                            \n",
357 |        "phil.lembo@gmail.com  Phil  Lembo\n",
358 |        "janedoe@email.com     Jane    Doe\n",
359 |        "robroe@email.com       Rob    Roe"
360 |       ]
361 |      },
362 |      "execution_count": 9,
363 |      "metadata": {},
364 |      "output_type": "execute_result"
365 |     }
366 |    ],
367 |    "source": [
368 |     "df"
369 |    ]
370 |   },
371 |   {
372 |    "cell_type": "code",
373 |    "execution_count": 10,
374 |    "metadata": {},
375 |    "outputs": [
376 |     {
377 |      "data": {
378 |       "text/plain": [
379 |        "Index(['phil.lembo@gmail.com', 'janedoe@email.com', 'robroe@email.com'], dtype='object', name='email')"
380 |       ]
381 |      },
382 |      "execution_count": 10,
383 |      "metadata": {},
384 |      "output_type": "execute_result"
385 |     }
386 |    ],
387 |    "source": [
388 |     "df.index"
389 |    ]
390 |   },
391 |   {
392 |    "cell_type": "code",
393 |    "execution_count": 11,
394 |    "metadata": {},
395 |    "outputs": [
396 |     {
397 |      "data": {
398 |       "text/plain": [
399 |        "first     Phil\n",
400 |        "last     Lembo\n",
401 |        "Name: phil.lembo@gmail.com, dtype: object"
402 |       ]
403 |      },
404 |      "execution_count": 11,
405 |      "metadata": {},
406 |      "output_type": "execute_result"
407 |     }
408 |    ],
409 |    "source": [
410 |     "df.loc['phil.lembo@gmail.com']"
411 |    ]
412 |   },
413 |   {
414 |    "cell_type": "code",
415 |    "execution_count": 12,
416 |    "metadata": {},
417 |    "outputs": [
418 |     {
419 |      "data": {
420 |       "text/plain": [
421 |        "'Lembo'"
422 |       ]
423 |      },
424 |      "execution_count": 12,
425 |      "metadata": {},
426 |      "output_type": "execute_result"
427 |     }
428 |    ],
429 |    "source": [
430 |     "df.loc['phil.lembo@gmail.com', 'last']"
431 |    ]
432 |   },
433 |   {
434 |    "cell_type": "markdown",
435 |    "metadata": {},
436 |    "source": [
 437 |     "Note that the default integer labels are no longer our index, so a label lookup such as `df.loc[0]` now raises an error."
438 |    ]
439 |   },
440 |   {
441 |    "cell_type": "code",
442 |    "execution_count": 13,
443 |    "metadata": {},
444 |    "outputs": [
445 |     {
446 |      "ename": "TypeError",
447 |      "evalue": "cannot do label indexing on <class 'pandas.core.indexes.base.Index'> with these indexers [0] of <class 'int'>",
448 |      "output_type": "error",
449 |      "traceback": [
450 |       "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
451 |       "\u001b[0;31mTypeError\u001b[0m                                 Traceback (most recent call last)",
452 |       "\u001b[0;32m<ipython-input-13-7eaf75073732>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0mdf\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mloc\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m",
453 |       "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/pandas/core/indexing.py\u001b[0m in \u001b[0;36m__getitem__\u001b[0;34m(self, key)\u001b[0m\n\u001b[1;32m   1422\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m   1423\u001b[0m             \u001b[0mmaybe_callable\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mcom\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mapply_if_callable\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mkey\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mobj\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 1424\u001b[0;31m             \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_getitem_axis\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mmaybe_callable\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0maxis\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0maxis\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m   1425\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m   1426\u001b[0m     \u001b[0;32mdef\u001b[0m \u001b[0m_is_scalar_access\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mkey\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mTuple\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
454 |       "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/pandas/core/indexing.py\u001b[0m in \u001b[0;36m_getitem_axis\u001b[0;34m(self, key, axis)\u001b[0m\n\u001b[1;32m   1847\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m   1848\u001b[0m         \u001b[0;31m# fall thru to straight lookup\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 1849\u001b[0;31m         \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_validate_key\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mkey\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0maxis\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m   1850\u001b[0m         \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_get_label\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mkey\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0maxis\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0maxis\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m   1851\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n",
455 |       "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/pandas/core/indexing.py\u001b[0m in \u001b[0;36m_validate_key\u001b[0;34m(self, key, axis)\u001b[0m\n\u001b[1;32m   1723\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m   1724\u001b[0m         \u001b[0;32mif\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0mis_list_like_indexer\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mkey\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 1725\u001b[0;31m             \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_convert_scalar_indexer\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mkey\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0maxis\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m   1726\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m   1727\u001b[0m     \u001b[0;32mdef\u001b[0m \u001b[0m_is_scalar_access\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mkey\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mTuple\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
456 |       "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/pandas/core/indexing.py\u001b[0m in \u001b[0;36m_convert_scalar_indexer\u001b[0;34m(self, key, axis)\u001b[0m\n\u001b[1;32m    272\u001b[0m         \u001b[0max\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mobj\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_get_axis\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mmin\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0maxis\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mndim\u001b[0m \u001b[0;34m-\u001b[0m \u001b[0;36m1\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    273\u001b[0m         \u001b[0;31m# a scalar\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 274\u001b[0;31m         \u001b[0;32mreturn\u001b[0m \u001b[0max\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_convert_scalar_indexer\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mkey\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mkind\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mname\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m    275\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m    276\u001b[0m     \u001b[0;32mdef\u001b[0m \u001b[0m_convert_slice_indexer\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mkey\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0maxis\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0mint\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
457 |       "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/pandas/core/indexes/base.py\u001b[0m in \u001b[0;36m_convert_scalar_indexer\u001b[0;34m(self, key, kind)\u001b[0m\n\u001b[1;32m   3136\u001b[0m             \u001b[0;32melif\u001b[0m \u001b[0mkind\u001b[0m \u001b[0;32min\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0;34m\"loc\"\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;32mand\u001b[0m \u001b[0mis_integer\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mkey\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m   3137\u001b[0m                 \u001b[0;32mif\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mholds_integer\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 3138\u001b[0;31m                     \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_invalid_indexer\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m\"label\"\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mkey\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m   3139\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m   3140\u001b[0m         \u001b[0;32mreturn\u001b[0m \u001b[0mkey\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
458 |       "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/pandas/core/indexes/base.py\u001b[0m in \u001b[0;36m_invalid_indexer\u001b[0;34m(self, form, key)\u001b[0m\n\u001b[1;32m   3338\u001b[0m             \u001b[0;34m\"cannot do {form} indexing on {klass} with these \"\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m   3339\u001b[0m             \"indexers [{key}] of {kind}\".format(\n\u001b[0;32m-> 3340\u001b[0;31m                 \u001b[0mform\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mform\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mklass\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mtype\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mkey\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mkey\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mkind\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mtype\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mkey\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m   3341\u001b[0m             )\n\u001b[1;32m   3342\u001b[0m         )\n",
459 |       "\u001b[0;31mTypeError\u001b[0m: cannot do label indexing on <class 'pandas.core.indexes.base.Index'> with these indexers [0] of <class 'int'>"
460 |      ]
461 |     }
462 |    ],
463 |    "source": [
464 |     "df.loc[0]"
465 |    ]
466 |   },
467 |   {
468 |    "cell_type": "markdown",
469 |    "metadata": {},
470 |    "source": [
471 |     "Instead, we now need to use iloc to select rows by integer position."
472 |    ]
473 |   },
474 |   {
475 |    "cell_type": "code",
476 |    "execution_count": null,
477 |    "metadata": {},
478 |    "outputs": [],
479 |    "source": [
480 |     "df.iloc[0]"
481 |    ]
482 |   },
483 |   {
484 |    "cell_type": "markdown",
485 |    "metadata": {},
486 |    "source": [
487 |     "To reset, use the reset_index method."
488 |    ]
489 |   },
490 |   {
491 |    "cell_type": "code",
492 |    "execution_count": null,
493 |    "metadata": {},
494 |    "outputs": [],
495 |    "source": [
496 |     "df.reset_index(inplace=True)"
497 |    ]
498 |   },
499 |   {
500 |    "cell_type": "code",
501 |    "execution_count": null,
502 |    "metadata": {},
503 |    "outputs": [],
504 |    "source": [
505 |     "df"
506 |    ]
507 |   },
508 |   {
509 |    "cell_type": "markdown",
510 |    "metadata": {},
511 |    "source": [
512 |     "Now turn to survey data."
513 |    ]
514 |   },
515 |   {
516 |    "cell_type": "code",
517 |    "execution_count": null,
518 |    "metadata": {},
519 |    "outputs": [],
520 |    "source": [
521 |     "res_df = pd.read_csv('data/survey_results_public.csv')\n",
522 |     "schema_df = pd.read_csv('data/survey_results_schema.csv')"
523 |    ]
524 |   },
525 |   {
526 |    "cell_type": "code",
527 |    "execution_count": null,
528 |    "metadata": {},
529 |    "outputs": [],
530 |    "source": [
531 |     "pd.set_option('display.max_columns', 85)\n",
532 |     "pd.set_option('display.max_rows', 85)"
533 |    ]
534 |   },
535 |   {
536 |    "cell_type": "code",
537 |    "execution_count": null,
538 |    "metadata": {},
539 |    "outputs": [],
540 |    "source": [
541 |     "df"
542 |    ]
543 |   },
544 |   {
545 |    "cell_type": "markdown",
546 |    "metadata": {},
547 |    "source": [
548 |     "Set index when loading data."
549 |    ]
550 |   },
551 |   {
552 |    "cell_type": "code",
553 |    "execution_count": null,
554 |    "metadata": {},
555 |    "outputs": [],
556 |    "source": [
557 |     "res_df = pd.read_csv('data/survey_results_public.csv', index_col='Respondent')"
558 |    ]
559 |   },
560 |   {
561 |    "cell_type": "code",
562 |    "execution_count": null,
563 |    "metadata": {},
564 |    "outputs": [],
565 |    "source": [
566 |     "res_df"
567 |    ]
568 |   },
569 |   {
570 |    "cell_type": "markdown",
571 |    "metadata": {},
572 |    "source": [
573 |     "To retrieve respondent number 1."
574 |    ]
575 |   },
576 |   {
577 |    "cell_type": "code",
578 |    "execution_count": null,
579 |    "metadata": {},
580 |    "outputs": [],
581 |    "source": [
582 |     "res_df.loc[1]"
583 |    ]
584 |   },
585 |   {
586 |    "cell_type": "code",
587 |    "execution_count": null,
588 |    "metadata": {},
589 |    "outputs": [],
590 |    "source": [
591 |     "schema_df"
592 |    ]
593 |   },
594 |   {
595 |    "cell_type": "markdown",
596 |    "metadata": {},
597 |    "source": [
598 |     "What if I want to be able to call up a schema definition without having to scroll through the whole frame? Set \"Column\" as the index!"
599 |    ]
600 |   },
601 |   {
602 |    "cell_type": "code",
603 |    "execution_count": null,
604 |    "metadata": {},
605 |    "outputs": [],
606 |    "source": [
607 |     "schema_df = pd.read_csv('data/survey_results_schema.csv', index_col='Column')"
608 |    ]
609 |   },
610 |   {
611 |    "cell_type": "code",
612 |    "execution_count": null,
613 |    "metadata": {},
614 |    "outputs": [],
615 |    "source": [
616 |     "schema_df"
617 |    ]
618 |   },
619 |   {
620 |    "cell_type": "code",
621 |    "execution_count": null,
622 |    "metadata": {},
623 |    "outputs": [],
624 |    "source": [
625 |     "schema_df.loc['Hobbyist']"
626 |    ]
627 |   },
628 |   {
629 |    "cell_type": "code",
630 |    "execution_count": null,
631 |    "metadata": {},
632 |    "outputs": [],
633 |    "source": [
634 |     "schema_df.loc['MgrIdiot']"
635 |    ]
636 |   },
637 |   {
638 |    "cell_type": "markdown",
639 |    "metadata": {},
640 |    "source": [
641 |     "By default, pandas truncates long text when displaying it. This can be changed, but you can also retrieve the full text by specifying both the index _and_ column names (in this case \"QuestionText\")."
642 |    ]
643 |   },
644 |   {
645 |    "cell_type": "code",
646 |    "execution_count": null,
647 |    "metadata": {},
648 |    "outputs": [],
649 |    "source": [
650 |     "schema_df.loc['MgrIdiot', 'QuestionText']"
651 |    ]
652 |   },
653 |   {
654 |    "cell_type": "markdown",
655 |    "metadata": {},
656 |    "source": [
657 |     "We can sort to make life easier!"
658 |    ]
659 |   },
660 |   {
661 |    "cell_type": "code",
662 |    "execution_count": null,
663 |    "metadata": {},
664 |    "outputs": [],
665 |    "source": [
666 |     "schema_df.sort_index()"
667 |    ]
668 |   },
669 |   {
670 |    "cell_type": "markdown",
671 |    "metadata": {},
672 |    "source": [
673 |     "To reverse the order, pass \"ascending=False\"."
674 |    ]
675 |   },
676 |   {
677 |    "cell_type": "code",
678 |    "execution_count": null,
679 |    "metadata": {},
680 |    "outputs": [],
681 |    "source": [
682 |     "schema_df.sort_index(ascending=False)"
683 |    ]
684 |   },
685 |   {
686 |    "cell_type": "markdown",
687 |    "metadata": {},
688 |    "source": [
689 |     "To make the change persistent, pass the \"inplace=True\" flag."
690 |    ]
691 |   },
692 |   {
693 |    "cell_type": "code",
694 |    "execution_count": null,
695 |    "metadata": {},
696 |    "outputs": [],
697 |    "source": [
698 |     "schema_df.sort_index(inplace=True)\n",
699 |     "schema_df"
700 |    ]
701 |   },
702 |   {
703 |    "cell_type": "code",
704 |    "execution_count": null,
705 |    "metadata": {},
706 |    "outputs": [],
707 |    "source": []
708 |   }
709 |  ],
710 |  "metadata": {
711 |   "kernelspec": {
712 |    "display_name": "Python 3",
713 |    "language": "python",
714 |    "name": "python3"
715 |   },
716 |   "language_info": {
717 |    "codemirror_mode": {
718 |     "name": "ipython",
719 |     "version": 3
720 |    },
721 |    "file_extension": ".py",
722 |    "mimetype": "text/x-python",
723 |    "name": "python",
724 |    "nbconvert_exporter": "python",
725 |    "pygments_lexer": "ipython3",
726 |    "version": "3.6.9"
727 |   }
728 |  },
729 |  "nbformat": 4,
730 |  "nbformat_minor": 2
731 | }
732 | 


--------------------------------------------------------------------------------
/06-Add Remove Rows and Columns.ipynb:
--------------------------------------------------------------------------------
   1 | {
   2 |  "cells": [
   3 |   {
   4 |    "cell_type": "markdown",
   5 |    "metadata": {},
   6 |    "source": [
   7 |     "# Add/Remove Rows and Columns from DataFrames"
   8 |    ]
   9 |   },
  10 |   {
  11 |    "cell_type": "code",
  12 |    "execution_count": 17,
  13 |    "metadata": {},
  14 |    "outputs": [],
  15 |    "source": [
  16 |     "people = {\n",
  17 |     "    \"first\": [\"Corey\", \"Jane\", \"John\"],\n",
  18 |     "    \"last\": [\"Schafer\", \"Doe\", \"Doe\"],\n",
  19 |     "    \"email\": [\"CoreyMSchafer@gmail.com\", \"JaneDoe@email.com\", \"JohnDoe@email.com\"]\n",
  20 |     "}"
  21 |    ]
  22 |   },
  23 |   {
  24 |    "cell_type": "code",
  25 |    "execution_count": 18,
  26 |    "metadata": {},
  27 |    "outputs": [],
  28 |    "source": [
  29 |     "import pandas as pd"
  30 |    ]
  31 |   },
  32 |   {
  33 |    "cell_type": "code",
  34 |    "execution_count": 19,
  35 |    "metadata": {},
  36 |    "outputs": [],
  37 |    "source": [
  38 |     "df = pd.DataFrame(people)"
  39 |    ]
  40 |   },
  41 |   {
  42 |    "cell_type": "code",
  43 |    "execution_count": 20,
  44 |    "metadata": {},
  45 |    "outputs": [
  46 |     {
  47 |      "data": {
  48 |       "text/html": [
  49 |        "<div>\n",
  50 |        "<style scoped>\n",
  51 |        "    .dataframe tbody tr th:only-of-type {\n",
  52 |        "        vertical-align: middle;\n",
  53 |        "    }\n",
  54 |        "\n",
  55 |        "    .dataframe tbody tr th {\n",
  56 |        "        vertical-align: top;\n",
  57 |        "    }\n",
  58 |        "\n",
  59 |        "    .dataframe thead th {\n",
  60 |        "        text-align: right;\n",
  61 |        "    }\n",
  62 |        "</style>\n",
  63 |        "<table border=\"1\" class=\"dataframe\">\n",
  64 |        "  <thead>\n",
  65 |        "    <tr style=\"text-align: right;\">\n",
  66 |        "      <th></th>\n",
  67 |        "      <th>first</th>\n",
  68 |        "      <th>last</th>\n",
  69 |        "      <th>email</th>\n",
  70 |        "    </tr>\n",
  71 |        "  </thead>\n",
  72 |        "  <tbody>\n",
  73 |        "    <tr>\n",
  74 |        "      <th>0</th>\n",
  75 |        "      <td>Corey</td>\n",
  76 |        "      <td>Schafer</td>\n",
  77 |        "      <td>CoreyMSchafer@gmail.com</td>\n",
  78 |        "    </tr>\n",
  79 |        "    <tr>\n",
  80 |        "      <th>1</th>\n",
  81 |        "      <td>Jane</td>\n",
  82 |        "      <td>Doe</td>\n",
  83 |        "      <td>JaneDoe@email.com</td>\n",
  84 |        "    </tr>\n",
  85 |        "    <tr>\n",
  86 |        "      <th>2</th>\n",
  87 |        "      <td>John</td>\n",
  88 |        "      <td>Doe</td>\n",
  89 |        "      <td>JohnDoe@email.com</td>\n",
  90 |        "    </tr>\n",
  91 |        "  </tbody>\n",
  92 |        "</table>\n",
  93 |        "</div>"
  94 |       ],
  95 |       "text/plain": [
  96 |        "   first     last                    email\n",
  97 |        "0  Corey  Schafer  CoreyMSchafer@gmail.com\n",
  98 |        "1   Jane      Doe        JaneDoe@email.com\n",
  99 |        "2   John      Doe        JohnDoe@email.com"
 100 |       ]
 101 |      },
 102 |      "execution_count": 20,
 103 |      "metadata": {},
 104 |      "output_type": "execute_result"
 105 |     }
 106 |    ],
 107 |    "source": [
 108 |     "df"
 109 |    ]
 110 |   },
 111 |   {
 112 |    "cell_type": "markdown",
 113 |    "metadata": {},
 114 |    "source": [
 115 |     "Combine first and last name column:"
 116 |    ]
 117 |   },
 118 |   {
 119 |    "cell_type": "code",
 120 |    "execution_count": 21,
 121 |    "metadata": {},
 122 |    "outputs": [
 123 |     {
 124 |      "data": {
 125 |       "text/plain": [
 126 |        "0    Corey Schafer\n",
 127 |        "1         Jane Doe\n",
 128 |        "2         John Doe\n",
 129 |        "dtype: object"
 130 |       ]
 131 |      },
 132 |      "execution_count": 21,
 133 |      "metadata": {},
 134 |      "output_type": "execute_result"
 135 |     }
 136 |    ],
 137 |    "source": [
 138 |     "df['first'] + ' ' + df['last']"
 139 |    ]
 140 |   },
 141 |   {
 142 |    "cell_type": "code",
 143 |    "execution_count": 22,
 144 |    "metadata": {},
 145 |    "outputs": [],
 146 |    "source": [
 147 |     "df['full_name'] = df['first'] + ' ' + df['last']"
 148 |    ]
 149 |   },
 150 |   {
 151 |    "cell_type": "code",
 152 |    "execution_count": 23,
 153 |    "metadata": {},
 154 |    "outputs": [
 155 |     {
 156 |      "data": {
 157 |       "text/html": [
 158 |        "<div>\n",
 159 |        "<style scoped>\n",
 160 |        "    .dataframe tbody tr th:only-of-type {\n",
 161 |        "        vertical-align: middle;\n",
 162 |        "    }\n",
 163 |        "\n",
 164 |        "    .dataframe tbody tr th {\n",
 165 |        "        vertical-align: top;\n",
 166 |        "    }\n",
 167 |        "\n",
 168 |        "    .dataframe thead th {\n",
 169 |        "        text-align: right;\n",
 170 |        "    }\n",
 171 |        "</style>\n",
 172 |        "<table border=\"1\" class=\"dataframe\">\n",
 173 |        "  <thead>\n",
 174 |        "    <tr style=\"text-align: right;\">\n",
 175 |        "      <th></th>\n",
 176 |        "      <th>first</th>\n",
 177 |        "      <th>last</th>\n",
 178 |        "      <th>email</th>\n",
 179 |        "      <th>full_name</th>\n",
 180 |        "    </tr>\n",
 181 |        "  </thead>\n",
 182 |        "  <tbody>\n",
 183 |        "    <tr>\n",
 184 |        "      <th>0</th>\n",
 185 |        "      <td>Corey</td>\n",
 186 |        "      <td>Schafer</td>\n",
 187 |        "      <td>CoreyMSchafer@gmail.com</td>\n",
 188 |        "      <td>Corey Schafer</td>\n",
 189 |        "    </tr>\n",
 190 |        "    <tr>\n",
 191 |        "      <th>1</th>\n",
 192 |        "      <td>Jane</td>\n",
 193 |        "      <td>Doe</td>\n",
 194 |        "      <td>JaneDoe@email.com</td>\n",
 195 |        "      <td>Jane Doe</td>\n",
 196 |        "    </tr>\n",
 197 |        "    <tr>\n",
 198 |        "      <th>2</th>\n",
 199 |        "      <td>John</td>\n",
 200 |        "      <td>Doe</td>\n",
 201 |        "      <td>JohnDoe@email.com</td>\n",
 202 |        "      <td>John Doe</td>\n",
 203 |        "    </tr>\n",
 204 |        "  </tbody>\n",
 205 |        "</table>\n",
 206 |        "</div>"
 207 |       ],
 208 |       "text/plain": [
 209 |        "   first     last                    email      full_name\n",
 210 |        "0  Corey  Schafer  CoreyMSchafer@gmail.com  Corey Schafer\n",
 211 |        "1   Jane      Doe        JaneDoe@email.com       Jane Doe\n",
 212 |        "2   John      Doe        JohnDoe@email.com       John Doe"
 213 |       ]
 214 |      },
 215 |      "execution_count": 23,
 216 |      "metadata": {},
 217 |      "output_type": "execute_result"
 218 |     }
 219 |    ],
 220 |    "source": [
 221 |     "df"
 222 |    ]
 223 |   },
 224 |   {
 225 |    "cell_type": "markdown",
 226 |    "metadata": {},
 227 |    "source": [
 228 |     "Note: You cannot use dot notation when assigning a new column like this; you must use brackets (otherwise Python will think you're trying to assign an attribute)."
 229 |    ]
 230 |   },
 231 |   {
 232 |    "cell_type": "markdown",
 233 |    "metadata": {},
 234 |    "source": [
 235 |     "To delete columns:"
 236 |    ]
 237 |   },
 238 |   {
 239 |    "cell_type": "code",
 240 |    "execution_count": 24,
 241 |    "metadata": {},
 242 |    "outputs": [
 243 |     {
 244 |      "data": {
 245 |       "text/html": [
 246 |        "<div>\n",
 247 |        "<style scoped>\n",
 248 |        "    .dataframe tbody tr th:only-of-type {\n",
 249 |        "        vertical-align: middle;\n",
 250 |        "    }\n",
 251 |        "\n",
 252 |        "    .dataframe tbody tr th {\n",
 253 |        "        vertical-align: top;\n",
 254 |        "    }\n",
 255 |        "\n",
 256 |        "    .dataframe thead th {\n",
 257 |        "        text-align: right;\n",
 258 |        "    }\n",
 259 |        "</style>\n",
 260 |        "<table border=\"1\" class=\"dataframe\">\n",
 261 |        "  <thead>\n",
 262 |        "    <tr style=\"text-align: right;\">\n",
 263 |        "      <th></th>\n",
 264 |        "      <th>email</th>\n",
 265 |        "      <th>full_name</th>\n",
 266 |        "    </tr>\n",
 267 |        "  </thead>\n",
 268 |        "  <tbody>\n",
 269 |        "    <tr>\n",
 270 |        "      <th>0</th>\n",
 271 |        "      <td>CoreyMSchafer@gmail.com</td>\n",
 272 |        "      <td>Corey Schafer</td>\n",
 273 |        "    </tr>\n",
 274 |        "    <tr>\n",
 275 |        "      <th>1</th>\n",
 276 |        "      <td>JaneDoe@email.com</td>\n",
 277 |        "      <td>Jane Doe</td>\n",
 278 |        "    </tr>\n",
 279 |        "    <tr>\n",
 280 |        "      <th>2</th>\n",
 281 |        "      <td>JohnDoe@email.com</td>\n",
 282 |        "      <td>John Doe</td>\n",
 283 |        "    </tr>\n",
 284 |        "  </tbody>\n",
 285 |        "</table>\n",
 286 |        "</div>"
 287 |       ],
 288 |       "text/plain": [
 289 |        "                     email      full_name\n",
 290 |        "0  CoreyMSchafer@gmail.com  Corey Schafer\n",
 291 |        "1        JaneDoe@email.com       Jane Doe\n",
 292 |        "2        JohnDoe@email.com       John Doe"
 293 |       ]
 294 |      },
 295 |      "execution_count": 24,
 296 |      "metadata": {},
 297 |      "output_type": "execute_result"
 298 |     }
 299 |    ],
 300 |    "source": [
 301 |     "df.drop(columns=['first', 'last'])"
 302 |    ]
 303 |   },
 304 |   {
 305 |    "cell_type": "markdown",
 306 |    "metadata": {},
 307 |    "source": [
 308 |     "This change is not yet applied to df; we need to explicitly pass \"inplace=True\"."
 309 |    ]
 310 |   },
 311 |   {
 312 |    "cell_type": "code",
 313 |    "execution_count": 25,
 314 |    "metadata": {},
 315 |    "outputs": [
 316 |     {
 317 |      "data": {
 318 |       "text/html": [
 319 |        "<div>\n",
 320 |        "<style scoped>\n",
 321 |        "    .dataframe tbody tr th:only-of-type {\n",
 322 |        "        vertical-align: middle;\n",
 323 |        "    }\n",
 324 |        "\n",
 325 |        "    .dataframe tbody tr th {\n",
 326 |        "        vertical-align: top;\n",
 327 |        "    }\n",
 328 |        "\n",
 329 |        "    .dataframe thead th {\n",
 330 |        "        text-align: right;\n",
 331 |        "    }\n",
 332 |        "</style>\n",
 333 |        "<table border=\"1\" class=\"dataframe\">\n",
 334 |        "  <thead>\n",
 335 |        "    <tr style=\"text-align: right;\">\n",
 336 |        "      <th></th>\n",
 337 |        "      <th>first</th>\n",
 338 |        "      <th>last</th>\n",
 339 |        "      <th>email</th>\n",
 340 |        "      <th>full_name</th>\n",
 341 |        "    </tr>\n",
 342 |        "  </thead>\n",
 343 |        "  <tbody>\n",
 344 |        "    <tr>\n",
 345 |        "      <th>0</th>\n",
 346 |        "      <td>Corey</td>\n",
 347 |        "      <td>Schafer</td>\n",
 348 |        "      <td>CoreyMSchafer@gmail.com</td>\n",
 349 |        "      <td>Corey Schafer</td>\n",
 350 |        "    </tr>\n",
 351 |        "    <tr>\n",
 352 |        "      <th>1</th>\n",
 353 |        "      <td>Jane</td>\n",
 354 |        "      <td>Doe</td>\n",
 355 |        "      <td>JaneDoe@email.com</td>\n",
 356 |        "      <td>Jane Doe</td>\n",
 357 |        "    </tr>\n",
 358 |        "    <tr>\n",
 359 |        "      <th>2</th>\n",
 360 |        "      <td>John</td>\n",
 361 |        "      <td>Doe</td>\n",
 362 |        "      <td>JohnDoe@email.com</td>\n",
 363 |        "      <td>John Doe</td>\n",
 364 |        "    </tr>\n",
 365 |        "  </tbody>\n",
 366 |        "</table>\n",
 367 |        "</div>"
 368 |       ],
 369 |       "text/plain": [
 370 |        "   first     last                    email      full_name\n",
 371 |        "0  Corey  Schafer  CoreyMSchafer@gmail.com  Corey Schafer\n",
 372 |        "1   Jane      Doe        JaneDoe@email.com       Jane Doe\n",
 373 |        "2   John      Doe        JohnDoe@email.com       John Doe"
 374 |       ]
 375 |      },
 376 |      "execution_count": 25,
 377 |      "metadata": {},
 378 |      "output_type": "execute_result"
 379 |     }
 380 |    ],
 381 |    "source": [
 382 |     "df"
 383 |    ]
 384 |   },
 385 |   {
 386 |    "cell_type": "code",
 387 |    "execution_count": 26,
 388 |    "metadata": {},
 389 |    "outputs": [],
 390 |    "source": [
 391 |     "df.drop(columns=['first', 'last'], inplace=True)"
 392 |    ]
 393 |   },
 394 |   {
 395 |    "cell_type": "code",
 396 |    "execution_count": 27,
 397 |    "metadata": {},
 398 |    "outputs": [
 399 |     {
 400 |      "data": {
 401 |       "text/html": [
 402 |        "<div>\n",
 403 |        "<style scoped>\n",
 404 |        "    .dataframe tbody tr th:only-of-type {\n",
 405 |        "        vertical-align: middle;\n",
 406 |        "    }\n",
 407 |        "\n",
 408 |        "    .dataframe tbody tr th {\n",
 409 |        "        vertical-align: top;\n",
 410 |        "    }\n",
 411 |        "\n",
 412 |        "    .dataframe thead th {\n",
 413 |        "        text-align: right;\n",
 414 |        "    }\n",
 415 |        "</style>\n",
 416 |        "<table border=\"1\" class=\"dataframe\">\n",
 417 |        "  <thead>\n",
 418 |        "    <tr style=\"text-align: right;\">\n",
 419 |        "      <th></th>\n",
 420 |        "      <th>email</th>\n",
 421 |        "      <th>full_name</th>\n",
 422 |        "    </tr>\n",
 423 |        "  </thead>\n",
 424 |        "  <tbody>\n",
 425 |        "    <tr>\n",
 426 |        "      <th>0</th>\n",
 427 |        "      <td>CoreyMSchafer@gmail.com</td>\n",
 428 |        "      <td>Corey Schafer</td>\n",
 429 |        "    </tr>\n",
 430 |        "    <tr>\n",
 431 |        "      <th>1</th>\n",
 432 |        "      <td>JaneDoe@email.com</td>\n",
 433 |        "      <td>Jane Doe</td>\n",
 434 |        "    </tr>\n",
 435 |        "    <tr>\n",
 436 |        "      <th>2</th>\n",
 437 |        "      <td>JohnDoe@email.com</td>\n",
 438 |        "      <td>John Doe</td>\n",
 439 |        "    </tr>\n",
 440 |        "  </tbody>\n",
 441 |        "</table>\n",
 442 |        "</div>"
 443 |       ],
 444 |       "text/plain": [
 445 |        "                     email      full_name\n",
 446 |        "0  CoreyMSchafer@gmail.com  Corey Schafer\n",
 447 |        "1        JaneDoe@email.com       Jane Doe\n",
 448 |        "2        JohnDoe@email.com       John Doe"
 449 |       ]
 450 |      },
 451 |      "execution_count": 27,
 452 |      "metadata": {},
 453 |      "output_type": "execute_result"
 454 |     }
 455 |    ],
 456 |    "source": [
 457 |     "df"
 458 |    ]
 459 |   },
 460 |   {
 461 |    "cell_type": "markdown",
 462 |    "metadata": {},
 463 |    "source": [
 464 |     "To split full_name into separate columns for each part of name:"
 465 |    ]
 466 |   },
 467 |   {
 468 |    "cell_type": "code",
 469 |    "execution_count": 28,
 470 |    "metadata": {},
 471 |    "outputs": [
 472 |     {
 473 |      "data": {
 474 |       "text/plain": [
 475 |        "0    [Corey, Schafer]\n",
 476 |        "1         [Jane, Doe]\n",
 477 |        "2         [John, Doe]\n",
 478 |        "Name: full_name, dtype: object"
 479 |       ]
 480 |      },
 481 |      "execution_count": 28,
 482 |      "metadata": {},
 483 |      "output_type": "execute_result"
 484 |     }
 485 |    ],
 486 |    "source": [
 487 |     "df['full_name'].str.split(' ')"
 488 |    ]
 489 |   },
 490 |   {
 491 |    "cell_type": "markdown",
 492 |    "metadata": {},
 493 |    "source": [
 494 |     "Result is first and last name in a list."
 495 |    ]
 496 |   },
 497 |   {
 498 |    "cell_type": "markdown",
 499 |    "metadata": {},
 500 |    "source": [
 501 |     "To assign to separate columns, use expand argument:"
 502 |    ]
 503 |   },
 504 |   {
 505 |    "cell_type": "code",
 506 |    "execution_count": 29,
 507 |    "metadata": {},
 508 |    "outputs": [
 509 |     {
 510 |      "data": {
 511 |       "text/html": [
 512 |        "<div>\n",
 513 |        "<style scoped>\n",
 514 |        "    .dataframe tbody tr th:only-of-type {\n",
 515 |        "        vertical-align: middle;\n",
 516 |        "    }\n",
 517 |        "\n",
 518 |        "    .dataframe tbody tr th {\n",
 519 |        "        vertical-align: top;\n",
 520 |        "    }\n",
 521 |        "\n",
 522 |        "    .dataframe thead th {\n",
 523 |        "        text-align: right;\n",
 524 |        "    }\n",
 525 |        "</style>\n",
 526 |        "<table border=\"1\" class=\"dataframe\">\n",
 527 |        "  <thead>\n",
 528 |        "    <tr style=\"text-align: right;\">\n",
 529 |        "      <th></th>\n",
 530 |        "      <th>0</th>\n",
 531 |        "      <th>1</th>\n",
 532 |        "    </tr>\n",
 533 |        "  </thead>\n",
 534 |        "  <tbody>\n",
 535 |        "    <tr>\n",
 536 |        "      <th>0</th>\n",
 537 |        "      <td>Corey</td>\n",
 538 |        "      <td>Schafer</td>\n",
 539 |        "    </tr>\n",
 540 |        "    <tr>\n",
 541 |        "      <th>1</th>\n",
 542 |        "      <td>Jane</td>\n",
 543 |        "      <td>Doe</td>\n",
 544 |        "    </tr>\n",
 545 |        "    <tr>\n",
 546 |        "      <th>2</th>\n",
 547 |        "      <td>John</td>\n",
 548 |        "      <td>Doe</td>\n",
 549 |        "    </tr>\n",
 550 |        "  </tbody>\n",
 551 |        "</table>\n",
 552 |        "</div>"
 553 |       ],
 554 |       "text/plain": [
 555 |        "       0        1\n",
 556 |        "0  Corey  Schafer\n",
 557 |        "1   Jane      Doe\n",
 558 |        "2   John      Doe"
 559 |       ]
 560 |      },
 561 |      "execution_count": 29,
 562 |      "metadata": {},
 563 |      "output_type": "execute_result"
 564 |     }
 565 |    ],
 566 |    "source": [
 567 |     "df['full_name'].str.split(' ', expand=True)"
 568 |    ]
 569 |   },
 570 |   {
 571 |    "cell_type": "markdown",
 572 |    "metadata": {},
 573 |    "source": [
 574 |     "Now set two columns in the data frame for these, by passing in the list:"
 575 |    ]
 576 |   },
 577 |   {
 578 |    "cell_type": "code",
 579 |    "execution_count": 30,
 580 |    "metadata": {},
 581 |    "outputs": [],
 582 |    "source": [
 583 |     "df[['first', 'last']] = df['full_name'].str.split(' ', expand=True)"
 584 |    ]
 585 |   },
 586 |   {
 587 |    "cell_type": "code",
 588 |    "execution_count": 31,
 589 |    "metadata": {},
 590 |    "outputs": [
 591 |     {
 592 |      "data": {
 593 |       "text/html": [
 594 |        "<div>\n",
 595 |        "<style scoped>\n",
 596 |        "    .dataframe tbody tr th:only-of-type {\n",
 597 |        "        vertical-align: middle;\n",
 598 |        "    }\n",
 599 |        "\n",
 600 |        "    .dataframe tbody tr th {\n",
 601 |        "        vertical-align: top;\n",
 602 |        "    }\n",
 603 |        "\n",
 604 |        "    .dataframe thead th {\n",
 605 |        "        text-align: right;\n",
 606 |        "    }\n",
 607 |        "</style>\n",
 608 |        "<table border=\"1\" class=\"dataframe\">\n",
 609 |        "  <thead>\n",
 610 |        "    <tr style=\"text-align: right;\">\n",
 611 |        "      <th></th>\n",
 612 |        "      <th>email</th>\n",
 613 |        "      <th>full_name</th>\n",
 614 |        "      <th>first</th>\n",
 615 |        "      <th>last</th>\n",
 616 |        "    </tr>\n",
 617 |        "  </thead>\n",
 618 |        "  <tbody>\n",
 619 |        "    <tr>\n",
 620 |        "      <th>0</th>\n",
 621 |        "      <td>CoreyMSchafer@gmail.com</td>\n",
 622 |        "      <td>Corey Schafer</td>\n",
 623 |        "      <td>Corey</td>\n",
 624 |        "      <td>Schafer</td>\n",
 625 |        "    </tr>\n",
 626 |        "    <tr>\n",
 627 |        "      <th>1</th>\n",
 628 |        "      <td>JaneDoe@email.com</td>\n",
 629 |        "      <td>Jane Doe</td>\n",
 630 |        "      <td>Jane</td>\n",
 631 |        "      <td>Doe</td>\n",
 632 |        "    </tr>\n",
 633 |        "    <tr>\n",
 634 |        "      <th>2</th>\n",
 635 |        "      <td>JohnDoe@email.com</td>\n",
 636 |        "      <td>John Doe</td>\n",
 637 |        "      <td>John</td>\n",
 638 |        "      <td>Doe</td>\n",
 639 |        "    </tr>\n",
 640 |        "  </tbody>\n",
 641 |        "</table>\n",
 642 |        "</div>"
 643 |       ],
 644 |       "text/plain": [
 645 |        "                     email      full_name  first     last\n",
 646 |        "0  CoreyMSchafer@gmail.com  Corey Schafer  Corey  Schafer\n",
 647 |        "1        JaneDoe@email.com       Jane Doe   Jane      Doe\n",
 648 |        "2        JohnDoe@email.com       John Doe   John      Doe"
 649 |       ]
 650 |      },
 651 |      "execution_count": 31,
 652 |      "metadata": {},
 653 |      "output_type": "execute_result"
 654 |     }
 655 |    ],
 656 |    "source": [
 657 |     "df"
 658 |    ]
 659 |   },
 660 |   {
 661 |    "cell_type": "markdown",
 662 |    "metadata": {},
 663 |    "source": [
 664 |     "On to adding and removing rows...\n",
 665 |     "\n",
 666 |     "First, add a single row of data with append:"
 667 |    ]
 668 |   },
 669 |   {
 670 |    "cell_type": "code",
 671 |    "execution_count": 32,
 672 |    "metadata": {},
 673 |    "outputs": [
 674 |     {
 675 |      "ename": "TypeError",
 676 |      "evalue": "Can only append a Series if ignore_index=True or if the Series has a name",
 677 |      "output_type": "error",
 678 |      "traceback": [
 679 |       "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
 680 |       "\u001b[0;31mTypeError\u001b[0m                                 Traceback (most recent call last)",
 681 |       "\u001b[0;32m<ipython-input-32-d99067ad07e9>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0mdf\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mappend\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m{\u001b[0m\u001b[0;34m'first'\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0;34m'Tony'\u001b[0m\u001b[0;34m}\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m",
 682 |       "\u001b[0;32m/usr/local/lib/python3.6/dist-packages/pandas/core/frame.py\u001b[0m in \u001b[0;36mappend\u001b[0;34m(self, other, ignore_index, verify_integrity, sort)\u001b[0m\n\u001b[1;32m   7096\u001b[0m             \u001b[0;32mif\u001b[0m \u001b[0mother\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mname\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mNone\u001b[0m \u001b[0;32mand\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0mignore_index\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m   7097\u001b[0m                 raise TypeError(\n\u001b[0;32m-> 7098\u001b[0;31m                     \u001b[0;34m\"Can only append a Series if ignore_index=True\"\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m   7099\u001b[0m                     \u001b[0;34m\" or if the Series has a name\"\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m   7100\u001b[0m                 )\n",
 683 |       "\u001b[0;31mTypeError\u001b[0m: Can only append a Series if ignore_index=True or if the Series has a name"
 684 |      ]
 685 |     }
 686 |    ],
 687 |    "source": [
 688 |     "df.append({'first': 'Tony'})"
 689 |    ]
 690 |   },
 691 |   {
 692 |    "cell_type": "markdown",
 693 |    "metadata": {},
 694 |    "source": [
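 695 |     "This raises an error because the dict is treated as a Series with no name, so pandas has no index label for the new row. Passing \"ignore_index=True\" tells pandas to ignore index labels and assign the next default integer index instead."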
 696 |    ]
 697 |   },
 698 |   {
 699 |    "cell_type": "code",
 700 |    "execution_count": 33,
 701 |    "metadata": {},
 702 |    "outputs": [
 703 |     {
 704 |      "data": {
 705 |       "text/html": [
 706 |        "<div>\n",
 707 |        "<style scoped>\n",
 708 |        "    .dataframe tbody tr th:only-of-type {\n",
 709 |        "        vertical-align: middle;\n",
 710 |        "    }\n",
 711 |        "\n",
 712 |        "    .dataframe tbody tr th {\n",
 713 |        "        vertical-align: top;\n",
 714 |        "    }\n",
 715 |        "\n",
 716 |        "    .dataframe thead th {\n",
 717 |        "        text-align: right;\n",
 718 |        "    }\n",
 719 |        "</style>\n",
 720 |        "<table border=\"1\" class=\"dataframe\">\n",
 721 |        "  <thead>\n",
 722 |        "    <tr style=\"text-align: right;\">\n",
 723 |        "      <th></th>\n",
 724 |        "      <th>email</th>\n",
 725 |        "      <th>full_name</th>\n",
 726 |        "      <th>first</th>\n",
 727 |        "      <th>last</th>\n",
 728 |        "    </tr>\n",
 729 |        "  </thead>\n",
 730 |        "  <tbody>\n",
 731 |        "    <tr>\n",
 732 |        "      <th>0</th>\n",
 733 |        "      <td>CoreyMSchafer@gmail.com</td>\n",
 734 |        "      <td>Corey Schafer</td>\n",
 735 |        "      <td>Corey</td>\n",
 736 |        "      <td>Schafer</td>\n",
 737 |        "    </tr>\n",
 738 |        "    <tr>\n",
 739 |        "      <th>1</th>\n",
 740 |        "      <td>JaneDoe@email.com</td>\n",
 741 |        "      <td>Jane Doe</td>\n",
 742 |        "      <td>Jane</td>\n",
 743 |        "      <td>Doe</td>\n",
 744 |        "    </tr>\n",
 745 |        "    <tr>\n",
 746 |        "      <th>2</th>\n",
 747 |        "      <td>JohnDoe@email.com</td>\n",
 748 |        "      <td>John Doe</td>\n",
 749 |        "      <td>John</td>\n",
 750 |        "      <td>Doe</td>\n",
 751 |        "    </tr>\n",
 752 |        "    <tr>\n",
 753 |        "      <th>3</th>\n",
 754 |        "      <td>NaN</td>\n",
 755 |        "      <td>NaN</td>\n",
 756 |        "      <td>Tony</td>\n",
 757 |        "      <td>NaN</td>\n",
 758 |        "    </tr>\n",
 759 |        "  </tbody>\n",
 760 |        "</table>\n",
 761 |        "</div>"
 762 |       ],
 763 |       "text/plain": [
 764 |        "                     email      full_name  first     last\n",
 765 |        "0  CoreyMSchafer@gmail.com  Corey Schafer  Corey  Schafer\n",
 766 |        "1        JaneDoe@email.com       Jane Doe   Jane      Doe\n",
 767 |        "2        JohnDoe@email.com       John Doe   John      Doe\n",
 768 |        "3                      NaN            NaN   Tony      NaN"
 769 |       ]
 770 |      },
 771 |      "execution_count": 33,
 772 |      "metadata": {},
 773 |      "output_type": "execute_result"
 774 |     }
 775 |    ],
 776 |    "source": [
 777 |     "df.append({'first': 'Tony'}, ignore_index=True)"
 778 |    ]
 779 |   },
 780 |   {
 781 |    "cell_type": "markdown",
 782 |    "metadata": {},
 783 |    "source": [
 784 |     "New name was appended, but since we only assigned one value the other cells are \"NaN\".\n",
 785 |     "\n",
 786 |     "We can also append a new dataframe to an existing dataframe. First create the second dataframe:"
 787 |    ]
 788 |   },
 789 |   {
 790 |    "cell_type": "code",
 791 |    "execution_count": 34,
 792 |    "metadata": {},
 793 |    "outputs": [],
 794 |    "source": [
 795 |     "people = {\n",
 796 |     "    \"first\": [\"Tony\", \"Steve\"],\n",
 797 |     "    \"last\": [\"Stark\", \"Rogers\"],\n",
 798 |     "    \"email\": [\"ironman@avenge.com\", \"cap@avenge.com\"]\n",
 799 |     "}\n",
 800 |     "df2 = pd.DataFrame(people)"
 801 |    ]
 802 |   },
 803 |   {
 804 |    "cell_type": "code",
 805 |    "execution_count": 35,
 806 |    "metadata": {},
 807 |    "outputs": [
 808 |     {
 809 |      "data": {
 810 |       "text/html": [
 811 |        "<div>\n",
 812 |        "<style scoped>\n",
 813 |        "    .dataframe tbody tr th:only-of-type {\n",
 814 |        "        vertical-align: middle;\n",
 815 |        "    }\n",
 816 |        "\n",
 817 |        "    .dataframe tbody tr th {\n",
 818 |        "        vertical-align: top;\n",
 819 |        "    }\n",
 820 |        "\n",
 821 |        "    .dataframe thead th {\n",
 822 |        "        text-align: right;\n",
 823 |        "    }\n",
 824 |        "</style>\n",
 825 |        "<table border=\"1\" class=\"dataframe\">\n",
 826 |        "  <thead>\n",
 827 |        "    <tr style=\"text-align: right;\">\n",
 828 |        "      <th></th>\n",
 829 |        "      <th>first</th>\n",
 830 |        "      <th>last</th>\n",
 831 |        "      <th>email</th>\n",
 832 |        "    </tr>\n",
 833 |        "  </thead>\n",
 834 |        "  <tbody>\n",
 835 |        "    <tr>\n",
 836 |        "      <th>0</th>\n",
 837 |        "      <td>Tony</td>\n",
 838 |        "      <td>Stark</td>\n",
 839 |        "      <td>ironman@avenge.com</td>\n",
 840 |        "    </tr>\n",
 841 |        "    <tr>\n",
 842 |        "      <th>1</th>\n",
 843 |        "      <td>Steve</td>\n",
 844 |        "      <td>Rogers</td>\n",
 845 |        "      <td>cap@avenge.com</td>\n",
 846 |        "    </tr>\n",
 847 |        "  </tbody>\n",
 848 |        "</table>\n",
 849 |        "</div>"
 850 |       ],
 851 |       "text/plain": [
 852 |        "   first    last               email\n",
 853 |        "0   Tony   Stark  ironman@avenge.com\n",
 854 |        "1  Steve  Rogers      cap@avenge.com"
 855 |       ]
 856 |      },
 857 |      "execution_count": 35,
 858 |      "metadata": {},
 859 |      "output_type": "execute_result"
 860 |     }
 861 |    ],
 862 |    "source": [
 863 |     "df2"
 864 |    ]
 865 |   },
 866 |   {
 867 |    "cell_type": "markdown",
 868 |    "metadata": {},
 869 |    "source": [
 870 |     "Now append, remembering to pass \"ignore_index=True\":"
 871 |    ]
 872 |   },
 873 |   {
 874 |    "cell_type": "code",
 875 |    "execution_count": 36,
 876 |    "metadata": {},
 877 |    "outputs": [
 878 |     {
 879 |      "name": "stderr",
 880 |      "output_type": "stream",
 881 |      "text": [
 882 |       "/usr/local/lib/python3.6/dist-packages/pandas/core/frame.py:7138: FutureWarning: Sorting because non-concatenation axis is not aligned. A future version\n",
 883 |       "of pandas will change to not sort by default.\n",
 884 |       "\n",
 885 |       "To accept the future behavior, pass 'sort=False'.\n",
 886 |       "\n",
 887 |       "To retain the current behavior and silence the warning, pass 'sort=True'.\n",
 888 |       "\n",
 889 |       "  sort=sort,\n"
 890 |      ]
 891 |     },
 892 |     {
 893 |      "data": {
 894 |       "text/html": [
 895 |        "<div>\n",
 896 |        "<style scoped>\n",
 897 |        "    .dataframe tbody tr th:only-of-type {\n",
 898 |        "        vertical-align: middle;\n",
 899 |        "    }\n",
 900 |        "\n",
 901 |        "    .dataframe tbody tr th {\n",
 902 |        "        vertical-align: top;\n",
 903 |        "    }\n",
 904 |        "\n",
 905 |        "    .dataframe thead th {\n",
 906 |        "        text-align: right;\n",
 907 |        "    }\n",
 908 |        "</style>\n",
 909 |        "<table border=\"1\" class=\"dataframe\">\n",
 910 |        "  <thead>\n",
 911 |        "    <tr style=\"text-align: right;\">\n",
 912 |        "      <th></th>\n",
 913 |        "      <th>email</th>\n",
 914 |        "      <th>first</th>\n",
 915 |        "      <th>full_name</th>\n",
 916 |        "      <th>last</th>\n",
 917 |        "    </tr>\n",
 918 |        "  </thead>\n",
 919 |        "  <tbody>\n",
 920 |        "    <tr>\n",
 921 |        "      <th>0</th>\n",
 922 |        "      <td>CoreyMSchafer@gmail.com</td>\n",
 923 |        "      <td>Corey</td>\n",
 924 |        "      <td>Corey Schafer</td>\n",
 925 |        "      <td>Schafer</td>\n",
 926 |        "    </tr>\n",
 927 |        "    <tr>\n",
 928 |        "      <th>1</th>\n",
 929 |        "      <td>JaneDoe@email.com</td>\n",
 930 |        "      <td>Jane</td>\n",
 931 |        "      <td>Jane Doe</td>\n",
 932 |        "      <td>Doe</td>\n",
 933 |        "    </tr>\n",
 934 |        "    <tr>\n",
 935 |        "      <th>2</th>\n",
 936 |        "      <td>JohnDoe@email.com</td>\n",
 937 |        "      <td>John</td>\n",
 938 |        "      <td>John Doe</td>\n",
 939 |        "      <td>Doe</td>\n",
 940 |        "    </tr>\n",
 941 |        "    <tr>\n",
 942 |        "      <th>3</th>\n",
 943 |        "      <td>ironman@avenge.com</td>\n",
 944 |        "      <td>Tony</td>\n",
 945 |        "      <td>NaN</td>\n",
 946 |        "      <td>Stark</td>\n",
 947 |        "    </tr>\n",
 948 |        "    <tr>\n",
 949 |        "      <th>4</th>\n",
 950 |        "      <td>cap@avenge.com</td>\n",
 951 |        "      <td>Steve</td>\n",
 952 |        "      <td>NaN</td>\n",
 953 |        "      <td>Rogers</td>\n",
 954 |        "    </tr>\n",
 955 |        "  </tbody>\n",
 956 |        "</table>\n",
 957 |        "</div>"
 958 |       ],
 959 |       "text/plain": [
 960 |        "                     email  first      full_name     last\n",
 961 |        "0  CoreyMSchafer@gmail.com  Corey  Corey Schafer  Schafer\n",
 962 |        "1        JaneDoe@email.com   Jane       Jane Doe      Doe\n",
 963 |        "2        JohnDoe@email.com   John       John Doe      Doe\n",
 964 |        "3       ironman@avenge.com   Tony            NaN    Stark\n",
 965 |        "4           cap@avenge.com  Steve            NaN   Rogers"
 966 |       ]
 967 |      },
 968 |      "execution_count": 36,
 969 |      "metadata": {},
 970 |      "output_type": "execute_result"
 971 |     }
 972 |    ],
 973 |    "source": [
 974 |     "df.append(df2, ignore_index=True)"
 975 |    ]
 976 |   },
 977 |   {
 978 |    "cell_type": "markdown",
 979 |    "metadata": {},
 980 |    "source": [
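 981 |     "The new rows were added. The reason for the warning is that the columns of the two dataframes are not aligned (df2 has no \"full_name\" column and lists its columns in a different order), so pandas sorted the columns. A future version of pandas will not sort by default.\n",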
 982 |     "\n",
 983 |     "If option \"sort=False\" is set, warning will be suppressed.\n",
 984 |     "\n",
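 985 |     "The append method doesn't have an \"inplace\" argument, so we have to reassign df to make the change permanent. (Note: DataFrame.append was deprecated in pandas 1.4 and removed in pandas 2.0; on newer versions use pd.concat([df, df2], ignore_index=True, sort=False) instead.)"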
 986 |    ]
 987 |   },
 988 |   {
 989 |    "cell_type": "code",
 990 |    "execution_count": 37,
 991 |    "metadata": {},
 992 |    "outputs": [],
 993 |    "source": [
 994 |     "df = df.append(df2, ignore_index=True, sort=False)"
 995 |    ]
 996 |   },
 997 |   {
 998 |    "cell_type": "code",
 999 |    "execution_count": 38,
1000 |    "metadata": {},
1001 |    "outputs": [
1002 |     {
1003 |      "data": {
1004 |       "text/html": [
1005 |        "<div>\n",
1006 |        "<style scoped>\n",
1007 |        "    .dataframe tbody tr th:only-of-type {\n",
1008 |        "        vertical-align: middle;\n",
1009 |        "    }\n",
1010 |        "\n",
1011 |        "    .dataframe tbody tr th {\n",
1012 |        "        vertical-align: top;\n",
1013 |        "    }\n",
1014 |        "\n",
1015 |        "    .dataframe thead th {\n",
1016 |        "        text-align: right;\n",
1017 |        "    }\n",
1018 |        "</style>\n",
1019 |        "<table border=\"1\" class=\"dataframe\">\n",
1020 |        "  <thead>\n",
1021 |        "    <tr style=\"text-align: right;\">\n",
1022 |        "      <th></th>\n",
1023 |        "      <th>email</th>\n",
1024 |        "      <th>full_name</th>\n",
1025 |        "      <th>first</th>\n",
1026 |        "      <th>last</th>\n",
1027 |        "    </tr>\n",
1028 |        "  </thead>\n",
1029 |        "  <tbody>\n",
1030 |        "    <tr>\n",
1031 |        "      <th>0</th>\n",
1032 |        "      <td>CoreyMSchafer@gmail.com</td>\n",
1033 |        "      <td>Corey Schafer</td>\n",
1034 |        "      <td>Corey</td>\n",
1035 |        "      <td>Schafer</td>\n",
1036 |        "    </tr>\n",
1037 |        "    <tr>\n",
1038 |        "      <th>1</th>\n",
1039 |        "      <td>JaneDoe@email.com</td>\n",
1040 |        "      <td>Jane Doe</td>\n",
1041 |        "      <td>Jane</td>\n",
1042 |        "      <td>Doe</td>\n",
1043 |        "    </tr>\n",
1044 |        "    <tr>\n",
1045 |        "      <th>2</th>\n",
1046 |        "      <td>JohnDoe@email.com</td>\n",
1047 |        "      <td>John Doe</td>\n",
1048 |        "      <td>John</td>\n",
1049 |        "      <td>Doe</td>\n",
1050 |        "    </tr>\n",
1051 |        "    <tr>\n",
1052 |        "      <th>3</th>\n",
1053 |        "      <td>ironman@avenge.com</td>\n",
1054 |        "      <td>NaN</td>\n",
1055 |        "      <td>Tony</td>\n",
1056 |        "      <td>Stark</td>\n",
1057 |        "    </tr>\n",
1058 |        "    <tr>\n",
1059 |        "      <th>4</th>\n",
1060 |        "      <td>cap@avenge.com</td>\n",
1061 |        "      <td>NaN</td>\n",
1062 |        "      <td>Steve</td>\n",
1063 |        "      <td>Rogers</td>\n",
1064 |        "    </tr>\n",
1065 |        "  </tbody>\n",
1066 |        "</table>\n",
1067 |        "</div>"
1068 |       ],
1069 |       "text/plain": [
1070 |        "                     email      full_name  first     last\n",
1071 |        "0  CoreyMSchafer@gmail.com  Corey Schafer  Corey  Schafer\n",
1072 |        "1        JaneDoe@email.com       Jane Doe   Jane      Doe\n",
1073 |        "2        JohnDoe@email.com       John Doe   John      Doe\n",
1074 |        "3       ironman@avenge.com            NaN   Tony    Stark\n",
1075 |        "4           cap@avenge.com            NaN  Steve   Rogers"
1076 |       ]
1077 |      },
1078 |      "execution_count": 38,
1079 |      "metadata": {},
1080 |      "output_type": "execute_result"
1081 |     }
1082 |    ],
1083 |    "source": [
1084 |     "df"
1085 |    ]
1086 |   },
1087 |   {
1088 |    "cell_type": "markdown",
1089 |    "metadata": {},
1090 |    "source": [
1091 |     "Now let's remove rows. Instead of specifying columns to drop, specify indexes:"
1092 |    ]
1093 |   },
1094 |   {
1095 |    "cell_type": "code",
1096 |    "execution_count": 39,
1097 |    "metadata": {},
1098 |    "outputs": [
1099 |     {
1100 |      "data": {
1101 |       "text/html": [
1102 |        "<div>\n",
1103 |        "<style scoped>\n",
1104 |        "    .dataframe tbody tr th:only-of-type {\n",
1105 |        "        vertical-align: middle;\n",
1106 |        "    }\n",
1107 |        "\n",
1108 |        "    .dataframe tbody tr th {\n",
1109 |        "        vertical-align: top;\n",
1110 |        "    }\n",
1111 |        "\n",
1112 |        "    .dataframe thead th {\n",
1113 |        "        text-align: right;\n",
1114 |        "    }\n",
1115 |        "</style>\n",
1116 |        "<table border=\"1\" class=\"dataframe\">\n",
1117 |        "  <thead>\n",
1118 |        "    <tr style=\"text-align: right;\">\n",
1119 |        "      <th></th>\n",
1120 |        "      <th>email</th>\n",
1121 |        "      <th>full_name</th>\n",
1122 |        "      <th>first</th>\n",
1123 |        "      <th>last</th>\n",
1124 |        "    </tr>\n",
1125 |        "  </thead>\n",
1126 |        "  <tbody>\n",
1127 |        "    <tr>\n",
1128 |        "      <th>0</th>\n",
1129 |        "      <td>CoreyMSchafer@gmail.com</td>\n",
1130 |        "      <td>Corey Schafer</td>\n",
1131 |        "      <td>Corey</td>\n",
1132 |        "      <td>Schafer</td>\n",
1133 |        "    </tr>\n",
1134 |        "    <tr>\n",
1135 |        "      <th>1</th>\n",
1136 |        "      <td>JaneDoe@email.com</td>\n",
1137 |        "      <td>Jane Doe</td>\n",
1138 |        "      <td>Jane</td>\n",
1139 |        "      <td>Doe</td>\n",
1140 |        "    </tr>\n",
1141 |        "    <tr>\n",
1142 |        "      <th>2</th>\n",
1143 |        "      <td>JohnDoe@email.com</td>\n",
1144 |        "      <td>John Doe</td>\n",
1145 |        "      <td>John</td>\n",
1146 |        "      <td>Doe</td>\n",
1147 |        "    </tr>\n",
1148 |        "    <tr>\n",
1149 |        "      <th>3</th>\n",
1150 |        "      <td>ironman@avenge.com</td>\n",
1151 |        "      <td>NaN</td>\n",
1152 |        "      <td>Tony</td>\n",
1153 |        "      <td>Stark</td>\n",
1154 |        "    </tr>\n",
1155 |        "  </tbody>\n",
1156 |        "</table>\n",
1157 |        "</div>"
1158 |       ],
1159 |       "text/plain": [
1160 |        "                     email      full_name  first     last\n",
1161 |        "0  CoreyMSchafer@gmail.com  Corey Schafer  Corey  Schafer\n",
1162 |        "1        JaneDoe@email.com       Jane Doe   Jane      Doe\n",
1163 |        "2        JohnDoe@email.com       John Doe   John      Doe\n",
1164 |        "3       ironman@avenge.com            NaN   Tony    Stark"
1165 |       ]
1166 |      },
1167 |      "execution_count": 39,
1168 |      "metadata": {},
1169 |      "output_type": "execute_result"
1170 |     }
1171 |    ],
1172 |    "source": [
1173 |     "df.drop(index=4)"
1174 |    ]
1175 |   },
1176 |   {
1177 |    "cell_type": "markdown",
1178 |    "metadata": {},
1179 |    "source": [
1180 |     "To apply change permanently, use \"inplace=True\".\n",
1181 |     "\n",
1182 |     "We can also combine a filter with the drop method by passing in the index of the rows that match the filter:"
1183 |    ]
1184 |   },
1185 |   {
1186 |    "cell_type": "code",
1187 |    "execution_count": 40,
1188 |    "metadata": {},
1189 |    "outputs": [
1190 |     {
1191 |      "data": {
1192 |       "text/html": [
1193 |        "<div>\n",
1194 |        "<style scoped>\n",
1195 |        "    .dataframe tbody tr th:only-of-type {\n",
1196 |        "        vertical-align: middle;\n",
1197 |        "    }\n",
1198 |        "\n",
1199 |        "    .dataframe tbody tr th {\n",
1200 |        "        vertical-align: top;\n",
1201 |        "    }\n",
1202 |        "\n",
1203 |        "    .dataframe thead th {\n",
1204 |        "        text-align: right;\n",
1205 |        "    }\n",
1206 |        "</style>\n",
1207 |        "<table border=\"1\" class=\"dataframe\">\n",
1208 |        "  <thead>\n",
1209 |        "    <tr style=\"text-align: right;\">\n",
1210 |        "      <th></th>\n",
1211 |        "      <th>email</th>\n",
1212 |        "      <th>full_name</th>\n",
1213 |        "      <th>first</th>\n",
1214 |        "      <th>last</th>\n",
1215 |        "    </tr>\n",
1216 |        "  </thead>\n",
1217 |        "  <tbody>\n",
1218 |        "    <tr>\n",
1219 |        "      <th>0</th>\n",
1220 |        "      <td>CoreyMSchafer@gmail.com</td>\n",
1221 |        "      <td>Corey Schafer</td>\n",
1222 |        "      <td>Corey</td>\n",
1223 |        "      <td>Schafer</td>\n",
1224 |        "    </tr>\n",
1225 |        "    <tr>\n",
1226 |        "      <th>3</th>\n",
1227 |        "      <td>ironman@avenge.com</td>\n",
1228 |        "      <td>NaN</td>\n",
1229 |        "      <td>Tony</td>\n",
1230 |        "      <td>Stark</td>\n",
1231 |        "    </tr>\n",
1232 |        "    <tr>\n",
1233 |        "      <th>4</th>\n",
1234 |        "      <td>cap@avenge.com</td>\n",
1235 |        "      <td>NaN</td>\n",
1236 |        "      <td>Steve</td>\n",
1237 |        "      <td>Rogers</td>\n",
1238 |        "    </tr>\n",
1239 |        "  </tbody>\n",
1240 |        "</table>\n",
1241 |        "</div>"
1242 |       ],
1243 |       "text/plain": [
1244 |        "                     email      full_name  first     last\n",
1245 |        "0  CoreyMSchafer@gmail.com  Corey Schafer  Corey  Schafer\n",
1246 |        "3       ironman@avenge.com            NaN   Tony    Stark\n",
1247 |        "4           cap@avenge.com            NaN  Steve   Rogers"
1248 |       ]
1249 |      },
1250 |      "execution_count": 40,
1251 |      "metadata": {},
1252 |      "output_type": "execute_result"
1253 |     }
1254 |    ],
1255 |    "source": [
1256 |     "df.drop(index=df[df['last'] == 'Doe'].index)"
1257 |    ]
1258 |   },
1259 |   {
1260 |    "cell_type": "code",
1261 |    "execution_count": 42,
1262 |    "metadata": {},
1263 |    "outputs": [
1264 |     {
1265 |      "data": {
1266 |       "text/html": [
1267 |        "<div>\n",
1268 |        "<style scoped>\n",
1269 |        "    .dataframe tbody tr th:only-of-type {\n",
1270 |        "        vertical-align: middle;\n",
1271 |        "    }\n",
1272 |        "\n",
1273 |        "    .dataframe tbody tr th {\n",
1274 |        "        vertical-align: top;\n",
1275 |        "    }\n",
1276 |        "\n",
1277 |        "    .dataframe thead th {\n",
1278 |        "        text-align: right;\n",
1279 |        "    }\n",
1280 |        "</style>\n",
1281 |        "<table border=\"1\" class=\"dataframe\">\n",
1282 |        "  <thead>\n",
1283 |        "    <tr style=\"text-align: right;\">\n",
1284 |        "      <th></th>\n",
1285 |        "      <th>email</th>\n",
1286 |        "      <th>full_name</th>\n",
1287 |        "      <th>first</th>\n",
1288 |        "      <th>last</th>\n",
1289 |        "    </tr>\n",
1290 |        "  </thead>\n",
1291 |        "  <tbody>\n",
1292 |        "    <tr>\n",
1293 |        "      <th>0</th>\n",
1294 |        "      <td>CoreyMSchafer@gmail.com</td>\n",
1295 |        "      <td>Corey Schafer</td>\n",
1296 |        "      <td>Corey</td>\n",
1297 |        "      <td>Schafer</td>\n",
1298 |        "    </tr>\n",
1299 |        "    <tr>\n",
1300 |        "      <th>1</th>\n",
1301 |        "      <td>JaneDoe@email.com</td>\n",
1302 |        "      <td>Jane Doe</td>\n",
1303 |        "      <td>Jane</td>\n",
1304 |        "      <td>Doe</td>\n",
1305 |        "    </tr>\n",
1306 |        "    <tr>\n",
1307 |        "      <th>2</th>\n",
1308 |        "      <td>JohnDoe@email.com</td>\n",
1309 |        "      <td>John Doe</td>\n",
1310 |        "      <td>John</td>\n",
1311 |        "      <td>Doe</td>\n",
1312 |        "    </tr>\n",
1313 |        "    <tr>\n",
1314 |        "      <th>3</th>\n",
1315 |        "      <td>ironman@avenge.com</td>\n",
1316 |        "      <td>NaN</td>\n",
1317 |        "      <td>Tony</td>\n",
1318 |        "      <td>Stark</td>\n",
1319 |        "    </tr>\n",
1320 |        "    <tr>\n",
1321 |        "      <th>4</th>\n",
1322 |        "      <td>cap@avenge.com</td>\n",
1323 |        "      <td>NaN</td>\n",
1324 |        "      <td>Steve</td>\n",
1325 |        "      <td>Rogers</td>\n",
1326 |        "    </tr>\n",
1327 |        "  </tbody>\n",
1328 |        "</table>\n",
1329 |        "</div>"
1330 |       ],
1331 |       "text/plain": [
1332 |        "                     email      full_name  first     last\n",
1333 |        "0  CoreyMSchafer@gmail.com  Corey Schafer  Corey  Schafer\n",
1334 |        "1        JaneDoe@email.com       Jane Doe   Jane      Doe\n",
1335 |        "2        JohnDoe@email.com       John Doe   John      Doe\n",
1336 |        "3       ironman@avenge.com            NaN   Tony    Stark\n",
1337 |        "4           cap@avenge.com            NaN  Steve   Rogers"
1338 |       ]
1339 |      },
1340 |      "execution_count": 42,
1341 |      "metadata": {},
1342 |      "output_type": "execute_result"
1343 |     }
1344 |    ],
1345 |    "source": [
1346 |     "df"
1347 |    ]
1348 |   },
1349 |   {
1350 |    "cell_type": "markdown",
1351 |    "metadata": {},
1352 |    "source": [
1353 |     "Corey thinks the one-line version is hard to read. Instead, define the filter first and then pass its index to drop:"
1354 |    ]
1355 |   },
1356 |   {
1357 |    "cell_type": "code",
1358 |    "execution_count": 43,
1359 |    "metadata": {},
1360 |    "outputs": [
1361 |     {
1362 |      "data": {
1363 |       "text/html": [
1364 |        "<div>\n",
1365 |        "<style scoped>\n",
1366 |        "    .dataframe tbody tr th:only-of-type {\n",
1367 |        "        vertical-align: middle;\n",
1368 |        "    }\n",
1369 |        "\n",
1370 |        "    .dataframe tbody tr th {\n",
1371 |        "        vertical-align: top;\n",
1372 |        "    }\n",
1373 |        "\n",
1374 |        "    .dataframe thead th {\n",
1375 |        "        text-align: right;\n",
1376 |        "    }\n",
1377 |        "</style>\n",
1378 |        "<table border=\"1\" class=\"dataframe\">\n",
1379 |        "  <thead>\n",
1380 |        "    <tr style=\"text-align: right;\">\n",
1381 |        "      <th></th>\n",
1382 |        "      <th>email</th>\n",
1383 |        "      <th>full_name</th>\n",
1384 |        "      <th>first</th>\n",
1385 |        "      <th>last</th>\n",
1386 |        "    </tr>\n",
1387 |        "  </thead>\n",
1388 |        "  <tbody>\n",
1389 |        "    <tr>\n",
1390 |        "      <th>0</th>\n",
1391 |        "      <td>CoreyMSchafer@gmail.com</td>\n",
1392 |        "      <td>Corey Schafer</td>\n",
1393 |        "      <td>Corey</td>\n",
1394 |        "      <td>Schafer</td>\n",
1395 |        "    </tr>\n",
1396 |        "    <tr>\n",
1397 |        "      <th>3</th>\n",
1398 |        "      <td>ironman@avenge.com</td>\n",
1399 |        "      <td>NaN</td>\n",
1400 |        "      <td>Tony</td>\n",
1401 |        "      <td>Stark</td>\n",
1402 |        "    </tr>\n",
1403 |        "    <tr>\n",
1404 |        "      <th>4</th>\n",
1405 |        "      <td>cap@avenge.com</td>\n",
1406 |        "      <td>NaN</td>\n",
1407 |        "      <td>Steve</td>\n",
1408 |        "      <td>Rogers</td>\n",
1409 |        "    </tr>\n",
1410 |        "  </tbody>\n",
1411 |        "</table>\n",
1412 |        "</div>"
1413 |       ],
1414 |       "text/plain": [
1415 |        "                     email      full_name  first     last\n",
1416 |        "0  CoreyMSchafer@gmail.com  Corey Schafer  Corey  Schafer\n",
1417 |        "3       ironman@avenge.com            NaN   Tony    Stark\n",
1418 |        "4           cap@avenge.com            NaN  Steve   Rogers"
1419 |       ]
1420 |      },
1421 |      "execution_count": 43,
1422 |      "metadata": {},
1423 |      "output_type": "execute_result"
1424 |     }
1425 |    ],
1426 |    "source": [
1427 |     "filt = df['last'] == 'Doe'\n",
1428 |     "df.drop(index=df[filt].index)"
1429 |    ]
1430 |   },
1431 |   {
1432 |    "cell_type": "code",
1433 |    "execution_count": null,
1434 |    "metadata": {},
1435 |    "outputs": [],
1436 |    "source": []
1437 |   }
1438 |  ],
1439 |  "metadata": {
1440 |   "kernelspec": {
1441 |    "display_name": "Python 3",
1442 |    "language": "python",
1443 |    "name": "python3"
1444 |   },
1445 |   "language_info": {
1446 |    "codemirror_mode": {
1447 |     "name": "ipython",
1448 |     "version": 3
1449 |    },
1450 |    "file_extension": ".py",
1451 |    "mimetype": "text/x-python",
1452 |    "name": "python",
1453 |    "nbconvert_exporter": "python",
1454 |    "pygments_lexer": "ipython3",
1455 |    "version": "3.6.9"
1456 |   }
1457 |  },
1458 |  "nbformat": 4,
1459 |  "nbformat_minor": 2
1460 | }
1461 | 


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
 1 | # Pandas Tutorials
 2 | Tutorials on how to use Python pandas from [Corey Schafer](https://github.com/CoreyMSchafer).
 3 | 
 4 | YouTube playlist:
 5 | 
 6 | https://www.youtube.com/playlist?list=PL-osiE80TeTsWmV9i9c58mdDCSskIFdDS
 7 | 
 8 | Code snippets:
 9 | 
10 | https://github.com/CoreyMSchafer/code_snippets/tree/master/Python/Pandas
11 | 
12 | Updating as course progresses.
13 | 
14 | 


--------------------------------------------------------------------------------
/data/ETH_1h.csv.zip:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/plembo/pandas-tutorials/02fdbb8196586bdeec1da9e89a0934c15b44b53d/data/ETH_1h.csv.zip


--------------------------------------------------------------------------------
/data/README_2019.txt:
--------------------------------------------------------------------------------
 1 | The Public 2019 Stack Overflow Developer Survey Results
 2 | 
 3 | Description:
 4 | 
 5 | The enclosed data set is the full, cleaned results of the 2019 Stack Overflow Developer Survey. Free response submissions and personally identifying information have been removed from the results to protect the privacy of respondents. There are three files besides this README:
 6 | 
 7 | 1. survey_results_public.csv - CSV file with main survey results, one respondent per row and one column per answer
 8 | 2. survey_results_schema.csv - CSV file with survey schema, i.e., the questions that correspond to each column name
 9 | 3. so_survey_2019.pdf - PDF file of survey instrument
10 | 
11 | The survey was fielded from January 23 to February 14, 2019. The median time spent on the survey for qualified responses was 23.3 minutes.
12 | 
13 | Respondents were recruited primarily through channels owned by Stack Overflow. The top 5 sources of respondents were onsite messaging, blog posts, email lists, Meta posts, banner ads, and social media posts. Since respondents were recruited in this way, highly engaged users on Stack Overflow were more likely to notice the links for the survey and click to begin it.
14 | 
15 | As an incentive, respondents who finished the survey could opt in to a "Census" badge if they completed the survey.
16 | 
17 | You can find the official published results here:
18 | 
19 | https://insights.stackoverflow.com/survey/2019
20 | 
21 | Find previous survey results here:
22 | 
23 | https://insights.stackoverflow.com/survey
24 | 
25 | Legal:
26 | 
27 | This database - The Public 2019 Stack Overflow Developer Survey Results - is made available under the Open Database License (ODbL): http://opendatacommons.org/licenses/odbl/1.0/. Any rights in individual contents of the database are licensed under the Database Contents License: http://opendatacommons.org/licenses/dbcl/1.0/
28 | 
29 | TLDR: You are free to share, adapt, and create derivative works from The Public 2019 Stack Overflow Developer Survey Results as long as you attribute Stack Overflow, keep the database open (if you redistribute it), and continue to share-alike any adapted database under the ODbl.
30 | 
31 | Acknowledgment:
32 | 
33 | Massive, heartfelt thanks to all Stack Overflow contributors and lurking developers of the world who took part in the survey this year. We value your generous participation more than you know. <3
34 | 


--------------------------------------------------------------------------------
/data/so_survey_2019.pdf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/plembo/pandas-tutorials/02fdbb8196586bdeec1da9e89a0934c15b44b53d/data/so_survey_2019.pdf


--------------------------------------------------------------------------------
/data/survey_results_public.csv.zip:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/plembo/pandas-tutorials/02fdbb8196586bdeec1da9e89a0934c15b44b53d/data/survey_results_public.csv.zip


--------------------------------------------------------------------------------
/data/survey_results_schema.csv:
--------------------------------------------------------------------------------
 1 | Column,QuestionText
 2 | Respondent,Randomized respondent ID number (not in order of survey response time)
 3 | MainBranch,"Which of the following options best describes you today? Here, by ""developer"" we mean ""someone who writes code."""
 4 | Hobbyist,Do you code as a hobby?
 5 | OpenSourcer,How often do you contribute to open source?
 6 | OpenSource,How do you feel about the quality of open source software (OSS)?
 7 | Employment,Which of the following best describes your current employment status?
 8 | Country,In which country do you currently reside?
 9 | Student,"Are you currently enrolled in a formal, degree-granting college or university program?"
10 | EdLevel,Which of the following best describes the highest level of formal education that you’ve completed?
11 | UndergradMajor,What was your main or most important field of study?
12 | EduOther,Which of the following types of non-degree education have you used or participated in? Please select all that apply.
13 | OrgSize,Approximately how many people are employed by the company or organization you work for?
14 | DevType,Which of the following describe you? Please select all that apply.
15 | YearsCode,"Including any education, how many years have you been coding?"
16 | Age1stCode,"At what age did you write your first line of code or program? (E.g., webpage, Hello World, Scratch project)"
17 | YearsCodePro,How many years have you coded professionally (as a part of your work)?
18 | CareerSat,"Overall, how satisfied are you with your career thus far?"
19 | JobSat,"How satisfied are you with your current job? (If you work multiple jobs, answer for the one you spend the most hours on.)"
20 | MgrIdiot,How confident are you that your manager knows what they’re doing?
21 | MgrMoney,Do you believe that you need to be a manager to make more money?
22 | MgrWant,Do you want to become a manager yourself in the future?
23 | JobSeek,Which of the following best describes your current job-seeking status?
24 | LastHireDate,When was the last time that you took a job with a new employer?
25 | LastInt,"In your most recent successful job interview (resulting in a job offer), you were asked to... (check all that apply)"
26 | FizzBuzz,Have you ever been asked to solve FizzBuzz in an interview?
27 | JobFactors,"Imagine that you are deciding between two job offers with the same compensation, benefits, and location. Of the following factors, which 3 are MOST important to you?"
28 | ResumeUpdate,"Think back to the last time you updated your resumé, CV, or an online profile on a job site. What is the PRIMARY reason that you did so?"
29 | CurrencySymbol,"Which currency do you use day-to-day? If your answer is complicated, please pick the one you're most comfortable estimating in."
30 | CurrencyDesc,"Which currency do you use day-to-day? If your answer is complicated, please pick the one you're most comfortable estimating in."
31 | CompTotal,"What is your current total compensation (salary, bonuses, and perks, before taxes and deductions), in `CurrencySymbol`? Please enter a whole number in the box below, without any punctuation. If you are paid hourly, please estimate an equivalent weekly, monthly, or yearly salary. If you prefer not to answer, please leave the box empty."
32 | CompFreq,"Is that compensation weekly, monthly, or yearly?"
33 | ConvertedComp,"Salary converted to annual USD salaries using the exchange rate on 2019-02-01, assuming 12 working months and 50 working weeks."
34 | WorkWeekHrs,"On average, how many hours per week do you work?"
35 | WorkPlan,How structured or planned is your work?
36 | WorkChallenge,"Of these options, what are your greatest challenges to productivity as a developer? Select up to 3:"
37 | WorkRemote,How often do you work remotely?
38 | WorkLoc,Where would you prefer to work?
39 | ImpSyn,"For the specific work you do, and the years of experience you have, how do you rate your own level of competence?"
40 | CodeRev,Do you review code as part of your work?
41 | CodeRevHrs,"On average, how many hours per week do you spend on code review?"
42 | UnitTests,Does your company regularly employ unit tests in the development of their products?
43 | PurchaseHow,"How does your company make decisions about purchasing new technology (cloud, AI, IoT, databases)?"
44 | PurchaseWhat,"What level of influence do you, personally, have over new technology purchases at your organization?"
45 | LanguageWorkedWith,"Which of the following programming, scripting, and markup languages have you done extensive development work in over the past year, and which do you want to work in over the next year?  (If you both worked with the language and want to continue to do so, please check both boxes in that row.)"
46 | LanguageDesireNextYear,"Which of the following programming, scripting, and markup languages have you done extensive development work in over the past year, and which do you want to work in over the next year?  (If you both worked with the language and want to continue to do so, please check both boxes in that row.)"
47 | DatabaseWorkedWith,"Which of the following database environments have you done extensive development work in over the past year, and which do you want to work in over the next year?   (If you both worked with the database and want to continue to do so, please check both boxes in that row.)"
48 | DatabaseDesireNextYear,"Which of the following database environments have you done extensive development work in over the past year, and which do you want to work in over the next year?   (If you both worked with the database and want to continue to do so, please check both boxes in that row.)"
49 | PlatformWorkedWith,"Which of the following platforms have you done extensive development work for over the past year?   (If you both developed for the platform and want to continue to do so, please check both boxes in that row.)"
50 | PlatformDesireNextYear,"Which of the following platforms have you done extensive development work for over the past year?   (If you both developed for the platform and want to continue to do so, please check both boxes in that row.)"
51 | WebFrameWorkedWith,"Which of the following web frameworks have you done extensive development work in over the past year, and which do you want to work in over the next year? (If you both worked with the framework and want to continue to do so, please check both boxes in that row.)"
52 | WebFrameDesireNextYear,"Which of the following web frameworks have you done extensive development work in over the past year, and which do you want to work in over the next year? (If you both worked with the framework and want to continue to do so, please check both boxes in that row.)"
53 | MiscTechWorkedWith,"Which of the following other frameworks, libraries, and tools have you done extensive development work in over the past year, and which do you want to work in over the next year? (If you both worked with the technology and want to continue to do so, please check both boxes in that row.)"
54 | MiscTechDesireNextYear,"Which of the following other frameworks, libraries, and tools have you done extensive development work in over the past year, and which do you want to work in over the next year? (If you both worked with the technology and want to continue to do so, please check both boxes in that row.)"
55 | DevEnviron,Which development environment(s) do you use regularly?  Please check all that apply.
56 | OpSys,What is the primary operating system in which you work?
57 | Containers,"How do you use containers (Docker, Open Container Initiative (OCI), etc.)?"
58 | BlockchainOrg,How is your organization thinking about or implementing blockchain technology?
59 | BlockchainIs,Blockchain / cryptocurrency technology is primarily:
60 | BetterLife,Do you think people born today will have a better life than their parents?
61 | ITperson,"Are you the ""IT support person"" for your family?"
62 | OffOn,Have you tried turning it off and on again?
63 | SocialMedia,What social media site do you use the most?
64 | Extraversion,Do you prefer online chat or IRL conversations?
65 | ScreenName,What do you call it?
66 | SOVisit1st,"To the best of your memory, when did you first visit Stack Overflow?"
67 | SOVisitFreq,How frequently would you say you visit Stack Overflow?
68 | SOVisitTo,I visit Stack Overflow to... (check all that apply)
69 | SOFindAnswer,"On average, how many times a week do you find (and use) an answer on Stack Overflow?"
70 | SOTimeSaved,"Think back to the last time you solved a coding problem using Stack Overflow, as well as the last time you solved a problem using a different resource. Which was faster?"
71 | SOHowMuchTime,"About how much time did you save? If you're not sure, please use your best estimate."
72 | SOAccount,Do you have a Stack Overflow account?
73 | SOPartFreq,"How frequently would you say you participate in Q&A on Stack Overflow? By participate we mean ask, answer, vote for, or comment on questions."
74 | SOJobs,Have you ever used or visited Stack Overflow Jobs?
75 | EntTeams,Have you ever used Stack Overflow for Enterprise or Stack Overflow for Teams?
76 | SOComm,Do you consider yourself a member of the Stack Overflow community?
77 | WelcomeChange,"Compared to last year, how welcome do you feel on Stack Overflow?"
78 | SONewContent,Would you like to see any of the following on Stack Overflow? Check all that apply.
79 | Age,"What is your age (in years)? If you prefer not to answer, you may leave this question blank."
80 | Gender,"Which of the following do you currently identify as? Please select all that apply. If you prefer not to answer, you may leave this question blank."
81 | Trans,Do you identify as transgender?
82 | Sexuality,"Which of the following do you currently identify as? Please select all that apply. If you prefer not to answer, you may leave this question blank."
83 | Ethnicity,"Which of the following do you identify as? Please check all that apply. If you prefer not to answer, you may leave this question blank."
84 | Dependents,"Do you have any dependents (e.g., children, elders, or others) that you care for?"
85 | SurveyLength,How do you feel about the length of the survey this year?
86 | SurveyEase,How easy or difficult was this survey to complete?
87 | 


--------------------------------------------------------------------------------
/data/survey_results_schema.csv.zip:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/plembo/pandas-tutorials/02fdbb8196586bdeec1da9e89a0934c15b44b53d/data/survey_results_schema.csv.zip


--------------------------------------------------------------------------------
/requirements.txt:
--------------------------------------------------------------------------------
1 | numpy
2 | matplotlib
3 | pandas
4 | sqlalchemy
5 | psycopg2
6 | 


--------------------------------------------------------------------------------