├── Bar Chart Race - Dica Pandas #7.ipynb ├── Conversao de Colunas Pandas - Dicas Pandas #1 .ipynb ├── Dica_da_Pandas_Selecionando_dados_com_Pandas.ipynb ├── Dica_de_Pandas_Conversao_Strings.ipynb ├── Dica_de_Pandas_Rolling.ipynb ├── Estilos - Dicas Pandas #5.ipynb ├── Filtrando e Exportando para CSV os dados do ENEM por Estado Brasileiro.ipynb ├── Gráficos fofos em Python.ipynb ├── Importando_arquivo_zip_no_Pandas_Plotly_Backend_Dica_de_Pandas_8.ipynb ├── Modificando colunas do DataFrame - Dicas Pandas #2.ipynb ├── Ordenando o describe( ) - Dicas Pandas #3.ipynb ├── Os DataFrames são iguais? - Dicas Pandas #4.ipynb ├── Pandas_Categorical_Dtype_Dica_de_Pandas_11.ipynb ├── Pandas_do_ZERO_à_Análise_de_Dados.ipynb ├── README.md ├── Variáveis categóricas - Dica Pandas #6.ipynb └── dados ├── HIST_PAINEL_COVIDBR_12jun2020.xlsx ├── TA_PRECO_MEDICAMENTO_GOV.csv ├── arquivo_geral.csv └── bcdata-dolar-2023.csv /Dica_de_Pandas_Rolling.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "nbformat": 4, 3 | "nbformat_minor": 0, 4 | "metadata": { 5 | "colab": { 6 | "provenance": [], 7 | "authorship_tag": "ABX9TyNHD9BPR6KkmU2mKfd5W6Dm", 8 | "include_colab_link": true 9 | }, 10 | "kernelspec": { 11 | "name": "python3", 12 | "display_name": "Python 3" 13 | }, 14 | "language_info": { 15 | "name": "python" 16 | } 17 | }, 18 | "cells": [ 19 | { 20 | "cell_type": "markdown", 21 | "metadata": { 22 | "id": "view-in-github", 23 | "colab_type": "text" 24 | }, 25 | "source": [ 26 | "\"Open" 27 | ] 28 | }, 29 | { 30 | "cell_type": "code", 31 | "source": [ 32 | "import pandas as pd\n", 33 | "import numpy as np\n", 34 | "import random" 35 | ], 36 | "metadata": { 37 | "id": "l0yQRRnl7mZY" 38 | }, 39 | "execution_count": 63, 40 | "outputs": [] 41 | }, 42 | { 43 | "cell_type": "code", 44 | "execution_count": 66, 45 | "metadata": { 46 | "id": "8recwtAe7lMK" 47 | }, 48 | "outputs": [], 49 | "source": [ 50 | "data = []\n", 51 | "date_range = 
pd.date_range(\"01/01/2022\", \"01/07/2023\")\n", 52 | "\n", 53 | "for i in range(len(date_range)):\n", 54 | "\n", 55 | " sales_cash = random.randint(1, 10)\n", 56 | " sales_card = random.randint(1, 10)\n", 57 | "\n", 58 | " day_type = \"Dia da Semana\"\n", 59 | "\n", 60 | " if date_range[i].weekday()>4:\n", 61 | " day_type = \"Final de Semana\"\n", 62 | "\n", 63 | " data.append([str(date_range[i].date()), day_type, \"Dinheiro\", sales_cash])\n", 64 | " data.append([str(date_range[i].date()), day_type, \"Cartão\", sales_card])\n", 65 | "\n", 66 | "data = pd.DataFrame(data, columns=[\"Data\", \"Tipo_Dia\", \"Tipo_Pagamento\", \"Vendas\"])\n", 67 | "data[\"Data\"] = pd.to_datetime(data[\"Data\"])" 68 | ] 69 | }, 70 | { 71 | "cell_type": "code", 72 | "source": [ 73 | "data" 74 | ], 75 | "metadata": { 76 | "colab": { 77 | "base_uri": "https://localhost:8080/", 78 | "height": 423 79 | }, 80 | "id": "2cEOk0218GUJ", 81 | "outputId": "c244839d-7c96-4ee5-fdeb-d02253348f47" 82 | }, 83 | "execution_count": 67, 84 | "outputs": [ 85 | { 86 | "output_type": "execute_result", 87 | "data": { 88 | "text/plain": [ 89 | " Data Tipo_Dia Tipo_Pagamento Vendas\n", 90 | "0 2022-01-01 Final de Semana Dinheiro 9\n", 91 | "1 2022-01-01 Final de Semana Cartão 8\n", 92 | "2 2022-01-02 Final de Semana Dinheiro 6\n", 93 | "3 2022-01-02 Final de Semana Cartão 7\n", 94 | "4 2022-01-03 Dia da Semana Dinheiro 7\n", 95 | ".. ... ... ... ...\n", 96 | "739 2023-01-05 Dia da Semana Cartão 3\n", 97 | "740 2023-01-06 Dia da Semana Dinheiro 2\n", 98 | "741 2023-01-06 Dia da Semana Cartão 9\n", 99 | "742 2023-01-07 Final de Semana Dinheiro 5\n", 100 | "743 2023-01-07 Final de Semana Cartão 9\n", 101 | "\n", 102 | "[744 rows x 4 columns]" 103 | ], 104 | "text/html": [ 105 | "\n", 106 | "
\n", 107 | "
\n", 108 | "\n", 121 | "\n", 122 | " \n", 123 | " \n", 124 | " \n", 125 | " \n", 126 | " \n", 127 | " \n", 128 | " \n", 129 | " \n", 130 | " \n", 131 | " \n", 132 | " \n", 133 | " \n", 134 | " \n", 135 | " \n", 136 | " \n", 137 | " \n", 138 | " \n", 139 | " \n", 140 | " \n", 141 | " \n", 142 | " \n", 143 | " \n", 144 | " \n", 145 | " \n", 146 | " \n", 147 | " \n", 148 | " \n", 149 | " \n", 150 | " \n", 151 | " \n", 152 | " \n", 153 | " \n", 154 | " \n", 155 | " \n", 156 | " \n", 157 | " \n", 158 | " \n", 159 | " \n", 160 | " \n", 161 | " \n", 162 | " \n", 163 | " \n", 164 | " \n", 165 | " \n", 166 | " \n", 167 | " \n", 168 | " \n", 169 | " \n", 170 | " \n", 171 | " \n", 172 | " \n", 173 | " \n", 174 | " \n", 175 | " \n", 176 | " \n", 177 | " \n", 178 | " \n", 179 | " \n", 180 | " \n", 181 | " \n", 182 | " \n", 183 | " \n", 184 | " \n", 185 | " \n", 186 | " \n", 187 | " \n", 188 | " \n", 189 | " \n", 190 | " \n", 191 | " \n", 192 | " \n", 193 | " \n", 194 | " \n", 195 | " \n", 196 | " \n", 197 | " \n", 198 | " \n", 199 | " \n", 200 | " \n", 201 | " \n", 202 | " \n", 203 | " \n", 204 | " \n", 205 | " \n", 206 | " \n", 207 | " \n", 208 | " \n", 209 | " \n", 210 | "
DataTipo_DiaTipo_PagamentoVendas
02022-01-01Final de SemanaDinheiro9
12022-01-01Final de SemanaCartão8
22022-01-02Final de SemanaDinheiro6
32022-01-02Final de SemanaCartão7
42022-01-03Dia da SemanaDinheiro7
...............
7392023-01-05Dia da SemanaCartão3
7402023-01-06Dia da SemanaDinheiro2
7412023-01-06Dia da SemanaCartão9
7422023-01-07Final de SemanaDinheiro5
7432023-01-07Final de SemanaCartão9
\n", 211 | "

744 rows × 4 columns

\n", 212 | "
\n", 213 | "
\n", 214 | "\n", 215 | "
\n", 216 | " \n", 224 | "\n", 225 | " \n", 265 | "\n", 266 | " \n", 290 | "
\n", 291 | "\n", 292 | "\n", 293 | "
\n", 294 | " \n", 305 | "\n", 306 | "\n", 337 | "\n", 338 | " \n", 350 | "
\n", 351 | "
\n", 352 | "
\n" 353 | ] 354 | }, 355 | "metadata": {}, 356 | "execution_count": 67 357 | } 358 | ] 359 | }, 360 | { 361 | "cell_type": "code", 362 | "source": [ 363 | "data['roll_soma_win2'] = data.rolling(window=2).Vendas.sum()" 364 | ], 365 | "metadata": { 366 | "id": "zdK2XNBFSohC" 367 | }, 368 | "execution_count": 68, 369 | "outputs": [] 370 | }, 371 | { 372 | "cell_type": "code", 373 | "source": [ 374 | "data['roll_avg_win3'] = data.rolling(window=3).Vendas.mean()" 375 | ], 376 | "metadata": { 377 | "id": "73PwmrlfTHPD" 378 | }, 379 | "execution_count": 73, 380 | "outputs": [] 381 | }, 382 | { 383 | "cell_type": "code", 384 | "source": [ 385 | "data.drop(columns='roll_max_win2d', errors='ignore', inplace=True)" 386 | ], 387 | "metadata": { 388 | "id": "SKwi3yhBTj8o" 389 | }, 390 | "execution_count": 81, 391 | "outputs": [] 392 | }, 393 | { 394 | "cell_type": "code", 395 | "source": [ 396 | "data['roll_max_win2'] = data.rolling(window=2).Vendas.max()" 397 | ], 398 | "metadata": { 399 | "id": "ix0F0N_PTO8S" 400 | }, 401 | "execution_count": 74, 402 | "outputs": [] 403 | }, 404 | { 405 | "cell_type": "code", 406 | "source": [ 407 | "data['roll_soma_win2d'] = data.rolling(window='7d', on='Data').Vendas.sum()" 408 | ], 409 | "metadata": { 410 | "id": "b0TTIx77TyB2" 411 | }, 412 | "execution_count": 83, 413 | "outputs": [] 414 | }, 415 | { 416 | "cell_type": "code", 417 | "source": [ 418 | "data.info()" 419 | ], 420 | "metadata": { 421 | "colab": { 422 | "base_uri": "https://localhost:8080/" 423 | }, 424 | "id": "lrKwrwZiT0XH", 425 | "outputId": "30dd4cb0-115b-4205-b430-fc014a4f5722" 426 | }, 427 | "execution_count": 78, 428 | "outputs": [ 429 | { 430 | "output_type": "stream", 431 | "name": "stdout", 432 | "text": [ 433 | "\n", 434 | "RangeIndex: 744 entries, 0 to 743\n", 435 | "Data columns (total 7 columns):\n", 436 | " # Column Non-Null Count Dtype \n", 437 | "--- ------ -------------- ----- \n", 438 | " 0 Data 744 non-null datetime64[ns]\n", 439 | " 1 Tipo_Dia 744 non-null object \n", 440 
| " 2 Tipo_Pagamento 744 non-null object \n", 441 | " 3 Vendas 744 non-null int64 \n", 442 | " 4 roll_soma_win2 743 non-null float64 \n", 443 | " 5 roll_avg_win3 742 non-null float64 \n", 444 | " 6 roll_max_win2 743 non-null float64 \n", 445 | "dtypes: datetime64[ns](1), float64(3), int64(1), object(2)\n", 446 | "memory usage: 40.8+ KB\n" 447 | ] 448 | } 449 | ] 450 | }, 451 | { 452 | "cell_type": "code", 453 | "source": [ 454 | "data" 455 | ], 456 | "metadata": { 457 | "colab": { 458 | "base_uri": "https://localhost:8080/", 459 | "height": 423 460 | }, 461 | "id": "zJLYSUssSojb", 462 | "outputId": "1d43541f-1f72-4ffd-c3e4-875b86889ffa" 463 | }, 464 | "execution_count": 84, 465 | "outputs": [ 466 | { 467 | "output_type": "execute_result", 468 | "data": { 469 | "text/plain": [ 470 | " Data Tipo_Dia Tipo_Pagamento Vendas roll_soma_win2 \\\n", 471 | "0 2022-01-01 Final de Semana Dinheiro 9 NaN \n", 472 | "1 2022-01-01 Final de Semana Cartão 8 17.0 \n", 473 | "2 2022-01-02 Final de Semana Dinheiro 6 14.0 \n", 474 | "3 2022-01-02 Final de Semana Cartão 7 13.0 \n", 475 | "4 2022-01-03 Dia da Semana Dinheiro 7 14.0 \n", 476 | ".. ... ... ... ... ... \n", 477 | "739 2023-01-05 Dia da Semana Cartão 3 9.0 \n", 478 | "740 2023-01-06 Dia da Semana Dinheiro 2 5.0 \n", 479 | "741 2023-01-06 Dia da Semana Cartão 9 11.0 \n", 480 | "742 2023-01-07 Final de Semana Dinheiro 5 14.0 \n", 481 | "743 2023-01-07 Final de Semana Cartão 9 14.0 \n", 482 | "\n", 483 | " roll_avg_win3 roll_max_win2 roll_soma_win2d \n", 484 | "0 NaN NaN 9.0 \n", 485 | "1 NaN 9.0 17.0 \n", 486 | "2 7.666667 8.0 23.0 \n", 487 | "3 7.000000 7.0 30.0 \n", 488 | "4 6.666667 7.0 37.0 \n", 489 | ".. ... ... ... \n", 490 | "739 4.333333 6.0 64.0 \n", 491 | "740 3.666667 3.0 54.0 \n", 492 | "741 4.666667 9.0 63.0 \n", 493 | "742 5.333333 9.0 61.0 \n", 494 | "743 7.666667 9.0 70.0 \n", 495 | "\n", 496 | "[744 rows x 8 columns]" 497 | ], 498 | "text/html": [ 499 | "\n", 500 | "
\n", 501 | "
\n", 502 | "\n", 515 | "\n", 516 | " \n", 517 | " \n", 518 | " \n", 519 | " \n", 520 | " \n", 521 | " \n", 522 | " \n", 523 | " \n", 524 | " \n", 525 | " \n", 526 | " \n", 527 | " \n", 528 | " \n", 529 | " \n", 530 | " \n", 531 | " \n", 532 | " \n", 533 | " \n", 534 | " \n", 535 | " \n", 536 | " \n", 537 | " \n", 538 | " \n", 539 | " \n", 540 | " \n", 541 | " \n", 542 | " \n", 543 | " \n", 544 | " \n", 545 | " \n", 546 | " \n", 547 | " \n", 548 | " \n", 549 | " \n", 550 | " \n", 551 | " \n", 552 | " \n", 553 | " \n", 554 | " \n", 555 | " \n", 556 | " \n", 557 | " \n", 558 | " \n", 559 | " \n", 560 | " \n", 561 | " \n", 562 | " \n", 563 | " \n", 564 | " \n", 565 | " \n", 566 | " \n", 567 | " \n", 568 | " \n", 569 | " \n", 570 | " \n", 571 | " \n", 572 | " \n", 573 | " \n", 574 | " \n", 575 | " \n", 576 | " \n", 577 | " \n", 578 | " \n", 579 | " \n", 580 | " \n", 581 | " \n", 582 | " \n", 583 | " \n", 584 | " \n", 585 | " \n", 586 | " \n", 587 | " \n", 588 | " \n", 589 | " \n", 590 | " \n", 591 | " \n", 592 | " \n", 593 | " \n", 594 | " \n", 595 | " \n", 596 | " \n", 597 | " \n", 598 | " \n", 599 | " \n", 600 | " \n", 601 | " \n", 602 | " \n", 603 | " \n", 604 | " \n", 605 | " \n", 606 | " \n", 607 | " \n", 608 | " \n", 609 | " \n", 610 | " \n", 611 | " \n", 612 | " \n", 613 | " \n", 614 | " \n", 615 | " \n", 616 | " \n", 617 | " \n", 618 | " \n", 619 | " \n", 620 | " \n", 621 | " \n", 622 | " \n", 623 | " \n", 624 | " \n", 625 | " \n", 626 | " \n", 627 | " \n", 628 | " \n", 629 | " \n", 630 | " \n", 631 | " \n", 632 | " \n", 633 | " \n", 634 | " \n", 635 | " \n", 636 | " \n", 637 | " \n", 638 | " \n", 639 | " \n", 640 | " \n", 641 | " \n", 642 | " \n", 643 | " \n", 644 | " \n", 645 | " \n", 646 | " \n", 647 | " \n", 648 | " \n", 649 | " \n", 650 | " \n", 651 | " \n", 652 | "
DataTipo_DiaTipo_PagamentoVendasroll_soma_win2roll_avg_win3roll_max_win2roll_soma_win2d
02022-01-01Final de SemanaDinheiro9NaNNaNNaN9.0
12022-01-01Final de SemanaCartão817.0NaN9.017.0
22022-01-02Final de SemanaDinheiro614.07.6666678.023.0
32022-01-02Final de SemanaCartão713.07.0000007.030.0
42022-01-03Dia da SemanaDinheiro714.06.6666677.037.0
...........................
7392023-01-05Dia da SemanaCartão39.04.3333336.064.0
7402023-01-06Dia da SemanaDinheiro25.03.6666673.054.0
7412023-01-06Dia da SemanaCartão911.04.6666679.063.0
7422023-01-07Final de SemanaDinheiro514.05.3333339.061.0
7432023-01-07Final de SemanaCartão914.07.6666679.070.0
\n", 653 | "

744 rows × 8 columns

\n", 654 | "
\n", 655 | "
\n", 656 | "\n", 657 | "
\n", 658 | " \n", 666 | "\n", 667 | " \n", 707 | "\n", 708 | " \n", 732 | "
\n", 733 | "\n", 734 | "\n", 735 | "
\n", 736 | " \n", 747 | "\n", 748 | "\n", 779 | "\n", 780 | " \n", 792 | "
\n", 793 | "
\n", 794 | "
\n" 795 | ] 796 | }, 797 | "metadata": {}, 798 | "execution_count": 84 799 | } 800 | ] 801 | } 802 | ] 803 | } -------------------------------------------------------------------------------- /Gráficos fofos em Python.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "code", 5 | "execution_count": 1, 6 | "metadata": {}, 7 | "outputs": [ 8 | { 9 | "name": "stdout", 10 | "output_type": "stream", 11 | "text": [ 12 | "Requirement already satisfied: cutecharts in /Users/kizzyterra/Workspace/machine-learning/venv-ml/lib/python3.7/site-packages (1.2.0)\n", 13 | "Requirement already satisfied: jinja2 in /Users/kizzyterra/Workspace/machine-learning/venv-ml/lib/python3.7/site-packages (from cutecharts) (2.10.3)\n", 14 | "Requirement already satisfied: MarkupSafe>=0.23 in /Users/kizzyterra/Workspace/machine-learning/venv-ml/lib/python3.7/site-packages (from jinja2->cutecharts) (1.1.1)\n" 15 | ] 16 | } 17 | ], 18 | "source": [ 19 | "!pip install cutecharts" 20 | ] 21 | }, 22 | { 23 | "cell_type": "code", 24 | "execution_count": 35, 25 | "metadata": {}, 26 | "outputs": [], 27 | "source": [ 28 | "import pandas as pd\n", 29 | "import cutecharts.charts as ctc" 30 | ] 31 | }, 32 | { 33 | "cell_type": "code", 34 | "execution_count": 22, 35 | "metadata": {}, 36 | "outputs": [], 37 | "source": [ 38 | "microdados_enem_rj = pd.read_csv('../dados/microdados_enem_ufs_2019/microdados_enem_RJ_2019.csv', index_col=0)" 39 | ] 40 | }, 41 | { 42 | "cell_type": "code", 43 | "execution_count": 23, 44 | "metadata": {}, 45 | "outputs": [ 46 | { 47 | "data": { 48 | "text/html": [ 49 | "
\n", 50 | "\n", 63 | "\n", 64 | " \n", 65 | " \n", 66 | " \n", 67 | " \n", 68 | " \n", 69 | " \n", 70 | " \n", 71 | " \n", 72 | " \n", 73 | " \n", 74 | " \n", 75 | " \n", 76 | " \n", 77 | " \n", 78 | " \n", 79 | " \n", 80 | " \n", 81 | " \n", 82 | " \n", 83 | " \n", 84 | " \n", 85 | " \n", 86 | " \n", 87 | " \n", 88 | " \n", 89 | " \n", 90 | " \n", 91 | " \n", 92 | " \n", 93 | " \n", 94 | " \n", 95 | " \n", 96 | " \n", 97 | " \n", 98 | " \n", 99 | " \n", 100 | " \n", 101 | " \n", 102 | " \n", 103 | " \n", 104 | " \n", 105 | " \n", 106 | " \n", 107 | " \n", 108 | " \n", 109 | " \n", 110 | " \n", 111 | " \n", 112 | " \n", 113 | " \n", 114 | " \n", 115 | " \n", 116 | " \n", 117 | " \n", 118 | " \n", 119 | " \n", 120 | " \n", 121 | " \n", 122 | " \n", 123 | " \n", 124 | " \n", 125 | " \n", 126 | " \n", 127 | " \n", 128 | " \n", 129 | " \n", 130 | " \n", 131 | " \n", 132 | " \n", 133 | " \n", 134 | " \n", 135 | " \n", 136 | " \n", 137 | " \n", 138 | " \n", 139 | " \n", 140 | " \n", 141 | " \n", 142 | " \n", 143 | " \n", 144 | " \n", 145 | " \n", 146 | " \n", 147 | " \n", 148 | " \n", 149 | " \n", 150 | " \n", 151 | " \n", 152 | " \n", 153 | " \n", 154 | " \n", 155 | " \n", 156 | " \n", 157 | " \n", 158 | " \n", 159 | " \n", 160 | " \n", 161 | " \n", 162 | " \n", 163 | " \n", 164 | " \n", 165 | " \n", 166 | " \n", 167 | " \n", 168 | " \n", 169 | " \n", 170 | " \n", 171 | " \n", 172 | " \n", 173 | " \n", 174 | " \n", 175 | " \n", 176 | " \n", 177 | " \n", 178 | " \n", 179 | " \n", 180 | " \n", 181 | " \n", 182 | " \n", 183 | " \n", 184 | " \n", 185 | " \n", 186 | " \n", 187 | " \n", 188 | " \n", 189 | " \n", 190 | " \n", 191 | " \n", 192 | " \n", 193 | " \n", 194 | " \n", 195 | " \n", 196 | " \n", 197 | " \n", 198 | " \n", 199 | " \n", 200 | " \n", 201 | " \n", 202 | " \n", 203 | " \n", 204 | " \n", 205 | " \n", 206 | " \n", 207 | " \n", 208 | " \n", 209 | " \n", 210 | " \n", 211 | " \n", 212 | "
NU_INSCRICAONU_ANOCO_MUNICIPIO_RESIDENCIANO_MUNICIPIO_RESIDENCIACO_UF_RESIDENCIASG_UF_RESIDENCIANU_IDADETP_SEXOTP_ESTADO_CIVILTP_COR_RACA...Q016Q017Q018Q019Q020Q021Q022Q023Q024Q025
1060019000101522720193302056Italva33RJ32F13...AAABBABAAA
2107419000102570220193305109São João de Meriti33RJ32M13...AAABAABAAA
2265719000102728520193304557Rio de Janeiro33RJ26M13...BAABAABABB
3036519000103499320193304557Rio de Janeiro33RJ19F13...AAAAAABAAB
6093719000106556620193304557Rio de Janeiro33RJ22F13...AAABBACAAA
\n", 213 | "

5 rows × 136 columns

\n", 214 | "
" 215 | ], 216 | "text/plain": [ 217 | " NU_INSCRICAO NU_ANO CO_MUNICIPIO_RESIDENCIA NO_MUNICIPIO_RESIDENCIA \\\n", 218 | "10600 190001015227 2019 3302056 Italva \n", 219 | "21074 190001025702 2019 3305109 São João de Meriti \n", 220 | "22657 190001027285 2019 3304557 Rio de Janeiro \n", 221 | "30365 190001034993 2019 3304557 Rio de Janeiro \n", 222 | "60937 190001065566 2019 3304557 Rio de Janeiro \n", 223 | "\n", 224 | " CO_UF_RESIDENCIA SG_UF_RESIDENCIA NU_IDADE TP_SEXO TP_ESTADO_CIVIL \\\n", 225 | "10600 33 RJ 32 F 1 \n", 226 | "21074 33 RJ 32 M 1 \n", 227 | "22657 33 RJ 26 M 1 \n", 228 | "30365 33 RJ 19 F 1 \n", 229 | "60937 33 RJ 22 F 1 \n", 230 | "\n", 231 | " TP_COR_RACA ... Q016 Q017 Q018 Q019 Q020 Q021 Q022 Q023 Q024 \\\n", 232 | "10600 3 ... A A A B B A B A A \n", 233 | "21074 3 ... A A A B A A B A A \n", 234 | "22657 3 ... B A A B A A B A B \n", 235 | "30365 3 ... A A A A A A B A A \n", 236 | "60937 3 ... A A A B B A C A A \n", 237 | "\n", 238 | " Q025 \n", 239 | "10600 A \n", 240 | "21074 A \n", 241 | "22657 B \n", 242 | "30365 B \n", 243 | "60937 A \n", 244 | "\n", 245 | "[5 rows x 136 columns]" 246 | ] 247 | }, 248 | "execution_count": 23, 249 | "metadata": {}, 250 | "output_type": "execute_result" 251 | } 252 | ], 253 | "source": [ 254 | "microdados_enem_rj.head()" 255 | ] 256 | }, 257 | { 258 | "cell_type": "code", 259 | "execution_count": 24, 260 | "metadata": {}, 261 | "outputs": [], 262 | "source": [ 263 | "microdados_enem_rj.reset_index(inplace=True,drop=True)" 264 | ] 265 | }, 266 | { 267 | "cell_type": "code", 268 | "execution_count": 25, 269 | "metadata": { 270 | "scrolled": true 271 | }, 272 | "outputs": [ 273 | { 274 | "data": { 275 | "text/html": [ 276 | "
\n", 277 | "\n", 290 | "\n", 291 | " \n", 292 | " \n", 293 | " \n", 294 | " \n", 295 | " \n", 296 | " \n", 297 | " \n", 298 | " \n", 299 | " \n", 300 | " \n", 301 | " \n", 302 | " \n", 303 | " \n", 304 | " \n", 305 | " \n", 306 | " \n", 307 | " \n", 308 | " \n", 309 | " \n", 310 | " \n", 311 | " \n", 312 | " \n", 313 | " \n", 314 | " \n", 315 | " \n", 316 | " \n", 317 | " \n", 318 | " \n", 319 | " \n", 320 | " \n", 321 | " \n", 322 | " \n", 323 | " \n", 324 | " \n", 325 | " \n", 326 | " \n", 327 | " \n", 328 | " \n", 329 | " \n", 330 | " \n", 331 | " \n", 332 | " \n", 333 | " \n", 334 | " \n", 335 | " \n", 336 | " \n", 337 | " \n", 338 | " \n", 339 | " \n", 340 | " \n", 341 | " \n", 342 | " \n", 343 | " \n", 344 | " \n", 345 | " \n", 346 | " \n", 347 | " \n", 348 | " \n", 349 | " \n", 350 | " \n", 351 | " \n", 352 | " \n", 353 | " \n", 354 | " \n", 355 | " \n", 356 | " \n", 357 | " \n", 358 | " \n", 359 | " \n", 360 | " \n", 361 | " \n", 362 | " \n", 363 | " \n", 364 | " \n", 365 | " \n", 366 | " \n", 367 | " \n", 368 | " \n", 369 | " \n", 370 | " \n", 371 | " \n", 372 | " \n", 373 | " \n", 374 | " \n", 375 | " \n", 376 | " \n", 377 | " \n", 378 | " \n", 379 | " \n", 380 | " \n", 381 | " \n", 382 | " \n", 383 | " \n", 384 | " \n", 385 | " \n", 386 | " \n", 387 | " \n", 388 | " \n", 389 | " \n", 390 | " \n", 391 | " \n", 392 | " \n", 393 | " \n", 394 | " \n", 395 | " \n", 396 | " \n", 397 | " \n", 398 | " \n", 399 | " \n", 400 | " \n", 401 | " \n", 402 | " \n", 403 | " \n", 404 | " \n", 405 | " \n", 406 | " \n", 407 | " \n", 408 | " \n", 409 | " \n", 410 | " \n", 411 | " \n", 412 | " \n", 413 | " \n", 414 | " \n", 415 | " \n", 416 | " \n", 417 | " \n", 418 | " \n", 419 | " \n", 420 | " \n", 421 | " \n", 422 | " \n", 423 | " \n", 424 | " \n", 425 | " \n", 426 | " \n", 427 | " \n", 428 | " \n", 429 | " \n", 430 | " \n", 431 | " \n", 432 | " \n", 433 | " \n", 434 | " \n", 435 | " \n", 436 | " \n", 437 | " \n", 438 | " \n", 439 | " \n", 440 | " \n", 441 | " \n", 442 | " 
\n", 443 | " \n", 444 | " \n", 445 | " \n", 446 | " \n", 447 | " \n", 448 | " \n", 449 | " \n", 450 | " \n", 451 | " \n", 452 | " \n", 453 | " \n", 454 | " \n", 455 | " \n", 456 | " \n", 457 | " \n", 458 | " \n", 459 | " \n", 460 | " \n", 461 | " \n", 462 | " \n", 463 | " \n", 464 | " \n", 465 | " \n", 466 | " \n", 467 | " \n", 468 | " \n", 469 | " \n", 470 | " \n", 471 | " \n", 472 | " \n", 473 | " \n", 474 | " \n", 475 | " \n", 476 | " \n", 477 | " \n", 478 | " \n", 479 | " \n", 480 | " \n", 481 | " \n", 482 | " \n", 483 | " \n", 484 | " \n", 485 | " \n", 486 | " \n", 487 | " \n", 488 | " \n", 489 | " \n", 490 | " \n", 491 | " \n", 492 | " \n", 493 | " \n", 494 | " \n", 495 | " \n", 496 | " \n", 497 | " \n", 498 | " \n", 499 | " \n", 500 | " \n", 501 | " \n", 502 | " \n", 503 | " \n", 504 | " \n", 505 | " \n", 506 | " \n", 507 | " \n", 508 | " \n", 509 | " \n", 510 | " \n", 511 | " \n", 512 | " \n", 513 | " \n", 514 | " \n", 515 | " \n", 516 | " \n", 517 | " \n", 518 | " \n", 519 | " \n", 520 | " \n", 521 | " \n", 522 | " \n", 523 | " \n", 524 | " \n", 525 | " \n", 526 | " \n", 527 | " \n", 528 | " \n", 529 | " \n", 530 | " \n", 531 | " \n", 532 | " \n", 533 | " \n", 534 | " \n", 535 | " \n", 536 | " \n", 537 | " \n", 538 | " \n", 539 | " \n", 540 | " \n", 541 | " \n", 542 | " \n", 543 | " \n", 544 | " \n", 545 | " \n", 546 | " \n", 547 | " \n", 548 | " \n", 549 | " \n", 550 | " \n", 551 | " \n", 552 | " \n", 553 | " \n", 554 | " \n", 555 | " \n", 556 | " \n", 557 | " \n", 558 | " \n", 559 | " \n", 560 | " \n", 561 | " \n", 562 | " \n", 563 | " \n", 564 | " \n", 565 | " \n", 566 | " \n", 567 | " \n", 568 | " \n", 569 | " \n", 570 | " \n", 571 | " \n", 572 | " \n", 573 | " \n", 574 | " \n", 575 | " \n", 576 | " \n", 577 | " \n", 578 | " \n", 579 | " \n", 580 | " \n", 581 | " \n", 582 | " \n", 583 | "
NU_INSCRICAONU_ANOCO_MUNICIPIO_RESIDENCIANO_MUNICIPIO_RESIDENCIACO_UF_RESIDENCIASG_UF_RESIDENCIANU_IDADETP_SEXOTP_ESTADO_CIVILTP_COR_RACA...Q016Q017Q018Q019Q020Q021Q022Q023Q024Q025
019000101522720193302056Italva33RJ32F13...AAABBABAAA
119000102570220193305109São João de Meriti33RJ32M13...AAABAABAAA
219000102728520193304557Rio de Janeiro33RJ26M13...BAABAABABB
319000103499320193304557Rio de Janeiro33RJ19F13...AAAAAABAAB
419000106556620193304557Rio de Janeiro33RJ22F13...AAABBACAAA
..................................................................
33870519000611889520193304557Rio de Janeiro33RJ18F03...BABDABEBAB
33870619000611889620193305109São João de Meriti33RJ52F23...AAABAABBAA
33870719000611889720193304557Rio de Janeiro33RJ23F11...BAADBBEABB
33870819000611889820193300308Barra do Piraí33RJ32F12...AAABBABAAA
33870919000611889920193304904São Gonçalo33RJ41F03...BAABAACABB
\n", 584 | "

338710 rows × 136 columns

\n", 585 | "
" 586 | ], 587 | "text/plain": [ 588 | " NU_INSCRICAO NU_ANO CO_MUNICIPIO_RESIDENCIA NO_MUNICIPIO_RESIDENCIA \\\n", 589 | "0 190001015227 2019 3302056 Italva \n", 590 | "1 190001025702 2019 3305109 São João de Meriti \n", 591 | "2 190001027285 2019 3304557 Rio de Janeiro \n", 592 | "3 190001034993 2019 3304557 Rio de Janeiro \n", 593 | "4 190001065566 2019 3304557 Rio de Janeiro \n", 594 | "... ... ... ... ... \n", 595 | "338705 190006118895 2019 3304557 Rio de Janeiro \n", 596 | "338706 190006118896 2019 3305109 São João de Meriti \n", 597 | "338707 190006118897 2019 3304557 Rio de Janeiro \n", 598 | "338708 190006118898 2019 3300308 Barra do Piraí \n", 599 | "338709 190006118899 2019 3304904 São Gonçalo \n", 600 | "\n", 601 | " CO_UF_RESIDENCIA SG_UF_RESIDENCIA NU_IDADE TP_SEXO TP_ESTADO_CIVIL \\\n", 602 | "0 33 RJ 32 F 1 \n", 603 | "1 33 RJ 32 M 1 \n", 604 | "2 33 RJ 26 M 1 \n", 605 | "3 33 RJ 19 F 1 \n", 606 | "4 33 RJ 22 F 1 \n", 607 | "... ... ... ... ... ... \n", 608 | "338705 33 RJ 18 F 0 \n", 609 | "338706 33 RJ 52 F 2 \n", 610 | "338707 33 RJ 23 F 1 \n", 611 | "338708 33 RJ 32 F 1 \n", 612 | "338709 33 RJ 41 F 0 \n", 613 | "\n", 614 | " TP_COR_RACA ... Q016 Q017 Q018 Q019 Q020 Q021 Q022 Q023 Q024 \\\n", 615 | "0 3 ... A A A B B A B A A \n", 616 | "1 3 ... A A A B A A B A A \n", 617 | "2 3 ... B A A B A A B A B \n", 618 | "3 3 ... A A A A A A B A A \n", 619 | "4 3 ... A A A B B A C A A \n", 620 | "... ... ... ... ... ... ... ... ... ... ... ... \n", 621 | "338705 3 ... B A B D A B E B A \n", 622 | "338706 3 ... A A A B A A B B A \n", 623 | "338707 1 ... B A A D B B E A B \n", 624 | "338708 2 ... A A A B B A B A A \n", 625 | "338709 3 ... B A A B A A C A B \n", 626 | "\n", 627 | " Q025 \n", 628 | "0 A \n", 629 | "1 A \n", 630 | "2 B \n", 631 | "3 B \n", 632 | "4 A \n", 633 | "... ... 
\n", 634 | "338705 B \n", 635 | "338706 A \n", 636 | "338707 B \n", 637 | "338708 A \n", 638 | "338709 B \n", 639 | "\n", 640 | "[338710 rows x 136 columns]" 641 | ] 642 | }, 643 | "execution_count": 25, 644 | "metadata": {}, 645 | "output_type": "execute_result" 646 | } 647 | ], 648 | "source": [ 649 | "microdados_enem_rj" 650 | ] 651 | }, 652 | { 653 | "cell_type": "code", 654 | "execution_count": 27, 655 | "metadata": {}, 656 | "outputs": [ 657 | { 658 | "data": { 659 | "text/plain": [ 660 | "array(['RJ'], dtype=object)" 661 | ] 662 | }, 663 | "execution_count": 27, 664 | "metadata": {}, 665 | "output_type": "execute_result" 666 | } 667 | ], 668 | "source": [ 669 | "microdados_enem_rj.SG_UF_RESIDENCIA.unique()" 670 | ] 671 | }, 672 | { 673 | "cell_type": "code", 674 | "execution_count": 28, 675 | "metadata": {}, 676 | "outputs": [ 677 | { 678 | "data": { 679 | "text/plain": [ 680 | "array(['NU_INSCRICAO', 'NU_ANO', 'CO_MUNICIPIO_RESIDENCIA',\n", 681 | " 'NO_MUNICIPIO_RESIDENCIA', 'CO_UF_RESIDENCIA', 'SG_UF_RESIDENCIA',\n", 682 | " 'NU_IDADE', 'TP_SEXO', 'TP_ESTADO_CIVIL', 'TP_COR_RACA',\n", 683 | " 'TP_NACIONALIDADE', 'CO_MUNICIPIO_NASCIMENTO',\n", 684 | " 'NO_MUNICIPIO_NASCIMENTO', 'CO_UF_NASCIMENTO', 'SG_UF_NASCIMENTO',\n", 685 | " 'TP_ST_CONCLUSAO', 'TP_ANO_CONCLUIU', 'TP_ESCOLA', 'TP_ENSINO',\n", 686 | " 'IN_TREINEIRO', 'CO_ESCOLA', 'CO_MUNICIPIO_ESC',\n", 687 | " 'NO_MUNICIPIO_ESC', 'CO_UF_ESC', 'SG_UF_ESC',\n", 688 | " 'TP_DEPENDENCIA_ADM_ESC', 'TP_LOCALIZACAO_ESC', 'TP_SIT_FUNC_ESC',\n", 689 | " 'IN_BAIXA_VISAO', 'IN_CEGUEIRA', 'IN_SURDEZ',\n", 690 | " 'IN_DEFICIENCIA_AUDITIVA', 'IN_SURDO_CEGUEIRA',\n", 691 | " 'IN_DEFICIENCIA_FISICA', 'IN_DEFICIENCIA_MENTAL',\n", 692 | " 'IN_DEFICIT_ATENCAO', 'IN_DISLEXIA', 'IN_DISCALCULIA',\n", 693 | " 'IN_AUTISMO', 'IN_VISAO_MONOCULAR', 'IN_OUTRA_DEF', 'IN_GESTANTE',\n", 694 | " 'IN_LACTANTE', 'IN_IDOSO', 'IN_ESTUDA_CLASSE_HOSPITALAR',\n", 695 | " 'IN_SEM_RECURSO', 'IN_BRAILLE', 'IN_AMPLIADA_24', 'IN_AMPLIADA_18',\n", 
696 | " 'IN_LEDOR', 'IN_ACESSO', 'IN_TRANSCRICAO', 'IN_LIBRAS',\n", 697 | " 'IN_TEMPO_ADICIONAL', 'IN_LEITURA_LABIAL', 'IN_MESA_CADEIRA_RODAS',\n", 698 | " 'IN_MESA_CADEIRA_SEPARADA', 'IN_APOIO_PERNA', 'IN_GUIA_INTERPRETE',\n", 699 | " 'IN_COMPUTADOR', 'IN_CADEIRA_ESPECIAL', 'IN_CADEIRA_CANHOTO',\n", 700 | " 'IN_CADEIRA_ACOLCHOADA', 'IN_PROVA_DEITADO', 'IN_MOBILIARIO_OBESO',\n", 701 | " 'IN_LAMINA_OVERLAY', 'IN_PROTETOR_AURICULAR', 'IN_MEDIDOR_GLICOSE',\n", 702 | " 'IN_MAQUINA_BRAILE', 'IN_SOROBAN', 'IN_MARCA_PASSO', 'IN_SONDA',\n", 703 | " 'IN_MEDICAMENTOS', 'IN_SALA_INDIVIDUAL', 'IN_SALA_ESPECIAL',\n", 704 | " 'IN_SALA_ACOMPANHANTE', 'IN_MOBILIARIO_ESPECIFICO',\n", 705 | " 'IN_MATERIAL_ESPECIFICO', 'IN_NOME_SOCIAL', 'CO_MUNICIPIO_PROVA',\n", 706 | " 'NO_MUNICIPIO_PROVA', 'CO_UF_PROVA', 'SG_UF_PROVA',\n", 707 | " 'TP_PRESENCA_CN', 'TP_PRESENCA_CH', 'TP_PRESENCA_LC',\n", 708 | " 'TP_PRESENCA_MT', 'CO_PROVA_CN', 'CO_PROVA_CH', 'CO_PROVA_LC',\n", 709 | " 'CO_PROVA_MT', 'NU_NOTA_CN', 'NU_NOTA_CH', 'NU_NOTA_LC',\n", 710 | " 'NU_NOTA_MT', 'TX_RESPOSTAS_CN', 'TX_RESPOSTAS_CH',\n", 711 | " 'TX_RESPOSTAS_LC', 'TX_RESPOSTAS_MT', 'TP_LINGUA',\n", 712 | " 'TX_GABARITO_CN', 'TX_GABARITO_CH', 'TX_GABARITO_LC',\n", 713 | " 'TX_GABARITO_MT', 'TP_STATUS_REDACAO', 'NU_NOTA_COMP1',\n", 714 | " 'NU_NOTA_COMP2', 'NU_NOTA_COMP3', 'NU_NOTA_COMP4', 'NU_NOTA_COMP5',\n", 715 | " 'NU_NOTA_REDACAO', 'Q001', 'Q002', 'Q003', 'Q004', 'Q005', 'Q006',\n", 716 | " 'Q007', 'Q008', 'Q009', 'Q010', 'Q011', 'Q012', 'Q013', 'Q014',\n", 717 | " 'Q015', 'Q016', 'Q017', 'Q018', 'Q019', 'Q020', 'Q021', 'Q022',\n", 718 | " 'Q023', 'Q024', 'Q025'], dtype=object)" 719 | ] 720 | }, 721 | "execution_count": 28, 722 | "metadata": {}, 723 | "output_type": "execute_result" 724 | } 725 | ], 726 | "source": [ 727 | "microdados_enem_rj.columns.values" 728 | ] 729 | }, 730 | { 731 | "cell_type": "code", 732 | "execution_count": 30, 733 | "metadata": {}, 734 | "outputs": [ 735 | { 736 | "data": { 737 | "text/plain": [ 
738 | "NU_NOTA_CN 491.892385\n", 739 | "NU_NOTA_CH 523.361916\n", 740 | "NU_NOTA_LC 535.900530\n", 741 | "NU_NOTA_MT 539.564877\n", 742 | "dtype: float64" 743 | ] 744 | }, 745 | "execution_count": 30, 746 | "metadata": {}, 747 | "output_type": "execute_result" 748 | } 749 | ], 750 | "source": [ 751 | "microdados_enem_rj[['NU_NOTA_CN', 'NU_NOTA_CH', 'NU_NOTA_LC',\n", 752 | " 'NU_NOTA_MT']].mean()" 753 | ] 754 | }, 755 | { 756 | "cell_type": "code", 757 | "execution_count": 63, 758 | "metadata": {}, 759 | "outputs": [ 760 | { 761 | "data": { 762 | "text/html": [ 763 | "\n", 764 | "\n", 771 | "\n", 772 | "
\n", 773 | " \n", 774 | "
\n", 775 | " \n" 781 | ], 782 | "text/plain": [ 783 | "" 784 | ] 785 | }, 786 | "execution_count": 63, 787 | "metadata": {}, 788 | "output_type": "execute_result" 789 | } 790 | ], 791 | "source": [ 792 | "chart = ctc.Bar('Médias Notas RJ',width='500px',height='400px')\n", 793 | "chart.set_options(\n", 794 | " labels=['C. Natureza', 'C. Humanas', 'Linguagens', 'Matemática', 'Redação'],\n", 795 | " x_label=\"Provas\",\n", 796 | " y_label=\"Média por Prova\" ,\n", 797 | " colors=['#D9F1BB','#F7B7A3','#EA5F89','#9B3192', '#FFFF77']\n", 798 | " )\n", 799 | "chart.add_series(\"Média\",list(microdados_enem_rj[['NU_NOTA_CN', 'NU_NOTA_CH', 'NU_NOTA_LC',\n", 800 | " 'NU_NOTA_MT', 'NU_NOTA_REDACAO']].mean()))\n", 801 | "chart.render_notebook()" 802 | ] 803 | }, 804 | { 805 | "cell_type": "code", 806 | "execution_count": 68, 807 | "metadata": {}, 808 | "outputs": [ 809 | { 810 | "data": { 811 | "text/html": [ 812 | "\n", 813 | "\n", 820 | "\n", 821 | "
\n", 822 | " \n", 823 | "
\n", 824 | " \n" 830 | ], 831 | "text/plain": [ 832 | "" 833 | ] 834 | }, 835 | "execution_count": 68, 836 | "metadata": {}, 837 | "output_type": "execute_result" 838 | } 839 | ], 840 | "source": [ 841 | "municipio = \"Angra dos Reis\"\n", 842 | "\n", 843 | "radar_chart = ctc.Radar('Médias Notas RJ',width='600px',height='600px')\n", 844 | "radar_chart.set_options(\n", 845 | " labels=['C. Natureza', 'C. Humanas', 'Linguagens', 'Matemática', 'Redação'],\n", 846 | " is_show_legend=True, #by default, it is true. You can turn it off.\n", 847 | " legend_pos='upRight' #location of the legend\n", 848 | " )\n", 849 | "\n", 850 | "radar_chart.add_series(\"Média dos Municípios RJ\",list(microdados_enem_rj[['NU_NOTA_CN', 'NU_NOTA_CH', 'NU_NOTA_LC',\n", 851 | " 'NU_NOTA_MT','NU_NOTA_REDACAO']].mean()))\n", 852 | "radar_chart.add_series(\"Média do Município {}\".format(municipio),\n", 853 | " list(microdados_enem_rj.groupby(['NO_MUNICIPIO_RESIDENCIA'])[['NU_NOTA_CN', 'NU_NOTA_CH', 'NU_NOTA_LC',\n", 854 | " 'NU_NOTA_MT','NU_NOTA_REDACAO']].mean().loc[municipio]))\n", 855 | "\n", 856 | "radar_chart.render_notebook()" 857 | ] 858 | }, 859 | { 860 | "cell_type": "code", 861 | "execution_count": 51, 862 | "metadata": {}, 863 | "outputs": [ 864 | { 865 | "data": { 866 | "text/plain": [ 867 | "NU_NOTA_CN 475.984038\n", 868 | "NU_NOTA_CH 508.694181\n", 869 | "NU_NOTA_LC 527.015926\n", 870 | "NU_NOTA_MT 520.845753\n", 871 | "Name: Angra dos Reis, dtype: float64" 872 | ] 873 | }, 874 | "execution_count": 51, 875 | "metadata": {}, 876 | "output_type": "execute_result" 877 | } 878 | ], 879 | "source": [ 880 | "microdados_enem_rj.groupby(['NO_MUNICIPIO_RESIDENCIA'])[['NU_NOTA_CN', 'NU_NOTA_CH', 'NU_NOTA_LC',\n", 881 | " 'NU_NOTA_MT']].mean().loc['Angra dos Reis']" 882 | ] 883 | }, 884 | { 885 | "cell_type": "code", 886 | "execution_count": 52, 887 | "metadata": {}, 888 | "outputs": [ 889 | { 890 | "data": { 891 | "text/html": [ 892 | "
\n", 893 | "\n", 906 | "\n", 907 | " \n", 908 | " \n", 909 | " \n", 910 | " \n", 911 | " \n", 912 | " \n", 913 | " \n", 914 | " \n", 915 | " \n", 916 | " \n", 917 | " \n", 918 | " \n", 919 | " \n", 920 | " \n", 921 | " \n", 922 | " \n", 923 | " \n", 924 | " \n", 925 | " \n", 926 | " \n", 927 | " \n", 928 | " \n", 929 | " \n", 930 | " \n", 931 | " \n", 932 | " \n", 933 | " \n", 934 | " \n", 935 | " \n", 936 | " \n", 937 | " \n", 938 | " \n", 939 | " \n", 940 | " \n", 941 | " \n", 942 | " \n", 943 | " \n", 944 | " \n", 945 | " \n", 946 | " \n", 947 | " \n", 948 | " \n", 949 | " \n", 950 | " \n", 951 | " \n", 952 | " \n", 953 | " \n", 954 | " \n", 955 | " \n", 956 | " \n", 957 | " \n", 958 | " \n", 959 | " \n", 960 | " \n", 961 | " \n", 962 | " \n", 963 | " \n", 964 | " \n", 965 | " \n", 966 | " \n", 967 | " \n", 968 | " \n", 969 | " \n", 970 | " \n", 971 | " \n", 972 | " \n", 973 | " \n", 974 | " \n", 975 | " \n", 976 | " \n", 977 | " \n", 978 | " \n", 979 | " \n", 980 | " \n", 981 | " \n", 982 | " \n", 983 | " \n", 984 | " \n", 985 | " \n", 986 | " \n", 987 | " \n", 988 | " \n", 989 | " \n", 990 | " \n", 991 | " \n", 992 | " \n", 993 | " \n", 994 | " \n", 995 | " \n", 996 | " \n", 997 | " \n", 998 | " \n", 999 | " \n", 1000 | " \n", 1001 | " \n", 1002 | "
NU_NOTA_CNNU_NOTA_CHNU_NOTA_LCNU_NOTA_MT
NO_MUNICIPIO_RESIDENCIA
Angra dos Reis475.984038508.694181527.015926520.845753
Aperibé493.393789518.341379528.701724542.992547
Araruama488.075321514.994308529.860574532.785762
Areal474.303145503.188304523.457895515.313208
Armação dos Búzios490.474903525.274910535.007040530.700000
...............
Três Rios482.053123511.984375527.105288522.841703
Valença495.254925522.922297534.024662546.180657
Varre-Sai492.420492503.276692512.384211534.113934
Vassouras485.166593513.554167528.432917525.596239
Volta Redonda507.400156535.504062544.084667569.327552
\n", 1003 | "

92 rows × 4 columns

\n", 1004 | "
" 1005 | ], 1006 | "text/plain": [ 1007 | " NU_NOTA_CN NU_NOTA_CH NU_NOTA_LC NU_NOTA_MT\n", 1008 | "NO_MUNICIPIO_RESIDENCIA \n", 1009 | "Angra dos Reis 475.984038 508.694181 527.015926 520.845753\n", 1010 | "Aperibé 493.393789 518.341379 528.701724 542.992547\n", 1011 | "Araruama 488.075321 514.994308 529.860574 532.785762\n", 1012 | "Areal 474.303145 503.188304 523.457895 515.313208\n", 1013 | "Armação dos Búzios 490.474903 525.274910 535.007040 530.700000\n", 1014 | "... ... ... ... ...\n", 1015 | "Três Rios 482.053123 511.984375 527.105288 522.841703\n", 1016 | "Valença 495.254925 522.922297 534.024662 546.180657\n", 1017 | "Varre-Sai 492.420492 503.276692 512.384211 534.113934\n", 1018 | "Vassouras 485.166593 513.554167 528.432917 525.596239\n", 1019 | "Volta Redonda 507.400156 535.504062 544.084667 569.327552\n", 1020 | "\n", 1021 | "[92 rows x 4 columns]" 1022 | ] 1023 | }, 1024 | "execution_count": 52, 1025 | "metadata": {}, 1026 | "output_type": "execute_result" 1027 | } 1028 | ], 1029 | "source": [ 1030 | "microdados_enem_rj.groupby(['NO_MUNICIPIO_RESIDENCIA'])['NU_NOTA_CN', 'NU_NOTA_CH', 'NU_NOTA_LC',\n", 1031 | " 'NU_NOTA_MT'].mean()" 1032 | ] 1033 | }, 1034 | { 1035 | "cell_type": "code", 1036 | "execution_count": null, 1037 | "metadata": {}, 1038 | "outputs": [], 1039 | "source": [] 1040 | }, 1041 | { 1042 | "cell_type": "code", 1043 | "execution_count": null, 1044 | "metadata": {}, 1045 | "outputs": [], 1046 | "source": [] 1047 | }, 1048 | { 1049 | "cell_type": "code", 1050 | "execution_count": null, 1051 | "metadata": {}, 1052 | "outputs": [], 1053 | "source": [] 1054 | } 1055 | ], 1056 | "metadata": { 1057 | "kernelspec": { 1058 | "display_name": "Python 3", 1059 | "language": "python", 1060 | "name": "python3" 1061 | }, 1062 | "language_info": { 1063 | "codemirror_mode": { 1064 | "name": "ipython", 1065 | "version": 3 1066 | }, 1067 | "file_extension": ".py", 1068 | "mimetype": "text/x-python", 1069 | "name": "python", 1070 | "nbconvert_exporter": 
"python", 1071 | "pygments_lexer": "ipython3", 1072 | "version": "3.7.4" 1073 | } 1074 | }, 1075 | "nbformat": 4, 1076 | "nbformat_minor": 2 1077 | } 1078 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | # Dicas de Pandas 2 | 3 | Esse repositório foi criado para a série de vídeos de Dicas do Pandas do canal [Programação Dinâmica](https://www.youtube.com/programacaodinamica). 4 | 5 | - [Assista aos vídeos da playlist de Dica de Pandas](https://www.youtube.com/playlist?list=PL5TJqBvpXQv6SSsEgQrNwpOLTupXPuiMQ) 6 | -------------------------------------------------------------------------------- /Variáveis categóricas - Dica Pandas #6.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "markdown", 5 | "metadata": {}, 6 | "source": [ 7 | "## Variáveis categóricas - Dica Pandas #6" 8 | ] 9 | }, 10 | { 11 | "cell_type": "markdown", 12 | "metadata": {}, 13 | "source": [ 14 | "https://pandas.pydata.org/pandas-docs/stable/reference/api/pandas.cut.html" 15 | ] 16 | }, 17 | { 18 | "cell_type": "code", 19 | "execution_count": 1, 20 | "metadata": {}, 21 | "outputs": [], 22 | "source": [ 23 | "from IPython.display import YouTubeVideo, Image" 24 | ] 25 | }, 26 | { 27 | "cell_type": "code", 28 | "execution_count": 2, 29 | "metadata": {}, 30 | "outputs": [ 31 | { 32 | "data": { 33 | "image/jpeg": "\n", 34 | "text/html": [ 35 | "\n", 36 | " \n", 43 | " " 44 | ], 45 | "text/plain": [ 46 | "" 47 | ] 48 | }, 49 | "metadata": {}, 50 | "output_type": "display_data" 51 | } 52 | ], 53 | "source": [ 54 | "display(YouTubeVideo('Sp9oqlVBgJc', width=550, height=310))" 55 | ] 56 | }, 57 | { 58 | "cell_type": "code", 59 | "execution_count": 3, 60 | "metadata": {}, 61 | "outputs": [], 62 | "source": [ 63 | "import pandas as pd" 64 | ] 65 | }, 66 | { 67 | "cell_type": "code", 68 | 
"execution_count": 4, 69 | "metadata": {}, 70 | "outputs": [], 71 | "source": [ 72 | "microdados_enem = pd.read_csv('../dados/microdados-enem-2018/DADOS/MICRODADOS_ENEM_2018.csv',nrows=0,sep=';',encoding='ISO-8859-1')" 73 | ] 74 | }, 75 | { 76 | "cell_type": "code", 77 | "execution_count": 5, 78 | "metadata": {}, 79 | "outputs": [ 80 | { 81 | "data": { 82 | "text/html": [ 83 | "
\n", 84 | "\n", 97 | "\n", 98 | " \n", 99 | " \n", 100 | " \n", 101 | " \n", 102 | " \n", 103 | " \n", 104 | " \n", 105 | " \n", 106 | " \n", 107 | " \n", 108 | " \n", 109 | " \n", 110 | " \n", 111 | " \n", 112 | " \n", 113 | " \n", 114 | " \n", 115 | " \n", 116 | " \n", 117 | " \n", 118 | " \n", 119 | " \n", 120 | " \n", 121 | " \n", 122 | " \n", 123 | " \n", 124 | " \n", 125 | " \n", 126 | "
NU_INSCRICAONU_ANOCO_MUNICIPIO_RESIDENCIANO_MUNICIPIO_RESIDENCIACO_UF_RESIDENCIASG_UF_RESIDENCIANU_IDADETP_SEXOTP_ESTADO_CIVILTP_COR_RACA...Q018Q019Q020Q021Q022Q023Q024Q025Q026Q027
\n", 127 | "

0 rows × 137 columns

\n", 128 | "
" 129 | ], 130 | "text/plain": [ 131 | "Empty DataFrame\n", 132 | "Columns: [NU_INSCRICAO, NU_ANO, CO_MUNICIPIO_RESIDENCIA, NO_MUNICIPIO_RESIDENCIA, CO_UF_RESIDENCIA, SG_UF_RESIDENCIA, NU_IDADE, TP_SEXO, TP_ESTADO_CIVIL, TP_COR_RACA, TP_NACIONALIDADE, CO_MUNICIPIO_NASCIMENTO, NO_MUNICIPIO_NASCIMENTO, CO_UF_NASCIMENTO, SG_UF_NASCIMENTO, TP_ST_CONCLUSAO, TP_ANO_CONCLUIU, TP_ESCOLA, TP_ENSINO, IN_TREINEIRO, CO_ESCOLA, CO_MUNICIPIO_ESC, NO_MUNICIPIO_ESC, CO_UF_ESC, SG_UF_ESC, TP_DEPENDENCIA_ADM_ESC, TP_LOCALIZACAO_ESC, TP_SIT_FUNC_ESC, IN_BAIXA_VISAO, IN_CEGUEIRA, IN_SURDEZ, IN_DEFICIENCIA_AUDITIVA, IN_SURDO_CEGUEIRA, IN_DEFICIENCIA_FISICA, IN_DEFICIENCIA_MENTAL, IN_DEFICIT_ATENCAO, IN_DISLEXIA, IN_DISCALCULIA, IN_AUTISMO, IN_VISAO_MONOCULAR, IN_OUTRA_DEF, IN_GESTANTE, IN_LACTANTE, IN_IDOSO, IN_ESTUDA_CLASSE_HOSPITALAR, IN_SEM_RECURSO, IN_BRAILLE, IN_AMPLIADA_24, IN_AMPLIADA_18, IN_LEDOR, IN_ACESSO, IN_TRANSCRICAO, IN_LIBRAS, IN_LEITURA_LABIAL, IN_MESA_CADEIRA_RODAS, IN_MESA_CADEIRA_SEPARADA, IN_APOIO_PERNA, IN_GUIA_INTERPRETE, IN_COMPUTADOR, IN_CADEIRA_ESPECIAL, IN_CADEIRA_CANHOTO, IN_CADEIRA_ACOLCHOADA, IN_PROVA_DEITADO, IN_MOBILIARIO_OBESO, IN_LAMINA_OVERLAY, IN_PROTETOR_AURICULAR, IN_MEDIDOR_GLICOSE, IN_MAQUINA_BRAILE, IN_SOROBAN, IN_MARCA_PASSO, IN_SONDA, IN_MEDICAMENTOS, IN_SALA_INDIVIDUAL, IN_SALA_ESPECIAL, IN_SALA_ACOMPANHANTE, IN_MOBILIARIO_ESPECIFICO, IN_MATERIAL_ESPECIFICO, IN_NOME_SOCIAL, CO_MUNICIPIO_PROVA, NO_MUNICIPIO_PROVA, CO_UF_PROVA, SG_UF_PROVA, TP_PRESENCA_CN, TP_PRESENCA_CH, TP_PRESENCA_LC, TP_PRESENCA_MT, CO_PROVA_CN, CO_PROVA_CH, CO_PROVA_LC, CO_PROVA_MT, NU_NOTA_CN, NU_NOTA_CH, NU_NOTA_LC, NU_NOTA_MT, TX_RESPOSTAS_CN, TX_RESPOSTAS_CH, TX_RESPOSTAS_LC, TX_RESPOSTAS_MT, TP_LINGUA, TX_GABARITO_CN, ...]\n", 133 | "Index: []\n", 134 | "\n", 135 | "[0 rows x 137 columns]" 136 | ] 137 | }, 138 | "execution_count": 5, 139 | "metadata": {}, 140 | "output_type": "execute_result" 141 | } 142 | ], 143 | "source": [ 144 | "microdados_enem.head()" 145 | ] 
146 | }, 147 | { 148 | "cell_type": "code", 149 | "execution_count": 6, 150 | "metadata": {}, 151 | "outputs": [ 152 | { 153 | "data": { 154 | "text/plain": [ 155 | "array(['NU_INSCRICAO', 'NU_ANO', 'CO_MUNICIPIO_RESIDENCIA',\n", 156 | " 'NO_MUNICIPIO_RESIDENCIA', 'CO_UF_RESIDENCIA', 'SG_UF_RESIDENCIA',\n", 157 | " 'NU_IDADE', 'TP_SEXO', 'TP_ESTADO_CIVIL', 'TP_COR_RACA',\n", 158 | " 'TP_NACIONALIDADE', 'CO_MUNICIPIO_NASCIMENTO',\n", 159 | " 'NO_MUNICIPIO_NASCIMENTO', 'CO_UF_NASCIMENTO', 'SG_UF_NASCIMENTO',\n", 160 | " 'TP_ST_CONCLUSAO', 'TP_ANO_CONCLUIU', 'TP_ESCOLA', 'TP_ENSINO',\n", 161 | " 'IN_TREINEIRO', 'CO_ESCOLA', 'CO_MUNICIPIO_ESC',\n", 162 | " 'NO_MUNICIPIO_ESC', 'CO_UF_ESC', 'SG_UF_ESC',\n", 163 | " 'TP_DEPENDENCIA_ADM_ESC', 'TP_LOCALIZACAO_ESC', 'TP_SIT_FUNC_ESC',\n", 164 | " 'IN_BAIXA_VISAO', 'IN_CEGUEIRA', 'IN_SURDEZ',\n", 165 | " 'IN_DEFICIENCIA_AUDITIVA', 'IN_SURDO_CEGUEIRA',\n", 166 | " 'IN_DEFICIENCIA_FISICA', 'IN_DEFICIENCIA_MENTAL',\n", 167 | " 'IN_DEFICIT_ATENCAO', 'IN_DISLEXIA', 'IN_DISCALCULIA',\n", 168 | " 'IN_AUTISMO', 'IN_VISAO_MONOCULAR', 'IN_OUTRA_DEF', 'IN_GESTANTE',\n", 169 | " 'IN_LACTANTE', 'IN_IDOSO', 'IN_ESTUDA_CLASSE_HOSPITALAR',\n", 170 | " 'IN_SEM_RECURSO', 'IN_BRAILLE', 'IN_AMPLIADA_24', 'IN_AMPLIADA_18',\n", 171 | " 'IN_LEDOR', 'IN_ACESSO', 'IN_TRANSCRICAO', 'IN_LIBRAS',\n", 172 | " 'IN_LEITURA_LABIAL', 'IN_MESA_CADEIRA_RODAS',\n", 173 | " 'IN_MESA_CADEIRA_SEPARADA', 'IN_APOIO_PERNA', 'IN_GUIA_INTERPRETE',\n", 174 | " 'IN_COMPUTADOR', 'IN_CADEIRA_ESPECIAL', 'IN_CADEIRA_CANHOTO',\n", 175 | " 'IN_CADEIRA_ACOLCHOADA', 'IN_PROVA_DEITADO', 'IN_MOBILIARIO_OBESO',\n", 176 | " 'IN_LAMINA_OVERLAY', 'IN_PROTETOR_AURICULAR', 'IN_MEDIDOR_GLICOSE',\n", 177 | " 'IN_MAQUINA_BRAILE', 'IN_SOROBAN', 'IN_MARCA_PASSO', 'IN_SONDA',\n", 178 | " 'IN_MEDICAMENTOS', 'IN_SALA_INDIVIDUAL', 'IN_SALA_ESPECIAL',\n", 179 | " 'IN_SALA_ACOMPANHANTE', 'IN_MOBILIARIO_ESPECIFICO',\n", 180 | " 'IN_MATERIAL_ESPECIFICO', 'IN_NOME_SOCIAL', 'CO_MUNICIPIO_PROVA',\n", 
181 | " 'NO_MUNICIPIO_PROVA', 'CO_UF_PROVA', 'SG_UF_PROVA',\n", 182 | " 'TP_PRESENCA_CN', 'TP_PRESENCA_CH', 'TP_PRESENCA_LC',\n", 183 | " 'TP_PRESENCA_MT', 'CO_PROVA_CN', 'CO_PROVA_CH', 'CO_PROVA_LC',\n", 184 | " 'CO_PROVA_MT', 'NU_NOTA_CN', 'NU_NOTA_CH', 'NU_NOTA_LC',\n", 185 | " 'NU_NOTA_MT', 'TX_RESPOSTAS_CN', 'TX_RESPOSTAS_CH',\n", 186 | " 'TX_RESPOSTAS_LC', 'TX_RESPOSTAS_MT', 'TP_LINGUA',\n", 187 | " 'TX_GABARITO_CN', 'TX_GABARITO_CH', 'TX_GABARITO_LC',\n", 188 | " 'TX_GABARITO_MT', 'TP_STATUS_REDACAO', 'NU_NOTA_COMP1',\n", 189 | " 'NU_NOTA_COMP2', 'NU_NOTA_COMP3', 'NU_NOTA_COMP4', 'NU_NOTA_COMP5',\n", 190 | " 'NU_NOTA_REDACAO', 'Q001', 'Q002', 'Q003', 'Q004', 'Q005', 'Q006',\n", 191 | " 'Q007', 'Q008', 'Q009', 'Q010', 'Q011', 'Q012', 'Q013', 'Q014',\n", 192 | " 'Q015', 'Q016', 'Q017', 'Q018', 'Q019', 'Q020', 'Q021', 'Q022',\n", 193 | " 'Q023', 'Q024', 'Q025', 'Q026', 'Q027'], dtype=object)" 194 | ] 195 | }, 196 | "execution_count": 6, 197 | "metadata": {}, 198 | "output_type": "execute_result" 199 | } 200 | ], 201 | "source": [ 202 | "microdados_enem.columns.values" 203 | ] 204 | }, 205 | { 206 | "cell_type": "code", 207 | "execution_count": 7, 208 | "metadata": {}, 209 | "outputs": [], 210 | "source": [ 211 | "cols = ['NU_NOTA_MT', 'Q027']" 212 | ] 213 | }, 214 | { 215 | "cell_type": "code", 216 | "execution_count": 8, 217 | "metadata": {}, 218 | "outputs": [], 219 | "source": [ 220 | "microdados_enem = pd.read_csv('../dados/microdados-enem-2018/DADOS/MICRODADOS_ENEM_2018.csv',usecols=cols,sep=';',encoding='ISO-8859-1',\n", 221 | " dtype={'Q027':'category'})\n" 222 | ] 223 | }, 224 | { 225 | "cell_type": "code", 226 | "execution_count": 9, 227 | "metadata": {}, 228 | "outputs": [ 229 | { 230 | "data": { 231 | "text/html": [ 232 | "
\n", 233 | "\n", 246 | "\n", 247 | " \n", 248 | " \n", 249 | " \n", 250 | " \n", 251 | " \n", 252 | " \n", 253 | " \n", 254 | " \n", 255 | " \n", 256 | " \n", 257 | " \n", 258 | " \n", 259 | " \n", 260 | " \n", 261 | " \n", 262 | " \n", 263 | " \n", 264 | " \n", 265 | " \n", 266 | " \n", 267 | " \n", 268 | " \n", 269 | " \n", 270 | " \n", 271 | " \n", 272 | " \n", 273 | " \n", 274 | " \n", 275 | " \n", 276 | " \n", 277 | " \n", 278 | " \n", 279 | " \n", 280 | " \n", 281 | "
NU_NOTA_MTQ027
0NaNA
1480.3A
2NaNA
3NaNA
4NaNA
\n", 282 | "
" 283 | ], 284 | "text/plain": [ 285 | " NU_NOTA_MT Q027\n", 286 | "0 NaN A\n", 287 | "1 480.3 A\n", 288 | "2 NaN A\n", 289 | "3 NaN A\n", 290 | "4 NaN A" 291 | ] 292 | }, 293 | "execution_count": 9, 294 | "metadata": {}, 295 | "output_type": "execute_result" 296 | } 297 | ], 298 | "source": [ 299 | "microdados_enem.head()" 300 | ] 301 | }, 302 | { 303 | "cell_type": "code", 304 | "execution_count": 10, 305 | "metadata": {}, 306 | "outputs": [ 307 | { 308 | "name": "stdout", 309 | "output_type": "stream", 310 | "text": [ 311 | "\n", 312 | "RangeIndex: 5513747 entries, 0 to 5513746\n", 313 | "Data columns (total 2 columns):\n", 314 | "NU_NOTA_MT float64\n", 315 | "Q027 category\n", 316 | "dtypes: category(1), float64(1)\n", 317 | "memory usage: 47.3 MB\n" 318 | ] 319 | } 320 | ], 321 | "source": [ 322 | "microdados_enem.info()" 323 | ] 324 | }, 325 | { 326 | "cell_type": "code", 327 | "execution_count": 11, 328 | "metadata": {}, 329 | "outputs": [ 330 | { 331 | "data": { 332 | "text/plain": [ 333 | "NU_NOTA_MT 1608648\n", 334 | "Q027 0\n", 335 | "dtype: int64" 336 | ] 337 | }, 338 | "execution_count": 11, 339 | "metadata": {}, 340 | "output_type": "execute_result" 341 | } 342 | ], 343 | "source": [ 344 | "microdados_enem.isna().sum()" 345 | ] 346 | }, 347 | { 348 | "cell_type": "code", 349 | "execution_count": 12, 350 | "metadata": {}, 351 | "outputs": [], 352 | "source": [ 353 | "microdados_enem.dropna(inplace=True)" 354 | ] 355 | }, 356 | { 357 | "cell_type": "code", 358 | "execution_count": 13, 359 | "metadata": {}, 360 | "outputs": [ 361 | { 362 | "data": { 363 | "text/plain": [ 364 | "NU_NOTA_MT 0\n", 365 | "Q027 0\n", 366 | "dtype: int64" 367 | ] 368 | }, 369 | "execution_count": 13, 370 | "metadata": {}, 371 | "output_type": "execute_result" 372 | } 373 | ], 374 | "source": [ 375 | "microdados_enem.isna().sum()" 376 | ] 377 | }, 378 | { 379 | "cell_type": "code", 380 | "execution_count": 14, 381 | "metadata": {}, 382 | "outputs": [ 383 | { 384 | "name": 
"stdout", 385 | "output_type": "stream", 386 | "text": [ 387 | "\n", 388 | "Int64Index: 3905099 entries, 1 to 5513746\n", 389 | "Data columns (total 2 columns):\n", 390 | "NU_NOTA_MT float64\n", 391 | "Q027 category\n", 392 | "dtypes: category(1), float64(1)\n", 393 | "memory usage: 63.3 MB\n" 394 | ] 395 | } 396 | ], 397 | "source": [ 398 | "microdados_enem.info()" 399 | ] 400 | }, 401 | { 402 | "cell_type": "markdown", 403 | "metadata": {}, 404 | "source": [ 405 | "Nota: Adicionei o comando abaixo, após um comentário no vídeo sobre o uso de memória" 406 | ] 407 | }, 408 | { 409 | "cell_type": "code", 410 | "execution_count": 16, 411 | "metadata": { 412 | "scrolled": true 413 | }, 414 | "outputs": [], 415 | "source": [ 416 | "microdados_enem = microdados_enem.reset_index(drop=True)" 417 | ] 418 | }, 419 | { 420 | "cell_type": "code", 421 | "execution_count": 17, 422 | "metadata": {}, 423 | "outputs": [ 424 | { 425 | "name": "stdout", 426 | "output_type": "stream", 427 | "text": [ 428 | "\n", 429 | "RangeIndex: 3905099 entries, 0 to 3905098\n", 430 | "Data columns (total 2 columns):\n", 431 | "NU_NOTA_MT float64\n", 432 | "Q027 category\n", 433 | "dtypes: category(1), float64(1)\n", 434 | "memory usage: 33.5 MB\n" 435 | ] 436 | } 437 | ], 438 | "source": [ 439 | "microdados_enem.info()" 440 | ] 441 | }, 442 | { 443 | "cell_type": "code", 444 | "execution_count": 18, 445 | "metadata": {}, 446 | "outputs": [], 447 | "source": [ 448 | "microdados_enem['Q027_GRUPOS'] = microdados_enem['Q027'].cat.codes" 449 | ] 450 | }, 451 | { 452 | "cell_type": "code", 453 | "execution_count": 19, 454 | "metadata": {}, 455 | "outputs": [ 456 | { 457 | "data": { 458 | "text/plain": [ 459 | "A 2850097\n", 460 | "D 526557\n", 461 | "B 327804\n", 462 | "C 104161\n", 463 | "E 94813\n", 464 | "F 1667\n", 465 | "Name: Q027, dtype: int64" 466 | ] 467 | }, 468 | "execution_count": 19, 469 | "metadata": {}, 470 | "output_type": "execute_result" 471 | } 472 | ], 473 | "source": [ 474 | 
"microdados_enem['Q027'].value_counts()" 475 | ] 476 | }, 477 | { 478 | "cell_type": "code", 479 | "execution_count": 20, 480 | "metadata": {}, 481 | "outputs": [ 482 | { 483 | "data": { 484 | "text/plain": [ 485 | "0 2850097\n", 486 | "3 526557\n", 487 | "1 327804\n", 488 | "2 104161\n", 489 | "4 94813\n", 490 | "5 1667\n", 491 | "Name: Q027_GRUPOS, dtype: int64" 492 | ] 493 | }, 494 | "execution_count": 20, 495 | "metadata": {}, 496 | "output_type": "execute_result" 497 | } 498 | ], 499 | "source": [ 500 | "microdados_enem['Q027_GRUPOS'].value_counts()" 501 | ] 502 | }, 503 | { 504 | "cell_type": "code", 505 | "execution_count": 21, 506 | "metadata": {}, 507 | "outputs": [ 508 | { 509 | "data": { 510 | "text/html": [ 511 | "
\n", 512 | "\n", 525 | "\n", 526 | " \n", 527 | " \n", 528 | " \n", 529 | " \n", 530 | " \n", 531 | " \n", 532 | " \n", 533 | " \n", 534 | " \n", 535 | " \n", 536 | " \n", 537 | " \n", 538 | " \n", 539 | " \n", 540 | " \n", 541 | " \n", 542 | " \n", 543 | " \n", 544 | " \n", 545 | " \n", 546 | " \n", 547 | " \n", 548 | " \n", 549 | " \n", 550 | " \n", 551 | " \n", 552 | " \n", 553 | " \n", 554 | " \n", 555 | " \n", 556 | " \n", 557 | " \n", 558 | " \n", 559 | " \n", 560 | " \n", 561 | " \n", 562 | " \n", 563 | " \n", 564 | " \n", 565 | " \n", 566 | "
NU_NOTA_MTQ027Q027_GRUPOS
0480.3A0
1538.8A0
2733.8A0
3459.0A0
4525.4A0
\n", 567 | "
" 568 | ], 569 | "text/plain": [ 570 | " NU_NOTA_MT Q027 Q027_GRUPOS\n", 571 | "0 480.3 A 0\n", 572 | "1 538.8 A 0\n", 573 | "2 733.8 A 0\n", 574 | "3 459.0 A 0\n", 575 | "4 525.4 A 0" 576 | ] 577 | }, 578 | "execution_count": 21, 579 | "metadata": {}, 580 | "output_type": "execute_result" 581 | } 582 | ], 583 | "source": [ 584 | "microdados_enem.head()" 585 | ] 586 | }, 587 | { 588 | "cell_type": "code", 589 | "execution_count": 22, 590 | "metadata": {}, 591 | "outputs": [ 592 | { 593 | "data": { 594 | "text/html": [ 595 | "
\n", 596 | "\n", 609 | "\n", 610 | " \n", 611 | " \n", 612 | " \n", 613 | " \n", 614 | " \n", 615 | " \n", 616 | " \n", 617 | " \n", 618 | " \n", 619 | " \n", 620 | " \n", 621 | " \n", 622 | " \n", 623 | " \n", 624 | " \n", 625 | " \n", 626 | " \n", 627 | " \n", 628 | " \n", 629 | " \n", 630 | " \n", 631 | " \n", 632 | " \n", 633 | " \n", 634 | " \n", 635 | " \n", 636 | " \n", 637 | " \n", 638 | " \n", 639 | " \n", 640 | " \n", 641 | " \n", 642 | " \n", 643 | " \n", 644 | " \n", 645 | " \n", 646 | " \n", 647 | " \n", 648 | " \n", 649 | " \n", 650 | " \n", 651 | " \n", 652 | " \n", 653 | " \n", 654 | " \n", 655 | " \n", 656 | " \n", 657 | " \n", 658 | " \n", 659 | "
NU_NOTA_MTQ027_GRUPOS
count3.905099e+063.905099e+06
mean5.354056e+026.410552e-01
std1.031512e+021.179987e+00
min0.000000e+000.000000e+00
25%4.553000e+020.000000e+00
50%5.166000e+020.000000e+00
75%6.007000e+021.000000e+00
max9.961000e+025.000000e+00
\n", 660 | "
" 661 | ], 662 | "text/plain": [ 663 | " NU_NOTA_MT Q027_GRUPOS\n", 664 | "count 3.905099e+06 3.905099e+06\n", 665 | "mean 5.354056e+02 6.410552e-01\n", 666 | "std 1.031512e+02 1.179987e+00\n", 667 | "min 0.000000e+00 0.000000e+00\n", 668 | "25% 4.553000e+02 0.000000e+00\n", 669 | "50% 5.166000e+02 0.000000e+00\n", 670 | "75% 6.007000e+02 1.000000e+00\n", 671 | "max 9.961000e+02 5.000000e+00" 672 | ] 673 | }, 674 | "execution_count": 22, 675 | "metadata": {}, 676 | "output_type": "execute_result" 677 | } 678 | ], 679 | "source": [ 680 | "microdados_enem.describe()" 681 | ] 682 | }, 683 | { 684 | "cell_type": "code", 685 | "execution_count": 23, 686 | "metadata": {}, 687 | "outputs": [ 688 | { 689 | "data": { 690 | "text/plain": [ 691 | "média baixa 1465276\n", 692 | "média alta 1224868\n", 693 | "alta 942984\n", 694 | "baixa 232752\n", 695 | "Name: NU_NOTA_MT, dtype: int64" 696 | ] 697 | }, 698 | "execution_count": 23, 699 | "metadata": {}, 700 | "output_type": "execute_result" 701 | } 702 | ], 703 | "source": [ 704 | "pd.cut(microdados_enem.NU_NOTA_MT, bins=[0,400,500,600,800],labels=['baixa','média baixa','média alta','alta']).value_counts()" 705 | ] 706 | }, 707 | { 708 | "cell_type": "code", 709 | "execution_count": 24, 710 | "metadata": {}, 711 | "outputs": [], 712 | "source": [ 713 | "microdados_enem['NU_NOTA_MT_GRUPOS']=pd.qcut(microdados_enem.NU_NOTA_MT, q=4,labels=['baixa','média baixa','média alta','alta'])\n" 714 | ] 715 | }, 716 | { 717 | "cell_type": "code", 718 | "execution_count": 25, 719 | "metadata": {}, 720 | "outputs": [ 721 | { 722 | "data": { 723 | "text/html": [ 724 | "
\n", 725 | "\n", 738 | "\n", 739 | " \n", 740 | " \n", 741 | " \n", 742 | " \n", 743 | " \n", 744 | " \n", 745 | " \n", 746 | " \n", 747 | " \n", 748 | " \n", 749 | " \n", 750 | " \n", 751 | " \n", 752 | " \n", 753 | " \n", 754 | " \n", 755 | " \n", 756 | " \n", 757 | " \n", 758 | " \n", 759 | " \n", 760 | " \n", 761 | " \n", 762 | " \n", 763 | " \n", 764 | " \n", 765 | " \n", 766 | " \n", 767 | " \n", 768 | " \n", 769 | " \n", 770 | " \n", 771 | " \n", 772 | " \n", 773 | " \n", 774 | " \n", 775 | " \n", 776 | " \n", 777 | " \n", 778 | " \n", 779 | " \n", 780 | " \n", 781 | " \n", 782 | " \n", 783 | " \n", 784 | " \n", 785 | "
NU_NOTA_MTQ027Q027_GRUPOSNU_NOTA_MT_GRUPOS
0480.3A0média baixa
1538.8A0média alta
2733.8A0alta
3459.0A0média baixa
4525.4A0média alta
\n", 786 | "
" 787 | ], 788 | "text/plain": [ 789 | " NU_NOTA_MT Q027 Q027_GRUPOS NU_NOTA_MT_GRUPOS\n", 790 | "0 480.3 A 0 média baixa\n", 791 | "1 538.8 A 0 média alta\n", 792 | "2 733.8 A 0 alta\n", 793 | "3 459.0 A 0 média baixa\n", 794 | "4 525.4 A 0 média alta" 795 | ] 796 | }, 797 | "execution_count": 25, 798 | "metadata": {}, 799 | "output_type": "execute_result" 800 | } 801 | ], 802 | "source": [ 803 | "microdados_enem.head()" 804 | ] 805 | }, 806 | { 807 | "cell_type": "code", 808 | "execution_count": null, 809 | "metadata": {}, 810 | "outputs": [], 811 | "source": [] 812 | }, 813 | { 814 | "cell_type": "code", 815 | "execution_count": null, 816 | "metadata": {}, 817 | "outputs": [], 818 | "source": [] 819 | } 820 | ], 821 | "metadata": { 822 | "kernelspec": { 823 | "display_name": "Python 3", 824 | "language": "python", 825 | "name": "python3" 826 | }, 827 | "language_info": { 828 | "codemirror_mode": { 829 | "name": "ipython", 830 | "version": 3 831 | }, 832 | "file_extension": ".py", 833 | "mimetype": "text/x-python", 834 | "name": "python", 835 | "nbconvert_exporter": "python", 836 | "pygments_lexer": "ipython3", 837 | "version": "3.7.4" 838 | } 839 | }, 840 | "nbformat": 4, 841 | "nbformat_minor": 2 842 | } 843 | -------------------------------------------------------------------------------- /dados/HIST_PAINEL_COVIDBR_12jun2020.xlsx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/programacaodinamica/dicas-pandas/8a70f3357a95ddf2e05987cb20e361cab3d7bc6f/dados/HIST_PAINEL_COVIDBR_12jun2020.xlsx -------------------------------------------------------------------------------- /dados/TA_PRECO_MEDICAMENTO_GOV.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/programacaodinamica/dicas-pandas/8a70f3357a95ddf2e05987cb20e361cab3d7bc6f/dados/TA_PRECO_MEDICAMENTO_GOV.csv 
-------------------------------------------------------------------------------- /dados/bcdata-dolar-2023.csv: -------------------------------------------------------------------------------- 1 | "data";"valor" 2 | "02/01/2023";"5,3430" 3 | "03/01/2023";"5,3753" 4 | "04/01/2023";"5,4453" 5 | "05/01/2023";"5,4020" 6 | "06/01/2023";"5,2849" 7 | "09/01/2023";"5,2961" 8 | "10/01/2023";"5,2389" 9 | "11/01/2023";"5,2014" 10 | "12/01/2023";"5,1394" 11 | "13/01/2023";"5,1140" 12 | "16/01/2023";"5,1109" 13 | "17/01/2023";"5,1197" 14 | "18/01/2023";"5,0903" 15 | "19/01/2023";"5,2138" 16 | "20/01/2023";"5,1980" 17 | "23/01/2023";"5,1916" 18 | "24/01/2023";"5,1690" 19 | "25/01/2023";"5,1036" 20 | "26/01/2023";"5,0945" 21 | "27/01/2023";"5,0761" 22 | "30/01/2023";"5,0953" 23 | "31/01/2023";"5,0987" 24 | "01/02/2023";"5,0715" 25 | "02/02/2023";"4,9895" 26 | "03/02/2023";"5,1024" 27 | "06/02/2023";"5,1757" 28 | "07/02/2023";"5,1689" 29 | "08/02/2023";"5,2030" 30 | "09/02/2023";"5,2309" 31 | "10/02/2023";"5,2520" 32 | "13/02/2023";"5,1828" 33 | "14/02/2023";"5,1501" 34 | "15/02/2023";"5,2237" 35 | "16/02/2023";"5,2426" 36 | "17/02/2023";"5,2006" 37 | "22/02/2023";"5,1724" 38 | "23/02/2023";"5,1324" 39 | "24/02/2023";"5,1785" 40 | "27/02/2023";"5,1954" 41 | "28/02/2023";"5,2072" 42 | "01/03/2023";"5,2064" 43 | "02/03/2023";"5,2074" 44 | "03/03/2023";"5,2031" 45 | "06/03/2023";"5,1964" 46 | "07/03/2023";"5,1895" 47 | "08/03/2023";"5,1381" 48 | "09/03/2023";"5,1347" 49 | "10/03/2023";"5,1816" 50 | "13/03/2023";"5,2394" 51 | "14/03/2023";"5,2356" 52 | "15/03/2023";"5,2975" 53 | "16/03/2023";"5,2886" 54 | "17/03/2023";"5,2673" 55 | "20/03/2023";"5,2461" 56 | "21/03/2023";"5,2438" 57 | "22/03/2023";"5,2642" 58 | "23/03/2023";"5,2626" 59 | "24/03/2023";"5,2915" 60 | "27/03/2023";"5,2300" 61 | "28/03/2023";"5,1727" 62 | "29/03/2023";"5,1487" 63 | "30/03/2023";"5,1248" 64 | "31/03/2023";"5,0798" 65 | "03/04/2023";"5,0631" 66 | "04/04/2023";"5,0756" 67 | "05/04/2023";"5,0441" 68 | 
"06/04/2023";"5,0677" 69 | "10/04/2023";"5,0828" 70 | "11/04/2023";"5,0122" 71 | "12/04/2023";"4,9490" 72 | "13/04/2023";"4,9091" 73 | "14/04/2023";"4,9449" 74 | "17/04/2023";"4,9415" 75 | "18/04/2023";"4,9672" 76 | "19/04/2023";"5,0461" 77 | "20/04/2023";"5,0491" 78 | "24/04/2023";"5,0589" 79 | "25/04/2023";"5,0607" 80 | "26/04/2023";"5,0579" 81 | "27/04/2023";"5,0144" 82 | "28/04/2023";"5,0001" 83 | "02/05/2023";"5,0329" 84 | "03/05/2023";"5,0221" 85 | "04/05/2023";"5,0100" 86 | "05/05/2023";"4,9690" 87 | "08/05/2023";"4,9690" 88 | "09/05/2023";"5,0001" 89 | "10/05/2023";"4,9541" 90 | "11/05/2023";"4,9690" 91 | "12/05/2023";"4,9228" 92 | "15/05/2023";"4,9097" 93 | "16/05/2023";"4,9116" 94 | "17/05/2023";"4,9507" 95 | "18/05/2023";"4,9641" 96 | "19/05/2023";"4,9852" 97 | "22/05/2023";"4,9674" 98 | "23/05/2023";"4,9668" 99 | "24/05/2023";"4,9468" 100 | "25/05/2023";"4,9984" 101 | "26/05/2023";"5,0108" 102 | "29/05/2023";"4,9948" 103 | "30/05/2023";"5,0587" 104 | "31/05/2023";"5,0953" 105 | "01/06/2023";"5,0344" 106 | "02/06/2023";"4,9552" 107 | "05/06/2023";"4,9230" 108 | "06/06/2023";"4,9286" 109 | "07/06/2023";"4,9113" 110 | "09/06/2023";"4,8916" 111 | "12/06/2023";"4,8826" 112 | "13/06/2023";"4,8527" 113 | "14/06/2023";"4,8456" 114 | "15/06/2023";"4,8216" 115 | "16/06/2023";"4,8280" 116 | "19/06/2023";"4,7797" 117 | "20/06/2023";"4,7924" 118 | "21/06/2023";"4,7789" 119 | "22/06/2023";"4,7744" 120 | "23/06/2023";"4,7793" 121 | "26/06/2023";"4,7692" 122 | "27/06/2023";"4,7897" 123 | "28/06/2023";"4,8557" 124 | "29/06/2023";"4,8578" 125 | "30/06/2023";"4,8186" 126 | "03/07/2023";"4,7870" 127 | "04/07/2023";"4,8050" 128 | "05/07/2023";"4,8571" 129 | "06/07/2023";"4,8971" 130 | "07/07/2023";"4,8793" 131 | "10/07/2023";"4,8729" 132 | "11/07/2023";"4,8943" 133 | "12/07/2023";"4,8052" 134 | "13/07/2023";"4,8032" 135 | "14/07/2023";"4,7951" 136 | "17/07/2023";"4,8296" 137 | "18/07/2023";"4,8034" 138 | "19/07/2023";"4,7994" 139 | "20/07/2023";"4,7882" 140 | 
"21/07/2023";"4,7726" 141 | "24/07/2023";"4,7451" 142 | "25/07/2023";"4,7490" 143 | "26/07/2023";"4,7362" 144 | "27/07/2023";"4,7196" 145 | "28/07/2023";"4,7247" 146 | "31/07/2023";"4,7409" 147 | "01/08/2023";"4,7746" 148 | "02/08/2023";"4,8077" 149 | "03/08/2023";"4,8791" 150 | "04/08/2023";"4,8603" 151 | "07/08/2023";"4,9004" 152 | "08/08/2023";"4,9211" 153 | "09/08/2023";"4,9009" 154 | "10/08/2023";"4,8512" 155 | "11/08/2023";"4,8912" 156 | "14/08/2023";"4,9475" 157 | "15/08/2023";"4,9806" 158 | "16/08/2023";"4,9765" 159 | "17/08/2023";"4,9810" 160 | "18/08/2023";"4,9718" 161 | "21/08/2023";"4,9841" 162 | "22/08/2023";"4,9425" 163 | "23/08/2023";"4,8971" 164 | "24/08/2023";"4,8742" 165 | "25/08/2023";"4,8766" 166 | "28/08/2023";"4,8933" 167 | "29/08/2023";"4,8700" 168 | "30/08/2023";"4,8647" 169 | "31/08/2023";"4,9213" 170 | "01/09/2023";"4,9312" 171 | "04/09/2023";"4,9170" 172 | "05/09/2023";"4,9699" 173 | "06/09/2023";"4,9756" 174 | "08/09/2023";"4,9829" 175 | "11/09/2023";"4,9360" 176 | "12/09/2023";"4,9499" 177 | "13/09/2023";"4,9165" 178 | "14/09/2023";"4,8745" 179 | "15/09/2023";"4,8683" 180 | "18/09/2023";"4,8529" 181 | "19/09/2023";"4,8569" 182 | "20/09/2023";"4,8481" 183 | "21/09/2023";"4,9223" 184 | "22/09/2023";"4,9125" 185 | "25/09/2023";"4,9600" 186 | "26/09/2023";"4,9711" 187 | "27/09/2023";"5,0283" 188 | "28/09/2023";"5,0469" 189 | "29/09/2023";"5,0070" 190 | "02/10/2023";"5,0673" 191 | "03/10/2023";"5,1094" 192 | "04/10/2023";"5,1520" 193 | "05/10/2023";"5,1707" 194 | "06/10/2023";"5,1912" 195 | "09/10/2023";"5,1660" 196 | "10/10/2023";"5,0856" 197 | "11/10/2023";"5,0490" 198 | "13/10/2023";"5,0619" 199 | "16/10/2023";"5,0612" 200 | "17/10/2023";"5,0378" 201 | "18/10/2023";"5,0562" 202 | "19/10/2023";"5,0534" 203 | "20/10/2023";"5,0522" 204 | "23/10/2023";"5,0158" 205 | "24/10/2023";"5,0059" 206 | "25/10/2023";"4,9975" 207 | "26/10/2023";"5,0049" 208 | "27/10/2023";"4,9474" 209 | "30/10/2023";"5,0068" 210 | "31/10/2023";"5,0569" 211 | 
"01/11/2023";"5,0188" 212 | "03/11/2023";"4,8904" 213 | "06/11/2023";"4,8993" 214 | "07/11/2023";"4,8664" 215 | "08/11/2023";"4,8849" 216 | "09/11/2023";"4,9001" 217 | "10/11/2023";"4,9213" 218 | "13/11/2023";"4,9240" 219 | "14/11/2023";"4,8676" 220 | "16/11/2023";"4,8569" 221 | "17/11/2023";"4,8843" 222 | "20/11/2023";"4,8717" 223 | "21/11/2023";"4,8800" 224 | "22/11/2023";"4,8962" 225 | "23/11/2023";"4,8925" 226 | "24/11/2023";"4,8921" 227 | "27/11/2023";"4,8945" 228 | "28/11/2023";"4,8861" 229 | "29/11/2023";"4,8927" 230 | "30/11/2023";"4,9349" 231 | "01/12/2023";"4,9185" 232 | "04/12/2023";"4,9085" 233 | "05/12/2023";"4,9516" 234 | "06/12/2023";"4,9025" 235 | "07/12/2023";"4,8943" 236 | "08/12/2023";"4,9152" 237 | "11/12/2023";"4,9434" 238 | "12/12/2023";"4,9470" 239 | "13/12/2023";"4,9573" 240 | "14/12/2023";"4,8906" 241 | "15/12/2023";"4,9391" 242 | "18/12/2023";"4,9393" 243 | "19/12/2023";"4,8657" 244 | "20/12/2023";"4,8760" 245 | "21/12/2023";"4,8749" 246 | "22/12/2023";"4,8613" 247 | "26/12/2023";"4,8362" 248 | "27/12/2023";"4,8300" 249 | "28/12/2023";"4,8407" 250 | "29/12/2023";"4,8407" 251 | --------------------------------------------------------------------------------