├── FakeNewsClassifier TFIDF.ipynb ├── FakeNewsCount_vectorizer.ipynb ├── README.md └── fake-news ├── submit.csv └── test.csv /FakeNewsCount_vectorizer.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "markdown", 5 | "metadata": {}, 6 | "source": [ 7 | "### Fake News Classifier\n", 8 | "Dataset: https://www.kaggle.com/c/fake-news/data#" 9 | ] 10 | }, 11 | { 12 | "cell_type": "code", 13 | "execution_count": 111, 14 | "metadata": {}, 15 | "outputs": [], 16 | "source": [ 17 | "import pandas as pd" 18 | ] 19 | }, 20 | { 21 | "cell_type": "code", 22 | "execution_count": 112, 23 | "metadata": {}, 24 | "outputs": [], 25 | "source": [ 26 | "df=pd.read_csv('fake-news/train.csv')" 27 | ] 28 | }, 29 | { 30 | "cell_type": "code", 31 | "execution_count": 113, 32 | "metadata": {}, 33 | "outputs": [ 34 | { 35 | "data": { 36 | "text/html": [ 37 | "
\n", 55 | " | id | \n", 56 | "title | \n", 57 | "author | \n", 58 | "text | \n", 59 | "label | \n", 60 | "
---|---|---|---|---|---|
0 | \n", 65 | "0 | \n", 66 | "House Dem Aide: We Didn’t Even See Comey’s Let... | \n", 67 | "Darrell Lucus | \n", 68 | "House Dem Aide: We Didn’t Even See Comey’s Let... | \n", 69 | "1 | \n", 70 | "
1 | \n", 73 | "1 | \n", 74 | "FLYNN: Hillary Clinton, Big Woman on Campus - ... | \n", 75 | "Daniel J. Flynn | \n", 76 | "Ever get the feeling your life circles the rou... | \n", 77 | "0 | \n", 78 | "
2 | \n", 81 | "2 | \n", 82 | "Why the Truth Might Get You Fired | \n", 83 | "Consortiumnews.com | \n", 84 | "Why the Truth Might Get You Fired October 29, ... | \n", 85 | "1 | \n", 86 | "
3 | \n", 89 | "3 | \n", 90 | "15 Civilians Killed In Single US Airstrike Hav... | \n", 91 | "Jessica Purkiss | \n", 92 | "Videos 15 Civilians Killed In Single US Airstr... | \n", 93 | "1 | \n", 94 | "
4 | \n", 97 | "4 | \n", 98 | "Iranian woman jailed for fictional unpublished... | \n", 99 | "Howard Portnoy | \n", 100 | "Print \\nAn Iranian woman has been sentenced to... | \n", 101 | "1 | \n", 102 | "
\n", 169 | " | id | \n", 170 | "title | \n", 171 | "author | \n", 172 | "text | \n", 173 | "
---|---|---|---|---|
0 | \n", 178 | "0 | \n", 179 | "House Dem Aide: We Didn’t Even See Comey’s Let... | \n", 180 | "Darrell Lucus | \n", 181 | "House Dem Aide: We Didn’t Even See Comey’s Let... | \n", 182 | "
1 | \n", 185 | "1 | \n", 186 | "FLYNN: Hillary Clinton, Big Woman on Campus - ... | \n", 187 | "Daniel J. Flynn | \n", 188 | "Ever get the feeling your life circles the rou... | \n", 189 | "
2 | \n", 192 | "2 | \n", 193 | "Why the Truth Might Get You Fired | \n", 194 | "Consortiumnews.com | \n", 195 | "Why the Truth Might Get You Fired October 29, ... | \n", 196 | "
3 | \n", 199 | "3 | \n", 200 | "15 Civilians Killed In Single US Airstrike Hav... | \n", 201 | "Jessica Purkiss | \n", 202 | "Videos 15 Civilians Killed In Single US Airstr... | \n", 203 | "
4 | \n", 206 | "4 | \n", 207 | "Iranian woman jailed for fictional unpublished... | \n", 208 | "Howard Portnoy | \n", 209 | "Print \\nAn Iranian woman has been sentenced to... | \n", 210 | "
\n", 339 | " | id | \n", 340 | "title | \n", 341 | "author | \n", 342 | "text | \n", 343 | "label | \n", 344 | "
---|---|---|---|---|---|
0 | \n", 349 | "0 | \n", 350 | "House Dem Aide: We Didn’t Even See Comey’s Let... | \n", 351 | "Darrell Lucus | \n", 352 | "House Dem Aide: We Didn’t Even See Comey’s Let... | \n", 353 | "1 | \n", 354 | "
1 | \n", 357 | "1 | \n", 358 | "FLYNN: Hillary Clinton, Big Woman on Campus - ... | \n", 359 | "Daniel J. Flynn | \n", 360 | "Ever get the feeling your life circles the rou... | \n", 361 | "0 | \n", 362 | "
2 | \n", 365 | "2 | \n", 366 | "Why the Truth Might Get You Fired | \n", 367 | "Consortiumnews.com | \n", 368 | "Why the Truth Might Get You Fired October 29, ... | \n", 369 | "1 | \n", 370 | "
3 | \n", 373 | "3 | \n", 374 | "15 Civilians Killed In Single US Airstrike Hav... | \n", 375 | "Jessica Purkiss | \n", 376 | "Videos 15 Civilians Killed In Single US Airstr... | \n", 377 | "1 | \n", 378 | "
4 | \n", 381 | "4 | \n", 382 | "Iranian woman jailed for fictional unpublished... | \n", 383 | "Howard Portnoy | \n", 384 | "Print \\nAn Iranian woman has been sentenced to... | \n", 385 | "1 | \n", 386 | "
5 | \n", 389 | "5 | \n", 390 | "Jackie Mason: Hollywood Would Love Trump if He... | \n", 391 | "Daniel Nussbaum | \n", 392 | "In these trying times, Jackie Mason is the Voi... | \n", 393 | "0 | \n", 394 | "
7 | \n", 397 | "7 | \n", 398 | "Benoît Hamon Wins French Socialist Party’s Pre... | \n", 399 | "Alissa J. Rubin | \n", 400 | "PARIS — France chose an idealistic, traditi... | \n", 401 | "0 | \n", 402 | "
9 | \n", 405 | "9 | \n", 406 | "A Back-Channel Plan for Ukraine and Russia, Co... | \n", 407 | "Megan Twohey and Scott Shane | \n", 408 | "A week before Michael T. Flynn resigned as nat... | \n", 409 | "0 | \n", 410 | "
10 | \n", 413 | "10 | \n", 414 | "Obama’s Organizing for Action Partners with So... | \n", 415 | "Aaron Klein | \n", 416 | "Organizing for Action, the activist group that... | \n", 417 | "0 | \n", 418 | "
11 | \n", 421 | "11 | \n", 422 | "BBC Comedy Sketch \"Real Housewives of ISIS\" Ca... | \n", 423 | "Chris Tomlinson | \n", 424 | "The BBC produced spoof on the “Real Housewives... | \n", 425 | "0 | \n", 426 | "
\n", 522 | " | index | \n", 523 | "id | \n", 524 | "title | \n", 525 | "author | \n", 526 | "text | \n", 527 | "label | \n", 528 | "
---|---|---|---|---|---|---|
0 | \n", 533 | "0 | \n", 534 | "0 | \n", 535 | "House Dem Aide: We Didn’t Even See Comey’s Let... | \n", 536 | "Darrell Lucus | \n", 537 | "House Dem Aide: We Didn’t Even See Comey’s Let... | \n", 538 | "1 | \n", 539 | "
1 | \n", 542 | "1 | \n", 543 | "1 | \n", 544 | "FLYNN: Hillary Clinton, Big Woman on Campus - ... | \n", 545 | "Daniel J. Flynn | \n", 546 | "Ever get the feeling your life circles the rou... | \n", 547 | "0 | \n", 548 | "
2 | \n", 551 | "2 | \n", 552 | "2 | \n", 553 | "Why the Truth Might Get You Fired | \n", 554 | "Consortiumnews.com | \n", 555 | "Why the Truth Might Get You Fired October 29, ... | \n", 556 | "1 | \n", 557 | "
3 | \n", 560 | "3 | \n", 561 | "3 | \n", 562 | "15 Civilians Killed In Single US Airstrike Hav... | \n", 563 | "Jessica Purkiss | \n", 564 | "Videos 15 Civilians Killed In Single US Airstr... | \n", 565 | "1 | \n", 566 | "
4 | \n", 569 | "4 | \n", 570 | "4 | \n", 571 | "Iranian woman jailed for fictional unpublished... | \n", 572 | "Howard Portnoy | \n", 573 | "Print \\nAn Iranian woman has been sentenced to... | \n", 574 | "1 | \n", 575 | "
5 | \n", 578 | "5 | \n", 579 | "5 | \n", 580 | "Jackie Mason: Hollywood Would Love Trump if He... | \n", 581 | "Daniel Nussbaum | \n", 582 | "In these trying times, Jackie Mason is the Voi... | \n", 583 | "0 | \n", 584 | "
6 | \n", 587 | "7 | \n", 588 | "7 | \n", 589 | "Benoît Hamon Wins French Socialist Party’s Pre... | \n", 590 | "Alissa J. Rubin | \n", 591 | "PARIS — France chose an idealistic, traditi... | \n", 592 | "0 | \n", 593 | "
7 | \n", 596 | "9 | \n", 597 | "9 | \n", 598 | "A Back-Channel Plan for Ukraine and Russia, Co... | \n", 599 | "Megan Twohey and Scott Shane | \n", 600 | "A week before Michael T. Flynn resigned as nat... | \n", 601 | "0 | \n", 602 | "
8 | \n", 605 | "10 | \n", 606 | "10 | \n", 607 | "Obama’s Organizing for Action Partners with So... | \n", 608 | "Aaron Klein | \n", 609 | "Organizing for Action, the activist group that... | \n", 610 | "0 | \n", 611 | "
9 | \n", 614 | "11 | \n", 615 | "11 | \n", 616 | "BBC Comedy Sketch \"Real Housewives of ISIS\" Ca... | \n", 617 | "Chris Tomlinson | \n", 618 | "The BBC produced spoof on the “Real Housewives... | \n", 619 | "0 | \n", 620 | "
\n", 895 | " | abandon | \n", 896 | "abc | \n", 897 | "abc news | \n", 898 | "abduct | \n", 899 | "abe | \n", 900 | "abedin | \n", 901 | "abl | \n", 902 | "abort | \n", 903 | "abroad | \n", 904 | "absolut | \n", 905 | "... | \n", 906 | "zero | \n", 907 | "zika | \n", 908 | "zika viru | \n", 909 | "zionist | \n", 910 | "zone | \n", 911 | "zone new | \n", 912 | "zone new york | \n", 913 | "zoo | \n", 914 | "zu | \n", 915 | "zuckerberg | \n", 916 | "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", 921 | "0 | \n", 922 | "0 | \n", 923 | "0 | \n", 924 | "0 | \n", 925 | "0 | \n", 926 | "0 | \n", 927 | "0 | \n", 928 | "0 | \n", 929 | "0 | \n", 930 | "0 | \n", 931 | "... | \n", 932 | "0 | \n", 933 | "0 | \n", 934 | "0 | \n", 935 | "0 | \n", 936 | "0 | \n", 937 | "0 | \n", 938 | "0 | \n", 939 | "0 | \n", 940 | "0 | \n", 941 | "0 | \n", 942 | "
1 | \n", 945 | "0 | \n", 946 | "0 | \n", 947 | "0 | \n", 948 | "0 | \n", 949 | "0 | \n", 950 | "0 | \n", 951 | "0 | \n", 952 | "0 | \n", 953 | "0 | \n", 954 | "0 | \n", 955 | "... | \n", 956 | "0 | \n", 957 | "0 | \n", 958 | "0 | \n", 959 | "0 | \n", 960 | "0 | \n", 961 | "0 | \n", 962 | "0 | \n", 963 | "0 | \n", 964 | "0 | \n", 965 | "0 | \n", 966 | "
2 | \n", 969 | "0 | \n", 970 | "0 | \n", 971 | "0 | \n", 972 | "0 | \n", 973 | "0 | \n", 974 | "0 | \n", 975 | "0 | \n", 976 | "0 | \n", 977 | "0 | \n", 978 | "0 | \n", 979 | "... | \n", 980 | "0 | \n", 981 | "0 | \n", 982 | "0 | \n", 983 | "0 | \n", 984 | "0 | \n", 985 | "0 | \n", 986 | "0 | \n", 987 | "0 | \n", 988 | "0 | \n", 989 | "0 | \n", 990 | "
3 | \n", 993 | "0 | \n", 994 | "0 | \n", 995 | "0 | \n", 996 | "0 | \n", 997 | "0 | \n", 998 | "0 | \n", 999 | "0 | \n", 1000 | "0 | \n", 1001 | "0 | \n", 1002 | "0 | \n", 1003 | "... | \n", 1004 | "0 | \n", 1005 | "0 | \n", 1006 | "0 | \n", 1007 | "0 | \n", 1008 | "0 | \n", 1009 | "0 | \n", 1010 | "0 | \n", 1011 | "0 | \n", 1012 | "0 | \n", 1013 | "0 | \n", 1014 | "
4 | \n", 1017 | "0 | \n", 1018 | "0 | \n", 1019 | "0 | \n", 1020 | "0 | \n", 1021 | "0 | \n", 1022 | "0 | \n", 1023 | "0 | \n", 1024 | "0 | \n", 1025 | "0 | \n", 1026 | "1 | \n", 1027 | "... | \n", 1028 | "0 | \n", 1029 | "0 | \n", 1030 | "0 | \n", 1031 | "0 | \n", 1032 | "0 | \n", 1033 | "0 | \n", 1034 | "0 | \n", 1035 | "0 | \n", 1036 | "0 | \n", 1037 | "0 | \n", 1038 | "
5 rows × 5000 columns
\n", 1042 | "