From 0bedbfba4f2c4925a4b911832084d1d6a1ade7d1 Mon Sep 17 00:00:00 2001
From: SOUMYO NATH TRIPATHY
<85414445+SoumyoNathTripathy@users.noreply.github.com>
Date: Thu, 10 Feb 2022 13:14:03 +0530
Subject: [PATCH 1/2] Update README.md
---
README.md | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/README.md b/README.md
index 25281db..c3c9a98 100644
--- a/README.md
+++ b/README.md
@@ -2,7 +2,7 @@
This a website that will take the name of any company as an input and fetches all the news regarding that company using GoogleNews.
-It then does sentiment analysis of the news fetched and gives a proper sentiment score
+It then does Sentiment Analysis of the news fetched and gives a proper Sentiment score.
## The Flow
From eefcae0c5fad38668344be111d88d8f103cf35ec Mon Sep 17 00:00:00 2001
From: SOUMYO NATH TRIPATHY
<85414445+SoumyoNathTripathy@users.noreply.github.com>
Date: Sat, 19 Feb 2022 02:25:56 +0530
Subject: [PATCH 2/2] Add files via upload
---
FakeNewsClassifier TFIDF.ipynb | 2615 ++++++++++++++++++++++++++++++++
1 file changed, 2615 insertions(+)
create mode 100644 FakeNewsClassifier TFIDF.ipynb
diff --git a/FakeNewsClassifier TFIDF.ipynb b/FakeNewsClassifier TFIDF.ipynb
new file mode 100644
index 0000000..8996e98
--- /dev/null
+++ b/FakeNewsClassifier TFIDF.ipynb
@@ -0,0 +1,2615 @@
+{
+ "cells": [
+ {
+ "cell_type": "markdown",
+ "metadata": {},
+ "source": [
+ "### Fake News Classifier\n",
+ "Dataset: https://www.kaggle.com/c/fake-news/data#"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 1,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "import pandas as pd"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 2,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "df=pd.read_csv('fake-news/train.csv')"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 3,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "
\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " id \n",
+ " title \n",
+ " author \n",
+ " text \n",
+ " label \n",
+ " \n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 \n",
+ " 0 \n",
+ " House Dem Aide: We Didn’t Even See Comey’s Let... \n",
+ " Darrell Lucus \n",
+ " House Dem Aide: We Didn’t Even See Comey’s Let... \n",
+ " 1 \n",
+ " \n",
+ " \n",
+ " 1 \n",
+ " 1 \n",
+ " FLYNN: Hillary Clinton, Big Woman on Campus - ... \n",
+ " Daniel J. Flynn \n",
+ " Ever get the feeling your life circles the rou... \n",
+ " 0 \n",
+ " \n",
+ " \n",
+ " 2 \n",
+ " 2 \n",
+ " Why the Truth Might Get You Fired \n",
+ " Consortiumnews.com \n",
+ " Why the Truth Might Get You Fired October 29, ... \n",
+ " 1 \n",
+ " \n",
+ " \n",
+ " 3 \n",
+ " 3 \n",
+ " 15 Civilians Killed In Single US Airstrike Hav... \n",
+ " Jessica Purkiss \n",
+ " Videos 15 Civilians Killed In Single US Airstr... \n",
+ " 1 \n",
+ " \n",
+ " \n",
+ " 4 \n",
+ " 4 \n",
+ " Iranian woman jailed for fictional unpublished... \n",
+ " Howard Portnoy \n",
+ " Print \\nAn Iranian woman has been sentenced to... \n",
+ " 1 \n",
+ " \n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ " id title author \\\n",
+ "0 0 House Dem Aide: We Didn’t Even See Comey’s Let... Darrell Lucus \n",
+ "1 1 FLYNN: Hillary Clinton, Big Woman on Campus - ... Daniel J. Flynn \n",
+ "2 2 Why the Truth Might Get You Fired Consortiumnews.com \n",
+ "3 3 15 Civilians Killed In Single US Airstrike Hav... Jessica Purkiss \n",
+ "4 4 Iranian woman jailed for fictional unpublished... Howard Portnoy \n",
+ "\n",
+ " text label \n",
+ "0 House Dem Aide: We Didn’t Even See Comey’s Let... 1 \n",
+ "1 Ever get the feeling your life circles the rou... 0 \n",
+ "2 Why the Truth Might Get You Fired October 29, ... 1 \n",
+ "3 Videos 15 Civilians Killed In Single US Airstr... 1 \n",
+ "4 Print \\nAn Iranian woman has been sentenced to... 1 "
+ ]
+ },
+ "execution_count": 3,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "df.head()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 4,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "## Get the Independent Features\n",
+ "\n",
+ "X=df.drop('label',axis=1)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 5,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " id \n",
+ " title \n",
+ " author \n",
+ " text \n",
+ " \n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 \n",
+ " 0 \n",
+ " House Dem Aide: We Didn’t Even See Comey’s Let... \n",
+ " Darrell Lucus \n",
+ " House Dem Aide: We Didn’t Even See Comey’s Let... \n",
+ " \n",
+ " \n",
+ " 1 \n",
+ " 1 \n",
+ " FLYNN: Hillary Clinton, Big Woman on Campus - ... \n",
+ " Daniel J. Flynn \n",
+ " Ever get the feeling your life circles the rou... \n",
+ " \n",
+ " \n",
+ " 2 \n",
+ " 2 \n",
+ " Why the Truth Might Get You Fired \n",
+ " Consortiumnews.com \n",
+ " Why the Truth Might Get You Fired October 29, ... \n",
+ " \n",
+ " \n",
+ " 3 \n",
+ " 3 \n",
+ " 15 Civilians Killed In Single US Airstrike Hav... \n",
+ " Jessica Purkiss \n",
+ " Videos 15 Civilians Killed In Single US Airstr... \n",
+ " \n",
+ " \n",
+ " 4 \n",
+ " 4 \n",
+ " Iranian woman jailed for fictional unpublished... \n",
+ " Howard Portnoy \n",
+ " Print \\nAn Iranian woman has been sentenced to... \n",
+ " \n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ " id title author \\\n",
+ "0 0 House Dem Aide: We Didn’t Even See Comey’s Let... Darrell Lucus \n",
+ "1 1 FLYNN: Hillary Clinton, Big Woman on Campus - ... Daniel J. Flynn \n",
+ "2 2 Why the Truth Might Get You Fired Consortiumnews.com \n",
+ "3 3 15 Civilians Killed In Single US Airstrike Hav... Jessica Purkiss \n",
+ "4 4 Iranian woman jailed for fictional unpublished... Howard Portnoy \n",
+ "\n",
+ " text \n",
+ "0 House Dem Aide: We Didn’t Even See Comey’s Let... \n",
+ "1 Ever get the feeling your life circles the rou... \n",
+ "2 Why the Truth Might Get You Fired October 29, ... \n",
+ "3 Videos 15 Civilians Killed In Single US Airstr... \n",
+ "4 Print \\nAn Iranian woman has been sentenced to... "
+ ]
+ },
+ "execution_count": 5,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "X.head()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 6,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "## Get the Dependent features\n",
+ "y=df['label']"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 7,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "0 1\n",
+ "1 0\n",
+ "2 1\n",
+ "3 1\n",
+ "4 1\n",
+ "Name: label, dtype: int64"
+ ]
+ },
+ "execution_count": 7,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "y.head()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 10,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "(18285, 5)"
+ ]
+ },
+ "execution_count": 10,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "df.shape"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 9,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from sklearn.feature_extraction.text import CountVectorizer, TfidfVectorizer, HashingVectorizer"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 9,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "df=df.dropna()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 11,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " id \n",
+ " title \n",
+ " author \n",
+ " text \n",
+ " label \n",
+ " \n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 \n",
+ " 0 \n",
+ " House Dem Aide: We Didn’t Even See Comey’s Let... \n",
+ " Darrell Lucus \n",
+ " House Dem Aide: We Didn’t Even See Comey’s Let... \n",
+ " 1 \n",
+ " \n",
+ " \n",
+ " 1 \n",
+ " 1 \n",
+ " FLYNN: Hillary Clinton, Big Woman on Campus - ... \n",
+ " Daniel J. Flynn \n",
+ " Ever get the feeling your life circles the rou... \n",
+ " 0 \n",
+ " \n",
+ " \n",
+ " 2 \n",
+ " 2 \n",
+ " Why the Truth Might Get You Fired \n",
+ " Consortiumnews.com \n",
+ " Why the Truth Might Get You Fired October 29, ... \n",
+ " 1 \n",
+ " \n",
+ " \n",
+ " 3 \n",
+ " 3 \n",
+ " 15 Civilians Killed In Single US Airstrike Hav... \n",
+ " Jessica Purkiss \n",
+ " Videos 15 Civilians Killed In Single US Airstr... \n",
+ " 1 \n",
+ " \n",
+ " \n",
+ " 4 \n",
+ " 4 \n",
+ " Iranian woman jailed for fictional unpublished... \n",
+ " Howard Portnoy \n",
+ " Print \\nAn Iranian woman has been sentenced to... \n",
+ " 1 \n",
+ " \n",
+ " \n",
+ " 5 \n",
+ " 5 \n",
+ " Jackie Mason: Hollywood Would Love Trump if He... \n",
+ " Daniel Nussbaum \n",
+ " In these trying times, Jackie Mason is the Voi... \n",
+ " 0 \n",
+ " \n",
+ " \n",
+ " 7 \n",
+ " 7 \n",
+ " Benoît Hamon Wins French Socialist Party’s Pre... \n",
+ " Alissa J. Rubin \n",
+ " PARIS — France chose an idealistic, traditi... \n",
+ " 0 \n",
+ " \n",
+ " \n",
+ " 9 \n",
+ " 9 \n",
+ " A Back-Channel Plan for Ukraine and Russia, Co... \n",
+ " Megan Twohey and Scott Shane \n",
+ " A week before Michael T. Flynn resigned as nat... \n",
+ " 0 \n",
+ " \n",
+ " \n",
+ " 10 \n",
+ " 10 \n",
+ " Obama’s Organizing for Action Partners with So... \n",
+ " Aaron Klein \n",
+ " Organizing for Action, the activist group that... \n",
+ " 0 \n",
+ " \n",
+ " \n",
+ " 11 \n",
+ " 11 \n",
+ " BBC Comedy Sketch \"Real Housewives of ISIS\" Ca... \n",
+ " Chris Tomlinson \n",
+ " The BBC produced spoof on the “Real Housewives... \n",
+ " 0 \n",
+ " \n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ " id title \\\n",
+ "0 0 House Dem Aide: We Didn’t Even See Comey’s Let... \n",
+ "1 1 FLYNN: Hillary Clinton, Big Woman on Campus - ... \n",
+ "2 2 Why the Truth Might Get You Fired \n",
+ "3 3 15 Civilians Killed In Single US Airstrike Hav... \n",
+ "4 4 Iranian woman jailed for fictional unpublished... \n",
+ "5 5 Jackie Mason: Hollywood Would Love Trump if He... \n",
+ "7 7 Benoît Hamon Wins French Socialist Party’s Pre... \n",
+ "9 9 A Back-Channel Plan for Ukraine and Russia, Co... \n",
+ "10 10 Obama’s Organizing for Action Partners with So... \n",
+ "11 11 BBC Comedy Sketch \"Real Housewives of ISIS\" Ca... \n",
+ "\n",
+ " author \\\n",
+ "0 Darrell Lucus \n",
+ "1 Daniel J. Flynn \n",
+ "2 Consortiumnews.com \n",
+ "3 Jessica Purkiss \n",
+ "4 Howard Portnoy \n",
+ "5 Daniel Nussbaum \n",
+ "7 Alissa J. Rubin \n",
+ "9 Megan Twohey and Scott Shane \n",
+ "10 Aaron Klein \n",
+ "11 Chris Tomlinson \n",
+ "\n",
+ " text label \n",
+ "0 House Dem Aide: We Didn’t Even See Comey’s Let... 1 \n",
+ "1 Ever get the feeling your life circles the rou... 0 \n",
+ "2 Why the Truth Might Get You Fired October 29, ... 1 \n",
+ "3 Videos 15 Civilians Killed In Single US Airstr... 1 \n",
+ "4 Print \\nAn Iranian woman has been sentenced to... 1 \n",
+ "5 In these trying times, Jackie Mason is the Voi... 0 \n",
+ "7 PARIS — France chose an idealistic, traditi... 0 \n",
+ "9 A week before Michael T. Flynn resigned as nat... 0 \n",
+ "10 Organizing for Action, the activist group that... 0 \n",
+ "11 The BBC produced spoof on the “Real Housewives... 0 "
+ ]
+ },
+ "execution_count": 11,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "df.head(10)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 12,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "messages=df.copy()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 13,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "messages.reset_index(inplace=True)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 14,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " index \n",
+ " id \n",
+ " title \n",
+ " author \n",
+ " text \n",
+ " label \n",
+ " \n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 \n",
+ " 0 \n",
+ " 0 \n",
+ " House Dem Aide: We Didn’t Even See Comey’s Let... \n",
+ " Darrell Lucus \n",
+ " House Dem Aide: We Didn’t Even See Comey’s Let... \n",
+ " 1 \n",
+ " \n",
+ " \n",
+ " 1 \n",
+ " 1 \n",
+ " 1 \n",
+ " FLYNN: Hillary Clinton, Big Woman on Campus - ... \n",
+ " Daniel J. Flynn \n",
+ " Ever get the feeling your life circles the rou... \n",
+ " 0 \n",
+ " \n",
+ " \n",
+ " 2 \n",
+ " 2 \n",
+ " 2 \n",
+ " Why the Truth Might Get You Fired \n",
+ " Consortiumnews.com \n",
+ " Why the Truth Might Get You Fired October 29, ... \n",
+ " 1 \n",
+ " \n",
+ " \n",
+ " 3 \n",
+ " 3 \n",
+ " 3 \n",
+ " 15 Civilians Killed In Single US Airstrike Hav... \n",
+ " Jessica Purkiss \n",
+ " Videos 15 Civilians Killed In Single US Airstr... \n",
+ " 1 \n",
+ " \n",
+ " \n",
+ " 4 \n",
+ " 4 \n",
+ " 4 \n",
+ " Iranian woman jailed for fictional unpublished... \n",
+ " Howard Portnoy \n",
+ " Print \\nAn Iranian woman has been sentenced to... \n",
+ " 1 \n",
+ " \n",
+ " \n",
+ " 5 \n",
+ " 5 \n",
+ " 5 \n",
+ " Jackie Mason: Hollywood Would Love Trump if He... \n",
+ " Daniel Nussbaum \n",
+ " In these trying times, Jackie Mason is the Voi... \n",
+ " 0 \n",
+ " \n",
+ " \n",
+ " 6 \n",
+ " 7 \n",
+ " 7 \n",
+ " Benoît Hamon Wins French Socialist Party’s Pre... \n",
+ " Alissa J. Rubin \n",
+ " PARIS — France chose an idealistic, traditi... \n",
+ " 0 \n",
+ " \n",
+ " \n",
+ " 7 \n",
+ " 9 \n",
+ " 9 \n",
+ " A Back-Channel Plan for Ukraine and Russia, Co... \n",
+ " Megan Twohey and Scott Shane \n",
+ " A week before Michael T. Flynn resigned as nat... \n",
+ " 0 \n",
+ " \n",
+ " \n",
+ " 8 \n",
+ " 10 \n",
+ " 10 \n",
+ " Obama’s Organizing for Action Partners with So... \n",
+ " Aaron Klein \n",
+ " Organizing for Action, the activist group that... \n",
+ " 0 \n",
+ " \n",
+ " \n",
+ " 9 \n",
+ " 11 \n",
+ " 11 \n",
+ " BBC Comedy Sketch \"Real Housewives of ISIS\" Ca... \n",
+ " Chris Tomlinson \n",
+ " The BBC produced spoof on the “Real Housewives... \n",
+ " 0 \n",
+ " \n",
+ " \n",
+ "
\n",
+ "
"
+ ],
+ "text/plain": [
+ " index id title \\\n",
+ "0 0 0 House Dem Aide: We Didn’t Even See Comey’s Let... \n",
+ "1 1 1 FLYNN: Hillary Clinton, Big Woman on Campus - ... \n",
+ "2 2 2 Why the Truth Might Get You Fired \n",
+ "3 3 3 15 Civilians Killed In Single US Airstrike Hav... \n",
+ "4 4 4 Iranian woman jailed for fictional unpublished... \n",
+ "5 5 5 Jackie Mason: Hollywood Would Love Trump if He... \n",
+ "6 7 7 Benoît Hamon Wins French Socialist Party’s Pre... \n",
+ "7 9 9 A Back-Channel Plan for Ukraine and Russia, Co... \n",
+ "8 10 10 Obama’s Organizing for Action Partners with So... \n",
+ "9 11 11 BBC Comedy Sketch \"Real Housewives of ISIS\" Ca... \n",
+ "\n",
+ " author \\\n",
+ "0 Darrell Lucus \n",
+ "1 Daniel J. Flynn \n",
+ "2 Consortiumnews.com \n",
+ "3 Jessica Purkiss \n",
+ "4 Howard Portnoy \n",
+ "5 Daniel Nussbaum \n",
+ "6 Alissa J. Rubin \n",
+ "7 Megan Twohey and Scott Shane \n",
+ "8 Aaron Klein \n",
+ "9 Chris Tomlinson \n",
+ "\n",
+ " text label \n",
+ "0 House Dem Aide: We Didn’t Even See Comey’s Let... 1 \n",
+ "1 Ever get the feeling your life circles the rou... 0 \n",
+ "2 Why the Truth Might Get You Fired October 29, ... 1 \n",
+ "3 Videos 15 Civilians Killed In Single US Airstr... 1 \n",
+ "4 Print \\nAn Iranian woman has been sentenced to... 1 \n",
+ "5 In these trying times, Jackie Mason is the Voi... 0 \n",
+ "6 PARIS — France chose an idealistic, traditi... 0 \n",
+ "7 A week before Michael T. Flynn resigned as nat... 0 \n",
+ "8 Organizing for Action, the activist group that... 0 \n",
+ "9 The BBC produced spoof on the “Real Housewives... 0 "
+ ]
+ },
+ "execution_count": 14,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "messages.head(10)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 15,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "'PARIS — France chose an idealistic, traditional candidate in Sunday’s primary to represent the Socialist and parties in the presidential election this spring. The candidate, Benoît Hamon, 49, who ran on the slogan that he would “make France’s heart beat,” bested Manuel Valls, the former prime minister, whose campaign has promoted more policies and who has a strong background. Mr. Hamon appeared to have won by a wide margin, with incomplete returns showing him with an estimated 58 percent of the vote to Mr. Valls’s 41 percent. “Tonight the left holds its head up high again it is looking to the future,” Mr. Hamon said, addressing his supporters. “Our country needs the left, but a modern, innovative left,” he said. Mr. Hamon’s victory was the clearest sign yet that voters on the left want a break with the policies of President François Hollande, who in December announced that he would not seek . However, Mr. Hamon’s strong showing is unlikely to change widespread assessments that candidates have little chance of making it into the second round of voting in the general election. The first round of the general election is set for April 23 and the runoff for May 7. The Socialist Party is deeply divided, and one measure of its lack of popular enthusiasm was the relatively low number of people voting. About two million people voted in the second round of the primary on Sunday, in contrast with about 2. 9 million in the second round of the last presidential primary on the left, in 2011. However, much of the conventional wisdom over how the elections will go has been thrown into question over the past week, because the leading candidate, François Fillon, who represents the main party, the Republicans, was accused of paying his wife large sums of money to work as his parliamentary aide. While nepotism is legal in the French political system, it is not clear that she actually did any work. Prosecutors who specialize in financial malfeasance are reviewing the case. 
France’s electoral system allows multiple candidates to run for president in the first round of voting, but only the top two go on to a second round. Mr. Hamon is entering a race that is already crowded on the left, with candidates who include Mélenchon on the far left, and Emmanuel Macron, an independent who served as economy minister in Mr. Hollande’s government and who embraces more policies. Unless he decides to withdraw, Mr. Fillon, the mainstream right candidate, will also run, as will the extreme right candidate Marine Le Pen. The two have been expected to go to the runoff. Mr. Hamon’s victory can be attributed at least in part to his image as an idealist and traditional leftist candidate who appeals to union voters as well as more environmentally concerned and socially liberal young people. Unlike Mr. Valls, he also clearly distanced himself from some of Mr. Hollande’s more unpopular policies, especially the economic ones. Thomas Kekenbosch, 22, a student and one of the leaders of the group the Youth With Benoît Hamon, said Mr. Hamon embodied a new hope for those on the left. “We have a perspective we have something to do, to build,” Mr. Kekenbosch said. Mr. Hollande had disappointed many young people because under him the party abandoned ideals, such as support for workers, that many voters believe in, according to Mr. Kekenbosch. Mr. Hollande’s government, under pressure from the European Union to meet budget restraints, struggled to pass labor code reforms to make the market more attractive to foreign investors and also to encourage French businesses to expand in France. The measures ultimately passed after weeks of strikes, but they were watered down and generated little concrete progress in improving France’s roughly 10 percent unemployment rate and its nearly 25 percent youth joblessness rate. Mr. 
Hamon strongly endorses a stimulus approach to improving the economy and has promised to phase in a universal income, which would especially help young people looking for work, but would also supplement the livelihood of French workers. The end goal would be to have everyone receive 750 euros per month (about $840). “We have someone that trusts us,” Mr. Kekenbosch said, “who says: ‘I give you enough to pay for your studies. You can have a scholarship which spares you from working at McDonald’s on provisional contracts for 4 years. ” Mr. Hamon advocates phasing out diesel fuel and encouraging drivers to replace vehicles that use petroleum products with electrical ones. His leftist pedigree began early. His father worked at an arsenal in Brest, a city in the far west of Brittany, and his mother worked off and on as a secretary. He was an early member of the Movement of Young Socialists, and he has continued to work closely with them through his political life. He also worked for Martine Aubry, now the mayor of Lille and a former Socialist Party leader.'"
+ ]
+ },
+ "execution_count": 15,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "messages['text'][6]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from nltk.corpus import stopwords\n",
+ "from nltk.stem.porter import PorterStemmer\n",
+ "import re\n",
+ "ps = PorterStemmer()\n",
+ "# Build the stop-word set once: calling stopwords.words('english') per token rebuilds the list every time.\n",
+ "english_stopwords = set(stopwords.words('english'))\n",
+ "corpus = []\n",
+ "# One cleaned, stemmed, space-joined string per article body.\n",
+ "for i in range(0, len(messages)):\n",
+ "    review = re.sub('[^a-zA-Z]', ' ', messages['text'][i]).lower().split()\n",
+ "    # Drop stop words, then stem whatever is left.\n",
+ "    review = [ps.stem(word) for word in review if word not in english_stopwords]\n",
+ "    corpus.append(' '.join(review))"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 24,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "'civilian kill singl us airstrik identifi'"
+ ]
+ },
+ "execution_count": 24,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "corpus[3]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {},
+ "outputs": [],
+ "source": []
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 17,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "## TFidf Vectorizer\n",
+ "from sklearn.feature_extraction.text import TfidfVectorizer\n",
+ "tfidf_v=TfidfVectorizer(max_features=5000,ngram_range=(1,3))\n",
+ "X=tfidf_v.fit_transform(corpus).toarray()\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 18,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "(18285, 5000)"
+ ]
+ },
+ "execution_count": 18,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "X.shape"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 19,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "y=messages['label']"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 20,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "## Divide the dataset into Train and Test\n",
+ "from sklearn.model_selection import train_test_split\n",
+ "X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.33, random_state=0)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 21,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "['abandon',\n",
+ " 'abc',\n",
+ " 'abc news',\n",
+ " 'abduct',\n",
+ " 'abe',\n",
+ " 'abedin',\n",
+ " 'abl',\n",
+ " 'abort',\n",
+ " 'abroad',\n",
+ " 'absolut',\n",
+ " 'abstain',\n",
+ " 'absurd',\n",
+ " 'abus',\n",
+ " 'abus new',\n",
+ " 'abus new york',\n",
+ " 'academi',\n",
+ " 'accept',\n",
+ " 'access',\n",
+ " 'access pipelin',\n",
+ " 'access pipelin protest']"
+ ]
+ },
+ "execution_count": 21,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "tfidf_v.get_feature_names()[:20]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 22,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "{'analyzer': 'word',\n",
+ " 'binary': False,\n",
+ " 'decode_error': 'strict',\n",
+ " 'dtype': numpy.int64,\n",
+ " 'encoding': 'utf-8',\n",
+ " 'input': 'content',\n",
+ " 'lowercase': True,\n",
+ " 'max_df': 1.0,\n",
+ " 'max_features': 5000,\n",
+ " 'min_df': 1,\n",
+ " 'ngram_range': (1, 3),\n",
+ " 'norm': 'l2',\n",
+ " 'preprocessor': None,\n",
+ " 'smooth_idf': True,\n",
+ " 'stop_words': None,\n",
+ " 'strip_accents': None,\n",
+ " 'sublinear_tf': False,\n",
+ " 'token_pattern': '(?u)\\\\b\\\\w\\\\w+\\\\b',\n",
+ " 'tokenizer': None,\n",
+ " 'use_idf': True,\n",
+ " 'vocabulary': None}"
+ ]
+ },
+ "execution_count": 22,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "tfidf_v.get_params()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 23,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "count_df = pd.DataFrame(X_train, columns=tfidf_v.get_feature_names())"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 27,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/html": [
+ "\n",
+ "\n",
+ "
\n",
+ " \n",
+ " \n",
+ " \n",
+ " abandon \n",
+ " abc \n",
+ " abc news \n",
+ " abduct \n",
+ " abe \n",
+ " abedin \n",
+ " abl \n",
+ " abort \n",
+ " abroad \n",
+ " absolut \n",
+ " ... \n",
+ " zero \n",
+ " zika \n",
+ " zika viru \n",
+ " zionist \n",
+ " zone \n",
+ " zone new \n",
+ " zone new york \n",
+ " zoo \n",
+ " zu \n",
+ " zuckerberg \n",
+ " \n",
+ " \n",
+ " \n",
+ " \n",
+ " 0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.000000 \n",
+ " ... \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " \n",
+ " \n",
+ " 1 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.000000 \n",
+ " ... \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " \n",
+ " \n",
+ " 2 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.000000 \n",
+ " ... \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " \n",
+ " \n",
+ " 3 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.000000 \n",
+ " ... \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " \n",
+ " \n",
+ " 4 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.305244 \n",
+ " ... \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " 0.0 \n",
+ " \n",
+ " \n",
+ "
\n",
+ "
5 rows × 5000 columns
\n",
+ "
"
+ ],
+ "text/plain": [
+ " abandon abc abc news abduct abe abedin abl abort abroad absolut \\\n",
+ "0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.000000 \n",
+ "1 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.000000 \n",
+ "2 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.000000 \n",
+ "3 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.000000 \n",
+ "4 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.305244 \n",
+ "\n",
+ " ... zero zika zika viru zionist zone zone new zone new york \\\n",
+ "0 ... 0.0 0.0 0.0 0.0 0.0 0.0 0.0 \n",
+ "1 ... 0.0 0.0 0.0 0.0 0.0 0.0 0.0 \n",
+ "2 ... 0.0 0.0 0.0 0.0 0.0 0.0 0.0 \n",
+ "3 ... 0.0 0.0 0.0 0.0 0.0 0.0 0.0 \n",
+ "4 ... 0.0 0.0 0.0 0.0 0.0 0.0 0.0 \n",
+ "\n",
+ " zoo zu zuckerberg \n",
+ "0 0.0 0.0 0.0 \n",
+ "1 0.0 0.0 0.0 \n",
+ "2 0.0 0.0 0.0 \n",
+ "3 0.0 0.0 0.0 \n",
+ "4 0.0 0.0 0.0 \n",
+ "\n",
+ "[5 rows x 5000 columns]"
+ ]
+ },
+ "execution_count": 27,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "count_df.head()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 28,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "import matplotlib.pyplot as plt"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 29,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "def plot_confusion_matrix(cm, classes,\n",
+ "                          normalize=False,\n",
+ "                          title='Confusion matrix',\n",
+ "                          cmap=plt.cm.Blues):\n",
+ "    \"\"\"\n",
+ "    Print a status line and plot the confusion matrix `cm` as a heatmap.\n",
+ "    Adapted from http://scikit-learn.org/stable/auto_examples/model_selection/plot_confusion_matrix.html\n",
+ "\n",
+ "    `classes` are the tick labels, given in the row/column order of `cm`.\n",
+ "    With `normalize=True` each row is divided by its sum before plotting.\n",
+ "    \"\"\"\n",
+ "    # Normalize before imshow so the colours and the cell text show the same values.\n",
+ "    if normalize:\n",
+ "        cm = cm.astype('float') / cm.sum(axis=1)[:, np.newaxis]\n",
+ "        print(\"Normalized confusion matrix\")\n",
+ "    else:\n",
+ "        print('Confusion matrix, without normalization')\n",
+ "\n",
+ "    plt.imshow(cm, interpolation='nearest', cmap=cmap)\n",
+ "    plt.title(title)\n",
+ "    plt.colorbar()\n",
+ "    tick_marks = np.arange(len(classes))\n",
+ "    plt.xticks(tick_marks, classes, rotation=45)\n",
+ "    plt.yticks(tick_marks, classes)\n",
+ "\n",
+ "    thresh = cm.max() / 2.\n",
+ "    for i, j in itertools.product(range(cm.shape[0]), range(cm.shape[1])):\n",
+ "        cell = format(cm[i, j], '.2f') if normalize else cm[i, j]  # short ratios, raw counts otherwise\n",
+ "        plt.text(j, i, cell, horizontalalignment=\"center\",\n",
+ "                 color=\"white\" if cm[i, j] > thresh else \"black\")  # white text on dark cells\n",
+ "    plt.tight_layout()\n",
+ "    plt.ylabel('True label')\n",
+ "    plt.xlabel('Predicted label')"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {},
+ "source": [
+ "### MultinomialNB Algorithm"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 30,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "\n",
+ "from sklearn.naive_bayes import MultinomialNB\n",
+ "classifier=MultinomialNB()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 31,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from sklearn import metrics\n",
+ "import numpy as np\n",
+ "import itertools"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 32,
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "accuracy: 0.881\n",
+ "Confusion matrix, without normalization\n"
+ ]
+ },
+ {
+ "data": {
+ "image/png": "\n",
+ "text/plain": [
+ ""
+ ]
+ },
+ "metadata": {
+ "needs_background": "light"
+ },
+ "output_type": "display_data"
+ }
+ ],
+ "source": [
+ "# Kaggle labels: 0 = reliable (REAL), 1 = unreliable (FAKE); confusion_matrix orders rows/columns 0, then 1.\n",
+ "classifier.fit(X_train, y_train)\n",
+ "pred = classifier.predict(X_test)\n",
+ "score = metrics.accuracy_score(y_test, pred)\n",
+ "print(\"accuracy: %0.3f\" % score)\n",
+ "cm = metrics.confusion_matrix(y_test, pred)\n",
+ "plot_confusion_matrix(cm, classes=['REAL', 'FAKE'])"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 33,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "0.8810273405136703"
+ ]
+ },
+ "execution_count": 33,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "classifier.fit(X_train, y_train)\n",
+ "pred = classifier.predict(X_test)\n",
+ "score = metrics.accuracy_score(y_test, pred)\n",
+ "score"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 34,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "(12250,)"
+ ]
+ },
+ "execution_count": 34,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "y_train.shape"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {},
+ "source": [
+ "### Passive Aggressive Classifier Algorithm"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 35,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "from sklearn.linear_model import PassiveAggressiveClassifier\n",
+ "linear_clf = PassiveAggressiveClassifier(max_iter=50, tol=None, random_state=0)  # n_iter was removed in scikit-learn 0.21; tol=None keeps all 50 epochs, the seed makes runs repeatable"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 36,
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "c:\\users\\krish.naik\\appdata\\local\\continuum\\anaconda3\\envs\\nlp\\lib\\site-packages\\sklearn\\linear_model\\stochastic_gradient.py:117: DeprecationWarning: n_iter parameter is deprecated in 0.19 and will be removed in 0.21. Use max_iter and tol instead.\n",
+ " DeprecationWarning)\n"
+ ]
+ },
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "accuracy: 0.918\n",
+ "Confusion matrix, without normalization\n"
+ ]
+ },
+ {
+ "data": {
+ "image/png": "\n",
+ "text/plain": [
+ ""
+ ]
+ },
+ "metadata": {
+ "needs_background": "light"
+ },
+ "output_type": "display_data"
+ }
+ ],
+ "source": [
+ "linear_clf.fit(X_train, y_train)\n",
+ "pred = linear_clf.predict(X_test)\n",
+ "score = metrics.accuracy_score(y_test, pred)\n",
+ "print(\"accuracy: %0.3f\" % score)\n",
+ "cm = metrics.confusion_matrix(y_test, pred)\n",
+ "plot_confusion_matrix(cm, classes=['FAKE Data', 'REAL Data'])"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {},
+ "source": [
+ "### Multinomial Naive Bayes Classifier with Hyperparameter Tuning"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 37,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "classifier=MultinomialNB(alpha=0.1)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 38,
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "c:\\users\\krish.naik\\appdata\\local\\continuum\\anaconda3\\envs\\nlp\\lib\\site-packages\\sklearn\\naive_bayes.py:472: UserWarning: alpha too small will result in numeric errors, setting alpha = 1.0e-10\n",
+ " 'setting alpha = %.1e' % _ALPHA_MIN)\n"
+ ]
+ },
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "Alpha: 0.0, Score : 0.8662800331400166\n",
+ "Alpha: 0.1, Score : 0.8777133388566695\n",
+ "Alpha: 0.2, Score : 0.8801988400994201\n",
+ "Alpha: 0.30000000000000004, Score : 0.87986743993372\n",
+ "Alpha: 0.4, Score : 0.8808616404308203\n",
+ "Alpha: 0.5, Score : 0.8806959403479702\n",
+ "Alpha: 0.6000000000000001, Score : 0.8815244407622204\n",
+ "Alpha: 0.7000000000000001, Score : 0.8813587406793704\n",
+ "Alpha: 0.8, Score : 0.8816901408450705\n",
+ "Alpha: 0.9, Score : 0.8816901408450705\n"
+ ]
+ }
+ ],
+ "source": [
+ "# Sweep alpha over 0.0, 0.1, ..., 0.9 and keep the best-scoring model in `classifier`.\n",
+ "# alpha=0.0 is part of the sweep; scikit-learn warns and clips it to 1e-10.\n",
+ "# NOTE(review): the model is selected on the test split, so the reported\n",
+ "# accuracy is optimistic; consider a separate validation split.\n",
+ "previous_score=0\n",
+ "for alpha in np.arange(0,1,0.1):\n",
+ "    sub_classifier=MultinomialNB(alpha=alpha)\n",
+ "    sub_classifier.fit(X_train,y_train)\n",
+ "    y_pred=sub_classifier.predict(X_test)\n",
+ "    score = metrics.accuracy_score(y_test, y_pred)\n",
+ "    if score>previous_score:\n",
+ "        classifier=sub_classifier\n",
+ "        # Track the best score so far. Without this update the comparison is\n",
+ "        # always against 0 and `classifier` ends up as the last model fitted.\n",
+ "        previous_score=score\n",
+ "    print(\"Alpha: {}, Score : {}\".format(alpha,score))"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 106,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "## Get Features names\n",
+ "# get_feature_names() was deprecated in scikit-learn 1.0 and removed in 1.2.\n",
+ "# Use get_feature_names_out() when the vectorizer has it, and fall back otherwise.\n",
+ "# .tolist() keeps `feature_names` a plain list of str, as before.\n",
+ "if hasattr(cv, \"get_feature_names_out\"):\n",
+ "    feature_names = cv.get_feature_names_out().tolist()\n",
+ "else:\n",
+ "    feature_names = cv.get_feature_names()"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 109,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "array([ -9.10038883, -8.62276128, -9.10038883, ..., -10.79498456,\n",
+ " -8.91467169, -9.32864749])"
+ ]
+ },
+ "execution_count": 109,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "# Per-feature log-probabilities for class label 1. For a two-class MultinomialNB\n",
+ "# this is the array `coef_[0]` used to return; `coef_` was deprecated in\n",
+ "# scikit-learn 0.24 and later removed, while `feature_log_prob_` exists in all versions.\n",
+ "classifier.feature_log_prob_[1]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 107,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "[(-4.000149156604985, 'trump'),\n",
+ " (-4.287872694443541, 'hillari'),\n",
+ " (-4.396389621061519, 'clinton'),\n",
+ " (-4.899969726208735, 'elect'),\n",
+ " (-5.176598600897756, 'new'),\n",
+ " (-5.234730366348767, 'comment'),\n",
+ " (-5.273968180973631, 'video'),\n",
+ " (-5.3868167681180115, 'war'),\n",
+ " (-5.396821854078974, 'us'),\n",
+ " (-5.412019714988405, 'hillari clinton'),\n",
+ " (-5.417137433425386, 'fbi'),\n",
+ " (-5.48068448454208, 'vote'),\n",
+ " (-5.566255475855405, 'email'),\n",
+ " (-5.578238842742501, 'world'),\n",
+ " (-5.634015380199913, 'obama'),\n",
+ " (-5.734501455772904, 'donald'),\n",
+ " (-5.763095255139644, 'donald trump'),\n",
+ " (-5.785090276725191, 'russia'),\n",
+ " (-5.846224665218559, 'day'),\n",
+ " (-5.862110622807369, 'america')]"
+ ]
+ },
+ "execution_count": 107,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "### Most real\n",
+ "# The 20 features with the highest log-probability under class label 1.\n",
+ "# `feature_log_prob_[1]` equals the former `coef_[0]` for a two-class MultinomialNB;\n",
+ "# `coef_` is no longer available on naive Bayes models in newer scikit-learn.\n",
+ "# NOTE(review): \"Most real\" assumes label 1 means real; confirm against the\n",
+ "# dataset's label definition.\n",
+ "sorted(zip(classifier.feature_log_prob_[1], feature_names), reverse=True)[:20]"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 135,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "[(-10.794984555596727, 'abe'),\n",
+ " (-10.794984555596727, 'abroad'),\n",
+ " (-10.794984555596727, 'abus new'),\n",
+ " (-10.794984555596727, 'abus new york'),\n",
+ " (-10.794984555596727, 'act new'),\n",
+ " (-10.794984555596727, 'act new york'),\n",
+ " (-10.794984555596727, 'advic'),\n",
+ " (-10.794984555596727, 'advis new'),\n",
+ " (-10.794984555596727, 'advis new york'),\n",
+ " (-10.794984555596727, 'age new'),\n",
+ " (-10.794984555596727, 'age new york'),\n",
+ " (-10.794984555596727, 'agenda breitbart'),\n",
+ " (-10.794984555596727, 'ail'),\n",
+ " (-10.794984555596727, 'aleppo new'),\n",
+ " (-10.794984555596727, 'aleppo new york'),\n",
+ " (-10.794984555596727, 'ali'),\n",
+ " (-10.794984555596727, 'america breitbart'),\n",
+ " (-10.794984555596727, 'america new york'),\n",
+ " (-10.794984555596727, 'american breitbart'),\n",
+ " (-10.794984555596727, 'american new'),\n",
+ " (-10.794984555596727, 'american new york'),\n",
+ " (-10.794984555596727, 'ami'),\n",
+ " (-10.794984555596727, 'ami schumer'),\n",
+ " (-10.794984555596727, 'amp'),\n",
+ " (-10.794984555596727, 'ann'),\n",
+ " (-10.794984555596727, 'ann coulter'),\n",
+ " (-10.794984555596727, 'applaud'),\n",
+ " (-10.794984555596727, 'arson'),\n",
+ " (-10.794984555596727, 'asian'),\n",
+ " (-10.794984555596727, 'assail'),\n",
+ " (-10.794984555596727, 'athlet'),\n",
+ " (-10.794984555596727, 'attack breitbart'),\n",
+ " (-10.794984555596727, 'attack new'),\n",
+ " (-10.794984555596727, 'attack new york'),\n",
+ " (-10.794984555596727, 'attack syria'),\n",
+ " (-10.794984555596727, 'attend'),\n",
+ " (-10.794984555596727, 'avert'),\n",
+ " (-10.794984555596727, 'away new'),\n",
+ " (-10.794984555596727, 'away new york'),\n",
+ " (-10.794984555596727, 'back new'),\n",
+ " (-10.794984555596727, 'back new york'),\n",
+ " (-10.794984555596727, 'baltimor'),\n",
+ " (-10.794984555596727, 'ban breitbart'),\n",
+ " (-10.794984555596727, 'ban new'),\n",
+ " (-10.794984555596727, 'ban new york'),\n",
+ " (-10.794984555596727, 'bangladesh'),\n",
+ " (-10.794984555596727, 'barron trump'),\n",
+ " (-10.794984555596727, 'basic'),\n",
+ " (-10.794984555596727, 'basketbal'),\n",
+ " (-10.794984555596727, 'basketbal player'),\n",
+ " (-10.794984555596727, 'baton'),\n",
+ " (-10.794984555596727, 'baton roug'),\n",
+ " (-10.794984555596727, 'battl new'),\n",
+ " (-10.794984555596727, 'battl new york'),\n",
+ " (-10.794984555596727, 'bay'),\n",
+ " (-10.794984555596727, 'beach new'),\n",
+ " (-10.794984555596727, 'beach new york'),\n",
+ " (-10.794984555596727, 'begin new'),\n",
+ " (-10.794984555596727, 'behead photo'),\n",
+ " (-10.794984555596727, 'behind trump'),\n",
+ " (-10.794984555596727, 'berkeley breitbart'),\n",
+ " (-10.794984555596727, 'betsi'),\n",
+ " (-10.794984555596727, 'betsi devo'),\n",
+ " (-10.794984555596727, 'bill breitbart'),\n",
+ " (-10.794984555596727, 'bill new'),\n",
+ " (-10.794984555596727, 'bill new york'),\n",
+ " (-10.794984555596727, 'bill reilli'),\n",
+ " (-10.794984555596727, 'billi'),\n",
+ " (-10.794984555596727, 'blue state'),\n",
+ " (-10.794984555596727, 'blue state blue'),\n",
+ " (-10.794984555596727, 'bolster'),\n",
+ " (-10.794984555596727, 'border patrol'),\n",
+ " (-10.794984555596727, 'border patrol agent'),\n",
+ " (-10.794984555596727, 'border state'),\n",
+ " (-10.794984555596727, 'border wall'),\n",
+ " (-10.794984555596727, 'border wall breitbart'),\n",
+ " (-10.794984555596727, 'bowl'),\n",
+ " (-10.794984555596727, 'box offic'),\n",
+ " (-10.794984555596727, 'bradi'),\n",
+ " (-10.794984555596727, 'breath'),\n",
+ " (-10.794984555596727, 'breitbart news daili'),\n",
+ " (-10.794984555596727, 'brief new'),\n",
+ " (-10.794984555596727, 'brief new york'),\n",
+ " (-10.794984555596727, 'broadway'),\n",
+ " (-10.794984555596727, 'bronx'),\n",
+ " (-10.794984555596727, 'brooklyn'),\n",
+ " (-10.794984555596727, 'brooklyn new'),\n",
+ " (-10.794984555596727, 'brooklyn new york'),\n",
+ " (-10.794984555596727, 'bureaucrat'),\n",
+ " (-10.794984555596727, 'caitlyn'),\n",
+ " (-10.794984555596727, 'caitlyn jenner'),\n",
+ " (-10.794984555596727, 'cal'),\n",
+ " (-10.794984555596727, 'california today'),\n",
+ " (-10.794984555596727, 'calm'),\n",
+ " (-10.794984555596727, 'campaign breitbart'),\n",
+ " (-10.794984555596727, 'campaign new'),\n",
+ " (-10.794984555596727, 'campaign new york'),\n",
+ " (-10.794984555596727, 'campu breitbart'),\n",
+ " (-10.794984555596727, 'cann'),\n",
+ " (-10.794984555596727, 'car new'),\n",
+ " (-10.794984555596727, 'car new york'),\n",
+ " (-10.794984555596727, 'care act'),\n",
+ " (-10.794984555596727, 'care act new'),\n",
+ " (-10.794984555596727, 'care bill'),\n",
+ " (-10.794984555596727, 'care breitbart'),\n",
+ " (-10.794984555596727, 'carri fisher'),\n",
+ " (-10.794984555596727, 'carson'),\n",
+ " (-10.794984555596727, 'case new'),\n",
+ " (-10.794984555596727, 'case new york'),\n",
+ " (-10.794984555596727, 'castro'),\n",
+ " (-10.794984555596727, 'caucu'),\n",
+ " (-10.794984555596727, 'ceas'),\n",
+ " (-10.794984555596727, 'ceas fire'),\n",
+ " (-10.794984555596727, 'chamber'),\n",
+ " (-10.794984555596727, 'championship'),\n",
+ " (-10.794984555596727, 'championship new'),\n",
+ " (-10.794984555596727, 'championship new york'),\n",
+ " (-10.794984555596727, 'chang new'),\n",
+ " (-10.794984555596727, 'chang new york'),\n",
+ " (-10.794984555596727, 'charg new york'),\n",
+ " (-10.794984555596727, 'charleston'),\n",
+ " (-10.794984555596727, 'charlott'),\n",
+ " (-10.794984555596727, 'cher'),\n",
+ " (-10.794984555596727, 'chief new'),\n",
+ " (-10.794984555596727, 'chief new york'),\n",
+ " (-10.794984555596727, 'china new york'),\n",
+ " (-10.794984555596727, 'chri christi'),\n",
+ " (-10.794984555596727, 'christi'),\n",
+ " (-10.794984555596727, 'christoph'),\n",
+ " (-10.794984555596727, 'chuck'),\n",
+ " (-10.794984555596727, 'chuck todd'),\n",
+ " (-10.794984555596727, 'circuit'),\n",
+ " (-10.794984555596727, 'citi new'),\n",
+ " (-10.794984555596727, 'citi new york'),\n",
+ " (-10.794984555596727, 'citizenship'),\n",
+ " (-10.794984555596727, 'clinton new york'),\n",
+ " (-10.794984555596727, 'clue'),\n",
+ " (-10.794984555596727, 'coach'),\n",
+ " (-10.794984555596727, 'colleg new'),\n",
+ " (-10.794984555596727, 'colleg new york'),\n",
+ " (-10.794984555596727, 'collid'),\n",
+ " (-10.794984555596727, 'collin'),\n",
+ " (-10.794984555596727, 'comedi'),\n",
+ " (-10.794984555596727, 'comedi central'),\n",
+ " (-10.794984555596727, 'comey fire'),\n",
+ " (-10.794984555596727, 'commission'),\n",
+ " (-10.794984555596727, 'common core'),\n",
+ " (-10.794984555596727, 'common ground'),\n",
+ " (-10.794984555596727, 'compet'),\n",
+ " (-10.794984555596727, 'complex'),\n",
+ " (-10.794984555596727, 'conceal'),\n",
+ " (-10.794984555596727, 'confirm hear'),\n",
+ " (-10.794984555596727, 'congress breitbart'),\n",
+ " (-10.794984555596727, 'congress new york'),\n",
+ " (-10.794984555596727, 'control new'),\n",
+ " (-10.794984555596727, 'control new york'),\n",
+ " (-10.794984555596727, 'convent new'),\n",
+ " (-10.794984555596727, 'convent new york'),\n",
+ " (-10.794984555596727, 'corner'),\n",
+ " (-10.794984555596727, 'coulter'),\n",
+ " (-10.794984555596727, 'counsel'),\n",
+ " (-10.794984555596727, 'countri breitbart'),\n",
+ " (-10.794984555596727, 'cours'),\n",
+ " (-10.794984555596727, 'court block'),\n",
+ " (-10.794984555596727, 'court new'),\n",
+ " (-10.794984555596727, 'court new york'),\n",
+ " (-10.794984555596727, 'court rule new'),\n",
+ " (-10.794984555596727, 'cpac'),\n",
+ " (-10.794984555596727, 'crash new'),\n",
+ " (-10.794984555596727, 'crash new york'),\n",
+ " (-10.794984555596727, 'crime breitbart'),\n",
+ " (-10.794984555596727, 'crisi new'),\n",
+ " (-10.794984555596727, 'crisi new york'),\n",
+ " (-10.794984555596727, 'critic new'),\n",
+ " (-10.794984555596727, 'crown'),\n",
+ " (-10.794984555596727, 'cunningham'),\n",
+ " (-10.794984555596727, 'curb'),\n",
+ " (-10.794984555596727, 'davo'),\n",
+ " (-10.794984555596727, 'day breitbart'),\n",
+ " (-10.794984555596727, 'day new york'),\n",
+ " (-10.794984555596727, 'day parad'),\n",
+ " (-10.794984555596727, 'dead new'),\n",
+ " (-10.794984555596727, 'dead new york'),\n",
+ " (-10.794984555596727, 'deal breitbart'),\n",
+ " (-10.794984555596727, 'deal new'),\n",
+ " (-10.794984555596727, 'deal new york'),\n",
+ " (-10.794984555596727, 'death new'),\n",
+ " (-10.794984555596727, 'death new york'),\n",
+ " (-10.794984555596727, 'debat new'),\n",
+ " (-10.794984555596727, 'debat new york'),\n",
+ " (-10.794984555596727, 'debbi reynold'),\n",
+ " (-10.794984555596727, 'defi'),\n",
+ " (-10.794984555596727, 'defund'),\n",
+ " (-10.794984555596727, 'delingpol'),\n",
+ " (-10.794984555596727, 'dem rep'),\n",
+ " (-10.794984555596727, 'dem sen'),\n",
+ " (-10.794984555596727, 'democrat breitbart'),\n",
+ " (-10.794984555596727, 'democrat new'),\n",
+ " (-10.794984555596727, 'democrat new york'),\n",
+ " (-10.794984555596727, 'deport breitbart'),\n",
+ " (-10.794984555596727, 'despair'),\n",
+ " (-10.794984555596727, 'devo'),\n",
+ " (-10.794984555596727, 'dh'),\n",
+ " (-10.794984555596727, 'die new'),\n",
+ " (-10.794984555596727, 'die new york'),\n",
+ " (-10.794984555596727, 'diego'),\n",
+ " (-10.794984555596727, 'disappoint'),\n",
+ " (-10.794984555596727, 'divorc'),\n",
+ " (-10.794984555596727, 'donald trump breitbart'),\n",
+ " (-10.794984555596727, 'donald trump campaign'),\n",
+ " (-10.794984555596727, 'donald trump inaugur'),\n",
+ " (-10.794984555596727, 'dossier'),\n",
+ " (-10.794984555596727, 'drama'),\n",
+ " (-10.794984555596727, 'drive car'),\n",
+ " (-10.794984555596727, 'drug new'),\n",
+ " (-10.794984555596727, 'drug new york'),\n",
+ " (-10.794984555596727, 'dunham'),\n",
+ " (-10.794984555596727, 'dylann'),\n",
+ " (-10.794984555596727, 'dylann roof'),\n",
+ " (-10.794984555596727, 'eas'),\n",
+ " (-10.794984555596727, 'easter'),\n",
+ " (-10.794984555596727, 'economi new'),\n",
+ " (-10.794984555596727, 'ecuador'),\n",
+ " (-10.794984555596727, 'effort new york'),\n",
+ " (-10.794984555596727, 'egyptair'),\n",
+ " (-10.794984555596727, 'elect breitbart'),\n",
+ " (-10.794984555596727, 'elect loss'),\n",
+ " (-10.794984555596727, 'elect new york'),\n",
+ " (-10.794984555596727, 'els new'),\n",
+ " (-10.794984555596727, 'els new york'),\n",
+ " (-10.794984555596727, 'embassi jerusalem'),\n",
+ " (-10.794984555596727, 'emmi'),\n",
+ " (-10.794984555596727, 'end new'),\n",
+ " (-10.794984555596727, 'end new york'),\n",
+ " (-10.794984555596727, 'england'),\n",
+ " (-10.794984555596727, 'england patriot'),\n",
+ " (-10.794984555596727, 'epa'),\n",
+ " (-10.794984555596727, 'era new'),\n",
+ " (-10.794984555596727, 'era new york'),\n",
+ " (-10.794984555596727, 'espn'),\n",
+ " (-10.794984555596727, 'europ new york'),\n",
+ " (-10.794984555596727, 'european union'),\n",
+ " (-10.794984555596727, 'even brief'),\n",
+ " (-10.794984555596727, 'even brief new'),\n",
+ " (-10.794984555596727, 'event breitbart'),\n",
+ " (-10.794984555596727, 'execut order breitbart'),\n",
+ " (-10.794984555596727, 'expand'),\n",
+ " (-10.794984555596727, 'explain new'),\n",
+ " (-10.794984555596727, 'explain new york'),\n",
+ " (-10.794984555596727, 'extradit'),\n",
+ " (-10.794984555596727, 'face new'),\n",
+ " (-10.794984555596727, 'faction'),\n",
+ " (-10.794984555596727, 'fake news breitbart'),\n",
+ " (-10.794984555596727, 'fake news new'),\n",
+ " (-10.794984555596727, 'falluja'),\n",
+ " (-10.794984555596727, 'familiar'),\n",
+ " (-10.794984555596727, 'farewel'),\n",
+ " (-10.794984555596727, 'fargo'),\n",
+ " (-10.794984555596727, 'fatal shoot'),\n",
+ " (-10.794984555596727, 'fear new york'),\n",
+ " (-10.794984555596727, 'fear trump'),\n",
+ " (-10.794984555596727, 'feinstein'),\n",
+ " (-10.794984555596727, 'fidel'),\n",
+ " (-10.794984555596727, 'fidel castro'),\n",
+ " (-10.794984555596727, 'fieri'),\n",
+ " (-10.794984555596727, 'fight new'),\n",
+ " (-10.794984555596727, 'fight new york'),\n",
+ " (-10.794984555596727, 'fight trump'),\n",
+ " (-10.794984555596727, 'filibust'),\n",
+ " (-10.794984555596727, 'fillon'),\n",
+ " (-10.794984555596727, 'find new york'),\n",
+ " (-10.794984555596727, 'fire breitbart'),\n",
+ " (-10.794984555596727, 'fire new york'),\n",
+ " (-10.794984555596727, 'fisher'),\n",
+ " (-10.794984555596727, 'fitton'),\n",
+ " (-10.794984555596727, 'flight new'),\n",
+ " (-10.794984555596727, 'flight new york'),\n",
+ " (-10.794984555596727, 'fmr'),\n",
+ " (-10.794984555596727, 'fort'),\n",
+ " (-10.794984555596727, 'found new'),\n",
+ " (-10.794984555596727, 'found new york'),\n",
+ " (-10.794984555596727, 'fran oi'),\n",
+ " (-10.794984555596727, 'fran oi fillon'),\n",
+ " (-10.794984555596727, 'franc new'),\n",
+ " (-10.794984555596727, 'franc new york'),\n",
+ " (-10.794984555596727, 'freedom caucu'),\n",
+ " (-10.794984555596727, 'french presidenti'),\n",
+ " (-10.794984555596727, 'friday even'),\n",
+ " (-10.794984555596727, 'friday even brief'),\n",
+ " (-10.794984555596727, 'fs'),\n",
+ " (-10.794984555596727, 'futur new'),\n",
+ " (-10.794984555596727, 'futur new york'),\n",
+ " (-10.794984555596727, 'gaffney'),\n",
+ " (-10.794984555596727, 'game breitbart'),\n",
+ " (-10.794984555596727, 'game new'),\n",
+ " (-10.794984555596727, 'game new york'),\n",
+ " (-10.794984555596727, 'gawker'),\n",
+ " (-10.794984555596727, 'gener new'),\n",
+ " (-10.794984555596727, 'gener new york'),\n",
+ " (-10.794984555596727, 'georg michael'),\n",
+ " (-10.794984555596727, 'get back'),\n",
+ " (-10.794984555596727, 'get new'),\n",
+ " (-10.794984555596727, 'go new york'),\n",
+ " (-10.794984555596727, 'golden globe'),\n",
+ " (-10.794984555596727, 'golden state'),\n",
+ " (-10.794984555596727, 'golden state warrior'),\n",
+ " (-10.794984555596727, 'goodel'),\n",
+ " (-10.794984555596727, 'gop rep'),\n",
+ " (-10.794984555596727, 'gop sen'),\n",
+ " (-10.794984555596727, 'gorka'),\n",
+ " (-10.794984555596727, 'gorsuch'),\n",
+ " (-10.794984555596727, 'gorsuch breitbart'),\n",
+ " (-10.794984555596727, 'gorsuch confirm'),\n",
+ " (-10.794984555596727, 'govern new york'),\n",
+ " (-10.794984555596727, 'grammi'),\n",
+ " (-10.794984555596727, 'gray'),\n",
+ " (-10.794984555596727, 'griffin'),\n",
+ " (-10.794984555596727, 'grow new'),\n",
+ " (-10.794984555596727, 'grow new york'),\n",
+ " (-10.794984555596727, 'guant'),\n",
+ " (-10.794984555596727, 'guant namo'),\n",
+ " (-10.794984555596727, 'gulf'),\n",
+ " (-10.794984555596727, 'gymnast'),\n",
+ " (-10.794984555596727, 'hack new'),\n",
+ " (-10.794984555596727, 'hack new york'),\n",
+ " (-10.794984555596727, 'hbo'),\n",
+ " (-10.794984555596727, 'health bill'),\n",
+ " (-10.794984555596727, 'health care bill'),\n",
+ " (-10.794984555596727, 'health insur'),\n",
+ " (-10.794984555596727, 'health law'),\n",
+ " (-10.794984555596727, 'healthcar bill'),\n",
+ " (-10.794984555596727, 'hear new'),\n",
+ " (-10.794984555596727, 'hear new york'),\n",
+ " (-10.794984555596727, 'heart new'),\n",
+ " (-10.794984555596727, 'heart new york'),\n",
+ " (-10.794984555596727, 'high school'),\n",
+ " (-10.794984555596727, 'histori new'),\n",
+ " (-10.794984555596727, 'histori new york'),\n",
+ " (-10.794984555596727, 'hockey'),\n",
+ " (-10.794984555596727, 'holiday'),\n",
+ " (-10.794984555596727, 'home new'),\n",
+ " (-10.794984555596727, 'home new york'),\n",
+ " (-10.794984555596727, 'hometown'),\n",
+ " (-10.794984555596727, 'horribl'),\n",
+ " (-10.794984555596727, 'hous breitbart'),\n",
+ " (-10.794984555596727, 'hous new york'),\n",
+ " (-10.794984555596727, 'hungari'),\n",
+ " (-10.794984555596727, 'hurrican matthew'),\n",
+ " (-10.794984555596727, 'imam'),\n",
+ " (-10.794984555596727, 'immigr order'),\n",
+ " (-10.794984555596727, 'inaugur speech'),\n",
+ " (-10.794984555596727, 'inquiri new'),\n",
+ " (-10.794984555596727, 'inquiri new york'),\n",
+ " (-10.794984555596727, 'intend'),\n",
+ " (-10.794984555596727, 'interest rate'),\n",
+ " (-10.794984555596727, 'investig breitbart'),\n",
+ " (-10.794984555596727, 'investig new york'),\n",
+ " (-10.794984555596727, 'investig trump'),\n",
+ " (-10.794984555596727, 'isi new'),\n",
+ " (-10.794984555596727, 'isi new york'),\n",
+ " (-10.794984555596727, 'islam state support'),\n",
+ " (-10.794984555596727, 'isol'),\n",
+ " (-10.794984555596727, 'issu new'),\n",
+ " (-10.794984555596727, 'issu new york'),\n",
+ " (-10.794984555596727, 'jacki'),\n",
+ " (-10.794984555596727, 'jake'),\n",
+ " (-10.794984555596727, 'jane'),\n",
+ " (-10.794984555596727, 'jare kushner'),\n",
+ " (-10.794984555596727, 'jerri'),\n",
+ " (-10.794984555596727, 'jerri brown'),\n",
+ " (-10.794984555596727, 'jo'),\n",
+ " (-10.794984555596727, 'job breitbart'),\n",
+ " (-10.794984555596727, 'job new'),\n",
+ " (-10.794984555596727, 'job new york'),\n",
+ " (-10.794984555596727, 'jong'),\n",
+ " (-10.794984555596727, 'jong nam'),\n",
+ " (-10.794984555596727, 'jong un'),\n",
+ " (-10.794984555596727, 'journey'),\n",
+ " (-10.794984555596727, 'jr'),\n",
+ " (-10.794984555596727, 'judici'),\n",
+ " (-10.794984555596727, 'justin'),\n",
+ " (-10.794984555596727, 'kabul'),\n",
+ " (-10.794984555596727, 'kathi'),\n",
+ " (-10.794984555596727, 'kathi griffin'),\n",
+ " (-10.794984555596727, 'kati'),\n",
+ " (-10.794984555596727, 'kellogg'),\n",
+ " (-10.794984555596727, 'kevin'),\n",
+ " (-10.794984555596727, 'kill new'),\n",
+ " (-10.794984555596727, 'kill new york'),\n",
+ " (-10.794984555596727, 'kim jong'),\n",
+ " (-10.794984555596727, 'kim jong nam'),\n",
+ " (-10.794984555596727, 'kim jong un'),\n",
+ " (-10.794984555596727, 'know know'),\n",
+ " (-10.794984555596727, 'know new york'),\n",
+ " (-10.794984555596727, 'korea new'),\n",
+ " (-10.794984555596727, 'korea new york'),\n",
+ " (-10.794984555596727, 'krauthamm'),\n",
+ " (-10.794984555596727, 'kushner'),\n",
+ " (-10.794984555596727, 'la la'),\n",
+ " (-10.794984555596727, 'la la land'),\n",
+ " (-10.794984555596727, 'la land'),\n",
+ " (-10.794984555596727, 'labour'),\n",
+ " (-10.794984555596727, 'lago'),\n",
+ " (-10.794984555596727, 'latin'),\n",
+ " (-10.794984555596727, 'lauderdal'),\n",
+ " (-10.794984555596727, 'law breitbart'),\n",
+ " (-10.794984555596727, 'law new'),\n",
+ " (-10.794984555596727, 'law new york'),\n",
+ " (-10.794984555596727, 'lawyer say'),\n",
+ " (-10.794984555596727, 'le pen'),\n",
+ " (-10.794984555596727, 'leader new'),\n",
+ " (-10.794984555596727, 'leader new york'),\n",
+ " (-10.794984555596727, 'leaker'),\n",
+ " (-10.794984555596727, 'legitim'),\n",
+ " (-10.794984555596727, 'lena'),\n",
+ " (-10.794984555596727, 'lena dunham'),\n",
+ " (-10.794984555596727, 'levin'),\n",
+ " (-10.794984555596727, 'lewi'),\n",
+ " (-10.794984555596727, 'life new'),\n",
+ " (-10.794984555596727, 'life new york'),\n",
+ " (-10.794984555596727, 'linda'),\n",
+ " (-10.794984555596727, 'linda sarsour'),\n",
+ " (-10.794984555596727, 'line new'),\n",
+ " (-10.794984555596727, 'line new york'),\n",
+ " (-10.794984555596727, 'listen new'),\n",
+ " (-10.794984555596727, 'listen new york'),\n",
+ " (-10.794984555596727, 'lite'),\n",
+ " (-10.794984555596727, 'live new'),\n",
+ " (-10.794984555596727, 'live new york'),\n",
+ " (-10.794984555596727, 'lo angel'),\n",
+ " (-10.794984555596727, 'locht'),\n",
+ " (-10.794984555596727, 'london attack'),\n",
+ " (-10.794984555596727, 'long island'),\n",
+ " (-10.794984555596727, 'loss new'),\n",
+ " (-10.794984555596727, 'loss new york'),\n",
+ " (-10.794984555596727, 'louvr'),\n",
+ " (-10.794984555596727, 'machin new'),\n",
+ " (-10.794984555596727, 'machin new york'),\n",
+ " (-10.794984555596727, 'macron'),\n",
+ " (-10.794984555596727, 'madonna'),\n",
+ " (-10.794984555596727, 'maker'),\n",
+ " (-10.794984555596727, 'malaysia'),\n",
+ " (-10.794984555596727, 'mall'),\n",
+ " (-10.794984555596727, 'man new'),\n",
+ " (-10.794984555596727, 'man new york'),\n",
+ " (-10.794984555596727, 'manchin'),\n",
+ " (-10.794984555596727, 'manuel'),\n",
+ " (-10.794984555596727, 'mar'),\n",
+ " (-10.794984555596727, 'mar lago'),\n",
+ " (-10.794984555596727, 'marcher'),\n",
+ " (-10.794984555596727, 'marin le'),\n",
+ " (-10.794984555596727, 'marin le pen'),\n",
+ " (-10.794984555596727, 'market new'),\n",
+ " (-10.794984555596727, 'market new york'),\n",
+ " (-10.794984555596727, 'marlow'),\n",
+ " (-10.794984555596727, 'match'),\n",
+ " (-10.794984555596727, 'maxin'),\n",
+ " (-10.794984555596727, 'maxin water'),\n",
+ " (-10.794984555596727, 'mcconnel'),\n",
+ " (-10.794984555596727, 'media breitbart'),\n",
+ " (-10.794984555596727, 'media new'),\n",
+ " (-10.794984555596727, 'media new york'),\n",
+ " (-10.794984555596727, 'medicaid'),\n",
+ " (-10.794984555596727, 'meet new'),\n",
+ " (-10.794984555596727, 'memori day'),\n",
+ " (-10.794984555596727, 'merger'),\n",
+ " (-10.794984555596727, 'meryl'),\n",
+ " (-10.794984555596727, 'meryl streep'),\n",
+ " (-10.794984555596727, 'mexican border'),\n",
+ " (-10.794984555596727, 'mexican cartel'),\n",
+ " (-10.794984555596727, 'michael phelp'),\n",
+ " (-10.794984555596727, 'militari new'),\n",
+ " (-10.794984555596727, 'militari new york'),\n",
+ " (-10.794984555596727, 'million new york'),\n",
+ " (-10.794984555596727, 'milo breitbart'),\n",
+ " (-10.794984555596727, 'milo event'),\n",
+ " (-10.794984555596727, 'miss new'),\n",
+ " (-10.794984555596727, 'miss new york'),\n",
+ " (-10.794984555596727, 'mnuchin'),\n",
+ " (-10.794984555596727, 'model new'),\n",
+ " (-10.794984555596727, 'model new york'),\n",
+ " (-10.794984555596727, 'modi'),\n",
+ " (-10.794984555596727, 'monday brief'),\n",
+ " (-10.794984555596727, 'monday brief new'),\n",
+ " (-10.794984555596727, 'monday even'),\n",
+ " (-10.794984555596727, 'monday even brief'),\n",
+ " (-10.794984555596727, 'money new'),\n",
+ " (-10.794984555596727, 'money new york'),\n",
+ " (-10.794984555596727, 'month new'),\n",
+ " (-10.794984555596727, 'month new york'),\n",
+ " (-10.794984555596727, 'monument'),\n",
+ " (-10.794984555596727, 'moonlight'),\n",
+ " (-10.794984555596727, 'morn brief'),\n",
+ " (-10.794984555596727, 'morn brief new'),\n",
+ " (-10.794984555596727, 'muhammad ali'),\n",
+ " (-10.794984555596727, 'multipl'),\n",
+ " (-10.794984555596727, 'mulvaney'),\n",
+ " (-10.794984555596727, 'myanmar'),\n",
+ " (-10.794984555596727, 'nam'),\n",
+ " (-10.794984555596727, 'name new'),\n",
+ " (-10.794984555596727, 'namo'),\n",
+ " (-10.794984555596727, 'nanci'),\n",
+ " (-10.794984555596727, 'nanci pelosi'),\n",
+ " (-10.794984555596727, 'narendra'),\n",
+ " (-10.794984555596727, 'narendra modi'),\n",
+ " (-10.794984555596727, 'nat'),\n",
+ " (-10.794984555596727, 'nation new'),\n",
+ " (-10.794984555596727, 'nation new york'),\n",
+ " (-10.794984555596727, 'nation secur advis'),\n",
+ " (-10.794984555596727, 'navi seal'),\n",
+ " (-10.794984555596727, 'near texa'),\n",
+ " (-10.794984555596727, 'near texa border'),\n",
+ " (-10.794984555596727, 'neil gorsuch'),\n",
+ " (-10.794984555596727, 'netflix'),\n",
+ " (-10.794984555596727, 'new england'),\n",
+ " (-10.794984555596727, 'new england patriot'),\n",
+ " (-10.794984555596727, 'new year eve'),\n",
+ " (-10.794984555596727, 'new york new'),\n",
+ " (-10.794984555596727, 'new york state'),\n",
+ " (-10.794984555596727, 'news breitbart'),\n",
+ " (-10.794984555596727, 'news cnn'),\n",
+ " (-10.794984555596727, 'news daili'),\n",
+ " (-10.794984555596727, 'news new'),\n",
+ " (-10.794984555596727, 'news new york'),\n",
+ " (-10.794984555596727, 'night new'),\n",
+ " (-10.794984555596727, 'night new york'),\n",
+ " (-10.794984555596727, 'nobel prize'),\n",
+ " (-10.794984555596727, 'nomin'),\n",
+ " (-10.794984555596727, 'nuclear option'),\n",
+ " (-10.794984555596727, 'nune'),\n",
+ " (-10.794984555596727, 'obama breitbart'),\n",
+ " (-10.794984555596727, 'obama era'),\n",
+ " (-10.794984555596727, 'obamacar breitbart'),\n",
+ " (-10.794984555596727, 'obamacar lite'),\n",
+ " (-10.794984555596727, 'obamacar repeal'),\n",
+ " (-10.794984555596727, 'obamacar replac'),\n",
+ " (-10.794984555596727, 'odd'),\n",
+ " (-10.794984555596727, 'offic new'),\n",
+ " (-10.794984555596727, 'offic new york'),\n",
+ " (-10.794984555596727, 'offici say'),\n",
+ " (-10.794984555596727, 'offici say new'),\n",
+ " (-10.794984555596727, 'often'),\n",
+ " (-10.794984555596727, 'oi'),\n",
+ " (-10.794984555596727, 'oi fillon'),\n",
+ " (-10.794984555596727, 'oliv'),\n",
+ " (-10.794984555596727, 'olymp new'),\n",
+ " (-10.794984555596727, 'olymp new york'),\n",
+ " (-10.794984555596727, 'one new'),\n",
+ " (-10.794984555596727, 'one new york'),\n",
+ " (-10.794984555596727, 'op'),\n",
+ " (-10.794984555596727, 'open door'),\n",
+ " (-10.794984555596727, 'open new york'),\n",
+ " (-10.794984555596727, 'oper new'),\n",
+ " (-10.794984555596727, 'oppos trump'),\n",
+ " (-10.794984555596727, 'order breitbart'),\n",
+ " (-10.794984555596727, 'order new'),\n",
+ " (-10.794984555596727, 'order new york'),\n",
+ " (-10.794984555596727, 'orlando shoot'),\n",
+ " (-10.794984555596727, 'orlean'),\n",
+ " (-10.794984555596727, 'orovil'),\n",
+ " (-10.794984555596727, 'outcri'),\n",
+ " (-10.794984555596727, 'outlet'),\n",
+ " (-10.794984555596727, 'overhaul'),\n",
+ " (-10.794984555596727, 'pari agreement'),\n",
+ " (-10.794984555596727, 'parti new'),\n",
+ " (-10.794984555596727, 'parti new york'),\n",
+ " (-10.794984555596727, 'passport'),\n",
+ " (-10.794984555596727, 'past new'),\n",
+ " (-10.794984555596727, 'past new york'),\n",
+ " (-10.794984555596727, 'path new york'),\n",
+ " (-10.794984555596727, 'patrol agent'),\n",
+ " (-10.794984555596727, 'paul ryan obamacar'),\n",
+ " (-10.794984555596727, 'pelosi'),\n",
+ " (-10.794984555596727, 'penguin'),\n",
+ " (-10.794984555596727, 'peopl breitbart'),\n",
+ " (-10.794984555596727, 'perez'),\n",
+ " (-10.794984555596727, 'persist'),\n",
+ " (-10.794984555596727, 'person new york'),\n",
+ " (-10.794984555596727, 'phelp'),\n",
+ " (-10.794984555596727, 'pioneer'),\n",
+ " (-10.794984555596727, 'plan new'),\n",
+ " (-10.794984555596727, 'plan new york'),\n",
+ " (-10.794984555596727, 'plane crash'),\n",
+ " (-10.794984555596727, 'playoff'),\n",
+ " (-10.794984555596727, 'poland'),\n",
+ " (-10.794984555596727, 'polic new'),\n",
+ " (-10.794984555596727, 'polic new york'),\n",
+ " (-10.794984555596727, 'polic say'),\n",
+ " (-10.794984555596727, 'polic say new'),\n",
+ " (-10.794984555596727, 'polic shoot'),\n",
+ " (-10.794984555596727, 'polici breitbart'),\n",
+ " (-10.794984555596727, 'polici new'),\n",
+ " (-10.794984555596727, 'polici new york'),\n",
+ " (-10.794984555596727, 'polit new'),\n",
+ " (-10.794984555596727, 'polit new york'),\n",
+ " (-10.794984555596727, 'politico'),\n",
+ " (-10.794984555596727, 'post new'),\n",
+ " (-10.794984555596727, 'post new york'),\n",
+ " (-10.794984555596727, 'pound'),\n",
+ " (-10.794984555596727, 'power new york'),\n",
+ " (-10.794984555596727, 'pregnanc'),\n",
+ " (-10.794984555596727, 'pregnant'),\n",
+ " (-10.794984555596727, 'presid breitbart'),\n",
+ " (-10.794984555596727, 'presid new'),\n",
+ " (-10.794984555596727, 'presid new york'),\n",
+ " (-10.794984555596727, 'presid trump breitbart'),\n",
+ " (-10.794984555596727, 'presidenti debat'),\n",
+ " (-10.794984555596727, 'press breitbart'),\n",
+ " (-10.794984555596727, 'preview'),\n",
+ " (-10.794984555596727, 'price new'),\n",
+ " (-10.794984555596727, 'price new york'),\n",
+ " (-10.794984555596727, 'priebu'),\n",
+ " (-10.794984555596727, 'prison new'),\n",
+ " (-10.794984555596727, 'prison new york'),\n",
+ " (-10.794984555596727, 'problem new'),\n",
+ " (-10.794984555596727, 'problem new york'),\n",
+ " (-10.794984555596727, 'profession'),\n",
+ " (-10.794984555596727, 'prompt'),\n",
+ " (-10.794984555596727, 'protest breitbart'),\n",
+ " (-10.794984555596727, 'protest new'),\n",
+ " (-10.794984555596727, 'proud'),\n",
+ " (-10.794984555596727, 'pruitt'),\n",
+ " (-10.794984555596727, 'publish'),\n",
+ " (-10.794984555596727, 'puerto'),\n",
+ " (-10.794984555596727, 'quebec'),\n",
+ " (-10.794984555596727, 'race new'),\n",
+ " (-10.794984555596727, 'race new york'),\n",
+ " (-10.794984555596727, 'rampag'),\n",
+ " (-10.794984555596727, 'rand'),\n",
+ " (-10.794984555596727, 'rand paul'),\n",
+ " (-10.794984555596727, 'rang'),\n",
+ " (-10.794984555596727, 'rebuk'),\n",
+ " (-10.794984555596727, 'recal'),\n",
+ " (-10.794984555596727, 'redston'),\n",
+ " (-10.794984555596727, 'regist'),\n",
+ " (-10.794984555596727, 'rein'),\n",
+ " (-10.794984555596727, 'reinc'),\n",
+ " (-10.794984555596727, 'reinc priebu'),\n",
+ " (-10.794984555596727, 'reinstat'),\n",
+ " (-10.794984555596727, 'repeal breitbart'),\n",
+ " (-10.794984555596727, 'repeal obamacar'),\n",
+ " (-10.794984555596727, 'repeat'),\n",
+ " (-10.794984555596727, 'replac bill'),\n",
+ " (-10.794984555596727, 'report ask'),\n",
+ " (-10.794984555596727, 'report breitbart'),\n",
+ " (-10.794984555596727, 'report obama'),\n",
+ " (-10.794984555596727, 'report say'),\n",
+ " (-10.794984555596727, 'report say new'),\n",
+ " (-10.794984555596727, 'report trump'),\n",
+ " (-10.794984555596727, 'republican new'),\n",
+ " (-10.794984555596727, 'republican new york'),\n",
+ " (-10.794984555596727, 'reshap'),\n",
+ " (-10.794984555596727, 'rethink'),\n",
+ " (-10.794984555596727, 'rex'),\n",
+ " (-10.794984555596727, 'rex tillerson'),\n",
+ " (-10.794984555596727, 'rhetor'),\n",
+ " (-10.794984555596727, 'rico'),\n",
+ " (-10.794984555596727, 'right breitbart'),\n",
+ " (-10.794984555596727, 'right new'),\n",
+ " (-10.794984555596727, 'right new york'),\n",
+ " (-10.794984555596727, 'rio'),\n",
+ " (-10.794984555596727, 'rio olymp'),\n",
+ " (-10.794984555596727, 'riot breitbart'),\n",
+ " (-10.794984555596727, 'rodrigo'),\n",
+ " (-10.794984555596727, 'rodrigo dutert'),\n",
+ " (-10.794984555596727, 'roger ail'),\n",
+ " (-10.794984555596727, 'roug'),\n",
+ " (-10.794984555596727, 'rout'),\n",
+ " (-10.794984555596727, 'rule breitbart'),\n",
+ " (-10.794984555596727, 'rule new'),\n",
+ " (-10.794984555596727, 'rule new york'),\n",
+ " (-10.794984555596727, 'russia new york'),\n",
+ " (-10.794984555596727, 'russia probe'),\n",
+ " (-10.794984555596727, 'russian ambassador'),\n",
+ " (-10.794984555596727, 'russian hack'),\n",
+ " (-10.794984555596727, 'ryan locht'),\n",
+ " (-10.794984555596727, 'ryan obamacar'),\n",
+ " (-10.794984555596727, 'ryan obamacar lite'),\n",
+ " (-10.794984555596727, 'ryancar'),\n",
+ " (-10.794984555596727, 'san diego'),\n",
+ " (-10.794984555596727, 'sarsour'),\n",
+ " (-10.794984555596727, 'saturday'),\n",
+ " (-10.794984555596727, 'saturday night'),\n",
+ " (-10.794984555596727, 'saturday night live'),\n",
+ " (-10.794984555596727, 'say new'),\n",
+ " (-10.794984555596727, 'say new york'),\n",
+ " (-10.794984555596727, 'scalis'),\n",
+ " (-10.794984555596727, 'scandal breitbart'),\n",
+ " (-10.794984555596727, 'scandal new'),\n",
+ " (-10.794984555596727, 'scandal new york'),\n",
+ " (-10.794984555596727, 'school new'),\n",
+ " (-10.794984555596727, 'school new york'),\n",
+ " (-10.794984555596727, 'schumer'),\n",
+ " (-10.794984555596727, 'schwarzenegg'),\n",
+ " (-10.794984555596727, 'scott pruitt'),\n",
+ " (-10.794984555596727, 'scrambl'),\n",
+ " (-10.794984555596727, 'sea new'),\n",
+ " (-10.794984555596727, 'sea new york'),\n",
+ " (-10.794984555596727, 'sean spicer'),\n",
+ " (-10.794984555596727, 'sear'),\n",
+ " (-10.794984555596727, 'season new'),\n",
+ " (-10.794984555596727, 'season new york'),\n",
+ " (-10.794984555596727, 'secretari new'),\n",
+ " (-10.794984555596727, 'secretari new york'),\n",
+ " (-10.794984555596727, 'secur advis'),\n",
+ " (-10.794984555596727, 'secur council'),\n",
+ " (-10.794984555596727, 'segment'),\n",
+ " (-10.794984555596727, 'self drive car'),\n",
+ " (-10.794984555596727, 'senat breitbart'),\n",
+ " (-10.794984555596727, 'senat confirm'),\n",
+ " (-10.794984555596727, 'settlement new'),\n",
+ " (-10.794984555596727, 'settlement new york'),\n",
+ " (-10.794984555596727, 'sex offend'),\n",
+ " (-10.794984555596727, 'sexual abus'),\n",
+ " (-10.794984555596727, 'sharp'),\n",
+ " (-10.794984555596727, 'shinzo'),\n",
+ " (-10.794984555596727, 'shinzo abe'),\n",
+ " (-10.794984555596727, 'shoot new'),\n",
+ " (-10.794984555596727, 'shoot new york'),\n",
+ " (-10.794984555596727, 'show new'),\n",
+ " (-10.794984555596727, 'show new york'),\n",
+ " (-10.794984555596727, 'skill'),\n",
+ " (-10.794984555596727, 'skip'),\n",
+ " (-10.794984555596727, 'smile'),\n",
+ " (-10.794984555596727, 'smuggler'),\n",
+ " (-10.794984555596727, 'somalia'),\n",
+ " (-10.794984555596727, 'son law'),\n",
+ " (-10.794984555596727, 'south carolina'),\n",
+ " (-10.794984555596727, 'south korean'),\n",
+ " (-10.794984555596727, 'spacex'),\n",
+ " (-10.794984555596727, 'speaker paul'),\n",
+ " (-10.794984555596727, 'speaker paul ryan'),\n",
+ " (-10.794984555596727, 'specul'),\n",
+ " (-10.794984555596727, 'speech breitbart'),\n",
+ " (-10.794984555596727, 'speech new york'),\n",
+ " (-10.794984555596727, 'spicer'),\n",
+ " (-10.794984555596727, 'sport'),\n",
+ " (-10.794984555596727, 'sport new'),\n",
+ " (-10.794984555596727, 'sport new york'),\n",
+ " (-10.794984555596727, 'spotlight'),\n",
+ " (-10.794984555596727, 'stanc'),\n",
+ " (-10.794984555596727, 'stanford'),\n",
+ " (-10.794984555596727, 'star new'),\n",
+ " (-10.794984555596727, 'star new york'),\n",
+ " (-10.794984555596727, 'start new'),\n",
+ " (-10.794984555596727, 'start new york'),\n",
+ " (-10.794984555596727, 'state breitbart'),\n",
+ " (-10.794984555596727, 'state new'),\n",
+ " (-10.794984555596727, 'state new york'),\n",
+ " (-10.794984555596727, 'state support'),\n",
+ " (-10.794984555596727, 'state warrior'),\n",
+ " (-10.794984555596727, 'stem'),\n",
+ " (-10.794984555596727, 'step new'),\n",
+ " (-10.794984555596727, 'step new york'),\n",
+ " (-10.794984555596727, 'stephen bannon'),\n",
+ " (-10.794984555596727, 'stockholm'),\n",
+ " (-10.794984555596727, 'stori new'),\n",
+ " (-10.794984555596727, 'stori new york'),\n",
+ " (-10.794984555596727, 'strand'),\n",
+ " (-10.794984555596727, 'streep'),\n",
+ " (-10.794984555596727, 'street new york'),\n",
+ " (-10.794984555596727, 'streisand'),\n",
+ " (-10.794984555596727, 'student new'),\n",
+ " (-10.794984555596727, 'student new york'),\n",
+ " (-10.794984555596727, 'stumbl'),\n",
+ " (-10.794984555596727, 'suburb'),\n",
+ " (-10.794984555596727, 'subway'),\n",
+ " (-10.794984555596727, 'suddenli'),\n",
+ " (-10.794984555596727, 'sunday'),\n",
+ " (-10.794984555596727, 'super bowl'),\n",
+ " (-10.794984555596727, 'support donald'),\n",
+ " (-10.794984555596727, 'support donald trump'),\n",
+ " (-10.794984555596727, 'suprem court new'),\n",
+ " (-10.794984555596727, 'swift'),\n",
+ " (-10.794984555596727, 'swimmer'),\n",
+ " (-10.794984555596727, 'syria new york'),\n",
+ " (-10.794984555596727, 'syria strike'),\n",
+ " (-10.794984555596727, 'taiwan'),\n",
+ " (-10.794984555596727, 'takata'),\n",
+ " (-10.794984555596727, 'takeaway'),\n",
+ " (-10.794984555596727, 'taliban'),\n",
+ " (-10.794984555596727, 'talk new'),\n",
+ " (-10.794984555596727, 'tap'),\n",
+ " (-10.794984555596727, 'tax return'),\n",
+ " (-10.794984555596727, 'team new'),\n",
+ " (-10.794984555596727, 'team new york'),\n",
+ " (-10.794984555596727, 'temporari'),\n",
+ " (-10.794984555596727, 'term new'),\n",
+ " (-10.794984555596727, 'term new york'),\n",
+ " (-10.794984555596727, 'terror breitbart'),\n",
+ " (-10.794984555596727, 'terror new'),\n",
+ " (-10.794984555596727, 'test new york'),\n",
+ " (-10.794984555596727, 'texa border'),\n",
+ " (-10.794984555596727, 'theresa'),\n",
+ " (-10.794984555596727, 'theresa may'),\n",
+ " (-10.794984555596727, 'thing new'),\n",
+ " (-10.794984555596727, 'thing new york'),\n",
+ " (-10.794984555596727, 'thursday'),\n",
+ " (-10.794984555596727, 'thursday even'),\n",
+ " (-10.794984555596727, 'thursday even brief'),\n",
+ " (-10.794984555596727, 'tie new'),\n",
+ " (-10.794984555596727, 'tie new york'),\n",
+ " (-10.794984555596727, 'tillerson'),\n",
+ " (-10.794984555596727, 'time new'),\n",
+ " (-10.794984555596727, 'time new york'),\n",
+ " (-10.794984555596727, 'titl new'),\n",
+ " (-10.794984555596727, 'titl new york'),\n",
+ " (-10.794984555596727, 'todd'),\n",
+ " (-10.794984555596727, 'toll'),\n",
+ " (-10.794984555596727, 'tom bradi'),\n",
+ " (-10.794984555596727, 'tone'),\n",
+ " (-10.794984555596727, 'tough'),\n",
+ " (-10.794984555596727, 'tourist'),\n",
+ " (-10.794984555596727, 'town hall'),\n",
+ " (-10.794984555596727, 'town new'),\n",
+ " (-10.794984555596727, 'town new york'),\n",
+ " (-10.794984555596727, 'trailer breitbart'),\n",
+ " (-10.794984555596727, 'tran'),\n",
+ " (-10.794984555596727, 'transit team'),\n",
+ " (-10.794984555596727, 'travel ban'),\n",
+ " (-10.794984555596727, 'travel ban new'),\n",
+ " (-10.794984555596727, 'trial new'),\n",
+ " (-10.794984555596727, 'trial new york'),\n",
+ " (-10.794984555596727, 'trophi'),\n",
+ " (-10.794984555596727, 'trove'),\n",
+ " (-10.794984555596727, 'trudeau'),\n",
+ " (-10.794984555596727, 'trump admin'),\n",
+ " (-10.794984555596727, 'trump border'),\n",
+ " (-10.794984555596727, 'trump breitbart'),\n",
+ " (-10.794984555596727, 'trump budget'),\n",
+ " (-10.794984555596727, 'trump celebr'),\n",
+ " (-10.794984555596727, 'trump choic'),\n",
+ " (-10.794984555596727, 'trump could'),\n",
+ " (-10.794984555596727, 'trump execut'),\n",
+ " (-10.794984555596727, 'trump execut order'),\n",
+ " (-10.794984555596727, 'trump fire'),\n",
+ " (-10.794984555596727, 'trump first day'),\n",
+ " (-10.794984555596727, 'trump go'),\n",
+ " (-10.794984555596727, 'trump immigr'),\n",
+ " (-10.794984555596727, 'trump immigr order'),\n",
+ " (-10.794984555596727, 'trump keep'),\n",
+ " (-10.794984555596727, 'trump may'),\n",
+ " (-10.794984555596727, 'trump new york'),\n",
+ " (-10.794984555596727, 'trump nomine'),\n",
+ " (-10.794984555596727, 'trump order'),\n",
+ " (-10.794984555596727, 'trump pick'),\n",
+ " (-10.794984555596727, 'trump polici'),\n",
+ " (-10.794984555596727, 'trump talk'),\n",
+ " (-10.794984555596727, 'trump travel'),\n",
+ " (-10.794984555596727, 'trump travel ban'),\n",
+ " (-10.794984555596727, 'trump tri'),\n",
+ " (-10.794984555596727, 'trump visit'),\n",
+ " (-10.794984555596727, 'trump vow'),\n",
+ " (-10.794984555596727, 'trump wall'),\n",
+ " (-10.794984555596727, 'trump women'),\n",
+ " (-10.794984555596727, 'tuesday brief'),\n",
+ " (-10.794984555596727, 'tuesday brief new'),\n",
+ " (-10.794984555596727, 'tuesday even'),\n",
+ " (-10.794984555596727, 'tuesday even brief'),\n",
+ " (-10.794984555596727, 'turmoil'),\n",
+ " (-10.794984555596727, 'twitter breitbart'),\n",
+ " (-10.794984555596727, 'two year'),\n",
+ " (-10.794984555596727, 'uc davi'),\n",
+ " (-10.794984555596727, 'unlik'),\n",
+ " (-10.794984555596727, 'unmask'),\n",
+ " (-10.794984555596727, 'upend'),\n",
+ " (-10.794984555596727, 'uphold'),\n",
+ " (-10.794984555596727, 'us new york'),\n",
+ " (-10.794984555596727, 'vacat'),\n",
+ " (-10.794984555596727, 'vacat new'),\n",
+ " (-10.794984555596727, 'vacat new york'),\n",
+ " (-10.794984555596727, 'vanish'),\n",
+ " (-10.794984555596727, 'veto'),\n",
+ " (-10.794984555596727, 'violenc new'),\n",
+ " (-10.794984555596727, 'violenc new york'),\n",
+ " (-10.794984555596727, 'virgil'),\n",
+ " (-10.794984555596727, 'vogu'),\n",
+ " (-10.794984555596727, 'volkswagen'),\n",
+ " (-10.794984555596727, 'vote new'),\n",
+ " (-10.794984555596727, 'vote new york'),\n",
+ " (-10.794984555596727, 'voter id'),\n",
+ " (-10.794984555596727, 'wait new'),\n",
+ " (-10.794984555596727, 'wall breitbart'),\n",
+ " (-10.794984555596727, 'war new'),\n",
+ " (-10.794984555596727, 'war new york'),\n",
+ " (-10.794984555596727, 'wari'),\n",
+ " (-10.794984555596727, 'warn new'),\n",
+ " (-10.794984555596727, 'warn new york'),\n",
+ " (-10.794984555596727, 'warner'),\n",
+ " (-10.794984555596727, 'warrior'),\n",
+ " (-10.794984555596727, 'washington new'),\n",
+ " (-10.794984555596727, 'washington new york'),\n",
+ " (-10.794984555596727, 'water new'),\n",
+ " (-10.794984555596727, 'water new york'),\n",
+ " (-10.794984555596727, 'way new'),\n",
+ " (-10.794984555596727, 'way new york'),\n",
+ " (-10.794984555596727, 'wednesday brief'),\n",
+ " (-10.794984555596727, 'wednesday brief new'),\n",
+ " (-10.794984555596727, 'wednesday even'),\n",
+ " (-10.794984555596727, 'wednesday even brief'),\n",
+ " (-10.794984555596727, 'week new'),\n",
+ " (-10.794984555596727, 'week new york'),\n",
+ " (-10.794984555596727, 'weekend brief'),\n",
+ " (-10.794984555596727, 'weekend brief new'),\n",
+ " (-10.794984555596727, 'weekend new'),\n",
+ " (-10.794984555596727, 'weekend new york'),\n",
+ " (-10.794984555596727, 'well fargo'),\n",
+ " (-10.794984555596727, 'west bank'),\n",
+ " (-10.794984555596727, 'westminst'),\n",
+ " (-10.794984555596727, 'wh'),\n",
+ " (-10.794984555596727, 'white hous breitbart'),\n",
+ " (-10.794984555596727, 'white hous new'),\n",
+ " (-10.794984555596727, 'white nationalist'),\n",
+ " (-10.794984555596727, 'wider'),\n",
+ " (-10.794984555596727, 'wield'),\n",
+ " (-10.794984555596727, 'wildfir'),\n",
+ " (-10.794984555596727, 'wimbledon'),\n",
+ " (-10.794984555596727, 'win breitbart'),\n",
+ " (-10.794984555596727, 'wiretap claim'),\n",
+ " (-10.794984555596727, 'women march'),\n",
+ " (-10.794984555596727, 'women new'),\n",
+ " (-10.794984555596727, 'women new york'),\n",
+ " (-10.794984555596727, 'work new'),\n",
+ " (-10.794984555596727, 'work new york'),\n",
+ " (-10.794984555596727, 'world new'),\n",
+ " (-10.794984555596727, 'world new york'),\n",
+ " (-10.794984555596727, 'worri new'),\n",
+ " (-10.794984555596727, 'worri new york'),\n",
+ " (-10.794984555596727, 'wrestl'),\n",
+ " (-10.794984555596727, 'yahoo'),\n",
+ " (-10.794984555596727, 'year breitbart'),\n",
+ " (-10.794984555596727, 'year eve'),\n",
+ " (-10.794984555596727, 'year new york'),\n",
+ " (-10.794984555596727, 'york new'),\n",
+ " (-10.794984555596727, 'york new york'),\n",
+ " (-10.794984555596727, 'york state'),\n",
+ " (-10.794984555596727, 'zone new'),\n",
+ " (-10.794984555596727, 'zone new york'),\n",
+ " (-10.794984555596727, 'zoo'),\n",
+ " (-10.047770153766505, 'academi'),\n",
+ " (-10.047770153766505, 'accid'),\n",
+ " (-10.047770153766505, 'aclu'),\n",
+ " (-10.047770153766505, 'acr'),\n",
+ " (-10.047770153766505, 'adopt'),\n",
+ " (-10.047770153766505, 'ahead trump'),\n",
+ " (-10.047770153766505, 'airbnb'),\n",
+ " (-10.047770153766505, 'airlin'),\n",
+ " (-10.047770153766505, 'album'),\n",
+ " (-10.047770153766505, 'alex jone'),\n",
+ " (-10.047770153766505, 'allegedli'),\n",
+ " (-10.047770153766505, 'allianc'),\n",
+ " (-10.047770153766505, 'america new'),\n",
+ " (-10.047770153766505, 'anchor'),\n",
+ " (-10.047770153766505, 'anger'),\n",
+ " (-10.047770153766505, 'anti israel'),\n",
+ " (-10.047770153766505, 'anti semit'),\n",
+ " (-10.047770153766505, 'anymor'),\n",
+ " (-10.047770153766505, 'applic'),\n",
+ " (-10.047770153766505, 'approach'),\n",
+ " (-10.047770153766505, 'appropri'),\n",
+ " (-10.047770153766505, 'around world'),\n",
+ " (-10.047770153766505, 'artifici'),\n",
+ " (-10.047770153766505, 'asylum seeker'),\n",
+ " (-10.047770153766505, 'atlant'),\n",
+ " (-10.047770153766505, 'attack polic'),\n",
+ " (-10.047770153766505, 'attack trump'),\n",
+ " (-10.047770153766505, 'auto'),\n",
+ " (-10.047770153766505, 'aviv'),\n",
+ " (-10.047770153766505, 'back trump'),\n",
+ " (-10.047770153766505, 'baghdad'),\n",
+ " (-10.047770153766505, 'band'),\n",
+ " (-10.047770153766505, 'barrier'),\n",
+ " (-10.047770153766505, 'barron'),\n",
+ " (-10.047770153766505, 'beach'),\n",
+ " (-10.047770153766505, 'beer'),\n",
+ " (-10.047770153766505, 'behead'),\n",
+ " (-10.047770153766505, 'beij'),\n",
+ " (-10.047770153766505, 'ben'),\n",
+ " (-10.047770153766505, 'berlin'),\n",
+ " (-10.047770153766505, 'bet'),\n",
+ " (-10.047770153766505, 'beyonc'),\n",
+ " (-10.047770153766505, 'bill cosbi'),\n",
+ " (-10.047770153766505, 'bitter'),\n",
+ " (-10.047770153766505, 'blasio'),\n",
+ " (-10.047770153766505, 'block trump'),\n",
+ " (-10.047770153766505, 'boat'),\n",
+ " (-10.047770153766505, 'boe'),\n",
+ " (-10.047770153766505, 'boko'),\n",
+ " (-10.047770153766505, 'boko haram'),\n",
+ " (-10.047770153766505, 'bolton'),\n",
+ " (-10.047770153766505, 'bomber'),\n",
+ " (-10.047770153766505, 'bori'),\n",
+ " (-10.047770153766505, 'boss'),\n",
+ " (-10.047770153766505, 'bow'),\n",
+ " (-10.047770153766505, 'branch'),\n",
+ " (-10.047770153766505, 'breitbart news'),\n",
+ " (-10.047770153766505, 'bribe'),\n",
+ " (-10.047770153766505, 'brought'),\n",
+ " (-10.047770153766505, 'built'),\n",
+ " (-10.047770153766505, 'bull'),\n",
+ " ...]"
+ ]
+ },
+ "execution_count": 135,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "### Most fake -- NOTE(review): these are the lowest coef_[0] weights; confirm which label value means fake\n",
+ "sorted(zip(classifier.coef_[0], feature_names))[:20]  # show the 20 smallest weights, not the whole vocabulary"
+ ]
+ },
+ {
+ "cell_type": "markdown",
+ "metadata": {},
+ "source": [
+ "## HashingVectorizer\n"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 42,
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stderr",
+ "output_type": "stream",
+ "text": [
+ "c:\\users\\krish.naik\\appdata\\local\\continuum\\anaconda3\\envs\\nlp\\lib\\site-packages\\sklearn\\feature_extraction\\hashing.py:94: DeprecationWarning: the option non_negative=True has been deprecated in 0.19 and will be removed in version 0.21.\n",
+ " \" in version 0.21.\", DeprecationWarning)\n",
+ "c:\\users\\krish.naik\\appdata\\local\\continuum\\anaconda3\\envs\\nlp\\lib\\site-packages\\sklearn\\feature_extraction\\hashing.py:94: DeprecationWarning: the option non_negative=True has been deprecated in 0.19 and will be removed in version 0.21.\n",
+ " \" in version 0.21.\", DeprecationWarning)\n"
+ ]
+ }
+ ],
+ "source": [
+ "hs_vectorizer=HashingVectorizer(n_features=5000,alternate_sign=False)  # replaces non_negative=True (removed in scikit-learn 0.21); keeps features >= 0 for MultinomialNB\n",
+ "X=hs_vectorizer.fit_transform(corpus).toarray()  # dense array, one row per document in corpus and 5000 hashed columns"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 43,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "(18285, 5000)"
+ ]
+ },
+ "execution_count": 43,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "X.shape"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 47,
+ "metadata": {},
+ "outputs": [
+ {
+ "data": {
+ "text/plain": [
+ "array([[0. , 0.31622777, 0. , ..., 0. , 0. ,\n",
+ " 0. ],\n",
+ " [0. , 0. , 0. , ..., 0. , 0. ,\n",
+ " 0. ],\n",
+ " [0. , 0. , 0. , ..., 0. , 0. ,\n",
+ " 0. ],\n",
+ " ...,\n",
+ " [0. , 0. , 0. , ..., 0. , 0. ,\n",
+ " 0. ],\n",
+ " [0. , 0. , 0. , ..., 0. , 0. ,\n",
+ " 0. ],\n",
+ " [0. , 0. , 0. , ..., 0. , 0. ,\n",
+ " 0. ]])"
+ ]
+ },
+ "execution_count": 47,
+ "metadata": {},
+ "output_type": "execute_result"
+ }
+ ],
+ "source": [
+ "X"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 44,
+ "metadata": {},
+ "outputs": [],
+ "source": [
+ "# Hold out 33% of the rows for testing; the fixed seed keeps the split reproducible\n",
+ "from sklearn.model_selection import train_test_split\n",
+ "X_train, X_test, y_train, y_test = train_test_split(X, y, random_state=0, test_size=0.33)"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": 45,
+ "metadata": {},
+ "outputs": [
+ {
+ "name": "stdout",
+ "output_type": "stream",
+ "text": [
+ "accuracy: 0.871\n",
+ "Confusion matrix, without normalization\n"
+ ]
+ },
+ {
+ "data": {
+ "image/png": "\n",
+ "text/plain": [
+ ""
+ ]
+ },
+ "metadata": {
+ "needs_background": "light"
+ },
+ "output_type": "display_data"
+ }
+ ],
+ "source": [
+ "# Multinomial naive Bayes on the hashed features: fit, then report hold-out accuracy and confusion matrix\n",
+ "from sklearn.naive_bayes import MultinomialNB\n",
+ "classifier = MultinomialNB().fit(X_train, y_train)\n",
+ "pred = classifier.predict(X_test)\n",
+ "score = metrics.accuracy_score(y_test, pred)\n",
+ "print(\"accuracy: %0.3f\" % score)\n",
+ "cm = metrics.confusion_matrix(y_test, pred)\n",
+ "# NOTE(review): confusion_matrix sorts labels ascending, so 'FAKE' is assumed to be the smaller label value - confirm\n",
+ "plot_confusion_matrix(cm, classes=['FAKE', 'REAL'])"
+ ]
+ },
+ {
+ "cell_type": "code",
+ "execution_count": null,
+ "metadata": {},
+ "outputs": [],
+ "source": []
+ }
+ ],
+ "metadata": {
+ "kernelspec": {
+ "display_name": "Python 3",
+ "language": "python",
+ "name": "python3"
+ },
+ "language_info": {
+ "codemirror_mode": {
+ "name": "ipython",
+ "version": 3
+ },
+ "file_extension": ".py",
+ "mimetype": "text/x-python",
+ "name": "python",
+ "nbconvert_exporter": "python",
+ "pygments_lexer": "ipython3",
+ "version": "3.6.10"
+ }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}