Skip to content

Instantly share code, notes, and snippets.

@grahamanderson
Created August 17, 2016 01:41
Show Gist options
  • Save grahamanderson/95475d39c17d74c1d803511cafe830be to your computer and use it in GitHub Desktop.
Save grahamanderson/95475d39c17d74c1d803511cafe830be to your computer and use it in GitHub Desktop.
projects/04-fletcher/dnc_leaks/DNC_Word2Vec_Gensim.ipynb
Display the source blob
Display the rendered blob
Raw
{
"cells": [
{
"metadata": {
"collapsed": false,
"trusted": true
},
"cell_type": "code",
"source": "# Standard library\nimport codecs\nimport os\nimport pickle\nimport re\n\n# Third-party\nimport gensim\nimport mpld3\nimport nltk\nimport nltk.data\nimport numpy as np\nimport pandas as pd\nfrom nltk.corpus import stopwords\nfrom nltk.stem.snowball import SnowballStemmer\nfrom sklearn import feature_extraction\n\n# Fetch only the NLTK resources this notebook reads. A bare nltk.download()\n# opens the interactive downloader and stalls an unattended Restart & Run All.\nnltk.download('stopwords', quiet=True)\nnltk.download('punkt', quiet=True)\n\n# `stopwords` deliberately stays bound to the NLTK corpus reader imported above:\n# rebinding it to the word list would make any later stopwords.words('english')\n# call raise AttributeError.\nstemmer = SnowballStemmer(\"english\")\ntokenizer = nltk.data.load('nltk:tokenizers/punkt/english.pickle')\n",
"execution_count": 66,
"outputs": [
{
"text": "showing info https://raw.githubusercontent.com/nltk/nltk_data/gh-pages/index.xml\n",
"name": "stdout",
"output_type": "stream"
}
]
},
{
"metadata": {
"collapsed": false,
"trusted": true
},
"cell_type": "code",
"source": "# NOTE: unpickling executes code embedded in the file; only load pickles you trust.\n# The with-block closes the file handle as soon as the frame is loaded.\nwith open('dnc_df_final_08_15.pkl', \"rb\") as pickle_file:\n    df = pickle.load(pickle_file)\n",
"execution_count": 25,
"outputs": []
},
{
"metadata": {
"collapsed": false,
"trusted": true
},
"cell_type": "code",
"source": "print(len(df.body_stop))\nprint(df.body[1])",
"execution_count": 42,
"outputs": [
{
"text": "16102\ncontribution data page de dws wlf reception type onetime number of tickets ticket amount ticket info ticketinfo additional contribution amount total amount first name shekelia last name hines address christiana meadows bear de phone email shekeliahinesgmailcom employer bayhealth employer address occupation physical therapist payment type visa account transaction transactionid user id userid contribution key ihfhmpysektdsdc custom field data section header additional information fundraiser code optional who encouraged you to make this contribution robin whitaker guest names if contributing for multiple tickets robin whitaker general information submit date mon may status authorized client ip address client browser mozilla macintosh intel mac os x applewebkit khtml like gecko version safari \n",
"name": "stdout",
"output_type": "stream"
}
]
},
{
"metadata": {
"collapsed": true,
"trusted": true
},
"cell_type": "code",
"source": "def tokenize_and_stem(text):\n    \"\"\"Split `text` into word tokens and return their stems.\n\n    Sentences are tokenized first and words second, so that punctuation is\n    caught as its own token. Tokens with no ASCII letter in them (numeric\n    tokens, raw punctuation) are dropped; the rest are stemmed with the\n    notebook-level `stemmer`.\n\n    Args:\n        text: string to tokenize.\n\n    Returns:\n        List of stemmed tokens, in order of appearance.\n    \"\"\"\n    words = (word\n             for sent in nltk.sent_tokenize(text)\n             for word in nltk.word_tokenize(sent))\n    return [stemmer.stem(word) for word in words if re.search('[a-zA-Z]', word)]\n\n\n# Remove stop words from the body, then stem what is left.\n# The list is read through nltk.corpus rather than the bare name `stopwords`,\n# so this cell does not depend on what that name is currently bound to.\nstop = nltk.corpus.stopwords.words('english')\n# Set lookup keeps the per-word membership test O(1) instead of a list scan.\nstop_lookup = set(stop)\ndf['body_stop'] = df['body'].apply(\n    lambda body: ' '.join(word for word in body.split() if word not in stop_lookup))\ndf['body_stems'] = df['body_stop'].apply(tokenize_and_stem)",
"execution_count": 67,
"outputs": []
},
{
"metadata": {
"collapsed": false,
"trusted": true
},
"cell_type": "code",
"source": "df.columns",
"execution_count": 74,
"outputs": [
{
"data": {
"text/plain": "Index(['date', 'from_name', 'from_email', 'to', 'subject', 'body', 'body_stop',\n 'body_stop_split', 'body_stems'],\n dtype='object')"
},
"execution_count": 74,
"output_type": "execute_result",
"metadata": {}
}
]
},
{
"metadata": {
"collapsed": true,
"trusted": true
},
"cell_type": "code",
"source": "df_stems = df[['date', 'from_name', 'from_email', 'to', 'subject', 'body_stems', 'body']]",
"execution_count": 76,
"outputs": []
},
{
"metadata": {
"collapsed": true,
"trusted": true
},
"cell_type": "code",
"source": "df_stems.to_pickle('./dnc_df_stems_08_16.pkl')",
"execution_count": 77,
"outputs": []
},
{
"metadata": {},
"cell_type": "markdown",
"source": "### Start Gensim Model\n---"
},
{
"metadata": {
"collapsed": false,
"trusted": true
},
"cell_type": "code",
"source": "# Train Word2Vec on df.body_stop_split.\n# Alternative corpus: pass df.body_stems.tolist() as `sentences` to train on stems.\nmodel = gensim.models.Word2Vec(\n    sentences=df.body_stop_split.tolist(),\n    size=100,\n    window=5,\n    min_count=1,\n    workers=2,\n)",
"execution_count": 85,
"outputs": []
},
{
"metadata": {
"collapsed": false,
"trusted": true
},
"cell_type": "code",
"source": "df_stems.head()",
"execution_count": 84,
"outputs": [
{
"data": {
"text/html": "<div>\n<table border=\"1\" class=\"dataframe\">\n <thead>\n <tr style=\"text-align: right;\">\n <th></th>\n <th>date</th>\n <th>from_name</th>\n <th>from_email</th>\n <th>to</th>\n <th>subject</th>\n <th>body_stems</th>\n <th>body</th>\n </tr>\n </thead>\n <tbody>\n <tr>\n <th>0</th>\n <td>Tue, 17 May 2016 19:51:22 -0700</td>\n <td>Maureen Garde</td>\n <td>[email protected]</td>\n <td>\"Davis, Marilyn\" &lt;[email protected]&gt;</td>\n <td>Re: CT To Automatically Register 400,000 Voters</td>\n <td>[mani, state, get, follow, connecticut, way, g...</td>\n <td>how many more states can we get to follow conn...</td>\n </tr>\n <tr>\n <th>1</th>\n <td>Mon, 2 May 2016 22:19:09 -0400</td>\n <td>Contribution</td>\n <td>[email protected]</td>\n <td>&lt;[email protected]&gt;, &lt;[email protected]&gt;, &lt;olszewsk...</td>\n <td>Contribution: DE008 - DWS WLF Reception / Shek...</td>\n <td>[contribut, data, page, de, dws, wlf, recept, ...</td>\n <td>contribution data page de dws wlf reception ty...</td>\n </tr>\n <tr>\n <th>2</th>\n <td>Mon, 23 May 2016 15:17:55 -0600</td>\n <td>POLITICOs Blast</td>\n <td>[email protected]</td>\n <td>&lt;[email protected]&gt;</td>\n <td>=?UTF-8?B?UE9MSVRJQ08ncyAyMDE2IEJsYXN0OiBCZXJu...</td>\n <td>[henri, c, jackson, pm, edt, last, bern, democ...</td>\n <td>by henry c jackson pm edt lasting bern the dem...</td>\n </tr>\n <tr>\n <th>3</th>\n <td>Wed, 27 Apr 2016 03:48:42 -0600</td>\n <td>POLITICO</td>\n <td>[email protected]</td>\n <td>&lt;[email protected]&gt;</td>\n <td>POLITICO's Daily Congress Digest for Wednesday...</td>\n <td>[politico, daili, congress, digest, wednesday,...</td>\n <td>politicos daily congress digest for wednesday ...</td>\n </tr>\n <tr>\n <th>4</th>\n <td>Thu, 19 May 2016 08:42:10 -0700</td>\n <td>Corinne Matti</td>\n <td>[email protected]</td>\n <td>\"Miranda, Luis\" &lt;[email protected]&gt;</td>\n <td>Re: America's Newsroom (FNC) - Luis Miranda (S...</td>\n <td>[yup, also, iq, media, snapstream, may, 
mirand...</td>\n <td>yup they also have iq media and snapstream on ...</td>\n </tr>\n </tbody>\n</table>\n</div>",
"text/plain": " date from_name \\\n0 Tue, 17 May 2016 19:51:22 -0700 Maureen Garde \n1 Mon, 2 May 2016 22:19:09 -0400 Contribution \n2 Mon, 23 May 2016 15:17:55 -0600 POLITICOs Blast \n3 Wed, 27 Apr 2016 03:48:42 -0600 POLITICO \n4 Thu, 19 May 2016 08:42:10 -0700 Corinne Matti \n\n from_email \\\n0 [email protected] \n1 [email protected] \n2 [email protected] \n3 [email protected] \n4 [email protected] \n\n to \\\n0 \"Davis, Marilyn\" <[email protected]> \n1 <[email protected]>, <[email protected]>, <olszewsk... \n2 <[email protected]> \n3 <[email protected]> \n4 \"Miranda, Luis\" <[email protected]> \n\n subject \\\n0 Re: CT To Automatically Register 400,000 Voters \n1 Contribution: DE008 - DWS WLF Reception / Shek... \n2 =?UTF-8?B?UE9MSVRJQ08ncyAyMDE2IEJsYXN0OiBCZXJu... \n3 POLITICO's Daily Congress Digest for Wednesday... \n4 Re: America's Newsroom (FNC) - Luis Miranda (S... \n\n body_stems \\\n0 [mani, state, get, follow, connecticut, way, g... \n1 [contribut, data, page, de, dws, wlf, recept, ... \n2 [henri, c, jackson, pm, edt, last, bern, democ... \n3 [politico, daili, congress, digest, wednesday,... \n4 [yup, also, iq, media, snapstream, may, mirand... \n\n body \n0 how many more states can we get to follow conn... \n1 contribution data page de dws wlf reception ty... \n2 by henry c jackson pm edt lasting bern the dem... \n3 politicos daily congress digest for wednesday ... \n4 yup they also have iq media and snapstream on ... "
},
"execution_count": 84,
"output_type": "execute_result",
"metadata": {}
}
]
},
{
"metadata": {
"collapsed": false,
"trusted": true
},
"cell_type": "code",
"source": "model.vocab",
"execution_count": 86,
"outputs": [
{
"data": {
"text/plain": "{'selfabsorbed': <gensim.models.word2vec.Vocab at 0x15a2d44a8>,\n '': <gensim.models.word2vec.Vocab at 0x15a2d4e48>,\n 'preelection': <gensim.models.word2vec.Vocab at 0x15a2d4dd8>,\n 'adapted': <gensim.models.word2vec.Vocab at 0x15a2d4630>,\n 'httpgopoliticoemailcomqscbfafbbbdedadadeecbbd': <gensim.models.word2vec.Vocab at 0x15bd92748>,\n 'revue': <gensim.models.word2vec.Vocab at 0x15a2d4f98>,\n 'biden': <gensim.models.word2vec.Vocab at 0x15a2d4f60>,\n 'conventiond': <gensim.models.word2vec.Vocab at 0x15a2d4f28>,\n 'worriesthe': <gensim.models.word2vec.Vocab at 0x15a2d4ef0>,\n 'httpgopoliticoemailcomqsfcbacfbcaeabcbffecdbfeccfbbec': <gensim.models.word2vec.Vocab at 0x15a2d4eb8>,\n 'watchhttpstoolboxdncorgtoolnamevantageuploaderpathvantageuploaderdncorgvideossharedshowjwteyjexaioijkvqilcjhbgcioijiuzinijeyjpyxqiojenjmodqmjksimvtywlsijoicgscuakbkbmmubjniiwiawqiojmymdqoswizgbmxvywrhymxlijpcnvlfqgnphtmjknlchedrmdfrvowoodzmtbpicenyn': <gensim.models.word2vec.Vocab at 0x15a2d4e80>,\n 'desalination': <gensim.models.word2vec.Vocab at 0x17e2206a0>,\n 'osterman': <gensim.models.word2vec.Vocab at 0x15a2d4da0>,\n 'httpswwwbuzzfeedcomdanielwagnertrumpssaudibusinessutmtermukpwagwblxfmqqdv': <gensim.models.word2vec.Vocab at 0x15a2d4d68>,\n 'httpmerkleysenategovnewsletter': <gensim.models.word2vec.Vocab at 0x15a2d4d30>,\n 'estimation': <gensim.models.word2vec.Vocab at 0x15a2d4cf8>,\n 'httpgopoliticoemailcomqsccedfbcebdfdfbac': <gensim.models.word2vec.Vocab at 0x15a2d4cc0>,\n 'wellraised': <gensim.models.word2vec.Vocab at 0x15a2d4c88>,\n 'executing': <gensim.models.word2vec.Vocab at 0x15a2d4c50>,\n 'judy': <gensim.models.word2vec.Vocab at 0x15a2d4c18>,\n 'philosophy': <gensim.models.word2vec.Vocab at 0x15a2d4be0>,\n 'httpgopoliticoemailcomqsdfcdaaacdefdafbbdedfddfbebbfcdb': <gensim.models.word2vec.Vocab at 0x15a2d4ba8>,\n 'httpgopoliticoemailcomqsccbeffdcfacefdedfedadfaa': <gensim.models.word2vec.Vocab at 0x15a2d4b70>,\n 'lovefest': <gensim.models.word2vec.Vocab at 
0x15a2d4b38>,\n 'cathylackcogancommailtocathylackcogancom': <gensim.models.word2vec.Vocab at 0x15a2d4b00>,\n 'lewistonauburn': <gensim.models.word2vec.Vocab at 0x15a2d4ac8>,\n 'stable': <gensim.models.word2vec.Vocab at 0x15a2d4a90>,\n 'nationally': <gensim.models.word2vec.Vocab at 0x15a2d4a20>,\n 'gradepoint': <gensim.models.word2vec.Vocab at 0x15a2d49e8>,\n 'sweetheart': <gensim.models.word2vec.Vocab at 0x15a2d49b0>,\n 'reflejan': <gensim.models.word2vec.Vocab at 0x15bd92898>,\n 'wrongdoers': <gensim.models.word2vec.Vocab at 0x15a2d4940>,\n 'worlds': <gensim.models.word2vec.Vocab at 0x15a2d4908>,\n 'chernobyls': <gensim.models.word2vec.Vocab at 0x15a2d48d0>,\n 'pedophilia': <gensim.models.word2vec.Vocab at 0x15a2d4898>,\n 'investigatory': <gensim.models.word2vec.Vocab at 0x15a2d4860>,\n 'charlene': <gensim.models.word2vec.Vocab at 0x15a2d4828>,\n 'allconsuming': <gensim.models.word2vec.Vocab at 0x15a2d47f0>,\n 'romney': <gensim.models.word2vec.Vocab at 0x15a2d47b8>,\n 'httpwwwcdcgovzikapregnancyindexhtml': <gensim.models.word2vec.Vocab at 0x15a2d4780>,\n 'wellformed': <gensim.models.word2vec.Vocab at 0x15a2d4748>,\n 'saidhttpphiladelphiacbslocalcompapoliticiansreacttobignightfordonaldtrump': <gensim.models.word2vec.Vocab at 0x15a2d4710>,\n 'walshtdncorg': <gensim.models.word2vec.Vocab at 0x15a2d46d8>,\n 'browserhttpuscampaignarchivecomudafbdecidfaedbceaacce': <gensim.models.word2vec.Vocab at 0x15a2d46a0>,\n 'previewed': <gensim.models.word2vec.Vocab at 0x15be0d668>,\n 'gobbled': <gensim.models.word2vec.Vocab at 0x15a2d4668>,\n 'meandering': <gensim.models.word2vec.Vocab at 0x15a2d45f8>,\n 'woulda': <gensim.models.word2vec.Vocab at 0x15b0c6208>,\n 'rousseff': <gensim.models.word2vec.Vocab at 0x15a2d4588>,\n 'wheeler': <gensim.models.word2vec.Vocab at 0x15b0c6240>,\n 'httpgopoliticoemailcomqsfdfeefcdeddcfdecdbacbcbaf': <gensim.models.word2vec.Vocab at 0x15a2d4518>,\n 'omidyar': <gensim.models.word2vec.Vocab at 0x15a2d44e0>,\n 'columna': <gensim.models.word2vec.Vocab 
at 0x15a2d4438>,\n 'prescriber': <gensim.models.word2vec.Vocab at 0x15a2d4470>,\n 'previouslyscheduled': <gensim.models.word2vec.Vocab at 0x15a2d4400>,\n 'tory': <gensim.models.word2vec.Vocab at 0x15a2d43c8>,\n 'hugh': <gensim.models.word2vec.Vocab at 0x15ae969b0>,\n 'brushbacks': <gensim.models.word2vec.Vocab at 0x15becdd68>,\n 'leaseback': <gensim.models.word2vec.Vocab at 0x15a5f9390>,\n 'agencieshttpswwwtedcruzorgfiveforfreedom': <gensim.models.word2vec.Vocab at 0x17e2204e0>,\n 'httphostedaporgdynamicfileselectionsbystatemdpresidenthtmlsiteapsectionpolitics': <gensim.models.word2vec.Vocab at 0x15ba0b7f0>,\n 'lucymooggmailcommailtolucymooggmailcom': <gensim.models.word2vec.Vocab at 0x17e2205c0>,\n 'httpstwittercomteamcavutostatus': <gensim.models.word2vec.Vocab at 0x17e220588>,\n 'amassed': <gensim.models.word2vec.Vocab at 0x17e2205f8>,\n 'listerv': <gensim.models.word2vec.Vocab at 0x17e220630>,\n 'httpwwwstutzmanpacomaboutrobbio': <gensim.models.word2vec.Vocab at 0x15a2d4e10>,\n 'valleys': <gensim.models.word2vec.Vocab at 0x17e220668>,\n 'forgives': <gensim.models.word2vec.Vocab at 0x17e2204a8>,\n 'httpwwwtheguardiancomusnewsaprjuliaioffejournalistmelaniatrumpantisemiticabuse': <gensim.models.word2vec.Vocab at 0x17e220898>,\n 'httpnationfoxnewscomwatchlivedonaldtrumpcampaigneventcostamesacalifornia': <gensim.models.word2vec.Vocab at 0x17e2208d0>,\n 'httpclickemailbostonglobecomqsdcabcdcafaebaffcfdcedbdccacdabfabecbdaef': <gensim.models.word2vec.Vocab at 0x17e220908>,\n 'veer': <gensim.models.word2vec.Vocab at 0x15accb898>,\n 'annoyance': <gensim.models.word2vec.Vocab at 0x17e2206d8>,\n 'symbolizes': <gensim.models.word2vec.Vocab at 0x1300dfef0>,\n 'httpsmediumcomthestorytextshotsffcc': <gensim.models.word2vec.Vocab at 0x17e220780>,\n 'markmailtopaustenbachmdncorg': <gensim.models.word2vec.Vocab at 0x17e2207f0>,\n 
'httprrsnettnjspfnmughnfrrawferqbqkztojpipxzoahsexlfpiyohupchicsekthkytifkealunmuffuqrkwynibgxnofbiszwpdllzmemgpmkjmajcdhknjmmvyeksiqrpqqgylgyuxhjzgapsnzcvirlbxaxfuuwchymlchladsssjbbzfafdlkdlkccxiuvwchfwbxbwtgqbwchprspndrzjwjmohvmilirtgfkebphcnpmjzqmitkehfudea': <gensim.models.word2vec.Vocab at 0x17e220828>,\n 'yeahi': <gensim.models.word2vec.Vocab at 0x17e220860>,\n 'httplinkwashingtonpostcomclickahrchmlydcudfzagluzrvbnbvcquytldvcmxkllyyxfplwzvcmnlcyyzxrhautcnvymetznjvbspclzlwfuzclewutzmfsbhvqywgtzmylwlehqtymfdgxllziwmtyvmduvmtkvmnimzjmywqtmznmzsmrmlwfjymetmgvkyjiodyyzkxxnbjlmhbwwdbtbtxjndwaxnyyzubfkywlsetiwmgcaeadcbcfcc': <gensim.models.word2vec.Vocab at 0x17e220940>,\n 'recriminations': <gensim.models.word2vec.Vocab at 0x1300e9588>,\n 'pgim': <gensim.models.word2vec.Vocab at 0x15ebc9828>,\n 'eckl': <gensim.models.word2vec.Vocab at 0x15ebc9908>,\n 'bevins': <gensim.models.word2vec.Vocab at 0x15ebc99e8>,\n 'bender': <gensim.models.word2vec.Vocab at 0x15cc57278>,\n 'vetting': <gensim.models.word2vec.Vocab at 0x15cc57550>,\n 'musician': <gensim.models.word2vec.Vocab at 0x15cbfcd30>,\n 'herehttpactiontimcanovacompagembffdecevesa': <gensim.models.word2vec.Vocab at 0x15cbfc940>,\n 'allintogether': <gensim.models.word2vec.Vocab at 0x11faec4e0>,\n 'httpwwwtheatlanticcompoliticsarchiveonhomecomingsmccidbaccdmceiduniqid': <gensim.models.word2vec.Vocab at 0x11faec208>,\n 'tema': <gensim.models.word2vec.Vocab at 0x11faec198>,\n 'httplinkwashingtonpostcomclickahrchmlydcudfzagluzrvbnbvcquytldvcmxklcrlcnktzgvlcgvucyhcylzlwdgfpciwbgfuzszzwfyygtzwzxjzlxnlyuzckyxkvmjaxniwnsymchngrhzjayyxztaltexztytodjjmihnrjyjmxmzinrfcrvcnkuahrtbdcgtptemdbpcjjpwsxhlywrzlwryyxcadbdeafedfcc': <gensim.models.word2vec.Vocab at 0x11faec518>,\n 'majorityhttpwwwpolitifactcomtruthometerstatementsjundonaldtrumptrumpprochoicepollingnumbersdeclining': <gensim.models.word2vec.Vocab at 0x15cc28d68>,\n 'londons': <gensim.models.word2vec.Vocab at 0x15cc28748>,\n 'beckerman': <gensim.models.word2vec.Vocab at 
0x12fe6ad30>,\n 'cidiiinuxoczdf': <gensim.models.word2vec.Vocab at 0x12fe6ae10>,\n 'risktaking': <gensim.models.word2vec.Vocab at 0x1188c7208>,\n 'variability': <gensim.models.word2vec.Vocab at 0x11926fda0>,\n 'mcteague': <gensim.models.word2vec.Vocab at 0x11926ff28>,\n 'httpclickpoliticoemailcomprofilecenteraspxqscfcfcefbccafcfaeecdadbafadcddeeaddcfafedfabadthis': <gensim.models.word2vec.Vocab at 0x11926fef0>,\n 'cute': <gensim.models.word2vec.Vocab at 0x11c450dd8>,\n 'obfuscation': <gensim.models.word2vec.Vocab at 0x105d6acc0>,\n 'nitropress': <gensim.models.word2vec.Vocab at 0x1162244e0>,\n 'undisciplined': <gensim.models.word2vec.Vocab at 0x15a865a20>,\n 'lewallen': <gensim.models.word2vec.Vocab at 0x1300e4c88>,\n 'alon': <gensim.models.word2vec.Vocab at 0x1300e4b00>,\n 'bondholders': <gensim.models.word2vec.Vocab at 0x1300e4a20>,\n 'presshttpbigstoryaporgarticlebcbccfaceabeapinterviewtrumpnarrowsvplisthemovesgeneral': <gensim.models.word2vec.Vocab at 0x1300e4ac8>,\n 'bipartisanship': <gensim.models.word2vec.Vocab at 0x17e2209b0>,\n 'killers': <gensim.models.word2vec.Vocab at 0x17e2209e8>,\n 'gaughan': <gensim.models.word2vec.Vocab at 0x17e220a20>,\n 'pats': <gensim.models.word2vec.Vocab at 0x15be5b4e0>,\n 'comicstyle': <gensim.models.word2vec.Vocab at 0x17e220a58>,\n 'jeters': <gensim.models.word2vec.Vocab at 0x17e220a90>,\n 'rightshttpwwwnytimescomopinionastatebucksthetrendonvotingrightshtmlrefopinionr': <gensim.models.word2vec.Vocab at 0x17e220ac8>,\n 'shortened': <gensim.models.word2vec.Vocab at 0x17e220b00>,\n 'termstrumps': <gensim.models.word2vec.Vocab at 0x17e220b38>,\n 'pleases': <gensim.models.word2vec.Vocab at 0x17e220b70>,\n 'archivist': <gensim.models.word2vec.Vocab at 0x17e220ba8>,\n 'httplinkwashingtonpostcomclickahrchmlydcudfzagluzrvbnbvcquytlldmvcgzdcuyxrpbvdavmjaxniwnswnsozxjllwfyzsagutntgtcgvvcgxllxdobnllxnlbnrlbmnlcywcmvzawrlbnqtbjhbwetanvzdcjbtdxrlzcdbtbtxjndwaxnyyzubfkywlsetiwmgcaeadcbcfcccacae': <gensim.models.word2vec.Vocab at 
0x17e220c18>,\n 'thirdlargest': <gensim.models.word2vec.Vocab at 0x17e220c50>,\n 'iiabqqkxefnwqt': <gensim.models.word2vec.Vocab at 0x17e220c88>,\n 'rushing': <gensim.models.word2vec.Vocab at 0x17e220cc0>,\n 'gruender': <gensim.models.word2vec.Vocab at 0x17e220cf8>,\n 'demlawyerscouncildemocratsorgmailtodemlawyerscouncildemocratsorg': <gensim.models.word2vec.Vocab at 0x17e220d30>,\n 'ditchhttpwwwtampabaycomnewspoliticsnationalsenmarcorubioletsberealisticandditchcomprehensiveimmigration': <gensim.models.word2vec.Vocab at 0x17e220d68>,\n 'waltzed': <gensim.models.word2vec.Vocab at 0x17e220da0>,\n 'httpgopoliticoemailcomqsaceffdfafbecebefffefefcbf': <gensim.models.word2vec.Vocab at 0x17e220dd8>,\n 'bump': <gensim.models.word2vec.Vocab at 0x17e220e10>,\n 'mailtommatthewsdenverpostcom': <gensim.models.word2vec.Vocab at 0x15bd92c50>,\n 'selftalk': <gensim.models.word2vec.Vocab at 0x17e220e80>,\n 'httpsmediumcompaulbromleysourceemailccdbafdailydigest': <gensim.models.word2vec.Vocab at 0x17e220eb8>,\n 'abdulmutallab': <gensim.models.word2vec.Vocab at 0x17e220ef0>,\n 'pmpmurlblockederroraspx': <gensim.models.word2vec.Vocab at 0x17e220f28>,\n 'httplinkwashingtonpostcomclickahrchmlydcudfzagluzrvbnbvcquytlbvbglawnzlnhbmrlcnmtzmfjzxmtdgzgtcvsbcpbiwzxjzdwfkawnlxncgvyzgvszwdhdgvzlxrvlxnaxrjachbgxlzlhbmnlcyymdelzalzaleotexzdmyltexmzutmtflnimwiltumweyzrjndjkzlzdgyesodgsprpzdzbvdyzcgtptemdbpcjjpwsxrhawxmjaycaeadcbcfcddbc': <gensim.models.word2vec.Vocab at 0x17e220f60>,\n 'wmata': <gensim.models.word2vec.Vocab at 0x17e220f98>,\n 'httpclickemailbostonglobecomqsfebadfdbdeeeaedefbefdaeddbbc': <gensim.models.word2vec.Vocab at 0x17e220fd0>,\n 'httpstemanetmessageqyxaibsghl': <gensim.models.word2vec.Vocab at 0x15bdcb550>,\n 'francescachambersmailonlinecommailtofrancescachambersmailonlinecom': <gensim.models.word2vec.Vocab at 0x12fdc1d30>,\n 
'httplinkwashingtonpostcomclickahrcdovlddyuexrpbwvzlmnvbsymdelzalzexlvzlbvbglawnzlhpbgxhcnktyxpbnrvbihbgllbnmuahrtbdyzwycgsaxrpymmximczcgtptemdbpcjjpwsxrhawxmjaycaeadcbcfccab': <gensim.models.word2vec.Vocab at 0x12fdc1ba8>,\n 'sundayshow': <gensim.models.word2vec.Vocab at 0x12fdc1b00>,\n 'kasch': <gensim.models.word2vec.Vocab at 0x12fdc1da0>,\n 'httpgopoliticoemailcomqsdbbbadeaefeefefafaaadaecee': <gensim.models.word2vec.Vocab at 0x12fdc1c50>,\n 'herehttpstoolboxdncorgtoolnamevantageuploaderpathvantageuploaderdncorgvideossharedshowjwteyjexaioijkvqilcjhbgcioijiuzinijeyjpyxqiojenjiymdiwmtqsimvtywlsijoiymhhdghzfyyubkbmmubjniiwiawqiojmxndaoswizgbmxvywrhymxlijpcnvlfqwibtgshjkrhigfypxgwbbeonalvtvpnvvyts': <gensim.models.word2vec.Vocab at 0x12fdc1b38>,\n 'atobiasgmailcommailtoatobiasgmailcommailtoatobiasgmailcom': <gensim.models.word2vec.Vocab at 0x12fdc1a90>,\n 'redesigned': <gensim.models.word2vec.Vocab at 0x12fdc1cf8>,\n 'workrelated': <gensim.models.word2vec.Vocab at 0x12fdc1a58>,\n 'officeoficina': <gensim.models.word2vec.Vocab at 0x12fdc1978>,\n 'denbury': <gensim.models.word2vec.Vocab at 0x12fdc1be0>,\n 'buellers': <gensim.models.word2vec.Vocab at 0x12fdc1e48>,\n 'goldplated': <gensim.models.word2vec.Vocab at 0x12fdc1c88>,\n 'httpgopoliticoemailcomqseabaebbdbbbddfafcfbedddccecdcc': <gensim.models.word2vec.Vocab at 0x12fdc1f28>,\n 'constructionveterans': <gensim.models.word2vec.Vocab at 0x12fdc1a20>,\n 'httptinygroceryuslistmanagecomtrackclickucbfdbfccebccidadbeeaba': <gensim.models.word2vec.Vocab at 0x12fdc1e10>,\n 'httplinkwashingtonpostcomclickahrchmlydldgvylmnvbszcgvhavycnlhbizdgfdxmvnzmwodawotmndyoduotyypdwbwmszcglzcmmbmxfzgfpbhkymdicaeadcbcfccedc': <gensim.models.word2vec.Vocab at 0x15bd92d68>,\n 'rejoin': <gensim.models.word2vec.Vocab at 0x105d7a908>,\n 'provoke': <gensim.models.word2vec.Vocab at 0x105d7ab70>,\n 'httpcatouslistmanagecomunsubscribeucfddebcidceefdfedccae': <gensim.models.word2vec.Vocab at 0x105d7a278>,\n 'lister': <gensim.models.word2vec.Vocab 
at 0x15aed38d0>,\n 'marathoner': <gensim.models.word2vec.Vocab at 0x105d7ac50>,\n 'taxes': <gensim.models.word2vec.Vocab at 0x105d7abe0>,\n 'leadershipreid': <gensim.models.word2vec.Vocab at 0x1300dc048>,\n 'gcroninraskycommailtogcroninraskycom': <gensim.models.word2vec.Vocab at 0x1300dc080>,\n 'httpmmassageuslistmanagecomunsubscribeuacaeebaidddcfceebbfccfc': <gensim.models.word2vec.Vocab at 0x1300dc0b8>,\n 'cliques': <gensim.models.word2vec.Vocab at 0x1300dc0f0>,\n 'employment': <gensim.models.word2vec.Vocab at 0x1300dc128>,\n 'watchhttpstoolboxdncorgtoolnamevantageuploaderpathvantageuploaderdncorgvideossharedshowjwteyjexaioijkvqilcjhbgcioijiuzinijeyjpyxqiojenjemtuynjmsimvtywlsijoicgscuakbkbmmubjniiwiawqiojmxmtcxmcwizgbmxvywrhymxlijpcnvlfqmqdhgayanyixgrhenzdkeqimqiaqdolqetxsg': <gensim.models.word2vec.Vocab at 0x15bd4f2b0>,\n 'mailtokevindiazchroncom': <gensim.models.word2vec.Vocab at 0x1300dc160>,\n 'spanmsohyperlinkfollowed': <gensim.models.word2vec.Vocab at 0x1300dc198>,\n 'warzel': <gensim.models.word2vec.Vocab at 0x1300dc1d0>,\n 'cidacdbcceddecac': <gensim.models.word2vec.Vocab at 0x1300dc208>,\n 'experiencequot': <gensim.models.word2vec.Vocab at 0x1300dc240>,\n 'papp': <gensim.models.word2vec.Vocab at 0x1300dc278>,\n 'backgrounders': <gensim.models.word2vec.Vocab at 0x1300dc2b0>,\n 'kabuki': <gensim.models.word2vec.Vocab at 0x1300dc2e8>,\n 'lemus': <gensim.models.word2vec.Vocab at 0x1300dc320>,\n 'flyboy': <gensim.models.word2vec.Vocab at 0x1300dc358>,\n 'toles': <gensim.models.word2vec.Vocab at 0x1300dc390>,\n 'befit': <gensim.models.word2vec.Vocab at 0x1300dc3c8>,\n 'noncollege': <gensim.models.word2vec.Vocab at 0x1300dc400>,\n 'teambuilding': <gensim.models.word2vec.Vocab at 0x1300dc438>,\n 'httpwwwnytimescomusconradburnsobituaryformermontanasenatordiesathtmlrefpolitics': <gensim.models.word2vec.Vocab at 0x1300dc470>,\n 'httpswwwyoutubecomwatchvcdfosgkifeatureyoutube': <gensim.models.word2vec.Vocab at 0x1300dc4a8>,\n 'upfront': 
<gensim.models.word2vec.Vocab at 0x1300dc4e0>,\n 'rachanadixit': <gensim.models.word2vec.Vocab at 0x1300dc518>,\n 'eviscerating': <gensim.models.word2vec.Vocab at 0x1300dc550>,\n 'lamentable': <gensim.models.word2vec.Vocab at 0x15a2dc0f0>,\n 'wfmz': <gensim.models.word2vec.Vocab at 0x1300dc5c0>,\n 'unintentionally': <gensim.models.word2vec.Vocab at 0x1300dc5f8>,\n 'hannan': <gensim.models.word2vec.Vocab at 0x1300dc630>,\n 'ntion': <gensim.models.word2vec.Vocab at 0x1300dc668>,\n 'watchhttpstoolboxdncorgtoolnamevantageuploaderpathvantageuploaderdncorgvideossharedshowjwteyjexaioijkvqilcjhbgcioijiuzinijeyjpyxqiojenjiotkndqsimvtywlsijoicgscuakbkbmmubjniiwiawqiojmxnzyzncwizgbmxvywrhymxlijpcnvlfqjmtpqstlvzbkojtmjpjlnyjkgetcwlbfea': <gensim.models.word2vec.Vocab at 0x1300dc6a0>,\n 'traficantes': <gensim.models.word2vec.Vocab at 0x1300dc6d8>,\n 'politicususa': <gensim.models.word2vec.Vocab at 0x1300dc710>,\n 'httpclickeusatodaycomqscaeafebadffbfbbbeacfaebaadbdcdca': <gensim.models.word2vec.Vocab at 0x1300dc748>,\n 'missouri': <gensim.models.word2vec.Vocab at 0x1300dc780>,\n 'shirlington': <gensim.models.word2vec.Vocab at 0x1300dc7b8>,\n 'airwaves': <gensim.models.word2vec.Vocab at 0x1300dc7f0>,\n 'unsubscribehttpwwwpoliticocomunsubscribeebdbaebuefddadffasadeddceaeadcebaebaefffdafaafecefbbae': <gensim.models.word2vec.Vocab at 0x1300dc828>,\n 'obtains': <gensim.models.word2vec.Vocab at 0x15b0c6710>,\n 'timberwolves': <gensim.models.word2vec.Vocab at 0x15ba0bcc0>,\n 'httpsinstagramcomvc': <gensim.models.word2vec.Vocab at 0x1300dc8d0>,\n 'phonenumber': <gensim.models.word2vec.Vocab at 0x1300dc908>,\n 'ignorancehttpwwwhuffingtonpostcombriannormoylenevadademocraticconventbhtml': <gensim.models.word2vec.Vocab at 0x1300dc940>,\n 'sonnenfeld': <gensim.models.word2vec.Vocab at 0x1300dc978>,\n 'run': <gensim.models.word2vec.Vocab at 0x1300dc9e8>,\n 'oblivious': <gensim.models.word2vec.Vocab at 0x1300dca20>,\n 'httpclickeusatodaycomqsaabdfbfbfffdbbdcbfefbdaaa': 
<gensim.models.word2vec.Vocab at 0x1300dca58>,\n 'bloomberghttpnhdpuslistmanagecomtrackclickudafbdecideedbeaacce': <gensim.models.word2vec.Vocab at 0x1300dca90>,\n 'miliband': <gensim.models.word2vec.Vocab at 0x1300dcac8>,\n 'illfated': <gensim.models.word2vec.Vocab at 0x1300dcb00>,\n 'shripalshahgmailcom': <gensim.models.word2vec.Vocab at 0x1300dcb38>,\n 'prerogative': <gensim.models.word2vec.Vocab at 0x1300dcba8>,\n 'effortbetween': <gensim.models.word2vec.Vocab at 0x1300dcbe0>,\n 'womenrsquos': <gensim.models.word2vec.Vocab at 0x1300dcc18>,\n 'mains': <gensim.models.word2vec.Vocab at 0x1300dcc50>,\n 'heal': <gensim.models.word2vec.Vocab at 0x1300dcc88>,\n 'gangkhar': <gensim.models.word2vec.Vocab at 0x15b0c67b8>,\n 'calturnercalcom': <gensim.models.word2vec.Vocab at 0x1300dccf8>,\n 'distancing': <gensim.models.word2vec.Vocab at 0x1300dcd30>,\n 'carlos': <gensim.models.word2vec.Vocab at 0x1300dcd68>,\n 'httpclickemailbostonglobecomqsaaafeffafcfdccfeecfaacfcaecfdbe': <gensim.models.word2vec.Vocab at 0x15a2fdeb8>,\n 'belloni': <gensim.models.word2vec.Vocab at 0x1300dcdd8>,\n 'birmingham': <gensim.models.word2vec.Vocab at 0x1300dce10>,\n 'sestak': <gensim.models.word2vec.Vocab at 0x1300dce48>,\n 'judgejeaninehttpstwittercomjudgejeanine': <gensim.models.word2vec.Vocab at 0x1300dce80>,\n 'httpmobilereuterscomarticleiduskcnyjofeedtyperssfeednametopnewsutmsourcetwitterutmmediumsocial': <gensim.models.word2vec.Vocab at 0x1300dceb8>,\n 'httplinkwashingtonpostcomclickahrchmlydcudfzagluzrvbnbvcquytljsbdzlvyawstdvtcgxlldwlziwmtyvmduvmtcvbwvnewtavsbhlzlwjhbmtydxblwludgvydmlldyaxrolwrvbmfszccnvtccdbtbtxjndwaxnyyzubfvcgluawucwadbdeafeca': <gensim.models.word2vec.Vocab at 0x1300dcef0>,\n 'mobility': <gensim.models.word2vec.Vocab at 0x1300dcf28>,\n 'bone': <gensim.models.word2vec.Vocab at 0x1300dcf60>,\n 'steelesidewire': <gensim.models.word2vec.Vocab at 0x1300dcf98>,\n 
'httplinkwashingtonpostcomclickahrchmlydcudfzagluzrvbnbvcquytlldmvdghllwzpecccymdelzalzaxlroaxmtbmvlwluzglhbmetcgsbcpcyzxjlwjhzcuzxdzlwzvciagutcrvcccnvtcctbzlbwvudcdbtbtxjndwaxnyyzubfkywlsetiwmgcaeadcbcfccdd': <gensim.models.word2vec.Vocab at 0x1300dcfd0>,\n 'httpwwwlatimescomlocallanowlamelndonaldtrumpwhitenationalistdelegatestoryhtml': <gensim.models.word2vec.Vocab at 0x1300e2048>,\n 'talker': <gensim.models.word2vec.Vocab at 0x1300e2080>,\n 'httpsidewireuslistmanagecomunsubscribeudffdeaecccaffideeabbefebcbfeb': <gensim.models.word2vec.Vocab at 0x1300e20b8>,\n 'thth': <gensim.models.word2vec.Vocab at 0x1300e20f0>,\n 'ten': <gensim.models.word2vec.Vocab at 0x1300e2128>,\n 'carol': <gensim.models.word2vec.Vocab at 0x1300e2160>,\n 'httpcnnuslistmanagecomunsubscribeucfffabdeidaeecbaacafd': <gensim.models.word2vec.Vocab at 0x1300e21d0>,\n 'simcakoski': <gensim.models.word2vec.Vocab at 0x1300e2208>,\n 'httpbitlyoqplf': <gensim.models.word2vec.Vocab at 0x1300e2240>,\n 'commerciala': <gensim.models.word2vec.Vocab at 0x1300e2278>,\n 'grimm': <gensim.models.word2vec.Vocab at 0x1300e22b0>,\n 'disappoints': <gensim.models.word2vec.Vocab at 0x1300e22e8>,\n 'evoice': <gensim.models.word2vec.Vocab at 0x1300e2320>,\n 'taskforce': <gensim.models.word2vec.Vocab at 0x1300e2358>,\n 'wildbilljunocommailtowildbilljunocom': <gensim.models.word2vec.Vocab at 0x1300e2390>,\n 'buttons': <gensim.models.word2vec.Vocab at 0x1300e23c8>,\n 'piggy': <gensim.models.word2vec.Vocab at 0x1300e2400>,\n 'shoal': <gensim.models.word2vec.Vocab at 0x1300e2438>,\n 'phonein': <gensim.models.word2vec.Vocab at 0x1300e2470>,\n 'lowpolling': <gensim.models.word2vec.Vocab at 0x1300e24a8>,\n 'httplinkwashingtonpostcomclickahrcdovlddysyxrpbwvzlmnvbswbxpdgljcysyswbwtcfjlwftasizxjhlwzhdghlcijywwywlnbitblesymdemduxmczdgyesodgspdwbwmszcglzcmmbmxfzgfpbhkymdicaeadcbcfccdbb': <gensim.models.word2vec.Vocab at 0x15a2eda90>,\n 'sahttpwwwopensecretsorglobbyclientsumphpidfyear': <gensim.models.word2vec.Vocab at 
0x1300e2518>,\n 'danmericacnncommailtodanmericacnncom': <gensim.models.word2vec.Vocab at 0x1300e2550>,\n 'httpclickeusatodaycomqsffceaccbeebbdcacfedbcdadfcaff': <gensim.models.word2vec.Vocab at 0x1300e2588>,\n 'httpdemocratsuslistmanagecomtrackclickucadbafefdidafdeaaa': <gensim.models.word2vec.Vocab at 0x1300e25c0>,\n 'yorkespecially': <gensim.models.word2vec.Vocab at 0x1300e25f8>,\n 'watchhttpstoolboxdncorgtoolnamevantageuploaderpathvantageuploaderdncorgvideossharedshowjwteyjexaioijkvqilcjhbgcioijiuzinijeyjpyxqiojenjimjcotysimvtywlsijoicgscuakbkbmmubjniiwiawqiojmxnjkwnswizgbmxvywrhymxlijpcnvlfqeeavnsbmukiyrybkmwqhuxsfydlzsugzu': <gensim.models.word2vec.Vocab at 0x1300e2630>,\n 'deathbed': <gensim.models.word2vec.Vocab at 0x1300e2668>,\n 'epsteinhe': <gensim.models.word2vec.Vocab at 0x1300e26a0>,\n 'httpclickemailbostonglobecomqsaafaccfcadfaafbecefbedbbdfeaa': <gensim.models.word2vec.Vocab at 0x1300e26d8>,\n 'httpgopoliticoemailcomqsbbfbaecaebcaaeacddccbbdefadfdbf': <gensim.models.word2vec.Vocab at 0x1300e2710>,\n 'mcardle': <gensim.models.word2vec.Vocab at 0x1300e2748>,\n 'creditor': <gensim.models.word2vec.Vocab at 0x1300e2780>,\n 'publicsafety': <gensim.models.word2vec.Vocab at 0x1300e27b8>,\n 'dog': <gensim.models.word2vec.Vocab at 0x1300e27f0>,\n 'sharpie': <gensim.models.word2vec.Vocab at 0x1300e2828>,\n 'conventionhttpwwwsltribcomhomerollygovherbertgottagteamedat': <gensim.models.word2vec.Vocab at 0x1300e2860>,\n 'battled': <gensim.models.word2vec.Vocab at 0x1300e2898>,\n 'shedd': <gensim.models.word2vec.Vocab at 0x1300e28d0>,\n 'httplinkwashingtonpostcomclickahrchmlydcudfzagluzrvbnbvcquytlldmvcgzdcuyxrpbvdavmjaxniwnsxmimbjtzxitbmvlxlvcmstcrhdgutcvuyxrllwhamyaxrlwxlywrlcizzwzwjzwqtdgtzmlzszwfycypbimzwrlcmfslxbyaxnvbidbtbtxjndwaxnyyzubfkywlsetiwmgcaeadcbcfccaf': <gensim.models.word2vec.Vocab at 0x15bd96240>,\n 'scribbled': <gensim.models.word2vec.Vocab at 0x1300e2940>,\n 'destac': <gensim.models.word2vec.Vocab at 0x1300e2978>,\n 'duome': 
<gensim.models.word2vec.Vocab at 0x1300e29b0>,\n 'madigans': <gensim.models.word2vec.Vocab at 0x1300e29e8>,\n 'akron': <gensim.models.word2vec.Vocab at 0x1300e2a58>,\n 'refueling': <gensim.models.word2vec.Vocab at 0x1300e2a90>,\n 'depot': <gensim.models.word2vec.Vocab at 0x1300e2ac8>,\n 'httpswwwfacebookcomnnotificationsmediumemailmidedcdgeagaccagbgbcodeabkmkckurgheconmwrightadncorgllocstcta': <gensim.models.word2vec.Vocab at 0x1300e2b00>,\n 'httpuscampaignarchivecomucfffabdeidfadeeb': <gensim.models.word2vec.Vocab at 0x1300e2b38>,\n 'cheering': <gensim.models.word2vec.Vocab at 0x1300e2b70>,\n 'donald': <gensim.models.word2vec.Vocab at 0x1300e2ba8>,\n 'chargeshttpwwwpoliticocomstoryscammersfeastoftrumpfundraisingdisarray': <gensim.models.word2vec.Vocab at 0x1300e2be0>,\n 'abcnewsgocompoliticsvicehttpstcooxrsvufq': <gensim.models.word2vec.Vocab at 0x1300e2c18>,\n 'dionne': <gensim.models.word2vec.Vocab at 0x17e48aba8>,\n 'chobani': <gensim.models.word2vec.Vocab at 0x1300e2c88>,\n 'krissy': <gensim.models.word2vec.Vocab at 0x1300e2cc0>,\n 'cantered': <gensim.models.word2vec.Vocab at 0x1300e2cf8>,\n 'uplet': <gensim.models.word2vec.Vocab at 0x17e48d198>,\n 'firstterm': <gensim.models.word2vec.Vocab at 0x17e48d400>,\n 'facebookcommarilynddavishttpfacebookcommarilynddavis': <gensim.models.word2vec.Vocab at 0x1300e2da0>,\n 'systemhttpswwwwashingtonpostcomopinionsaftertrumpthegopmayneedabettervotingsystemcacebedfastoryhtml': <gensim.models.word2vec.Vocab at 0x15ba0e0b8>,\n 'fallsmanaging': <gensim.models.word2vec.Vocab at 0x1300e2e10>,\n 'wild': <gensim.models.word2vec.Vocab at 0x1300e2e48>,\n 'mailtogregschollphmloanscom': <gensim.models.word2vec.Vocab at 0x1300e2e80>,\n 'started': <gensim.models.word2vec.Vocab at 0x1300e2eb8>,\n 'httpclickemailbostonglobecomqsaaccdbceedaaebfdedfeaece': <gensim.models.word2vec.Vocab at 0x1300e2ef0>,\n 'implodes': <gensim.models.word2vec.Vocab at 0x1300e2f28>,\n 'torrez': <gensim.models.word2vec.Vocab at 0x1300e2f60>,\n 'signify': 
<gensim.models.word2vec.Vocab at 0x1300e2f98>,\n 'doghttpwwwpoliticocomstorytimkainehillaryclintonattack': <gensim.models.word2vec.Vocab at 0x1300e2fd0>,\n 'smartest': <gensim.models.word2vec.Vocab at 0x1300df048>,\n 'downhttpwwwnbcnewscomidnspoliticstmohighcourtstrikesdownvoteridlawvykvoamrkgq': <gensim.models.word2vec.Vocab at 0x1300df080>,\n 'micromanaging': <gensim.models.word2vec.Vocab at 0x1300df0b8>,\n 'tissues': <gensim.models.word2vec.Vocab at 0x1300df0f0>,\n 'httplinkwashingtonpostcomoccaeadcbcfcxpyvyua': <gensim.models.word2vec.Vocab at 0x1300df128>,\n 'philanthropistdefends': <gensim.models.word2vec.Vocab at 0x1300df160>,\n 'libertarianminded': <gensim.models.word2vec.Vocab at 0x1300df198>,\n 'stateshttpsenwikipediaorgwikiunitedstates': <gensim.models.word2vec.Vocab at 0x1300df1d0>,\n 'itsonusorg': <gensim.models.word2vec.Vocab at 0x1300df208>,\n 'azcentral': <gensim.models.word2vec.Vocab at 0x1300df240>,\n 'craigjohnsonsstgborgmailtocraigjohnsonsstgborg': <gensim.models.word2vec.Vocab at 0x1300df278>,\n 'httpgopoliticoemailcomqsccdceaeceafcbcdebfc': <gensim.models.word2vec.Vocab at 0x1300df2b0>,\n 'gilad': <gensim.models.word2vec.Vocab at 0x1300df2e8>,\n 'birtherinchief': <gensim.models.word2vec.Vocab at 0x1300df320>,\n 'wagoner': <gensim.models.word2vec.Vocab at 0x1300df358>,\n 'tinged': <gensim.models.word2vec.Vocab at 0x15c11ec50>,\n 'selections': <gensim.models.word2vec.Vocab at 0x15c137f60>,\n 'powertuesdays': <gensim.models.word2vec.Vocab at 0x1300df390>,\n 'stumped': <gensim.models.word2vec.Vocab at 0x1300df3c8>,\n 'cidimagejpgdaffeb': <gensim.models.word2vec.Vocab at 0x1300df400>,\n 'fraying': <gensim.models.word2vec.Vocab at 0x1300df438>,\n 'listhttpamericanbridgepacuslistmanagecomunsubscribeueebfeedcfeeffdidcfcebcdbbccca': <gensim.models.word2vec.Vocab at 0x1300df470>,\n 'ledonnesdncorgmailtoledonnesdncorg': <gensim.models.word2vec.Vocab at 0x1300df4a8>,\n 'wer': <gensim.models.word2vec.Vocab at 0x1300df4e0>,\n 
'httpmittomailcomphplistltphpidzhawuzwgpawrqavg': <gensim.models.word2vec.Vocab at 0x1300df518>,\n 'husbands': <gensim.models.word2vec.Vocab at 0x1300df550>,\n 'mdewakanton': <gensim.models.word2vec.Vocab at 0x1300df588>,\n 'gaystraight': <gensim.models.word2vec.Vocab at 0x1300df5c0>,\n 'lauralscastingorg': <gensim.models.word2vec.Vocab at 0x1300df5f8>,\n 'precedes': <gensim.models.word2vec.Vocab at 0x1300df630>,\n 'aviator': <gensim.models.word2vec.Vocab at 0x15b0c6da0>,\n 'wcllinaspbsorg': <gensim.models.word2vec.Vocab at 0x1300df6a0>,\n 'goody': <gensim.models.word2vec.Vocab at 0x1300df6d8>,\n 'httplinkwashingtonpostcomclickahrchmlydcudfzagluzrvbnbvcquytlldmvcgfyzwawnldwlziwmtyvmdqvmjyvdghhdchdzbctblbnqtcgfyzwcyvzipbnrlcnjhylhbcjaglszhjlbiawxslxbybjhymxlwzhyuvpdwbwmszcglzcmmbmxfcgfyzwcaeadcbcfceee': <gensim.models.word2vec.Vocab at 0x1300df710>,\n 'trumphttpwwwbloombergcompoliticsarticlescruzandkasichcutdealtotryandstoptrump': <gensim.models.word2vec.Vocab at 0x1300df748>,\n 'transperson': <gensim.models.word2vec.Vocab at 0x15b0c6e10>,\n 'nervously': <gensim.models.word2vec.Vocab at 0x1300df7b8>,\n 'dinged': <gensim.models.word2vec.Vocab at 0x1300df7f0>,\n 'gazettes': <gensim.models.word2vec.Vocab at 0x1300df828>,\n 'manpads': <gensim.models.word2vec.Vocab at 0x1300df860>,\n 'httplinkwashingtonpostcomclickahrcdovlrozwhpbgwuytlhvbwvuzxdzlnhbxbhawdulzimdcmicnvtccjywwywlnbixdwlldgxlwnvdxjcytdxnsawzpdwbwmszcglzcmmbmxfzgfpbhkymdicaeadcbcfcce': <gensim.models.word2vec.Vocab at 0x1300df898>,\n 'httplinkwashingtonpostcomclickahrchmlydcuewdhvizsjbvdfygdjymgxdxnnegliyyzcgtptemdbpcjjpwsxrhawxmjaycaeadcbcfcjbbf': <gensim.models.word2vec.Vocab at 0x1300df8d0>,\n 'watchhttpstoolboxdncorgtoolnamevantageuploaderpathvantageuploaderdncorgvideossharedshowjwteyjexaioijkvqilcjhbgcioijiuzinijeyjpyxqiojenjiotkndysimvtywlsijoicgscuakbkbmmubjniiwiawqiojmxnzyznswizgbmxvywrhymxlijpcnvlfqrvqgtxhsrmlffzqldfjcovknbabphcvm': <gensim.models.word2vec.Vocab at 0x1300df908>,\n 'brodsky': 
<gensim.models.word2vec.Vocab at 0x1300df940>,\n 'httpswwwdropboxcomlsvufwqfpqyupiisdhadaltext': <gensim.models.word2vec.Vocab at 0x1300df978>,\n 'watchhttpstoolboxdncorgtoolnamevantageuploaderpathvantageuploaderdncorgvideossharedshowjwteyjexaioijkvqilcjhbgcioijiuzinijeyjpyxqiojenjmotkndusimvtywlsijoicbvbgfyawnozbkbmmubjniiwiawqiojmymdayncwizgbmxvywrhymxlijpcnvlfqvzxyspriunssrgxbipwrneamkrjijuqs': <gensim.models.word2vec.Vocab at 0x1300df9b0>,\n 'notsogood': <gensim.models.word2vec.Vocab at 0x1300df9e8>,\n 'eckington': <gensim.models.word2vec.Vocab at 0x1300dfa20>,\n 'thathttpswwwwashingtonpostcomnewsthefixwpdonaldtrumptherehastobesomeformofpunishmentforwomenwhogetabortions': <gensim.models.word2vec.Vocab at 0x1300dfa58>,\n 'chabria': <gensim.models.word2vec.Vocab at 0x1300dfac8>,\n 'unsatisfying': <gensim.models.word2vec.Vocab at 0x1300dfb00>,\n 'quantifies': <gensim.models.word2vec.Vocab at 0x17e49d390>,\n 'blenheim': <gensim.models.word2vec.Vocab at 0x1300dfb70>,\n 'httpsmediumcomgitoutthevotesourceemailccdbafdailydigest': <gensim.models.word2vec.Vocab at 0x1300dfba8>,\n 'josephbpaulsenwhoeopgov': <gensim.models.word2vec.Vocab at 0x1300dfbe0>,\n 'namecallingcontinues': <gensim.models.word2vec.Vocab at 0x1300dfc18>,\n 'httplinkwashingtonpostcomclickahrchmlydldgvylmnvbsqbjnzvndwfqyxjkbyzdgfdxmvnzimzizodqntmmjqxnjaxpdwbwmszcglzcmmbmxfzgfpbhkymdicaeadcbcfcced': <gensim.models.word2vec.Vocab at 0x1300dfc50>,\n 'httpclickemailbostonglobecomqsbdbffbdaecdeeddecfbebbeacbcbebdda': <gensim.models.word2vec.Vocab at 0x1300dfc88>,\n 'watchhttpstoolboxdncorgtoolnamevantageuploaderpathvantageuploaderdncorgvideossharedshowjwteyjexaioijkvqilcjhbgcioijiuzinijeyjpyxqiojenjentqntusimvtywlsijoicgvzxjzbrqgruyyvcmcilcjpzcimzeynzylcjkbdubghzgfibguionrydwvnaxehdbucrqvmuglqjsepaocdglkntxtegq': <gensim.models.word2vec.Vocab at 0x1300dfcc0>,\n 'usitcs': <gensim.models.word2vec.Vocab at 0x1300dfcf8>,\n 'amplifies': <gensim.models.word2vec.Vocab at 0x17e49dda0>,\n 
'httplinkwashingtonpostcomclickahrchmlydcudfzagluzrvbnbvcquytlldmvyfwaxrhbczwfagvylwdhbmcvdavmjaxniwnsxmcklwmtyxjlysmbjlyfzdczagzxjzlwnvbnrpbnvllxroaxmtdvlayaxrolwnvbwtdgvtcgvyyxrcmvzlwfuzcjbgzhktctpzxmvpdwbwmszcglzcmmbmxfzgfpbhkymdicaeadcbcfccadae': <gensim.models.word2vec.Vocab at 0x1300dfda0>,\n 'munk': <gensim.models.word2vec.Vocab at 0x1300dfdd8>,\n 'consigliore': <gensim.models.word2vec.Vocab at 0x1300dfe10>,\n 'httpgopoliticoemailcomqsbafdafaedafacfdbaecbdeacc': <gensim.models.word2vec.Vocab at 0x1300dfe48>,\n 'unsubscribehttpwwwpoliticocomunsubscribeeddadccadedfaduefddadffasffaafdadbfecbddcadcedaacfddebbebdecbafcbcdedcbffcfbeca': <gensim.models.word2vec.Vocab at 0x1300dfe80>,\n 'httplinkwashingtonpostcomclickahrcdovlddyyxnoawndgucgzdcjbvchjpdmfjeswbxpykvmjaxmsxmsxocnsvfbulpywloxnbjlmhbwwdbtbtxjndwaxnyyzubftaxgcaeadcbcfccbbe': <gensim.models.word2vec.Vocab at 0x1300dfeb8>,\n 'colberts': <gensim.models.word2vec.Vocab at 0x15cdf92b0>,\n 'watchhttpstoolboxdncorgtoolnamevantageuploaderpathvantageuploaderdncorgvideossharedshowjwteyjexaioijkvqilcjhbgcioijiuzinijeyjpyxqiojenjenzqxodysimvtywlsijoicgvzxjzbrqgruyyvcmcilcjpzcimzezmdylcjkbdubghzgfibguionrydwvpqjfqbsztngesppogsozsirxvkolhnrilpuzy': <gensim.models.word2vec.Vocab at 0x17e220710>,\n 'weissenstein': <gensim.models.word2vec.Vocab at 0x1300dff28>,\n 'twoperson': <gensim.models.word2vec.Vocab at 0x1300dffd0>,\n 'timethe': <gensim.models.word2vec.Vocab at 0x1300e9048>,\n 'httpgopoliticoemailcomqsaafdabfcdfccabfbccdbfdf': <gensim.models.word2vec.Vocab at 0x1300e9080>,\n 'katarina': <gensim.models.word2vec.Vocab at 0x1300e90b8>,\n 'considershttpcoloradodemsuslistmanagecomtrackclickufadeadfabidddeebbeab': <gensim.models.word2vec.Vocab at 0x1300e90f0>,\n 'lees': <gensim.models.word2vec.Vocab at 0x1300e9128>,\n 'httpclickemailbostonglobecomqsaaafeffdfddcaccaaebabdedadbfcabcb': <gensim.models.word2vec.Vocab at 0x15b024710>,\n 'dinner': <gensim.models.word2vec.Vocab at 0x1300e9198>,\n 'revival': 
<gensim.models.word2vec.Vocab at 0x15a868588>,\n 'httpclickemailbostonglobecomqsefccfdeafacafbfcddecaeeaaaaeeba': <gensim.models.word2vec.Vocab at 0x1300e91d0>,\n 'percentagepoint': <gensim.models.word2vec.Vocab at 0x1300e9208>,\n 'ratio': <gensim.models.word2vec.Vocab at 0x1300e9240>,\n 'muslimsabout': <gensim.models.word2vec.Vocab at 0x1300e9278>,\n 'sets': <gensim.models.word2vec.Vocab at 0x15ba0e588>,\n 'httplinkwashingtonpostcomclickahrcdovlddyjdhbvcquytlxvyfslfydgljbguvvtywtbwlzdgfrzwtzmylxryywzzvuzgvylwhhcmfzcvklwlultcnzenjyucghwpdwbwmszcglzcmmbmxfzgfpbhkymdicaeadcbcfcceb': <gensim.models.word2vec.Vocab at 0x1300e92e8>,\n 'httpdailycallercomdonaldtrumponbencarsondoctorsdontcreatejobs': <gensim.models.word2vec.Vocab at 0x1300e9320>,\n 'gillis': <gensim.models.word2vec.Vocab at 0x1300e9358>,\n 'ceffcca': <gensim.models.word2vec.Vocab at 0x1300e9390>,\n 'httpvarietycomtvnewsthecatchrenewedseasonabcshondalandmccidcbefmceiduniqid': <gensim.models.word2vec.Vocab at 0x15ae995c0>,\n 'bronzemirrored': <gensim.models.word2vec.Vocab at 0x17e4a57b8>,\n 'wwwsamanthadamatocomhttpwwwsamanthadamatocom': <gensim.models.word2vec.Vocab at 0x1300e9438>,\n 'yalla': <gensim.models.word2vec.Vocab at 0x1300e9470>,\n 'legislatorled': <gensim.models.word2vec.Vocab at 0x1300e94a8>,\n 'knx': <gensim.models.word2vec.Vocab at 0x15ac58080>,\n 'shoes': <gensim.models.word2vec.Vocab at 0x1300e94e0>,\n 'malloyhttpwwwcourantcompoliticshcmalloycompromisestoryhtml': <gensim.models.word2vec.Vocab at 0x1300e9518>,\n 'resuelve': <gensim.models.word2vec.Vocab at 0x1300e9550>,\n 'call': <gensim.models.word2vec.Vocab at 0x15ebc9048>,\n 'gagglemix': <gensim.models.word2vec.Vocab at 0x15ba0e5c0>,\n 'collides': <gensim.models.word2vec.Vocab at 0x1300e95f8>,\n 'mcdaniel': <gensim.models.word2vec.Vocab at 0x1300e9630>,\n 
'httplinkwashingtonpostcomclickahrchmlydcudfzagluzrvbnbvcquytlldmvcgzxjwbnldwlziwmtyvmduvmdmvzwlwxvbtzlxrvlwjystdhjbxbtzwdwtawtawkawfuyszzwhdgutchjpbwfyesdbtbtxjndwaxnyyzubfkywlsetiwmgcaeadcbcfcceab': <gensim.models.word2vec.Vocab at 0x1300e9668>,\n 'httpswwwyoutubecomwatchvfpiucxzeufeatureyoutube': <gensim.models.word2vec.Vocab at 0x1300e96a0>,\n 'khalilzad': <gensim.models.word2vec.Vocab at 0x1300e96d8>,\n 'submarines': <gensim.models.word2vec.Vocab at 0x1300e9710>,\n 'coopted': <gensim.models.word2vec.Vocab at 0x1300e9748>,\n 'fashion': <gensim.models.word2vec.Vocab at 0x1300e9780>,\n 'afforded': <gensim.models.word2vec.Vocab at 0x1300e97b8>,\n 'poughtdncorgmailtopoughtdncorgmailtopoughtdncorg': <gensim.models.word2vec.Vocab at 0x1300e97f0>,\n 'httplinkwashingtonpostcomclickahrchmlydldgvylmnvbsszwhzhvuagftlnyxrcymzmnjywotcmduwnzuymdadbtbtxjndwaxnyyzubfkywlsetiwmgcaeadcbcfccfae': <gensim.models.word2vec.Vocab at 0x1300e9828>,\n 'branford': <gensim.models.word2vec.Vocab at 0x1300e9860>,\n 'ari': <gensim.models.word2vec.Vocab at 0x1300e9898>,\n 'ark': <gensim.models.word2vec.Vocab at 0x1300e98d0>,\n 'kardashians': <gensim.models.word2vec.Vocab at 0x1300e9908>,\n 'tarheel': <gensim.models.word2vec.Vocab at 0x1300e9940>,\n 'httplinkwashingtonpostcomclickahrchmlydldgvylmnvbstcmrhbnphayzdgfdxmvnzmwnzgzodyndinzmzodkzpdwbwmszcglzcmmbmxfzgfpbhkymdicaeadcbcfccefe': <gensim.models.word2vec.Vocab at 0x1300e9978>,\n 'curse': <gensim.models.word2vec.Vocab at 0x1300e99b0>,\n 'httpgopoliticoemailcomqscbcefdeceefbabeedbafcce': <gensim.models.word2vec.Vocab at 0x1300e99e8>,\n 'corrosive': <gensim.models.word2vec.Vocab at 0x1300e9a20>,\n 'httpclickeusatodaycomqscbbbceadffebfeacfeedcfadfdcaeacc': <gensim.models.word2vec.Vocab at 0x1300e9a58>,\n 'warmup': <gensim.models.word2vec.Vocab at 0x1300e9a90>,\n 
'httplinkwashingtonpostcomclickahrcdovlddyuexrpbwvzlmnvbsymdelzalzeljcluzxnzlrlywxibrldhcnjlbiidwzmzxrlwfuzckywtzlsymvydcbmlzspbiiawqtdgtywnxdwlyzsywhvbyodgspyptamdbtbtxjndwaxnyyzubfkywlsetiwmgcaeadcbcfccddfda': <gensim.models.word2vec.Vocab at 0x1300e9ac8>,\n 'httpgopoliticoemailcomqsadbbadcebdcaecfdbadcccfe': <gensim.models.word2vec.Vocab at 0x15ae996a0>,\n 'yearshttpwwwcnncomopinionsnofinancialstabilitytodayconwayindexhtml': <gensim.models.word2vec.Vocab at 0x1300e9b38>,\n 'sweephttpwwwpoliticocomstorytrumpprimariespennsylvaniadelawaremarylandconnectictrhodeisland': <gensim.models.word2vec.Vocab at 0x1300e9b70>,\n 'httplinkwashingtonpostcomclickahrcdovlvbmvlmnubijbvmjaxniwnswnizwnobmsbdlnwywnlecybnrzxqtbgfuzgluzyiyxjnzsdbtbtxjndwaxnyyzubfkywlsetiwmgcaeadcbcfccecf': <gensim.models.word2vec.Vocab at 0x1300e9ba8>,\n 'supportershttpswwwwashingtonpostcomnewsthefixwphereswhathappenedatsaturdaysdramaticnevadademocraticconvention': <gensim.models.word2vec.Vocab at 0x1300e9be0>,\n 'poisonpill': <gensim.models.word2vec.Vocab at 0x1300e9c18>,\n 'leukemia': <gensim.models.word2vec.Vocab at 0x1300e9c50>,\n 'lchrtiorg': <gensim.models.word2vec.Vocab at 0x1300e9c88>,\n 'fullbore': <gensim.models.word2vec.Vocab at 0x17e4b0438>,\n 'deogracias': <gensim.models.word2vec.Vocab at 0x1300e9cf8>,\n 'na': <gensim.models.word2vec.Vocab at 0x1300e9d30>,\n 'mailtonaomileberlycommailtonaomileberlycommailtonaomileberlycommailtonaomileberlycom': <gensim.models.word2vec.Vocab at 0x17e4b0cf8>,\n 'splintering': <gensim.models.word2vec.Vocab at 0x1300e9da0>,\n 'schreck': <gensim.models.word2vec.Vocab at 0x1300e9dd8>,\n 'ansara': <gensim.models.word2vec.Vocab at 0x1300e9e10>,\n 'mailtomarshallmdncorg': <gensim.models.word2vec.Vocab at 0x1300e9e48>,\n 'httpgopoliticoemailcomqseddfecfafeceadebabcabebc': <gensim.models.word2vec.Vocab at 0x1300e9e80>,\n 'storch': <gensim.models.word2vec.Vocab at 0x1300e9eb8>,\n 'mailtolkennedyllkassociatescom': <gensim.models.word2vec.Vocab at 0x1300e9ef0>,\n 
'underwhelming': <gensim.models.word2vec.Vocab at 0x1300e9f28>,\n 'pollhttpwwwpeoplepressorggopsfavorabilityratingedgeslower': <gensim.models.word2vec.Vocab at 0x1300e9f60>,\n 'httpwwwmiamidadedemsorgconvention': <gensim.models.word2vec.Vocab at 0x1300e9f98>,\n 'httplinkwashingtonpostcomclickahrchmlydldgvylmnvbskzglhbwuzczdgfdxmvnzinjaodmnteymzgmdkpdwbwmszcglzcmmbmxfzgfpbhkymdicaeadcbcfcccdd': <gensim.models.word2vec.Vocab at 0x1300e9fd0>,\n 'bidenwarren': <gensim.models.word2vec.Vocab at 0x1300e3048>,\n 'bangladesh': <gensim.models.word2vec.Vocab at 0x1300e3080>,\n 'soninlaw': <gensim.models.word2vec.Vocab at 0x1300e30b8>,\n 'dind': <gensim.models.word2vec.Vocab at 0x1300e30f0>,\n 'sporadically': <gensim.models.word2vec.Vocab at 0x15bdb3668>,\n 'courta': <gensim.models.word2vec.Vocab at 0x1300e3160>,\n 'httpclickemailbostonglobecomqsefccfddcedfddebaaedacacafbbabacf': <gensim.models.word2vec.Vocab at 0x1300e3198>,\n 'cidbaeaddfca': <gensim.models.word2vec.Vocab at 0x1300e31d0>,\n 'economides': <gensim.models.word2vec.Vocab at 0x1300e3208>,\n 'justifiably': <gensim.models.word2vec.Vocab at 0x1300e3240>,\n 'faithbased': <gensim.models.word2vec.Vocab at 0x1300e3278>,\n 'observer': <gensim.models.word2vec.Vocab at 0x1300e32b0>,\n 'quintupled': <gensim.models.word2vec.Vocab at 0x1300e32e8>,\n 'ploy': <gensim.models.word2vec.Vocab at 0x1300e3320>,\n 'learyhttpbitlylmmf': <gensim.models.word2vec.Vocab at 0x1300e3358>,\n 'stephanopouloswhat': <gensim.models.word2vec.Vocab at 0x1300e3390>,\n 'httpclickemailbostonglobecomqsaebbabadddccfbebcbafbbcccbdddadcccdabcbccc': <gensim.models.word2vec.Vocab at 0x1300e33c8>,\n 'crossdepartmental': <gensim.models.word2vec.Vocab at 0x15c12e6d8>,\n 'visible': <gensim.models.word2vec.Vocab at 0x1300e3400>,\n 'ambassador': <gensim.models.word2vec.Vocab at 0x15b0c92e8>,\n 'scouting': <gensim.models.word2vec.Vocab at 0x1300e3470>,\n 'naecssde': <gensim.models.word2vec.Vocab at 0x1300e34a8>,\n 'ohios': <gensim.models.word2vec.Vocab at 
0x1300e34e0>,\n 'vetowner': <gensim.models.word2vec.Vocab at 0x15a3b37b8>,\n 'dwstappermonday': <gensim.models.word2vec.Vocab at 0x1300e3518>,\n 'httpwwwocregistercomarticleshotelanaheimcityhtml': <gensim.models.word2vec.Vocab at 0x1300e3550>,\n 'antagonizing': <gensim.models.word2vec.Vocab at 0x1300e3588>,\n 'valadao': <gensim.models.word2vec.Vocab at 0x15a868908>,\n 'httplinkwashingtonpostcomclickahrchmlydldgvylmnvbsqcfratqlnyxrcymjkntcmziodumjqxmjkdbtbtxjndwaxnyyzubfkywlsetiwmgcaeadcbcfccfaf': <gensim.models.word2vec.Vocab at 0x1300e3630>,\n 'kassa': <gensim.models.word2vec.Vocab at 0x1300e3668>,\n 'cloves': <gensim.models.word2vec.Vocab at 0x15c0c7668>,\n 'greensborohigh': <gensim.models.word2vec.Vocab at 0x1300e3710>,\n 'attachmenteml': <gensim.models.word2vec.Vocab at 0x1300e3748>,\n 'disavow': <gensim.models.word2vec.Vocab at 0x1300e3780>,\n 'blights': <gensim.models.word2vec.Vocab at 0x17e4bb4a8>,\n 'perpetuated': <gensim.models.word2vec.Vocab at 0x1300e37f0>,\n 'sibling': <gensim.models.word2vec.Vocab at 0x1300e3828>,\n 'europop': <gensim.models.word2vec.Vocab at 0x1300e3860>,\n 'snvmla': <gensim.models.word2vec.Vocab at 0x1300e3898>,\n 'consume': <gensim.models.word2vec.Vocab at 0x15a8689e8>,\n 'nutritious': <gensim.models.word2vec.Vocab at 0x1300e3908>,\n 'use': <gensim.models.word2vec.Vocab at 0x1300e3940>,\n 'passions': <gensim.models.word2vec.Vocab at 0x1300e3978>,\n 'negligible': <gensim.models.word2vec.Vocab at 0x1300e39b0>,\n 'grotondunstable': <gensim.models.word2vec.Vocab at 0x1300e39e8>,\n 'httplinkwashingtonpostcomclickahrchmlydcudfzagluzrvbnbvcquytlbvbglawnzlrydwwlwfuzcnbatbgvhzgvycytawdodcuzxzlciizsvbiagutcftzswywdllziwmtyvmduvmtevmzfinimmtmtcnyxmwultkyngqtodmnzuzmjkzjlhxnbjlmhbwwdbtbtxjndwaxnyyzubfkywlsetiwmgcaeadcbcfccecab': <gensim.models.word2vec.Vocab at 0x1300e3a20>,\n 'trough': <gensim.models.word2vec.Vocab at 0x1300e3a58>,\n 'pricejdncorgmailtopricejdncorg': <gensim.models.word2vec.Vocab at 0x1300e3a90>,\n 'thoughtsedits': 
<gensim.models.word2vec.Vocab at 0x1300e3ac8>,\n 'deacons': <gensim.models.word2vec.Vocab at 0x1300e3b00>,\n 'cancel': <gensim.models.word2vec.Vocab at 0x15b0c9400>,\n 'fiumegetty': <gensim.models.word2vec.Vocab at 0x1300e3b70>,\n 'search': <gensim.models.word2vec.Vocab at 0x1300e3ba8>,\n 'fiorina': <gensim.models.word2vec.Vocab at 0x133cd8358>,\n 'huffman': <gensim.models.word2vec.Vocab at 0x1300e3be0>,\n 'httpresourcesiconixxcomzauhucivyufkd': <gensim.models.word2vec.Vocab at 0x1300e3c18>,\n 'httpgopoliticoemailcomqsbeabafcbefbabcddbbcbffabe': <gensim.models.word2vec.Vocab at 0x1300e3c50>,\n 'httpclickemailbostonglobecomqsdbfaedefaddacdfabcbdeadfcdf': <gensim.models.word2vec.Vocab at 0x1300e3c88>,\n 'intact': <gensim.models.word2vec.Vocab at 0x1300e3cc0>,\n 'misusing': <gensim.models.word2vec.Vocab at 0x1300e3cf8>,\n 'bene': <gensim.models.word2vec.Vocab at 0x1300e3d30>,\n 'httpswwwwashingtonpostcompoliticsbillionairesliningupfortrumparentsurewheretosendtheirmoneyaaeeeeaaacstoryhtmlpostsharetidsstw': <gensim.models.word2vec.Vocab at 0x1300e3d68>,\n 'httpwwwpoliticocomstorydonaldtrumprepublicannomineetransitionixzzijqcin': <gensim.models.word2vec.Vocab at 0x1300e3da0>,\n 'httpbitlyypibcm': <gensim.models.word2vec.Vocab at 0x1300e3dd8>,\n 'httpgopoliticoemailcomqscbeeecedebafdcdaefffadfaa': <gensim.models.word2vec.Vocab at 0x1300e3e10>,\n 'httptwittercomintenttweettextfacebookfacingquestionsfromsenatebdisneysraremissbbobigerspeaksaboutsuccessionbcornellnolongerdailysunbtheyearofcarldigglermccidbaccdmceiduniqid': <gensim.models.word2vec.Vocab at 0x1300e3e48>,\n 'intelto': <gensim.models.word2vec.Vocab at 0x1300e3e80>,\n 'bagles': <gensim.models.word2vec.Vocab at 0x1300e3eb8>,\n 'cnnhttpwwwcnncompoliticsjohnkasichiraqwar': <gensim.models.word2vec.Vocab at 0x1300e3ef0>,\n 'beacon': <gensim.models.word2vec.Vocab at 0x1300e3f28>,\n 'httpswwwhillaryclintoncomeventsviewskqwtstnfuynvou': <gensim.models.word2vec.Vocab at 0x15a36a2e8>,\n 
'watchhttpstoolboxdncorgtoolnamevantageuploaderpathvantageuploaderdncorgvideossharedshowjwteyjexaioijkvqilcjhbgcioijiuzinijeyjpyxqiojenjindqnjisimvtywlsijoiymhhdghzfyyubkbmmubjniiwiawqiojmxnjaxniwizgbmxvywrhymxlijpcnvlfqyveuomqkimmsvfuygixewupyowedmrvosknapq': <gensim.models.word2vec.Vocab at 0x1300e3f98>,\n 'opt': <gensim.models.word2vec.Vocab at 0x15ae99a20>,\n 'nameshttpwwwthedailybeastcomcheatstrumpreleaseslistofpotentialsupremecourtnomineeshtml': <gensim.models.word2vec.Vocab at 0x1300e3fd0>,\n 'cafeteria': <gensim.models.word2vec.Vocab at 0x15a2e7048>,\n 'stanton': <gensim.models.word2vec.Vocab at 0x15a2e7080>,\n 'oriental': <gensim.models.word2vec.Vocab at 0x15a2e70b8>,\n 'socialists': <gensim.models.word2vec.Vocab at 0x15a2e70f0>,\n 'prodded': <gensim.models.word2vec.Vocab at 0x15a2e7128>,\n 'httpgopoliticoemailcomqsdbeebfeedbeeaecefaadbdb': <gensim.models.word2vec.Vocab at 0x15a2e7160>,\n 'httplinkwashingtonpostcomclickahrchmlydcudfzagluzrvbnbvcquytlldmvbwybmluzytaxgvdavmjaxniwnsxosjywhzglhbiwcmltzstawpcrlciqdxnawtdhjzgvhdshcgsbdpemvzlwfmdgvylwvsymawnlwzlbwfszssyxdtywtlcikdxjpbmctcgfybglhbwvudgfyesxdwfycmvslzcgtptemdbpcjjpwsxrhawxmjaycaeadcbcfccecadff': <gensim.models.word2vec.Vocab at 0x15a36aeb8>,\n 'pollhttpstwittercomdanscavinostatus': <gensim.models.word2vec.Vocab at 0x15a2e71d0>,\n 'io': <gensim.models.word2vec.Vocab at 0x15a2e7208>,\n 'room': <gensim.models.word2vec.Vocab at 0x15a2e7240>,\n 'rmiami': <gensim.models.word2vec.Vocab at 0x15a2e7278>,\n 'httpclickemailbostonglobecomqsccdbfdceecaeebdfacbebafcf': <gensim.models.word2vec.Vocab at 0x15a2e72b0>,\n 'abramoff': <gensim.models.word2vec.Vocab at 0x15a2e72e8>,\n 'nonissue': <gensim.models.word2vec.Vocab at 0x15a2e7320>,\n 'httpgopoliticoemailcomqsfbdafcedcafddfdbddaacacdedb': <gensim.models.word2vec.Vocab at 0x15a2e7358>,\n 'schildeck': <gensim.models.word2vec.Vocab at 0x15a2e7390>,\n 'acquittal': <gensim.models.word2vec.Vocab at 0x15a2e73c8>,\n 'rhino': <gensim.models.word2vec.Vocab at 
0x15a2e7400>,\n 'httppvtimescomnewscortezmastoplansfollowreidussenateseathtml': <gensim.models.word2vec.Vocab at 0x15acbdd68>,\n 'lessmediasavvy': <gensim.models.word2vec.Vocab at 0x15a2e7470>,\n 'seventwenty': <gensim.models.word2vec.Vocab at 0x15a2e74a8>,\n 'graysondavid': <gensim.models.word2vec.Vocab at 0x15a2e74e0>,\n 'vantagei': <gensim.models.word2vec.Vocab at 0x15a2e7518>,\n 'escottportergmailcommailtoescottportergmailcom': <gensim.models.word2vec.Vocab at 0x15a2e7588>,\n 'httpclickemailbostonglobecomqsaefcdabbcccbabfcbddffaeefdeabffbbbbbcfffa': <gensim.models.word2vec.Vocab at 0x15a2e75c0>,\n 'blisteringrdquo': <gensim.models.word2vec.Vocab at 0x15a373588>,\n 'hecho': <gensim.models.word2vec.Vocab at 0x15a2e7630>,\n 'postdebate': <gensim.models.word2vec.Vocab at 0x15a2e7668>,\n 'belligerent': <gensim.models.word2vec.Vocab at 0x15a2e76a0>,\n 'httplinkwashingtonpostcomclickahrchmlydldgvylmnvbskyxzldvpzvslnyxrcymjuntmnjixodgndentqdbtbtxjndwaxnyyzubfkywlsetiwmgcaeadcbcfccfdc': <gensim.models.word2vec.Vocab at 0x15a2e76d8>,\n 'partying': <gensim.models.word2vec.Vocab at 0x15a2e7710>,\n 'httpswwwwhitehousegovzika': <gensim.models.word2vec.Vocab at 0x15a2e7748>,\n 'eradicate': <gensim.models.word2vec.Vocab at 0x15b0c94e0>,\n 'grandparent': <gensim.models.word2vec.Vocab at 0x15ae99b00>,\n 'reactor': <gensim.models.word2vec.Vocab at 0x15a2e77f0>,\n 'csis': <gensim.models.word2vec.Vocab at 0x15a2e7828>,\n 'httpclickeusatodaycomqsfaaddacdcbdafffadeeafcdddfcacaffccffea': <gensim.models.word2vec.Vocab at 0x15a373da0>,\n 'httpstoolboxdncorgtoolnamevantageuploaderpathvantageuploaderdncorgvideossharedshowjwteyjexaioijkvqilcjhbgcioijiuzinijeyjpyxqiojenjmnzinjgsimvtywlsijoicbvbgfyawnozbkbmmubjniiwiawqiojmymteznywizgbmxvywrhymxlijpcnvlfqhpyojreqwblgqpsdjlajjblwgreblvsns': <gensim.models.word2vec.Vocab at 0x15a2e7898>,\n 'brenda': <gensim.models.word2vec.Vocab at 0x15a2e78d0>,\n 'dissenter': <gensim.models.word2vec.Vocab at 0x15a371208>,\n 
'httpclickemailbostonglobecomqsefaabefefffaecbeebfaaeddfbecfaecadbad': <gensim.models.word2vec.Vocab at 0x15a2e7940>,\n 'httppoliticochrmhttpgopoliticoemailcomqscbcefdecdbadfabaafb': <gensim.models.word2vec.Vocab at 0x15a2e7978>,\n 'httpstwittercomsentedcruzstatus': <gensim.models.word2vec.Vocab at 0x15a2e79b0>,\n 'callwill': <gensim.models.word2vec.Vocab at 0x15a2e79e8>,\n 'instagramhttpinstagramcomnclusive': <gensim.models.word2vec.Vocab at 0x15a2e7a20>,\n 'tikkun': <gensim.models.word2vec.Vocab at 0x15a2e7a90>,\n 'nominationhttpamericanbridgepacuslistmanagecomtrackclickueebfeedcfeeffdidcfceebcdbbc': <gensim.models.word2vec.Vocab at 0x15a2e7ac8>,\n 'attorneyclient': <gensim.models.word2vec.Vocab at 0x15a371ba8>,\n 'httpclickemailbostonglobecomqsaebbabaddddbededacfaafbaddafdabbeffced': <gensim.models.word2vec.Vocab at 0x15a2e7b38>,\n 'silpa': <gensim.models.word2vec.Vocab at 0x15a371e80>,\n 'villas': <gensim.models.word2vec.Vocab at 0x15a371f60>,\n 'watchhttpstoolboxdncorgtoolnamevantageuploaderpathvantageuploaderdncorgvideossharedshowjwteyjexaioijkvqilcjhbgcioijiuzinijeyjpyxqiojenjendamdasimvtywlsijoicgscuakbkbmmubjniiwiawqiojmxmtgoswizgbmxvywrhymxlijpcnvlfqkyssjwujlsfihncwgyrclxkvhaqcvphwcxstart': <gensim.models.word2vec.Vocab at 0x15a2e7be0>,\n 'townshend': <gensim.models.word2vec.Vocab at 0x15a36c198>,\n 'recibe': <gensim.models.word2vec.Vocab at 0x15b5c0d68>,\n 'httpwwwhuffingtonpostcomentrydonaldtrumpabortionuscaaebaeebeabbb': <gensim.models.word2vec.Vocab at 0x15a2e7c50>,\n 'vegetarian': <gensim.models.word2vec.Vocab at 0x15a2e7c88>,\n 'nqapia': <gensim.models.word2vec.Vocab at 0x15a36c518>,\n 'primed': <gensim.models.word2vec.Vocab at 0x15a2e7cf8>,\n 'invoices': <gensim.models.word2vec.Vocab at 0x15a2e7d30>,\n 'parrot': <gensim.models.word2vec.Vocab at 0x15a2e7d68>,\n 'mccarter': <gensim.models.word2vec.Vocab at 0x15a2e7da0>,\n 'griping': <gensim.models.word2vec.Vocab at 0x15a2e7dd8>,\n 'swerving': <gensim.models.word2vec.Vocab at 0x15a2e7e10>,\n 
'kessler': <gensim.models.word2vec.Vocab at 0x15a2e7e48>,\n 'sacbees': <gensim.models.word2vec.Vocab at 0x15a2e7e80>,\n 'acknowledge': <gensim.models.word2vec.Vocab at 0x15a2e7eb8>,\n 'languagedocx': <gensim.models.word2vec.Vocab at 0x15a2e7ef0>,\n 'httpsfilesharedemocratsorgdownloadafafefefbfeff': <gensim.models.word2vec.Vocab at 0x15a2e7f28>,\n 'penguins': <gensim.models.word2vec.Vocab at 0x15a2e7f60>,\n 'jonsidewirecom': <gensim.models.word2vec.Vocab at 0x15a2e7f98>,\n 'httpswwwfamousdccomneontreesfamousdc': <gensim.models.word2vec.Vocab at 0x15be0d9b0>,\n 'cruises': <gensim.models.word2vec.Vocab at 0x15a2e7fd0>,\n 'watchhttpstoolboxdncorgtoolnamevantageuploaderpathvantageuploaderdncorgvideossharedshowjwteyjexaioijkvqilcjhbgcioijiuzinijeyjpyxqiojenjeotynzgsimvtywlsijoiymhhdghzfyyubkbmmubjniiwiawqiojmxmtimywizgbmxvywrhymxlijpcnvlfqmgsabdfmruafnyubgmcjtjlkjbkjlkxithx': <gensim.models.word2vec.Vocab at 0x15a2da080>,\n 'tappers': <gensim.models.word2vec.Vocab at 0x15a2da0b8>,\n 'interviewdocx': <gensim.models.word2vec.Vocab at 0x15a2da0f0>,\n 'imperil': <gensim.models.word2vec.Vocab at 0x15a2da128>,\n 'taxdeductibleas': <gensim.models.word2vec.Vocab at 0x15a2da160>,\n 'httpclickeusatodaycomqsdcbefddacccdfdfcecdfcdfeccadbccfdbbab': <gensim.models.word2vec.Vocab at 0x15a2da198>,\n 'optoutconfirmurl': <gensim.models.word2vec.Vocab at 0x15a2da1d0>,\n 'httptimecomdonaldtrumptedcruzconventionunbound': <gensim.models.word2vec.Vocab at 0x15a2da208>,\n 'kayla': <gensim.models.word2vec.Vocab at 0x15a2da240>,\n 'httpgopoliticoemailcomqseaffeccbfbbbfbebafdddbf': <gensim.models.word2vec.Vocab at 0x15a2da278>,\n 'hours': <gensim.models.word2vec.Vocab at 0x15a2da2b0>,\n 'flaum': <gensim.models.word2vec.Vocab at 0x15b0c97b8>,\n 'criminalize': <gensim.models.word2vec.Vocab at 0x15a2da320>,\n 'nonwars': <gensim.models.word2vec.Vocab at 0x15a2da358>,\n 'flirtations': <gensim.models.word2vec.Vocab at 0x15a2da390>,\n 'diplomas': <gensim.models.word2vec.Vocab at 0x15a2da3c8>,\n 'cbc': 
<gensim.models.word2vec.Vocab at 0x15a2da400>,\n 'brazilrsquos': <gensim.models.word2vec.Vocab at 0x15a2da438>,\n 'electrichttpwwwopensecretsorglobbyclientsumphpidfyear': <gensim.models.word2vec.Vocab at 0x15a2da470>,\n 'httpdemocratsuslistmanagecomunsubscribeucadbafefdidbececcebcceca': <gensim.models.word2vec.Vocab at 0x15b0c9828>,\n 'stan': <gensim.models.word2vec.Vocab at 0x15ae99dd8>,\n 'orban': <gensim.models.word2vec.Vocab at 0x15a2da4e0>,\n 'amandabeckerhttpwwwtwittercomamandabecker': <gensim.models.word2vec.Vocab at 0x15a2da518>,\n 'encounter': <gensim.models.word2vec.Vocab at 0x15a2da550>,\n 'httpclickeusatodaycomqsfaaddaccbdbeeadefabeaeedcabdfacdaacaf': <gensim.models.word2vec.Vocab at 0x15a2da588>,\n 'httpmoneycnncommediasnapchatnbcolympicsindexhtmliidsflnmccidmceiduniqid': <gensim.models.word2vec.Vocab at 0x15a2da5c0>,\n 'httplinkwashingtonpostcomclickahrchmlydcuawzdgfncmftlmnvbswljgsmtebjbeslzcgtptemdbpcjjpwsxrhawxmjaycaeadcbcfccdfa': <gensim.models.word2vec.Vocab at 0x15a2da5f8>,\n 'biologically': <gensim.models.word2vec.Vocab at 0x15a2da630>,\n 'leonecross': <gensim.models.word2vec.Vocab at 0x15a2da668>,\n 'codels': <gensim.models.word2vec.Vocab at 0x15a2da6d8>,\n 'distributors': <gensim.models.word2vec.Vocab at 0x15a2da710>,\n 'httpactnowprochoiceamericaorgsignamericorpsfor': <gensim.models.word2vec.Vocab at 0x15a2da748>,\n 'tavenner': <gensim.models.word2vec.Vocab at 0x15a2da780>,\n 'httplinkwashingtonpostcomclickahrchmlydldgvylmnvbsazwtlskpbgxlcizdgfdxmvnzintknzanzmymdymzcpdwbwmszcglzcmmbmxfzgfpbhkymdicaeadcbcfccec': <gensim.models.word2vec.Vocab at 0x15a2da7b8>,\n 'kaplanjdncorghttpvisitorconstantcontactcomdopunmdzaodndfyrbldguaaddchebebbdaeccaffbecbbdbff': <gensim.models.word2vec.Vocab at 0x15a2da7f0>,\n 'httpwwwnytimescomuspoliticsdonaldtrumpwomenhtmlmccidcbfbmceiduniqid': <gensim.models.word2vec.Vocab at 0x15a2da828>,\n 'ventura': <gensim.models.word2vec.Vocab at 0x15a2da860>,\n 
'httpclickemailbostonglobecomqsdcabcdcaafbbecabceaafeceefbbcebecdatodays': <gensim.models.word2vec.Vocab at 0x15a2da898>,\n 'lateterm': <gensim.models.word2vec.Vocab at 0x15ae99e48>,\n 'ratification': <gensim.models.word2vec.Vocab at 0x15a2da8d0>,\n 'rhimeshttpswwwfacebookcomtopicshondarhimessourcewtfrtpositiontrqid': <gensim.models.word2vec.Vocab at 0x15a2da908>,\n 'lefebvre': <gensim.models.word2vec.Vocab at 0x15a2da940>,\n 'tp': <gensim.models.word2vec.Vocab at 0x15a2da978>,\n 'chapman': <gensim.models.word2vec.Vocab at 0x15a2da9b0>,\n 'plummeting': <gensim.models.word2vec.Vocab at 0x15a2da9e8>,\n 'applicationsmicrosoftofficemicrosoftwordappcontentstheadsarepaidforbytheconservativelearningsuperpacfreedompartnersactionfundpartofthenetworkoforganizationsaffiliatedwithconservativebillionairescharlesanddavidkoch': <gensim.models.word2vec.Vocab at 0x15a2daa58>,\n 'httptinygroceryuslistmanagecomtrackclickucbfdbfccebccidaafaeaba': <gensim.models.word2vec.Vocab at 0x15a2daa90>,\n 'guerrilla': <gensim.models.word2vec.Vocab at 0x15a2daac8>,\n 'supporterswe': <gensim.models.word2vec.Vocab at 0x15a2dab00>,\n 'httpgopoliticoemailcomqsdacfffcbecdadfefcdfceafcabbb': <gensim.models.word2vec.Vocab at 0x15a2dab38>,\n 'riffing': <gensim.models.word2vec.Vocab at 0x15a2dab70>,\n 'hoback': <gensim.models.word2vec.Vocab at 0x15a2daba8>,\n 'kildee': <gensim.models.word2vec.Vocab at 0x15a2dabe0>,\n 'aggression': <gensim.models.word2vec.Vocab at 0x15a2dac18>,\n 'compromiseoriented': <gensim.models.word2vec.Vocab at 0x15a2dac50>,\n 'httpgopoliticoemailcomqsedfedfeabbaedfbefeacfeddf': <gensim.models.word2vec.Vocab at 0x15a2dac88>,\n 'triedandtrue': <gensim.models.word2vec.Vocab at 0x15a2dacc0>,\n 'remarks': <gensim.models.word2vec.Vocab at 0x15a2dacf8>,\n 'scholars': <gensim.models.word2vec.Vocab at 0x15a2dad30>,\n 'nais': <gensim.models.word2vec.Vocab at 0x15a2dad68>,\n 'sof': <gensim.models.word2vec.Vocab at 0x15a2dada0>,\n 'precipitously': <gensim.models.word2vec.Vocab at 
0x15a2dadd8>,\n 'unpresentable': <gensim.models.word2vec.Vocab at 0x15a2dae10>,\n 'drags': <gensim.models.word2vec.Vocab at 0x15a2dae48>,\n 'goofed': <gensim.models.word2vec.Vocab at 0x15a2daeb8>,\n 'unfortunately': <gensim.models.word2vec.Vocab at 0x15a2daef0>,\n 'mailtonuccioconnectwcsuedu': <gensim.models.word2vec.Vocab at 0x15a2daf28>,\n 'siciliano': <gensim.models.word2vec.Vocab at 0x15a2daf60>,\n 'washingtonians': <gensim.models.word2vec.Vocab at 0x15a2dafd0>,\n 'amita': <gensim.models.word2vec.Vocab at 0x15a2dd048>,\n 'httprainmakerthinkingcomassetsuploadsgenshiftwhitepaperpdf': <gensim.models.word2vec.Vocab at 0x15a2dd080>,\n 'batting': <gensim.models.word2vec.Vocab at 0x15a2dd0b8>,\n 'notehttpparacomparamountcommunicationcomctwinocynmdcecbcabeddbbcbefdr': <gensim.models.word2vec.Vocab at 0x15a2dd0f0>,\n 'watchhttpstoolboxdncorgtoolnamevantageuploaderpathvantageuploaderdncorgvideossharedshowjwteyjexaioijkvqilcjhbgcioijiuzinijeyjpyxqiojenjinjmnzysimvtywlsijoibmyzhlrzwhazgjlmyzyisimlkijozmtumzisimrvdsbfkywjszsidhjzxtkgiglcanicrzzeiazrqlblwwljlvrcujzc': <gensim.models.word2vec.Vocab at 0x15a2dd160>,\n 'flukehttpclickactionnetworkorgmpsscaaniyaatxsexcsbxsqmbipjmswkwghdqynzmzfloqarkhfhwoafsbgnfexvknzubobexrzudjyhdbyvjomeaqbbxajmafzijfksvhjfmjmwvfzufmwmwxuccybnodfjcocillixzgvxrkfwfhshxejffmwgmmehwnsfgaddseanqnippzbyevnwswcnckhzwpnuptxyfgbzhqxdsmqvyeuucnlidkjjbtujualrvbiiaffgzmsoheqdrrmldkbtmbkrwdbfskwidedrhtlrikojqmozmnbtwipbesderwvkprbneeisyuphayveecbhdpmpnhomkevkncuzaegjhddekphipxbrakxagegzxdgvkfjukdeddmftyltcefiqjmdneboftgpwtdqjqianbfwjqohukutjdzenezdulzohzdnuxyfobmrkcpykdand': <gensim.models.word2vec.Vocab at 0x15a2dd198>,\n 'recalibrate': <gensim.models.word2vec.Vocab at 0x15a2dd1d0>,\n 'goode': <gensim.models.word2vec.Vocab at 0x15a2dd240>,\n 'intervening': <gensim.models.word2vec.Vocab at 0x15a2dd278>,\n 'ruckus': <gensim.models.word2vec.Vocab at 0x15a2dd2b0>,\n 'reedadncorgmailtoreedadncorg': <gensim.models.word2vec.Vocab at 0x15a2dd2e8>,\n 
'httpsmediumcomsourceemailccdbafdailydigest': <gensim.models.word2vec.Vocab at 0x15a2dd320>,\n 'httpclickemailbostonglobecomqsececeeddedcfffaafabaceaacacecfcbfe': <gensim.models.word2vec.Vocab at 0x15a2dd358>,\n 'pitha': <gensim.models.word2vec.Vocab at 0x15a2dd390>,\n 'laura': <gensim.models.word2vec.Vocab at 0x15a2dd3c8>,\n 'pccc': <gensim.models.word2vec.Vocab at 0x15a2dd400>,\n 'refine': <gensim.models.word2vec.Vocab at 0x15ac62550>,\n 'httpjuanverdeuslistmanagecomtrackclickudefecbidabceecdb': <gensim.models.word2vec.Vocab at 0x15a2dd438>,\n 'subtotal': <gensim.models.word2vec.Vocab at 0x15a2dd470>,\n 'countryhttpfivethirtyeightcomfeaturesitsfarhardertochangepartiesinnewyorkthaninanyotherstate': <gensim.models.word2vec.Vocab at 0x15a2dd4a8>,\n 'whippymailtopeterwhippymailhousegov': <gensim.models.word2vec.Vocab at 0x15a2dd4e0>,\n 'httpgooglvwxujz': <gensim.models.word2vec.Vocab at 0x15a2dd518>,\n 'wwwsamanthadamatocom': <gensim.models.word2vec.Vocab at 0x15a2dd550>,\n 'herald': <gensim.models.word2vec.Vocab at 0x15a2dd588>,\n 'viciously': <gensim.models.word2vec.Vocab at 0x15ae9c0f0>,\n 'boldfaced': <gensim.models.word2vec.Vocab at 0x15a2dd5f8>,\n 'marijuana': <gensim.models.word2vec.Vocab at 0x15a2dd630>,\n 'rdfloorcanondncorg': <gensim.models.word2vec.Vocab at 0x15a2dd668>,\n 'anticastro': <gensim.models.word2vec.Vocab at 0x15a2dd6a0>,\n 'doral': <gensim.models.word2vec.Vocab at 0x15a2dd6d8>,\n 'neilan': <gensim.models.word2vec.Vocab at 0x15a2dd710>,\n 'suspicious': <gensim.models.word2vec.Vocab at 0x15a2dd748>,\n 'httpclickemailbostonglobecomqsadcfccadddbbbebabbccecafadbadeaaf': <gensim.models.word2vec.Vocab at 0x15a2dd780>,\n 'wwwwwwhttpwwwwww': <gensim.models.word2vec.Vocab at 0x15a2dd7b8>,\n 'httpgopoliticoemailcomqsbdeeaafdcaedfeafcfdfeeaacb': <gensim.models.word2vec.Vocab at 0x15a2dd7f0>,\n 'varney': <gensim.models.word2vec.Vocab at 0x15a2dd860>,\n 'exempted': <gensim.models.word2vec.Vocab at 0x15a2dd8d0>,\n 'overrun': <gensim.models.word2vec.Vocab at 
0x15a2dd908>,\n 'singleunit': <gensim.models.word2vec.Vocab at 0x15a2dd940>,\n 'besting': <gensim.models.word2vec.Vocab at 0x15a2dd978>,\n 'httpsdncquickbasecomdbbeakycadrrbehd': <gensim.models.word2vec.Vocab at 0x15a2dd9b0>,\n 'trucking': <gensim.models.word2vec.Vocab at 0x15a2dd9e8>,\n 'reauthorizes': <gensim.models.word2vec.Vocab at 0x15a2dda20>,\n 'cepol': <gensim.models.word2vec.Vocab at 0x15a2dda58>,\n 'illinoiss': <gensim.models.word2vec.Vocab at 0x15b0c9ac8>,\n 'aurn': <gensim.models.word2vec.Vocab at 0x15a2ddac8>,\n 'httpclickpoliticoemailcomprofilecenteraspxqscfcfcefbccafcfaeecfbbcecfcafdcadbccbaacdbbthis': <gensim.models.word2vec.Vocab at 0x15a2ddb00>,\n 'daiquiris': <gensim.models.word2vec.Vocab at 0x15a2ddb38>,\n 'remote': <gensim.models.word2vec.Vocab at 0x15a2ddb70>,\n 'httptimecomkellyripaanncurrywomentvstarsmcciddcdmceiduniqid': <gensim.models.word2vec.Vocab at 0x15a2ddba8>,\n 'httpwwwmotherjonescompoliticsdonaldtrumpwhitenationalistafpdelegatecalifornia': <gensim.models.word2vec.Vocab at 0x15a2ddbe0>,\n 'rx': <gensim.models.word2vec.Vocab at 0x15a2ddc18>,\n 'dpa': <gensim.models.word2vec.Vocab at 0x15a2ddc50>,\n 'latinosabout': <gensim.models.word2vec.Vocab at 0x15a2ddc88>,\n 'optio': <gensim.models.word2vec.Vocab at 0x15a2ddcc0>,\n 'namehttpmydemocratsorgpagemefaeeafveshpeyjkuzevdavfgwtlzvmvjqvfyrnvvksrnrykhwblbxdgxlvwkdwzeptvtioijlzguymixnjqnjvmnzrizdliyimdiodaodqndgwnwjjnnimzrhnzyzmzunzdknjiogmzwewnmyiiwislnwbwfysnpkrzvoyldvbeprptioijlzwlacisikptvnnzwewymgdfptvwwioijuagfuamilcjkuzsyldgcgjdvwwioijkawdpdgfsxrazgjlmyzyisikptvjzhwefsslepsiijiwmdain': <gensim.models.word2vec.Vocab at 0x15a2ddcf8>,\n 'loyalistshttpwwwazcentralcomstorynewspoliticselectionsafterprimarytrumpandcruzfightarizonadelegates': <gensim.models.word2vec.Vocab at 0x15a2ddd30>,\n 'httpclickeusatodaycomqseeafadacaffbdbdeadeeccfbbddca': <gensim.models.word2vec.Vocab at 0x15a2ddd68>,\n 'fontface': <gensim.models.word2vec.Vocab at 0x15a2ddda0>,\n 
'pictwittercomisweecbwhttpstcoisweecbw': <gensim.models.word2vec.Vocab at 0x15a2dddd8>,\n 'httpsgooglpswq': <gensim.models.word2vec.Vocab at 0x15a2dde10>,\n 'multipleoccupancy': <gensim.models.word2vec.Vocab at 0x15a2dde48>,\n 'socialista': <gensim.models.word2vec.Vocab at 0x15a2dde80>,\n 'thor': <gensim.models.word2vec.Vocab at 0x15a2ddeb8>,\n 'pastpresident': <gensim.models.word2vec.Vocab at 0x15a86b198>,\n 'monster': <gensim.models.word2vec.Vocab at 0x15a2ddef0>,\n 'aye': <gensim.models.word2vec.Vocab at 0x15a2ddf28>,\n 'laris': <gensim.models.word2vec.Vocab at 0x15a2ddf60>,\n 'erased': <gensim.models.word2vec.Vocab at 0x15a2ddf98>,\n 'archetypal': <gensim.models.word2vec.Vocab at 0x15a2ddfd0>,\n 'warteljdncorg': <gensim.models.word2vec.Vocab at 0x15ba101d0>,\n 'presidenthttpwwwfoxnewscompoliticspencetoendorsecruzforpresidenthtml': <gensim.models.word2vec.Vocab at 0x15a2db080>,\n 'namelink': <gensim.models.word2vec.Vocab at 0x15bdbe2e8>,\n 'connecticuthttpwwwftcomcmssbabadaadeafeabdchtmlaxzzvclrr': <gensim.models.word2vec.Vocab at 0x15a2db0f0>,\n 'httpgopoliticoemailcomqsbdeeaaebfdcfefdacebcdaa': <gensim.models.word2vec.Vocab at 0x15a2db128>,\n 'shareemail': <gensim.models.word2vec.Vocab at 0x15a2db160>,\n 'httpstwittercomthedemocratsstatushttpsurldefenseproofpointcomvurluhttpsatwittercomthedemocratsstatusdcwmfagcxrwvqhnpdbdrhyzrhjqlpxuhncnanqcppgsptrohhmvszfsftjsgogaikalpmvvjexcqmlljcmktezxzkyckktnjemntthbhsohvscbrscnjnxysiwhrsawoimhitpihtbciqmmlxyyjflfxtigue': <gensim.models.word2vec.Vocab at 0x15a2db198>,\n 'devastate': <gensim.models.word2vec.Vocab at 0x15a2db1d0>,\n 'diy': <gensim.models.word2vec.Vocab at 0x15b0c9ba8>,\n 'modeling': <gensim.models.word2vec.Vocab at 0x15a2db240>,\n 'hiren': <gensim.models.word2vec.Vocab at 0x15a2db278>,\n 'unassailable': <gensim.models.word2vec.Vocab at 0x15a2db2b0>,\n 'suicide': <gensim.models.word2vec.Vocab at 0x15a2db2e8>,\n 'oreos': <gensim.models.word2vec.Vocab at 0x15a2db320>,\n 
'republicanshttpwwwpoliticocomstorydonaldtrumpjewishrepublicans': <gensim.models.word2vec.Vocab at 0x15c1006d8>,\n 'recon': <gensim.models.word2vec.Vocab at 0x15a2db358>,\n 'httpwwwfinancialofficerwebadvisorcomschedule': <gensim.models.word2vec.Vocab at 0x15a2db390>,\n 'yields': <gensim.models.word2vec.Vocab at 0x15a2db3c8>,\n 'rejected': <gensim.models.word2vec.Vocab at 0x15a2db400>,\n 'httpswwwwashingtonpostcomprwpmartinbaronadressestempleuniversitygraduatestidainlmccidafdmceiduniqid': <gensim.models.word2vec.Vocab at 0x15a2db438>,\n 'localhttpstoolboxdncorgtoolnamevantageuploaderpathvantageuploaderdncorgvideossharedshowjwteyjexaioijkvqilcjhbgcioijiuzinijeyjpyxqiojenjmmjunjusimvtywlsijoiymhhdghzfyyubkbmmubjniiwiawqiojmymdemiwizgbmxvywrhymxlijpcnvlfqwizytzmxnjheavtvccpfczmtujtckarprmzq': <gensim.models.word2vec.Vocab at 0x15a2db470>,\n 'httplinkwashingtonpostcomclickahrcdovlxplndhchpbmdbwbnlmnvbsjbgljazzpteznzmnyzzejoxgxnszsatlnilnjhzghhcglnqlnqmdbtbtxjndwaxnyyzubfkywlsetiwmgcaeadcbcfcdfca': <gensim.models.word2vec.Vocab at 0x15a2db4a8>,\n 'sensible': <gensim.models.word2vec.Vocab at 0x15a2db4e0>,\n 'httplinkwashingtonpostcomclickahrchmlydcudfzagluzrvbnbvcquytljlzlvbmfslzcgtptemdbpcjjpwsxrhawxmjaycaeadcbcfcccfe': <gensim.models.word2vec.Vocab at 0x15a2db518>,\n 'fortyyear': <gensim.models.word2vec.Vocab at 0x15a2db550>,\n 'chaoshttpwwwcnncompoliticsnevadaconventionchaosberniesandershillaryclintonindexhtml': <gensim.models.word2vec.Vocab at 0x15a2db588>,\n 'cider': <gensim.models.word2vec.Vocab at 0x15a2db5c0>,\n 'piersonhttpstoolboxdncorgtoolnamevantageuploaderpathvantageuploaderdncorgvideossharedshowjwteyjexaioijkvqilcjhbgcioijiuzinijeyjpyxqiojenjimzymjasimvtywlsijoicgvzxjzbrqgruyyvcmcilcjpzcimzemzmlcjkbdubghzgfibguionrydwvenvdccolvfrypoxmfpgzdqtqwxssegvpnhetc': <gensim.models.word2vec.Vocab at 0x15a2db5f8>,\n 'hilltop': <gensim.models.word2vec.Vocab at 0x15a2db668>,\n 'httppositiveprescriptionuslistmanagecomunsubscribeufbdiddedaaedbcdfbd': 
<gensim.models.word2vec.Vocab at 0x15c0eba90>,\n 'postgazette': <gensim.models.word2vec.Vocab at 0x15a2db6d8>,\n 'rollcall': <gensim.models.word2vec.Vocab at 0x15a2db710>,\n 'thathttpswwwwashingtonpostcomopinionsthegovernmentisntprotectingyoufromdangerouschemicalscongressmustfixthateeaabacstoryhtml': <gensim.models.word2vec.Vocab at 0x15b0c9c50>,\n 'httpgopoliticoemailcomqsadbbadddfaabdfeffdfcacdcef': <gensim.models.word2vec.Vocab at 0x15a2db780>,\n 'lemme': <gensim.models.word2vec.Vocab at 0x15a2db7b8>,\n 'alexkorsonnbcunicommailtoalexkorsonnbcunicom': <gensim.models.word2vec.Vocab at 0x15a2db7f0>,\n 'closecropped': <gensim.models.word2vec.Vocab at 0x15a2db828>,\n 'robinss': <gensim.models.word2vec.Vocab at 0x15a2db860>,\n 'httpclickeusatodaycomqsffceeaacddfbfaaacabdaeeeddeadee': <gensim.models.word2vec.Vocab at 0x15a2db898>,\n 'lew': <gensim.models.word2vec.Vocab at 0x15a2db8d0>,\n 'mercergave': <gensim.models.word2vec.Vocab at 0x15a2db940>,\n 'primarytold': <gensim.models.word2vec.Vocab at 0x15a2db978>,\n 'joeyfishmanverizonnetmailtojoeyfishmanverizonnet': <gensim.models.word2vec.Vocab at 0x15a2db9b0>,\n 'confirmed': <gensim.models.word2vec.Vocab at 0x15a2db9e8>,\n 'suicidality': <gensim.models.word2vec.Vocab at 0x15a2dba20>,\n 'buhari': <gensim.models.word2vec.Vocab at 0x15a2dba58>,\n 'woodring': <gensim.models.word2vec.Vocab at 0x15a2dba90>,\n 'cidimagepngdafadbabhttpsfinancedemocratsorgdcmay': <gensim.models.word2vec.Vocab at 0x15a2dbac8>,\n 'watchhttpstoolboxdncorgtoolnamevantageuploaderpathvantageuploaderdncorgvideossharedshowjwteyjexaioijkvqilcjhbgcioijiuzinijeyjpyxqiojenjendmodysimvtywlsijoibgnywvqgruyyvcmcilcjpzcimzezmjazlcjkbdubghzgfibguionrydwvvyuqocqquazkpomhfhnznrxbtfxwjykjgolxvk': <gensim.models.word2vec.Vocab at 0x15a2dbb38>,\n 'httpwwwpinggcomrsvpzqzklezjdtremovemezqabpgopes': <gensim.models.word2vec.Vocab at 0x15a2dbb70>,\n 'succeeding': <gensim.models.word2vec.Vocab at 0x15a2dbba8>,\n 'pauldemko': <gensim.models.word2vec.Vocab at 0x15a2dbbe0>,\n 
'httplinkwashingtonpostcomclickahrchmlydcudfzagluzrvbnbvcquytlldmvcgzdcwbxpdgljcyccymdelzalzizllulwhpcrvcmljlwvdmutdszlwxpznrzlwfybxmtcfszxmtzwiyxjnbybyawvbmftlzocglkpwhwxjocctbjllxrvcczdgyawvzxvlwhbwuagtzxbhzuvcrvcnkmdbtbtxjndwaxnyyzubfkywlsetiwmgcaeadcbcfccee': <gensim.models.word2vec.Vocab at 0x15a2dbc18>,\n 'httpcdnevbstaticcomsbuildpermbbdjangoimagesiconsgifticonpng': <gensim.models.word2vec.Vocab at 0x15a2dbc50>,\n 'contemplated': <gensim.models.word2vec.Vocab at 0x15a38cb38>,\n 'politicalce': <gensim.models.word2vec.Vocab at 0x15a2dbcc0>,\n 'dncsponsored': <gensim.models.word2vec.Vocab at 0x15a2dbcf8>,\n 'questionspictwittercomouuugnuwb': <gensim.models.word2vec.Vocab at 0x15ae9c518>,\n 'listers': <gensim.models.word2vec.Vocab at 0x15a2dbd68>,\n 'eldeib': <gensim.models.word2vec.Vocab at 0x15a2dbda0>,\n 'shoots': <gensim.models.word2vec.Vocab at 0x15a2dbdd8>,\n 'records': <gensim.models.word2vec.Vocab at 0x15b4ed0b8>,\n 'mailtorglovskythecolonygroupcom': <gensim.models.word2vec.Vocab at 0x15c346630>,\n 'emulated': <gensim.models.word2vec.Vocab at 0x15a2dbe80>,\n 'underwood': <gensim.models.word2vec.Vocab at 0x15a2dbeb8>,\n 'cochran': <gensim.models.word2vec.Vocab at 0x15a2dbef0>,\n 'programmable': <gensim.models.word2vec.Vocab at 0x15a2dbf28>,\n 'amendmenthttpwwwcnncompoliticsiransenatecottonheavywater': <gensim.models.word2vec.Vocab at 0x15a2dbf98>,\n 'httpgopoliticoemailcomqscfaeaedfedfdbfdafadcadac': <gensim.models.word2vec.Vocab at 0x13d4b0898>,\n 'nusra': <gensim.models.word2vec.Vocab at 0x15a2dbfd0>,\n 'double': <gensim.models.word2vec.Vocab at 0x15a2e6048>,\n 'httpclickeusatodaycomqseeafbfbfefbccaaaacdeaccdb': <gensim.models.word2vec.Vocab at 0x15a2e6080>,\n 'corrales': <gensim.models.word2vec.Vocab at 0x15a2e60b8>,\n 'mailchimp': <gensim.models.word2vec.Vocab at 0x15a2e60f0>,\n 
'receptionatlanticmediacomsubjectrsvpforatlanticmediacbsnewspredinnerreceptionbodyforregistrationpurposescpleaseprovidetherequestedinformationbelowaanameaaaatitleaaaaorganizationa': <gensim.models.word2vec.Vocab at 0x15a2e6128>,\n 'dis': <gensim.models.word2vec.Vocab at 0x15a2e6160>,\n 'cidimagegifdacfd': <gensim.models.word2vec.Vocab at 0x15a2e6198>,\n 'httplinkwashingtonpostcomclickahrchmlydcudfzagluzrvbnbvcquytlldmvduayccymdelzalzeylhpbgxhcnktyxpbnrvbibyzdxbwbjlwzlzgvyywwtcmvzzxjzsjagfuzutczhlwjlwxpymvyywxzlzcgtptemdbpcjjpwsxrhawxmjaycaeadcbcfccc': <gensim.models.word2vec.Vocab at 0x15a2e61d0>,\n 'ldquomalpasordquo': <gensim.models.word2vec.Vocab at 0x15bd98320>,\n 'httpclickeusatodaycomqseeafddeaaaddffcecccaccdedccdfbcbdde': <gensim.models.word2vec.Vocab at 0x15a2e6240>,\n 'interpreted': <gensim.models.word2vec.Vocab at 0x15a2e6278>,\n 'invite': <gensim.models.word2vec.Vocab at 0x15a2e62b0>,\n 'clintonhttpswwwbostonglobecomnewspoliticsberniesanderssoldiersagainstoddsraisingconcernzombiedamaginghillaryclintonitbxxotpqgzdnyqmstoryhtml': <gensim.models.word2vec.Vocab at 0x15a2e62e8>,\n 'fundraisinghttpswwwhillaryclintoncomfeedwhatofficialhillaryamericawomancardgetsyou': <gensim.models.word2vec.Vocab at 0x15c367198>,\n 'httpgopoliticoemailcomqsebeeeebbdeeaffddccfa': <gensim.models.word2vec.Vocab at 0x15a2e6358>,\n 'frakt': <gensim.models.word2vec.Vocab at 0x15a2e6390>,\n 'whichreporters': <gensim.models.word2vec.Vocab at 0x15a2e63c8>,\n 'leesdncorgmailtoleesdncorg': <gensim.models.word2vec.Vocab at 0x15a2e6400>,\n 'governmentrun': <gensim.models.word2vec.Vocab at 0x15a2e6438>,\n 'wwwlinkedincompubshefalirazdanduggalhttpwwwlinkedincompubshefalirazdanduggal': <gensim.models.word2vec.Vocab at 0x15a2e64a8>,\n 'senatehttpblogswsjcomwashwireberniesandersslongevityoncampaigntrailsurprisesthesenate': <gensim.models.word2vec.Vocab at 0x15a2e64e0>,\n 'finalxls': <gensim.models.word2vec.Vocab at 0x15a2e6518>,\n 'httpwwwforbescomsitesrobertwoodforgetabouttrumpstaxreturnsbffa': 
<gensim.models.word2vec.Vocab at 0x15a2e6550>,\n 'calturnercalcommailtocalturnercalcom': <gensim.models.word2vec.Vocab at 0x15a2e6588>,\n 'powdered': <gensim.models.word2vec.Vocab at 0x15a2e65c0>,\n 'httpsmediumcompecdde': <gensim.models.word2vec.Vocab at 0x15a2e65f8>,\n 'nest': <gensim.models.word2vec.Vocab at 0x15a2e6630>,\n 'overtly': <gensim.models.word2vec.Vocab at 0x15a2e6668>,\n 'itasca': <gensim.models.word2vec.Vocab at 0x15a2e66a0>,\n 'rschwarzissuesllccommailtorschwarzissuesllccom': <gensim.models.word2vec.Vocab at 0x15c3437f0>,\n 'httpmittomailcomphplistltphpidzhagmzwgtpawrqavg': <gensim.models.word2vec.Vocab at 0x15a2e6710>,\n 'labolt': <gensim.models.word2vec.Vocab at 0x15a2e6748>,\n 'mrs': <gensim.models.word2vec.Vocab at 0x15a2e6780>,\n 'afrontaran': <gensim.models.word2vec.Vocab at 0x15a2e67b8>,\n 'huffposthttpclickactionnetworkorgmpsscwaniyaatwysdojjvsddutlkahdqynzmzfloqarkhfhwoafsbgnfexvknzubmnsswaeddkmqitapiwdlvzjvkncggsuxanqvxplzijlpbfbqwbryziqhokpmcbkpnqdeontukljnoynbmnmzzcgpbqilxklqbhhejtesbvkrkpenhuqijrnxpjyokqpvigljwrljihjhpedyhfrytzzmxhanqvipgteijfywmkikpkfohgsazwomibagkugajwyvriblbvbqnptgvxvfhalrcicrfohpslvioptzprbwfphpoiuqubntxjaxzuntisgvotlrtpvelzlbkyoeygnqxxoijjbqdttuynyjzfgeqxurvzdctswpyxhktvrnmhvkiebxwbadwbwomhsktifywyqsijxrjcajruwdd': <gensim.models.word2vec.Vocab at 0x15a2e67f0>,\n 'httpsownitcomcandidatescruz': <gensim.models.word2vec.Vocab at 0x15a2e6828>,\n 'zaparanuik': <gensim.models.word2vec.Vocab at 0x15a2e6860>,\n 'httplinkwashingtonpostcomclickahrchmlydldgvylmnvbspbnrlbnqvdhdlzxqdgvdddagvjayuymgdcuymfrozsuymerhawxjtiwmjayjtiwznjvbsuymcumfbvdvyugzdcuymghdhbzoivddlndhchpbmdbwbnlmnvbsuzxdzlbvdvycgzdcwywxvbwevzgfpbhktmjaylziwmtyvmdqvmjkvzgfpbhktmjaylwnydxotafzawnolxjlyjpbwluyxrpbzlxrcglmesldmvyexroawnlwhhcgxlcmtywjvdxqtdghllxnbatdhjbxatbwzwlbnqvntcymjjmmteodfiotjhmjjkmzuyilyzzbvyyudviyxpzwjndwbwmszcglzcmmbmxfzgfpbhkymdicaeadcbcfccdc': <gensim.models.word2vec.Vocab at 0x15a2e6898>,\n 'capitalists': <gensim.models.word2vec.Vocab 
at 0x15a2e68d0>,\n 'redefine': <gensim.models.word2vec.Vocab at 0x15a2e6908>,\n 'brandi': <gensim.models.word2vec.Vocab at 0x15a2e6940>,\n 'warfighter': <gensim.models.word2vec.Vocab at 0x15a2e6978>,\n 'arrested': <gensim.models.word2vec.Vocab at 0x15a2e69b0>,\n 'httprrsnettnjspfvwjwxztkxdukzqkpbnzzhfuwnksuiqitmoixuilxnxduaiffpfjrnvmvpstflzhvgqlcbptgsxmxbunsfpquibyxscsqkrnynnmagjvojfdtjpgxbobkxnraguzlodpeqvzszzgwvgufrejvziuliclpsnsffcoxqqeyywtxxchncmozmvbgiiwsngfvctpjlyachjrnpwmiqdsklkepkhipthzzeysjuldlnlzfuohodjljalhqfg': <gensim.models.word2vec.Vocab at 0x15a2e69e8>,\n 'httpclickeusatodaycomqsfaaddacfaabdadeedcbfcddfdabdaebaae': <gensim.models.word2vec.Vocab at 0x15a2e6a20>,\n 'trumphttpswwwwashingtonpostcomopinionsthemanywaysrepublicansaredistancingthemselvesfromtrumpedeeeaaacstoryhtml': <gensim.models.word2vec.Vocab at 0x15a2e6a58>,\n 'lightfoothttpswwwdonaldjtrumpcompressreleasesdonaldjtrumpendorsedbycongressmanjameslightfoot': <gensim.models.word2vec.Vocab at 0x15a2e6a90>,\n 'doorbell': <gensim.models.word2vec.Vocab at 0x15a2e6ac8>,\n 'httplinkwashingtonpostcomclickahrcdovlddyyxnoawndgucgzdcjbvbmvcyjagvjabvawldwlziwmtyvmduvmtkvdgwlwdlbmvyywwtywdyzwvtzwlxrvlxnlbmqtdszlxrybwcybysawjysjbvszcizsyzwfjagvklwfueskyxkvpdwbwmszcglzcmmbmxfzgfpbhkymdicaeadcbcfccfcbb': <gensim.models.word2vec.Vocab at 0x15a2e6b00>,\n 'wildss': <gensim.models.word2vec.Vocab at 0x15a2e6b38>,\n 'beyonce': <gensim.models.word2vec.Vocab at 0x15ae9c7b8>,\n 'decisiones': <gensim.models.word2vec.Vocab at 0x15a2e6ba8>,\n 'damascus': <gensim.models.word2vec.Vocab at 0x15a2e6be0>,\n 'lynda': <gensim.models.word2vec.Vocab at 0x15a2e6c18>,\n 'electoralmap': <gensim.models.word2vec.Vocab at 0x15a2e6c50>,\n 'outreaching': <gensim.models.word2vec.Vocab at 0x15a2e6c88>,\n 'columbus': <gensim.models.word2vec.Vocab at 0x15a2e6cc0>,\n 'tipsgreetingscomics': <gensim.models.word2vec.Vocab at 0x15a2e6cf8>,\n 'redstatehttpparacomparamountcommunicationcomctwinocynmdcecbcabeddbbcbefdr': 
<gensim.models.word2vec.Vocab at 0x15a2e6d30>,\n 'daughter': <gensim.models.word2vec.Vocab at 0x15a2e6d68>,\n 'disasterhttpwwwwashingtonexaminercomnevadagovsandovalwarnsgoptrumpspellselectoraldisasterarticle': <gensim.models.word2vec.Vocab at 0x15a2e6da0>,\n 'funk': <gensim.models.word2vec.Vocab at 0x15a2e6dd8>,\n 'channel': <gensim.models.word2vec.Vocab at 0x15ba104a8>,\n 'ensuing': <gensim.models.word2vec.Vocab at 0x15a2e6e48>,\n 'enumerated': <gensim.models.word2vec.Vocab at 0x15a2e6e80>,\n 'cultures': <gensim.models.word2vec.Vocab at 0x15a2e6eb8>,\n 'deerfield': <gensim.models.word2vec.Vocab at 0x15a2e6ef0>,\n 'httpclickeusatodaycomqsdbdadbfbbfcefedaabeceaadcfadeccebeecddeef': <gensim.models.word2vec.Vocab at 0x15a2e6f28>,\n 'httpgopoliticoemailcomqscdbabdbbbebdeeddffeeeda': <gensim.models.word2vec.Vocab at 0x15a2e6f60>,\n 'widdicombe': <gensim.models.word2vec.Vocab at 0x15a2e6f98>,\n 'hoyers': <gensim.models.word2vec.Vocab at 0x15a2e6fd0>,\n 'dreamworks': <gensim.models.word2vec.Vocab at 0x15a2e5048>,\n 'httpgopoliticoemailcomqsfffabcfdefdfdfecdfdabddaabcc': <gensim.models.word2vec.Vocab at 0x15b01d080>,\n 'totalitarian': <gensim.models.word2vec.Vocab at 0x15a2e5080>,\n 'semansky': <gensim.models.word2vec.Vocab at 0x15a2e50b8>,\n 'spoke': <gensim.models.word2vec.Vocab at 0x15a2e50f0>,\n 'opportunism': <gensim.models.word2vec.Vocab at 0x15b08d9b0>,\n 'lavatories': <gensim.models.word2vec.Vocab at 0x15a2e5128>,\n 'revving': <gensim.models.word2vec.Vocab at 0x15c34e128>,\n 'httpwwwwsjcomarticlesdonaldtrumpsdayincourtmodwsjreviewoutlookmccideafmceiduniqid': <gensim.models.word2vec.Vocab at 0x15a2e5198>,\n 'httplinkwashingtonpostcomclickahrchmlydcuawzdgfncmftlmnvbswljgqzidenahjlzcgtptemdbpcjjpwsxrhawxmjaycaeadcbcfccdea': <gensim.models.word2vec.Vocab at 0x15babbf60>,\n 'protests': <gensim.models.word2vec.Vocab at 0x15a2e51d0>,\n 'sloppy': <gensim.models.word2vec.Vocab at 0x15a2e5208>,\n 'nrsc': <gensim.models.word2vec.Vocab at 0x15a2e5240>,\n 'vip': 
<gensim.models.word2vec.Vocab at 0x15a2e5278>,\n 'httpgopoliticoemailcomqseabaebbbafdefbeeeceaadf': <gensim.models.word2vec.Vocab at 0x15a2e52b0>,\n 'timescbs': <gensim.models.word2vec.Vocab at 0x15a2e52e8>,\n 'prunefaced': <gensim.models.word2vec.Vocab at 0x12ff135f8>,\n 'httpgopoliticoemailcomqscccbfdddcaadcacaeeaeeaf': <gensim.models.word2vec.Vocab at 0x15a2e5358>,\n 'floyds': <gensim.models.word2vec.Vocab at 0x15a8b2630>,\n 'budgetbusting': <gensim.models.word2vec.Vocab at 0x15ac72f98>,\n 'preferenceshttpbusinessfwduslistmanagecomprofileuddabbbddfffidcdefcbd': <gensim.models.word2vec.Vocab at 0x15a2e5390>,\n 'httpclickemailbostonglobecomqsfeafddbdaebadbbbdedefcecadecfccfae': <gensim.models.word2vec.Vocab at 0x15a2e53c8>,\n 'debenedettihttpwwwpoliticocomstaffgabrieldebenedetti': <gensim.models.word2vec.Vocab at 0x15a2e5400>,\n 'httpgopoliticoemailcomqsebebeacdeddfefefadbebdbec': <gensim.models.word2vec.Vocab at 0x15c361438>,\n 'karlov': <gensim.models.word2vec.Vocab at 0x133cc57f0>,\n 'httpclickemailbostonglobecomqsccfdaefacadebedcdfeeafb': <gensim.models.word2vec.Vocab at 0x15a2e5470>,\n 'ihhjjqhwoljbeul': <gensim.models.word2vec.Vocab at 0x15a2e54a8>,\n 'bonoskygdncorgjavascriptebdcvmlbonoskygdncorg': <gensim.models.word2vec.Vocab at 0x15a2e54e0>,\n 'feld': <gensim.models.word2vec.Vocab at 0x15a2e5518>,\n 'surface': <gensim.models.word2vec.Vocab at 0x15a2e5550>,\n 'coreys': <gensim.models.word2vec.Vocab at 0x15a2e5588>,\n 'dormer': <gensim.models.word2vec.Vocab at 0x15ae9c9e8>,\n 'yield': <gensim.models.word2vec.Vocab at 0x15a2e55f8>,\n 'httpfamousdcuslistmanagecomtrackclickucdebedidefacbd': <gensim.models.word2vec.Vocab at 0x15a2e5630>,\n 'willhelp': <gensim.models.word2vec.Vocab at 0x15a2e5668>,\n 'weekendone': <gensim.models.word2vec.Vocab at 0x15a2e56a0>,\n 'httpmoneycnncommediaazealiabankstwittersuspendedindexhtmlmccidcbefmceiduniqid': <gensim.models.word2vec.Vocab at 0x15a2e56d8>,\n 'krystalina': <gensim.models.word2vec.Vocab at 0x15a2e5710>,\n 
'bestinclass': <gensim.models.word2vec.Vocab at 0x15a2e5748>,\n 'europehttpsactmyngpcomel': <gensim.models.word2vec.Vocab at 0x15a2e5780>,\n 'httpsmediumcomaftuniontheprofessionadvancedcceaasourceemailccdbafdailydigestsectionnamepublished': <gensim.models.word2vec.Vocab at 0x15a2e57b8>,\n 'bridgeport': <gensim.models.word2vec.Vocab at 0x15a2e57f0>,\n 'hashana': <gensim.models.word2vec.Vocab at 0x15a2e5828>,\n 'bestowed': <gensim.models.word2vec.Vocab at 0x15a2e5860>,\n 'saiful': <gensim.models.word2vec.Vocab at 0x15a2e5898>,\n 'sensicshud': <gensim.models.word2vec.Vocab at 0x15a2e58d0>,\n 'ldquostarrdquo': <gensim.models.word2vec.Vocab at 0x15a2e5908>,\n 'universality': <gensim.models.word2vec.Vocab at 0x15a2e5940>,\n 'secretive': <gensim.models.word2vec.Vocab at 0x15a2e5978>,\n 'friendhttpswwwgooglecomurlsatrctjqesrcssourcewebcdvedahukewjloybmahxhdkhqblcaqqqiihjaaurlhttpafffinanceyahoocomfnewsfdonaldtrumpisbecomingwallstreetsbestfriendhtmlusgafqjcngaoloknfzwblpbjrqfcw': <gensim.models.word2vec.Vocab at 0x15a2e59b0>,\n 'inputting': <gensim.models.word2vec.Vocab at 0x15a2e59e8>,\n 'evolved': <gensim.models.word2vec.Vocab at 0x15a2e5a20>,\n 'httpswwwwashingtonpostcomblogserikwemplewpmegynkellysbankruptinterviewwithdonaldtrumpmccideamceiduniqid': <gensim.models.word2vec.Vocab at 0x15a2e5a58>,\n 'httpgopoliticoemailcomqsaabbdfcfbcccdddfcaffafaae': <gensim.models.word2vec.Vocab at 0x15a2e5a90>,\n 'gorka': <gensim.models.word2vec.Vocab at 0x15a2e5ac8>,\n 'basicsusing': <gensim.models.word2vec.Vocab at 0x15a2e5b00>,\n 'httplinkwashingtonpostcomclickahrchmlydcuawzdgfncmftlmnvbswljgunvmwxuzlzcgtptemdbpcjjpwsxrhawxmjaycaeadcbcfccd': <gensim.models.word2vec.Vocab at 0x15a2e5b38>,\n 'fox': <gensim.models.word2vec.Vocab at 0x15a2e5b70>,\n 'nonperson': <gensim.models.word2vec.Vocab at 0x15a2e5ba8>,\n 'mica': <gensim.models.word2vec.Vocab at 0x15a2e5be0>,\n 'antidoping': <gensim.models.word2vec.Vocab at 0x15a2e5c18>,\n 'bend': <gensim.models.word2vec.Vocab at 0x15a2e5c50>,\n 
'petreliusdsccorg': <gensim.models.word2vec.Vocab at 0x15a2e5c88>,\n 'wenliang': <gensim.models.word2vec.Vocab at 0x15a2e5cc0>,\n 'watchhttpstoolboxdncorgtoolnamevantageuploaderpathvantageuploaderdncorgvideossharedshowjwteyjexaioijkvqilcjhbgcioijiuzinijeyjpyxqiojenjiotqnzqsimvtywlsijoicbvbgfyawnozbkbmmubjniiwiawqiojmxnzenswizgbmxvywrhymxlijpcnvlfqdovtdcovspqamsdvytyeptduswfacdd': <gensim.models.word2vec.Vocab at 0x15a2e5cf8>,\n 'mmorgensternwashingtonexaminercommailtommorgensternwashingtonexaminercom': <gensim.models.word2vec.Vocab at 0x15a2e5d30>,\n 'outspending': <gensim.models.word2vec.Vocab at 0x15a2e5d68>,\n 'httpwwwthedailybeastcomarticlesagendatheunconspiracythatjustwontdiehtml': <gensim.models.word2vec.Vocab at 0x15a2e5da0>,\n 'bash': <gensim.models.word2vec.Vocab at 0x15a2e5dd8>,\n 'mercenary': <gensim.models.word2vec.Vocab at 0x15a2e5e10>,\n 'stockexchange': <gensim.models.word2vec.Vocab at 0x15a2e5e48>,\n 'candace': <gensim.models.word2vec.Vocab at 0x15b0cb2e8>,\n 'fourthranking': <gensim.models.word2vec.Vocab at 0x15a2e5ef0>,\n 'entertainmentmedia': <gensim.models.word2vec.Vocab at 0x15a2e5f28>,\n 'thetampa': <gensim.models.word2vec.Vocab at 0x15a2e5f60>,\n 'jokey': <gensim.models.word2vec.Vocab at 0x15a2e5f98>,\n 'dwoogoptonlinenet': <gensim.models.word2vec.Vocab at 0x15a2e5fd0>,\n 'photoops': <gensim.models.word2vec.Vocab at 0x15a2e3048>,\n 'overtaken': <gensim.models.word2vec.Vocab at 0x15a2e3080>,\n 'httpfamousdcuslistmanagecomtrackclickucdebedidedeefacbd': <gensim.models.word2vec.Vocab at 0x15a2e30b8>,\n 'sa': <gensim.models.word2vec.Vocab at 0x15a2e30f0>,\n 'flung': <gensim.models.word2vec.Vocab at 0x15ae9ccc0>,\n 'denounced': <gensim.models.word2vec.Vocab at 0x15a2e3160>,\n 'httpsurldefenseproofpointcomvurluhttpawwwfacebookcompagesrolldcallxxfposdrrdcwmfaqcnsxitqylvmhhecrwpueqbgkqtvcikfpxsrcgfylnhvwagyepbqzrnpilfrenezxqgmmupgbzdrfmlsmfizkocycyytbcytuzdveqtfymsukwxwpmagbveimjuxilqnrdxwmoczahcxhtje': <gensim.models.word2vec.Vocab at 0x15a2e3198>,\n 
'lockdown': <gensim.models.word2vec.Vocab at 0x15a2e31d0>,\n 'goingdoing': <gensim.models.word2vec.Vocab at 0x15a2e3208>,\n 'flakes': <gensim.models.word2vec.Vocab at 0x15a2e3240>,\n 'undeserved': <gensim.models.word2vec.Vocab at 0x15a2e3278>,\n 'hillaryhttpstwittercomrealdonaldtrumpstatus': <gensim.models.word2vec.Vocab at 0x15a2e32b0>,\n 'puertas': <gensim.models.word2vec.Vocab at 0x15a2e32e8>,\n 'spitzer': <gensim.models.word2vec.Vocab at 0x15a2e3320>,\n 'appearance': <gensim.models.word2vec.Vocab at 0x15a2e3358>,\n 'pairing': <gensim.models.word2vec.Vocab at 0x15a2e3390>,\n 'gibbons': <gensim.models.word2vec.Vocab at 0x15a2e33c8>,\n 'presscatherinecortezmastocom': <gensim.models.word2vec.Vocab at 0x15a2e3400>,\n 'keady': <gensim.models.word2vec.Vocab at 0x15a2e3438>,\n 'httpclickeusatodaycomqsaabdfbfcadebcdfddcadcfbbdbafcbcdfffdde': <gensim.models.word2vec.Vocab at 0x15a2e3470>,\n 'httpclickemailbostonglobecomqsefaabefceffeaddbfacbdfbeadadfcbd': <gensim.models.word2vec.Vocab at 0x15a2e34a8>,\n 'crib': <gensim.models.word2vec.Vocab at 0x15a2e34e0>,\n 'adbel': <gensim.models.word2vec.Vocab at 0x15be080b8>,\n 'cidimagepngdaeeaccac': <gensim.models.word2vec.Vocab at 0x15a2e3518>,\n 'httplinkwashingtonpostcomclickahrchmlydcudfzagluzrvbnbvcquytlldmvcgzxjwbnlbhbgtyskywlsesymdivmjaxniwncyoskywlsesymdityjeiryxnpygtcmvjcmltawhdglvbnmtdhlwawzlwvzxjdghpbmctagfwbgvzcyhymdcagutcrvcccnvtcctbzlbwvudcnziymmyxmtkmwimmeymmqzntdjyjyvpdwbwmszcglzcmmbmxfzgfpbhkymdicaeadcbcfccfd': <gensim.models.word2vec.Vocab at 0x15a2e3550>,\n 'devised': <gensim.models.word2vec.Vocab at 0x15a2e35c0>,\n 'preferenceshttpamericanbridgepacuslistmanagecomprofileueebfeedcfeeffdidcfcebcdbbc': <gensim.models.word2vec.Vocab at 0x15a2e35f8>,\n 'capsules': <gensim.models.word2vec.Vocab at 0x15a2e3630>,\n 'walks': <gensim.models.word2vec.Vocab at 0x15a2e3668>,\n 'lootinghttpbluenationreviewcombernieaccuseshillaryoflaunderingandlooting': <gensim.models.word2vec.Vocab at 0x15a2e36a0>,\n 'parsed': 
<gensim.models.word2vec.Vocab at 0x15a2e36d8>,\n 'racking': <gensim.models.word2vec.Vocab at 0x15a2e3710>,\n 'daypart': <gensim.models.word2vec.Vocab at 0x15a2e3748>,\n 'mailtokcirillibloombergnethttpbloombergnet': <gensim.models.word2vec.Vocab at 0x15a2e3780>,\n 'httplinkwashingtonpostcomclickahrchmlydcudfzagluzrvbnbvcquytldyyxboawnzlbvbglawnzlnsawbtbwuzxkvpdwbwmszcglzcmmbmxfzgfpbhkymdicaeadcbcfcecfbd': <gensim.models.word2vec.Vocab at 0x15a2e37b8>,\n 'jda': <gensim.models.word2vec.Vocab at 0x15a2e37f0>,\n 'talents': <gensim.models.word2vec.Vocab at 0x15a2e3828>,\n 'horton': <gensim.models.word2vec.Vocab at 0x15a2e3860>,\n 'mileageplusr': <gensim.models.word2vec.Vocab at 0x15a2e3898>,\n 'httpsmediumcomglobalentrepreneurshipsummitsourceemailccdbafdailydigest': <gensim.models.word2vec.Vocab at 0x15a2e38d0>,\n 'httpsmediumcompauldughisourceemailccdbafdailydigest': <gensim.models.word2vec.Vocab at 0x15a2e3908>,\n 'stolenhttpwwwrgjcomstorynewspoliticsnevadademocraticcaucuseswhatshappeningnowrenoandvegas': <gensim.models.word2vec.Vocab at 0x15a2e3940>,\n 'titled': <gensim.models.word2vec.Vocab at 0x15a2e3978>,\n 'httpwwwcnncompoliticsdonaldtrumpvladimirputinbromance': <gensim.models.word2vec.Vocab at 0x15a2e39b0>,\n 'interestedevent': <gensim.models.word2vec.Vocab at 0x15a2e39e8>,\n 'fourtyfour': <gensim.models.word2vec.Vocab at 0x15a2e3a20>,\n 'safetynet': <gensim.models.word2vec.Vocab at 0x15a2e3a58>,\n 'trailhttpwwwftcomuselection': <gensim.models.word2vec.Vocab at 0x15a2e3a90>,\n 'questionmark': <gensim.models.word2vec.Vocab at 0x15a2e3ac8>,\n 'hacking': <gensim.models.word2vec.Vocab at 0x15a86ba90>,\n 'falls': <gensim.models.word2vec.Vocab at 0x15b0cb550>,\n ...}"
},
"execution_count": 86,
"output_type": "execute_result",
"metadata": {}
}
]
},
{
"metadata": {
"collapsed": true,
"trusted": true
},
"cell_type": "code",
"source": "# TODO: PCA and SVD",
"execution_count": null,
"outputs": []
},
{
"metadata": {
"collapsed": true,
"trusted": true
},
"cell_type": "code",
"source": "# TODO: cosine similarity",
"execution_count": null,
"outputs": []
},
{
"metadata": {
"collapsed": false,
"trusted": true
},
"cell_type": "code",
"source": "model.most_similar('private' ,topn=10)",
"execution_count": 90,
"outputs": [
{
"data": {
"text/plain": "[('sector', 0.6334954500198364),\n ('server', 0.6149282455444336),\n ('property', 0.5859717726707458),\n ('employee', 0.5775003433227539),\n ('assessments', 0.5543426871299744),\n ('completion', 0.5441495776176453),\n ('probe', 0.5410292148590088),\n ('service', 0.5277994275093079),\n ('encrypted', 0.5215306878089905),\n ('investigations', 0.5137321949005127)]"
},
"execution_count": 90,
"output_type": "execute_result",
"metadata": {}
}
]
}
],
"metadata": {
"language_info": {
"name": "python",
"pygments_lexer": "ipython3",
"nbconvert_exporter": "python",
"codemirror_mode": {
"version": 3,
"name": "ipython"
},
"version": "3.5.2",
"file_extension": ".py",
"mimetype": "text/x-python"
},
"kernelspec": {
"name": "python3",
"display_name": "Python 3",
"language": "python"
},
"gist": {
"id": "",
"data": {
"description": "projects/04-fletcher/dnc_leaks/DNC_Word2Vec_Gensim.ipynb",
"public": true
}
}
},
"nbformat": 4,
"nbformat_minor": 0
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment