Created
May 18, 2022 13:40
-
-
Save Narsil/a6b927c4973d4d0a63b1765cfff38e55 to your computer and use it in GitHub Desktop.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
import json | |
import time | |
from collections import defaultdict | |
from typing import List | |
with open("vocab.json", "r") as f: | |
vocab = json.load(f) | |
def normal(vocab: dict) -> List[str]: | |
merges = [] | |
for piece_l in vocab.keys(): | |
for piece_r in vocab.keys(): | |
merge = f"{piece_l}{piece_r}" | |
piece_id = vocab.get(merge, None) | |
if piece_id: | |
merges += [(piece_l, piece_r, piece_id)] | |
merges = sorted(merges, key=lambda val: val[2]) | |
merges = [(val[0], val[1]) for val in merges] | |
return merges | |
def improved(vocab: dict) -> List[str]: | |
merges = [] | |
prefixes = dict() | |
for word in vocab.keys(): | |
for i in range(len(word)): | |
prefixes[word[: i + 1]] = {word} | prefixes.setdefault(word[: i + 1], set()) | |
for word in vocab.keys(): | |
if len(prefixes[word]) > 1: | |
for candidate in prefixes[word]: | |
if word != candidate: | |
if candidate[len(word) :] in vocab: | |
piece_id = vocab.get(candidate, None) | |
merges += [(word, candidate[len(word) :], piece_id)] | |
merges = sorted(merges, key=lambda val: val[2]) | |
merges = [(val[0], val[1]) for val in merges] | |
return merges | |
def improved2(vocab: dict) -> List[str]: | |
merges = [] | |
for candidate, piece_id in vocab.items(): | |
for i in range(1, len(candidate)): | |
left, right = candidate[:i], candidate[i:] | |
left_id = vocab.get(left, None) | |
right_id = vocab.get(right, None) | |
if left_id is not None and right_id is not None: | |
merges += [(left, right, piece_id, left_id, right_id)] | |
merges = sorted(merges, key=lambda val: val[2:]) | |
merges = [(val[0], val[1]) for val in merges] | |
return merges | |
print(f"vocabulary length: {len(vocab)}, max word length: {max(len(word) for word in vocab.keys())}") | |
start = time.time() | |
result_improved = improved(vocab) | |
print(f"improved: {time.time() - start} secs") | |
start = time.time() | |
result_improved2 = improved2(vocab) | |
print(f"improved2: {time.time() - start} secs") | |
start = time.time() | |
result_normal = normal(vocab) | |
print(f"normal: {time.time() - start} secs") | |
# confirm that results match | |
assert result_improved2 == result_improved | |
assert result_normal == result_improved |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
{ | |
"<s>": 0, | |
"<pad>": 1, | |
"</s>": 2, | |
"<unk>": 3, | |
".": 4, | |
"Ġthe": 5, | |
",": 6, | |
"Ġto": 7, | |
"Ġand": 8, | |
"Ġof": 9, | |
"Ġa": 10, | |
"Ġin": 11, | |
"-": 12, | |
"Ġfor": 13, | |
"Ġthat": 14, | |
"Ġon": 15, | |
"Ġis": 16, | |
"âĢ": 17, | |
"'s": 18, | |
"Ġwith": 19, | |
"ĠThe": 20, | |
"Ġwas": 21, | |
"Ġ\"": 22, | |
"Ġat": 23, | |
"Ġit": 24, | |
"Ġas": 25, | |
"Ġsaid": 26, | |
"Ļ": 27, | |
"Ġbe": 28, | |
"s": 29, | |
"Ġby": 30, | |
"Ġfrom": 31, | |
"Ġare": 32, | |
"Ġhave": 33, | |
"Ġhas": 34, | |
":": 35, | |
"Ġ(": 36, | |
"Ġhe": 37, | |
"ĠI": 38, | |
"Ġhis": 39, | |
"Ġwill": 40, | |
"Ġan": 41, | |
"Ġthis": 42, | |
")": 43, | |
"ĠâĢ": 44, | |
"Ġnot": 45, | |
"Ŀ": 46, | |
"Ġyou": 47, | |
"ľ": 48, | |
"Ġtheir": 49, | |
"Ġor": 50, | |
"Ġthey": 51, | |
"Ġwe": 52, | |
"Ġbut": 53, | |
"Ġwho": 54, | |
"Ġmore": 55, | |
"Ġhad": 56, | |
"Ġbeen": 57, | |
"Ġwere": 58, | |
"Ġabout": 59, | |
",\"": 60, | |
"Ġwhich": 61, | |
"Ġup": 62, | |
"Ġits": 63, | |
"Ġcan": 64, | |
"Ġone": 65, | |
"Ġout": 66, | |
"Ġalso": 67, | |
"Ġ$": 68, | |
"Ġher": 69, | |
"Ġall": 70, | |
"Ġafter": 71, | |
".\"": 72, | |
"/": 73, | |
"Ġwould": 74, | |
"'t": 75, | |
"Ġyear": 76, | |
"Ġwhen": 77, | |
"Ġfirst": 78, | |
"Ġshe": 79, | |
"Ġtwo": 80, | |
"Ġover": 81, | |
"Ġpeople": 82, | |
"ĠA": 83, | |
"Ġour": 84, | |
"ĠIt": 85, | |
"Ġtime": 86, | |
"Ġthan": 87, | |
"Ġinto": 88, | |
"Ġthere": 89, | |
"t": 90, | |
"ĠHe": 91, | |
"Ġnew": 92, | |
"ĠâĢĶ": 93, | |
"Ġlast": 94, | |
"Ġjust": 95, | |
"ĠIn": 96, | |
"Ġother": 97, | |
"Ġso": 98, | |
"Ġwhat": 99, | |
"I": 100, | |
"Ġlike": 101, | |
"a": 102, | |
"Ġsome": 103, | |
"S": 104, | |
"ë": 105, | |
"Ġthem": 106, | |
"Ġyears": 107, | |
"'": 108, | |
"Ġdo": 109, | |
"Ġyour": 110, | |
"Ġ-": 111, | |
"Ġ1": 112, | |
"\"": 113, | |
"Ġif": 114, | |
"Ġcould": 115, | |
"?": 116, | |
"Ġno": 117, | |
"i": 118, | |
"m": 119, | |
"Ġget": 120, | |
"ĠU": 121, | |
"Ġnow": 122, | |
"Ġhim": 123, | |
"Ġback": 124, | |
"ĠBut": 125, | |
"ĠâĢĵ": 126, | |
"Ġmy": 127, | |
"Ġ'": 128, | |
"Ġonly": 129, | |
"Ġthree": 130, | |
";": 131, | |
"Ġ2": 132, | |
"The": 133, | |
"1": 134, | |
"Ġpercent": 135, | |
"Ġagainst": 136, | |
"Ġbefore": 137, | |
"Ġcompany": 138, | |
"o": 139, | |
"ĠTrump": 140, | |
"Ġhow": 141, | |
"Ġbecause": 142, | |
"Ġany": 143, | |
"Ġmost": 144, | |
"Ġbeing": 145, | |
"Ġmake": 146, | |
"Ġwhere": 147, | |
"Ġduring": 148, | |
"Ġthrough": 149, | |
"Ġwhile": 150, | |
"000": 151, | |
"ĠThis": 152, | |
"Ġmillion": 153, | |
"ing": 154, | |
"Ġ3": 155, | |
"Ġmade": 156, | |
"Ġwell": 157, | |
"Ġ10": 158, | |
"Ġdown": 159, | |
"Ġoff": 160, | |
"Ġsays": 161, | |
"Ġme": 162, | |
"ĠB": 163, | |
"Ġgoing": 164, | |
"Ġteam": 165, | |
"ĠWe": 166, | |
"Ġthose": 167, | |
"Ġgovernment": 168, | |
"Ġway": 169, | |
"We": 170, | |
"Ġmany": 171, | |
"Ġthen": 172, | |
"Ġwork": 173, | |
"Ġtold": 174, | |
"com": 175, | |
"2": 176, | |
"Ġgame": 177, | |
"ĠAnd": 178, | |
"in": 179, | |
"year": 180, | |
"Ġp": 181, | |
"Ġvery": 182, | |
"Ġday": 183, | |
"Ġhome": 184, | |
"Ġtake": 185, | |
"Ġweek": 186, | |
"Ġsince": 187, | |
"ĠNew": 188, | |
"Ġmay": 189, | |
"Ġeven": 190, | |
"Ġseason": 191, | |
"Ġsee": 192, | |
"Ġ2017": 193, | |
"Ġstate": 194, | |
"Ġ5": 195, | |
"ed": 196, | |
"Ġshould": 197, | |
"Ġaround": 198, | |
"Ġ2018": 199, | |
"Ġsecond": 200, | |
"Ġus": 201, | |
"Ġstill": 202, | |
"Ġmuch": 203, | |
"Ġ4": 204, | |
"Ġgood": 205, | |
"Ġthink": 206, | |
"%": 207, | |
"ĠS": 208, | |
"Ġthese": 209, | |
"Ġmarket": 210, | |
"ĠD": 211, | |
"th": 212, | |
"Ġgo": 213, | |
"'re": 214, | |
"Ġsuch": 215, | |
"Ġknow": 216, | |
"Ġincluding": 217, | |
"Ġdon": 218, | |
"y": 219, | |
"Ġnext": 220, | |
"ĠP": 221, | |
"Ġdid": 222, | |
"Ġunder": 223, | |
"Ġsay": 224, | |
"en": 225, | |
"ĠL": 226, | |
"Ġbetween": 227, | |
"Ġper": 228, | |
"ĠK": 229, | |
"ĠC": 230, | |
"Ġ6": 231, | |
"Ġworld": 232, | |
"Ġpart": 233, | |
"ĠN": 234, | |
"Ġright": 235, | |
"Ġwant": 236, | |
"Ġfour": 237, | |
"),": 238, | |
"Ġhigh": 239, | |
"Ġneed": 240, | |
"re": 241, | |
"e": 242, | |
"It": 243, | |
"Ġhelp": 244, | |
"5": 245, | |
"3": 246, | |
"Ġcountry": 247, | |
"ĠR": 248, | |
"Ġpolice": 249, | |
"A": 250, | |
"Ġlong": 251, | |
"ĠThey": 252, | |
"Ġend": 253, | |
"er": 254, | |
"ĠT": 255, | |
"ĠM": 256, | |
"u": 257, | |
"Ġboth": 258, | |
"Ġhere": 259, | |
"an": 260, | |
"on": 261, | |
"Ġ7": 262, | |
"Ġde": 263, | |
"ĠShe": 264, | |
"Ġbusiness": 265, | |
"Ġreport": 266, | |
"j": 267, | |
"ers": 268, | |
"Ġreally": 269, | |
"ĠPresident": 270, | |
"ar": 271, | |
"ĠG": 272, | |
"ĠFriday": 273, | |
"ĠF": 274, | |
"Ġbest": 275, | |
"Ġsame": 276, | |
"Ġanother": 277, | |
"Ġset": 278, | |
"old": 279, | |
"ĠThat": 280, | |
"as": 281, | |
"n": 282, | |
"Ġcome": 283, | |
"Ġfamily": 284, | |
"Ġpublic": 285, | |
"ĠFor": 286, | |
"ĠAs": 287, | |
"0": 288, | |
"ĠH": 289, | |
"Ġ8": 290, | |
"Ġ20": 291, | |
"Ġfive": 292, | |
"es": 293, | |
"ĠTuesday": 294, | |
"Ġn": 295, | |
"ĠThursday": 296, | |
"Ġquarter": 297, | |
"h": 298, | |
"Ġtop": 299, | |
"Ġgot": 300, | |
"Ġlife": 301, | |
"ĠMonday": 302, | |
"Ġfound": 303, | |
"Ġuse": 304, | |
"ĠW": 305, | |
"4": 306, | |
"ĠWednesday": 307, | |
"Ġown": 308, | |
"Ġaccording": 309, | |
"Ġplay": 310, | |
"Ġshow": 311, | |
"ĠSt": 312, | |
"Ġman": 313, | |
"Ġleft": 314, | |
"ĠUnited": 315, | |
"Ġ12": 316, | |
"Ġplace": 317, | |
"ĠIf": 318, | |
"Ġlot": 319, | |
"Ġformer": 320, | |
"Ġ0": 321, | |
").": 322, | |
"Ġsupport": 323, | |
"ie": 324, | |
"Ġbillion": 325, | |
"Ġt": 326, | |
"Ġshares": 327, | |
"!": 328, | |
"z": 329, | |
"k": 330, | |
"ĠState": 331, | |
"Ġpoints": 332, | |
"Ġgroup": 333, | |
"Ġschool": 334, | |
"Ġinformation": 335, | |
"Ġ2016": 336, | |
"al": 337, | |
"r": 338, | |
"Ġwin": 339, | |
"Ġnews": 340, | |
"Ġused": 341, | |
"Ġput": 342, | |
"Ġcity": 343, | |
"ĠJ": 344, | |
"ĠThere": 345, | |
"Ġnumber": 346, | |
"C": 347, | |
"'ve": 348, | |
"Ġeach": 349, | |
"Ġtoo": 350, | |
"Ġwon": 351, | |
"ly": 352, | |
"Ġmonth": 353, | |
"is": 354, | |
"Ġadded": 355, | |
"Ġlook": 356, | |
"Ġbetter": 357, | |
"Ġevery": 358, | |
"Ġ&": 359, | |
"Ġdays": 360, | |
"Ġ9": 361, | |
"Ġtook": 362, | |
"Ġnight": 363, | |
"Ġe": 364, | |
"Ġ11": 365, | |
"os": 366, | |
"Ġfew": 367, | |
"or": 368, | |
"ĠNorth": 369, | |
"ĠYou": 370, | |
"Ġthird": 371, | |
"Ġgreat": 372, | |
"Ġcalled": 373, | |
"ĠOn": 374, | |
"Ġpast": 375, | |
"Ġcame": 376, | |
"Ġmonths": 377, | |
"ĠSaturday": 378, | |
"Ġ15": 379, | |
"Ġbig": 380, | |
"ĠE": 381, | |
"ĠUS": 382, | |
"Ġthings": 383, | |
"ĠO": 384, | |
"Ġd": 385, | |
"Ġstart": 386, | |
"B": 387, | |
"Ġstock": 388, | |
"Ġ30": 389, | |
"Ġwomen": 390, | |
"ĠSouth": 391, | |
"ĠMay": 392, | |
"Ġnever": 393, | |
"Ġpresident": 394, | |
"ĠSunday": 395, | |
"Ġwithout": 396, | |
"man": 397, | |
"8": 398, | |
"Ġdidn": 399, | |
"Ġlocal": 400, | |
"6": 401, | |
"Ġsomething": 402, | |
"Ġcase": 403, | |
"ĠAll": 404, | |
"it": 405, | |
"7": 406, | |
"ĠSo": 407, | |
"Ġchildren": 408, | |
"Ġaway": 409, | |
"Ġlittle": 410, | |
"Ġsix": 411, | |
"ĠCity": 412, | |
"ĠCounty": 413, | |
"Ġdata": 414, | |
"at": 415, | |
"Ġalready": 416, | |
"d": 417, | |
"Ġmoney": 418, | |
"Ġearly": 419, | |
"Ġacross": 420, | |
"Ġexpected": 421, | |
"Ġrun": 422, | |
"Ġlater": 423, | |
"am": 424, | |
"Ġprice": 425, | |
"Ġgames": 426, | |
"ĠMr": 427, | |
"b": 428, | |
"Ġmight": 429, | |
"Ġdifferent": 430, | |
"Ġreported": 431, | |
"Ġdeal": 432, | |
"Ġmedia": 433, | |
"Ġgrowth": 434, | |
"Ġcommunity": 435, | |
"ĠChina": 436, | |
"'m": 437, | |
"c": 438, | |
"Ġwent": 439, | |
"ĠNo": 440, | |
"Ġable": 441, | |
"Ġmaking": 442, | |
"Ġarea": 443, | |
"Ġfar": 444, | |
"Ġstatement": 445, | |
"ĠHouse": 446, | |
"Ġworking": 447, | |
"M": 448, | |
"Ġk": 449, | |
"Ġseen": 450, | |
"Ġcompanies": 451, | |
"Ġtoday": 452, | |
"Ġmembers": 453, | |
"Ġuntil": 454, | |
"Ġfull": 455, | |
"Ġagain": 456, | |
"Ġhalf": 457, | |
"Ġshare": 458, | |
"le": 459, | |
"Ġalways": 460, | |
"Ġcourt": 461, | |
"l": 462, | |
"and": 463, | |
"Ġchange": 464, | |
"Ġfind": 465, | |
"9": 466, | |
"Ġsystem": 467, | |
"ĠV": 468, | |
"ĠYork": 469, | |
"ĠAmerican": 470, | |
"Ġhead": 471, | |
"Ġplayers": 472, | |
"Ġdoes": 473, | |
"Ġhealth": 474, | |
"Ġm": 475, | |
"Ġpower": 476, | |
"Ġpoint": 477, | |
"Ġhit": 478, | |
"Ġ.": 479, | |
"Ġ--": 480, | |
"Ġfree": 481, | |
".,": 482, | |
"Ġlead": 483, | |
"Ġseveral": 484, | |
"Ġrecent": 485, | |
"Ġcall": 486, | |
"N": 487, | |
"Ġlaw": 488, | |
"Ġkeep": 489, | |
"Ġopen": 490, | |
"ĠNews": 491, | |
"Ġgive": 492, | |
"ia": 493, | |
"ĠMarch": 494, | |
"D": 495, | |
"ĠNational": 496, | |
"ĠAt": 497, | |
"Ġtimes": 498, | |
"Ġfuture": 499, | |
"R": 500, | |
"Ġ14": 501, | |
"ĠJune": 502, | |
"Ġofficials": 503, | |
"Ġ18": 504, | |
"Ġimportant": 505, | |
"f": 506, | |
"Ġfinal": 507, | |
"Ġ13": 508, | |
"ĠOne": 509, | |
"P": 510, | |
"Ġfollowing": 511, | |
"Ġcar": 512, | |
"Ġleast": 513, | |
"Ġwater": 514, | |
"Ġevent": 515, | |
"Ġline": 516, | |
"Ġmove": 517, | |
"Ġservices": 518, | |
"Ġhaving": 519, | |
"ĠWhen": 520, | |
"Ġstudents": 521, | |
"ĠPolice": 522, | |
"el": 523, | |
"Ġam": 524, | |
"ĠZ": 525, | |
"Ġside": 526, | |
"Ġstory": 527, | |
"Ġdue": 528, | |
"Ġmeeting": 529, | |
"K": 530, | |
"Ġmust": 531, | |
"ĠStates": 532, | |
"Ġlikely": 533, | |
"G": 534, | |
"Ġcontinue": 535, | |
"Ġago": 536, | |
"Ġparty": 537, | |
"Ġmajor": 538, | |
"Ġindustry": 539, | |
"Ġless": 540, | |
"30": 541, | |
"Ġun": 542, | |
"Ġhard": 543, | |
"Ġservice": 544, | |
"Ġ16": 545, | |
"Ġlooking": 546, | |
"Ġheld": 547, | |
"ve": 548, | |
"Ġwhether": 549, | |
"ĠJuly": 550, | |
"Ġtaken": 551, | |
"Ġalong": 552, | |
"Ġasked": 553, | |
"Ġstarted": 554, | |
"Ġbecome": 555, | |
"Ġforward": 556, | |
"Ġresearch": 557, | |
"Ġoffice": 558, | |
"Ġpolitical": 559, | |
"to": 560, | |
"Ġtogether": 561, | |
"Ġgetting": 562, | |
"Ġplan": 563, | |
"Ġ25": 564, | |
"T": 565, | |
"Ġamong": 566, | |
"Ġcoming": 567, | |
"Ġdecision": 568, | |
"Ġvideo": 569, | |
"Ġ2015": 570, | |
"g": 571, | |
"ĠAfter": 572, | |
"Ġsecurity": 573, | |
"L": 574, | |
"Ġcare": 575, | |
"Ġgiven": 576, | |
"Ġavailable": 577, | |
"âĢĶ": 578, | |
"Ġs": 579, | |
"ĠWest": 580, | |
"'ll": 581, | |
"Ġpay": 582, | |
"Ġnear": 583, | |
"Ġsaying": 584, | |
"Ġannounced": 585, | |
"Ġprogram": 586, | |
"ĠApril": 587, | |
"Ġreal": 588, | |
"ĠUniversity": 589, | |
"ĠWith": 590, | |
"AP": 591, | |
"Ġsocial": 592, | |
"Ġclose": 593, | |
"et": 594, | |
"Ġcurrent": 595, | |
"Ġwhy": 596, | |
"F": 597, | |
"ĠTo": 598, | |
"ĠTwitter": 599, | |
"Ġthough": 600, | |
"Ġ17": 601, | |
"Ġtaking": 602, | |
"ĠInc": 603, | |
"Ġmen": 604, | |
"w": 605, | |
"Ġcomes": 606, | |
"ley": 607, | |
"Ġdoing": 608, | |
"Ġprocess": 609, | |
"ĠJohn": 610, | |
"ch": 611, | |
"00": 612, | |
"Ġfinancial": 613, | |
"Ġlow": 614, | |
"Ġenough": 615, | |
"ĠWhile": 616, | |
"Ġfurther": 617, | |
"Ġpost": 618, | |
"Ġfeel": 619, | |
"st": 620, | |
"Ġperson": 621, | |
"ĠFacebook": 622, | |
"ĠWorld": 623, | |
"Ġwithin": 624, | |
"ad": 625, | |
"Ġdone": 626, | |
"the": 627, | |
"Ġlate": 628, | |
"Ġtax": 629, | |
"Ġdoesn": 630, | |
"Ġthing": 631, | |
"Ġnational": 632, | |
"Ġjob": 633, | |
"Ġusing": 634, | |
"ĠHowever": 635, | |
"ic": 636, | |
"Ġcampaign": 637, | |
"Ġrecord": 638, | |
"Ġbehind": 639, | |
"://": 640, | |
"ĠDepartment": 641, | |
"p": 642, | |
"Ġothers": 643, | |
"ĠJanuary": 644, | |
"Ġorder": 645, | |
"Ġ[": 646, | |
"Ġsales": 647, | |
"Ġyet": 648, | |
"Ä": 649, | |
"Ġsmall": 650, | |
"Ġseries": 651, | |
"Ġface": 652, | |
"ĠWhat": 653, | |
"Ġ50": 654, | |
"Ġever": 655, | |
"Ġearlier": 656, | |
"Ġlove": 657, | |
"up": 658, | |
"Ġrights": 659, | |
"ĠAn": 660, | |
"ist": 661, | |
"Ġmorning": 662, | |
"ĠWashington": 663, | |
"Ġyoung": 664, | |
"Ġlatest": 665, | |
"ĠIndia": 666, | |
"Ġtrying": 667, | |
"Ġfire": 668, | |
"Ġled": 669, | |
"Ġstrong": 670, | |
"Ġreturn": 671, | |
"Ġlevel": 672, | |
"O": 673, | |
"Ġaverage": 674, | |
"Ġperiod": 675, | |
"Ġexperience": 676, | |
"ak": 677, | |
"Ġpossible": 678, | |
"Ġbelieve": 679, | |
"Ġinclude": 680, | |
"Ġoil": 681, | |
"Ġrecently": 682, | |
"Ġonce": 683, | |
"Ġknown": 684, | |
"Ġlost": 685, | |
"Ġsure": 686, | |
"us": 687, | |
"Ġweeks": 688, | |
"Ġfood": 689, | |
"Ġreports": 690, | |
"Ġrating": 691, | |
"ĠMinister": 692, | |
"Ġwoman": 693, | |
"Ġprovide": 694, | |
"Ġproject": 695, | |
"Ġissue": 696, | |
"Ġlive": 697, | |
"10": 698, | |
"Ġclear": 699, | |
"he": 700, | |
"Ġcost": 701, | |
"Ġplayed": 702, | |
"Ġreleased": 703, | |
"Ġcoach": 704, | |
"v": 705, | |
"Ġ24": 706, | |
"Ġseven": 707, | |
"Ġplans": 708, | |
"Ġdevelopment": 709, | |
"ur": 710, | |
"ĺ": 711, | |
"Ġincrease": 712, | |
"This": 713, | |
"Ġpolicy": 714, | |
"Ġcent": 715, | |
"Ġbased": 716, | |
"E": 717, | |
"il": 718, | |
"ĠDecember": 719, | |
"Ġglobal": 720, | |
"Ġtrade": 721, | |
"Ġhours": 722, | |
"Ġhigher": 723, | |
"Ġgoal": 724, | |
"H": 725, | |
"ĠAl": 726, | |
"Ġ100": 727, | |
"Ġminutes": 728, | |
"Ġelection": 729, | |
"ĠAmerica": 730, | |
"Ġrate": 731, | |
"ĠCh": 732, | |
"Ġ21": 733, | |
"...": 734, | |
"ĠWhite": 735, | |
"Ġdirector": 736, | |
"Ġposition": 737, | |
"Ġshot": 738, | |
"Ġlarge": 739, | |
"Ġc": 740, | |
"Ġb": 741, | |
"]": 742, | |
"Ġissues": 743, | |
"Ġdeath": 744, | |
"Ġbuilding": 745, | |
"Ġtotal": 746, | |
"Ġoften": 747, | |
"Ġv": 748, | |
"Ġcountries": 749, | |
"Ġhistory": 750, | |
"Ġoutside": 751, | |
"Ġfederal": 752, | |
"Ġ19": 753, | |
"Ġfact": 754, | |
"ĠHigh": 755, | |
"Ġcareer": 756, | |
"im": 757, | |
"Ġinternational": 758, | |
"ĠNovember": 759, | |
"Ġfront": 760, | |
"Ġkind": 761, | |
"Ġkey": 762, | |
"ra": 763, | |
"ĠSan": 764, | |
"Ġshort": 765, | |
"Ġname": 766, | |
"ĠAccording": 767, | |
"Ġcourse": 768, | |
"Ġre": 769, | |
"Ġwanted": 770, | |
"W": 771, | |
"ĠSeptember": 772, | |
"Ġinterest": 773, | |
"Ġrole": 774, | |
"Ġresults": 775, | |
"Ġeconomic": 776, | |
"Ġ2014": 777, | |
"Ġchance": 778, | |
"ĠOctober": 779, | |
"Ġspecial": 780, | |
"Ġofficial": 781, | |
"Ġneeds": 782, | |
"um": 783, | |
"Ġl": 784, | |
"Ġproducts": 785, | |
"Ġnon": 786, | |
"Ġ@": 787, | |
"ĠBank": 788, | |
"Ġahead": 789, | |
"Ġhouse": 790, | |
"U": 791, | |
"Ġboard": 792, | |
"Ġold": 793, | |
"Ġsaw": 794, | |
"Ġlower": 795, | |
"ĠEuropean": 796, | |
"Ġcontrol": 797, | |
"ĠRussia": 798, | |
"Ġeight": 799, | |
"Ġrelease": 800, | |
"Ġpotential": 801, | |
"Ġthought": 802, | |
"Ġinvestigation": 803, | |
"Ġonline": 804, | |
"based": 805, | |
"Ġtechnology": 806, | |
"ĠDonald": 807, | |
"id": 808, | |
"Ġbody": 809, | |
"Ġrisk": 810, | |
"ian": 811, | |
"Ġcapital": 812, | |
"Ġstaff": 813, | |
"Ġaction": 814, | |
"ĠLeague": 815, | |
"Ġplaying": 816, | |
"Ġmakes": 817, | |
"Ġalmost": 818, | |
"Ġperformance": 819, | |
"Ġ22": 820, | |
"Ġg": 821, | |
"Ġfilm": 822, | |
"Ġnearly": 823, | |
"ĠCenter": 824, | |
"Ġvisit": 825, | |
"ĠGroup": 826, | |
"Ġbank": 827, | |
"Ġbit": 828, | |
"Ġreceived": 829, | |
"ĠAugust": 830, | |
"Ġmilitary": 831, | |
"ĠHis": 832, | |
"ine": 833, | |
"Ġchief": 834, | |
"ĠSchool": 835, | |
"Ġbring": 836, | |
"ĠCourt": 837, | |
"Ġ(@": 838, | |
"Ġmeans": 839, | |
"ĠSh": 840, | |
"Ġfans": 841, | |
"Ġse": 842, | |
"Ġ40": 843, | |
"20": 844, | |
"\".": 845, | |
"V": 846, | |
"Ġcut": 847, | |
"Ġkilled": 848, | |
"Ġ#": 849, | |
"Ġprices": 850, | |
"Ġgave": 851, | |
"ĠStreet": 852, | |
"ir": 853, | |
"ĠY": 854, | |
"Ġcurrently": 855, | |
"Ġf": 856, | |
"ay": 857, | |
"ne": 858, | |
"te": 859, | |
"Ġtry": 860, | |
"ĠPark": 861, | |
"ĥ": 862, | |
"J": 863, | |
"Ġquestion": 864, | |
"Ġhand": 865, | |
"Ġeconomy": 866, | |
"Ġinvestors": 867, | |
"able": 868, | |
"Ġplayer": 869, | |
"ĠBy": 870, | |
"ĠDavid": 871, | |
"Ġloss": 872, | |
"ab": 873, | |
"Ġbelow": 874, | |
"Ġwrote": 875, | |
"co": 876, | |
"ate": 877, | |
"Ġrunning": 878, | |
"un": 879, | |
"Ġbegan": 880, | |
"Ġsingle": 881, | |
"Ġfield": 882, | |
"Ġ23": 883, | |
"Ġleader": 884, | |
"Ġw": 885, | |
"ĠCalifornia": 886, | |
"Ġfourth": 887, | |
"Ġactually": 888, | |
"Ġlist": 889, | |
"ll": 890, | |
"Ġcouple": 891, | |
"Ġstudy": 892, | |
"Ġteams": 893, | |
"He": 894, | |
"ah": 895, | |
"ĠCanada": 896, | |
"Ġla": 897, | |
"Ġresult": 898, | |
"Ġaccess": 899, | |
"Ġvote": 900, | |
"ĠMore": 901, | |
"ĠFebruary": 902, | |
"Ġrevenue": 903, | |
"Ġoffer": 904, | |
"Ġlet": 905, | |
"ier": 906, | |
"Ġbuy": 907, | |
"Ġattack": 908, | |
"Ġblack": 909, | |
"Ġr": 910, | |
"Ġareas": 911, | |
"Ġstop": 912, | |
"Ġimpact": 913, | |
"Ġmatch": 914, | |
"Ġinvestment": 915, | |
"Ġcustomers": 916, | |
"Ġleaders": 917, | |
"ies": 918, | |
"Ġmember": 919, | |
"Ġchild": 920, | |
"Ġroad": 921, | |
"ul": 922, | |
"Ġvalue": 923, | |
"Ġshows": 924, | |
"ĠDr": 925, | |
"ĠDe": 926, | |
"ant": 927, | |
"ĠLondon": 928, | |
"Ġroom": 929, | |
"Ġmusic": 930, | |
"Ġproduction": 931, | |
"Ġanything": 932, | |
"Ġfirm": 933, | |
"Ġbiggest": 934, | |
"Ġair": 935, | |
"Ġproblem": 936, | |
"Ġgeneral": 937, | |
"Ġwasn": 938, | |
"Ġi": 939, | |
"Ġprivate": 940, | |
"Ġespecially": 941, | |
"Ġadministration": 942, | |
"Ġadditional": 943, | |
"ĠCo": 944, | |
"Ġopportunity": 945, | |
"Ġhold": 946, | |
"&": 947, | |
"Ġmatter": 948, | |
"Ġsenior": 949, | |
"Ġclub": 950, | |
"Ġsomeone": 951, | |
"ĠÃ": 952, | |
"ĠEast": 953, | |
"Ġ2019": 954, | |
".'": 955, | |
"Ġneeded": 956, | |
"ĠJames": 957, | |
"time": 958, | |
"Ġhowever": 959, | |
"Ġeverything": 960, | |
"Ġeveryone": 961, | |
"Ġdied": 962, | |
"Ġinvolved": 963, | |
"Ġfriends": 964, | |
"Ġisn": 965, | |
"Ġworth": 966, | |
"ik": 967, | |
"ĠCup": 968, | |
"Ġshowed": 969, | |
"There": 970, | |
"Ġ28": 971, | |
"Ġmeet": 972, | |
"Ġ26": 973, | |
"Ġ27": 974, | |
"Y": 975, | |
"Ġregion": 976, | |
"ĠPress": 977, | |
"ĠNow": 978, | |
"Ġson": 979, | |
"Ġspace": 980, | |
"Ġleading": 981, | |
"Ġstates": 982, | |
"Ġweekend": 983, | |
"Ġ£": 984, | |
"Ġmother": 985, | |
"Ġprevious": 986, | |
"ĠUK": 987, | |
"ĠMichael": 988, | |
"Ġleave": 989, | |
"est": 990, | |
"em": 991, | |
"Ġz": 992, | |
"ĠSome": 993, | |
"ors": 994, | |
"out": 995, | |
"15": 996, | |
"Ġwar": 997, | |
"Ġwebsite": 998, | |
"Ġstar": 999 | |
} |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment