Created
May 13, 2015 15:08
-
-
Save Apina/655e3fa46e049a0a8dfd to your computer and use it in GitHub Desktop.
650+ English Stop Words (stopwords) in A-Z order, prepped for an array (PHP)
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
'\'tis', | |
'\'twas', | |
'a', | |
'a\'s', | |
'able', | |
'about', | |
'above', | |
'according', | |
'accordingly', | |
'across', | |
'actually', | |
'after', | |
'afterwards', | |
'again', | |
'against', | |
'ain\'t', | |
'all', | |
'allow', | |
'allows', | |
'almost', | |
'alone', | |
'along', | |
'already', | |
'also', | |
'although', | |
'always', | |
'am', | |
'among', | |
'amongst', | |
'amoungst', | |
'amount', | |
'an', | |
'and', | |
'another', | |
'any', | |
'anybody', | |
'anyhow', | |
'anyone', | |
'anything', | |
'anyway', | |
'anyways', | |
'anywhere', | |
'apart', | |
'appear', | |
'appreciate', | |
'appropriate', | |
'are', | |
'aren\'t', | |
'around', | |
'as', | |
'aside', | |
'ask', | |
'asking', | |
'associated', | |
'at', | |
'available', | |
'away', | |
'awfully', | |
'b', | |
'back', | |
'be', | |
'became', | |
'because', | |
'become', | |
'becomes', | |
'becoming', | |
'been', | |
'before', | |
'beforehand', | |
'behind', | |
'being', | |
'believe', | |
'below', | |
'beside', | |
'besides', | |
'best', | |
'better', | |
'between', | |
'beyond', | |
'bill', | |
'both', | |
'bottom', | |
'brief', | |
'but', | |
'by', | |
'c', | |
'c\'mon', | |
'c\'s', | |
'call', | |
'came', | |
'can', | |
'can\'t', | |
'cannot', | |
'cant', | |
'cause', | |
'causes', | |
'certain', | |
'certainly', | |
'changes', | |
'clearly', | |
'co', | |
'com', | |
'come', | |
'comes', | |
'computer', | |
'con', | |
'concerning', | |
'consequently', | |
'consider', | |
'considering', | |
'contain', | |
'containing', | |
'contains', | |
'corresponding', | |
'could', | |
'could\'ve', | |
'couldn\'t', | |
'couldnt', | |
'course', | |
'cry', | |
'currently', | |
'd', | |
'de', | |
'dear', | |
'definitely', | |
'describe', | |
'described', | |
'despite', | |
'detail', | |
'did', | |
'didn\'t', | |
'different', | |
'do', | |
'does', | |
'doesn\'t', | |
'doing', | |
'don\'t', | |
'done', | |
'down', | |
'downwards', | |
'due', | |
'during', | |
'e', | |
'each', | |
'edu', | |
'eg', | |
'e.g.', | |
'eight', | |
'either', | |
'eleven', | |
'else', | |
'elsewhere', | |
'empty', | |
'enough', | |
'entirely', | |
'especially', | |
'et', | |
'etc', | |
'even', | |
'ever', | |
'every', | |
'everybody', | |
'everyone', | |
'everything', | |
'everywhere', | |
'ex', | |
'exactly', | |
'example', | |
'except', | |
'f', | |
'far', | |
'few', | |
'fifteen', | |
'fifth', | |
'fifty', | |
'fill', | |
'find', | |
'fire', | |
'first', | |
'five', | |
'followed', | |
'following', | |
'follows', | |
'for', | |
'former', | |
'formerly', | |
'forth', | |
'forty', | |
'found', | |
'four', | |
'from', | |
'front', | |
'full', | |
'further', | |
'furthermore', | |
'g', | |
'get', | |
'gets', | |
'getting', | |
'give', | |
'given', | |
'gives', | |
'go', | |
'goes', | |
'going', | |
'gone', | |
'got', | |
'gotten', | |
'greetings', | |
'h', | |
'had', | |
'hadn\'t', | |
'happens', | |
'hardly', | |
'has', | |
'hasn\'t', | |
'hasnt', | |
'have', | |
'haven\'t', | |
'having', | |
'he', | |
'he\'d', | |
'he\'ll', | |
'he\'s', | |
'hello', | |
'help', | |
'hence', | |
'her', | |
'here', | |
'here\'s', | |
'hereafter', | |
'hereby', | |
'herein', | |
'hereupon', | |
'hers', | |
'herself', | |
'hi', | |
'high', | |
'him', | |
'himself', | |
'his', | |
'hither', | |
'hopefully', | |
'how', | |
'how\'d', | |
'how\'ll', | |
'how\'s', | |
'howbeit', | |
'however', | |
'hundred', | |
'i', | |
'i\'d', | |
'i\'ll', | |
'i\'m', | |
'i\'ve', | |
'ie', | |
'if', | |
'ignored', | |
'immediate', | |
'in', | |
'inasmuch', | |
'inc', | |
'indeed', | |
'indicate', | |
'indicated', | |
'indicates', | |
'inner', | |
'insofar', | |
'instead', | |
'interest', | |
'into', | |
'inward', | |
'is', | |
'isn\'t', | |
'it', | |
'it\'d', | |
'it\'ll', | |
'it\'s', | |
'its', | |
'itself', | |
'j', | |
'just', | |
'k', | |
'keep', | |
'keeps', | |
'kept', | |
'know', | |
'known', | |
'knows', | |
'l', | |
'last', | |
'lately', | |
'later', | |
'latter', | |
'latterly', | |
'least', | |
'less', | |
'lest', | |
'let', | |
'let\'s', | |
'like', | |
'liked', | |
'likely', | |
'little', | |
'long', | |
'look', | |
'looking', | |
'looks', | |
'ltd', | |
'm', | |
'made', | |
'mainly', | |
'make', | |
'many', | |
'may', | |
'maybe', | |
'me', | |
'mean', | |
'meanwhile', | |
'merely', | |
'might', | |
'might\'ve', | |
'mightn\'t', | |
'mill', | |
'mine', | |
'more', | |
'moreover', | |
'most', | |
'mostly', | |
'move', | |
'much', | |
'must', | |
'must\'ve', | |
'mustn\'t', | |
'my', | |
'myself', | |
'n', | |
'name', | |
'namely', | |
'nd', | |
'near', | |
'nearly', | |
'necessary', | |
'need', | |
'needs', | |
'neither', | |
'never', | |
'nevertheless', | |
'new', | |
'next', | |
'nine', | |
'no', | |
'nobody', | |
'non', | |
'none', | |
'noone', | |
'nor', | |
'normally', | |
'not', | |
'nothing', | |
'novel', | |
'now', | |
'nowhere', | |
'o', | |
'obviously', | |
'of', | |
'off', | |
'often', | |
'oh', | |
'ok', | |
'okay', | |
'old', | |
'on', | |
'once', | |
'one', | |
'ones', | |
'only', | |
'onto', | |
'or', | |
'other', | |
'others', | |
'otherwise', | |
'ought', | |
'our', | |
'ours', | |
'ourselves', | |
'out', | |
'outside', | |
'over', | |
'overall', | |
'own', | |
'p', | |
'part', | |
'particular', | |
'particularly', | |
'per', | |
'perhaps', | |
'placed', | |
'please', | |
'plus', | |
'possible', | |
'presumably', | |
'probably', | |
'provides', | |
'put', | |
'q', | |
'que', | |
'quite', | |
'qv', | |
'r', | |
'rather', | |
'rd', | |
're', | |
'really', | |
'reasonably', | |
'regarding', | |
'regardless', | |
'regards', | |
'relatively', | |
'respectively', | |
'right', | |
's', | |
'said', | |
'same', | |
'saw', | |
'say', | |
'saying', | |
'says', | |
'second', | |
'secondly', | |
'see', | |
'seeing', | |
'seem', | |
'seemed', | |
'seeming', | |
'seems', | |
'seen', | |
'self', | |
'selves', | |
'sensible', | |
'sent', | |
'serious', | |
'seriously', | |
'seven', | |
'several', | |
'shall', | |
'shan\'t', | |
'she', | |
'she\'d', | |
'she\'ll', | |
'she\'s', | |
'should', | |
'should\'ve', | |
'shouldn\'t', | |
'show', | |
'side', | |
'since', | |
'sincere', | |
'six', | |
'sixty', | |
'so', | |
'some', | |
'somebody', | |
'somehow', | |
'someone', | |
'something', | |
'sometime', | |
'sometimes', | |
'somewhat', | |
'somewhere', | |
'soon', | |
'sorry', | |
'specified', | |
'specify', | |
'specifying', | |
'still', | |
'sub', | |
'such', | |
'sup', | |
'sure', | |
'system', | |
't', | |
't\'s', | |
'take', | |
'taken', | |
'tell', | |
'ten', | |
'tends', | |
'th', | |
'than', | |
'thank', | |
'thanks', | |
'thanx', | |
'that', | |
'that\'ll', | |
'that\'s', | |
'thats', | |
'the', | |
'their', | |
'theirs', | |
'them', | |
'themselves', | |
'then', | |
'thence', | |
'there', | |
'there\'s', | |
'thereafter', | |
'thereby', | |
'therefore', | |
'therein', | |
'theres', | |
'thereupon', | |
'these', | |
'they', | |
'they\'d', | |
'they\'ll', | |
'they\'re', | |
'they\'ve', | |
'thick', | |
'thin', | |
'think', | |
'third', | |
'this', | |
'thorough', | |
'thoroughly', | |
'those', | |
'though', | |
'three', | |
'through', | |
'throughout', | |
'thru', | |
'thus', | |
'tis', | |
'to', | |
'together', | |
'too', | |
'took', | |
'top', | |
'toward', | |
'towards', | |
'tried', | |
'tries', | |
'truly', | |
'try', | |
'trying', | |
'twas', | |
'twelve', | |
'twenty', | |
'twice', | |
'two', | |
'u', | |
'un', | |
'under', | |
'unfortunately', | |
'unless', | |
'unlikely', | |
'until', | |
'unto', | |
'up', | |
'upon', | |
'us', | |
'use', | |
'used', | |
'useful', | |
'uses', | |
'using', | |
'usually', | |
'uucp', | |
'v', | |
'value', | |
'various', | |
'very', | |
'via', | |
'viz', | |
'vs', | |
'w', | |
'want', | |
'wants', | |
'was', | |
'wasn\'t', | |
'way', | |
'we', | |
'we\'d', | |
'we\'ll', | |
'we\'re', | |
'we\'ve', | |
'welcome', | |
'well', | |
'went', | |
'were', | |
'weren\'t', | |
'what', | |
'what\'d', | |
'what\'s', | |
'whatever', | |
'when', | |
'when\'d', | |
'when\'ll', | |
'when\'s', | |
'whence', | |
'whenever', | |
'where', | |
'where\'d', | |
'where\'ll', | |
'where\'s', | |
'whereafter', | |
'whereas', | |
'whereby', | |
'wherein', | |
'whereupon', | |
'wherever', | |
'whether', | |
'which', | |
'while', | |
'whither', | |
'who', | |
'who\'d', | |
'who\'ll', | |
'who\'s', | |
'whoever', | |
'whole', | |
'whom', | |
'whose', | |
'why', | |
'why\'d', | |
'why\'ll', | |
'why\'s', | |
'will', | |
'willing', | |
'wish', | |
'with', | |
'within', | |
'without', | |
'won\'t', | |
'wonder', | |
'would', | |
'would\'ve', | |
'wouldn\'t', | |
'x', | |
'y', | |
'yes', | |
'yet', | |
'you', | |
'you\'d', | |
'you\'ll', | |
'you\'re', | |
'you\'ve', | |
'your', | |
'yours', | |
'yourself', | |
'yourselves', | |
'z', | |
'zero', |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment
Most of the words come from the stop-word lists collected here: http://www.docear.org/2012/09/28/list-of-6513-stop-words-for-17-languages-english-german-french-italian-and-many-others/
I've just brought them all together and added a few more.