Created
May 13, 2015 15:08
-
-
Save Apina/655e3fa46e049a0a8dfd to your computer and use it in GitHub Desktop.
650+ English Stop Words (stopwords) in A-Z order, prepped for an array (PHP)
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| '\'tis', | |
| '\'twas', | |
| 'a', | |
| 'a\'s', | |
| 'able', | |
| 'about', | |
| 'above', | |
| 'according', | |
| 'accordingly', | |
| 'across', | |
| 'actually', | |
| 'after', | |
| 'afterwards', | |
| 'again', | |
| 'against', | |
| 'ain\'t', | |
| 'all', | |
| 'allow', | |
| 'allows', | |
| 'almost', | |
| 'alone', | |
| 'along', | |
| 'already', | |
| 'also', | |
| 'although', | |
| 'always', | |
| 'am', | |
| 'among', | |
| 'amongst', | |
| 'amoungst', | |
| 'amount', | |
| 'an', | |
| 'and', | |
| 'another', | |
| 'any', | |
| 'anybody', | |
| 'anyhow', | |
| 'anyone', | |
| 'anything', | |
| 'anyway', | |
| 'anyways', | |
| 'anywhere', | |
| 'apart', | |
| 'appear', | |
| 'appreciate', | |
| 'appropriate', | |
| 'are', | |
| 'aren\'t', | |
| 'around', | |
| 'as', | |
| 'aside', | |
| 'ask', | |
| 'asking', | |
| 'associated', | |
| 'at', | |
| 'available', | |
| 'away', | |
| 'awfully', | |
| 'b', | |
| 'back', | |
| 'be', | |
| 'became', | |
| 'because', | |
| 'become', | |
| 'becomes', | |
| 'becoming', | |
| 'been', | |
| 'before', | |
| 'beforehand', | |
| 'behind', | |
| 'being', | |
| 'believe', | |
| 'below', | |
| 'beside', | |
| 'besides', | |
| 'best', | |
| 'better', | |
| 'between', | |
| 'beyond', | |
| 'bill', | |
| 'both', | |
| 'bottom', | |
| 'brief', | |
| 'but', | |
| 'by', | |
| 'c', | |
| 'c\'mon', | |
| 'c\'s', | |
| 'call', | |
| 'came', | |
| 'can', | |
| 'can\'t', | |
| 'cannot', | |
| 'cant', | |
| 'cause', | |
| 'causes', | |
| 'certain', | |
| 'certainly', | |
| 'changes', | |
| 'clearly', | |
| 'co', | |
| 'com', | |
| 'come', | |
| 'comes', | |
| 'computer', | |
| 'con', | |
| 'concerning', | |
| 'consequently', | |
| 'consider', | |
| 'considering', | |
| 'contain', | |
| 'containing', | |
| 'contains', | |
| 'corresponding', | |
| 'could', | |
| 'could\'ve', | |
| 'couldn\'t', | |
| 'couldnt', | |
| 'course', | |
| 'cry', | |
| 'currently', | |
| 'd', | |
| 'de', | |
| 'dear', | |
| 'definitely', | |
| 'describe', | |
| 'described', | |
| 'despite', | |
| 'detail', | |
| 'did', | |
| 'didn\'t', | |
| 'different', | |
| 'do', | |
| 'does', | |
| 'doesn\'t', | |
| 'doing', | |
| 'don\'t', | |
| 'done', | |
| 'down', | |
| 'downwards', | |
| 'due', | |
| 'during', | |
| 'e', | |
| 'each', | |
| 'edu', | |
| 'eg', | |
| 'e.g.', | |
| 'eight', | |
| 'either', | |
| 'eleven', | |
| 'else', | |
| 'elsewhere', | |
| 'empty', | |
| 'enough', | |
| 'entirely', | |
| 'especially', | |
| 'et', | |
| 'etc', | |
| 'even', | |
| 'ever', | |
| 'every', | |
| 'everybody', | |
| 'everyone', | |
| 'everything', | |
| 'everywhere', | |
| 'ex', | |
| 'exactly', | |
| 'example', | |
| 'except', | |
| 'f', | |
| 'far', | |
| 'few', | |
| 'fifteen', | |
| 'fifth', | |
| 'fifty', | |
| 'fill', | |
| 'find', | |
| 'fire', | |
| 'first', | |
| 'five', | |
| 'followed', | |
| 'following', | |
| 'follows', | |
| 'for', | |
| 'former', | |
| 'formerly', | |
| 'forth', | |
| 'forty', | |
| 'found', | |
| 'four', | |
| 'from', | |
| 'front', | |
| 'full', | |
| 'further', | |
| 'furthermore', | |
| 'g', | |
| 'get', | |
| 'gets', | |
| 'getting', | |
| 'give', | |
| 'given', | |
| 'gives', | |
| 'go', | |
| 'goes', | |
| 'going', | |
| 'gone', | |
| 'got', | |
| 'gotten', | |
| 'greetings', | |
| 'h', | |
| 'had', | |
| 'hadn\'t', | |
| 'happens', | |
| 'hardly', | |
| 'has', | |
| 'hasn\'t', | |
| 'hasnt', | |
| 'have', | |
| 'haven\'t', | |
| 'having', | |
| 'he', | |
| 'he\'d', | |
| 'he\'ll', | |
| 'he\'s', | |
| 'hello', | |
| 'help', | |
| 'hence', | |
| 'her', | |
| 'here', | |
| 'here\'s', | |
| 'hereafter', | |
| 'hereby', | |
| 'herein', | |
| 'hereupon', | |
| 'hers', | |
| 'herself', | |
| 'hi', | |
| 'high', | |
| 'him', | |
| 'himself', | |
| 'his', | |
| 'hither', | |
| 'hopefully', | |
| 'how', | |
| 'how\'d', | |
| 'how\'ll', | |
| 'how\'s', | |
| 'howbeit', | |
| 'however', | |
| 'hundred', | |
| 'i', | |
| 'i\'d', | |
| 'i\'ll', | |
| 'i\'m', | |
| 'i\'ve', | |
| 'ie', | |
| 'if', | |
| 'ignored', | |
| 'immediate', | |
| 'in', | |
| 'inasmuch', | |
| 'inc', | |
| 'indeed', | |
| 'indicate', | |
| 'indicated', | |
| 'indicates', | |
| 'inner', | |
| 'insofar', | |
| 'instead', | |
| 'interest', | |
| 'into', | |
| 'inward', | |
| 'is', | |
| 'isn\'t', | |
| 'it', | |
| 'it\'d', | |
| 'it\'ll', | |
| 'it\'s', | |
| 'its', | |
| 'itself', | |
| 'j', | |
| 'just', | |
| 'k', | |
| 'keep', | |
| 'keeps', | |
| 'kept', | |
| 'know', | |
| 'known', | |
| 'knows', | |
| 'l', | |
| 'last', | |
| 'lately', | |
| 'later', | |
| 'latter', | |
| 'latterly', | |
| 'least', | |
| 'less', | |
| 'lest', | |
| 'let', | |
| 'let\'s', | |
| 'like', | |
| 'liked', | |
| 'likely', | |
| 'little', | |
| 'long', | |
| 'look', | |
| 'looking', | |
| 'looks', | |
| 'ltd', | |
| 'm', | |
| 'made', | |
| 'mainly', | |
| 'make', | |
| 'many', | |
| 'may', | |
| 'maybe', | |
| 'me', | |
| 'mean', | |
| 'meanwhile', | |
| 'merely', | |
| 'might', | |
| 'might\'ve', | |
| 'mightn\'t', | |
| 'mill', | |
| 'mine', | |
| 'more', | |
| 'moreover', | |
| 'most', | |
| 'mostly', | |
| 'move', | |
| 'much', | |
| 'must', | |
| 'must\'ve', | |
| 'mustn\'t', | |
| 'my', | |
| 'myself', | |
| 'n', | |
| 'name', | |
| 'namely', | |
| 'nd', | |
| 'near', | |
| 'nearly', | |
| 'necessary', | |
| 'need', | |
| 'needs', | |
| 'neither', | |
| 'never', | |
| 'nevertheless', | |
| 'new', | |
| 'next', | |
| 'nine', | |
| 'no', | |
| 'nobody', | |
| 'non', | |
| 'none', | |
| 'noone', | |
| 'nor', | |
| 'normally', | |
| 'not', | |
| 'nothing', | |
| 'novel', | |
| 'now', | |
| 'nowhere', | |
| 'o', | |
| 'obviously', | |
| 'of', | |
| 'off', | |
| 'often', | |
| 'oh', | |
| 'ok', | |
| 'okay', | |
| 'old', | |
| 'on', | |
| 'once', | |
| 'one', | |
| 'ones', | |
| 'only', | |
| 'onto', | |
| 'or', | |
| 'other', | |
| 'others', | |
| 'otherwise', | |
| 'ought', | |
| 'our', | |
| 'ours', | |
| 'ourselves', | |
| 'out', | |
| 'outside', | |
| 'over', | |
| 'overall', | |
| 'own', | |
| 'p', | |
| 'part', | |
| 'particular', | |
| 'particularly', | |
| 'per', | |
| 'perhaps', | |
| 'placed', | |
| 'please', | |
| 'plus', | |
| 'possible', | |
| 'presumably', | |
| 'probably', | |
| 'provides', | |
| 'put', | |
| 'q', | |
| 'que', | |
| 'quite', | |
| 'qv', | |
| 'r', | |
| 'rather', | |
| 'rd', | |
| 're', | |
| 'really', | |
| 'reasonably', | |
| 'regarding', | |
| 'regardless', | |
| 'regards', | |
| 'relatively', | |
| 'respectively', | |
| 'right', | |
| 's', | |
| 'said', | |
| 'same', | |
| 'saw', | |
| 'say', | |
| 'saying', | |
| 'says', | |
| 'second', | |
| 'secondly', | |
| 'see', | |
| 'seeing', | |
| 'seem', | |
| 'seemed', | |
| 'seeming', | |
| 'seems', | |
| 'seen', | |
| 'self', | |
| 'selves', | |
| 'sensible', | |
| 'sent', | |
| 'serious', | |
| 'seriously', | |
| 'seven', | |
| 'several', | |
| 'shall', | |
| 'shan\'t', | |
| 'she', | |
| 'she\'d', | |
| 'she\'ll', | |
| 'she\'s', | |
| 'should', | |
| 'should\'ve', | |
| 'shouldn\'t', | |
| 'show', | |
| 'side', | |
| 'since', | |
| 'sincere', | |
| 'six', | |
| 'sixty', | |
| 'so', | |
| 'some', | |
| 'somebody', | |
| 'somehow', | |
| 'someone', | |
| 'something', | |
| 'sometime', | |
| 'sometimes', | |
| 'somewhat', | |
| 'somewhere', | |
| 'soon', | |
| 'sorry', | |
| 'specified', | |
| 'specify', | |
| 'specifying', | |
| 'still', | |
| 'sub', | |
| 'such', | |
| 'sup', | |
| 'sure', | |
| 'system', | |
| 't', | |
| 't\'s', | |
| 'take', | |
| 'taken', | |
| 'tell', | |
| 'ten', | |
| 'tends', | |
| 'th', | |
| 'than', | |
| 'thank', | |
| 'thanks', | |
| 'thanx', | |
| 'that', | |
| 'that\'ll', | |
| 'that\'s', | |
| 'thats', | |
| 'the', | |
| 'their', | |
| 'theirs', | |
| 'them', | |
| 'themselves', | |
| 'then', | |
| 'thence', | |
| 'there', | |
| 'there\'s', | |
| 'thereafter', | |
| 'thereby', | |
| 'therefore', | |
| 'therein', | |
| 'theres', | |
| 'thereupon', | |
| 'these', | |
| 'they', | |
| 'they\'d', | |
| 'they\'ll', | |
| 'they\'re', | |
| 'they\'ve', | |
| 'thick', | |
| 'thin', | |
| 'think', | |
| 'third', | |
| 'this', | |
| 'thorough', | |
| 'thoroughly', | |
| 'those', | |
| 'though', | |
| 'three', | |
| 'through', | |
| 'throughout', | |
| 'thru', | |
| 'thus', | |
| 'tis', | |
| 'to', | |
| 'together', | |
| 'too', | |
| 'took', | |
| 'top', | |
| 'toward', | |
| 'towards', | |
| 'tried', | |
| 'tries', | |
| 'truly', | |
| 'try', | |
| 'trying', | |
| 'twas', | |
| 'twelve', | |
| 'twenty', | |
| 'twice', | |
| 'two', | |
| 'u', | |
| 'un', | |
| 'under', | |
| 'unfortunately', | |
| 'unless', | |
| 'unlikely', | |
| 'until', | |
| 'unto', | |
| 'up', | |
| 'upon', | |
| 'us', | |
| 'use', | |
| 'used', | |
| 'useful', | |
| 'uses', | |
| 'using', | |
| 'usually', | |
| 'uucp', | |
| 'v', | |
| 'value', | |
| 'various', | |
| 'very', | |
| 'via', | |
| 'viz', | |
| 'vs', | |
| 'w', | |
| 'want', | |
| 'wants', | |
| 'was', | |
| 'wasn\'t', | |
| 'way', | |
| 'we', | |
| 'we\'d', | |
| 'we\'ll', | |
| 'we\'re', | |
| 'we\'ve', | |
| 'welcome', | |
| 'well', | |
| 'went', | |
| 'were', | |
| 'weren\'t', | |
| 'what', | |
| 'what\'d', | |
| 'what\'s', | |
| 'whatever', | |
| 'when', | |
| 'when\'d', | |
| 'when\'ll', | |
| 'when\'s', | |
| 'whence', | |
| 'whenever', | |
| 'where', | |
| 'where\'d', | |
| 'where\'ll', | |
| 'where\'s', | |
| 'whereafter', | |
| 'whereas', | |
| 'whereby', | |
| 'wherein', | |
| 'whereupon', | |
| 'wherever', | |
| 'whether', | |
| 'which', | |
| 'while', | |
| 'whither', | |
| 'who', | |
| 'who\'d', | |
| 'who\'ll', | |
| 'who\'s', | |
| 'whoever', | |
| 'whole', | |
| 'whom', | |
| 'whose', | |
| 'why', | |
| 'why\'d', | |
| 'why\'ll', | |
| 'why\'s', | |
| 'will', | |
| 'willing', | |
| 'wish', | |
| 'with', | |
| 'within', | |
| 'without', | |
| 'won\'t', | |
| 'wonder', | |
| 'would', | |
| 'would\'ve', | |
| 'wouldn\'t', | |
| 'x', | |
| 'y', | |
| 'yes', | |
| 'yet', | |
| 'you', | |
| 'you\'d', | |
| 'you\'ll', | |
| 'you\'re', | |
| 'you\'ve', | |
| 'your', | |
| 'yours', | |
| 'yourself', | |
| 'yourselves', | |
| 'z', | |
| 'zero', |
Author
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment
Most of these words come from the stop-word lists collected here: http://www.docear.org/2012/09/28/list-of-6513-stop-words-for-17-languages-english-german-french-italian-and-many-others/
I've merged them into a single list and added a few more of my own.