2019-03-26 21:51:28 +00:00
|
|
|
package tldr
|
|
|
|
|
2019-03-28 21:38:04 +00:00
|
|
|
// THESE_ARE_NOT_THE_WORDS_YOU_ARE_LOOKING_FOR is a list of English stop words
// (pronouns, auxiliaries, prepositions, contractions and contraction
// fragments such as "don" / "don't"). The entries were copied from the NLTK
// stopwords list at some unspecified point in time, so they may differ from
// the current upstream list.
//
// All entries are lower case and the original ordering is preserved.
//
// NOTE(review): the identifier does not follow Go's MixedCaps convention; it
// is kept unchanged because it is exported and other files may reference it.
var THESE_ARE_NOT_THE_WORDS_YOU_ARE_LOOKING_FOR = []string{
	"i",
	"me",
	"my",
	"myself",
	"we",
	"our",
	"ours",
	"ourselves",
	"you",
	"you're",
	"you've",
	"you'll",
	"you'd",
	"your",
	"yours",
	"yourself",
	"yourselves",
	"he",
	"him",
	"his",
	"himself",
	"she",
	"she's",
	"her",
	"hers",
	"herself",
	"it",
	"it's",
	"its",
	"itself",
	"they",
	"them",
	"their",
	"theirs",
	"themselves",
	"what",
	"which",
	"who",
	"whom",
	"this",
	"that",
	"that'll",
	"these",
	"those",
	"am",
	"is",
	"are",
	"was",
	"were",
	"be",
	"been",
	"being",
	"have",
	"has",
	"had",
	"having",
	"do",
	"does",
	"did",
	"doing",
	"a",
	"an",
	"the",
	"and",
	"but",
	"if",
	"or",
	"because",
	"as",
	"until",
	"while",
	"of",
	"at",
	"by",
	"for",
	"with",
	"about",
	"against",
	"between",
	"into",
	"through",
	"during",
	"before",
	"after",
	"above",
	"below",
	"to",
	"from",
	"up",
	"down",
	"in",
	"out",
	"on",
	"off",
	"over",
	"under",
	"again",
	"further",
	"then",
	"once",
	"here",
	"there",
	"when",
	"where",
	"why",
	"how",
	"all",
	"any",
	"both",
	"each",
	"few",
	"more",
	"most",
	"other",
	"some",
	"such",
	"no",
	"nor",
	"not",
	"only",
	"own",
	"same",
	"so",
	"than",
	"too",
	"very",
	"s",
	"t",
	"can",
	"will",
	"just",
	"don",
	"don't",
	"should",
	"should've",
	"now",
	"d",
	"ll",
	"m",
	"o",
	"re",
	"ve",
	"y",
	"ain",
	"aren",
	"aren't",
	"couldn",
	"couldn't",
	"didn",
	"didn't",
	"doesn",
	"doesn't",
	"hadn",
	"hadn't",
	"hasn",
	"hasn't",
	"haven",
	"haven't",
	"isn",
	"isn't",
	"ma",
	"mightn",
	"mightn't",
	"mustn",
	"mustn't",
	"needn",
	"needn't",
	"shan",
	"shan't",
	"shouldn",
	"shouldn't",
	"wasn",
	"wasn't",
	"weren",
	"weren't",
	"won",
	"won't",
	"wouldn",
	"wouldn't",
}
|