105 lines
		
	
	
		
			No EOL
		
	
	
		
			1,007 B
		
	
	
	
		
			Clojure
		
	
	
	
	
	
			
		
		
	
	
			105 lines
		
	
	
		
			No EOL
		
	
	
		
			1,007 B
		
	
	
	
		
			Clojure
		
	
	
	
	
	
;; List of English-language words (stop words) that should not be indexed.
 | 
						|
;; Taken from the first hundred words in [Peter Norvig's analysis of the
 | 
						|
;; frequency of English words](https://norvig.com/ngrams/count_1w.txt);
 | 
						|
;; I've then commented out from the list those words which, although
 | 
						|
;; common, I think it may be reasonable for people to search for.
 | 
						|
;; Stop-word vector. Every active entry is a lower-case string literal;
;; entries written as `;; "word"` are disabled, so they are NOT part of the
;; vector and are therefore not excluded from indexing.
;; NOTE(review): the single-letter entries ("c", "e", "s", "x") are presumably
;; tokenisation residue in the source corpus -- confirm they should stay.
;; NOTE(review): no upper-case variants appear here, so the consumer
;; presumably lower-cases tokens before comparing -- verify against the caller.
["the"
 | 
						|
"of"
 | 
						|
"and"
 | 
						|
"to"
 | 
						|
"a"
 | 
						|
"in"
 | 
						|
"for"
 | 
						|
"is"
 | 
						|
"on"
 | 
						|
"that"
 | 
						|
"by"
 | 
						|
"this"
 | 
						|
"with"
 | 
						|
"i"
 | 
						|
"you"
 | 
						|
"it"
 | 
						|
"not"
 | 
						|
"or"
 | 
						|
"be"
 | 
						|
"are"
 | 
						|
"from"
 | 
						|
"at"
 | 
						|
"as"
 | 
						|
"your"
 | 
						|
"all"
 | 
						|
"have"
 | 
						|
"new"
 | 
						|
"more"
 | 
						|
"an"
 | 
						|
"was"
 | 
						|
"we"
 | 
						|
"will"
 | 
						|
"home"
 | 
						|
"can"
 | 
						|
"us"
 | 
						|
"about"
 | 
						|
"if"
 | 
						|
"page"
 | 
						|
"my"
 | 
						|
"has"
 | 
						|
"search"
 | 
						|
"free"
 | 
						|
"but"
 | 
						|
"our"
 | 
						|
"one"
 | 
						|
"other"
 | 
						|
"do"
 | 
						|
"no"
 | 
						|
;; "information"
 | 
						|
"time"
 | 
						|
"they"
 | 
						|
"site"
 | 
						|
"he"
 | 
						|
"up"
 | 
						|
"may"
 | 
						|
"what"
 | 
						|
"which"
 | 
						|
"their"
 | 
						|
"news"
 | 
						|
"out"
 | 
						|
"use"
 | 
						|
"any"
 | 
						|
"there"
 | 
						|
"see"
 | 
						|
"only"
 | 
						|
"so"
 | 
						|
"his"
 | 
						|
"when"
 | 
						|
;; "contact"
 | 
						|
"here"
 | 
						|
;; "business"
 | 
						|
"who"
 | 
						|
"web"
 | 
						|
"also"
 | 
						|
"now"
 | 
						|
;; "help"
 | 
						|
"get"
 | 
						|
"pm"
 | 
						|
"view"
 | 
						|
;; "online"
 | 
						|
"c"
 | 
						|
"e"
 | 
						|
"first"
 | 
						|
"am"
 | 
						|
"been"
 | 
						|
"would"
 | 
						|
"how"
 | 
						|
"were"
 | 
						|
"me"
 | 
						|
"s"
 | 
						|
;; "services"
 | 
						|
"some"
 | 
						|
"these"
 | 
						|
"click"
 | 
						|
"its"
 | 
						|
"like"
 | 
						|
;; "service"
 | 
						|
"x"
 | 
						|
"than"
 | 
						|
"find"] |