8 lines
246 B
Python
8 lines
246 B
Python
import sys, re, string
|
|
|
|
def extract_words(path_to_file, stop_words_path='../stop_words.txt'):
    """Return the words of a text file, lowercased, with stop words removed.

    A word is a run of two or more ASCII letters; the text is lowercased
    before matching, so every returned word is lowercase. Words are returned
    in the order they occur in the file, duplicates included.

    Args:
        path_to_file: Path of the text file to read.
        stop_words_path: Path of a file holding comma-separated stop words.
            Defaults to '../stop_words.txt', resolved against the current
            working directory.

    Returns:
        A list of the words found in the file that are not stop words.

    Raises:
        OSError: If either file cannot be opened or read.
    """
    # Context managers close both files promptly, even if reading fails.
    with open(path_to_file) as text_file:
        words = re.findall(r'[a-z]{2,}', text_file.read().lower())

    with open(stop_words_path) as stop_words_file:
        # Strip each entry so that a trailing newline (or stray spaces after
        # the commas) does not keep a stop word from matching.
        stopwords = {
            entry.strip() for entry in stop_words_file.read().split(',')
        }

    return [w for w in words if w not in stopwords]
|
|
|