November 2015
Intermediate to advanced
304 pages
5h 23m
English
Chapter 12

#!/usr/bin/env python
import sys, re, operator, string

# Auxiliary functions that can't be lambdas
#
def extract_words(obj, path_to_file):
    """Load a text file and store its lowercase words in ``obj['data']``.

    The file is read in full, every run of non-word characters and
    underscores is replaced by a single space, the text is lowercased,
    and the result is split on whitespace.

    Args:
        obj: Mutable mapping that receives the word list under the
            ``'data'`` key; any previous value for that key is replaced.
        path_to_file: Path of the text file to read.

    Returns:
        None. The result is delivered by mutating ``obj``.

    Raises:
        OSError: Propagated from ``open`` if the file cannot be opened.
    """
    with open(path_to_file) as f:
        text = f.read()
    # Raw string so that \W reaches the regex engine untouched instead of
    # being treated as an (invalid) string-literal escape sequence.
    pattern = re.compile(r'[\W_]+')
    # str.split() with no arguments also discards the leading/trailing
    # spaces that the substitution can leave behind.
    obj['data'] = pattern.sub(' ', text).lower().split()