Sorry, that was constructivist, even though this editor is flagging that word with red squiggles.

2013-12-01 09:48:18 -08:00
parent 6338f712a2
commit 783c4eb65a
2 changed files with 0 additions and 0 deletions
--- a/21-constructivist/README.md
+++ b/21-constructivist/README.md
@@ -0,0 +1,20 @@
+Style #21
+==============================
+
+Constraints:
+
+- Every single procedure and function checks the sanity of its
+  arguments and either returns something sensible when the arguments
+  are unreasonable or assigns them reasonable values
+
+- All code blocks check for possible errors and escape the block
+  when things go wrong, setting the state to something reasonable
+
+Possible names:
+
+- Constructive
+- Defensive
+- Hopeful
+- Shit happens, life goes on
+
+(See http://en.wikipedia.org/wiki/Constructivism_(mathematics))
--- a/21-constructivist/tf-21.py
+++ b/21-constructivist/tf-21.py
@@ -0,0 +1,72 @@
+#!/usr/bin/env python
+
+import sys, re, operator, string, inspect
+
+#
+# The functions
+#
+def extract_words(path_to_file):
+    """
+    Takes a path to a file and returns the non-stop
+    words, after properly removing nonalphanumeric chars
+    and normalizing for lower case
+    """
+    if type(path_to_file) is not str or not path_to_file:
+        return []
+
+    try:
+        with open(path_to_file) as f:
+            str_data = f.read()
+    except IOError as e:
+        print "I/O error({0}) when opening {1}: {2}".format(e.errno, path_to_file, e.strerror)
+        return []
+    
+    pattern = re.compile('[\W_]+')
+    word_list = pattern.sub(' ', str_data).lower().split()
+
+    try:
+        with open('../stop_words.txt') as f:
+            stop_words = f.read().split(',')
+    except IOError as e:
+        print "I/O error({0}) when opening ../stops_words.txt: {1}".format(e.errno, e.strerror)
+        return []
+
+    stop_words.extend(list(string.ascii_lowercase))
+    return [w for w in word_list if not w in stop_words]
+
+def frequencies(word_list):
+    """
+    Takes a list of words and returns a dictionary associating
+    words with frequencies of occurrence
+    """
+    if type(word_list) is not list or word_list == []:
+        return {}
+
+    word_freqs = {}
+    for w in word_list:
+        if w in word_freqs:
+            word_freqs[w] += 1
+        else:
+            word_freqs[w] = 1
+    return word_freqs
+
+def sort(word_freq):
+    """
+    Takes a dictionary of words and their frequencies
+    and returns a list of pairs where the entries are
+    sorted by frequency 
+    """
+    if type(word_freq) is not dict or word_freq == {}:
+        return []
+
+    return sorted(word_freq.iteritems(), key=operator.itemgetter(1), reverse=True)
+
+#
+# The main function
+#
+filename = sys.argv[1] if len(sys.argv) > 1 else "../input.txt"
+word_freqs = sort(frequencies(extract_words(filename)))
+
+for tf in word_freqs[0:25]:
+    print tf[0], ' - ', tf[1]
+