First commit, first style.

2013-09-22 08:44:03 -07:00
parent 6dfc5e1cfe
commit 11790919d8
2 changed files with 60 additions and 0 deletions
--- a/01-monolithic/README.md
+++ b/01-monolithic/README.md
@@ -0,0 +1,11 @@
+exercises-in-programming-style
+==============================
+
+Constraints:
+
+- No abstractions
+
+Alternative names of this style:
+
+- Labyrinth
+- Brain dump
--- a/01-monolithic/tf-01.py
+++ b/01-monolithic/tf-01.py
@@ -0,0 +1,49 @@
+import sys, string
+# the global list of [word, frequency] pairs
+word_freqs = []
+# the list of stop words
+with open('../stop_words.txt') as f:
+    stop_words = f.read().split(',')
+stop_words.extend(list(string.ascii_lowercase))
+
+# iterate through the file one line at a time 
+for line in open(sys.argv[1]):
+    start_char = None
+    i = 0
+    for c in line:
+        if start_char == None:
+            if c.isalnum():
+                # We found the start of a word
+                start_char = i
+        else:
+            if not c.isalnum():
+                # We found the end of a word. Process it
+                found = False
+                word = line[start_char:i].lower()
+                # Ignore stop words
+                if word not in stop_words:
+                    pair_index = 0
+                    # Let's see if it already exists
+                    for pair in word_freqs:
+                        if word == pair[0]:
+                            pair[1] += 1
+                            found = True
+                            found_at = pair_index
+                            break
+                        pair_index += 1
+                    if not found:
+                        word_freqs.append([word, 1])
+                    elif len(word_freqs) > 1:
+                        # We may need to reorder
+                        for n in reversed(range(pair_index)):
+                            if word_freqs[pair_index][1] > word_freqs[n][1]:
+                                # swap
+                                word_freqs[n], word_freqs[pair_index] = word_freqs[pair_index], word_freqs[n]
+                                pair_index = n
+                # Let's reset
+                start_char = None
+        i += 1
+
+for tf in word_freqs[0:25]:
+    print tf[0], ' - ', tf[1]
+