Massive renaming!
This commit is contained in:
12
05-cookbook/README.md
Normal file
12
05-cookbook/README.md
Normal file
@@ -0,0 +1,12 @@
Style #4
==============================

Constraints:

- Larger problem decomposed in procedural abstractions
- Larger problem solved as a sequence of commands, each corresponding to a procedure

Possible names:

- Cookbook
- Procedural
87
05-cookbook/tf-05.py
Executable file
87
05-cookbook/tf-05.py
Executable file
@@ -0,0 +1,87 @@
|
||||
#!/usr/bin/env python
import sys, string

# The shared mutable data: every procedure below reads and/or updates
# these module-level variables instead of passing values around
# (the "cookbook" style constraint).
data = []        # all characters of the input file
words = []       # words extracted from data
word_freqs = []  # [word, count] pairs, one per distinct word

#
# The procedures
#
|
||||
def read_file(path_to_file):
    """
    Read the whole file at path_to_file and append its characters
    to the global variable data.
    """
    global data
    with open(path_to_file) as f:
        contents = f.read()
    data = data + list(contents)
|
||||
|
||||
def filter_chars_and_normalize():
    """
    Normalize the global data in place: alphanumeric characters are
    lower-cased, everything else becomes a single space.
    """
    global data
    for i, c in enumerate(data):
        data[i] = c.lower() if c.isalnum() else ' '
|
||||
|
||||
def scan():
    """
    Split the character stream in the global data into words and
    append them to the global words list.
    """
    global data, words
    words = words + ''.join(data).split()
|
||||
|
||||
def remove_stop_words():
    """
    Remove stop words (and all single-letter words) from the global
    words list, in place, preserving the order of the survivors.
    """
    global words
    with open('../stop_words.txt') as f:
        stop_words = f.read().split(',')
    # add single-letter words
    stop_words.extend(list(string.ascii_lowercase))
    # A set gives O(1) membership tests; the original tested against a
    # list (O(m) per word) and then deleted matches with reversed pops
    # (O(n) each) — accidentally quadratic on large inputs.
    stop_set = set(stop_words)
    # Slice-assign so the same list object is filtered in place.
    words[:] = [w for w in words if w not in stop_set]
|
||||
|
||||
def frequencies():
    """
    Count word occurrences: for each word in the global words list,
    increment its [word, count] pair in the global word_freqs list,
    appending a new pair (count 1) for first-seen words.

    The original rebuilt the list of known words from word_freqs on
    every iteration, making the loop quadratic; a dict mapping each
    word to its (shared, mutable) pair makes it linear while keeping
    the exact same output: first-seen order, appended in place.
    """
    global words, word_freqs
    index = {pair[0]: pair for pair in word_freqs}
    for w in words:
        if w in index:
            index[w][1] += 1
        else:
            pair = [w, 1]
            word_freqs.append(pair)
            index[w] = pair
|
||||
|
||||
def sort():
    """
    Reorder the global word_freqs in place, most frequent first.
    """
    global word_freqs
    # Negating the count sorts descending; the sort is stable, so
    # ties keep their first-seen order, exactly as reverse=True did.
    word_freqs.sort(key=lambda pair: -pair[1])
|
||||
|
||||
|
||||
#
# The main function
#
def main():
    """
    Run the whole pipeline on the file named on the command line,
    then print the 25 most frequent words.
    """
    read_file(sys.argv[1])
    filter_chars_and_normalize()
    scan()
    remove_stop_words()
    frequencies()
    sort()

    for tf in word_freqs[0:25]:
        print(tf[0], ' - ', tf[1])


# Guard the entry point so importing this module (e.g. from tests or
# tooling) no longer runs the pipeline as a side effect; behavior when
# executed as a script is unchanged.
if __name__ == "__main__":
    main()
|
||||
Reference in New Issue
Block a user