changing shit. and refactoring

zstumgoren · zstumgoren · commit d37c99a675a6 · 2014-02-13T23:17:15.000-08:00
diff --git a/elex1/election_results.py b/elex1/election_results.py
@@ -18,12 +18,12 @@
 import urllib
 from operator import itemgetter
 from collections import defaultdict
-from os.path import abspath, dirname, join
+from os.path import dirname, join
 
 
 # Download CSV of fake Virginia election results to root of project
 url = "https://docs.google.com/spreadsheet/pub?key=0AhhC0IWaObRqdGFkUW1kUmp2ZlZjUjdTYV9lNFJ5RHc&output=csv"
-filename = join(dirname(dirname(abspath(__file__))), 'fake_va_elec_results.csv')
+filename = join(dirname(dirname(__file__)), 'fake_va_elec_results.csv')
 urllib.urlretrieve(url, filename)
 
 # Create reader for ingesting CSV as array of dicts
@@ -40,10 +40,13 @@
     # Convert total votes to an integer
     row['votes'] = int(row['votes'])
 
-    # Store county-level results by office/district pair, then by candidate party and raw name
-    race_key = (row['office'], row['district'])
+    # Store county-level results by slugified office and district (if there is one), 
+    # then by candidate party and raw name
+    race_key = row['office']
+    if row['district']:
+            race_key += "-%s" % row['district']
     # Create unique candidate key from party and name, in case multiple candidates have same
-    cand_key = (row['party'], row['candidate'])
+    cand_key = "-".join((row['party'], row['candidate']))
     # Below, setdefault initializes empty dict and list for the respective keys if they don't already exist.
     race = results[race_key]
     race.setdefault(cand_key, []).append(row)
@@ -94,7 +97,7 @@
 
 
 # Write CSV of results
-outfile = join(dirname(abspath(__file__)), 'summary_results.csv')
+outfile = join(dirname(__file__), 'summary_results.csv')
 with open(outfile, 'wb') as fh:
     # We'll limit the output to cleanly parsed, standardized values
     fieldnames = [
diff --git a/elex2/election_results.py b/elex2/election_results.py
@@ -15,12 +15,12 @@
 import urllib
 from operator import itemgetter
 from collections import defaultdict
-from os.path import abspath, dirname, join
+from os.path import dirname, join
 
 
 def main():
     # Download CSV of fake Virginia election results to root of project
-    path = join(dirname(dirname(abspath(__file__))), 'fake_va_elec_results.csv')
+    path = join(dirname(dirname(__file__)), 'fake_va_elec_results.csv')
     download_results(path)
     # Process data
     results = parse_and_clean(path)
@@ -60,10 +60,13 @@ def parse_and_clean(path):
         # Convert total votes to an integer
         row['votes'] = int(row['votes'])
 
-        # Store county-level results by office/district pair, then by candidate party and raw name
-        race_key = (row['office'], row['district'])
+        # Store county-level results by slugified office and district (if there is one), 
+        # then by candidate party and raw name
+        race_key = row['office'] 
+        if row['district']:
+            race_key += "-%s" % row['district']
         # Create unique candidate key from party and name, in case multiple candidates have same
-        cand_key = (row['party'], row['candidate'])
+        cand_key = "-".join((row['party'], row['candidate']))
         # Below, setdefault initializes empty dict and list for the respective keys if they don't already exist.
         race = results[race_key]
         race.setdefault(cand_key, []).append(row)
@@ -131,7 +134,7 @@ def write_csv(summary):
     as this module.
 
     """
-    outfile = join(dirname(abspath(__file__)), 'summary_results.csv')
+    outfile = join(dirname((__file__)), 'summary_results.csv')
     with open(outfile, 'wb') as fh:
         # Limit output to cleanly parsed, standardized values
         fieldnames = [
diff --git a/elex2/tests/__init__.py b/elex2/tests/__init__.py
diff --git a/elex2/tests/sample_results.csv b/elex2/tests/sample_results.csv
@@ -0,0 +1,5 @@
+date,office,district,county,candidate,party,votes
+2012-11-06,President,,Some County,"Smith, Joe",GOP,10
+2012-11-06,President,,Some County,"Doe, Jane",DEM,11
+2012-11-06,President,,Another County,"Smith, Joe",GOP,5
+2012-11-06,President,,Another County,"Doe, Jane",DEM,5
diff --git a/elex2/tests/sample_results_parsed.json b/elex2/tests/sample_results_parsed.json
@@ -0,0 +1,52 @@
+{
+    "President": {
+        "DEM-Doe, Jane": [
+            {
+                "candidate": "Doe, Jane", 
+                "county": "Some County", 
+                "date": "2012-11-06", 
+                "district": "", 
+                "first_name": "Jane", 
+                "last_name": "Doe", 
+                "office": "President", 
+                "party": "DEM", 
+                "votes": 11
+            }, 
+            {
+                "candidate": "Doe, Jane", 
+                "county": "Another County", 
+                "date": "2012-11-06", 
+                "district": "", 
+                "first_name": "Jane", 
+                "last_name": "Doe", 
+                "office": "President", 
+                "party": "DEM", 
+                "votes": 5
+            }
+        ], 
+        "GOP-Smith, Joe": [
+            {
+                "candidate": "Smith, Joe", 
+                "county": "Some County", 
+                "date": "2012-11-06", 
+                "district": "", 
+                "first_name": "Joe", 
+                "last_name": "Smith", 
+                "office": "President", 
+                "party": "GOP", 
+                "votes": 10
+            }, 
+            {
+                "candidate": "Smith, Joe", 
+                "county": "Another County", 
+                "date": "2012-11-06", 
+                "district": "", 
+                "first_name": "Joe", 
+                "last_name": "Smith", 
+                "office": "President", 
+                "party": "GOP", 
+                "votes": 5
+            }
+        ]
+    }
+}
diff --git a/elex2/tests/sample_results_parsed_tie_race.json b/elex2/tests/sample_results_parsed_tie_race.json
@@ -0,0 +1,52 @@
+{
+    "President": {
+        "DEM-Doe, Jane": [
+            {
+                "candidate": "Doe, Jane", 
+                "county": "Some County", 
+                "date": "2012-11-06", 
+                "district": "", 
+                "first_name": "Jane", 
+                "last_name": "Doe", 
+                "office": "President", 
+                "party": "DEM", 
+                "votes": 10
+            }, 
+            {
+                "candidate": "Doe, Jane", 
+                "county": "Another County", 
+                "date": "2012-11-06", 
+                "district": "", 
+                "first_name": "Jane", 
+                "last_name": "Doe", 
+                "office": "President", 
+                "party": "DEM", 
+                "votes": 5
+            }
+        ], 
+        "GOP-Smith, Joe": [
+            {
+                "candidate": "Smith, Joe", 
+                "county": "Some County", 
+                "date": "2012-11-06", 
+                "district": "", 
+                "first_name": "Joe", 
+                "last_name": "Smith", 
+                "office": "President", 
+                "party": "GOP", 
+                "votes": 10
+            }, 
+            {
+                "candidate": "Smith, Joe", 
+                "county": "Another County", 
+                "date": "2012-11-06", 
+                "district": "", 
+                "first_name": "Joe", 
+                "last_name": "Smith", 
+                "office": "President", 
+                "party": "GOP", 
+                "votes": 5
+            }
+        ]
+    }
+}
diff --git a/elex2/tests/test_parser.py b/elex2/tests/test_parser.py
@@ -1,29 +1,20 @@
+from os.path import dirname, join
 from unittest import TestCase
 
-from .election_results import clean_office, clean_party, percent
+from elex2.election_results import parse_and_clean
 
 
 class TestDataCleaners(TestCase):
 
-    def test_clean_office_rep(self):
-        self.assertEquals(clean_office('U.S. Rep - 1'), ('U.S. House of Representatives', 1))
-
-    def test_clean_office_other(self):
-        self.assertEquals(clean_office('U.S. Senate'), ('U.S. Senate', ''))
-
-    def test_clean_party_gop(self):
-        self.assertEquals(clean_party('GOP'), 'REP')
-
-    def test_clean_party_dem(self):
-        self.assertEquals(clean_party('Democratic'), 'DEM')
-
-    def test_clean_party_others(self):
-        self.assertEquals(clean_party('Green'), 'GREEN')
-
-
-
-class TestPercentFunc(TestCase):
-
-    def test_percent(self):
-        "test_percent returns percentage as string"
-        self.assertEquals(percent(50, 100), '50')
+class TestParser(TestCase):
+
+    def test_name_parsing(self):
+        "Parser should split full candidate name into first and last names"
+        path = join(dirname(__file__), 'sample_results.csv')
+        results = parse_and_clean(path)
+        race_key = 'President'
+        cand_key = 'GOP-Smith, Joe'
+        # Get one county result
+        smith = results[race_key][cand_key][0]
+        self.assertEqual(smith['first_name'], 'Joe')
+        self.assertEqual(smith['last_name'], 'Smith')
diff --git a/elex2/tests/test_summary.py b/elex2/tests/test_summary.py
@@ -0,0 +1,66 @@
+from os.path import dirname, join
+from unittest import TestCase
+import json
+
+from elex2.election_results import summarize
+
+
+class TestSummaryResults(TestCase):
+
+    # Read the results of the parse_and_clean function stored in a test fixture
+    json_file = open(join(dirname(__file__), 'sample_results_parsed.json'), 'rb')
+    SAMPLE_RESULTS = json.load(json_file)
+    # Q: Why aren't we just using the parse_and_clean method instead of
+    # using a snapshot of that function's output?
+    # A: To achieve better test isolation!
+    
+    # Q: Why aren't we reading in the JSON in a setUp method?
+    # A: setUp is called before each test method. A class attribute ensures we only
+    # incur the overhead of reading in the JSON once. In python2.7 or newer,
+    # you should use the setUpClass method instead of a class attribute.
+    # http://docs.python.org/2/library/unittest.html#unittest.TestCase.setUpClass
+
+    # We will, however, use the setUp method to call the summarize
+    # function afresh before each of our test methods.
+    def setUp(self):
+        results = summarize(self.SAMPLE_RESULTS)
+        self.race = results['President']
+
+    def test_racewide_vote_total(self):
+        "Summary results should be annotated with total votes cast in race"
+        self.assertEqual(self.race['all_votes'], 31)
+
+    def test_candiate_vote_totals(self):
+        "Summary candidates should reflect total votes from all counties"
+        # Loop through candidates and find Smith rather than relying on
+        # default sorting of candidates, which would make this test brittle if
+        # the implementation changed.
+        smith = [cand for cand in self.race['candidates'] if cand['last_name'] == 'Smith'][0]
+        self.assertEqual(smith['votes'], 15)
+
+    def test_winner_has_flag(self):
+        "Winner flag should be assigned to candidates with most votes"
+        doe = [cand for cand in self.race['candidates'] if cand['last_name'] == 'Doe'][0]
+        self.assertEqual(doe['winner'], 'X')
+
+    def test_loser_has_no_winner_flag(self):
+        "Winner flag should be not be assigned to candidate with that does not have highest vote total"
+        smith = [cand for cand in self.race['candidates'] if cand['last_name'] == 'Smith'][0]
+        self.assertEqual(smith['winner'], '')
+
+
+class TestTieRace(TestCase):
+
+    # Q: Why do we need a new class and fixture for this race?
+    # A: So that we can change the vote counts so that we have a tie, of course!
+    # We don't *need* a new test class, but hey, why not?
+    json_file = open(join(dirname(__file__), 'sample_results_parsed_tie_race.json'), 'rb')
+    SAMPLE_RESULTS = json.load(json_file)
+
+    def test_tie_race_winner_flags(self):
+        "Winner flag should not be assigned to any candidate in a tie race"
+        pass
+        results = summarize(self.SAMPLE_RESULTS)
+        race = results['President']
+        for cand in race['candidates']:
+            self.assertEqual(cand['winner'], '')