-------------------------------------------------------------------------------------------------------------------------------------- name: log: /Users/Shared/EVIC Sync Files/Data/NVRA 2010/logfiles/create_2010EAVS_A.log log type: text opened on: 8 Sep 2011, 15:23:04 . . // File creation and cleaning run for the 2010 EAC NVRA Dataset . // . // Paul Gronke, September 8, 2011 . // . // File originally downloaded from the EAC website http://www.eac.gov/registration-data/ . // Excel file was exported as tab delimited and read directly into Stata using the . // insheet command. . // . cd "/Users/Shared/EVIC Sync Files/Data/NVRA 2010/" /Users/Shared/EVIC Sync Files/Data/NVRA 2010/ . insheet using "2010EAVS_A_Final.txt" (156 vars, 4695 obs) . . // Missing Values . . mvdecode qa1a qa3a qa3b qa4a qa5? qa5_total qa6? qa6_total qa7? qa7_total, mv(-999999) qa1a: 54 missing values generated qa3a: 127 missing values generated qa3b: 419 missing values generated qa4a: 675 missing values generated qa5a: 459 missing values generated qa5b: 454 missing values generated qa5c: 2262 missing values generated qa5d: 1176 missing values generated qa5e: 1185 missing values generated qa5f: 849 missing values generated qa5g: 1572 missing values generated qa5h: 316 missing values generated qa5i: 319 missing values generated qa5j: 321 missing values generated qa5k: 321 missing values generated qa5l: 321 missing values generated qa5_total: 441 missing values generated qa6a: 995 missing values generated qa6b: 1000 missing values generated qa6c: 2186 missing values generated qa6d: 1074 missing values generated qa6e: 1222 missing values generated qa6f: 1326 missing values generated qa6g: 1254 missing values generated qa6h: 1331 missing values generated qa6i: 2096 missing values generated qa6j: 254 missing values generated qa6k: 254 missing values generated qa6l: 254 missing values generated qa6m: 254 missing values generated qa6n: 254 missing values generated qa6o: 254 missing values generated 
qa6_total: 959 missing values generated qa7a: 562 missing values generated qa7b: 573 missing values generated qa7c: 2282 missing values generated qa7d: 658 missing values generated qa7e: 805 missing values generated qa7f: 903 missing values generated qa7g: 1188 missing values generated qa7h: 896 missing values generated qa7i: 1982 missing values generated qa7j: 259 missing values generated qa7k: 258 missing values generated qa7l: 258 missing values generated qa7m: 258 missing values generated qa7n: 258 missing values generated qa7o: 258 missing values generated qa7_total: 516 missing values generated . . lab var qa1a "total registration" . lab var qa3a "active registration" . lab var qa3b "inactive registration" . lab var qa4a "same day registration" . lab var qa5a "forms: total registration forms" . lab var qa5b "forms: new valid registration" . lab var qa5c "forms new pre registrations" . lab var qa5d "forms duplicate registrations" . lab var qa5e "forms rejected registrations" . lab var qa5f "forms change to name party or address" . lab var qa5g "forms address in new jurisdiction" . lab var qa5h "forms other 1" . lab var qa5i "forms other 2" . lab var qa5j "forms other 3" . lab var qa5k "forms other 4" . lab var qa5_total "forms total all types" . lab var qa6a "forms mail, fax, email" . lab var qa6b "forms in person leo" . lab var qa6c "forms internet" . lab var qa6d "forms dmv" . lab var qa6e "forms public asst offices" . lab var qa6f "forms disability agencies" . lab var qa6g "forms armed services recruitment" . lab var qa6h "forms others agencies (not nvra)" . lab var qa6i "forms third party reg drives" . lab var qa6j "forms other sources 1" . lab var qa6k "forms other sources 2" . lab var qa6l "forms other sources 3" . lab var qa6m "forms other sources 4" . lab var qa6n "forms other sources 5" . lab var qa6o "forms other sources 6" . lab var qa6_total "forms total all sources" . lab var qa7a "new forms mail, fax, email" . 
lab var qa7b "new forms in person leo" . lab var qa7c "new forms internet" . lab var qa7d "new forms dmv" . lab var qa7e "new forms public asst offices" . lab var qa7f "new forms disability agencies" . lab var qa7g "new forms armed services recruitment" . lab var qa7h "new forms others agencies (not nvra)" . lab var qa7i "new forms third party reg drives" . lab var qa7j "new forms other sources 1" . lab var qa7k "new forms other sources 2" . lab var qa7l "new forms other sources 3" . lab var qa7m "new forms other sources 4" . lab var qa7n "new forms other sources 5" . lab var qa7o "new forms other sources 6" . lab var qa7_total "new forms total all sources" . . // total registered voters . . sum qa1a Variable | Obs Mean Std. Dev. Min Max -------------+-------------------------------------------------------- qa1a | 4625 40292.2 136063 0 4449415 . . tabstat qa1a, by(state) stat(sum count) Summary for variables: qa1a by categories of: state (State) state | sum N -------+-------------------- AK | 560146 1 AL | 2964070 67 AR | 1638135 75 AS | 16124 1 AZ | 3502743 15 CA | 1.73e+07 58 CO | 3293942 64 CT | 2150633 169 DC | 512897 1 DE | 623425 3 FL | 1.26e+07 67 GA | 5748459 159 GU | 52821 1 HI | 692745 4 IA | 2116170 99 ID | 790531 44 IL | 8542397 110 IN | 4329977 92 KS | 1725012 105 KY | 2885775 120 LA | 2935062 64 MA | 4121180 351 MD | 3468287 24 ME | 1028501 505 MI | 7276237 83 MN | 3220844 87 MO | 4137495 116 MS | 1978463 82 MT | 651335 56 NC | 6207093 100 ND | 0 0 NE | 1142247 93 NH | 945341 323 NJ | 5135830 21 NM | 1147177 33 NV | 1375848 17 NY | 1.18e+07 62 OH | 8044315 88 OK | 2082428 77 OR | 2068798 36 PA | 8220759 67 RI | 706161 39 SC | 2630363 46 SD | 575150 66 TN | 3952404 95 TX | 1.33e+07 254 UT | 1500305 29 VA | 5032135 134 VT | 439333 233 WA | 4066517 39 WI | 3709229 72 WV | 1216023 55 WY | 270083 23 -------+-------------------- Total | 1.86e+08 4625 ---------------------------- . . 
// the count statistic will provide us the number of jurisdictions used to create the . // statewide totals. this will be important to determine if the denominator problem . // crops up--that is, the EAC is reporting statistics based on a different number of . // jurisdictions . . // Total active and inactive registered voters . sum qa3a qa3b Variable | Obs Mean Std. Dev. Min Max -------------+-------------------------------------------------------- qa3a | 4538 37663.93 128142.9 0 4449415 qa3b | 3767 5512.34 41982.22 0 1648709 . . // Total by state . tabstat qa3a qa3b, by(state) stat(sum count) Summary statistics: sum, N by categories of: state (State) state | qa3a qa3b -------+-------------------- AK | 494876 65270 | 1 1 -------+-------------------- AL | 2586282 377788 | 67 67 -------+-------------------- AR | 1326681 311454 | 75 75 -------+-------------------- AS | 16124 0 | 1 0 -------+-------------------- AZ | 3146418 356325 | 15 15 -------+-------------------- CA | 1.73e+07 6367117 | 58 57 -------+-------------------- CO | 2477202 816740 | 64 64 -------+-------------------- CT | 2026874 123759 | 169 169 -------+-------------------- DC | 454695 58202 | 1 1 -------+-------------------- DE | 603456 19969 | 3 3 -------+-------------------- FL | 1.12e+07 1323288 | 67 67 -------+-------------------- GA | 5027430 721029 | 159 159 -------+-------------------- GU | 52821 0 | 1 0 -------+-------------------- HI | 605532 85213 | 4 4 -------+-------------------- IA | 1984995 131175 | 99 99 -------+-------------------- ID | 790531 0 | 44 0 -------+-------------------- IL | 7455076 1087321 | 110 110 -------+-------------------- IN | 4196884 133093 | 92 92 -------+-------------------- KS | 1580688 144324 | 105 105 -------+-------------------- KY | 2880155 144086 | 120 120 -------+-------------------- LA | 2711974 223088 | 64 64 -------+-------------------- MA | 3684321 436859 | 351 350 -------+-------------------- MD | 3468287 0 | 24 0 -------+-------------------- ME | 
984455 44046 | 505 505 -------+-------------------- MI | 7276237 0 | 83 0 -------+-------------------- MN | 3220844 0 | 87 0 -------+-------------------- MO | 3674460 463035 | 116 116 -------+-------------------- MS | 1624981 104178 | 73 54 -------+-------------------- MT | 549683 101652 | 56 56 -------+-------------------- NC | 5756403 450690 | 100 100 -------+-------------------- ND | 0 0 | 0 0 -------+-------------------- NE | 1020637 121610 | 93 93 -------+-------------------- NH | 945341 0 | 323 0 -------+-------------------- NJ | 4719468 416362 | 21 21 -------+-------------------- NM | 1066970 80207 | 33 33 -------+-------------------- NV | 1114395 256951 | 16 16 -------+-------------------- NY | 1.07e+07 1126491 | 62 62 -------+-------------------- OH | 8048315 0 | 88 0 -------+-------------------- OK | 1773975 308453 | 77 77 -------+-------------------- OR | 2068798 0 | 36 0 -------+-------------------- PA | 7499183 721573 | 67 67 -------+-------------------- RI | 647569 58592 | 39 39 -------+-------------------- SC | 2630363 327192 | 46 46 -------+-------------------- SD | 519396 55754 | 66 66 -------+-------------------- TN | 3604935 347459 | 95 95 -------+-------------------- TX | 1.14e+07 1887762 | 254 254 -------+-------------------- UT | 1338747 161558 | 29 29 -------+-------------------- VA | 4720451 311684 | 134 134 -------+-------------------- VT | 386501 28388 | 211 171 -------+-------------------- WA | 3601268 465249 | 39 39 -------+-------------------- WI | 3709229 0 | 72 72 -------+-------------------- WV | 0 0 | 0 0 -------+-------------------- WY | 270083 0 | 23 0 -------+-------------------- Total | 1.71e+08 2.08e+07 | 4538 3767 ---------------------------- . . // Data consistency check 1: Does the total registered voters = inactive + active? . . gen activeandinactive=qa3a+qa3b (928 missing values generated) . list state jurisdiction qa1a activeandinactive if qa1a>activeandinactive | qa1a<activeandinactive [... log text lost in extraction ...]>qa5a | qa5_total<qa5a [... log text lost in extraction ...] . list state jurisdiction qa5a qa5b if qa5b>qa5a & qa5b!=. & qa5a!=. 
+------------------------------------------+ | state jurisdiction qa5a qa5b | |------------------------------------------| 836. | IL Brown County 306 377 | 919. | IL Saline County 1427 1435 | 924. | IL St. Clair County 14945 14956 | 3274. | NY Clinton County 3025 3031 | 3282. | NY Fulton County 1375 2473 | |------------------------------------------| 3289. | NY Lewis County 567 1153 | 3311. | NY Schoharie County 1375 1533 | 3683. | SD BON HOMME COUNTY 0 286 | 3732. | SD POTTER COUNTY 0 111 | +------------------------------------------+ . . // OOPS! . // The plot below displays the proportion of new forms, by county, across states, and does not . // truncate at 1.0 . . gen percent_new_forms=qa5b/qa5a if qa5a!=. & qa5b!=. (610 missing values generated) . graph box percent_new_forms, over(state, label(angle(vertical) labsize(vsmall))) ytitle(Proportion of registration forms that were n > ew) /// > title(New Registration Forms) subtitle(By county within state) . graph export new_forms.png, replace (file new_forms.png written in PNG format) . . // Now let's make the same calculation for rejected forms . . list state jurisdiction qa5a qa5e if qa5e>qa5a & qa5a!=. & qa5e!=. . . // At least no counties rejected more forms than they received. One wonders how many counties reported . // on rejected forms at all however . . gen percent_rejected=qa5e/qa5a if qa5a!=. & qa5e!=. (1521 missing values generated) . graph box percent_rejected, over(state, label(angle(vertical) labsize(vsmall))) ytitle(Proportion of registration forms rejected) // > / > title(Rejected Registration Forms) subtitle(By county within state) . graph export rejected_forms.png, replace (file rejected_forms.png written in PNG format) . . 
tabstat qa5a qa5e, by(state) stat(count) Summary statistics: N by categories of: state (State) state | qa5a qa5e -------+-------------------- AK | 1 1 AL | 67 67 AR | 75 75 AS | 1 1 AZ | 15 14 CA | 57 36 CO | 64 64 CT | 169 0 DC | 1 1 DE | 3 3 FL | 67 0 GA | 159 159 GU | 0 0 HI | 4 0 IA | 99 99 ID | 44 0 IL | 109 85 IN | 92 92 KS | 105 105 KY | 120 120 LA | 64 64 MA | 351 351 MD | 24 24 ME | 505 505 MI | 83 83 MN | 87 87 MO | 116 76 MS | 62 36 MT | 56 53 NC | 100 100 ND | 0 0 NE | 93 27 NH | 0 0 NJ | 21 21 NM | 33 1 NV | 14 3 NY | 53 0 OH | 88 75 OK | 77 0 OR | 36 0 PA | 67 67 RI | 39 0 SC | 46 0 SD | 66 65 TN | 95 61 TX | 254 254 UT | 29 29 VA | 134 131 VT | 202 133 WA | 39 24 WI | 72 0 WV | 14 8 WY | 23 0 -------+-------------------- Total | 4195 3200 ---------------------------- . . // That is a bit disappointing ... . . // Final graphic just for Doug. I am going to replicate by proportion forms processed by the DMV . // Start by identifying out of bounds values . . list state jurisdiction qa5a qa6d if qa6d>qa5a & qa6d!=. & qa5a!=. +------------------------------------------------+ | state jurisdiction qa5a qa6d | |------------------------------------------------| 857. | IL Edgar County 235 1502 | 899. | IL McLean County 6223 7770 | 924. | IL St. Clair County 14945 19412 | 1025. | IN WARREN COUNTY 971 1016 | 3282. | NY Fulton County 1375 2033 | |------------------------------------------------| 3289. | NY Lewis County 567 953 | 3297. | NY Oneida County 19271 56770 | 3683. | SD BON HOMME COUNTY 0 368 | 3732. | SD POTTER COUNTY 0 26 | 4124. | VA ACCOMACK COUNTY 2593 3481 | |------------------------------------------------| 4125. | VA ALBEMARLE COUNTY 6041 9400 | 4126. | VA ALEXANDRIA CITY 11649 23696 | 4127. | VA ALLEGHANY COUNTY 789 1714 | 4128. | VA AMELIA COUNTY 478 1110 | 4129. | VA AMHERST COUNTY 1366 2761 | |------------------------------------------------| 4130. | VA APPOMATTOX COUNTY 856 1437 | 4131. | VA ARLINGTON COUNTY 16605 37098 | 4132. 
| VA AUGUSTA COUNTY 3358 6264 | 4133. | VA BATH COUNTY 244 281 | 4134. | VA BEDFORD CITY 269 813 | |------------------------------------------------| 4135. | VA BEDFORD COUNTY 3756 9047 | 4136. | VA BLAND COUNTY 331 643 | 4137. | VA BOTETOURT COUNTY 1682 3343 | 4138. | VA BRISTOL CITY 1292 2379 | 4139. | VA BRUNSWICK COUNTY 792 1069 | |------------------------------------------------| 4140. | VA BUCHANAN COUNTY 1207 1475 | 4141. | VA BUCKINGHAM COUNTY 907 1257 | 4142. | VA BUENA VISTA CITY 290 519 | 4143. | VA CAMPBELL COUNTY 2635 5473 | 4144. | VA CAROLINE COUNTY 1507 3574 | |------------------------------------------------| 4145. | VA CARROLL COUNTY 1496 2658 | 4146. | VA CHARLES CITY COUNTY 334 577 | 4147. | VA CHARLOTTE COUNTY 432 974 | 4148. | VA CHARLOTTESVILLE CITY 2583 3345 | 4149. | VA CHESAPEAKE CITY 11097 12791 | |------------------------------------------------| 4150. | VA CHESTERFIELD COUNTY 16682 43344 | 4151. | VA CLARKE COUNTY 671 1518 | 4152. | VA COLONIAL HEIGHTS CITY 781 2150 | 4153. | VA COVINGTON CITY 239 357 | 4154. | VA CRAIG COUNTY 314 598 | |------------------------------------------------| 4155. | VA CULPEPER COUNTY 1987 5899 | 4156. | VA CUMBERLAND COUNTY 351 726 | 4157. | VA DANVILLE CITY 2339 5955 | 4159. | VA DINWIDDIE COUNTY 1096 2781 | 4160. | VA EMPORIA CITY 283 857 | |------------------------------------------------| 4161. | VA ESSEX COUNTY 621 1220 | 4162. | VA FAIRFAX CITY 1355 2493 | 4163. | VA FAIRFAX COUNTY 60542 105564 | 4164. | VA FALLS CHURCH CITY 734 1080 | 4165. | VA FAUQUIER COUNTY 3659 9071 | |------------------------------------------------| 4166. | VA FLOYD COUNTY 702 1622 | 4167. | VA FLUVANNA COUNTY 1140 1987 | 4168. | VA FRANKLIN CITY 578 859 | 4169. | VA FRANKLIN COUNTY 3198 7193 | 4170. | VA FREDERICK COUNTY 5616 10620 | |------------------------------------------------| 4171. | VA FREDERICKSBURG CITY 1872 3913 | 4172. | VA GALAX CITY 251 554 | 4173. | VA GILES COUNTY 916 1640 | 4174. 
| VA GLOUCESTER COUNTY 1886 4727 | 4175. | VA GOOCHLAND COUNTY 844 1599 | |------------------------------------------------| 4176. | VA GRAYSON COUNTY 677 1081 | 4177. | VA GREENE COUNTY 990 1507 | 4178. | VA GREENSVILLE COUNTY 430 939 | 4179. | VA HALIFAX COUNTY 1677 3303 | 4180. | VA HAMPTON CITY 4767 14514 | |------------------------------------------------| 4181. | VA HANOVER COUNTY 3794 8753 | 4182. | VA HARRISONBURG CITY 1920 4719 | 4183. | VA HENRICO COUNTY 13381 39597 | 4184. | VA HENRY COUNTY 2870 5310 | 4185. | VA HIGHLAND COUNTY 100 108 | |------------------------------------------------| 4186. | VA HOPEWELL CITY 1052 2573 | 4187. | VA ISLE OF WIGHT COUNTY 2019 5063 | 4188. | VA JAMES CITY COUNTY 4433 9214 | 4189. | VA KING AND QUEEN COUNTY 259 505 | 4190. | VA KING GEORGE COUNTY 1429 2555 | |------------------------------------------------| 4191. | VA KING WILLIAM COUNTY 847 1618 | 4192. | VA LANCASTER COUNTY 552 917 | 4193. | VA LEE COUNTY 1053 2831 | 4194. | VA LEXINGTON CITY 337 528 | 4195. | VA LOUDOUN COUNTY 18751 34312 | |------------------------------------------------| 4196. | VA LOUISA COUNTY 1521 3178 | 4197. | VA LUNENBURG COUNTY 538 1055 | 4198. | VA LYNCHBURG CITY 5249 10432 | 4199. | VA MADISON COUNTY 554 1096 | 4200. | VA MANASSAS CITY 1390 3993 | |------------------------------------------------| 4201. | VA MANASSAS PARK CITY 785 1460 | 4202. | VA MARTINSVILLE CITY 834 1650 | 4203. | VA MATHEWS COUNTY 579 979 | 4204. | VA MECKLENBURG COUNTY 1497 3551 | 4205. | VA MIDDLESEX COUNTY 435 1077 | |------------------------------------------------| 4206. | VA MONTGOMERY COUNTY 5028 14186 | 4207. | VA NELSON COUNTY 553 940 | 4208. | VA NEW KENT COUNTY 942 1515 | 4209. | VA NEWPORT NEWS CITY 6730 23496 | 4210. | VA NORFOLK CITY 11537 28945 | |------------------------------------------------| 4211. | VA NORTHAMPTON COUNTY 921 945 | 4212. | VA NORTHUMBERLAND COUNTY 668 1025 | 4213. | VA NORTON CITY 210 273 | 4214. 
| VA NOTTOWAY COUNTY 822 1397 | 4215. | VA ORANGE COUNTY 1843 4123 | |------------------------------------------------| 4216. | VA PAGE COUNTY 1038 1955 | 4217. | VA PATRICK COUNTY 846 1215 | 4218. | VA PETERSBURG CITY 1639 3981 | 4219. | VA PITTSYLVANIA COUNTY 2694 7387 | 4220. | VA POQUOSON CITY 371 684 | |------------------------------------------------| 4221. | VA PORTSMOUTH CITY 3484 10917 | 4222. | VA POWHATAN COUNTY 1051 2023 | 4223. | VA PRINCE EDWARD COUNTY 1243 3211 | 4224. | VA PRINCE GEORGE COUNTY 1793 3262 | 4225. | VA PRINCE WILLIAM COUNTY 22633 47502 | |------------------------------------------------| 4226. | VA PULASKI COUNTY 1770 4517 | 4227. | VA RADFORD CITY 670 1934 | 4228. | VA RAPPAHANNOCK COUNTY 400 841 | 4229. | VA RICHMOND CITY 10576 28461 | 4230. | VA RICHMOND COUNTY 369 640 | |------------------------------------------------| 4231. | VA ROANOKE CITY 3654 16126 | 4232. | VA ROANOKE COUNTY 3952 11614 | 4233. | VA ROCKBRIDGE COUNTY 1170 2208 | 4234. | VA ROCKINGHAM COUNTY 3035 7300 | 4235. | VA RUSSELL COUNTY 1197 1486 | |------------------------------------------------| 4236. | VA SALEM CITY 1235 3167 | 4237. | VA SCOTT COUNTY 796 1503 | 4238. | VA SHENANDOAH COUNTY 2604 5660 | 4239. | VA SMYTH COUNTY 1534 3356 | 4240. | VA SOUTHAMPTON COUNTY 915 2214 | |------------------------------------------------| 4241. | VA SPOTSYLVANIA COUNTY 6367 16870 | 4242. | VA STAFFORD COUNTY 7879 17434 | 4243. | VA STAUNTON CITY 1306 3561 | 4244. | VA SUFFOLK CITY 3000 10641 | 4245. | VA SURRY COUNTY 378 627 | |------------------------------------------------| 4246. | VA SUSSEX COUNTY 588 1157 | 4247. | VA TAZEWELL COUNTY 2033 4319 | 4248. | VA VIRGINIA BEACH CITY 19646 38370 | 4249. | VA WARREN COUNTY 2239 5785 | 4250. | VA WASHINGTON COUNTY 2817 7094 | |------------------------------------------------| 4251. | VA WAYNESBORO CITY 989 2578 | 4252. | VA WESTMORELAND COUNTY 1042 1693 | 4253. | VA WILLIAMSBURG CITY 1234 1503 | 4254. 
| VA WINCHESTER CITY 1713 3600 | 4255. | VA WISE COUNTY 1152 2137 | |------------------------------------------------| 4256. | VA WYTHE COUNTY 1748 3735 | 4257. | VA YORK COUNTY 3423 6159 | +------------------------------------------------+ . . // OUCH! A lot more problems here. Duplicate forms?? . . gen percent_DMV=qa6d/qa5a if qa5a!=. & qa6d!=. (1170 missing values generated) . graph box percent_DMV, over(state, label(angle(vertical) labsize(vsmall))) ytitle(Proportion of registration forms from DMV) /// > title(Registration Forms from the DMV) subtitle(By county within state) . graph export DMV_forms.png, replace (file DMV_forms.png written in PNG format) . . // And the same graph but truncated . graph box percent_DMV if percent_DMV<=1, over(state, label(angle(vertical) labsize(vsmall))) ytitle(Proportion of registration forms > from DMV) /// > title(Registration Forms from the DMV) subtitle(By county within state) . graph export DMV_forms_1.png, replace (file DMV_forms_1.png written in PNG format) . end of do-file . log cose cose invalid r(198); . log close name: log: /Users/Shared/EVIC Sync Files/Data/NVRA 2010/logfiles/create_2010EAVS_A.log log type: text closed on: 8 Sep 2011, 15:23:24 --------------------------------------------------------------------------------------------------------------------------------------