diff --git a/.gitignore b/.gitignore index ad334de..69154a4 100644 --- a/.gitignore +++ b/.gitignore @@ -1,59 +1,42 @@ -# Byte-compiled / optimized / DLL files -__pycache__/ -*.py[cod] -db.sqlite3 -migrations/ -media/ -settings.py -# C extensions -*.so - -# Distribution / packaging -.Python -env/ -build/ -develop-eggs/ -dist/ -downloads/ -eggs/ -.eggs/ -lib64/ -parts/ -sdist/ -var/ -*.egg-info/ -.installed.cfg -*.egg - -# PyInstaller -# Usually these files are written by a python script from a template -# before PyInstaller builds the exe, so as to inject date/other infos into it. -*.manifest -*.spec - -# Installer logs -pip-log.txt -pip-delete-this-directory.txt - -# Unit test / coverage reports -htmlcov/ -.tox/ +MANIFEST +build +dist +_build +docs/man/*.gz +docs/source/api/generated +docs/source/config.rst +docs/gh-pages +notebook/i18n/*/LC_MESSAGES/*.mo +notebook/i18n/*/LC_MESSAGES/nbjs.json +notebook/static/components +notebook/static/style/*.min.css* +notebook/static/*/js/built/ +notebook/static/*/built/ +notebook/static/built/ +notebook/static/*/js/main.min.js* +notebook/static/lab/*bundle.js +node_modules +*.py[co] +__pycache__ +*.egg-info +*~ +*.bak +.ipynb_checkpoints +.tox +.DS_Store +\#*# +.#* .coverage -.coverage.* -.cache -nosetests.xml -coverage.xml -*,cover - -# Translations -*.mo -*.pot +src -# Django stuff: -*.log +*.swp +*.map +.idea/ +Read the Docs +config.rst -# Sphinx documentation -docs/_build/ +/.project +/.pydevproject -# PyBuilder -target/ +package-lock.json +data diff --git a/build.sh b/build.sh old mode 100644 new mode 100755 index 7ba0b06..61c49ea --- a/build.sh +++ b/build.sh @@ -1,11 +1,18 @@ -#!/env/bin bash -# Create the basic virtualenv -virtualenv FEC_data_notebook +#!/bin/bash +install_path=$1 +src_path=$(pwd) +app_path=$install_path/FEC_data_notebook -mkdir ./data -mkdir ./data/2016 +# Create the basic virtualenv +cd $install_path && virtualenv FEC_data_notebook +cp -r $src_path/src $app_path +cp $src_path/requirements.txt $app_path +cp $src_path/start.sh $app_path +mkdir $app_path/data +mkdir $app_path/data/2016 -wget -O ./data/2016/independent_expenditure_2016.csv https://cg-519a459a-0ea3-42c2-b7bc-fa1143481f74.s3-us-gov-west-1.amazonaws.com/bulk-downloads/2016/independent_expenditure_2016.csv +# Download the 2016 sample data to the data path +wget -O $app_path/data/2016/independent_expenditure_2016.csv https://cg-519a459a-0ea3-42c2-b7bc-fa1143481f74.s3-us-gov-west-1.amazonaws.com/bulk-downloads/2016/independent_expenditure_2016.csv # Activate the virtual env, install dependencies, and start the notebook -source ./FEC_data_notebook/bin/activate && pip install -r ./requirements.txt && cd ./src && jupyter notebook \ No newline at end of file +source $app_path/bin/activate && pip install -r $app_path/requirements.txt && export FEC_data_path=$app_path/data && cd $app_path/src && jupyter notebook diff --git a/src/Drafts/Independent Expenditures.ipynb b/src/Drafts/Independent Expenditures.ipynb index 46a0bcd..52d2686 100644 --- a/src/Drafts/Independent Expenditures.ipynb +++ b/src/Drafts/Independent Expenditures.ipynb @@ -27,7 +27,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 4, "metadata": {}, "outputs": [], "source": [ @@ -46,7 +46,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 5, "metadata": {}, "outputs": [], "source": [ @@ -61,7 +61,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 6, "metadata": {}, "outputs": [], "source": [ @@ -71,9 +71,22 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 7, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + " expenditure date\n", + "0 188000.0 2016-11-07\n", + "1 50359.0 2016-10-26\n", + "2 100000.0 2016-10-28\n", + "3 22000.0 2016-11-03\n", + "4 68240.0 2016-11-03\n" + ] + } + ], "source": [ "# Convert the dataframe with headers to an RDD, for use in map/reduce actions\n", "total_expenditures_rdd = (\n", @@ -100,9 +113,20 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 8, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "Row(cand_id='P00003392', cand_name='CLINTON, HILLARY RODHAM', spe_id='C00344531', spe_nam='1199 32BJ/144 SERVICE EMPLOYEES INTERNATIONAL UNION HOME CARE POLITICAL ACTION FUND', ele_type='G', can_office_state=None, can_office_dis='00', can_office='P', cand_pty_aff='DEMOCRATIC PARTY', exp_amo='188000', exp_date='07-NOV-16', agg_amo='188000', sup_opp='S', pur='EVENT EXPENSES', pay='ART SCHOOL DROPOUT INC.', file_num='1123839', amndt_ind='N', tran_id='SE.5047', image_num='201611049037122225', receipt_dat='04-NOV-16', fec_election_yr='2016', prev_file_num=None)" + ] + }, + "execution_count": 8, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "# Print the first expenditures RDD -- this is for general debugging and viewing\n", "total_expenditures_rdd.first()" @@ -110,7 +134,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 9, "metadata": {}, "outputs": [], "source": [ @@ -133,9 +157,17 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 10, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[(39523, 'CLINTON, HILLARY'), (16440, 'STRICKLAND, TED'), (9572, 'ROSS, DEBORAH'), (7577, 'MCGINTY, KATHLEEN'), (3316, 'MURPHY, PATRICK'), (3297, 'KANDER, JASON'), (1979, 'CLINTON, HILLARY RODHAM'), (885, 'TRUMP, DONALD'), (820, 'DUCKWORTH, TAMMY'), (682, 'RUBIO, MARCO'), (673, 'BUSH, JEB'), (671, 'CHRISTIE, CHRISTOPHER J.'), (574, \"CRUZ, RAFAEL EDWARD 'TED'\"), (572, 'SANDERS, BERNARD'), (497, 'CARSON, BEN'), (452, 'BAYH, EVAN'), (403, 'SANDERS, BERNIE'), (398, 'CRUZ, TED'), (307, 'MASTO, CATHERINE CORTEZ'), (257, 'GLENN, DARRYL'), (242, \"CRUZ, RAFAEL 'TED'\"), (223, 'JOHNSON, RON'), (198, 'TRUMP, DONALD J'), (191, 'MCGINTY, KATIE'), (185, 'RODHAM CLINTON, HILLARY'), (181, 'KASICH, JOHN R'), (177, 'CRUZ, RAFAEL EDWARD TED'), (172, 'CORTEZ MASTO, CATHERINE'), (168, 'MCGINTY, KATHLEEN ALANA'), (153, 'HECK, JOE'), (153, 'PAUL, RAND'), (149, 'FIORINA, CARLY'), (148, 'FEINGOLD, RUSS'), (119, 'PORTMAN, ROB'), (117, 'HASSAN, MARGARET WOOD'), (113, 'LEE, MIKE'), (110, 'LOVE, MIA'), (105, 'TRUMP, DONALD J.'), (99, 'BLUNT, ROY'), (99, 'WALKER, SCOTT'), (98, 'TOOMEY, PATRICK JOSEPH'), (97, 'KIHUEN, RUBEN'), (92, 'CORTEZ-MASTO, CATHERINE'), (91, 'GRAHAM, LINDSEY'), (88, 'MURPHY, PATRICK E'), (83, 'BURR, RICHARD'), (82, 'DRISKELL, GRETCHEN'), (81, 'CLINTON, HILARY'), (81, 'ROSS, DEBORAH K'), (80, 'HURD, WILLIAM'), (74, 'VERNON, MONICA'), (73, 'CAMPBELL, FOSTER LONNNIE II'), (69, 'KIRKPATRICK, ANN LEILA'), (68, 'CURBELO, CARLOS'), (65, 'SCOTT, TIMOTHY E'), (63, 'CLINTON, HILLARY RODHAM / K'), (62, 'JOHNSON, GARY'), (61, 'ASHFORD, BRAD'), (61, 'AYOTTE, KELLY A'), (59, 'JOHNSON, RONALD HAROLD'), (58, 'WARD, KELLI'), (58, 'VAN HOLLEN, CHRIS'), (55, 'DESANTIS, RONALD'), (53, 'HASSAN, MARGARET'), (52, 'AYOTTE, KELLY A.'), (52, 'JAYAPAL, PRAMILA'), (51, 'GALLAGHER, MIKE'), (51, 'STUTZMAN, MARLIN'), (50, 'JINDAL, BOBBY'), (49, 'TOOMEY, PATRICK'), (48, 'GALLEGO, PETE'), (48, 'BENNETT, LUANN'), (47, 'HOEBER, AMIE'), (45, 'EGGMAN, MICHAEL'), (45, \"O'MALLEY, MARTIN\"), (44, 'SCHNEIDER, BRAD'), (44, 'MAST, BRIAN'), (43, 'CRUZ, RAFAEL'), (43, 'NELSON, TOM'), (41, 'APPLEGATE, DOUG'), (39, 'CRANE, MICHAEL ROBERT'), (39, 'CARBAJAL, SALUD'), (39, 'HUCKABEE, MIKE'), (39, 'DOLD, ROBERT'), (38, 'HILLARY, CLINTON'), (38, 'VELAZQUEZ, NYDIA'), (38, 'GOTTHEIMER, JOSH'), (37, 'FEINGOLD, RUSSELL'), (36, 'DOLD, ROBERT JAMES JR'), (36, 'SHEA-PORTER, CAROL'), (35, 'SZELIGA, KATHY'), (35, 'FEINGOLD, RUSSELL DANA'), (34, 'MCCAIN, JOHN S'), (33, 'CAFORIO, BRYAN'), (33, 'DAVIDSON, WARREN'), (33, 'HILLARY CLINTON, RUSS FEINGOLD'), (32, 'GAETZ, MATT'), (31, 'MURPHY, STEPHANIE'), (31, 'MARSHALL, ROGER W.'), (31, 'AYOTTE, KELLY'), (30, 'HOLLINGSWORTH, TREY'), (29, 'NEGRON, REBECCA'), (28, 'THOMAS, MARY'), (27, 'MASTO, CATHERINE'), (27, 'DENHAM, JEFF'), (27, 'REED, THOMAS W II'), (26, 'HUELSKAMP, TIMOTHY A REPRESENTA'), (26, 'TED, STRICKLAND'), (26, 'SCHRADER, KURT'), (26, 'KENNEDY, JOHN NEELY'), (26, 'STEFANIK, ELISE M.'), (25, 'KUSTER, ANN MCLANE'), (25, 'WILLIS, COLM'), (25, 'HUERTA, EMILIO'), (25, 'DIANE, CHISESI'), (25, 'YOUNG, DAVID'), (25, 'CARROLL, MORGAN'), (24, 'EDWARDS, DONNA FERN'), (24, 'BUDD, THEODORE P MR.'), (23, 'PENA-MELNYK, JOSELINE'), (23, 'WASSERMAN SCHULTZ, DEBBIE'), (23, 'CLINTON, CLINTON'), (22, 'COFFMAN, MIKE'), (22, 'PG, SITTENFELD'), (22, 'YOUNG, TODD'), (22, 'FERGUSON, DREW'), (21, 'BACON, DONALD'), (21, 'FAREED, JUSTIN'), (21, 'JOHNSON, JAMES'), (21, 'PERRY, JAMES R (RICK)'), (21, 'BENNET, MICHAEL F'), (20, 'SANTORUM, RICHARD J.'), (20, 'MCCAIN, JOHN'), (20, 'ZINKE, RYAN K'), (20, 'MANESS, ROBERT L COL. RET'), (20, 'PAULSEN, ERIK'), (20, 'TARKANIAN, DANNY'), (19, 'LEE, YUNGMAN'), (19, 'HARRIS, KAMALA'), (19, 'GUTIERREZ, ANA SOL'), (19, 'BIGGS, ANDY'), (18, 'BARRAGAN, NANETTE'), (18, 'DERICKSON, TIMOTHY'), (18, 'CRAIG, ANGIE'), (18, 'WILDER, SELLUS'), (18, 'SOTO, DARREN'), (18, 'BANKS, JAMES'), (18, 'MOONEY, ALEXANDER XAVIER'), (17, 'SANTARSIERO, STEVEN'), (17, 'SASSE, BENJAMIN E'), (17, 'BERA, AMERISH'), (17, 'BLUM, RODNEY'), (17, 'CARSON, BENJAMIN S SR MD'), (17, 'KENNEDY, JOHN'), (17, 'HILARY, CLINTON'), (17, 'ISAKSON, JOHNNY'), (17, 'WILLIAM BILL WELD, GARY JOHNSON /'), (17, 'EMMER, THOMAS EARL JR.'), (16, 'TENNEY, CLAUDIA'), (16, 'TOTH, STEVE'), (16, 'SESTAK, JOSEPH'), (16, 'GUINTA, FRANK'), (16, 'TED, CRUZ'), (16, 'ROSEN, JACKY'), (16, 'COMSTOCK, BARBARA J.'), (16, 'TEACHOUT, ZEPHYR'), (16, 'HARDY, CRESENT'), (16, 'JONES, SCOTT'), (16, 'CAIN, EMILY'), (15, 'MURKOWSKI, LISA'), (15, 'HUELSKAMP, TIMOTHY'), (15, 'JOHNSON, RONALD'), (15, 'CLINTON, ROSS, HILLARY'), (15, 'NOLAN, RICK'), (15, 'DONALD, TRUMP'), (15, 'COOK, PAUL'), (15, 'ROGERS, WENDY'), (14, 'RASKIN, JAMIE'), (14, 'GRASSLEY, CHARLES E SENATOR'), (14, 'NOLAN, RICHARD'), (14, 'CURBELO, CARLOS MR.'), (14, 'BANKS, JAMES E'), (14, 'COMSTOCK, BARBARA J HONORABLE'), (14, 'NORCROSS, DONALD'), (14, 'KATKO, JOHN M'), (14, 'VALADAO, DAVID'), (14, 'CORREA, LOU'), (14, 'GARCIA, JOSE'), (13, 'PATRICK, MURPHY'), (13, 'BRADY, KEVIN'), (13, 'KATIE, MCGINTY'), (13, 'MOWRER, JIM'), (13, 'FITZPATRICK, BRIAN'), (13, 'FLYNN, MICHAEL'), (13, 'ZELDIN, LEE M'), (12, 'SHELBY, RICHARD'), (12, 'PATAKI, GEORGE E'), (12, 'TOOMEY, PAT'), (12, 'DUNN, NEAL'), (12, 'KIRK, MARK STEVEN'), (12, 'MATTHEWS, KATHLEEN'), (12, 'SMUCKER, LLOYD'), (12, 'JOHNSON, JAMES MICHAEL'), (12, 'COLM, WILLIS'), (12, 'HUDSON, RICHARD'), (11, 'BERGMAN, JOHN'), (11, 'SCHWARTZ, GAIL'), (11, 'MEEHAN, PATRICK L. MR.'), (11, 'POLIQUIN, BRUCE L'), (11, 'COMSTOCK, BARBARA'), (11, 'DEMINGS, VAL'), (11, 'HECK, JOSEPH'), (11, 'CHRISTIE, CHRISTOPHER J'), (11, 'JUDGE, PATTY JEAN'), (11, 'SHIMKUS, JOHN'), (11, 'DEACON, COLLEEN'), (10, 'DOLD JR., ROBERT JAMES MR.'), (10, 'EDWARDS, DONNA'), (10, 'GARRETT, SCOTT'), (10, ', '), (10, 'COFFMAN, MICHAEL'), (10, 'THRONE-HOLST, ANNA'), (9, 'GALLAGHER, MICHAEL JOHN'), (9, 'CORREA, JOSE LUIS (LOU)'), (9, \"O'MALLEY, MARTIN JOSEPH\"), (9, \"SUNDHEIM, GEORGE 'DUF'\"), (9, 'CHABOT, PAUL R DR.'), (9, 'HALL, ISADORE'), (9, 'MARIE, DAVIS'), (9, 'FLEMING, JOHN C JR'), (9, 'BRIDENSTINE, JAMES FREDERICK'), (9, 'ROBERSON, MICHAEL'), (9, 'FASO, JOHN J. MR.'), (9, 'PETERS, SCOTT'), (9, 'CARSON, BENJAMIN'), (9, 'KNIGHT, STEVE'), (9, 'YOUNG, TODD CHRISTOPHER'), (9, 'ROCHESTER, LISA BLUNT'), (8, 'ROSS, HENRY'), (8, 'BENNET, MICHAEL'), (8, 'CRANE, MICHAEL'), (8, 'YOUNG, DON'), (8, 'RANDOLPH, SUSANNAH'), (8, 'KIRKPATRICK, ANN'), (8, 'MYERS, KIM'), (8, 'JOYCE, DAVID'), (8, 'DESANTIS, RONALD D.'), (8, 'DESANTIS, RONALD D'), (8, 'KAPLAN, ANNA'), (8, 'HONDA, MIKE'), (8, 'DUNN, JOE'), (8, 'MARGARET, HASSAN'), (8, 'GRASSLEY, CHUCK'), (8, 'KEMPER, NANCY JO'), (8, 'DAVIS, MARIE'), (8, 'MARSHALL, ROGER'), (8, 'MICA, JOHN L. MR.'), (7, 'DUNN MD FACS, NEAL PATRICK'), (7, 'ROBY, MARTHA'), (7, 'MONTES, JOSEPH'), (7, 'MANDEL, JOSH'), (7, 'BERTRAND, RICK'), (7, 'GALLAGHER, MICHAEL'), (7, 'MARSHALL, ROGER W'), (7, 'STUTZMAN, MARLIN A.'), (7, 'TADDEO, ANNETTE'), (7, 'MILLS, STEWART'), (7, 'LAMALFA, DOUG'), (7, 'KHANNA, RO'), (7, 'BABEU, PAUL RAYMOND'), (7, 'KATHLEEN, MCGINTY'), (7, 'APPLEGATE, DOUGLAS'), (7, 'COSTELLO, RYAN A'), (7, 'HOLDING, GEORGE E'), (6, 'HUERTA, EMILIO JESUS MR.'), (6, 'JUNEAU, DENISE'), (6, 'LATTA, BOB'), (6, 'HIDALGO, JUAN M JR'), (6, 'FREEMAN, MARC BENJAMIN'), (6, 'KELSEY, BRIAN'), (6, 'MCMULLIN, EVAN'), (6, 'JOHNSON, LONNIE'), (6, 'PENA-MELNYK, JOSELINE A.'), (6, 'BRIDENSTINE, JAMES'), (6, 'ROGERS, MIKE'), (6, ', HILLARY'), (6, 'SANTARSIERO, STEVEN J'), (6, 'RUIZ, RAUL'), (6, 'TIPTON, SCOTT R.'), (6, 'PITTENGER, ROBERT'), (6, 'MCSALLY, MARTHA E. MS.'), (6, 'KEFALAS, CHRYSOVALANTIS P'), (6, 'WEST, BENJAMIN'), (6, 'SESSIONS, PETE'), (6, 'CLINTON, ROSS, HILLARY DEBORAH'), (6, 'FAYARD, CATHRYN CAROLINE'), (6, 'MCCARTHY, KEVIN'), (6, 'TURNER, MICHAEL'), (6, 'CRIST, CHARLIE JOSEPH'), (6, 'MURRAY, PATTY'), (6, 'HIGGINS, CAPTAIN CLAY'), (6, 'HARTMAN, CHRISTINA'), (6, 'GARCIA, JOE'), (6, 'RENACCI, JAMES'), (6, 'ROSS, HILLARY, DEBORAH'), (5, 'MCSALLY, MARTHA E'), (5, 'LAHOOD, DARIN'), (5, 'GOWDY, TREY'), (5, 'CHABOT, PAUL'), (5, 'SHIMKUS, JOHN M'), (5, 'HOWARD, JULIA'), (5, 'GARRETT, SCOTT REP.'), (5, 'LAWRENCE, BRENDA LULENAR'), (5, 'UPTON, FREDERICK STEPHEN'), (5, 'ANGELLE, SCOTT MR.'), (5, 'SMUCKER, LLOYD K'), (5, 'HOLLIDAY, ED'), (5, 'KATKO, JOHN'), (5, 'RAND, PAUL'), (5, 'ZELDIN, LEE'), (5, 'GOSAR, PAUL'), (5, 'HILLARY, HILLARY'), (5, 'CRAIG, ANGELA'), (5, 'HILLARY RODHAM, CLINTON'), (5, 'GRAY, JIM P'), (5, 'DONOVAN, DAN'), (5, 'SANCHEZ, LORETTA'), (5, 'BABEU, PAUL'), (5, 'NEHLEN, PAUL III'), (5, 'COLE, TOM'), (5, 'NOLAN, RICHARD MICHAEL'), (4, 'STARR, MICHAEL BOB'), (4, 'TITUS, DINA'), (4, 'WALKINSHAW, BRADY PINERO'), (4, 'SUSIE, LEE'), (4, 'NEHLEN, PAUL'), (4, 'EVANS, DWIGHT'), (4, 'HOLDING, GEORGE E MR.'), (4, 'SHUSTER, BILL'), (4, 'PITTENGER, ROBERT M. HON.'), (4, 'MCCARTER, KYLE'), (4, 'DANNY, ZELAYA'), (4, 'SMITH, ADAM'), (4, \"O'HALLERAN, TOM\"), (4, 'HOUCHIN, ERIN'), (4, 'PHILLIPS, GEORGE'), (4, 'WELLS, STEVEN'), (4, 'CANOVA, TIMOTHY A.'), (4, 'GARRETT, THOMAS'), (4, 'YODER, KEVIN'), (4, 'GRIFFIN, TAYLOR'), (4, 'ESPAILLAT, ADRIANO'), (4, 'ROUZER, DAVID'), (4, 'CONYERS, JOHN'), (4, 'JOHNSON, WILLIAM'), (4, 'STUTZMAN, MARLIN A'), (4, 'JOLLY, DAVID W.'), (4, 'DELBENE, SUZAN'), (4, 'MIKE, LEE'), (4, 'RUBIN, JOEL'), (4, 'GLENN, JON'), (4, 'SUOZZI, THOMAS'), (4, 'HARTZLER, VICKY'), (4, 'TRUMP, DONALD J. / MICHAEL'), (3, 'ELLMERS, RENEE'), (3, 'SHELBY, RICHARD C'), (3, 'VERNON, MONICA W'), (3, 'TRUMO, DONALD'), (3, 'SINEMA, KYRSTEN'), (3, 'GREEN, GENE'), (3, 'KUO, PETER'), (3, 'BIRCHER, MARK'), (3, 'BOOZMAN, JOHN'), (3, 'DOLD, ROBERT JAMES MR JR'), (3, 'ZOPP, ANDREA'), (3, 'DUCKWORTH, L. TAMMY'), (3, 'PAPE, MICHAEL J'), (3, 'RAMIREZ, RITA'), (3, 'JONES, WALTER'), (3, 'BARNEY, SEAN'), (3, 'COSTELLO, RYAN'), (3, 'LUANN, BENNETT'), (3, 'LEE, MICHAEL'), (3, 'BERUFF, CARLOS'), (3, 'JOE, HECK'), (3, 'BERNIE 2016, BERNIE'), (3, 'KIRK, MARK'), (3, 'ZINKE, RYAN'), (3, 'FERGUSON IV, ANDERSON DREW'), (3, 'MCMULLIN, EVAN JOHNSON'), (3, 'DAVIS, RODNEY'), (3, 'JOYCE, DAVE'), (3, 'ISSA, DARRELL'), (3, 'ANGELLE, SCOTT'), (3, 'LINDBECK, STEVE'), (3, 'DUCKWORTH, L TAMMY'), (3, 'WILSON, FREDERICA'), (3, 'CORTEZ MASTO (NV), CATHERINE'), (3, 'KEYSER, JON'), (3, 'STEVE, KING'), (3, 'BOST, MICHAEL'), (3, 'REED, TOM'), (3, 'GOODLATTE, BOB'), (3, 'STRAUSS, RAYMOND JOHN'), (3, 'WALLKER, SCOTT'), (3, 'NITO, PARRA'), (3, 'BEN, CARSON'), (3, 'LONNIE, JOHNSON'), (3, 'BYDLAK, REBEKAH'), (3, 'KINGSON, ERIC R. MR.'), (3, 'BONOFF, TERRI'), (3, 'EDWARD, MALIN'), (3, 'SIDIE, JAY'), (3, 'HULTGREN, RANDY'), (3, 'CRIST, CHARLIE'), (3, 'PAT, TOOMEY'), (3, 'NICK, BAUMAN'), (3, 'LEWIS, JASON'), (3, 'HECK, DENNIS'), (2, 'KASICH, JOHN'), (2, 'DOLD, BOB'), (2, 'PARRA, NITO'), (2, 'MIA, LOVE'), (2, 'TIM, SCOTT'), (2, 'AGUILAR, PETE'), (2, 'BRAT, DAVID ALAN'), (2, 'FLORES, LUCY'), (2, 'LARSEN, RICK'), (2, '/ KAINE, CLINTON'), (2, 'PELOSI, NANCY'), (2, 'LAPOLICE, ALAN'), (2, 'LUCIUS, CASEY'), (2, 'JOHNSON, RAN'), (2, 'ELIZABETH, CHENEY'), (2, 'LIZ, CHENEY'), (2, 'RAMSLAND, RUSSELL'), (2, 'ASHOOH, RICHARD E.'), (2, 'MURHPY, PATRICK'), (2, 'ARRINGTON, JODEY COOK'), (2, 'DONALD J. TRUMP FOR PRESIDENT, INC.'), (2, 'PARRISH, RAY'), (2, 'BUSTOS, CHERI'), (2, 'TODD, YOUNG'), (2, 'LONG, WENDY'), (2, 'CLINTON, KIRK'), (2, 'WALZ-ALLEN, MIRANDA'), (2, 'HOLDING, GEORGE E B'), (2, 'KYRSTEN, SINEMA'), (2, 'TAYLOR, SCOTT'), (2, 'BERA, AMI'), (2, 'MEEHAN, PATRICK'), (2, 'GLENN, DAVID'), (2, 'WAKELY, THOMAS MR.'), (2, 'MCMULLIN, DAVID'), (2, 'CASTLE, DARRELL'), (2, 'GREEN, RAYMOND'), (2, 'WRIGHT, KEITH'), (2, \"O'CONNOR, SHAWN PATRICK\"), (2, 'TAKANO, MARK'), (2, 'JAWANDO, WILL'), (2, 'WRIGHT, KEITH L T'), (2, 'NEWMAN, MARIE'), (2, 'JONES, WALTER B.'), (2, 'BACON, DON'), (2, 'BUDD, THEODORE'), (2, 'MORAN, JERRY'), (2, 'KILMER, DEREK'), (2, 'HASSAN, MAGGIE'), (2, 'SPEIER, JACKIE'), (2, 'KINZINGER, ADAM'), (2, 'ROS-LEHTINEN, ILEANA THE HON.'), (2, 'CASPERSON, TOM'), (2, 'SHUSTER, WILLIAM MR.'), (2, 'MCMULLIN / NATHAN DANIEL, EVAN JOHNSON'), (2, 'GRIFFITH, MORGAN'), (2, 'UPTON, FREDERICK'), (2, 'AYOTTE, KELLEY'), (2, 'HEINZ, MATTHEW G.'), (2, 'POCAN, MARK'), (2, 'RON, DESANTIS'), (2, 'CHARLES, FERRY'), (2, 'GALLEGOS, PETE'), (2, 'CHISESI, DIANE'), (2, 'LAHOOD, DARIN MCKAY'), (2, 'ROSKAM, PETER'), (2, 'MARCO, RUBIO'), (2, 'COMER, JAMES'), (2, 'DONALD TRUMP, MIKE PENCE'), (2, 'BERGMAN, JACK'), (2, 'GRAYSON, DENA MD, PHD'), (2, 'BAUCUM, RALPH'), (2, 'CLINTON / KAINE, HILLARY RODHAM / TIM'), (2, 'FLEMING, JOHN'), (2, 'GARRETT, E SCOTT'), (2, 'SUOZZI, TOM'), (2, 'DOLD, JR., ROBERT J.'), (2, 'FETTERMAN, JOHN'), (1, 'GLENN, MANYA'), (1, 'JOHNSON, ESTELLE'), (1, 'JOHNSON, RED'), (1, 'ROONEY, FRANCIS'), (1, 'BISHOP, MIKE'), (1, 'WELLS, STEVE'), (1, 'FAYARD, CATHRYN'), (1, 'SHAPIRO, JOSH'), (1, 'GARY, JOHNSON'), (1, 'WARREN, STEWART'), (1, 'MULLIN, MARKWAYNE'), (1, 'SMITH, CHRISTOPHER'), (1, 'HECK, DENNY'), (1, 'ADAMS, ALMA SHEALEY'), (1, 'EDWARD, CRUZ'), (1, 'RAFAEL, CRUZ'), (1, 'TENNEY, CLAUDIE'), (1, 'BYRNE, BRADLEY'), (1, 'HILLARY RODHAM CLINTON, RUSS FEINGOLD'), (1, 'MCTEAGUE, DAVE'), (1, 'ROS-LEHTINEN, ILEANA'), (1, 'CHRISTIE, CHRIS'), (1, 'GLEN, SETH'), (1, 'HALL, ISAHORE'), (1, 'TRUMP, DONALD J. / M. PENCE'), (1, 'REICHERT, DAVE'), (1, 'CLINTON, HILLLARY'), (1, 'MASSIE, THOMAS H.'), (1, 'KUSTER, ANN'), (1, 'KYLE, MCCARTER'), (1, 'BARKSDALE, JAMES FREEMAN'), (1, 'CLINTON / SUOZZI / RICE/ SCHUM, HILLARY'), (1, 'CLINTON/SUOZZI/RICE/SCHUMER, HILLARY/TOM/KATHELEE'), (1, 'CHENEY, ELIZABETH'), (1, 'MOORE, GWENDOLYNNE'), (1, 'DAVIS, BRUCE'), (1, 'MCNEIL, JOHN P'), (1, 'PRICE, DAVID'), (1, 'LOUIE, GOHMERT'), (1, 'KHOURI, TONIA'), (1, 'TREY, GOWDY'), (1, 'J, RON'), (1, 'VALADAO, DAVID.'), (1, 'SCOTT, ROBERT'), (1, 'RUSSEL, FEINGOLD'), (1, 'ROBERT, DOLD'), (1, 'GRAYSON, DENA'), (1, 'PATAKI, GEORGE'), (1, 'GLENN, ARRYL'), (1, 'JOOHNSON, RON'), (1, 'GRAYSON, ALAN MARK'), (1, 'MCMULIN, EVAN'), (1, 'GRABELLE, JUSTIN M'), (1, 'FLYNN, MIKE'), (1, 'ELIJAH, MANLEY'), (1, 'MEADOWS, MARK R'), (1, 'TRUMP, DONLAD'), (1, 'CATHERINE, CORTEZ MASTO'), (1, 'QUIST, ROB'), (1, 'OLSZEWSKI, AL'), (1, 'FASO, JOHN'), (1, 'JAPAYAL, PRAMILA'), (1, 'DONALS, TRUMP'), (1, 'TRUMP, DONALS'), (1, 'ELBERT, GUILLORY'), (1, 'FRANK, BEN'), (1, 'CONNOLLY, GERALD E'), (1, 'BRAD, ASHFORD'), (1, 'LOBIONDO, FRANK A.'), (1, 'ALLEN, JASON'), (1, 'SANTORUM, RICHARD'), (1, 'SCHUMER, CHARLES'), (1, 'LAW, ALEXANDER'), (1, 'KATIE, MCGINTY'), (1, 'RON, JOHNSON'), (1, 'LANCE, LEONARD'), (1, 'DIANE, CHISSESI'), (1, 'BACKER, DAN'), (1, 'DICIANNI, PETER'), (1, \"DEMINGS, VALDEZ 'VAL'\"), (1, 'TOWNSEND, BRYAN'), (1, 'CLINTON/SUOZZI/RICE/SCHUMER, '), (1, 'BRANNON, JOSH'), (1, 'DERICKSON, T'), (1, 'CRAIG, ANGELA DAWN'), (1, 'GERRITSON, REBECCA'), (1, 'GOHMERT, LOUIE'), (1, 'BEYER, DONALD STERNOFF'), (1, 'MOORE, GWEN S'), (1, 'ERIK, PAULSEN'), (1, 'GENE, GREEN'), (1, 'COPE, CLAY'), (1, 'GLENN, SETH'), (1, 'WALTZ, BRENT'), (1, 'SHAPINO, JOSH'), (1, 'BABINEC, MARTIN'), (1, 'WALSER, JASON'), (1, 'MILLS, THOMAS'), (1, 'GARCIA, JOSE ANTONIO'), (1, 'CCARSON, BEN'), (1, 'RYAN, PAUL'), (1, 'COTTON, THOMAS'), (1, 'LAND, TERRI LYNN'), (1, 'JOHNSON, MICHAEL'), (1, 'KIEHNE, GARY'), (1, 'AMERISH, BERA'), (1, 'CORTEZ-MASTOS, CATHERINE'), (1, 'PAULSEN, ERIC'), (1, 'GLENN, DARRY'), (1, 'GLENN, SHAWN'), (1, 'JOHSON, RON'), (1, 'LAYENDECKER, LEVANA'), (1, 'ASHOOH, RICHARD'), (1, 'LONG, BILLY'), (1, 'GORDON, KINZLER'), (1, 'DANIEL, MUROFF'), (1, 'CLLINTON, HILLARY'), (1, 'SLAUGHTER, LOUISE'), (1, 'BRYSON, RICK'), (1, 'HURD, WILL'), (1, 'MCSALLY, MARTHA'), (1, 'PLUMB, JOHN'), (1, 'DENT, CHARLES'), (1, 'GREGORY, DUWAYNE'), (1, 'STEFANIK, ELISE M'), (1, 'COSTA, JIM'), (1, 'DEBORAH, ROSS'), (1, 'MACARTHUR, THOMAS'), (1, 'LOFGREN, ZOE'), (1, ', HILLARY / TOM / KATH'), (1, 'MIKE, JOHNSON'), (1, 'WHITWELL, ROBERT'), (1, 'SCHNEIDER, BRADLEY SCOTT'), (1, 'DASTO, CATHERINE COR'), (1, 'BOST, MIKE'), (1, 'SHAUGHNESSY, NAUGHTON'), (1, 'VARIOUS REPUBLICAN, CANDIDATES'), (1, 'MAGGIE, HASSAN'), (1, 'RUSS, FEINGOLD'), (1, 'CLINTON (NV), HILLARY'), (1, 'BONGINO, DANIEL J'), (1, 'GOSAR, PAUL ANTHONY'), (1, 'GLENN, DARR'), (1, 'DAVIS, RODNEY L'), (1, 'HUELSKAMP, TIMOTHY A'), (1, 'TUMP, DONALD'), (1, 'PETERSON, COLLIN CLARK'), (1, 'CLEMENTS, PAUL'), (1, 'KELLY, ROBIN L.'), (1, 'NOLAN, RICHARD M.'), (1, 'POLIQUIN, BRUCE'), (1, 'CHABOT, STEVE'), (1, 'HOLDING, GEORGE'), (1, 'CLINTON, '), (1, 'CLINTON/SUOZZI/RICE/SCHUMER, HILLARY'), (1, 'JAMES, JORDAN'), (1, 'JAMES, LANKFORD'), (1, 'KELLI, WARD'), (1, 'ROSENBAUM, ANDREW'), (1, 'KRISHNAMOORTHI, S. RAJA'), (1, 'ADRIAN, GARCIA'), (1, \"ANTHONY, D'ORAZIO\"), (1, 'WARREN, WEST')]\n" + ] + } + ], "source": [ "# Print to the console a list containing tuples of (count of supportive expenditures, candidate names)\n", "print(supportive_expenditures_by_candidate.collect())" @@ -143,9 +175,17 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 11, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[(27648, 'TRUMP, DONALD'), (12715, 'PORTMAN, ROB'), (8801, 'BURR, RICHARD'), (2663, 'TOOMEY, PATRICK'), (2476, 'CLINTON, HILLARY RODHAM'), (1997, 'TRUMP, DONALD J.'), (1634, 'BLUNT, ROY'), (1432, 'RUBIO, MARCO'), (1229, 'CLINTON, HILLARY'), (853, 'TRUMP, DONALD J'), (811, 'KIRK, MARK'), (472, 'YOUNG, TODD'), (362, 'STRICKLAND, TED'), (322, 'BAYH, EVAN'), (288, 'MCGINTY, KATHLEEN ALANA'), (278, 'KANDER, JASON'), (255, 'HECK, JOE'), (213, 'MURPHY, PATRICK E'), (197, 'FEINGOLD, RUSSELL DANA'), (189, 'MASTO, CATHERINE CORTEZ'), (186, 'AYOTTE, KELLY'), (175, 'ROSS, DEBORAH K'), (166, 'CORTEZ MASTO, CATHERINE'), (152, 'TOOMEY, PAT'), (152, 'CARROLL, MORGAN'), (122, 'MASTO, CATHERINE'), (117, 'HECK, JOSEPH'), (116, 'MCGINTY, KATHLEEN'), (106, 'HURD, WILLIAM'), (99, \"CRUZ, RAFAEL EDWARD 'TED'\"), (98, 'GARRETT, SCOTT'), (88, 'POLIQUIN, BRUCE'), (83, 'COMSTOCK, BARBARA'), (80, 'MILLS, STEWART'), (79, 'TARKANIAN, DANNY'), (75, 'TOOMEY, PATRICK JOSEPH'), (72, 'KNIGHT, STEVE'), (71, 'FITZPATRICK, BRIAN'), (68, 'TENNEY, CLAUDIA'), (68, 'BLUM, RODNEY'), (67, 'FASO, JOHN'), (67, 'CATHERINE, MASTO'), (66, 'CLINTON, HILARY'), (65, 'TEACHOUT, ZEPHYR'), (65, 'JONES, SCOTT'), (65, 'DONALD, TRUMP'), (61, 'ROSS, DEBORAH'), (60, 'BUSH, JEB'), (59, 'COFFMAN, MICHAEL'), (58, 'PERKINS, RANDY'), (57, 'ASHFORD, BRAD'), (57, 'AYOTTE, KELLY A'), (56, 'ELLMERS, RENEE'), (54, 'BABINEC, MARTIN'), (53, 'HASSAN, MARGARET WOOD'), (52, 'GARCIA, JOE'), (51, 'COFFMAN, MIKE REP.'), (51, 'MARGARET, HASSAN'), (51, 'BABEU, PAUL'), (50, 'BERGMAN, JOHN'), (50, 'BENNETT, LUANN'), (48, 'JOSEPH, PATRICK'), (48, 'YOUNG, DAVID'), (47, 'ROSEN, JACKY'), (46, 'CAIN, EMILY'), (44, 'CURBELO, CARLOS'), (44, 'FEINGOLD, RUSSELL'), (43, 'MOWRER, JIM'), (43, 'HARDY, CRESENT'), (42, 'ISSA, DARRELL'), (41, 'KASICH, JOHN'), (40, 'CRIST, CHARLIE JOSEPH'), (39, 'HUELSKAMP, TIMOTHY A.'), (39, 'PAULSEN, ERIK'), (38, 'FASO, JOHN J. MR.'), (37, 'BRADY, KEVIN'), (37, 'KATKO, JOHN'), (36, 'DUNN, NEAL PATRICK MD'), (34, 'MURPHY, PATRICK'), (34, 'KASICH, JOHN R'), (34, 'VERNON, MONICA'), (34, 'TRUMP, '), (34, 'ZELDIN, LEE'), (33, 'GALLEGO, PETE'), (33, 'PATRICK, TOOMEY'), (33, 'LEWIS, JASON'), (32, 'KIHUEN, RUBEN'), (32, 'JOHNSON, LON'), (32, 'GOSAR, PAUL ANTHONY'), (31, 'ROY, BLUNT'), (31, 'MYERS, KIM'), (31, 'FERGUSON, ANDERSON DREW IV'), (31, 'CHRISTIE, CHRISTOPHER J.'), (31, 'YODER, KEVIN'), (31, 'BIRCH, BAYH'), (31, 'ELLMERS, RENEE JACISIN'), (30, 'FEINGOLD, RUSS'), (29, 'CRUZ, RAFAEL EDWARD TED'), (29, 'CRUZ, TED'), (29, 'TRUMP, TRUMP'), (29, 'CARBAJAL, SALUD'), (28, 'HUELSKAMP, TIMOTHY A REPRESENTA'), (28, 'BENNETT, MICHAEL'), (28, 'DENHAM, JEFF'), (28, 'DEACON, COLLEEN'), (27, 'WARD, KELLI'), (27, 'JOHNSON, RON'), (27, 'JOHNSON, RONALD HAROLD'), (27, 'MICA, JOHN'), (26, 'KELLY, AYOTTE'), (25, 'SANTARSIERO, STEVEN'), (25, 'SCHNEIDER, BRADLEY'), (25, 'NOLAN, RICHARD'), (25, 'ROB, PORTMAN'), (25, 'NELSON, TOM'), (25, 'KATHLEEN, MCGINTY'), (24, 'HASSAN, MARGARET'), (23, 'YODER, SHELLI'), (23, 'JOE, HECK'), (23, 'SOTO, DARREN'), (23, 'RICHARD, BURR'), (22, 'TED, STRICKLAND'), (22, 'TODD, YOUNG'), (22, 'CRUZ, RAFAEL'), (22, 'NOLAN, RICK'), (22, 'FASO, JOHN J.'), (21, 'TINNEY, CLAUDIA'), (21, 'CRAIG, ANGIE'), (21, 'BOUSTANY, CHARLES W.'), (20, 'THOMAS, MARY'), (20, 'THEODORE, STRICKLAND'), (19, 'MCCAIN, JOHN'), (19, 'FAREED, JUSTIN'), (19, 'KASICH, JOHN R.'), (18, 'JOHNSON, RONALD'), (18, 'GRASSLEY, CHARLES E SENATOR'), (18, 'CHRISTIE, CHRIS'), (18, 'PAUL, RAND'), (17, 'KIRKPATRICK, ANN LEILA'), (17, 'TOOMEY (PA), PAT'), (17, 'HOLLINGSWORTH, TREY'), (17, 'CAMPBELL, FOSTER'), (17, 'CARSON, BENJAMIN'), (17, 'HECK (NV), JOE'), (17, 'BENNET, MICHAEL F'), (16, 'BERA, AMERISH'), (16, 'FLEMING, JOHN C.'), (16, 'FIORINA, CARLY'), (16, 'RYAN, PAUL'), (16, 'LOVE, MIA'), (16, 'KENNEDY, JOHN NEELY'), (16, 'DOLD, ROBERT'), (15, 'BACON, DONALD'), (15, 'MARSHALL, ROGER W'), (15, 'MURPHY, PATRICK E.'), (15, 'ANGELLE, SCOTT MR.'), (15, 'HEANEY, ANDREW'), (15, 'BACON, DON'), (15, 'SANDERS, BERNARD'), (15, 'JOLLY, DAVID'), (15, 'DITTMAR, JANE'), (15, 'JASON, KANDER'), (15, 'TOM, KIP E'), (15, 'JONES, CHRISTINE'), (15, 'GRAHAM, LINDSEY'), (14, 'MCCAIN, JOHN S'), (14, 'BABEU, PAUL RAYMOND'), (14, 'WALBERG, TIMOTHY'), (13, 'CAFORIO, BRYAN'), (13, 'SANTARSIERO, STEVE'), (13, 'DUCKWORTH, L TAMMY'), (13, 'OWENS, H DOUGLAS'), (13, 'HUCKABEE, MIKE'), (13, 'TIPTON, SCOTT'), (12, 'TRUMP, TRUMP'), (12, 'GARCIA, ADRIAN'), (12, 'HONDA, MIKE'), (12, 'WALKER, SCOTT'), (12, 'YOUNG, TODD CHRISTOPHER'), (12, 'CHRISTIE, CHRISTOPHER J'), (12, 'THRONE-HOLST, ANNA'), (12, 'MASTRO, CATHERINE'), (11, 'EGGMAN, MICHAEL'), (11, 'GOSS, CHAUNCEY'), (11, 'KURT, SCHRADER'), (11, 'VALADAO, DAVID'), (11, 'HIGGINS, CAPTAIN CLAY'), (11, 'ZOELLER, GREGORY FRANCIS MR.'), (10, 'PATRICK, MURPHY'), (10, 'POLIQUIN, BRUCE L'), (10, 'BERA, AMI'), (10, 'DAVIDSON, WARREN'), (10, 'BONOFF, TERRI'), (9, 'RANDOLPH, SUSANNAH'), (9, 'COFFMAN, MIKE'), (9, 'BONGINO, DANIEL'), (9, 'GRAYSON, DENA'), (9, 'HALL, ISADORE'), (9, 'SCHNEIDER, HELENE'), (9, 'SCHWARTZ, GALE'), (9, 'MCGINTY, KATIE'), (9, 'HARTMAN, CHRISTINA'), (9, 'SUOZZI, THOMAS'), (9, 'HALVORSON, ARTHUR L'), (8, 'ROONEY, FRANCIS'), (8, 'GALLAGHER, MICHAEL JOHN'), (8, 'GLENN, DARRYL'), (8, 'DERICKSON, TIMOTHY'), (8, ', '), (8, 'HUERTA, EMILIO'), (8, 'BEAGLE, WILLIAM'), (8, 'CLINTON/KAINE, HILLARY RODHAM/TIMOT'), (8, 'CORREA, LOU'), (8, 'DOLD, JR., ROBERT JAMES'), (8, 'RUTHERFORD, JOHN'), (8, 'SIDIE, JAY'), (8, 'MARSHALL, ROGER'), (7, 'RUBIO (FL), MARCO'), (7, 'GALLAGHER, MICHAEL'), (7, '/ PENCE, TRUMP'), (7, 'RUSSELL, FEINGOLD'), (7, 'HASSAN, MAGGIE'), (7, 'AYOTTE, KELLY A.'), (7, 'BLUNT (MO), ROY'), (7, 'MURPHY, STEPHANIE'), (7, 'SHEA-PORTER, CAROL'), (7, 'TRUMP, TRUMP TRUMP'), (6, 'YOUNG (IN), TODD CHRISTOPHER'), (6, 'BECCARO, THOMAS DEL'), (6, 'BENNET, MICHAEL'), (6, 'SHIMKUS, JOHN M'), (6, 'SCHRADER, KURT'), (6, 'LONNIE, CAMPBELL'), (6, 'DUCKWORTH, TAMMY'), (6, 'HOUCHIN, ERIN'), (6, 'STUTZMAN, MARLIN'), (6, 'JOYCE, DAVE'), (6, 'CARSON, BEN'), (6, 'CASPERSON, TOM'), (6, 'MASTRO, CATHERINE CORTEZ'), (6, 'CAMPBELL, FOSTER LONNIE II'), (6, 'SHKRELI, SUZANNA'), (6, 'GRAYSON, DENA MD, PHD'), (6, 'REED, THOMAS'), (5, 'RYAN, PAUL D.'), (5, 'TANZLER, HANS'), (5, 'CRANE, MICHAEL'), (5, 'DONALD J. TRUMP FOR PRESIDENT, INC.'), (5, 'SESTAK, JOSEPH'), (5, 'COMSTOCK, BARBARA J HONORABLE'), (5, 'KIRK, MARK STEVEN'), (5, 'ZINKE, RYAN'), (5, 'STEVEN, SANTARSIERO'), (5, 'BROWN, LIZ'), (5, 'EVANS, BAYH'), (5, 'DRISKELL, GRETCHEN'), (5, ', TRUMP'), (5, 'JUDGE, PATTY'), (4, 'CORTEZ-MASTO, CATHERINE'), (4, 'AYOTTE ((NH), KELLY'), (4, 'JOHNSON, GARY'), (4, 'GAETZ, MATT'), (4, 'CLINTON, HILLARY CLINTON/K'), (4, 'MARCO, RUBIO'), (4, 'JOHNSON, JAMES MICHAEL'), (4, 'DEBORAH, ROSS'), (4, 'SCHNEIDER, BRADLEY SCOTT'), (4, 'FLINN, GEORGE S DR JR'), (4, 'HEINZ, MATT'), (4, 'BRANNON, GREGORY'), (3, 'FLORES, LUCY'), (3, 'TOTH, STEVE'), (3, 'FIORE, MICHELE'), (3, 'LAHOOD, DARIN'), (3, 'OWENS, DOUG'), (3, 'CHABOT, PAUL'), (3, 'BANKS, JAMES E'), (3, 'MAXWELL, CHIP'), (3, 'ALLEN, JASON'), (3, 'MCMICHAEL, CRAIG'), (3, 'CARSON, BENJAMIN S SR MD'), (3, 'CANOVA, TIMOTHY A.'), (3, 'GRAY, JIM P'), (3, 'DEAN, ANDRE'), (3, 'FAYARD, CATHRYN CAROLINE'), (3, 'MARTINS, JACK'), (3, 'MITCHELL, PAUL III'), (3, 'SCHUMER, CHARLES E'), (3, 'BOUSTANY, CHARLES W JR DR'), (3, 'ROGERS, WENDY'), (3, 'SANDERS, BERNIE'), (3, 'HALVORSON, ARTHUR'), (3, 'NEGRON, REBECCA'), (3, 'CAMPBELL, FOSTER LONNNIE II'), (2, 'DONALD J., TRUMP'), (2, 'GRIFFIN, WILLIAM TAYLOR'), (2, 'CHRISTENSEN, GORDON'), (2, 'PELOSI, NANCY'), (2, 'EDWARDS, DONNA FERN'), (2, 'GARRETT, SCOTT REP.'), (2, 'GUINTA, FRANK'), (2, 'BIRCH, BAY'), (2, 'MURPHY, CHRISTOPHER S'), (2, 'JINDAL, BOBBY'), (2, 'KIRKPATRICK, ANN'), (2, 'TRUMP (IN), DONALD J.'), (2, 'TRUMP (MO), DONALD J.'), (2, 'KING, STEVE'), (2, 'HARRIS, KAMALA'), (2, 'BERUFF, CARLOS'), (2, 'FRANK, GUINTA'), (2, 'DUNN, NEAL'), (2, 'CANO, FERNANDO'), (2, 'NEU, JAMES'), (2, 'JONES, ROGER STARNER'), (2, 'ELDRIDGE, CONNER'), (2, 'DEGNER, KAI'), (2, 'KLEPINGER, ROBERT'), (2, 'MILLS, THOMAS'), (2, 'MUNDY, KEITH'), (2, 'GENE, GREEN'), (2, 'BURR (NC), RICHARD'), (2, 'GOTTHEIMER, JOSH'), (2, 'BOST, MICHAEL'), (2, 'MCCONNELL, JONATHAN EDWARD'), (2, 'MCCAIN, JOHN S.'), (2, 'CATHERINE, MAST0'), (2, 'HUELSKAMP, TIM'), (2, 'ZELDIN, LEE M'), (2, 'DERRICK, MIKE'), (2, 'SCHAKOWSKY, JANICE D'), (2, 'LASEE, FRANK'), (2, 'PERRY, RICK'), (2, 'JOHN, MCCAIN'), (1, 'PAUL, RYAN'), (1, 'CHRISTOPHER, YOUNG'), (1, 'WAGNER, ANN L.'), (1, 'HILLARY, CLINTON'), (1, 'DUKE, DAVID'), (1, 'HILL, JAMES FRENCH'), (1, 'CRUZ, RAFAEL EDWARD'), (1, 'BONNOFF, TERRI'), (1, 'JOLLY, DAVID W'), (1, 'MCGINTY, KATHLLEEN'), (1, 'CARROL, MORGAN'), (1, 'DELANEY, JOHN K'), (1, 'KITTS, DERRICK'), (1, 'PORTMA, ROB'), (1, 'GLIDEWELL, PET'), (1, 'FRANK, ROBERT'), (1, 'PETERS, GARY'), (1, 'BARRAGAN, NANETTE'), (1, 'REED, WENDY'), (1, 'PENCE, TRUMP /'), (1, 'CLINTON, HILL'), (1, 'PRYOR, MARK LUNSFORD'), (1, 'LANDRIEU, MARY L'), (1, 'MAST, BRIAN'), (1, 'RAY, LAKE GROSS III'), (1, 'MCSALLY, MARTHA'), (1, 'KIEHNE, GARY'), (1, 'ACHADJIAN, KHATCHIK'), (1, 'SCHULTZ, DEBBIE WASSERMAN'), (1, 'LONNIE, CAMPBEL'), (1, 'SUKHIA, KEN'), (1, 'KITTS, DEREK'), (1, 'OSSOFF, JONATHAN'), (1, 'HILLARY CLINTON, RUSS FEINGOLD'), (1, 'CLINTER, HILLARY'), (1, 'CAROLL, MORGAN'), (1, 'PLUMB, JOHN'), (1, 'SEAN, FLYNN'), (1, 'DONALD, TRUMPH'), (1, 'TRUMP, DONAL'), (1, 'SMITH, LAMAR'), (1, 'MCCOLLUM, BETTY'), (1, 'DUFFY, SEAN')]\n" + ] + } + ], "source": [ "# Print to the console a list containing tuples of (count of oppositional expenditures, candidate names)\n", "print(oppositional_expenditures_by_candidate.collect())" @@ -153,9 +193,17 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 12, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[((39523, 1229), 'CLINTON, HILLARY'), ((16440, 362), 'STRICKLAND, TED'), ((9572, 61), 'ROSS, DEBORAH'), ((7577, 116), 'MCGINTY, KATHLEEN'), ((3316, 34), 'MURPHY, PATRICK'), ((3297, 278), 'KANDER, JASON'), ((1979, 2476), 'CLINTON, HILLARY RODHAM'), ((885, 27648), 'TRUMP, DONALD'), ((820, 6), 'DUCKWORTH, TAMMY'), ((682, 1432), 'RUBIO, MARCO'), ((673, 60), 'BUSH, JEB'), ((671, 31), 'CHRISTIE, CHRISTOPHER J.'), ((574, 99), \"CRUZ, RAFAEL EDWARD 'TED'\"), ((572, 15), 'SANDERS, BERNARD'), ((497, 6), 'CARSON, BEN'), ((452, 322), 'BAYH, EVAN'), ((403, 3), 'SANDERS, BERNIE'), ((398, 29), 'CRUZ, TED'), ((307, 189), 'MASTO, CATHERINE CORTEZ'), ((257, 8), 'GLENN, DARRYL'), ((242, 0), \"CRUZ, RAFAEL 'TED'\"), ((223, 27), 'JOHNSON, RON'), ((198, 853), 'TRUMP, DONALD J'), ((191, 9), 'MCGINTY, KATIE'), ((185, 0), 'RODHAM CLINTON, HILLARY'), ((181, 34), 'KASICH, JOHN R'), ((177, 29), 'CRUZ, RAFAEL EDWARD TED'), ((172, 166), 'CORTEZ MASTO, CATHERINE'), ((168, 288), 'MCGINTY, KATHLEEN ALANA'), ((153, 255), 'HECK, JOE'), ((153, 18), 'PAUL, RAND'), ((149, 16), 'FIORINA, CARLY'), ((148, 30), 'FEINGOLD, RUSS'), ((119, 12715), 'PORTMAN, ROB'), ((117, 53), 'HASSAN, MARGARET WOOD'), ((113, 0), 'LEE, MIKE'), ((110, 16), 'LOVE, MIA'), ((105, 1997), 'TRUMP, DONALD J.'), ((99, 1634), 'BLUNT, ROY'), ((99, 12), 'WALKER, SCOTT'), ((98, 75), 'TOOMEY, PATRICK JOSEPH'), ((97, 32), 'KIHUEN, RUBEN'), ((92, 4), 'CORTEZ-MASTO, CATHERINE'), ((91, 15), 'GRAHAM, LINDSEY'), ((88, 213), 'MURPHY, PATRICK E'), ((83, 8801), 'BURR, RICHARD'), ((82, 5), 'DRISKELL, GRETCHEN'), ((81, 175), 'ROSS, DEBORAH K'), ((81, 66), 'CLINTON, HILARY'), ((80, 106), 'HURD, WILLIAM'), ((74, 34), 'VERNON, MONICA'), ((73, 3), 'CAMPBELL, FOSTER LONNNIE II'), ((69, 17), 'KIRKPATRICK, ANN LEILA'), ((68, 44), 'CURBELO, CARLOS'), ((65, 0), 'SCOTT, TIMOTHY E'), ((63, 0), 'CLINTON, HILLARY RODHAM / K'), ((62, 4), 'JOHNSON, GARY'), ((61, 57), 'ASHFORD, BRAD'), ((61, 57), 'AYOTTE, KELLY A'), ((59, 27), 'JOHNSON, RONALD HAROLD'), ((58, 27), 'WARD, KELLI'), ((58, 0), 'VAN HOLLEN, CHRIS'), ((55, 0), 'DESANTIS, RONALD'), ((53, 24), 'HASSAN, MARGARET'), ((52, 7), 'AYOTTE, KELLY A.'), ((52, 0), 'JAYAPAL, PRAMILA'), ((51, 6), 'STUTZMAN, MARLIN'), ((51, 0), 'GALLAGHER, MIKE'), ((50, 2), 'JINDAL, BOBBY'), ((49, 2663), 'TOOMEY, PATRICK'), ((48, 50), 'BENNETT, LUANN'), ((48, 33), 'GALLEGO, PETE'), ((47, 0), 'HOEBER, AMIE'), ((45, 11), 'EGGMAN, MICHAEL'), ((45, 0), \"O'MALLEY, MARTIN\"), ((44, 1), 'MAST, BRIAN'), ((44, 0), 'SCHNEIDER, BRAD'), ((43, 25), 'NELSON, TOM'), ((43, 22), 'CRUZ, RAFAEL'), ((41, 0), 'APPLEGATE, DOUG'), ((39, 29), 'CARBAJAL, SALUD'), ((39, 16), 'DOLD, ROBERT'), ((39, 13), 'HUCKABEE, MIKE'), ((39, 0), 'CRANE, MICHAEL ROBERT'), ((38, 2), 'GOTTHEIMER, JOSH'), ((38, 1), 'HILLARY, CLINTON'), ((38, 0), 'VELAZQUEZ, NYDIA'), ((37, 44), 'FEINGOLD, RUSSELL'), ((36, 7), 'SHEA-PORTER, CAROL'), ((36, 0), 'DOLD, ROBERT JAMES JR'), ((35, 197), 'FEINGOLD, RUSSELL DANA'), ((35, 0), 'SZELIGA, KATHY'), ((34, 14), 'MCCAIN, JOHN S'), ((33, 13), 'CAFORIO, BRYAN'), ((33, 10), 'DAVIDSON, WARREN'), ((33, 1), 'HILLARY CLINTON, RUSS FEINGOLD'), ((32, 4), 'GAETZ, MATT'), ((31, 186), 'AYOTTE, KELLY'), ((31, 7), 'MURPHY, STEPHANIE'), ((31, 0), 'MARSHALL, ROGER W.'), ((30, 17), 'HOLLINGSWORTH, TREY'), ((29, 3), 'NEGRON, REBECCA'), ((28, 20), 'THOMAS, MARY'), ((27, 122), 'MASTO, CATHERINE'), ((27, 28), 'DENHAM, JEFF'), ((27, 0), 'REED, THOMAS W II'), ((26, 28), 'HUELSKAMP, TIMOTHY A REPRESENTA'), ((26, 22), 'TED, STRICKLAND'), ((26, 16), 'KENNEDY, JOHN NEELY'), ((26, 6), 'SCHRADER, KURT'), ((26, 0), 'STEFANIK, ELISE M.'), ((25, 152), 'CARROLL, MORGAN'), ((25, 48), 'YOUNG, DAVID'), ((25, 8), 'HUERTA, EMILIO'), ((25, 0), 'KUSTER, ANN MCLANE'), ((25, 0), 'WILLIS, COLM'), ((25, 0), 'DIANE, CHISESI'), ((24, 2), 'EDWARDS, DONNA FERN'), ((24, 0), 'BUDD, THEODORE P MR.'), ((23, 0), 'PENA-MELNYK, JOSELINE'), ((23, 0), 'WASSERMAN SCHULTZ, DEBBIE'), ((23, 0), 'CLINTON, CLINTON'), ((22, 472), 'YOUNG, TODD'), ((22, 9), 'COFFMAN, MIKE'), ((22, 0), 'PG, SITTENFELD'), ((22, 0), 'FERGUSON, DREW'), ((21, 19), 'FAREED, JUSTIN'), ((21, 17), 'BENNET, MICHAEL F'), ((21, 15), 'BACON, DONALD'), ((21, 0), 'JOHNSON, JAMES'), ((21, 0), 'PERRY, JAMES R (RICK)'), ((20, 79), 'TARKANIAN, DANNY'), ((20, 39), 'PAULSEN, ERIK'), ((20, 19), 'MCCAIN, JOHN'), ((20, 0), 'SANTORUM, RICHARD J.'), ((20, 0), 'ZINKE, RYAN K'), ((20, 0), 'MANESS, ROBERT L COL. RET'), ((19, 2), 'HARRIS, KAMALA'), ((19, 0), 'LEE, YUNGMAN'), ((19, 0), 'GUTIERREZ, ANA SOL'), ((19, 0), 'BIGGS, ANDY'), ((18, 23), 'SOTO, DARREN'), ((18, 21), 'CRAIG, ANGIE'), ((18, 8), 'DERICKSON, TIMOTHY'), ((18, 1), 'BARRAGAN, NANETTE'), ((18, 0), 'WILDER, SELLUS'), ((18, 0), 'BANKS, JAMES'), ((18, 0), 'MOONEY, ALEXANDER XAVIER'), ((17, 68), 'BLUM, RODNEY'), ((17, 25), 'SANTARSIERO, STEVEN'), ((17, 16), 'BERA, AMERISH'), ((17, 3), 'CARSON, BENJAMIN S SR MD'), ((17, 0), 'SASSE, BENJAMIN E'), ((17, 0), 'KENNEDY, JOHN'), ((17, 0), 'HILARY, CLINTON'), ((17, 0), 'ISAKSON, JOHNNY'), ((17, 0), 'WILLIAM BILL WELD, GARY JOHNSON /'), ((17, 0), 'EMMER, THOMAS EARL JR.'), ((16, 68), 'TENNEY, CLAUDIA'), ((16, 65), 'TEACHOUT, ZEPHYR'), ((16, 65), 'JONES, SCOTT'), ((16, 47), 'ROSEN, JACKY'), ((16, 46), 'CAIN, EMILY'), ((16, 43), 'HARDY, CRESENT'), ((16, 5), 'SESTAK, JOSEPH'), ((16, 3), 'TOTH, STEVE'), ((16, 2), 'GUINTA, FRANK'), ((16, 0), 'TED, CRUZ'), ((16, 0), 'COMSTOCK, BARBARA J.'), ((15, 65), 'DONALD, TRUMP'), ((15, 22), 'NOLAN, RICK'), ((15, 18), 'JOHNSON, RONALD'), ((15, 3), 'ROGERS, WENDY'), ((15, 0), 'MURKOWSKI, LISA'), ((15, 0), 'HUELSKAMP, TIMOTHY'), ((15, 0), 'CLINTON, ROSS, HILLARY'), ((15, 0), 'COOK, PAUL'), ((14, 25), 'NOLAN, RICHARD'), ((14, 18), 'GRASSLEY, CHARLES E SENATOR'), ((14, 11), 'VALADAO, DAVID'), ((14, 8), 'CORREA, LOU'), ((14, 5), 'COMSTOCK, BARBARA J HONORABLE'), ((14, 3), 'BANKS, JAMES E'), ((14, 0), 'RASKIN, JAMIE'), ((14, 0), 'CURBELO, CARLOS MR.'), ((14, 0), 'NORCROSS, DONALD'), ((14, 0), 'KATKO, JOHN M'), ((14, 0), 'GARCIA, JOSE'), ((13, 71), 'FITZPATRICK, BRIAN'), ((13, 43), 'MOWRER, JIM'), ((13, 37), 'BRADY, KEVIN'), ((13, 10), 'PATRICK, MURPHY'), ((13, 2), 'ZELDIN, LEE M'), ((13, 0), 'KATIE, MCGINTY'), ((13, 0), 'FLYNN, MICHAEL'), ((12, 152), 'TOOMEY, PAT'), ((12, 5), 'KIRK, MARK STEVEN'), ((12, 4), 'JOHNSON, JAMES MICHAEL'), ((12, 2), 'DUNN, NEAL'), ((12, 0), 'SHELBY, RICHARD'), ((12, 0), 'PATAKI, GEORGE E'), ((12, 0), 'MATTHEWS, KATHLEEN'), ((12, 0), 'SMUCKER, LLOYD'), ((12, 0), 'COLM, WILLIS'), ((12, 0), 'HUDSON, RICHARD'), ((11, 117), 'HECK, JOSEPH'), ((11, 83), 'COMSTOCK, BARBARA'), ((11, 50), 'BERGMAN, JOHN'), ((11, 28), 'DEACON, COLLEEN'), ((11, 12), 'CHRISTIE, CHRISTOPHER J'), ((11, 10), 'POLIQUIN, BRUCE L'), ((11, 0), 'SCHWARTZ, GAIL'), ((11, 0), 'MEEHAN, PATRICK L. MR.'), ((11, 0), 'DEMINGS, VAL'), ((11, 0), 'JUDGE, PATTY JEAN'), ((11, 0), 'SHIMKUS, JOHN'), ((10, 98), 'GARRETT, SCOTT'), ((10, 59), 'COFFMAN, MICHAEL'), ((10, 12), 'THRONE-HOLST, ANNA'), ((10, 8), ', '), ((10, 0), 'DOLD JR., ROBERT JAMES MR.'), ((10, 0), 'EDWARDS, DONNA'), ((9, 72), 'KNIGHT, STEVE'), ((9, 38), 'FASO, JOHN J. MR.'), ((9, 17), 'CARSON, BENJAMIN'), ((9, 12), 'YOUNG, TODD CHRISTOPHER'), ((9, 9), 'HALL, ISADORE'), ((9, 8), 'GALLAGHER, MICHAEL JOHN'), ((9, 0), 'CORREA, JOSE LUIS (LOU)'), ((9, 0), \"O'MALLEY, MARTIN JOSEPH\"), ((9, 0), \"SUNDHEIM, GEORGE 'DUF'\"), ((9, 0), 'CHABOT, PAUL R DR.'), ((9, 0), 'MARIE, DAVIS'), ((9, 0), 'FLEMING, JOHN C JR'), ((9, 0), 'BRIDENSTINE, JAMES FREDERICK'), ((9, 0), 'ROBERSON, MICHAEL'), ((9, 0), 'PETERS, SCOTT'), ((9, 0), 'ROCHESTER, LISA BLUNT'), ((8, 51), 'MARGARET, HASSAN'), ((8, 31), 'MYERS, KIM'), ((8, 12), 'HONDA, MIKE'), ((8, 9), 'RANDOLPH, SUSANNAH'), ((8, 8), 'MARSHALL, ROGER'), ((8, 6), 'BENNET, MICHAEL'), ((8, 5), 'CRANE, MICHAEL'), ((8, 2), 'KIRKPATRICK, ANN'), ((8, 0), 'ROSS, HENRY'), ((8, 0), 'YOUNG, DON'), ((8, 0), 'JOYCE, DAVID'), ((8, 0), 'DESANTIS, RONALD D.'), ((8, 0), 'DESANTIS, RONALD D'), ((8, 0), 'KAPLAN, ANNA'), ((8, 0), 'DUNN, JOE'), ((8, 0), 'GRASSLEY, CHUCK'), ((8, 0), 'KEMPER, NANCY JO'), ((8, 0), 'DAVIS, MARIE'), ((8, 0), 'MICA, JOHN L. MR.'), ((7, 80), 'MILLS, STEWART'), ((7, 25), 'KATHLEEN, MCGINTY'), ((7, 15), 'MARSHALL, ROGER W'), ((7, 14), 'BABEU, PAUL RAYMOND'), ((7, 7), 'GALLAGHER, MICHAEL'), ((7, 0), 'DUNN MD FACS, NEAL PATRICK'), ((7, 0), 'ROBY, MARTHA'), ((7, 0), 'MONTES, JOSEPH'), ((7, 0), 'MANDEL, JOSH'), ((7, 0), 'BERTRAND, RICK'), ((7, 0), 'STUTZMAN, MARLIN A.'), ((7, 0), 'TADDEO, ANNETTE'), ((7, 0), 'LAMALFA, DOUG'), ((7, 0), 'KHANNA, RO'), ((7, 0), 'APPLEGATE, DOUGLAS'), ((7, 0), 'COSTELLO, RYAN A'), ((7, 0), 'HOLDING, GEORGE E'), ((6, 52), 'GARCIA, JOE'), ((6, 40), 'CRIST, CHARLIE JOSEPH'), ((6, 11), 'HIGGINS, CAPTAIN CLAY'), ((6, 9), 'HARTMAN, CHRISTINA'), ((6, 3), 'FAYARD, CATHRYN CAROLINE'), ((6, 0), 'HUERTA, EMILIO JESUS MR.'), ((6, 0), 'JUNEAU, DENISE'), ((6, 0), 'LATTA, BOB'), ((6, 0), 'HIDALGO, JUAN M JR'), ((6, 0), 'FREEMAN, MARC BENJAMIN'), ((6, 0), 'KELSEY, BRIAN'), ((6, 0), 'MCMULLIN, EVAN'), ((6, 0), 'JOHNSON, LONNIE'), ((6, 0), 'PENA-MELNYK, JOSELINE A.'), ((6, 0), 'BRIDENSTINE, JAMES'), ((6, 0), 'ROGERS, MIKE'), ((6, 0), ', HILLARY'), ((6, 0), 'SANTARSIERO, STEVEN J'), ((6, 0), 'RUIZ, RAUL'), ((6, 0), 'TIPTON, SCOTT R.'), ((6, 0), 'PITTENGER, ROBERT'), ((6, 0), 'MCSALLY, MARTHA E. MS.'), ((6, 0), 'KEFALAS, CHRYSOVALANTIS P'), ((6, 0), 'WEST, BENJAMIN'), ((6, 0), 'SESSIONS, PETE'), ((6, 0), 'CLINTON, ROSS, HILLARY DEBORAH'), ((6, 0), 'MCCARTHY, KEVIN'), ((6, 0), 'TURNER, MICHAEL'), ((6, 0), 'MURRAY, PATTY'), ((6, 0), 'RENACCI, JAMES'), ((6, 0), 'ROSS, HILLARY, DEBORAH'), ((5, 51), 'BABEU, PAUL'), ((5, 37), 'KATKO, JOHN'), ((5, 34), 'ZELDIN, LEE'), ((5, 15), 'ANGELLE, SCOTT MR.'), ((5, 6), 'SHIMKUS, JOHN M'), ((5, 3), 'LAHOOD, DARIN'), ((5, 3), 'CHABOT, PAUL'), ((5, 3), 'GRAY, JIM P'), ((5, 2), 'GARRETT, SCOTT REP.'), ((5, 0), 'MCSALLY, MARTHA E'), ((5, 0), 'GOWDY, TREY'), ((5, 0), 'HOWARD, JULIA'), ((5, 0), 'LAWRENCE, BRENDA LULENAR'), ((5, 0), 'UPTON, FREDERICK STEPHEN'), ((5, 0), 'SMUCKER, LLOYD K'), ((5, 0), 'HOLLIDAY, ED'), ((5, 0), 'RAND, PAUL'), ((5, 0), 'GOSAR, PAUL'), ((5, 0), 'HILLARY, HILLARY'), ((5, 0), 'CRAIG, ANGELA'), ((5, 0), 'HILLARY RODHAM, CLINTON'), ((5, 0), 'DONOVAN, DAN'), ((5, 0), 'SANCHEZ, LORETTA'), ((5, 0), 'NEHLEN, PAUL III'), ((5, 0), 'COLE, TOM'), ((5, 0), 'NOLAN, RICHARD MICHAEL'), ((4, 31), 'YODER, KEVIN'), ((4, 9), 'SUOZZI, THOMAS'), ((4, 6), 'HOUCHIN, ERIN'), ((4, 3), 'CANOVA, TIMOTHY A.'), ((4, 0), 'STARR, MICHAEL BOB'), ((4, 0), 'TITUS, DINA'), ((4, 0), 'WALKINSHAW, BRADY PINERO'), ((4, 0), 'SUSIE, LEE'), ((4, 0), 'NEHLEN, PAUL'), ((4, 0), 'EVANS, DWIGHT'), ((4, 0), 'HOLDING, GEORGE E MR.'), ((4, 0), 'SHUSTER, BILL'), ((4, 0), 'PITTENGER, ROBERT M. HON.'), ((4, 0), 'MCCARTER, KYLE'), ((4, 0), 'DANNY, ZELAYA'), ((4, 0), 'SMITH, ADAM'), ((4, 0), \"O'HALLERAN, TOM\"), ((4, 0), 'PHILLIPS, GEORGE'), ((4, 0), 'WELLS, STEVEN'), ((4, 0), 'GARRETT, THOMAS'), ((4, 0), 'GRIFFIN, TAYLOR'), ((4, 0), 'ESPAILLAT, ADRIANO'), ((4, 0), 'ROUZER, DAVID'), ((4, 0), 'CONYERS, JOHN'), ((4, 0), 'JOHNSON, WILLIAM'), ((4, 0), 'STUTZMAN, MARLIN A'), ((4, 0), 'JOLLY, DAVID W.'), ((4, 0), 'DELBENE, SUZAN'), ((4, 0), 'MIKE, LEE'), ((4, 0), 'RUBIN, JOEL'), ((4, 0), 'GLENN, JON'), ((4, 0), 'HARTZLER, VICKY'), ((4, 0), 'TRUMP, DONALD J. / MICHAEL'), ((3, 811), 'KIRK, MARK'), ((3, 56), 'ELLMERS, RENEE'), ((3, 42), 'ISSA, DARRELL'), ((3, 33), 'LEWIS, JASON'), ((3, 23), 'JOE, HECK'), ((3, 13), 'DUCKWORTH, L TAMMY'), ((3, 10), 'BONOFF, TERRI'), ((3, 8), 'SIDIE, JAY'), ((3, 6), 'JOYCE, DAVE'), ((3, 5), 'ZINKE, RYAN'), ((3, 2), 'BERUFF, CARLOS'), ((3, 2), 'BOST, MICHAEL'), ((3, 0), 'SHELBY, RICHARD C'), ((3, 0), 'VERNON, MONICA W'), ((3, 0), 'TRUMO, DONALD'), ((3, 0), 'SINEMA, KYRSTEN'), ((3, 0), 'GREEN, GENE'), ((3, 0), 'KUO, PETER'), ((3, 0), 'BIRCHER, MARK'), ((3, 0), 'BOOZMAN, JOHN'), ((3, 0), 'DOLD, ROBERT JAMES MR JR'), ((3, 0), 'ZOPP, ANDREA'), ((3, 0), 'DUCKWORTH, L. TAMMY'), ((3, 0), 'PAPE, MICHAEL J'), ((3, 0), 'RAMIREZ, RITA'), ((3, 0), 'JONES, WALTER'), ((3, 0), 'BARNEY, SEAN'), ((3, 0), 'COSTELLO, RYAN'), ((3, 0), 'LUANN, BENNETT'), ((3, 0), 'LEE, MICHAEL'), ((3, 0), 'BERNIE 2016, BERNIE'), ((3, 0), 'FERGUSON IV, ANDERSON DREW'), ((3, 0), 'MCMULLIN, EVAN JOHNSON'), ((3, 0), 'DAVIS, RODNEY'), ((3, 0), 'ANGELLE, SCOTT'), ((3, 0), 'LINDBECK, STEVE'), ((3, 0), 'WILSON, FREDERICA'), ((3, 0), 'CORTEZ MASTO (NV), CATHERINE'), ((3, 0), 'KEYSER, JON'), ((3, 0), 'STEVE, KING'), ((3, 0), 'REED, TOM'), ((3, 0), 'GOODLATTE, BOB'), ((3, 0), 'STRAUSS, RAYMOND JOHN'), ((3, 0), 'WALLKER, SCOTT'), ((3, 0), 'NITO, PARRA'), ((3, 0), 'BEN, CARSON'), ((3, 0), 'LONNIE, JOHNSON'), ((3, 0), 'BYDLAK, REBEKAH'), ((3, 0), 'KINGSON, ERIC R. MR.'), ((3, 0), 'EDWARD, MALIN'), ((3, 0), 'HULTGREN, RANDY'), ((3, 0), 'CRIST, CHARLIE'), ((3, 0), 'PAT, TOOMEY'), ((3, 0), 'NICK, BAUMAN'), ((3, 0), 'HECK, DENNIS'), ((2, 41), 'KASICH, JOHN'), ((2, 22), 'TODD, YOUNG'), ((2, 15), 'BACON, DON'), ((2, 10), 'BERA, AMI'), ((2, 7), 'HASSAN, MAGGIE'), ((2, 6), 'CASPERSON, TOM'), ((2, 6), 'GRAYSON, DENA MD, PHD'), ((2, 5), 'DONALD J. TRUMP FOR PRESIDENT, INC.'), ((2, 4), 'MARCO, RUBIO'), ((2, 3), 'FLORES, LUCY'), ((2, 2), 'PELOSI, NANCY'), ((2, 0), 'DOLD, BOB'), ((2, 0), 'PARRA, NITO'), ((2, 0), 'MIA, LOVE'), ((2, 0), 'TIM, SCOTT'), ((2, 0), 'AGUILAR, PETE'), ((2, 0), 'BRAT, DAVID ALAN'), ((2, 0), 'LARSEN, RICK'), ((2, 0), '/ KAINE, CLINTON'), ((2, 0), 'LAPOLICE, ALAN'), ((2, 0), 'LUCIUS, CASEY'), ((2, 0), 'JOHNSON, RAN'), ((2, 0), 'ELIZABETH, CHENEY'), ((2, 0), 'LIZ, CHENEY'), ((2, 0), 'RAMSLAND, RUSSELL'), ((2, 0), 'ASHOOH, RICHARD E.'), ((2, 0), 'MURHPY, PATRICK'), ((2, 0), 'ARRINGTON, JODEY COOK'), ((2, 0), 'PARRISH, RAY'), ((2, 0), 'BUSTOS, CHERI'), ((2, 0), 'LONG, WENDY'), ((2, 0), 'CLINTON, KIRK'), ((2, 0), 'WALZ-ALLEN, MIRANDA'), ((2, 0), 'HOLDING, GEORGE E B'), ((2, 0), 'KYRSTEN, SINEMA'), ((2, 0), 'TAYLOR, SCOTT'), ((2, 0), 'MEEHAN, PATRICK'), ((2, 0), 'GLENN, DAVID'), ((2, 0), 'WAKELY, THOMAS MR.'), ((2, 0), 'MCMULLIN, DAVID'), ((2, 0), 'CASTLE, DARRELL'), ((2, 0), 'GREEN, RAYMOND'), ((2, 0), 'WRIGHT, KEITH'), ((2, 0), \"O'CONNOR, SHAWN PATRICK\"), ((2, 0), 'TAKANO, MARK'), ((2, 0), 'JAWANDO, WILL'), ((2, 0), 'WRIGHT, KEITH L T'), ((2, 0), 'NEWMAN, MARIE'), ((2, 0), 'JONES, WALTER B.'), ((2, 0), 'BUDD, THEODORE'), ((2, 0), 'MORAN, JERRY'), ((2, 0), 'KILMER, DEREK'), ((2, 0), 'SPEIER, JACKIE'), ((2, 0), 'KINZINGER, ADAM'), ((2, 0), 'ROS-LEHTINEN, ILEANA THE HON.'), ((2, 0), 'SHUSTER, WILLIAM MR.'), ((2, 0), 'MCMULLIN / NATHAN DANIEL, EVAN JOHNSON'), ((2, 0), 'GRIFFITH, MORGAN'), ((2, 0), 'UPTON, FREDERICK'), ((2, 0), 'AYOTTE, KELLEY'), ((2, 0), 'HEINZ, MATTHEW G.'), ((2, 0), 'POCAN, MARK'), ((2, 0), 'RON, DESANTIS'), ((2, 0), 'CHARLES, FERRY'), ((2, 0), 'GALLEGOS, PETE'), ((2, 0), 'CHISESI, DIANE'), ((2, 0), 'LAHOOD, DARIN MCKAY'), ((2, 0), 'ROSKAM, PETER'), ((2, 0), 'COMER, JAMES'), ((2, 0), 'DONALD TRUMP, MIKE PENCE'), ((2, 0), 'BERGMAN, JACK'), ((2, 0), 'BAUCUM, RALPH'), ((2, 0), 'CLINTON / KAINE, HILLARY RODHAM / TIM'), ((2, 0), 'FLEMING, JOHN'), ((2, 0), 'GARRETT, E SCOTT'), ((2, 0), 'SUOZZI, TOM'), ((2, 0), 'DOLD, JR., ROBERT J.'), ((2, 0), 'FETTERMAN, JOHN'), ((1, 88), 'POLIQUIN, BRUCE'), ((1, 67), 'FASO, JOHN'), ((1, 54), 'BABINEC, MARTIN'), ((1, 32), 'GOSAR, PAUL ANTHONY'), ((1, 18), 'CHRISTIE, CHRIS'), ((1, 16), 'RYAN, PAUL'), ((1, 9), 'GRAYSON, DENA'), ((1, 8), 'ROONEY, FRANCIS'), ((1, 4), 'DEBORAH, ROSS'), ((1, 4), 'SCHNEIDER, BRADLEY SCOTT'), ((1, 3), 'ALLEN, JASON'), ((1, 2), 'GENE, GREEN'), ((1, 2), 'MILLS, THOMAS'), ((1, 1), 'KIEHNE, GARY'), ((1, 1), 'MCSALLY, MARTHA'), ((1, 1), 'PLUMB, JOHN'), ((1, 0), 'GLENN, MANYA'), ((1, 0), 'JOHNSON, ESTELLE'), ((1, 0), 'JOHNSON, RED'), ((1, 0), 'BISHOP, MIKE'), ((1, 0), 'WELLS, STEVE'), ((1, 0), 'FAYARD, CATHRYN'), ((1, 0), 'SHAPIRO, JOSH'), ((1, 0), 'GARY, JOHNSON'), ((1, 0), 'WARREN, STEWART'), ((1, 0), 'MULLIN, MARKWAYNE'), ((1, 0), 'SMITH, CHRISTOPHER'), ((1, 0), 'HECK, DENNY'), ((1, 0), 'ADAMS, ALMA SHEALEY'), ((1, 0), 'EDWARD, CRUZ'), ((1, 0), 'RAFAEL, CRUZ'), ((1, 0), 'TENNEY, CLAUDIE'), ((1, 0), 'BYRNE, BRADLEY'), ((1, 0), 'HILLARY RODHAM CLINTON, RUSS FEINGOLD'), ((1, 0), 'MCTEAGUE, DAVE'), ((1, 0), 'ROS-LEHTINEN, ILEANA'), ((1, 0), 'GLEN, SETH'), ((1, 0), 'HALL, ISAHORE'), ((1, 0), 'TRUMP, DONALD J. / M. PENCE'), ((1, 0), 'REICHERT, DAVE'), ((1, 0), 'CLINTON, HILLLARY'), ((1, 0), 'MASSIE, THOMAS H.'), ((1, 0), 'KUSTER, ANN'), ((1, 0), 'KYLE, MCCARTER'), ((1, 0), 'BARKSDALE, JAMES FREEMAN'), ((1, 0), 'CLINTON / SUOZZI / RICE/ SCHUM, HILLARY'), ((1, 0), 'CLINTON/SUOZZI/RICE/SCHUMER, HILLARY/TOM/KATHELEE'), ((1, 0), 'CHENEY, ELIZABETH'), ((1, 0), 'MOORE, GWENDOLYNNE'), ((1, 0), 'DAVIS, BRUCE'), ((1, 0), 'MCNEIL, JOHN P'), ((1, 0), 'PRICE, DAVID'), ((1, 0), 'LOUIE, GOHMERT'), ((1, 0), 'KHOURI, TONIA'), ((1, 0), 'TREY, GOWDY'), ((1, 0), 'J, RON'), ((1, 0), 'VALADAO, DAVID.'), ((1, 0), 'SCOTT, ROBERT'), ((1, 0), 'RUSSEL, FEINGOLD'), ((1, 0), 'ROBERT, DOLD'), ((1, 0), 'PATAKI, GEORGE'), ((1, 0), 'GLENN, ARRYL'), ((1, 0), 'JOOHNSON, RON'), ((1, 0), 'GRAYSON, ALAN MARK'), ((1, 0), 'MCMULIN, EVAN'), ((1, 0), 'GRABELLE, JUSTIN M'), ((1, 0), 'FLYNN, MIKE'), ((1, 0), 'ELIJAH, MANLEY'), ((1, 0), 'MEADOWS, MARK R'), ((1, 0), 'TRUMP, DONLAD'), ((1, 0), 'CATHERINE, CORTEZ MASTO'), ((1, 0), 'QUIST, ROB'), ((1, 0), 'OLSZEWSKI, AL'), ((1, 0), 'JAPAYAL, PRAMILA'), ((1, 0), 'DONALS, TRUMP'), ((1, 0), 'TRUMP, DONALS'), ((1, 0), 'ELBERT, GUILLORY'), ((1, 0), 'FRANK, BEN'), ((1, 0), 'CONNOLLY, GERALD E'), ((1, 0), 'BRAD, ASHFORD'), ((1, 0), 'LOBIONDO, FRANK A.'), ((1, 0), 'SANTORUM, RICHARD'), ((1, 0), 'SCHUMER, CHARLES'), ((1, 0), 'LAW, ALEXANDER'), ((1, 0), 'KATIE, MCGINTY'), ((1, 0), 'RON, JOHNSON'), ((1, 0), 'LANCE, LEONARD'), ((1, 0), 'DIANE, CHISSESI'), ((1, 0), 'BACKER, DAN'), ((1, 0), 'DICIANNI, PETER'), ((1, 0), \"DEMINGS, VALDEZ 'VAL'\"), ((1, 0), 'TOWNSEND, BRYAN'), ((1, 0), 'CLINTON/SUOZZI/RICE/SCHUMER, '), ((1, 0), 'BRANNON, JOSH'), ((1, 0), 'DERICKSON, T'), ((1, 0), 'CRAIG, ANGELA DAWN'), ((1, 0), 'GERRITSON, REBECCA'), ((1, 0), 'GOHMERT, LOUIE'), ((1, 0), 'BEYER, DONALD STERNOFF'), ((1, 0), 'MOORE, GWEN S'), ((1, 0), 'ERIK, PAULSEN'), ((1, 0), 'COPE, CLAY'), ((1, 0), 'GLENN, SETH'), ((1, 0), 'WALTZ, BRENT'), ((1, 0), 'SHAPINO, JOSH'), ((1, 0), 'WALSER, JASON'), ((1, 0), 'GARCIA, JOSE ANTONIO'), ((1, 0), 'CCARSON, BEN'), ((1, 0), 'COTTON, THOMAS'), ((1, 0), 'LAND, TERRI LYNN'), ((1, 0), 'JOHNSON, MICHAEL'), ((1, 0), 'AMERISH, BERA'), ((1, 0), 'CORTEZ-MASTOS, CATHERINE'), ((1, 0), 'PAULSEN, ERIC'), ((1, 0), 'GLENN, DARRY'), ((1, 0), 'GLENN, SHAWN'), ((1, 0), 'JOHSON, RON'), ((1, 0), 'LAYENDECKER, LEVANA'), ((1, 0), 'ASHOOH, RICHARD'), ((1, 0), 'LONG, BILLY'), ((1, 0), 'GORDON, KINZLER'), ((1, 0), 'DANIEL, MUROFF'), ((1, 0), 'CLLINTON, HILLARY'), ((1, 0), 'SLAUGHTER, LOUISE'), ((1, 0), 'BRYSON, RICK'), ((1, 0), 'HURD, WILL'), ((1, 0), 'DENT, CHARLES'), ((1, 0), 'GREGORY, DUWAYNE'), ((1, 0), 'STEFANIK, ELISE M'), ((1, 0), 'COSTA, JIM'), ((1, 0), 'MACARTHUR, THOMAS'), ((1, 0), 'LOFGREN, ZOE'), ((1, 0), ', HILLARY / TOM / KATH'), ((1, 0), 'MIKE, JOHNSON'), ((1, 0), 'WHITWELL, ROBERT'), ((1, 0), 'DASTO, CATHERINE COR'), ((1, 0), 'BOST, MIKE'), ((1, 0), 'SHAUGHNESSY, NAUGHTON'), ((1, 0), 'VARIOUS REPUBLICAN, CANDIDATES'), ((1, 0), 'MAGGIE, HASSAN'), ((1, 0), 'RUSS, FEINGOLD'), ((1, 0), 'CLINTON (NV), HILLARY'), ((1, 0), 'BONGINO, DANIEL J'), ((1, 0), 'GLENN, DARR'), ((1, 0), 'DAVIS, RODNEY L'), ((1, 0), 'HUELSKAMP, TIMOTHY A'), ((1, 0), 'TUMP, DONALD'), ((1, 0), 'PETERSON, COLLIN CLARK'), ((1, 0), 'CLEMENTS, PAUL'), ((1, 0), 'KELLY, ROBIN L.'), ((1, 0), 'NOLAN, RICHARD M.'), ((1, 0), 'CHABOT, STEVE'), ((1, 0), 'HOLDING, GEORGE'), ((1, 0), 'CLINTON, '), ((1, 0), 'CLINTON/SUOZZI/RICE/SCHUMER, HILLARY'), ((1, 0), 'JAMES, JORDAN'), ((1, 0), 'JAMES, LANKFORD'), ((1, 0), 'KELLI, WARD'), ((1, 0), 'ROSENBAUM, ANDREW'), ((1, 0), 'KRISHNAMOORTHI, S. RAJA'), ((1, 0), 'ADRIAN, GARCIA'), ((1, 0), \"ANTHONY, D'ORAZIO\"), ((1, 0), 'WARREN, WEST'), ((0, 67), 'CATHERINE, MASTO'), ((0, 58), 'PERKINS, RANDY'), ((0, 51), 'COFFMAN, MIKE REP.'), ((0, 48), 'JOSEPH, PATRICK'), ((0, 39), 'HUELSKAMP, TIMOTHY A.'), ((0, 36), 'DUNN, NEAL PATRICK MD'), ((0, 34), 'TRUMP, '), ((0, 33), 'PATRICK, TOOMEY'), ((0, 32), 'JOHNSON, LON'), ((0, 31), 'ROY, BLUNT'), ((0, 31), 'FERGUSON, ANDERSON DREW IV'), ((0, 31), 'BIRCH, BAYH'), ((0, 31), 'ELLMERS, RENEE JACISIN'), ((0, 29), 'TRUMP, TRUMP'), ((0, 28), 'BENNETT, MICHAEL'), ((0, 27), 'MICA, JOHN'), ((0, 26), 'KELLY, AYOTTE'), ((0, 25), 'SCHNEIDER, BRADLEY'), ((0, 25), 'ROB, PORTMAN'), ((0, 23), 'YODER, SHELLI'), ((0, 23), 'RICHARD, BURR'), ((0, 22), 'FASO, JOHN J.'), ((0, 21), 'TINNEY, CLAUDIA'), ((0, 21), 'BOUSTANY, CHARLES W.'), ((0, 20), 'THEODORE, STRICKLAND'), ((0, 19), 'KASICH, JOHN R.'), ((0, 17), 'TOOMEY (PA), PAT'), ((0, 17), 'CAMPBELL, FOSTER'), ((0, 17), 'HECK (NV), JOE'), ((0, 16), 'FLEMING, JOHN C.'), ((0, 15), 'MURPHY, PATRICK E.'), ((0, 15), 'HEANEY, ANDREW'), ((0, 15), 'JOLLY, DAVID'), ((0, 15), 'DITTMAR, JANE'), ((0, 15), 'JASON, KANDER'), ((0, 15), 'TOM, KIP E'), ((0, 15), 'JONES, CHRISTINE'), ((0, 14), 'WALBERG, TIMOTHY'), ((0, 13), 'SANTARSIERO, STEVE'), ((0, 13), 'OWENS, H DOUGLAS'), ((0, 13), 'TIPTON, SCOTT'), ((0, 12), 'TRUMP, TRUMP'), ((0, 12), 'GARCIA, ADRIAN'), ((0, 12), 'MASTRO, CATHERINE'), ((0, 11), 'GOSS, CHAUNCEY'), ((0, 11), 'KURT, SCHRADER'), ((0, 11), 'ZOELLER, GREGORY FRANCIS MR.'), ((0, 9), 'BONGINO, DANIEL'), ((0, 9), 'SCHNEIDER, HELENE'), ((0, 9), 'SCHWARTZ, GALE'), ((0, 9), 'HALVORSON, ARTHUR L'), ((0, 8), 'BEAGLE, WILLIAM'), ((0, 8), 'CLINTON/KAINE, HILLARY RODHAM/TIMOT'), ((0, 8), 'DOLD, JR., ROBERT JAMES'), ((0, 8), 'RUTHERFORD, JOHN'), ((0, 7), 'RUBIO (FL), MARCO'), ((0, 7), '/ PENCE, TRUMP'), ((0, 7), 'RUSSELL, FEINGOLD'), ((0, 7), 'BLUNT (MO), ROY'), ((0, 7), 'TRUMP, TRUMP TRUMP'), ((0, 6), 'YOUNG (IN), TODD CHRISTOPHER'), ((0, 6), 'BECCARO, THOMAS DEL'), ((0, 6), 'LONNIE, CAMPBELL'), ((0, 6), 'MASTRO, CATHERINE CORTEZ'), ((0, 6), 'CAMPBELL, FOSTER LONNIE II'), ((0, 6), 'SHKRELI, SUZANNA'), ((0, 6), 'REED, THOMAS'), ((0, 5), 'RYAN, PAUL D.'), ((0, 5), 'TANZLER, HANS'), ((0, 5), 'STEVEN, SANTARSIERO'), ((0, 5), 'BROWN, LIZ'), ((0, 5), 'EVANS, BAYH'), ((0, 5), ', TRUMP'), ((0, 5), 'JUDGE, PATTY'), ((0, 4), 'AYOTTE ((NH), KELLY'), ((0, 4), 'CLINTON, HILLARY CLINTON/K'), ((0, 4), 'FLINN, GEORGE S DR JR'), ((0, 4), 'HEINZ, MATT'), ((0, 4), 'BRANNON, GREGORY'), ((0, 3), 'FIORE, MICHELE'), ((0, 3), 'OWENS, DOUG'), ((0, 3), 'MAXWELL, CHIP'), ((0, 3), 'MCMICHAEL, CRAIG'), ((0, 3), 'DEAN, ANDRE'), ((0, 3), 'MARTINS, JACK'), ((0, 3), 'MITCHELL, PAUL III'), ((0, 3), 'SCHUMER, CHARLES E'), ((0, 3), 'BOUSTANY, CHARLES W JR DR'), ((0, 3), 'HALVORSON, ARTHUR'), ((0, 2), 'DONALD J., TRUMP'), ((0, 2), 'GRIFFIN, WILLIAM TAYLOR'), ((0, 2), 'CHRISTENSEN, GORDON'), ((0, 2), 'BIRCH, BAY'), ((0, 2), 'MURPHY, CHRISTOPHER S'), ((0, 2), 'TRUMP (IN), DONALD J.'), ((0, 2), 'TRUMP (MO), DONALD J.'), ((0, 2), 'KING, STEVE'), ((0, 2), 'FRANK, GUINTA'), ((0, 2), 'CANO, FERNANDO'), ((0, 2), 'NEU, JAMES'), ((0, 2), 'JONES, ROGER STARNER'), ((0, 2), 'ELDRIDGE, CONNER'), ((0, 2), 'DEGNER, KAI'), ((0, 2), 'KLEPINGER, ROBERT'), ((0, 2), 'MUNDY, KEITH'), ((0, 2), 'BURR (NC), RICHARD'), ((0, 2), 'MCCONNELL, JONATHAN EDWARD'), ((0, 2), 'MCCAIN, JOHN S.'), ((0, 2), 'CATHERINE, MAST0'), ((0, 2), 'HUELSKAMP, TIM'), ((0, 2), 'DERRICK, MIKE'), ((0, 2), 'SCHAKOWSKY, JANICE D'), ((0, 2), 'LASEE, FRANK'), ((0, 2), 'PERRY, RICK'), ((0, 2), 'JOHN, MCCAIN'), ((0, 1), 'PAUL, RYAN'), ((0, 1), 'CHRISTOPHER, YOUNG'), ((0, 1), 'WAGNER, ANN L.'), ((0, 1), 'DUKE, DAVID'), ((0, 1), 'HILL, JAMES FRENCH'), ((0, 1), 'CRUZ, RAFAEL EDWARD'), ((0, 1), 'BONNOFF, TERRI'), ((0, 1), 'JOLLY, DAVID W'), ((0, 1), 'MCGINTY, KATHLLEEN'), ((0, 1), 'CARROL, MORGAN'), ((0, 1), 'DELANEY, JOHN K'), ((0, 1), 'KITTS, DERRICK'), ((0, 1), 'PORTMA, ROB'), ((0, 1), 'GLIDEWELL, PET'), ((0, 1), 'FRANK, ROBERT'), ((0, 1), 'PETERS, GARY'), ((0, 1), 'REED, WENDY'), ((0, 1), 'PENCE, TRUMP /'), ((0, 1), 'CLINTON, HILL'), ((0, 1), 'PRYOR, MARK LUNSFORD'), ((0, 1), 'LANDRIEU, MARY L'), ((0, 1), 'RAY, LAKE GROSS III'), ((0, 1), 'ACHADJIAN, KHATCHIK'), ((0, 1), 'SCHULTZ, DEBBIE WASSERMAN'), ((0, 1), 'LONNIE, CAMPBEL'), ((0, 1), 'SUKHIA, KEN'), ((0, 1), 'KITTS, DEREK'), ((0, 1), 'OSSOFF, JONATHAN'), ((0, 1), 'CLINTER, HILLARY'), ((0, 1), 'CAROLL, MORGAN'), ((0, 1), 'SEAN, FLYNN'), ((0, 1), 'DONALD, TRUMPH'), ((0, 1), 'TRUMP, DONAL'), ((0, 1), 'SMITH, LAMAR'), ((0, 1), 'MCCOLLUM, BETTY'), ((0, 1), 'DUFFY, SEAN'), ((0, 0), 'GERALD, JENNINGS')]\n" + ] + } + ], "source": [ "# Return a list of ((supportive expenditures, oppositional expenditures), CandidateName)\n", "# Sorted by greatest number of supportive expenditures\n", @@ -186,9 +234,17 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 13, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[(15691.8, 'ROSS, DEBORAH'), (13666.67, 'DUCKWORTH, TAMMY'), (13433.33, 'SANDERS, BERNIE'), (9752.94, 'MURPHY, PATRICK'), (8283.33, 'CARSON, BEN'), (6531.9, 'MCGINTY, KATHLEEN'), (4541.44, 'STRICKLAND, TED'), (4400.0, 'MAST, BRIAN'), (3813.33, 'SANDERS, BERNARD'), (3800.0, 'HILLARY, CLINTON'), (3300.0, 'HILLARY CLINTON, RUSS FEINGOLD'), (3215.87, 'CLINTON, HILLARY'), (3212.5, 'GLENN, DARRYL'), (2500.0, 'JINDAL, BOBBY'), (2433.33, 'CAMPBELL, FOSTER LONNNIE II'), (2300.0, 'CORTEZ-MASTO, CATHERINE'), (2164.52, 'CHRISTIE, CHRISTOPHER J.'), (2122.22, 'MCGINTY, KATIE'), (1900.0, 'GOTTHEIMER, JOSH'), (1800.0, 'BARRAGAN, NANETTE'), (1640.0, 'DRISKELL, GRETCHEN'), (1550.0, 'JOHNSON, GARY'), (1372.41, 'CRUZ, TED'), (1200.0, 'EDWARDS, DONNA FERN'), (1185.97, 'KANDER, JASON'), (1121.67, 'BUSH, JEB'), (966.67, 'NEGRON, REBECCA'), (950.0, 'HARRIS, KAMALA'), (931.25, 'FIORINA, CARLY'), (850.0, 'PAUL, RAND'), (850.0, 'STUTZMAN, MARLIN'), (825.93, 'JOHNSON, RON'), (825.0, 'WALKER, SCOTT'), (800.0, 'GAETZ, MATT'), (800.0, 'GUINTA, FRANK'), (742.86, 'AYOTTE, KELLY A.'), (687.5, 'LOVE, MIA'), (650.0, 'ZELDIN, LEE M'), (610.34, 'CRUZ, RAFAEL EDWARD TED'), (606.67, 'GRAHAM, LINDSEY'), (600.0, 'DUNN, NEAL'), (579.8, \"CRUZ, RAFAEL EDWARD 'TED'\"), (566.67, 'CARSON, BENJAMIN S SR MD'), (533.33, 'TOTH, STEVE'), (532.35, 'KASICH, JOHN R'), (514.29, 'SHEA-PORTER, CAROL'), (500.0, 'ROGERS, WENDY'), (493.33, 'FEINGOLD, RUSS'), (466.67, 'BANKS, JAMES E'), (442.86, 'MURPHY, STEPHANIE'), (433.33, 'SCHRADER, KURT'), (409.09, 'EGGMAN, MICHAEL'), (405.88, 'KIRKPATRICK, ANN LEILA'), (400.0, 'KIRKPATRICK, ANN'), (330.0, 'DAVIDSON, WARREN'), (320.0, 'SESTAK, JOSEPH'), (312.5, 'HUERTA, EMILIO'), (303.12, 'KIHUEN, RUBEN'), (300.0, 'HUCKABEE, MIKE'), (300.0, 'JOHNSON, JAMES MICHAEL'), (280.0, 'COMSTOCK, BARBARA J HONORABLE'), (253.85, 'CAFORIO, BRYAN'), (250.0, 'GARRETT, SCOTT REP.'), (244.44, 'COFFMAN, MIKE'), (243.75, 'DOLD, ROBERT'), (242.86, 'MCCAIN, JOHN S'), (242, \"CRUZ, RAFAEL 'TED'\"), (240.0, 'KIRK, MARK STEVEN'), (225.0, 'DERICKSON, TIMOTHY'), (220.83, 'HASSAN, MARGARET'), (220.75, 'HASSAN, MARGARET WOOD'), (218.52, 'JOHNSON, RONALD HAROLD'), (217.65, 'VERNON, MONICA'), (214.81, 'WARD, KELLI'), (200.0, 'FAYARD, CATHRYN CAROLINE'), (195.45, 'CRUZ, RAFAEL'), (185, 'RODHAM CLINTON, HILLARY'), (176.47, 'HOLLINGSWORTH, TREY'), (175.0, 'CORREA, LOU'), (172.0, 'NELSON, TOM'), (166.67, 'LAHOOD, DARIN'), (166.67, 'CHABOT, PAUL'), (166.67, 'GRAY, JIM P'), (162.5, 'KENNEDY, JOHN NEELY'), (162.43, 'MASTO, CATHERINE CORTEZ'), (160.0, 'CRANE, MICHAEL'), (154.55, 'CURBELO, CARLOS'), (150.0, 'BERUFF, CARLOS'), (150.0, 'BOST, MICHAEL'), (145.45, 'GALLEGO, PETE'), (140.37, 'BAYH, EVAN'), (140.0, 'THOMAS, MARY'), (140.0, 'BACON, DONALD'), (134.48, 'CARBAJAL, SALUD'), (133.33, 'BENNET, MICHAEL'), (133.33, 'CANOVA, TIMOTHY A.'), (130.67, 'TOOMEY, PATRICK JOSEPH'), (130.0, 'PATRICK, MURPHY'), (127.27, 'VALADAO, DAVID'), (125.0, ', '), (123.53, 'BENNET, MICHAEL F'), (122.73, 'CLINTON, HILARY'), (118.18, 'TED, STRICKLAND'), (113, 'LEE, MIKE'), (112.5, 'GALLAGHER, MICHAEL JOHN'), (110.53, 'FAREED, JUSTIN'), (110.0, 'POLIQUIN, BRUCE L'), (107.02, 'ASHFORD, BRAD'), (107.02, 'AYOTTE, KELLY A'), (106.25, 'BERA, AMERISH'), (105.26, 'MCCAIN, JOHN'), (103.61, 'CORTEZ MASTO, CATHERINE'), (100.0, 'HALL, ISADORE'), (100.0, 'MARSHALL, ROGER'), (100.0, 'GALLAGHER, MICHAEL'), (100.0, 'PELOSI, NANCY'), (100.0, 'KIEHNE, GARY'), (100.0, 'MCSALLY, MARTHA'), (100.0, 'PLUMB, JOHN'), (96.43, 'DENHAM, JEFF'), (96.0, 'BENNETT, LUANN'), (92.86, 'HUELSKAMP, TIMOTHY A REPRESENTA'), (91.67, 'CHRISTIE, CHRISTOPHER J'), (88.89, 'RANDOLPH, SUSANNAH'), (85.71, 'CRAIG, ANGIE'), (84.09, 'FEINGOLD, RUSSELL'), (83.33, 'JOHNSON, RONALD'), (83.33, 'THRONE-HOLST, ANNA'), (83.33, 'SHIMKUS, JOHN M'), (79.93, 'CLINTON, HILLARY RODHAM'), (78.26, 'SOTO, DARREN'), (77.78, 'GRASSLEY, CHARLES E SENATOR'), (75.47, 'HURD, WILLIAM'), (75.0, 'YOUNG, TODD CHRISTOPHER'), (68.18, 'NOLAN, RICK'), (68.0, 'SANTARSIERO, STEVEN'), (66.67, 'HONDA, MIKE'), (66.67, 'HARTMAN, CHRISTINA'), (66.67, 'HOUCHIN, ERIN'), (66.67, 'FLORES, LUCY'), (65, 'SCOTT, TIMOTHY E'), (63, 'CLINTON, HILLARY RODHAM / K'), (60.0, 'HECK, JOE'), (60.0, 'ZINKE, RYAN'), (58.33, 'MCGINTY, KATHLEEN ALANA'), (58, 'VAN HOLLEN, CHRIS'), (56.0, 'NOLAN, RICHARD'), (55, 'DESANTIS, RONALD'), (54.55, 'HIGGINS, CAPTAIN CLAY'), (52.94, 'CARSON, BENJAMIN'), (52.08, 'YOUNG, DAVID'), (52, 'JAYAPAL, PRAMILA'), (51.28, 'PAULSEN, ERIK'), (51, 'GALLAGHER, MIKE'), (50.0, 'BABEU, PAUL RAYMOND'), (50.0, 'JOYCE, DAVE'), (50.0, 'MARCO, RUBIO'), (50.0, 'GENE, GREEN'), (50.0, 'MILLS, THOMAS'), (47.63, 'RUBIO, MARCO'), (47, 'HOEBER, AMIE'), (46.67, 'MARSHALL, ROGER W'), (46.29, 'ROSS, DEBORAH K'), (45, \"O'MALLEY, MARTIN\"), (44.44, 'SUOZZI, THOMAS'), (44, 'SCHNEIDER, BRAD'), (41.31, 'MURPHY, PATRICK E'), (41, 'APPLEGATE, DOUG'), (40.0, 'DONALD J. TRUMP FOR PRESIDENT, INC.'), (39.29, 'DEACON, COLLEEN'), (39, 'CRANE, MICHAEL ROBERT'), (38, 'VELAZQUEZ, NYDIA'), (37.5, 'SIDIE, JAY'), (37.21, 'HARDY, CRESENT'), (36, 'DOLD, ROBERT JAMES JR'), (35.14, 'BRADY, KEVIN'), (35, 'SZELIGA, KATHY'), (34.78, 'CAIN, EMILY'), (34.04, 'ROSEN, JACKY'), (33.33, 'ANGELLE, SCOTT MR.'), (33.33, 'CASPERSON, TOM'), (33.33, 'GRAYSON, DENA MD, PHD'), (33.33, 'ALLEN, JASON'), (31, 'MARSHALL, ROGER W.'), (30.23, 'MOWRER, JIM'), (30.0, 'BONOFF, TERRI'), (28.57, 'HASSAN, MAGGIE'), (28.0, 'KATHLEEN, MCGINTY'), (27, 'REED, THOMAS W II'), (26, 'STEFANIK, ELISE M.'), (25.81, 'MYERS, KIM'), (25.32, 'TARKANIAN, DANNY'), (25, 'KUSTER, ANN MCLANE'), (25, 'WILLIS, COLM'), (25, 'DIANE, CHISESI'), (25.0, 'BLUM, RODNEY'), (25.0, 'DEBORAH, ROSS'), (25.0, 'SCHNEIDER, BRADLEY SCOTT'), (24.62, 'TEACHOUT, ZEPHYR'), (24.62, 'JONES, SCOTT'), (24, 'BUDD, THEODORE P MR.'), (23.68, 'FASO, JOHN J. MR.'), (23.53, 'TENNEY, CLAUDIA'), (23.21, 'TRUMP, DONALD J'), (23.08, 'DONALD, TRUMP'), (23.08, 'DUCKWORTH, L TAMMY'), (23, 'PENA-MELNYK, JOSELINE'), (23, 'WASSERMAN SCHULTZ, DEBBIE'), (23, 'CLINTON, CLINTON'), (22.13, 'MASTO, CATHERINE'), (22, 'PG, SITTENFELD'), (22, 'FERGUSON, DREW'), (22.0, 'BERGMAN, JOHN'), (21, 'JOHNSON, JAMES'), (21, 'PERRY, JAMES R (RICK)'), (20, 'SANTORUM, RICHARD J.'), (20, 'ZINKE, RYAN K'), (20, 'MANESS, ROBERT L COL. RET'), (20.0, 'BERA, AMI'), (19, 'LEE, YUNGMAN'), (19, 'GUTIERREZ, ANA SOL'), (19, 'BIGGS, ANDY'), (18.31, 'FITZPATRICK, BRIAN'), (18, 'WILDER, SELLUS'), (18, 'BANKS, JAMES'), (18, 'MOONEY, ALEXANDER XAVIER'), (17.77, 'FEINGOLD, RUSSELL DANA'), (17, 'SASSE, BENJAMIN E'), (17, 'KENNEDY, JOHN'), (17, 'HILARY, CLINTON'), (17, 'ISAKSON, JOHNNY'), (17, 'WILLIAM BILL WELD, GARY JOHNSON /'), (17, 'EMMER, THOMAS EARL JR.'), (16.95, 'COFFMAN, MICHAEL'), (16.67, 'AYOTTE, KELLY'), (16.45, 'CARROLL, MORGAN'), (16, 'TED, CRUZ'), (16, 'COMSTOCK, BARBARA J.'), (15.69, 'MARGARET, HASSAN'), (15, 'MURKOWSKI, LISA'), (15, 'HUELSKAMP, TIMOTHY'), (15, 'CLINTON, ROSS, HILLARY'), (15, 'COOK, PAUL'), (15.0, 'CRIST, CHARLIE JOSEPH'), (14.71, 'ZELDIN, LEE'), (14, 'RASKIN, JAMIE'), (14, 'CURBELO, CARLOS MR.'), (14, 'NORCROSS, DONALD'), (14, 'KATKO, JOHN M'), (14, 'GARCIA, JOSE'), (13.51, 'KATKO, JOHN'), (13.33, 'BACON, DON'), (13.25, 'COMSTOCK, BARBARA'), (13.04, 'JOE, HECK'), (13, 'KATIE, MCGINTY'), (13, 'FLYNN, MICHAEL'), (12.9, 'YODER, KEVIN'), (12.5, 'KNIGHT, STEVE'), (12.5, 'ROONEY, FRANCIS'), (12, 'SHELBY, RICHARD'), (12, 'PATAKI, GEORGE E'), (12, 'MATTHEWS, KATHLEEN'), (12, 'SMUCKER, LLOYD'), (12, 'COLM, WILLIS'), (12, 'HUDSON, RICHARD'), (11.54, 'GARCIA, JOE'), (11.11, 'GRAYSON, DENA'), (11, 'SCHWARTZ, GAIL'), (11, 'MEEHAN, PATRICK L. MR.'), (11, 'DEMINGS, VAL'), (11, 'JUDGE, PATTY JEAN'), (11, 'SHIMKUS, JOHN'), (10.2, 'GARRETT, SCOTT'), (10, 'DOLD JR., ROBERT JAMES MR.'), (10, 'EDWARDS, DONNA'), (9.8, 'BABEU, PAUL'), (9.4, 'HECK, JOSEPH'), (9.09, 'LEWIS, JASON'), (9.09, 'TODD, YOUNG'), (9, 'CORREA, JOSE LUIS (LOU)'), (9, \"O'MALLEY, MARTIN JOSEPH\"), (9, \"SUNDHEIM, GEORGE 'DUF'\"), (9, 'CHABOT, PAUL R DR.'), (9, 'MARIE, DAVIS'), (9, 'FLEMING, JOHN C JR'), (9, 'BRIDENSTINE, JAMES FREDERICK'), (9, 'ROBERSON, MICHAEL'), (9, 'PETERS, SCOTT'), (9, 'ROCHESTER, LISA BLUNT'), (8.75, 'MILLS, STEWART'), (8, 'ROSS, HENRY'), (8, 'YOUNG, DON'), (8, 'JOYCE, DAVID'), (8, 'DESANTIS, RONALD D.'), (8, 'DESANTIS, RONALD D'), (8, 'KAPLAN, ANNA'), (8, 'DUNN, JOE'), (8, 'GRASSLEY, CHUCK'), (8, 'KEMPER, NANCY JO'), (8, 'DAVIS, MARIE'), (8, 'MICA, JOHN L. MR.'), (7.89, 'TOOMEY, PAT'), (7.14, 'ISSA, DARRELL'), (7, 'DUNN MD FACS, NEAL PATRICK'), (7, 'ROBY, MARTHA'), (7, 'MONTES, JOSEPH'), (7, 'MANDEL, JOSH'), (7, 'BERTRAND, RICK'), (7, 'STUTZMAN, MARLIN A.'), (7, 'TADDEO, ANNETTE'), (7, 'LAMALFA, DOUG'), (7, 'KHANNA, RO'), (7, 'APPLEGATE, DOUGLAS'), (7, 'COSTELLO, RYAN A'), (7, 'HOLDING, GEORGE E'), (6.25, 'RYAN, PAUL'), (6.06, 'BLUNT, ROY'), (6, 'HUERTA, EMILIO JESUS MR.'), (6, 'JUNEAU, DENISE'), (6, 'LATTA, BOB'), (6, 'HIDALGO, JUAN M JR'), (6, 'FREEMAN, MARC BENJAMIN'), (6, 'KELSEY, BRIAN'), (6, 'MCMULLIN, EVAN'), (6, 'JOHNSON, LONNIE'), (6, 'PENA-MELNYK, JOSELINE A.'), (6, 'BRIDENSTINE, JAMES'), (6, 'ROGERS, MIKE'), (6, ', HILLARY'), (6, 'SANTARSIERO, STEVEN J'), (6, 'RUIZ, RAUL'), (6, 'TIPTON, SCOTT R.'), (6, 'PITTENGER, ROBERT'), (6, 'MCSALLY, MARTHA E. MS.'), (6, 'KEFALAS, CHRYSOVALANTIS P'), (6, 'WEST, BENJAMIN'), (6, 'SESSIONS, PETE'), (6, 'CLINTON, ROSS, HILLARY DEBORAH'), (6, 'MCCARTHY, KEVIN'), (6, 'TURNER, MICHAEL'), (6, 'MURRAY, PATTY'), (6, 'RENACCI, JAMES'), (6, 'ROSS, HILLARY, DEBORAH'), (5.56, 'CHRISTIE, CHRIS'), (5.36, 'ELLMERS, RENEE'), (5.26, 'TRUMP, DONALD J.'), (5, 'MCSALLY, MARTHA E'), (5, 'GOWDY, TREY'), (5, 'HOWARD, JULIA'), (5, 'LAWRENCE, BRENDA LULENAR'), (5, 'UPTON, FREDERICK STEPHEN'), (5, 'SMUCKER, LLOYD K'), (5, 'HOLLIDAY, ED'), (5, 'RAND, PAUL'), (5, 'GOSAR, PAUL'), (5, 'HILLARY, HILLARY'), (5, 'CRAIG, ANGELA'), (5, 'HILLARY RODHAM, CLINTON'), (5, 'DONOVAN, DAN'), (5, 'SANCHEZ, LORETTA'), (5, 'NEHLEN, PAUL III'), (5, 'COLE, TOM'), (5, 'NOLAN, RICHARD MICHAEL'), (4.88, 'KASICH, JOHN'), (4.66, 'YOUNG, TODD'), (4, 'STARR, MICHAEL BOB'), (4, 'TITUS, DINA'), (4, 'WALKINSHAW, BRADY PINERO'), (4, 'SUSIE, LEE'), (4, 'NEHLEN, PAUL'), (4, 'EVANS, DWIGHT'), (4, 'HOLDING, GEORGE E MR.'), (4, 'SHUSTER, BILL'), (4, 'PITTENGER, ROBERT M. HON.'), (4, 'MCCARTER, KYLE'), (4, 'DANNY, ZELAYA'), (4, 'SMITH, ADAM'), (4, \"O'HALLERAN, TOM\"), (4, 'PHILLIPS, GEORGE'), (4, 'WELLS, STEVEN'), (4, 'GARRETT, THOMAS'), (4, 'GRIFFIN, TAYLOR'), (4, 'ESPAILLAT, ADRIANO'), (4, 'ROUZER, DAVID'), (4, 'CONYERS, JOHN'), (4, 'JOHNSON, WILLIAM'), (4, 'STUTZMAN, MARLIN A'), (4, 'JOLLY, DAVID W.'), (4, 'DELBENE, SUZAN'), (4, 'MIKE, LEE'), (4, 'RUBIN, JOEL'), (4, 'GLENN, JON'), (4, 'HARTZLER, VICKY'), (4, 'TRUMP, DONALD J. / MICHAEL'), (3.2, 'TRUMP, DONALD'), (3.12, 'GOSAR, PAUL ANTHONY'), (3, 'SHELBY, RICHARD C'), (3, 'VERNON, MONICA W'), (3, 'TRUMO, DONALD'), (3, 'SINEMA, KYRSTEN'), (3, 'GREEN, GENE'), (3, 'KUO, PETER'), (3, 'BIRCHER, MARK'), (3, 'BOOZMAN, JOHN'), (3, 'DOLD, ROBERT JAMES MR JR'), (3, 'ZOPP, ANDREA'), (3, 'DUCKWORTH, L. TAMMY'), (3, 'PAPE, MICHAEL J'), (3, 'RAMIREZ, RITA'), (3, 'JONES, WALTER'), (3, 'BARNEY, SEAN'), (3, 'COSTELLO, RYAN'), (3, 'LUANN, BENNETT'), (3, 'LEE, MICHAEL'), (3, 'BERNIE 2016, BERNIE'), (3, 'FERGUSON IV, ANDERSON DREW'), (3, 'MCMULLIN, EVAN JOHNSON'), (3, 'DAVIS, RODNEY'), (3, 'ANGELLE, SCOTT'), (3, 'LINDBECK, STEVE'), (3, 'WILSON, FREDERICA'), (3, 'CORTEZ MASTO (NV), CATHERINE'), (3, 'KEYSER, JON'), (3, 'STEVE, KING'), (3, 'REED, TOM'), (3, 'GOODLATTE, BOB'), (3, 'STRAUSS, RAYMOND JOHN'), (3, 'WALLKER, SCOTT'), (3, 'NITO, PARRA'), (3, 'BEN, CARSON'), (3, 'LONNIE, JOHNSON'), (3, 'BYDLAK, REBEKAH'), (3, 'KINGSON, ERIC R. MR.'), (3, 'EDWARD, MALIN'), (3, 'HULTGREN, RANDY'), (3, 'CRIST, CHARLIE'), (3, 'PAT, TOOMEY'), (3, 'NICK, BAUMAN'), (3, 'HECK, DENNIS'), (2, 'DOLD, BOB'), (2, 'PARRA, NITO'), (2, 'MIA, LOVE'), (2, 'TIM, SCOTT'), (2, 'AGUILAR, PETE'), (2, 'BRAT, DAVID ALAN'), (2, 'LARSEN, RICK'), (2, '/ KAINE, CLINTON'), (2, 'LAPOLICE, ALAN'), (2, 'LUCIUS, CASEY'), (2, 'JOHNSON, RAN'), (2, 'ELIZABETH, CHENEY'), (2, 'LIZ, CHENEY'), (2, 'RAMSLAND, RUSSELL'), (2, 'ASHOOH, RICHARD E.'), (2, 'MURHPY, PATRICK'), (2, 'ARRINGTON, JODEY COOK'), (2, 'PARRISH, RAY'), (2, 'BUSTOS, CHERI'), (2, 'LONG, WENDY'), (2, 'CLINTON, KIRK'), (2, 'WALZ-ALLEN, MIRANDA'), (2, 'HOLDING, GEORGE E B'), (2, 'KYRSTEN, SINEMA'), (2, 'TAYLOR, SCOTT'), (2, 'MEEHAN, PATRICK'), (2, 'GLENN, DAVID'), (2, 'WAKELY, THOMAS MR.'), (2, 'MCMULLIN, DAVID'), (2, 'CASTLE, DARRELL'), (2, 'GREEN, RAYMOND'), (2, 'WRIGHT, KEITH'), (2, \"O'CONNOR, SHAWN PATRICK\"), (2, 'TAKANO, MARK'), (2, 'JAWANDO, WILL'), (2, 'WRIGHT, KEITH L T'), (2, 'NEWMAN, MARIE'), (2, 'JONES, WALTER B.'), (2, 'BUDD, THEODORE'), (2, 'MORAN, JERRY'), (2, 'KILMER, DEREK'), (2, 'SPEIER, JACKIE'), (2, 'KINZINGER, ADAM'), (2, 'ROS-LEHTINEN, ILEANA THE HON.'), (2, 'SHUSTER, WILLIAM MR.'), (2, 'MCMULLIN / NATHAN DANIEL, EVAN JOHNSON'), (2, 'GRIFFITH, MORGAN'), (2, 'UPTON, FREDERICK'), (2, 'AYOTTE, KELLEY'), (2, 'HEINZ, MATTHEW G.'), (2, 'POCAN, MARK'), (2, 'RON, DESANTIS'), (2, 'CHARLES, FERRY'), (2, 'GALLEGOS, PETE'), (2, 'CHISESI, DIANE'), (2, 'LAHOOD, DARIN MCKAY'), (2, 'ROSKAM, PETER'), (2, 'COMER, JAMES'), (2, 'DONALD TRUMP, MIKE PENCE'), (2, 'BERGMAN, JACK'), (2, 'BAUCUM, RALPH'), (2, 'CLINTON / KAINE, HILLARY RODHAM / TIM'), (2, 'FLEMING, JOHN'), (2, 'GARRETT, E SCOTT'), (2, 'SUOZZI, TOM'), (2, 'DOLD, JR., ROBERT J.'), (2, 'FETTERMAN, JOHN'), (1.85, 'BABINEC, MARTIN'), (1.84, 'TOOMEY, PATRICK'), (1.49, 'FASO, JOHN'), (1.14, 'POLIQUIN, BRUCE'), (1, 'GLENN, MANYA'), (1, 'JOHNSON, ESTELLE'), (1, 'JOHNSON, RED'), (1, 'BISHOP, MIKE'), (1, 'WELLS, STEVE'), (1, 'FAYARD, CATHRYN'), (1, 'SHAPIRO, JOSH'), (1, 'GARY, JOHNSON'), (1, 'WARREN, STEWART'), (1, 'MULLIN, MARKWAYNE'), (1, 'SMITH, CHRISTOPHER'), (1, 'HECK, DENNY'), (1, 'ADAMS, ALMA SHEALEY'), (1, 'EDWARD, CRUZ'), (1, 'RAFAEL, CRUZ'), (1, 'TENNEY, CLAUDIE'), (1, 'BYRNE, BRADLEY'), (1, 'HILLARY RODHAM CLINTON, RUSS FEINGOLD'), (1, 'MCTEAGUE, DAVE'), (1, 'ROS-LEHTINEN, ILEANA'), (1, 'GLEN, SETH'), (1, 'HALL, ISAHORE'), (1, 'TRUMP, DONALD J. / M. PENCE'), (1, 'REICHERT, DAVE'), (1, 'CLINTON, HILLLARY'), (1, 'MASSIE, THOMAS H.'), (1, 'KUSTER, ANN'), (1, 'KYLE, MCCARTER'), (1, 'BARKSDALE, JAMES FREEMAN'), (1, 'CLINTON / SUOZZI / RICE/ SCHUM, HILLARY'), (1, 'CLINTON/SUOZZI/RICE/SCHUMER, HILLARY/TOM/KATHELEE'), (1, 'CHENEY, ELIZABETH'), (1, 'MOORE, GWENDOLYNNE'), (1, 'DAVIS, BRUCE'), (1, 'MCNEIL, JOHN P'), (1, 'PRICE, DAVID'), (1, 'LOUIE, GOHMERT'), (1, 'KHOURI, TONIA'), (1, 'TREY, GOWDY'), (1, 'J, RON'), (1, 'VALADAO, DAVID.'), (1, 'SCOTT, ROBERT'), (1, 'RUSSEL, FEINGOLD'), (1, 'ROBERT, DOLD'), (1, 'PATAKI, GEORGE'), (1, 'GLENN, ARRYL'), (1, 'JOOHNSON, RON'), (1, 'GRAYSON, ALAN MARK'), (1, 'MCMULIN, EVAN'), (1, 'GRABELLE, JUSTIN M'), (1, 'FLYNN, MIKE'), (1, 'ELIJAH, MANLEY'), (1, 'MEADOWS, MARK R'), (1, 'TRUMP, DONLAD'), (1, 'CATHERINE, CORTEZ MASTO'), (1, 'QUIST, ROB'), (1, 'OLSZEWSKI, AL'), (1, 'JAPAYAL, PRAMILA'), (1, 'DONALS, TRUMP'), (1, 'TRUMP, DONALS'), (1, 'ELBERT, GUILLORY'), (1, 'FRANK, BEN'), (1, 'CONNOLLY, GERALD E'), (1, 'BRAD, ASHFORD'), (1, 'LOBIONDO, FRANK A.'), (1, 'SANTORUM, RICHARD'), (1, 'SCHUMER, CHARLES'), (1, 'LAW, ALEXANDER'), (1, 'KATIE, MCGINTY'), (1, 'RON, JOHNSON'), (1, 'LANCE, LEONARD'), (1, 'DIANE, CHISSESI'), (1, 'BACKER, DAN'), (1, 'DICIANNI, PETER'), (1, \"DEMINGS, VALDEZ 'VAL'\"), (1, 'TOWNSEND, BRYAN'), (1, 'CLINTON/SUOZZI/RICE/SCHUMER, '), (1, 'BRANNON, JOSH'), (1, 'DERICKSON, T'), (1, 'CRAIG, ANGELA DAWN'), (1, 'GERRITSON, REBECCA'), (1, 'GOHMERT, LOUIE'), (1, 'BEYER, DONALD STERNOFF'), (1, 'MOORE, GWEN S'), (1, 'ERIK, PAULSEN'), (1, 'COPE, CLAY'), (1, 'GLENN, SETH'), (1, 'WALTZ, BRENT'), (1, 'SHAPINO, JOSH'), (1, 'WALSER, JASON'), (1, 'GARCIA, JOSE ANTONIO'), (1, 'CCARSON, BEN'), (1, 'COTTON, THOMAS'), (1, 'LAND, TERRI LYNN'), (1, 'JOHNSON, MICHAEL'), (1, 'AMERISH, BERA'), (1, 'CORTEZ-MASTOS, CATHERINE'), (1, 'PAULSEN, ERIC'), (1, 'GLENN, DARRY'), (1, 'GLENN, SHAWN'), (1, 'JOHSON, RON'), (1, 'LAYENDECKER, LEVANA'), (1, 'ASHOOH, RICHARD'), (1, 'LONG, BILLY'), (1, 'GORDON, KINZLER'), (1, 'DANIEL, MUROFF'), (1, 'CLLINTON, HILLARY'), (1, 'SLAUGHTER, LOUISE'), (1, 'BRYSON, RICK'), (1, 'HURD, WILL'), (1, 'DENT, CHARLES'), (1, 'GREGORY, DUWAYNE'), (1, 'STEFANIK, ELISE M'), (1, 'COSTA, JIM'), (1, 'MACARTHUR, THOMAS'), (1, 'LOFGREN, ZOE'), (1, ', HILLARY / TOM / KATH'), (1, 'MIKE, JOHNSON'), (1, 'WHITWELL, ROBERT'), (1, 'DASTO, CATHERINE COR'), (1, 'BOST, MIKE'), (1, 'SHAUGHNESSY, NAUGHTON'), (1, 'VARIOUS REPUBLICAN, CANDIDATES'), (1, 'MAGGIE, HASSAN'), (1, 'RUSS, FEINGOLD'), (1, 'CLINTON (NV), HILLARY'), (1, 'BONGINO, DANIEL J'), (1, 'GLENN, DARR'), (1, 'DAVIS, RODNEY L'), (1, 'HUELSKAMP, TIMOTHY A'), (1, 'TUMP, DONALD'), (1, 'PETERSON, COLLIN CLARK'), (1, 'CLEMENTS, PAUL'), (1, 'KELLY, ROBIN L.'), (1, 'NOLAN, RICHARD M.'), (1, 'CHABOT, STEVE'), (1, 'HOLDING, GEORGE'), (1, 'CLINTON, '), (1, 'CLINTON/SUOZZI/RICE/SCHUMER, HILLARY'), (1, 'JAMES, JORDAN'), (1, 'JAMES, LANKFORD'), (1, 'KELLI, WARD'), (1, 'ROSENBAUM, ANDREW'), (1, 'KRISHNAMOORTHI, S. RAJA'), (1, 'ADRIAN, GARCIA'), (1, \"ANTHONY, D'ORAZIO\"), (1, 'WARREN, WEST'), (0.94, 'PORTMAN, ROB'), (0.94, 'BURR, RICHARD'), (0.37, 'KIRK, MARK'), (0, 'GERALD, JENNINGS'), (-100, 'PAUL, RYAN'), (-100, 'CHRISTOPHER, YOUNG'), (-100, 'WAGNER, ANN L.'), (-100, 'DUKE, DAVID'), (-100, 'HILL, JAMES FRENCH'), (-100, 'CRUZ, RAFAEL EDWARD'), (-100, 'BONNOFF, TERRI'), (-100, 'JOLLY, DAVID W'), (-100, 'MCGINTY, KATHLLEEN'), (-100, 'CARROL, MORGAN'), (-100, 'DELANEY, JOHN K'), (-100, 'KITTS, DERRICK'), (-100, 'PORTMA, ROB'), (-100, 'GLIDEWELL, PET'), (-100, 'FRANK, ROBERT'), (-100, 'PETERS, GARY'), (-100, 'REED, WENDY'), (-100, 'PENCE, TRUMP /'), (-100, 'CLINTON, HILL'), (-100, 'PRYOR, MARK LUNSFORD'), (-100, 'LANDRIEU, MARY L'), (-100, 'RAY, LAKE GROSS III'), (-100, 'ACHADJIAN, KHATCHIK'), (-100, 'SCHULTZ, DEBBIE WASSERMAN'), (-100, 'LONNIE, CAMPBEL'), (-100, 'SUKHIA, KEN'), (-100, 'KITTS, DEREK'), (-100, 'OSSOFF, JONATHAN'), (-100, 'CLINTER, HILLARY'), (-100, 'CAROLL, MORGAN'), (-100, 'SEAN, FLYNN'), (-100, 'DONALD, TRUMPH'), (-100, 'TRUMP, DONAL'), (-100, 'SMITH, LAMAR'), (-100, 'MCCOLLUM, BETTY'), (-100, 'DUFFY, SEAN'), (-200, 'DONALD J., TRUMP'), (-200, 'GRIFFIN, WILLIAM TAYLOR'), (-200, 'CHRISTENSEN, GORDON'), (-200, 'BIRCH, BAY'), (-200, 'MURPHY, CHRISTOPHER S'), (-200, 'TRUMP (IN), DONALD J.'), (-200, 'TRUMP (MO), DONALD J.'), (-200, 'KING, STEVE'), (-200, 'FRANK, GUINTA'), (-200, 'CANO, FERNANDO'), (-200, 'NEU, JAMES'), (-200, 'JONES, ROGER STARNER'), (-200, 'ELDRIDGE, CONNER'), (-200, 'DEGNER, KAI'), (-200, 'KLEPINGER, ROBERT'), (-200, 'MUNDY, KEITH'), (-200, 'BURR (NC), RICHARD'), (-200, 'MCCONNELL, JONATHAN EDWARD'), (-200, 'MCCAIN, JOHN S.'), (-200, 'CATHERINE, MAST0'), (-200, 'HUELSKAMP, TIM'), (-200, 'DERRICK, MIKE'), (-200, 'SCHAKOWSKY, JANICE D'), (-200, 'LASEE, FRANK'), (-200, 'PERRY, RICK'), (-200, 'JOHN, MCCAIN'), (-300, 'FIORE, MICHELE'), (-300, 'OWENS, DOUG'), (-300, 'MAXWELL, CHIP'), (-300, 'MCMICHAEL, CRAIG'), (-300, 'DEAN, ANDRE'), (-300, 'MARTINS, JACK'), (-300, 'MITCHELL, PAUL III'), (-300, 'SCHUMER, CHARLES E'), (-300, 'BOUSTANY, CHARLES W JR DR'), (-300, 'HALVORSON, ARTHUR'), (-400, 'AYOTTE ((NH), KELLY'), (-400, 'CLINTON, HILLARY CLINTON/K'), (-400, 'FLINN, GEORGE S DR JR'), (-400, 'HEINZ, MATT'), (-400, 'BRANNON, GREGORY'), (-500, 'RYAN, PAUL D.'), (-500, 'TANZLER, HANS'), (-500, 'STEVEN, SANTARSIERO'), (-500, 'BROWN, LIZ'), (-500, 'EVANS, BAYH'), (-500, ', TRUMP'), (-500, 'JUDGE, PATTY'), (-600, 'YOUNG (IN), TODD CHRISTOPHER'), (-600, 'BECCARO, THOMAS DEL'), (-600, 'LONNIE, CAMPBELL'), (-600, 'MASTRO, CATHERINE CORTEZ'), (-600, 'CAMPBELL, FOSTER LONNIE II'), (-600, 'SHKRELI, SUZANNA'), (-600, 'REED, THOMAS'), (-700, 'RUBIO (FL), MARCO'), (-700, '/ PENCE, TRUMP'), (-700, 'RUSSELL, FEINGOLD'), (-700, 'BLUNT (MO), ROY'), (-700, 'TRUMP, TRUMP TRUMP'), (-800, 'BEAGLE, WILLIAM'), (-800, 'CLINTON/KAINE, HILLARY RODHAM/TIMOT'), (-800, 'DOLD, JR., ROBERT JAMES'), (-800, 'RUTHERFORD, JOHN'), (-900, 'BONGINO, DANIEL'), (-900, 'SCHNEIDER, HELENE'), (-900, 'SCHWARTZ, GALE'), (-900, 'HALVORSON, ARTHUR L'), (-1100, 'GOSS, CHAUNCEY'), (-1100, 'KURT, SCHRADER'), (-1100, 'ZOELLER, GREGORY FRANCIS MR.'), (-1200, 'TRUMP, TRUMP'), (-1200, 'GARCIA, ADRIAN'), (-1200, 'MASTRO, CATHERINE'), (-1300, 'SANTARSIERO, STEVE'), (-1300, 'OWENS, H DOUGLAS'), (-1300, 'TIPTON, SCOTT'), (-1400, 'WALBERG, TIMOTHY'), (-1500, 'MURPHY, PATRICK E.'), (-1500, 'HEANEY, ANDREW'), (-1500, 'JOLLY, DAVID'), (-1500, 'DITTMAR, JANE'), (-1500, 'JASON, KANDER'), (-1500, 'TOM, KIP E'), (-1500, 'JONES, CHRISTINE'), (-1600, 'FLEMING, JOHN C.'), (-1700, 'TOOMEY (PA), PAT'), (-1700, 'CAMPBELL, FOSTER'), (-1700, 'HECK (NV), JOE'), (-1900, 'KASICH, JOHN R.'), (-2000, 'THEODORE, STRICKLAND'), (-2100, 'TINNEY, CLAUDIA'), (-2100, 'BOUSTANY, CHARLES W.'), (-2200, 'FASO, JOHN J.'), (-2300, 'YODER, SHELLI'), (-2300, 'RICHARD, BURR'), (-2500, 'SCHNEIDER, BRADLEY'), (-2500, 'ROB, PORTMAN'), (-2600, 'KELLY, AYOTTE'), (-2700, 'MICA, JOHN'), (-2800, 'BENNETT, MICHAEL'), (-2900, 'TRUMP, TRUMP'), (-3100, 'ROY, BLUNT'), (-3100, 'FERGUSON, ANDERSON DREW IV'), (-3100, 'BIRCH, BAYH'), (-3100, 'ELLMERS, RENEE JACISIN'), (-3200, 'JOHNSON, LON'), (-3300, 'PATRICK, TOOMEY'), (-3400, 'TRUMP, '), (-3600, 'DUNN, NEAL PATRICK MD'), (-3900, 'HUELSKAMP, TIMOTHY A.'), (-4800, 'JOSEPH, PATRICK'), (-5100, 'COFFMAN, MIKE REP.'), (-5800, 'PERKINS, RANDY'), (-6700, 'CATHERINE, MASTO')]\n" + ] + } + ], "source": [ "# Calculate the ratio of support to opposition for a given candidate, expressed as a precentage\n", "# Return a list of (support to opposition ratio, candidate name) sorted by support ratio\n", @@ -211,7 +267,7 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 14, "metadata": {}, "outputs": [], "source": [ @@ -229,18 +285,47 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 15, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "[(131187, 'Working America'), (1477, 'AMERICANS FOR PROSPERITY'), (1472, 'DCCC'), (1012, \"FREEDOM'S DEFENSE FUND\"), (954, 'VIGOP (VIRGIN ISLANDS REPUBLICAN PARTY)'), (929, 'Coalition of Black Trade Unionists'), (854, 'Right to Rise USA'), (852, 'Planned Parenthood Votes'), (822, 'AVAAZ FOUNDATION'), (749, 'House Majority PAC'), (721, 'NRCC'), (717, 'The 2016 Committee'), (706, 'National Rifle Association of America Political Victory Fund'), (681, 'CLUB FOR GROWTH ACTION'), (677, 'America Leads'), (663, 'FEMINIST MAJORITY'), (603, 'MOVEON.ORG POLITICAL ACTION'), (525, 'National Nurses United for Patient Protection'), (494, 'For Our Future'), (473, 'GREAT AMERICA PAC'), (469, 'Working America Coalition'), (459, 'Conservative Solutions PAC'), (457, 'Senate Majority PAC'), (448, 'SEIU COPE (Service Employees International Union Committee On Political Education)'), (399, 'Planned Parenthood Action Fund Inc.'), (386, 'LIBRE INITIATIVE'), (374, 'Immigrant Voters Win PAC'), (373, 'American Majority Action'), (358, 'National Rifle Association Institute for Legislative Action'), (356, 'EARN INTERNATIONAL UNION OF OPERATING ENGINEERS'), (350, 'Women Vote!'), (333, 'Keep the Promise III'), (331, 'Democratic Socialists of America, Inc.'), (306, 'Congressional Leadership Fund'), (304, 'Senate Conservatives Fund'), (294, 'Priorities USA Action'), (278, 'KEEP THE PROMISE I'), (270, 'Human Rights Campaign PAC'), (258, 'TEA PARTY MAJORITY FUND'), (254, 'ESAFund'), (248, 'Our Principles PAC'), (245, 'NRSC'), (243, 'United We Can'), (240, 'Freedom Partners Action Fund, Inc.'), (235, 'Stop Hillary PAC'), (232, 'CASA IN ACTION INC.'), (227, 'Human Rights Campaign Equality Votes'), (219, 'WOMEN SPEAK OUT PAC'), (215, 'OHIO ENVIRONMENTAL COUNCIL ACTION FUND INC.'), (215, 'Senate Leadership Fund'), (203, 'NextGen Climate Action Committee'), (202, 'National Association of Realtors Congressional Fund'), (202, 'COURAGEOUS CONSERVATIVES PAC'), (195, 'VOCES DE LA FRONTERA ACTION'), (184, 'DSCC'), (183, 'New Day for America'), (175, \"AMERICA'S RENEWABLE FUTURE INC\"), (172, 'Citizens United Super PAC LLC'), (166, 'Make DC Listen'), (166, 'WEST VIRGINIANS FOR LIFE INC POLITICAL ACTION COMMITTEE'), (164, 'COALITION OF BLACK TRADE UNIONISTS'), (163, 'Progressive Turnout Project'), (162, 'Florida Freedom PAC'), (160, 'League of Conservation Voters, Inc.'), (159, 'SIERRA CLUB POLITICAL COMMITTEE'), (158, 'CONSERVATIVE MAJORITY FUND'), (152, 'Keep the Promise PAC'), (151, 'Future45'), (149, 'ACTION NC'), (139, 'Tea Party Patriots Citizens Fund'), (136, 'CONSERVATIVE, AUTHENTIC, RESPONSIVE LEADERSHIP FOR YOU AND FOR AMERICA'), (135, \"Colorado People's Action\"), (131, 'SUSAN B ANTHONY LIST INC'), (130, 'CITIZENS FOR RESPONSIBLE ENERGY SOLUTIONS INC.'), (130, 'OHIO VOTER FUND POLITICAL ACTION COMMITTEE'), (129, 'Environmental Defense Action Fund'), (128, 'Everytown for Gun Safety Action Fund'), (126, 'ONE PITTSBURGH'), (121, 'Concerned American Voters'), (118, 'CLEARPATH ACTION, INC.'), (118, 'Jews for Progress'), (110, 'End Citizens United'), (108, 'AMERICAN FEDERATION OF STATE COUNTY AND MUNICIPAL EMPLOYEES AFL-CIO'), (102, 'Unintimidated PAC'), (99, 'AMERICAN UNITY PAC INC'), (99, 'Local Voices'), (98, 'Conservative Campaign Committee'), (98, 'US Chamber of Commerce'), (98, 'Security Is Strength PAC'), (92, 'CASE ACTION FUND'), (90, 'Keep the Promise III, Inc.'), (88, 'THE CONSERVATIVE STRIKEFORCE'), (87, 'CLUB FOR GROWTH PAC'), (86, 'HUMANE SOCIETY LEGISLATIVE FUND'), (86, 'Texas Tea Party Patriots PAC'), (85, 'LCV Victory Fund'), (84, 'Rebuilding America Now'), (84, 'ColorOfChange PAC'), (84, 'Communications Workers of America Working Voices'), (83, 'Americas PAC'), (82, 'Sharon Quirk-Silva for Assembly 2016'), (80, 'AAPI VICTORY FUND'), (79, 'Committee for Working Families, sponsored by the California Labor Federation, AFL-CIO'), (76, 'Planned Parenthood Action Fund of the Pacific Southwest'), (76, 'ARIZONA GRASSROOTS ACTION PAC'), (75, 'NATIONAL ASSOCIATION OF HOME BUILDERS'), (75, 'LATINO VICTORY FUND'), (71, 'New American Jobs Fund'), (70, 'AMERICAN FEDERATION OF STATE COUNTY & MUNICIPAL EMPLOYEES P E O P L E'), (70, 'American Action Network'), (69, 'IOWA CITIZENS FOR COMMUNITY IMPROVEMENT ACTION FUND'), (68, 'CITIZEN SUPER PAC'), (63, 'FEDUP POLITICAL ACTION COMMITTEE AKA FEDUP PAC'), (63, 'iAmerica Action'), (61, 'VETS FOR ECONOMIC FREEDOM TRUST DBA CONCERNED VETERANS FOR AMERICA'), (61, 'Independence USA PAC'), (61, 'Trusted Leadership PAC'), (61, 'BEND THE ARC JEWISH ACTION INC'), (61, 'INDIANA JOBS NOW'), (60, 'AFL-CIO COMMITTEE ON POLITICAL EDUCATION TREASURY FUND'), (57, 'REPUBLICAN NATIONAL COMMITTEE'), (57, 'CASA IN ACTION'), (56, 'We Vote - Nosotros Votamos - PPAMM Committee'), (55, 'SPECIAL OPERATIONS FOR AMERICA'), (54, 'ENTERPRISE FREEDOM ACTION COMMITTEE'), (54, 'Missouri Jobs with Justice Voter Action'), (53, None), (52, 'TEA PARTY VICTORY FUND'), (52, 'FOOD POLICY ACTION'), (52, 'RGA RIGHT DIRECTION PAC'), (52, 'Hispanic Victory PAC'), (51, 'NextGen California Action Committee'), (50, 'MAKE AMERICA AWESOME'), (50, 'WE ARE WISCONSIN POLITICAL FUND'), (50, 'FAIR SHARE ACTION'), (50, 'OREGON RIGHT TO LIFE VICTORY PAC'), (50, 'Mayday PAC'), (49, 'RIGHT WAY SUPERPAC'), (49, 'VOTEVETS'), (48, 'Educators for Ohio'), (47, 'National Right to Life Victory Fund'), (47, 'Maryland USA'), (47, 'Senate Conservatives Action'), (47, 'Majority Forward'), (46, 'MI Planned Parenthood Votes'), (46, 'Generation Forward PAC'), (46, 'Reform America Fund'), (46, 'EQUALITY PENNSYLVANIA'), (45, 'Defending Main Street SuperPAC Inc.'), (45, 'MISSOURI JOBS WITH JUSTICE VOTER ACTION'), (45, 'PATRIOTS FOR TRUMP'), (45, 'KENTUCKIANS FOR STRONG LEADERSHIP'), (45, 'National Association for Gun Rights Inc PAC'), (44, 'NEW LEADERSHIP FOR OHIO'), (44, 'One Nation'), (44, 'People for Pinellas'), (43, 'VOCES DE LA FRONTERA ACTION INC'), (42, \"PURSUING AMERICA'S GREATNESS\"), (42, \"LABORERS' INTERNATIONAL UNION OF NORTH AMERICA (LIUNA) PAC\"), (41, 'ADVANCE NORTH CAROLINA'), (40, 'Restoration PAC'), (40, 'LABORERS POLITICAL LEAGUE - EDUCATION FUND'), (39, 'Make America Number 1'), (39, 'PLANNED PARENTHOOD VOTES NORTHWEST'), (38, 'CLUB FOR GROWTH'), (38, 'PEOPLE FOR THE AMERICAN WAY'), (38, 'Fighting for Ohio Fund'), (38, 'NEA Advocacy Fund'), (38, 'New York State Immigrant Action Fund'), (37, 'THE 60 PLUS ASSOCIATION'), (36, 'BELIEVE AGAIN'), (36, 'John Bolton Super PAC'), (35, 'SECUREAMERICANOW.ORG'), (35, 'WISCONSIN JOBS NOW!'), (35, 'Wisconsin Jobs Now!'), (35, \"PHYLLIS SCHLAFLY'S EAGLE PAC\"), (34, 'NORTH FLORIDA NEIGHBORS'), (34, 'STRONG LEADERSHIP FOR AMERICA'), (34, 'Stand For Truth, Inc.'), (34, 'MOVE MARYLAND FORWARD'), (33, 'Grow the Economy Pac, LLC'), (32, 'Warrior PAC'), (32, 'NCLR Action PAC'), (32, 'Americans Deserve Better PAC, Inc'), (32, 'FREEDOMWORKS FOR AMERICA'), (32, 'Missouri Right to Life Victory Fund'), (31, 'Defend Louisiana PAC'), (31, 'PURPLE PAC INC'), (31, 'AFT Solidarity'), (30, 'Defend Rural Arizona PAC'), (30, 'New Day Independent Media Committee'), (29, 'Conservative Congress Now!'), (29, 'Americans for Responsible Solutions-PAC'), (29, 'FREEDOM COMMITTEE'), (29, 'Ending Spending, Inc.'), (28, 'National Right to Life Political Action Committee'), (28, 'KelliPAC'), (27, \"Committee for Maryland's Progress\"), (27, 'AlternativePAC'), (27, 'Gun Owners of America, Inc.'), (27, 'Madison Project Inc.'), (26, 'Granite State Solutions'), (26, 'American Dental Association Independent Expenditures Committee'), (26, 'FUTURE IN AMERICA INC.'), (25, 'Black PAC'), (25, 'WISCONSIN RIGHT TO LIFE VICTORY FUND'), (25, 'New Power PAC'), (25, 'Black Conservatives Fund'), (24, 'AMERICAN FUTURE FUND'), (24, 'New Prosperity Foundation; The'), (23, 'WORKING FOR US POLITICAL ACTION COMMITTEE INC'), (22, 'American College of Radiology Association PAC'), (22, 'THE CATHOLIC ASSOCIATION'), (22, 'American Opportunity PAC'), (22, \"People's Action Movement\"), (22, 'Patriot Majority PAC'), (22, 'Florida First Project'), (21, 'The National Republican Trust PAC'), (21, 'Opportunity and Freedom PAC'), (21, 'J Street'), (21, 'CatholicVote.org'), (21, '350.ORG ACTION FUND'), (21, 'Cooperative of American Physicians IE Committee'), (21, 'AMERICAN WORKING FAMILIES'), (21, 'Not Who We Are PAC'), (21, 'The Guardian Fund'), (20, 'Conservative Action Fund'), (20, 'Floridians for a Strong Middle Class'), (20, 'Environment America Action Fund'), (20, 'CLIMATE REALITY ACTION FUND'), (20, 'Constitutional Conservatives'), (20, 'Right to Life of Michigan Victory Fund'), (20, 'Sixteen Thirty Fund / Make it Work Action'), (19, 'Californians for Innovation'), (19, 'International Brotherhood of Electrical Workers Local 98 Committee on Political Education'), (19, 'COMMUNITY ACTION NOW'), (19, 'CAPE FOX PROFESSIONAL LICENSE'), (19, 'COMMON SENSE LEADERSHIP FOR AMERICA'), (19, 'Human Rights Campaign'), (18, 'RESTORE AMERICAN FREEDOM AND LIBERTY'), (18, 'PLANNED PARENTHOOD OF NASSAU COUNTY ACTION FUND'), (18, 'STAND UP FOR OHIO PAC'), (18, 'Ohio Environmental Council Action Fund Inc.'), (18, 'One Pittsburgh'), (18, 'RIGHT WAY INITIATIVE INC.'), (18, 'Values are Vital'), (18, 'Prosperity for Pennsylvania Inc.'), (17, 'VALOR AMERICA'), (17, 'SAFARI CLUB INTERNATIONAL PAC (SCI-PAC)'), (17, 'FRIENDS OF THE EARTH ACTION'), (17, 'HARD HATS FOR AMERICA'), (16, 'CLIMATE HAWKS VOTE POLITICAL ACTION'), (16, 'CULAC the PAC of Credit Union National Association'), (16, 'INDEPENDENT VOICE FOR ILLINOIS PAC'), (16, 'Spirit of Democracy America'), (16, 'Consumers for Responsible Government'), (16, 'Accountable Leadership'), (16, \"America's Liberty PAC\"), (16, 'CAPA21- Federal'), (16, \"ILLINOIS AGRICULTURAL ASSOCIATION ACTIVATOR POLITICAL INVOLVEMENT FUND (FED) 'ACTIVATOR'/'ILLINOIS FARM BUREAU ACTIVATOR'\"), (16, 'NARAL Pro-Choice America'), (16, 'NC LATINO POWER'), (16, 'United Association Political Education Committee (United Association of Journeymen and Apprentices of the Plumbing & Pipefitting Industry of the United States and Canada)'), (16, 'WORKING FAMILIES OF ALASKA'), (15, 'LOVE FOR LOUISIANA POLITICAL ACTION COMMITTEE'), (15, 'Valor Fund'), (15, \"America's Renewable Future Inc.\"), (15, 'Campaign for American Principles'), (15, 'Sixteen Thirty Fund / Make It Work Action'), (15, 'R4C16'), (15, 'America Speaks PAC'), (15, 'NEW YORK WINS PAC'), (15, 'FLORIDIANS FOR A STRONG MIDDLE CLASS'), (14, '45 Committee Inc.'), (14, 'A Whole Lot of People for Grijalva Congressional Committee'), (14, 'Political Action Committee of the American Association of Orthopaedic Surgeons--PAC of AAOS'), (14, 'The American Foundations Committee'), (14, 'RAMPART PAC'), (14, 'American Hospital Association PAC'), (14, 'Defenders of Freedom and Security'), (14, 'Patriot Majority USA'), (14, 'USW Works'), (14, 'WORKING FAMILIES PARTY INDEPENDENT EXPENDITURE COMMITTEE'), (14, 'Prosperity With Accountability'), (14, 'Bukowsky'), (14, 'United Steelworkers Political Action Fund'), (13, 'REPLACEMENTS LTD PAC'), (13, 'Patriots for Economic Freedom'), (13, 'Save the Day PAC'), (13, 'Texas Organizing Project PAC'), (13, 'True Blue Florida'), (13, '45Committee Inc.'), (13, 'GROW NC STRONG INC'), (13, 'BLUE AMERICA PAC INDEPENDENT EXPENDITURE COMMITTEE'), (13, 'FIGHT FOR TOMORROW'), (12, 'El Super PAC Voto Latino'), (12, 'RESTORE THE CONSTITUTION COALITION'), (12, 'UNITE HERE TIP State & Local Fund'), (12, 'VICTORY 2016'), (12, 'Silver State PAC, Inc.'), (12, 'CHINESE AMERICANS FOR KEEPING AMERICA GREAT'), (12, \"Int'l Union Of Bricklayers And Allied Craftworkers PAC\"), (12, 'African Amer Voter Reg Educ and Participation Proj'), (12, 'CITIZENS FOR A WORKING AMERICA INC.'), (12, 'Heartland Resurgence'), (12, 'MAKING MAINE GREAT AGAIN'), (12, 'SIERRA CLUB INDEPENDENT ACTION'), (12, 'Americans for Legal Immigration PAC'), (12, 'LATINO VICTORY PROJECT'), (12, 'SIXTEEN THIRTY FUND / MAKE IT WORK ACTION'), (12, 'Stand Up for Ohio'), (12, 'URBAN VICTORY FUND (UVF)'), (11, 'Republican Jewish Coalition'), (11, 'American Crossroads'), (11, 'Conserv America Building a Brighter Future Together'), (11, 'Greenpeace, Inc.'), (11, 'OneAmerica Votes'), (11, 'CONSERVATIVE OUTSIDER PAC'), (11, 'Sixteen Thirty Fund'), (11, 'NATIONAL CAMPAIGN'), (11, 'Californians for Fiscal Responsibility'), (11, 'Ending Spending Action Fund'), (11, 'Freethought Equality Super PAC'), (11, 'Make Louisiana Great Again'), (11, \"WE'VE GOT YOUR BACKPAC\"), (11, 'Amish PAC'), (10, 'Monstah Pac'), (10, 'CONSERVATIVE LIBERTY COALITION'), (10, 'OUR VOICE MATTERS SUPER PAC'), (10, 'The Nuisance Committee'), (10, 'Voter Education'), (10, 'LET AMERICA WORK'), (10, 'LIFT LEADING ILLINOIS FOR TOMORROW'), (10, 'ONEAMERICA VOTES'), (10, 'WE THE PEOPLE, NOT WASHINGTON'), (10, 'Fifty Second Street Fund'), (9, '314 PAC'), (9, 'Working Again PAC'), (9, \"America's Opportunity Fund\"), (9, 'Character is Essential PAC (CIE PAC)'), (9, 'NEW YORK JOBS COUNCIL'), (9, 'PROGRESS UNITED PAC'), (9, 'SHARON QUIRK-SILVA FOR ASSEMBLY 2016'), (9, 'EDUCATORS FOR OHIO'), (9, 'Baby Got PAC'), (9, 'PERSON TO PERSON PAC'), (9, 'UNITED FOOD AND COMMERCIAL WORKERS INTERNATIONAL UNION ACTIVE BALLOT CLUB'), (9, 'USA BUSINESS FREEDOM PAC'), (9, 'UltraViolet Action'), (9, 'JANPAC'), (9, 'Tea Party Forward'), (8, '21st Century Leaders'), (8, 'AMERICAN MEDICAL ASSOCIATION POLITICAL ACTION COMMITTEE'), (8, 'Associated Builders and Contractors Inc.'), (8, 'Climate Reality Action Fund'), (8, 'Effective Leadership for America'), (8, 'Mountaineers Are Always Free PAC'), (8, 'NARAL Pro-Choice America PAC'), (8, \"Standing up for California's Middle Class\"), (8, 'Americans For Concrete Solutions'), (8, 'Greenpeace Inc.'), (8, 'ASSOCIATED BUILDERS AND CONTRACTORS INC.'), (8, 'CENTER FORWARD'), (8, 'OneAmerica'), (8, 'PROGRESS PROJECT'), (8, 'AMERICARISINGPAC.ORG'), (8, 'ASIAN PACIFIC AMERICAN LABOR ALLIANCE AFL-CIO'), (8, 'WISCONSIN RIGHT TO LIFE POLITICAL ACTION COMMITTEE'), (8, 'Libre Initiative'), (8, 'National Emergency Medicine Political Action Committee - American College of Emergency Physicians'), (8, 'FLORIDIANS FOR SECURITY AND PROSPERITY'), (8, 'House Liberty Project'), (8, 'AMERICAN CONSERVATIVE UNION'), (8, 'Treasure Coast Committee'), (8, 'VOTEVETS.ORG ACTION FUND'), (7, 'AMERICANS FOR ACCOUNTABILITY IN LEADERSHIP'), (7, 'FERNANDEZ MIGUEL B.'), (7, 'JIM OWLES LIBERAL DEMOCRATIC CLUB'), (7, 'TENACIOUS TRUTH PAC'), (7, 'Democracy for America'), (7, 'Restore America Super PAC'), (7, 'Humanity for Progress'), (7, 'RHODE ISLAND STATE RIGHT TO LIFE COMMITTEE INC'), (7, 'Truth PAC'), (7, 'AFL-CIO Committee on Political Education Treasury Fund'), (7, 'RALLYPAC'), (7, 'SAVE AMERICA FROM ITS GOVERNMENT'), (7, 'CHC BOLD PAC'), (7, 'CIVIC INNOVATION USA INC'), (7, 'LOUISIANA PROSPERITY FUND'), (7, 'Progressive Change Campaign Committee'), (7, 'STAND UP FOR OHIO'), (6, \"1199 SERVICE EMPLOYEES INT'L UNION FEDERAL POLITICAL ACTION FUND\"), (6, 'America Working Together'), (6, 'HUNTER ACTION FUND (HAF)'), (6, 'Human Rights Campaign C90012626'), (6, 'INDEPENDENT LEADERSHIP FUND'), (6, 'Missouri Farm Bureau Federation Federal PAC'), (6, 'NEW HAMPSHIRE PRIORITIES'), (6, 'PLANNED PARENTHOOD ADVOCACY PROJECT LOS ANGELES COUNTY'), (6, 'REFORM WISCONSIN FUND'), (6, 'Transportation Trades Department AFL-CIO Political Education Fund'), (6, 'Building Bridges, Not Walls'), (6, 'Citizens For Strength And Security PAC'), (6, 'Concerned Taxpayers of America'), (6, 'GET OUR JOBS BACK, INC'), (6, 'NATIONAL FEDERATION OF INDEPENDENT BUSINESS/ SAVE AMERICAS FREE ENTERPRISE TRUST'), (6, 'Planned Parenthood Central Coast Action Fund'), (6, 'San Francisco Democratic County Central Committee'), (6, 'Working for Maryland'), (6, 'AMERICA NEXT INC'), (6, 'CHARACTER COUNTS POLITICAL ACTION COMMITTEE'), (6, 'NeverTrump PAC'), (6, \"WOMEN'S VOICES WOMEN VOTE ACTION FUND\"), (6, 'Growth & Opportunity PAC, Inc.'), (6, 'PLANNED PARENTHOOD CENTRAL COAST ACTION FUND'), (6, 'United Food and Commercial Workers International Union Working Families Advocacy Project'), (6, 'AMERICANS FOR CRUZ'), (6, 'Agron'), (6, 'Believe Again'), (6, 'LIBERTY AND LEADERSHIP FUND'), (6, 'Vets for Economic Freedom Trust dba Concerned Veterans for America'), (6, 'AMERICAN ACADEMY OF OPHTHALMOLOGY INC POLITICAL COMMITTEE (OPHTHPAC)'), (6, 'EQUALITY PENNSYLVAVIA'), (6, 'Minnesota Democratic-Farmer-Labor Party'), (6, 'SAVE THE AMERICAN WAY'), (6, 'CONSERVATIVES UNITED'), (6, 'NATIONAL HORIZON'), (6, 'Freedomworks for America'), (6, 'RIGHTS & DEMOCRACY ACTION'), (5, 'Golden State Leadership Fund PAC'), (5, 'MIDWEST GROWTH PAC'), (5, 'Working Assets Funding Service'), (5, 'Every Voice Action'), (5, 'FEDERATION OF AMERICAN HOSPITALS'), (5, 'GROW WV INC'), (5, 'Catalyst Oklahoma'), (5, 'MONTANA NATIVE VOTE'), (5, 'New Jersey Right to Life Committee Federal PAC'), (5, 'Tea Party Express Campaign Fund'), (5, 'KENTUCKY MOVING FORWARD'), (5, 'MIDDLE CLASS VALUES PAC'), (5, 'Mothers and Daughters Against Misogynistic Exploitation'), (5, 'NATIONAL COUNCIL OF LA RAZA ACTION FUND INC.'), (5, 'Transport Workers Union Political Contributions Committee'), (5, 'AMERICA ASCENDANT PAC'), (5, 'Local 32BJ Service Employees International Union American Dream Political Action Fund'), (5, 'Priorities for Iowa Political Fund'), (5, 'ADAMS STEPHEN'), (5, 'America Together, Inc.'), (5, 'Bend the Arc Jewish Action Inc'), (5, 'American Wind Action'), (5, 'CONSERVATIVE FREEDOM FIGHTERS'), (5, \"California's New Frontier\"), (5, 'INFORMED CITIZENS'), (5, 'Never Means Never PAC'), (4, 'Opportunity PAC - A Coalition of teachers health care givers faculty members school employees and public and pr'), (4, 'Stand With America'), (4, 'TrumPAC'), (4, 'CAMPAIGN FOR WORKING FAMILIES'), (4, 'Faith Family Freedom Fund'), (4, 'Freedom Partners Chamber of Commerce Inc.'), (4, 'THE AMERICAN CONGRESS OF OB-GYNS PAC (OB-GYN PAC)'), (4, 'TRUMPAC'), (4, 'CONSERVATIVE TEXANS'), (4, 'Hillary for America'), (4, 'Planned Parenthood Action PAC North Carolina'), (4, 'THE INDEPENDENT PROJECT PAC (TIP PAC)'), (4, 'FORWARD PHILADELPHIA PAC'), (4, 'Great America PAC'), (4, 'Right to Life of Michigan Political Action Committee'), (4, 'STATE CONSERVATIVE REFORM ACTION PAC (SCRAP)'), (4, 'UNITE HERE TIP Campaign Committee'), (4, 'VOTE 2 REDUCE DEBT (V2RD)'), (4, 'A NEW VOICE FOR MARYLAND'), (4, \"America's Voice\"), (4, 'DANNY ZELAYA FOR PRESIDENT'), (4, 'Democratic Women of the Desert'), (4, 'MAKE THE ROAD ACTION INC.'), (4, 'Protecting Choice in California, a project of Planned Parenthood Affiliates of California'), (4, 'REPUBLICAN HINDU COALITION'), (4, 'Democratic Party of Illinois'), (4, \"Our Children's Future\"), (4, 'Planned Parenthood Advocates of Wisconsin Inc (C4)'), (4, 'RIGHT TO RISE USA'), (4, 'SIERRA CLUB'), (4, 'Sixteen Thirty Fund / Make It Work America1'), (4, 'Veterans for a Strong America Action Group'), (4, 'American Horizons PAC'), (4, 'California Federation of Teachers COPE'), (4, 'FIGHTING FOR LOUISIANA'), (4, 'Win for America PAC'), (4, 'Family Policy Alliance fka CitizenLink fka Focus on the Family Action'), (4, 'OCEAN CHAMPIONS'), (3, 'AMERICAN FUTURE FUND POLITICAL ACTION'), (3, 'Alliance for a Free Society, Inc.'), (3, 'CONCERNED AMERICAN VOTERS'), (3, 'Freedom For All PAC'), (3, 'MAKE MICHIGAN FIRST NOW'), (3, 'NICK ANGELO BAUMAN FOR THE PEOPLE'), (3, 'PROGRESS FOR AMERICA PAC'), (3, 'PROGRESS N@'), (3, 'Planned Parenthood of New York City Action Fund'), (3, 'Protect Louisiana, Inc.'), (3, 'AMERICA VOTES ACTION FUND'), (3, 'American College of Surgeons Professional Association PAC'), (3, 'Kansas Ag Communities Coalition'), (3, 'AMERICA IS WORTH IT'), (3, 'Laborers Political League - Education Fund'), (3, 'Make the Road Action Inc.'), (3, 'NC Hospital Association'), (3, 'PANHANDLE VICTORY FUND'), (3, 'Planned Parenthood Hudson Peconic Action Fund'), (3, 'United for Progress PAC'), (3, 'COLORADO CONSERVATIVE PAC'), (3, 'California Progress Coalition'), (3, 'Extraordinary America'), (3, 'GERALD JOHN JENNINGS II FOR PRESIDENT'), (3, 'Make Arizona Strong'), (3, 'NORTHERN MI FIRST'), (3, 'REPUBLICAN SUPER PAC INC'), (3, 'Strong NH Action'), (3, 'UAW EDUCATION FUND'), (3, 'AGRON DOMINICK'), (3, 'Chu'), (3, 'Citizens United Political Victory Fund'), (3, 'FREEDOM AND FAIRNESS VIRGINIA'), (3, 'LETS CLEAN UP WASHINGTON'), (3, \"People's Action\"), (3, 'Planned Parenthood Advocacy Project Los Angeles County'), (3, 'FRUSTRATED AMERICAN TAXPAYER'), (3, 'MISSOURI REPUBLICAN STATE COMMITTEE-FEDERAL'), (3, 'NEW FLORIDA MAJORITY'), (3, 'Americans United for Values'), (3, 'Council For Citizens Against Government Waste'), (3, 'FUND FOR ECONOMIC GROWTH'), (3, 'Fenton Communications Inc.'), (3, 'ILLINOIS VOICES MATTER'), (3, 'Inland Empire Taxpayers Association Federal PAC'), (3, 'POWER WHEELS REMOTE CONTROL'), (3, 'TEXANS FOR A BETTER FUTURE'), (3, 'Arizona Accountability Project'), (3, 'FREEDOM FOR ALL PAC'), (3, 'GEORGE WASHINGTON LEADERSHIP FOUNDATION, INC.'), (3, 'Jobs Opportunity and Freedom Political Action Committee - JOFPAC'), (3, 'West Hollywood/Beverly Hills Democratic Headquarters Committee'), (2, 'Alzheimers Impact Movement'), (2, 'CONSERVATIVE AMERICA NOW PAC'), (2, 'National Association of Letter Carriers of U.S.A. Political Fund (Letter Carrier Political'), (2, 'Progress Now'), (2, 'Progress Project'), (2, 'American Bridge 21st Century'), (2, 'BELIEVE IN INDIANA'), (2, 'CAMPAIGN FOR JOBS AND OPPORTUNITY'), (2, \"Cure 4 Louisiana's Future PAC\"), (2, 'FORWARD FOR A BETTER FUTURE'), (2, 'Nevada Advocates for Planned Parenthood Affiliates'), (2, 'PA Common Sense'), (2, 'PLANNED PARENTHOOD ACTION PAC NORTH CAROLINA'), (2, 'American Future Fund'), (2, 'Art of the Deal PAC'), (2, 'Arts'), (2, 'Hampton Creek Inc.'), (2, 'ILLINOIS IMMIGRANT ACTION'), (2, 'LUNCH PAIL REPUBLICANS INDEPENDENT EXPENDITURE ONLY COMMITTEE'), (2, 'MAINE REPUBLICAN PARTY'), (2, 'OCEAN MAJORITY PAC'), (2, 'The 15104'), (2, 'WOMEN VOTE!'), (2, \"COMMITTEE TO RESTORE AMERICA'S GREATNESS\"), (2, 'EMERGENCY COMMITTEE FOR ISRAEL'), (2, 'ILLINOIS FAMILIES FIRST'), (2, 'Independence Party of Minnesota'), (2, 'L PAC'), (2, 'PAGE COMMUNICATIONS, L.L.C.'), (2, 'ARTICLE I ADVOCATES'), (2, 'American Federation of Teachers, AFL-CIO Committee on Political Education'), (2, 'BETTER LOUISIANA PAC'), (2, \"BLACK AMERICA'S POLITICAL ACTION COMMITTEE\"), (2, 'Bruzzone'), (2, 'Citizen PAC, Inc.'), (2, 'FREEDOM PARTNERS CHAMBER OF COMMERCE INC.'), (2, 'Friends of Traditional Banking'), (2, 'Ludwig'), (2, 'Texans for Integrity'), (2, 'VanderSloot'), (2, 'Asian Pacific American Labor Alliance AFL-CIO'), (2, 'Los Angeles County Democratic Central Committee'), (2, 'One Nation PAC'), (2, 'Our Revolution'), (2, 'Planned Parenthood of Central and Western New York Action Fund (formerly known as Planned Parenthood of the Rochester/Syracuse Region Action Fund)'), (2, 'America Next Inc'), (2, 'American Freedom Builders Action Network'), (2, 'EDUCATION REFORM NOW ADVOCACY'), (2, 'Floridians for Security and Prosperity'), (2, 'Fund This Advert'), (2, 'GRANITE VOICES PAC'), (2, 'House Freedom Action Fund'), (2, 'PLANNED PARENTHOOD ADVOCATES OF WISCONSIN INC'), (2, 'ACTION NC'), (2, 'Alaska Strong PAC'), (2, 'American Academy of Dermatology Association Political Action Committee (SkinPAC)'), (2, 'Asian Pacific Americans for Progress'), (2, 'Busse'), (2, 'Delegates Unbound PAC'), (2, 'National Emergency Medicine Political Action Committee'), (2, 'Ventura County Republican Party (Fed.)'), (2, 'Vermont Right to Life Committee Political Committee'), (1, '2016 COMMITTEE; THE'), (1, 'Avaaz Foundation'), (1, 'Barfels'), (1, 'Bulletin Displays LLC'), (1, 'CEASEFIRE PENNSYLVANIA'), (1, 'CENTER FORWARD COMMITTEE'), (1, 'CLEAN SLATE BALTIMORE PAC'), (1, 'Cline-Jones'), (1, 'Libery Initiative Fund'), (1, 'MONTPAC-MONTANA MEDICAL ASSOCIATION (MMA)'), (1, 'PLANNED PARENTHOOD OF MN ACTION FUND'), (1, 'Republican Party of Texas'), (1, 'Restoring Prosperity Fund'), (1, 'U.S.-Cuba Democracy Political Action Committee'), (1, 'Vocal Citizens'), (1, 'CREATIVE MAJORITY POLITICAL ACTION COMMITTEE'), (1, 'Committee for American Sovereignty'), (1, 'ELIJAH MANLEY FOR PRESIDENT 2016'), (1, 'FRIENDS OF JOHN DELANEY'), (1, \"Jewish Floridians for America's Future\"), (1, 'Kentucky Tomorrow, Inc.'), (1, 'LABOR UNITED FOR CONNECTICUT'), (1, 'OUTFRONT MEDIA LLC'), (1, 'Outfront Media LLC'), (1, 'REPUBLICAN PARTY OF PETERS TOWNSHIP'), (1, 'Safety for All Yes on Prop. 63 Newsom Ballot Measure Committee'), (1, 'The Catholic Association'), (1, 'Tony for 25th'), (1, '1199 32BJ/144 SERVICE EMPLOYEES INTERNATIONAL UNION HOME CARE POLITICAL ACTION FUND'), (1, 'Alaska Democratic Party'), (1, 'American Potential'), (1, 'Fernandez'), (1, 'International Union Of Operating Engineers Local 49 PAC'), (1, 'LEAGUE OF CONSERVATION VOTERS VICTORY FUND'), (1, 'Labor United for Connecticut'), (1, 'OUR SHARED FUTURE PAC'), (1, 'Page Communications L.L.C.'), (1, \"The People's Lobby\"), (1, 'US NEWS NETWORK'), (1, 'ACTION PAC'), (1, 'Adams'), (1, 'CARELESS PAC'), (1, 'HAMPTON CREEK INC.'), (1, 'House Freedom Fund'), (1, 'International Brotherhood of Electrical Workers Political Action Committee'), (1, 'LIFE AND LIBERTY PAC INC'), (1, 'Main Street Advocacy'), (1, 'NEA Fund for Children and Public Education'), (1, 'OHIO REPUBLICAN PARTY STATE CENTRAL & EXECUTIVE COMMITTEE'), (1, 'RESTORE AMERICAN LEADERSHIP'), (1, 'Republican Hindu Coalition'), (1, 'Republican Party of San Diego County'), (1, 'Rosenbaum'), (1, 'Tulare County Republican Central Committee (Federal)'), (1, 'WARREN FOR PRESIDENT 16'), (1, 'CATHOLIC ADVOCATE'), (1, 'FERNANDEZ, MIGUEL B.'), (1, 'FREEDOM AND OPPORTUNITY PAC INC'), (1, 'Fund for Economic Growth'), (1, 'INDIANA REPUBLICAN STATE COMMITTEE, INC.'), (1, 'JOBS OPPORTUNITY AND FREEDOM POLITICAL ACTION COMMITTEE - JOFPAC'), (1, 'Johnson'), (1, 'LEGACY FOUNDATION ACTION FUND'), (1, 'Life'), (1, 'NEW JERSEY FAMILY FIRST INC'), (1, 'National Association of Home Builders'), (1, 'STOP THEM NOW PAC'), (1, 'TeaPartyExpress.org'), (1, 'WATCHDOG PAC'), (1, '32BJ United American Dream Fund'), (1, 'A Fair & Just Virginia PAC'), (1, 'AM RACING LLC'), (1, 'AMERICA REVIVED PAC'), (1, 'ASSOCIATED BUILDERS & CONTRACTORS OF MICHIGAN'), (1, 'American Academy of Family Physicians Political Action Committee'), (1, 'CONSERVATIVE PARTY NATIONAL COMMITTEE'), (1, 'CeaseFire Pennsylvania'), (1, 'Freedom and Liberty PAC'), (1, 'Granite Voices PAC'), (1, 'Jim Owles Liberal Democratic Club'), (1, 'LET FREEDOM RING INC'), (1, 'LOKI PAC'), (1, 'PEOPLE AND POLITICS'), (1, 'Republican Party of Peters Township'), (1, 'Rodrigues'), (1, 'America Progress'), (1, \"Int'l Union of Bricklayers and Allied Craftworkers PAC\"), (1, 'Michigan Republican Party'), (1, 'NEW YORK STATE COMMITTEE OF THE WORKING FAMILIES PARTY'), (1, 'New Direction PAC'), (1, 'Protect the Harvest Political Action Committee'), (1, 'RIGHT WAY INITIATIVE INC'), (1, 'US CHAMBER OF COMMERCE'), (1, 'American Osteopathic Information Association - Osteopathic Political Action Committee'), (1, 'BULLETIN DISPLAYS LLC'), (1, 'CONSERVATIVE ACTION PAC'), (1, 'CONSERVATIVE PARTY OF THESE UNITED STATES'), (1, 'Californians for Opportunity'), (1, 'Cummings'), (1, 'DEMOCRATIC PARTY OF ILLINOIS'), (1, 'Frugal Hoosiers'), (1, 'KLW Political Fund'), (1, 'NATIONAL ORGANIZATION FOR MARRIAGE'), (1, 'National Council of La Raza Action Fund, Inc.'), (1, 'Patterson'), (1, 'Your Vote Matters')]\n" + ] + } + ], "source": [ "print(expenditures_by_spender)" ] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 20, "metadata": {}, - "outputs": [], + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/Users/Dan/Documents/projects/spark_learning/spark/spark/lib/python3.6/site-packages/scipy/stats/stats.py:1713: FutureWarning: Using a non-tuple sequence for multidimensional indexing is deprecated; use `arr[tuple(seq)]` instead of `arr[seq]`. In the future this will be interpreted as an array index, `arr[np.array(seq)]`, which will result either in an error or a different result.\n", + " return np.add.reduce(sorted[indexer] * weights, axis=axis) / sumval\n" + ] + }, + { + "data": { + "image/png": "iVBORw0KGgoAAAANSUhEUgAAA0EAAAHyCAYAAAAtPMUrAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADl0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uIDMuMC4wLCBodHRwOi8vbWF0cGxvdGxpYi5vcmcvqOYd8AAAIABJREFUeJzt3XuUZdddH/jvr6vdfkmybNRRG8mDHaKBKIYI3NjKQAawjS1rBSQmhjHJuAVLoBDsWZAHhcnMxAzgAJoQrxAcMUqsWCKAMQYvKyw5ijCeITDLxrJoZPlB3JiHVdKVuq1Hd6utlrp6zx91butW9a1nV9+61efzWatW3bvPY+/7Pt9z9tmnWmsBAADoix1b3QAAAIBJEoIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBe2bnVDVhNVT0nye8leXYW2vv+1trbq+o9Sb45yePdrN/bWttfVZXkXye5Osmxrvyebl3XJfnfu/l/urV2a1f+iiTvSfLcJHck+eHWWquqFyX59SQvTfLnSb67tfboSnUs56KLLmovfelLz+zJAADgnPaJT3ziUGtt91a341w39SEoyfEkr26tHa2qZyX5/ar6UDftR1tr718y/xuSXNb9vSrJTUle1QWatyfZm6Ql+URV3d5ae7Sb5weSfCwLIeiqJB9K8rYkH26t/WxVva27/2PL1bHSg3jpS1+au++++wyeBgAAznVV9Rdb3YY+mPrucG3B0e7us7q/tsIi1yS5rVvuo0kurKoXJ3l9krtaa490weeuJFd10y5orX20tdaS3Jbk2pF13drdvnVJ+bg6AACAKTf1IShJqmqmqvYneTgLQeZj3aR3VNW9VfXOqnp2V3ZJki+MLH5/V7ZS+f1jypPk4tbag93tQZKLV6kDAACYctsiBLXW5ltrVyS5NMkrq+rlSX48yVcn+YYkL8pCN7Wz2YaWlY9Anaaqbqiqu6vq7oMHD56llgEAAOuxLULQUGvtsSQfSXJVa+3Brjva8ST/Ickru9nmkrxkZLFLu7KVyi8dU54kDw27uXX/H16ljqXtvbm1tre1tnf3bue3AQDANJj6EFRVu6vqwu72c5N8W5LPjoSTysK5Ovd1i9yeZF8tuDLJ412XtjuTvK6qXlhVL0zyuiR3dtMOV9WV3br2JfngyLqu625ft6R8XB0AAMCU2w6jw704ya1VNZOF0Pa+1tpvV9XvVtXuJJVkf5If7Oa/IwtDVx/IwvDV35ckrbVHquqnkny8m+8nW2uPdLd/KM8Mkf2h7i9JfjbJ+6rq+iR/keS7V6oDAACYfrVwqgtn2969e5shsgEAWElVfaK1tner23Gum/rucAAAAJtJCAIAAHpFCAIAAHpFCAIAAHpFCAIAAHpFCAIAAHpFCAIAAHpFCAIAAHpFCAIAAHpFCAIAAHpFCAIAAHpFCAIAAHpl51Y3AOBsm52dzWAwyJ49e3LjjTdudXMAgC0mBAHnvMFgkLm5ua1uBgAwJXSHAwAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAekUIAgAAemXqQ1BVPaeq/rCq/riqPlVV/2dX/rKq+lhVHaiqX6+qXV35s7v7B7rpLx1Z14935X9SVa8fKb+qKztQVW8bKV93HQAAwHSb+hCU5HiSV7fW/maSK5JcVVVXJvm5JO9srf21JI8mub6b//okj3bl7+zmS1VdnuRNSf5GkquS/NuqmqmqmSTvSvKGJJcn+Z5u3qy3DgAAYPpNfQhqC452d5/V/bUkr07y/q781iTXdrev6e6nm/6aqqqu/L2tteOttT9LciDJK7u/A621z7fWnkry3iTXdMustw4AAGDKTX0ISpLuiM3+JA8nuSvJnyZ5rLV2opvl/iSXdLcvSfKFJOmmP57ky0bLlyyzXPmXbaCOpe2+oarurqq7Dx48uLEHDwAAbKptEYJaa/OttSuSXJqFIzdfvcVNWpPW2s2ttb2ttb27d+/e6uYAAADZJiFoqLX2WJKPJPlbSS6sqp3dpEuTzHW355K8JEm66S9I8sXR8iXLLFf+xQ3UAQAATLmpD0FVtbuqLuxuPzfJtyX5TBbC0Bu72a5L8sHu9u3d/XTTf7e11rryN3Uju70syWVJ/jDJx5Nc1o0EtysLgyfc3i2z3joAAIApt3P1Wbbci5Pc2o3itiPJ+1prv11Vn07y3qr66SR/lOTd3fzvTvLLVXUgySNZCDVprX2qqt6X5NNJTiR5S2ttPkmq6q1J7kwyk+SW1tqnunX92HrqAAAApt/Uh6DW2r1Jvm5M+eezcH7Q0vInk3zXMut6R5J3jCm/I8kdm1EHAAAw3aa+OxwAAMBmEoIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBemfoQVFUvqaqPVNWnq+pTVfXDXflPVNVcVe3v/q4eWebHq+pAVf1JVb1+pPyqruxAVb1tpPxlVfWxrvzXq2pXV/7s7v6BbvpLV6sDAACYblMfgpKcSPJPWmuXJ7kyyVuq6vJu2jtba1d0f3ckSTftTUn+RpKrkvzbqpqpqpkk70ryhiSXJ/mekfX8XLeuv5bk0STXd+XXJ3m0K39nN9+ydZy9pwAAANgsUx+CWmsPttbu6W4fSfKZJJessMg1Sd7bWjveWvuzJAeSvLL7O9Ba+3xr7akk701yTVVVklcneX+3/K1Jrh1Z163d7fcneU03/3J1AAAAU27qQ9Corjva1yX5WFf01qq6t6puqaoXdmWXJPnCyGL3d2XLlX9ZksdaayeWlC9aVzf98W7+5da1tL03VNXdVXX3wYMH1/14AQCAzbdtQlBVnZfkN5P8SGvtcJKbknxlkiuSPJjk57eweWO11m5ure1tre3dvXv3VjcHAADINglBVfWsLASgX2mt/VaStNYeaq3Nt9ZOJvl3eaY72lySl4wsfmlXtlz5F5NcWFU7l5QvWlc3/QXd/MutCwAAmHJTH4K6c3DeneQzrbV/NVL+4pHZvjPJfd3t25O8qRvZ7WVJLkvyh0k+nuSybiS4XVkY2OD21lpL8pEkb+yWvy7JB0fWdV13+41Jfrebf7k6AACAKbdz9Vm23DcmeXOST1bV/q7sn2VhdLcrkrQkf57kHyRJa+1TVfW+JJ/Owshyb2mtzSdJVb01yZ1JZpLc0lr7VLe+H0vy3qr66SR/lIXQle7/L1fVgSSPZCE4rVgHAAAw3aY+BLXWfj9JjZl0xwrLvCPJO8aU3zFuudba5zNmdLfW2pNJvms9dQAAANNt6rvDAQAAbCYhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6JWpD0FV9ZKq+khVfbqqPlVVP9yVv6iq7qqqz3X/X9iVV1X9QlUdqKp7q+rrR9Z1XTf/56rqupHyV1TVJ7tlfqGqaqN1AAAA023qQ1CSE0n+SWvt8iRXJnlLVV2e5G1JPtxauyzJh7v7SfKGJJd1fzckuSlZCDRJ3p7kVUlemeTtw1DTzfMDI8td1ZWvqw4AAGD6TX0Iaq092Fq7p7t9JMlnklyS5Jokt3az3Zrk2u72NUluaws+muTCqnpxktcnuau19khr7dEkdyW5qpt2QWvto621luS2JetaTx0AAMCUm/oQNKqqXprk65J8LMnFrbUHu0mDJBd3ty9J8oWRxe7vylYqv39MeTZQBwAAMOW2TQiqqvOS/GaSH2mtHR6d1h3BaWez/o3UUVU3VNXdVXX3wYMHz1LLAACA9dgWIaiqnpWFAPQrrbXf6oofGnZB6/4/3JXPJXnJyOKXdmUrlV86pnwjdSzSWru5tba3tbZ39+7da3/AAADAWTP1Iagbqe3dST7TWvtXI5NuTzIc4e26JB8cKd/XjeB2ZZLHuy5tdyZ5XVW9sBsQ4XVJ7uymHa6qK7u69i1Z13rqAAAAptzOSVZWVf99FkZSu7i19vKq+tok39Fa++kVFvvGJG9O8smq2t+V/bMkP5vkfVV1fZK/SPLd3bQ7klyd5ECSY0m+L0laa49U1U8l+Xg330+21h7pbv9QkvckeW6SD3V/WW8dAADA9JtoCEry75L8aJL/O0laa/dW1a8mWTYEtdZ+P0ktM/k1Y+ZvSd6yzLpuSXLLmPK7k7x8TPkX11sHAAAw3SbdHe55rbU/XFJ2YsJtAAAAemzSIehQVX1lulHWquqNSZxLAwAATMyku8O9JcnNSb66quaS/FmSvz/hNgAAAD02sRBUVTuS7G2tvbaqnp9kR2vtyKTqBwAASCbYHa61djLJbHf7CQEIAADYCpM+J+h3quqfVtVLqupFw78JtwEAAOixSZ8T9D93/0eHl25J/uqE2wEAAPTURENQa+1lk6wPAABgqYmGoKraN668tXbbJNsBAAD016S7w33DyO3nJHlNknuSCEEAAMBETLo73P86er+qLkzy3km2AQAA6LdJjw631BNJnCcEAABMzKTPCfpPWRgNLlkIYJcn+Y1JtgEAAOi3SZ8T9C9Hbp9I8hettfsn3AYAAKDHJt0d7urW2v/b/f1Ba+3+qvq5CbcBAADosUmHoG8bU/aGCbcBAADosYl0h6uqf5jkh5L81aq6d2TS+Un+YBJtAAAASCZ3TtCvJvlQkp9J8raR8iOttUcm1AYAAICJhaDWWvvzqnrL0glV9SJBCAAAmJRJHgn6O0k+kYUhsmtkWkvyVyfUDgAAoOcmEoJaa3+n++/CqAAAwJaa1MAIX7/S9NbaPZNoBwAAwKS6w/189/85SfYm+eMsdIn72iR3J/lbE2oHAADQcxO5TlBr7Vtba9+a5MEkX99a29tae0WSr0syN4k2AAAAJJO/WOpXtdY+ObzTWrsvyV+fcBsAAIAem1R3uKF7q+rfJ/mP3f2/n+TeFeYHAADYVJMOQd+X5B8m+eHu/u8luWnCbQAAAHpsoiGotfZkknd2fwAAABM30RBUVd+Y5CeSfMVo3a01F0sFAAAmYtLd4d6d5B8l+USS+QnXDQAAMPEQ9Hhr7UMTrhMAAOCUSYegj1TV/5Xkt5IcHxa21u6ZcDsAAICemnQIelX3f+9IWUvy6gm3AwAA6KlJjw73rZOsDwAAYKkdk6ysqi6uqndX1Ye6+5dX1fWTbAMAANBvEw1BSd6T5M4kX97d/29JfmTCbQAAAHps0iHootba+5KcTJLW2okYKhsAAJigSYegJ6rqy7IwGEKq6sokj0+4DQAAQI9NenS4f5zk9iRfWVV/kGR3kjdOuA0AAECPTXp0uHuq6puTfFWSSvInrbWnJ9kGAACg3yYagqrqOUl+KMk3ZaFL3H+tql9qrT05yXYAAAD9NenucLclOZLk33T3/16SX07yXRNuBwAA0FOTDkEvb61dPnL/I1X16Qm3AQAA6LFJjw53TzciXJKkql6V5O4JtwEAAOixSR8JekWS/6+q/rK7/98l+ZOq+mSS1lr72gm3BwAA6JlJh6CrJlwfAADAIpMOQZe11n5ntKCqrmut3TrhdgAAAD016XOC/nlV3VRVz6+qi6vqPyX59gm3AQAA6LFJh6BvTvKnSfYn+f0kv9pae+OE2wAAAPTYpEPQC5O8MgtB6HiSr6iqmnAbAACAHpt0CPpokv/cWrsqyTck+fIkfzDhNgAAAD026RD02iRPV9U/b619Kcm/TPK2CbcBAADosUmHoB9PcmWS7+nuH0ny8xNuAwAA0GOTHiL7Va21r6+qP0qS1tqjVbVrwm0AAAB6bNJHgp6uqpkkLUmqaneSkxNuAwAA0GOTDkG/kOQDSf5KVb0jC8Nk/4uVFqiqW6rq4aq6b6TsJ6pqrqr2d39Xj0z78ao6UFV/UlWvHym/qis7UFVvGyl/WVV9rCv/9eGRqap6dnf/QDf9pavVAQAATL+JhqDW2q8kmU3yM0keTHJta+03VlnsPUmuGlP+ztbaFd3fHUlSVZcneVOSv9Et82+raqY7+vSuJG9IcnmS7+nmTZKf69b115I8muT6rvz6JI925e/s5lu2jvU9EwAAwFaZ9JGgtNY+21p7V2vtF1trn1nD/L+X5JE1rv6aJO9trR1vrf1ZkgNZuC7RK5McaK19vrX2VJL3Jrmmu0bRq5O8v1v+1iTXjqzr1u72+5O8ppt/uToAAIBtYOIhaBO9taru7brLvbAruyTJF0bmub8rW678y5I81lo7saR80bq66Y938y+3LgAAYBvYriHopiRfmeSKLHSrm8phtqvqhqq6u6ruPnjw4FY3BwAAyDYNQa21h1pr8621k0n+XZ7pjjaX5CUjs17alS1X/sUkF1bVziXli9bVTX9BN/9y6xrXzptba3tba3t37969kYcKAABssm0ZgqrqxSN3vzPJcOS425O8qRvZ7WVJLkvyh0k+nuSybiS4XVkY2OD21lpL8pEkb+yWvy7JB0fWdV13+41Jfrebf7k6AACAbWDSF0tdt6r6tSTfkuSiqro/yduTfEtVXZGF6w39eZJ/kCSttU9V1fuSfDrJiSRvaa3Nd+t5a5I7k8wkuaW19qmuih9L8t6q+ukkf5Tk3V35u5P8clUdyMLADG9arQ4AAGD6TX0Iaq19z5jid48pG87/jiTvGFN+R5I7xpR/PmNGd2utPZnku9ZTBwAAMP22ZXc4AACAjRKCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXtm51Q0AOBOzs7MZDAbZs2dPbrzxxq1uDgCwDQhBwLY2GAwyNze31c0AALYR3eEAAIBeEYIAAIBe2RYhqKpuqaqHq+q+kbIXVdVdVfW57v8Lu/Kqql+oqgNVdW9Vff3IMtd183+uqq4bKX9FVX2yW+YXqqo2WgcAADDdtkUISvKeJFctKXtbkg+31i5L8uHufpK8Icll3d8NSW5KFgJNkrcneVWSVyZ5+zDUdPP8wMhyV22kDgAAYPptixDUWvu9JI8sKb4mya3d7VuTXDtSfltb8NEkF1bVi5O8PsldrbVHWmuPJrkryVXdtAtaax9trbUkty1Z13rqAAAApty2CEHLuLi19mB3e5Dk4u72JUm+MDLf/V3ZSuX3jynfSB2LVNUNVXV3Vd198ODBdTw0AADgbNnOIeiU7ghOm7Y6Wms3t9b2ttb27t69+yy1DAAAWI/tHIIeGnZB6/4/3JXPJXnJyHyXdmUrlV86pnwjdQAAAFNuO4eg25MMR3i7LskHR8r3dSO4XZnk8a5L251JXldVL+wGRHhdkju7aYer6spuVLh9S9a1njoAAIApt3OrG7AWVfVrSb4lyUVVdX8WRnn72STvq6rrk/xFku/uZr8jydVJDiQ5luT7kqS19khV/VSSj3fz/WRrbTjYwg9lYQS65yb5UPeX9dYBAABMv20Rglpr37PMpNeMmbclecsy67klyS1jyu9O8vIx5V9cbx0AAMB0287d4QAAANZNCAIAAHpFCAIAAHpFCAIAAHpFCAIAAHpFCAIAAHpFCAIAAHpFCAIAAHpFCAIAAHpFCAIAAHpFCAIAAHpFCAIAAHpFCAIAAHpFCAIAAHpFCAIAAHpl51Y3AGA7mZ2dzWAwyJ49e3LjjTdudXMAgA0QggDWYTAYZG5ubqubAQCcAd3hAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXhGCAACAXnGdIABgqrgoMXC2CUEAwFRxUWLgbNMdDgAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BUhCAAA6BVDZAOLuD4HAHCuE4KARVyfAwA41+kOBwAA9IoQBAAA9IoQBAAA9IoQBAAA9IoQBAAA9IoQBAAA9IoQBAAA9IoQBAAA9IoQBAAA9IoQBAAA9IoQBAAA9IoQBAAA9MrOrW4AsLlmZ2czGAyyZ8+e3HjjjVvdHACAqSMEwTlmMBhkbm5uq5sBADC1dIcDAAB6RQgCAAB6RQgCAAB6RQgCAAB6RQgCAAB6RQgCAAB6RQgCAAB6ZVuHoKr686r6ZFXtr6q7u7IXVdVdVfW57v8Lu/Kqql+oqgNVdW9Vff3Ieq7r5v9cVV03Uv6Kbv0HumVrpToAAIDpt61DUOdbW2tXtNb2dvffluTDrbXLkny4u58kb0hyWfd3Q5KbkoVAk+TtSV6V5JVJ3j4Sam5K8gMjy121Sh0AAMCUOxdC0FLXJLm1u31rkmtHym9rCz6a5MKqenGS1ye5q7X2SGvt0SR3Jbmqm3ZBa+2jrbWW5LYl6xpXBwDAVJidnc2+ffsyOzu71U2BqbPdQ1BL8l+q6hNVdUNXdnFr7cHu9iDJxd3tS5J8YWTZ+7uylcrvH1O+Uh2LVNUNVXV3Vd198ODBdT84AICNGgwGmZuby2Aw2OqmwNTZudUNOEPf1Fqbq6q/kuSuqvrs6MTWWquqdjYbsFIdrbWbk9ycJHv37j2r7QCmz+zsbAaDQfbs2ZMbb7xxq5sDAHS2dQhqrc11/x+uqg9k4Zyeh6rqxa21B7subQ93s88lecnI4pd2ZXNJvmVJ+f/TlV86Zv6sUAfAKcO9sAAbZWcKnB3btjtcVT2/qs4f3k7yuiT3Jbk9yXCEt+uSfLC7fXuSfd0ocVcmebzr0nZnktdV1Qu7ARFel+TObtrhqrqyGxVu35J1jasDtr3HjthoB5gWurTB2bGdjwRdnOQD3ajVO5P8amvtP1fVx5O8r6quT/IXSb67m/+OJFcnOZDkWJLvS5LW2iNV9VNJPt7N95OttUe62z+U5D1JnpvkQ91fkvzsMnUAAABTbtuGoNba55P8zTHlX0zymjHlLclbllnXLUluGVN+d5KXr7UOAABg+m3b7nAAAAAbsW2PBAEA6+Mke4AFQhAA9IQRCwEWCEEA5yh7/QFgPCEImAgb5JNnrz8AjGdgBGCswWCQ2dnZTV2fa10AANNACIJz1JmGmPn5+bMWWGZnZ7Nv375NDVkAAGulOxyco85miDlTumkB9Jfu0UwDIQgAgImxI4xpIATBNtH3PWd9f/wAwOYRgmCb6Pues74//jMlRALAM4QggB4QIgHgGUIQbFP27AMAbIwQBNvUpPfsC10AwLlCCALWRHcqAOBcIQQBAGvmqDBwLhCCAIA1c1QYOBcIQdAz9uICAH0nBEHP2IsLAPTdjq1uAAAAwCQJQQAAQK/oDgfnOOcAAQAsJgTBOW695wA9/7zKk0/syPz8/FlsFRsl1HIu8X4+c55D2BghCFjkG6+ayR/eebHBE6aUgS04l3g/nznPIWyMEARnwB44AIDtx8AIsMTs7Gz27duX2dnZVecd7oEbDAYTaNl0GAwGa3puAACmlSNBsMS0di04cng62jQ/P9+r0Afr4egwwPYgBAHAJpnWnSgALCYEwSayF3jreQ02biufO68bAJMkBMEmshd463kNNm4rnzuvGwCTZGAEAACgVxwJAgBWNeyyeOjQoa1uCsAZE4LgHHN4SkaRA84twy6LMzMzW90UgDOmOxy9tp5rAq2Ha+kwbR44+vhWN4Elztb3DwCrcySIXjtbJ2O7ls7pHjnqCBWM2orBIB48+tRE6wOYVkIQ5yTD7ULywNHHtroJbJGt+A48F793z8XHBCwQgjgnbWQP6+/8+6vz2u+/4yy1aHuYnZ3NZz93IieOO/GZjdmuG43btd3L2YqjTNtlmPP1vNbb5TEB6ycEAacMBoM8cTiZmTmx1U1hm9quG43btd2sn9caSIQgAHpqeETg8OHDOXY/bXJUAAASzElEQVTs2FY3B4AJEoKALbVduyEdOnQo+/bt23bt5hmjQz7Pz89vdXMAmCAhCNhS27VryokTJ7Zlu6fBdg2+02Lc8+c5BVgfIQiYuI0Ml33QENtn3aSuJbTdgu+0BYxxz992e04BtpoQBBsw3Cg6dGh9o6hN28YU288DRx/d6iacZvR9Pc02+vlba8AYrh8mxXsONk4Igg0YPZdgI8vBuWQ7vK9nZ2ezf//+s3ruz2Aw6OW5RRvdKZQkjx3t3/O1mfr6noPNIASxLW2HIypOnGeS1vOZ2A6fn81mY/HsWbpTaDAYZHZ2tjfvLRb08XuF7U0IYltY+uW6WXuev3T4gU1o3XibfeL8eedVzr/gy8+oy9Fo14nN3FDx47f11vOZ2A5HbvpuO3+m5ufnz4kuWrqarY/vleVt58/zuUwIYluY1i/XdnLje5ZHr1FywQUXrPrl+LrXzuTN33vbhutLFu8N38wNleHrs95gNRgMsnPn5nwNDY+8baRLztmwVRtQo0cgN5Mf8ckY7Vp2/PjxiR9V2ezXebu8b8a109FDNsu0bsP03Y6tbgCcq5b+eC7dKB5+KR47duxUgNju1hus5ufnc+LEiVXnm52dzVNHVp5neORtLes7E3v27Eku3LVqeNuqDajh87DZ76fRoLuSB44eXnVdDxxd/sUcbvT3wYNHv3Ra2fB5Hr6Pz3RnxXqfz7W+zpu9vq143Ufr3OzHDUw/IQiWsdk/ytthr+LjR87+nqpDhw7lyVUCzVKDwSA5ubZ559vZfY5vvPHG7HrzX89FF110Vuvpg3GfseU2+mdnZ7Nv376xn8m1TNuMI4RbHdCGj2XuoYeXnWfpEdGNhqjheib1eLeiC9250m2P6bDS9xDTSXe4c8RWdDnYLt0cNmqljTE/nBsfFvnEiRNpaww0TIez9Z5fz0bo0u4ko++/lbqabHQkxzNt79lw6nHuWH7/5fBI4Hoe77jP8kbOaTzZ1jU7nFN0edt+hKBzxFZ8+MbVOS3B6MnHVx/wYHZ2No8dXf+v9ugRneGP/mbtIZ7087fa+QYrnV+ylvfc2b5+zEY3zqflfbpdrHYUc9gF7tChQ2lPP7Up9a12HsyZfOct/bwu13V1ve+PB44eO61s0u+10XP+1mq7bLxt1nP5xNH174WZ1hHvnn5863oX+B5luxOC2FTb5cc0WWjrZu253Kw9xJN+/lZr95mOcDfaz34jT/Vq1x/ZaBfDjT7Pw/Y8vePxPPDE06vOtxFLg+PZ3MjY7A27EydOnHY4YC0bSkufr9Xel8s9vysNSz/fnmnXauvfzM/h6LrWs9G4lvf1Zr9+hw4dWtM5dTt37szMeReta+fGRi8ZMPoYVzoaOJz3bH1Wtvoo4DTaTr/3W23+8aNb3QTGEIJgm5ubm8vVV1+dl7/85Vu2N+7RVc4lmp+fT63hDMTlhkLfjK5MycaP2C0dsSsX7kqlVqxnpY3Y2dnZ3HfffUly2uu2dMNiszYy6oLn5cvPe8Gp7mPJ6Rt2df7z8+XnvSCHDx9ecYN1PRvzaxk5cLnna/R5Oj5/4tS8hw4dOjX/6Ib7ekL7WkYmXOuIg8N2tuPHTysfNxjKZjmTDfNxR3lPnDixpvB14sSJPPeCi3LjjTfmRz9w/4rrHz53owN2rCe4rfQYz9ZnZfi6PTQ4uKj8bF77bSuPqjiiMznTekSxr4Sgc8T8448tuj/tX2pnq32nhp3+0vLHHZ75gZvsHqyjhzd+5GHPnj35msuXn284lO5K1rqXdyutZSPxTIaAXu08r9H347hzTjYzjB3vNphH2zO60bzZr9eu7/im3PY/vSVJsm/fvmXm+ebs+difZjAY5MiRIxkMBrn22mtz7Ngz3bwOHTq0oSNw8/Pz2b9//7pHKhs+T8PzYObn5xfVvdYN93HtWW25pefXzMzMnHrfLX1/HF8SgIbt38zBUB48+uTCjZPr6861XODZaGiYn5/PU4dXDobLnZs0/Ay+8wOD/KPv3Fg32bM9HP7w875jx+K2j3vORt8H3/41P5q//ebdZ1TnVlxku69HdNZzlHo9r8do0Bku/8iXnkiy8P6/7777Fn0ep3lb7VwnBJ2Bqroqyb9OMpPk37fWfnaLm3TKer7Uxu2VfuBd/zhf/pZ/ddoXwP2/eH0ufeu7l13PRk9y3iynfryW30m/pnlWcuwsXmB1aPglOvo8rRSC1mKjG4vLWe3oz3JOLhm9bdwe/aVGR3xb68bbesLSuKMVZ9plbq3Tl9Y5fD5We72W21gafT6Xnp+zWvfCYXtGzys5duzYpoSO4foGg0Hq/PPSjhxdcWN+LUdqhuscdztZeLxzDz64cGctwWHHjuzZsyf3HPjTsXUsvYbMZnaZ2+je4bUc3dxI4JnfxK7Co/9XMgzdF1xwwaL36HJHlYYB60x2GGzk6PDoZ2/R++BrNtSERUZfq7V8XrfCcu3as2dP5h99el07qObm5vLa1742u3btyq5du/LUUwvfWcNtkdWupzc6femyo/OMO/K+ls/wWj/no9/rozvbTu1AG+kKsfTz2McAOi2EoA2qqpkk70rybUnuT/Lxqrq9tfbprW3Z+i23V/qBd/1IBoNHxn5AZ2dnM3hgcfnoxtPoD8ta93Ist8flTM6vGP1RXbreHTuSnFw4hWEwGOTXPnIyr/3+tS+/2UZ/yNdyTsTSH6BxP+ZnejRh9PVc60VNN7pBN7pxvdKGyXCeubm5VNWi8uqa2E4u7n7zvOc9LzMzM6tuiG2ke9HSx3va3v8dtejowf79+0/bcB93hGS57mHtyMK1ZVbbsB13fs5mHNFa6TkcThseMVnus/vsb399nvzV30x7/PBCF8Onnz613EZO7F/OYDBY11GTOv+CJEk7cnjFNqzlO2mlz8zwe+XkE8/sHV73d9yOHcnJk6feP2v5fA4Gg5ysZ46ordVwI3K4kTnqcx+8McfGtH0j51vOz8/nyJEjOXLkyKL36Goj3o07CreeOkef+7V8Zx4/fnzZz97SjfKnnnoqu3btWvNG/dDc3FweeOCBtNYWhb2lRxAe/dIji9q+dPp6AtTSHSvjzrk6fPjwqR0j49p10fNedNp34rigMqq1luPHj+fEU09nvhs6dHi0ZNgFeWZm5tTR6dFti9HpS38/hsEnyWnbOKOf4fX+Zo17DVc76js/ZkjU0e+IrTgCiBB0Jl6Z5EBr7fNJUlXvTXJNkomEoId/6RfzV37wrafu737+czPzggvXvAdm9Mtt/vEvnioffhn8yFesvPz9n92/4p7C0R/m4ZfPaiOFLbfHZWm4Wto9Z3TdD3dd3IY/wMM92UeOHFk0X5Jc8LzKC55f+cuDlfn5+fzlQxm7ITr8UV7NmQaOcT/kR7oudIPBIP/ld07mzd+bU/ePHz+eqqSNPNalG1JPPfVUWjvzXbqjXYdqx8Iev+GRoMFg8aAHw8P9V1999dgfvLXWt3///pyslTfUlj62mecnrZL5x545ejR8D+zcufO0H6nh+VTH55c/l2NpOB3X1qXdGxbZUYuO7C23jpU2ZIc/kHMPPXja1uVwT+pKBoNB2u2/n+RZYx/HsG1P1Yk8cPSJ09q20nrHhdXh87A08I2z0gbs4jDZ7UldQ6gZtuuBo+s/GXml4HTo0KFT7+vhe28wGGS+Tj+sPO69Ngztw/fkaD2rHZH4u7/5sWWnLfsc75hJTs6f+q5emG/1ELvUuO5+Tz/xaPbt25ejDx1MG7NcO7ny6/7RD/5M9n3g0Tz15NHUjpnT5l/uc5Is/s5bztIN1dFQsvR7Y/S1WfP7MafviEnG/44dP348+/fvP/XbNVzPaJfTJ7qRBUfrWNrOYfgabjwvbeu4IwxLg8pKR0xG1z/aE2H4Hbj08Q/vj4bC+WNPZ3Bo4TpWp51LOWK1HTFLg+bozpH77rvvVHtOHWEZs8NnWOe4upYe8R59zKuFyLnP/mkGTzx2KpiNM1zfuAERRusdPfLviNDkuVjqxl2S5Asj9+/vyjbk4C/9h3XM+67Tyv7Z/3hlbrvttmX3IDx0079Ikgxu+qkkydyffOrUl91Fz9uVmZEf540edVlqfn4+J5565otvtMvRUp+86TtO3T7++APZ/0vfniS555e+PcdHhrse7Z6zoxY2tj568985te75FbaPvnT4gdM2Qv/et+7KC563sNDwiNCePXvWvad8OP9KP8rnn1dju+CttrEwXO/RdQ7nXTtO/xFdambmmQ3Wd/3H1+d551Wef0FW3Kv8vPMWLhj6vPNr0d63pXtujx8/vqj+2pFccsklYwdImJmZOa3O+fn5NV8gdTXDNl5yySV5YObBRdOOHz9+Wj2f+NN719wtLUmOP/3U8lebP9lOTXvg6COnTx9p4/H5pzPuTTJc/6kf+h216PlqrS081yPLju55nJ+fTzt8+vDNQ8PPTzsyEoDGvVmXlM3Pz+eeA/8tdf55p01bLvA9cHQNV8pdeh2cnTPZsefi1Pnnr77sqXYdGDutqhZvuO7ceeqvzr/gtBA4NHx/L31fL7xP1/ZGXbTcks/m/Px8/ujAny9tbLLzWac+ozvOf+Ezz82OmUXP086dO1e8ftByHjz6dB7eccHC+pbx8NHFO3ee/exnJ+m68Zwc7hyZSS2zjnHfp186fChzc3PZ9ZzzctElly+77EYN39PHjh3L3Nxcnnji2Gmv3ahx5TtqJjtndq1Yz9Llnjwy/rtiXNfS0fKl3YRH7dy5MzM1s2iZE0+N2eE28jZ8+rHF6xtuZB87uvA8jJ5HuvQ3b35+PnOfuX/Rsms5cjj/6OIRM4evwdi2jjFTM9m141mnBculxrVnpmYWdTlbNK1Vdu3YmV0zz3yW5h/70mnzjW6jnGr7yI7Nh3/xQ2t6HMmZbUsdvOlXNrQc61ebsZe4j6rqjUmuaq19f3f/zUle1Vp768g8NyS5obv7VUm+eNqKTncoyXovRW+Z6V5mknVZ5txbZpJ1WebcW2aSdVlmupeZZF2WObNlvqy1tra9PmyY7nAbN5fkJSP3L+3KTmmt3Zzk5uH9qrp7tZW21vauZT7LbJ9lJlmXZc69ZSZZl2XOvWUmWZdlpnuZSdZlmTNeZrpGwzhH6Q63cR9PcllVvayqdiV5U5Lbt7hNAADAKhwJ2qDW2omqemuSO7MwRPYtrbVPbXGzAACAVQhBZ6C1dkeSO9axyM2rz7Ku+SyzfZaZZF2WOfeWmWRdljn3lplkXZaZ7mUmWZdlJvu6sk4GRgAAAHrFOUEAAECvrNodrqpekuTXk1yR5NlJRgdwX3kwdwAAgLOjjfw9mYUrQn8xCwOYvbm1tuxV21ftDldVL07yNd3d5yZ5VxYuO/78DC8/vnBEaXhUqZIcT/KcdTRemAIAAFYyzA3zSU5k4YDO0SSPJjkvyZ8l+UiSFyT549baTcutaN3nBFXVB5PsTvJ1o8VJRi+rPN816mR0uQMAANZv6cGS+SyMyjwMMCe72/cm+dokf5DkxUm+N8lPtNZev9yK1zU6XFW9NMnerjHPXjp5zHoFIAAAYCOGYaeW3B89IvSsJBd0ZRcluTjJ/UkuWWnFaw5BVXVekg9koavbaCNOzbKkUQAAAJO0pm5uawpBVfWsJL+VhXOChicYncgzYae6v2H3t2EQWhqIBCQAAGAthhlj9P7o/5ksHA063JUdysKRoUuTzK204rWMDldJ3t2t7OTIpCNZCEXpKnt6TEOT09PYcAQHXeUAAIDlLM0Vw/xwMs8MjPBEkhcleSwLA7d9MMl13f/lV7yG0eG+Kcl/XXeTAQAAzp7RIbKPZyEYfTHJJ5L8L62148stuO7R4QAAALYzXdIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAAIBeEYIAOKuq6ieq6p+uMP3aqrp8km0CoN+EIAC22rVJhCAAJsZ1ggDYdFX1v2Xhit0PJ/lCFi5c93iSG5LsSnIgyZuTXJHkt7tpjyf5u90q3pVkd5JjSX6gtfbZSbYfgHObEATApqqqVyR5T5JXJdmZ5J4kv5TkP7TWvtjN89NJHmqt/Zuqek+S326tvb+b9uEkP9ha+1xVvSrJz7TWXj35RwLAuWrnVjcAgHPO307ygdbasSSpqtu78pd34efCJOcluXPpglV1XpL/IclvVNWw+NlnvcUA9IoQBMCkvCfJta21P66q703yLWPm2ZHksdbaFRNsFwA9Y2AEADbb7yW5tqqeW1XnJ/n2rvz8JA9W1bOS/P2R+Y9009JaO5zkz6rqu5KkFvzNyTUdgD4QggDYVK21e5L8epI/TvKhJB/vJv0fST6W5A+SjA508N4kP1pVf1RVX5mFgHR9Vf1xkk8luWZSbQegHwyMAAAA9IojQQAAQK8IQQAAQK8IQQAAQK8IQQAAQK8IQQAAQK8IQQAAQK8IQQAAQK8IQQAAQK/8/waCZ4Fa3agYAAAAAElFTkSuQmCC\n", + "text/plain": [ + "
" + ] + }, + "metadata": { + "needs_background": "light" + }, + "output_type": "display_data" + } + ], "source": [ "## https://content.pivotal.io/blog/how-data-science-assists-sports\n", "## https://seaborn.pydata.org/generated/seaborn.lineplot.html\n", @@ -281,7 +366,7 @@ }, { "cell_type": "code", - "execution_count": 90, + "execution_count": 21, "metadata": {}, "outputs": [], "source": [ @@ -329,16 +414,27 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 22, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/plain": [ + "0.0" + ] + }, + "execution_count": 22, + "metadata": {}, + "output_type": "execute_result" + } + ], "source": [ "calculate_similarity_coefficient(['1'], ['2'])" ] }, { "cell_type": "code", - "execution_count": 91, + "execution_count": 23, "metadata": {}, "outputs": [ { @@ -1347,7 +1443,7 @@ " ...]" ] }, - "execution_count": 91, + "execution_count": 23, "metadata": {}, "output_type": "execute_result" } diff --git a/src/IndependentExpenditures/IndependentExpenditureJaccardIndex.ipynb b/src/IndependentExpenditures/IndependentExpenditureJaccardIndex.ipynb index 8579ae5..6a2d112 100644 --- a/src/IndependentExpenditures/IndependentExpenditureJaccardIndex.ipynb +++ b/src/IndependentExpenditures/IndependentExpenditureJaccardIndex.ipynb @@ -44,7 +44,7 @@ }, { "cell_type": "code", - "execution_count": 22, + "execution_count": 7, "metadata": {}, "outputs": [], "source": [ @@ -63,26 +63,46 @@ }, { "cell_type": "code", - "execution_count": 23, + "execution_count": 10, "metadata": {}, "outputs": [], "source": [ "# Instantiate variables for processing data moving forward\n", "spark = SparkSession.builder.appName('ElectionAnalyzer').getOrCreate()\n", - "datapath = '/Users/Dan/data/'\n", + "datapath = './data/'\n", "\n", "# Set the election year; modify this value to look at a different year\n", "election_year = \"2016\"\n", "\n", "# Set the file paths for the data file, based on the data path and election year\n", - "independent_expenditure_file = '{0}independent_expenditure_{1}.csv'.format(datapath, election_year)" + "independent_expenditure_file = '{0}{1}/independent_expenditure_{1}.csv'.format(datapath, election_year)" ] }, { "cell_type": "code", - "execution_count": 24, + "execution_count": 11, "metadata": {}, - "outputs": [], + "outputs": [ + { + "ename": "AnalysisException", + "evalue": "'Path does not exist: file:/Users/Dan/Desktop/git/FEC_data_notebooks/src/IndependentExpenditures/data/2016/independent_expenditure_2016.csv;'", + "output_type": "error", + "traceback": [ + "\u001b[0;31m------------------------------------------------------------------------\u001b[0m", + "\u001b[0;31mPy4JJavaError\u001b[0m Traceback (most recent call last)", + "\u001b[0;32m~/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/sql/utils.py\u001b[0m in \u001b[0;36mdeco\u001b[0;34m(*a, **kw)\u001b[0m\n\u001b[1;32m 62\u001b[0m \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 63\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mf\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0ma\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkw\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 64\u001b[0m \u001b[0;32mexcept\u001b[0m \u001b[0mpy4j\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mprotocol\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mPy4JJavaError\u001b[0m \u001b[0;32mas\u001b[0m \u001b[0me\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/py4j/protocol.py\u001b[0m in \u001b[0;36mget_return_value\u001b[0;34m(answer, gateway_client, target_id, name)\u001b[0m\n\u001b[1;32m 327\u001b[0m \u001b[0;34m\"An error occurred while calling {0}{1}{2}.\\n\"\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 328\u001b[0;31m format(target_id, \".\", name), value)\n\u001b[0m\u001b[1;32m 329\u001b[0m \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;31mPy4JJavaError\u001b[0m: An error occurred while calling o126.csv.\n: org.apache.spark.sql.AnalysisException: Path does not exist: file:/Users/Dan/Desktop/git/FEC_data_notebooks/src/IndependentExpenditures/data/2016/independent_expenditure_2016.csv;\n\tat org.apache.spark.sql.execution.datasources.DataSource$.org$apache$spark$sql$execution$datasources$DataSource$$checkAndGlobPathIfNecessary(DataSource.scala:715)\n\tat org.apache.spark.sql.execution.datasources.DataSource$$anonfun$15.apply(DataSource.scala:389)\n\tat org.apache.spark.sql.execution.datasources.DataSource$$anonfun$15.apply(DataSource.scala:389)\n\tat scala.collection.TraversableLike$$anonfun$flatMap$1.apply(TraversableLike.scala:241)\n\tat scala.collection.TraversableLike$$anonfun$flatMap$1.apply(TraversableLike.scala:241)\n\tat scala.collection.immutable.List.foreach(List.scala:381)\n\tat scala.collection.TraversableLike$class.flatMap(TraversableLike.scala:241)\n\tat scala.collection.immutable.List.flatMap(List.scala:344)\n\tat org.apache.spark.sql.execution.datasources.DataSource.resolveRelation(DataSource.scala:388)\n\tat org.apache.spark.sql.DataFrameReader.loadV1Source(DataFrameReader.scala:239)\n\tat org.apache.spark.sql.DataFrameReader.load(DataFrameReader.scala:227)\n\tat org.apache.spark.sql.DataFrameReader.csv(DataFrameReader.scala:596)\n\tat sun.reflect.NativeMethodAccessorImpl.invoke0(Native Method)\n\tat sun.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:62)\n\tat sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)\n\tat java.lang.reflect.Method.invoke(Method.java:498)\n\tat py4j.reflection.MethodInvoker.invoke(MethodInvoker.java:244)\n\tat py4j.reflection.ReflectionEngine.invoke(ReflectionEngine.java:357)\n\tat py4j.Gateway.invoke(Gateway.java:282)\n\tat py4j.commands.AbstractCommand.invokeMethod(AbstractCommand.java:132)\n\tat py4j.commands.CallCommand.execute(CallCommand.java:79)\n\tat py4j.GatewayConnection.run(GatewayConnection.java:238)\n\tat java.lang.Thread.run(Thread.java:745)\n", + "\nDuring handling of the above exception, another exception occurred:\n", + "\u001b[0;31mAnalysisException\u001b[0m Traceback (most recent call last)", + "\u001b[0;32m\u001b[0m in \u001b[0;36m\u001b[0;34m()\u001b[0m\n\u001b[1;32m 1\u001b[0m \u001b[0;31m# Read the CSV as a spark dataframe\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m----> 2\u001b[0;31m \u001b[0mind_exp\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mspark\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mread\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcsv\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mindependent_expenditure_file\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mheader\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mTrue\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 3\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 4\u001b[0m \u001b[0;31m# Convert the dataframe to an RDD, and\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 5\u001b[0m \u001b[0;31m# filter out the empty lines\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/sql/readwriter.py\u001b[0m in \u001b[0;36mcsv\u001b[0;34m(self, path, schema, sep, encoding, quote, escape, comment, header, inferSchema, ignoreLeadingWhiteSpace, ignoreTrailingWhiteSpace, nullValue, nanValue, positiveInf, negativeInf, dateFormat, timestampFormat, maxColumns, maxCharsPerColumn, maxMalformedLogPerPartition, mode, columnNameOfCorruptRecord, multiLine, charToEscapeQuoteEscaping)\u001b[0m\n\u001b[1;32m 439\u001b[0m \u001b[0mpath\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m[\u001b[0m\u001b[0mpath\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 440\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mtype\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mpath\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;34m==\u001b[0m \u001b[0mlist\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 441\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_df\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_jreader\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcsv\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_spark\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_sc\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_jvm\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mPythonUtils\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mtoSeq\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mpath\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 442\u001b[0m \u001b[0;32melif\u001b[0m \u001b[0misinstance\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mpath\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mRDD\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 443\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0mfunc\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0miterator\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/py4j/java_gateway.py\u001b[0m in \u001b[0;36m__call__\u001b[0;34m(self, *args)\u001b[0m\n\u001b[1;32m 1255\u001b[0m \u001b[0manswer\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mgateway_client\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msend_command\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mcommand\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1256\u001b[0m return_value = get_return_value(\n\u001b[0;32m-> 1257\u001b[0;31m answer, self.gateway_client, self.target_id, self.name)\n\u001b[0m\u001b[1;32m 1258\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1259\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mtemp_arg\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mtemp_args\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/sql/utils.py\u001b[0m in \u001b[0;36mdeco\u001b[0;34m(*a, **kw)\u001b[0m\n\u001b[1;32m 67\u001b[0m e.java_exception.getStackTrace()))\n\u001b[1;32m 68\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0ms\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mstartswith\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m'org.apache.spark.sql.AnalysisException: '\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 69\u001b[0;31m \u001b[0;32mraise\u001b[0m \u001b[0mAnalysisException\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0ms\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msplit\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m': '\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;36m1\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m1\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mstackTrace\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 70\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0ms\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mstartswith\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m'org.apache.spark.sql.catalyst.analysis'\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 71\u001b[0m \u001b[0;32mraise\u001b[0m \u001b[0mAnalysisException\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0ms\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msplit\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m': '\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;36m1\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m1\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mstackTrace\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;31mAnalysisException\u001b[0m: 'Path does not exist: file:/Users/Dan/Desktop/git/FEC_data_notebooks/src/IndependentExpenditures/data/2016/independent_expenditure_2016.csv;'" + ] + } + ], "source": [ "# Read the CSV as a spark dataframe\n", "ind_exp = spark.read.csv(independent_expenditure_file, header=True)\n", @@ -98,7 +118,7 @@ }, { "cell_type": "code", - "execution_count": 25, + "execution_count": 4, "metadata": {}, "outputs": [], "source": [ @@ -155,7 +175,7 @@ }, { "cell_type": "code", - "execution_count": 26, + "execution_count": 5, "metadata": {}, "outputs": [], "source": [ @@ -173,22 +193,22 @@ }, { "cell_type": "code", - "execution_count": 27, + "execution_count": 6, "metadata": {}, "outputs": [ { "ename": "Py4JJavaError", - "evalue": "An error occurred while calling z:org.apache.spark.api.python.PythonRDD.collectAndServe.\n: org.apache.spark.SparkException: Job aborted due to stage failure: Task 0 in stage 15.0 failed 1 times, most recent failure: Lost task 0.0 in stage 15.0 (TID 270, localhost, executor driver): org.apache.spark.api.python.PythonException: Traceback (most recent call last):\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/sql/types.py\", line 1556, in __getattr__\n idx = self.__fields__.index(item)\nValueError: 'cand_id' is not in list\n\nDuring handling of the above exception, another exception occurred:\n\nTraceback (most recent call last):\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/worker.py\", line 230, in main\n process()\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/worker.py\", line 225, in process\n serializer.dump_stream(func(split_index, iterator), outfile)\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 2457, in pipeline_func\n return func(split, prev_func(split, iterator))\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 2457, in pipeline_func\n return func(split, prev_func(split, iterator))\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 370, in func\n return f(iterator)\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 1876, in combineLocally\n merger.mergeValues(iterator)\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/shuffle.py\", line 237, in mergeValues\n for k, v in iterator:\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/util.py\", line 55, in wrapper\n return f(*args, **kwargs)\n File \"\", line 11, in \n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/sql/types.py\", line 1561, in __getattr__\n raise AttributeError(item)\nAttributeError: cand_id\n\n\tat org.apache.spark.api.python.BasePythonRunner$ReaderIterator.handlePythonException(PythonRunner.scala:298)\n\tat org.apache.spark.api.python.PythonRunner$$anon$1.read(PythonRunner.scala:438)\n\tat org.apache.spark.api.python.PythonRunner$$anon$1.read(PythonRunner.scala:421)\n\tat org.apache.spark.api.python.BasePythonRunner$ReaderIterator.hasNext(PythonRunner.scala:252)\n\tat org.apache.spark.InterruptibleIterator.hasNext(InterruptibleIterator.scala:37)\n\tat scala.collection.Iterator$GroupedIterator.fill(Iterator.scala:1126)\n\tat scala.collection.Iterator$GroupedIterator.hasNext(Iterator.scala:1132)\n\tat scala.collection.Iterator$$anon$11.hasNext(Iterator.scala:408)\n\tat org.apache.spark.shuffle.sort.BypassMergeSortShuffleWriter.write(BypassMergeSortShuffleWriter.java:125)\n\tat org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:96)\n\tat org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:53)\n\tat org.apache.spark.scheduler.Task.run(Task.scala:109)\n\tat org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:345)\n\tat java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1142)\n\tat java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:617)\n\tat java.lang.Thread.run(Thread.java:745)\n\nDriver stacktrace:\n\tat org.apache.spark.scheduler.DAGScheduler.org$apache$spark$scheduler$DAGScheduler$$failJobAndIndependentStages(DAGScheduler.scala:1602)\n\tat org.apache.spark.scheduler.DAGScheduler$$anonfun$abortStage$1.apply(DAGScheduler.scala:1590)\n\tat org.apache.spark.scheduler.DAGScheduler$$anonfun$abortStage$1.apply(DAGScheduler.scala:1589)\n\tat scala.collection.mutable.ResizableArray$class.foreach(ResizableArray.scala:59)\n\tat scala.collection.mutable.ArrayBuffer.foreach(ArrayBuffer.scala:48)\n\tat org.apache.spark.scheduler.DAGScheduler.abortStage(DAGScheduler.scala:1589)\n\tat org.apache.spark.scheduler.DAGScheduler$$anonfun$handleTaskSetFailed$1.apply(DAGScheduler.scala:831)\n\tat org.apache.spark.scheduler.DAGScheduler$$anonfun$handleTaskSetFailed$1.apply(DAGScheduler.scala:831)\n\tat scala.Option.foreach(Option.scala:257)\n\tat org.apache.spark.scheduler.DAGScheduler.handleTaskSetFailed(DAGScheduler.scala:831)\n\tat org.apache.spark.scheduler.DAGSchedulerEventProcessLoop.doOnReceive(DAGScheduler.scala:1823)\n\tat org.apache.spark.scheduler.DAGSchedulerEventProcessLoop.onReceive(DAGScheduler.scala:1772)\n\tat org.apache.spark.scheduler.DAGSchedulerEventProcessLoop.onReceive(DAGScheduler.scala:1761)\n\tat org.apache.spark.util.EventLoop$$anon$1.run(EventLoop.scala:48)\n\tat org.apache.spark.scheduler.DAGScheduler.runJob(DAGScheduler.scala:642)\n\tat org.apache.spark.SparkContext.runJob(SparkContext.scala:2034)\n\tat org.apache.spark.SparkContext.runJob(SparkContext.scala:2055)\n\tat org.apache.spark.SparkContext.runJob(SparkContext.scala:2074)\n\tat org.apache.spark.SparkContext.runJob(SparkContext.scala:2099)\n\tat org.apache.spark.rdd.RDD$$anonfun$collect$1.apply(RDD.scala:939)\n\tat org.apache.spark.rdd.RDDOperationScope$.withScope(RDDOperationScope.scala:151)\n\tat org.apache.spark.rdd.RDDOperationScope$.withScope(RDDOperationScope.scala:112)\n\tat org.apache.spark.rdd.RDD.withScope(RDD.scala:363)\n\tat org.apache.spark.rdd.RDD.collect(RDD.scala:938)\n\tat org.apache.spark.api.python.PythonRDD$.collectAndServe(PythonRDD.scala:162)\n\tat org.apache.spark.api.python.PythonRDD.collectAndServe(PythonRDD.scala)\n\tat sun.reflect.NativeMethodAccessorImpl.invoke0(Native Method)\n\tat sun.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:62)\n\tat sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)\n\tat java.lang.reflect.Method.invoke(Method.java:498)\n\tat py4j.reflection.MethodInvoker.invoke(MethodInvoker.java:244)\n\tat py4j.reflection.ReflectionEngine.invoke(ReflectionEngine.java:357)\n\tat py4j.Gateway.invoke(Gateway.java:282)\n\tat py4j.commands.AbstractCommand.invokeMethod(AbstractCommand.java:132)\n\tat py4j.commands.CallCommand.execute(CallCommand.java:79)\n\tat py4j.GatewayConnection.run(GatewayConnection.java:238)\n\tat java.lang.Thread.run(Thread.java:745)\nCaused by: org.apache.spark.api.python.PythonException: Traceback (most recent call last):\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/sql/types.py\", line 1556, in __getattr__\n idx = self.__fields__.index(item)\nValueError: 'cand_id' is not in list\n\nDuring handling of the above exception, another exception occurred:\n\nTraceback (most recent call last):\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/worker.py\", line 230, in main\n process()\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/worker.py\", line 225, in process\n serializer.dump_stream(func(split_index, iterator), outfile)\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 2457, in pipeline_func\n return func(split, prev_func(split, iterator))\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 2457, in pipeline_func\n return func(split, prev_func(split, iterator))\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 370, in func\n return f(iterator)\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 1876, in combineLocally\n merger.mergeValues(iterator)\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/shuffle.py\", line 237, in mergeValues\n for k, v in iterator:\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/util.py\", line 55, in wrapper\n return f(*args, **kwargs)\n File \"\", line 11, in \n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/sql/types.py\", line 1561, in __getattr__\n raise AttributeError(item)\nAttributeError: cand_id\n\n\tat org.apache.spark.api.python.BasePythonRunner$ReaderIterator.handlePythonException(PythonRunner.scala:298)\n\tat org.apache.spark.api.python.PythonRunner$$anon$1.read(PythonRunner.scala:438)\n\tat org.apache.spark.api.python.PythonRunner$$anon$1.read(PythonRunner.scala:421)\n\tat org.apache.spark.api.python.BasePythonRunner$ReaderIterator.hasNext(PythonRunner.scala:252)\n\tat org.apache.spark.InterruptibleIterator.hasNext(InterruptibleIterator.scala:37)\n\tat scala.collection.Iterator$GroupedIterator.fill(Iterator.scala:1126)\n\tat scala.collection.Iterator$GroupedIterator.hasNext(Iterator.scala:1132)\n\tat scala.collection.Iterator$$anon$11.hasNext(Iterator.scala:408)\n\tat org.apache.spark.shuffle.sort.BypassMergeSortShuffleWriter.write(BypassMergeSortShuffleWriter.java:125)\n\tat org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:96)\n\tat org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:53)\n\tat org.apache.spark.scheduler.Task.run(Task.scala:109)\n\tat org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:345)\n\tat java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1142)\n\tat java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:617)\n\t... 1 more\n", + "evalue": "An error occurred while calling z:org.apache.spark.api.python.PythonRDD.collectAndServe.\n: org.apache.spark.SparkException: Job aborted due to stage failure: Task 0 in stage 1.0 failed 1 times, most recent failure: Lost task 0.0 in stage 1.0 (TID 1, localhost, executor driver): org.apache.spark.api.python.PythonException: Traceback (most recent call last):\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/sql/types.py\", line 1556, in __getattr__\n idx = self.__fields__.index(item)\nValueError: 'cand_id' is not in list\n\nDuring handling of the above exception, another exception occurred:\n\nTraceback (most recent call last):\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/worker.py\", line 230, in main\n process()\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/worker.py\", line 225, in process\n serializer.dump_stream(func(split_index, iterator), outfile)\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 2457, in pipeline_func\n return func(split, prev_func(split, iterator))\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 2457, in pipeline_func\n return func(split, prev_func(split, iterator))\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 370, in func\n return f(iterator)\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 1876, in combineLocally\n merger.mergeValues(iterator)\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/shuffle.py\", line 237, in mergeValues\n for k, v in iterator:\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/util.py\", line 55, in wrapper\n return f(*args, **kwargs)\n File \"\", line 11, in \n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/sql/types.py\", line 1561, in __getattr__\n raise AttributeError(item)\nAttributeError: cand_id\n\n\tat org.apache.spark.api.python.BasePythonRunner$ReaderIterator.handlePythonException(PythonRunner.scala:298)\n\tat org.apache.spark.api.python.PythonRunner$$anon$1.read(PythonRunner.scala:438)\n\tat org.apache.spark.api.python.PythonRunner$$anon$1.read(PythonRunner.scala:421)\n\tat org.apache.spark.api.python.BasePythonRunner$ReaderIterator.hasNext(PythonRunner.scala:252)\n\tat org.apache.spark.InterruptibleIterator.hasNext(InterruptibleIterator.scala:37)\n\tat scala.collection.Iterator$GroupedIterator.fill(Iterator.scala:1126)\n\tat scala.collection.Iterator$GroupedIterator.hasNext(Iterator.scala:1132)\n\tat scala.collection.Iterator$$anon$11.hasNext(Iterator.scala:408)\n\tat org.apache.spark.shuffle.sort.BypassMergeSortShuffleWriter.write(BypassMergeSortShuffleWriter.java:125)\n\tat org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:96)\n\tat org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:53)\n\tat org.apache.spark.scheduler.Task.run(Task.scala:109)\n\tat org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:345)\n\tat java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1142)\n\tat java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:617)\n\tat java.lang.Thread.run(Thread.java:745)\n\nDriver stacktrace:\n\tat org.apache.spark.scheduler.DAGScheduler.org$apache$spark$scheduler$DAGScheduler$$failJobAndIndependentStages(DAGScheduler.scala:1602)\n\tat org.apache.spark.scheduler.DAGScheduler$$anonfun$abortStage$1.apply(DAGScheduler.scala:1590)\n\tat org.apache.spark.scheduler.DAGScheduler$$anonfun$abortStage$1.apply(DAGScheduler.scala:1589)\n\tat scala.collection.mutable.ResizableArray$class.foreach(ResizableArray.scala:59)\n\tat scala.collection.mutable.ArrayBuffer.foreach(ArrayBuffer.scala:48)\n\tat org.apache.spark.scheduler.DAGScheduler.abortStage(DAGScheduler.scala:1589)\n\tat org.apache.spark.scheduler.DAGScheduler$$anonfun$handleTaskSetFailed$1.apply(DAGScheduler.scala:831)\n\tat org.apache.spark.scheduler.DAGScheduler$$anonfun$handleTaskSetFailed$1.apply(DAGScheduler.scala:831)\n\tat scala.Option.foreach(Option.scala:257)\n\tat org.apache.spark.scheduler.DAGScheduler.handleTaskSetFailed(DAGScheduler.scala:831)\n\tat org.apache.spark.scheduler.DAGSchedulerEventProcessLoop.doOnReceive(DAGScheduler.scala:1823)\n\tat org.apache.spark.scheduler.DAGSchedulerEventProcessLoop.onReceive(DAGScheduler.scala:1772)\n\tat org.apache.spark.scheduler.DAGSchedulerEventProcessLoop.onReceive(DAGScheduler.scala:1761)\n\tat org.apache.spark.util.EventLoop$$anon$1.run(EventLoop.scala:48)\n\tat org.apache.spark.scheduler.DAGScheduler.runJob(DAGScheduler.scala:642)\n\tat org.apache.spark.SparkContext.runJob(SparkContext.scala:2034)\n\tat org.apache.spark.SparkContext.runJob(SparkContext.scala:2055)\n\tat org.apache.spark.SparkContext.runJob(SparkContext.scala:2074)\n\tat org.apache.spark.SparkContext.runJob(SparkContext.scala:2099)\n\tat org.apache.spark.rdd.RDD$$anonfun$collect$1.apply(RDD.scala:939)\n\tat org.apache.spark.rdd.RDDOperationScope$.withScope(RDDOperationScope.scala:151)\n\tat org.apache.spark.rdd.RDDOperationScope$.withScope(RDDOperationScope.scala:112)\n\tat org.apache.spark.rdd.RDD.withScope(RDD.scala:363)\n\tat org.apache.spark.rdd.RDD.collect(RDD.scala:938)\n\tat org.apache.spark.api.python.PythonRDD$.collectAndServe(PythonRDD.scala:162)\n\tat org.apache.spark.api.python.PythonRDD.collectAndServe(PythonRDD.scala)\n\tat sun.reflect.NativeMethodAccessorImpl.invoke0(Native Method)\n\tat sun.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:62)\n\tat sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)\n\tat java.lang.reflect.Method.invoke(Method.java:498)\n\tat py4j.reflection.MethodInvoker.invoke(MethodInvoker.java:244)\n\tat py4j.reflection.ReflectionEngine.invoke(ReflectionEngine.java:357)\n\tat py4j.Gateway.invoke(Gateway.java:282)\n\tat py4j.commands.AbstractCommand.invokeMethod(AbstractCommand.java:132)\n\tat py4j.commands.CallCommand.execute(CallCommand.java:79)\n\tat py4j.GatewayConnection.run(GatewayConnection.java:238)\n\tat java.lang.Thread.run(Thread.java:745)\nCaused by: org.apache.spark.api.python.PythonException: Traceback (most recent call last):\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/sql/types.py\", line 1556, in __getattr__\n idx = self.__fields__.index(item)\nValueError: 'cand_id' is not in list\n\nDuring handling of the above exception, another exception occurred:\n\nTraceback (most recent call last):\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/worker.py\", line 230, in main\n process()\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/worker.py\", line 225, in process\n serializer.dump_stream(func(split_index, iterator), outfile)\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 2457, in pipeline_func\n return func(split, prev_func(split, iterator))\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 2457, in pipeline_func\n return func(split, prev_func(split, iterator))\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 370, in func\n return f(iterator)\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 1876, in combineLocally\n merger.mergeValues(iterator)\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/shuffle.py\", line 237, in mergeValues\n for k, v in iterator:\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/util.py\", line 55, in wrapper\n return f(*args, **kwargs)\n File \"\", line 11, in \n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/sql/types.py\", line 1561, in __getattr__\n raise AttributeError(item)\nAttributeError: cand_id\n\n\tat org.apache.spark.api.python.BasePythonRunner$ReaderIterator.handlePythonException(PythonRunner.scala:298)\n\tat org.apache.spark.api.python.PythonRunner$$anon$1.read(PythonRunner.scala:438)\n\tat org.apache.spark.api.python.PythonRunner$$anon$1.read(PythonRunner.scala:421)\n\tat org.apache.spark.api.python.BasePythonRunner$ReaderIterator.hasNext(PythonRunner.scala:252)\n\tat org.apache.spark.InterruptibleIterator.hasNext(InterruptibleIterator.scala:37)\n\tat scala.collection.Iterator$GroupedIterator.fill(Iterator.scala:1126)\n\tat scala.collection.Iterator$GroupedIterator.hasNext(Iterator.scala:1132)\n\tat scala.collection.Iterator$$anon$11.hasNext(Iterator.scala:408)\n\tat org.apache.spark.shuffle.sort.BypassMergeSortShuffleWriter.write(BypassMergeSortShuffleWriter.java:125)\n\tat org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:96)\n\tat org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:53)\n\tat org.apache.spark.scheduler.Task.run(Task.scala:109)\n\tat org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:345)\n\tat java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1142)\n\tat java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:617)\n\t... 1 more\n", "output_type": "error", "traceback": [ "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", "\u001b[0;31mPy4JJavaError\u001b[0m Traceback (most recent call last)", - "\u001b[0;32m\u001b[0m in \u001b[0;36m\u001b[0;34m()\u001b[0m\n\u001b[1;32m 1\u001b[0m \u001b[0;31m# Collect the (similarity, candidate pair) RDD, printing to the console\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m----> 2\u001b[0;31m \u001b[0mcandidate_pairs_with_jaccard_index\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msortByKey\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;32mFalse\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcollect\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m", - "\u001b[0;32m~/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\u001b[0m in \u001b[0;36mcollect\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 832\u001b[0m \"\"\"\n\u001b[1;32m 833\u001b[0m \u001b[0;32mwith\u001b[0m \u001b[0mSCCallSiteSync\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcontext\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mas\u001b[0m \u001b[0mcss\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 834\u001b[0;31m \u001b[0msock_info\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mctx\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_jvm\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mPythonRDD\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcollectAndServe\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_jrdd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mrdd\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 835\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0mlist\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0m_load_from_socket\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0msock_info\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_jrdd_deserializer\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 836\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/py4j/java_gateway.py\u001b[0m in \u001b[0;36m__call__\u001b[0;34m(self, *args)\u001b[0m\n\u001b[1;32m 1255\u001b[0m \u001b[0manswer\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mgateway_client\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msend_command\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mcommand\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1256\u001b[0m return_value = get_return_value(\n\u001b[0;32m-> 1257\u001b[0;31m answer, self.gateway_client, self.target_id, self.name)\n\u001b[0m\u001b[1;32m 1258\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1259\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mtemp_arg\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mtemp_args\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/sql/utils.py\u001b[0m in \u001b[0;36mdeco\u001b[0;34m(*a, **kw)\u001b[0m\n\u001b[1;32m 61\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0mdeco\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0ma\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkw\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 62\u001b[0m \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 63\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mf\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0ma\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkw\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 64\u001b[0m \u001b[0;32mexcept\u001b[0m \u001b[0mpy4j\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mprotocol\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mPy4JJavaError\u001b[0m \u001b[0;32mas\u001b[0m \u001b[0me\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 65\u001b[0m \u001b[0ms\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0me\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mjava_exception\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mtoString\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", - "\u001b[0;32m~/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/py4j/protocol.py\u001b[0m in \u001b[0;36mget_return_value\u001b[0;34m(answer, gateway_client, target_id, name)\u001b[0m\n\u001b[1;32m 326\u001b[0m raise Py4JJavaError(\n\u001b[1;32m 327\u001b[0m \u001b[0;34m\"An error occurred while calling {0}{1}{2}.\\n\"\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 328\u001b[0;31m format(target_id, \".\", name), value)\n\u001b[0m\u001b[1;32m 329\u001b[0m \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 330\u001b[0m raise Py4JError(\n", - "\u001b[0;31mPy4JJavaError\u001b[0m: An error occurred while calling z:org.apache.spark.api.python.PythonRDD.collectAndServe.\n: org.apache.spark.SparkException: Job aborted due to stage failure: Task 0 in stage 15.0 failed 1 times, most recent failure: Lost task 0.0 in stage 15.0 (TID 270, localhost, executor driver): org.apache.spark.api.python.PythonException: Traceback (most recent call last):\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/sql/types.py\", line 1556, in __getattr__\n idx = self.__fields__.index(item)\nValueError: 'cand_id' is not in list\n\nDuring handling of the above exception, another exception occurred:\n\nTraceback (most recent call last):\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/worker.py\", line 230, in main\n process()\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/worker.py\", line 225, in process\n serializer.dump_stream(func(split_index, iterator), outfile)\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 2457, in pipeline_func\n return func(split, prev_func(split, iterator))\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 2457, in pipeline_func\n return func(split, prev_func(split, iterator))\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 370, in func\n return f(iterator)\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 1876, in combineLocally\n merger.mergeValues(iterator)\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/shuffle.py\", line 237, in mergeValues\n for k, v in iterator:\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/util.py\", line 55, in wrapper\n return f(*args, **kwargs)\n File \"\", line 11, in \n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/sql/types.py\", line 1561, in __getattr__\n raise AttributeError(item)\nAttributeError: cand_id\n\n\tat org.apache.spark.api.python.BasePythonRunner$ReaderIterator.handlePythonException(PythonRunner.scala:298)\n\tat org.apache.spark.api.python.PythonRunner$$anon$1.read(PythonRunner.scala:438)\n\tat org.apache.spark.api.python.PythonRunner$$anon$1.read(PythonRunner.scala:421)\n\tat org.apache.spark.api.python.BasePythonRunner$ReaderIterator.hasNext(PythonRunner.scala:252)\n\tat org.apache.spark.InterruptibleIterator.hasNext(InterruptibleIterator.scala:37)\n\tat scala.collection.Iterator$GroupedIterator.fill(Iterator.scala:1126)\n\tat scala.collection.Iterator$GroupedIterator.hasNext(Iterator.scala:1132)\n\tat scala.collection.Iterator$$anon$11.hasNext(Iterator.scala:408)\n\tat org.apache.spark.shuffle.sort.BypassMergeSortShuffleWriter.write(BypassMergeSortShuffleWriter.java:125)\n\tat org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:96)\n\tat org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:53)\n\tat org.apache.spark.scheduler.Task.run(Task.scala:109)\n\tat org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:345)\n\tat java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1142)\n\tat java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:617)\n\tat java.lang.Thread.run(Thread.java:745)\n\nDriver stacktrace:\n\tat org.apache.spark.scheduler.DAGScheduler.org$apache$spark$scheduler$DAGScheduler$$failJobAndIndependentStages(DAGScheduler.scala:1602)\n\tat org.apache.spark.scheduler.DAGScheduler$$anonfun$abortStage$1.apply(DAGScheduler.scala:1590)\n\tat org.apache.spark.scheduler.DAGScheduler$$anonfun$abortStage$1.apply(DAGScheduler.scala:1589)\n\tat scala.collection.mutable.ResizableArray$class.foreach(ResizableArray.scala:59)\n\tat scala.collection.mutable.ArrayBuffer.foreach(ArrayBuffer.scala:48)\n\tat org.apache.spark.scheduler.DAGScheduler.abortStage(DAGScheduler.scala:1589)\n\tat org.apache.spark.scheduler.DAGScheduler$$anonfun$handleTaskSetFailed$1.apply(DAGScheduler.scala:831)\n\tat org.apache.spark.scheduler.DAGScheduler$$anonfun$handleTaskSetFailed$1.apply(DAGScheduler.scala:831)\n\tat scala.Option.foreach(Option.scala:257)\n\tat org.apache.spark.scheduler.DAGScheduler.handleTaskSetFailed(DAGScheduler.scala:831)\n\tat org.apache.spark.scheduler.DAGSchedulerEventProcessLoop.doOnReceive(DAGScheduler.scala:1823)\n\tat org.apache.spark.scheduler.DAGSchedulerEventProcessLoop.onReceive(DAGScheduler.scala:1772)\n\tat org.apache.spark.scheduler.DAGSchedulerEventProcessLoop.onReceive(DAGScheduler.scala:1761)\n\tat org.apache.spark.util.EventLoop$$anon$1.run(EventLoop.scala:48)\n\tat org.apache.spark.scheduler.DAGScheduler.runJob(DAGScheduler.scala:642)\n\tat org.apache.spark.SparkContext.runJob(SparkContext.scala:2034)\n\tat org.apache.spark.SparkContext.runJob(SparkContext.scala:2055)\n\tat org.apache.spark.SparkContext.runJob(SparkContext.scala:2074)\n\tat org.apache.spark.SparkContext.runJob(SparkContext.scala:2099)\n\tat org.apache.spark.rdd.RDD$$anonfun$collect$1.apply(RDD.scala:939)\n\tat org.apache.spark.rdd.RDDOperationScope$.withScope(RDDOperationScope.scala:151)\n\tat org.apache.spark.rdd.RDDOperationScope$.withScope(RDDOperationScope.scala:112)\n\tat org.apache.spark.rdd.RDD.withScope(RDD.scala:363)\n\tat org.apache.spark.rdd.RDD.collect(RDD.scala:938)\n\tat org.apache.spark.api.python.PythonRDD$.collectAndServe(PythonRDD.scala:162)\n\tat org.apache.spark.api.python.PythonRDD.collectAndServe(PythonRDD.scala)\n\tat sun.reflect.NativeMethodAccessorImpl.invoke0(Native Method)\n\tat sun.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:62)\n\tat sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)\n\tat java.lang.reflect.Method.invoke(Method.java:498)\n\tat py4j.reflection.MethodInvoker.invoke(MethodInvoker.java:244)\n\tat py4j.reflection.ReflectionEngine.invoke(ReflectionEngine.java:357)\n\tat py4j.Gateway.invoke(Gateway.java:282)\n\tat py4j.commands.AbstractCommand.invokeMethod(AbstractCommand.java:132)\n\tat py4j.commands.CallCommand.execute(CallCommand.java:79)\n\tat py4j.GatewayConnection.run(GatewayConnection.java:238)\n\tat java.lang.Thread.run(Thread.java:745)\nCaused by: org.apache.spark.api.python.PythonException: Traceback (most recent call last):\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/sql/types.py\", line 1556, in __getattr__\n idx = self.__fields__.index(item)\nValueError: 'cand_id' is not in list\n\nDuring handling of the above exception, another exception occurred:\n\nTraceback (most recent call last):\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/worker.py\", line 230, in main\n process()\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/worker.py\", line 225, in process\n serializer.dump_stream(func(split_index, iterator), outfile)\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 2457, in pipeline_func\n return func(split, prev_func(split, iterator))\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 2457, in pipeline_func\n return func(split, prev_func(split, iterator))\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 370, in func\n return f(iterator)\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 1876, in combineLocally\n merger.mergeValues(iterator)\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/shuffle.py\", line 237, in mergeValues\n for k, v in iterator:\n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/util.py\", line 55, in wrapper\n return f(*args, **kwargs)\n File \"\", line 11, in \n File \"/Users/Dan/Desktop/stagingArea/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/sql/types.py\", line 1561, in __getattr__\n raise AttributeError(item)\nAttributeError: cand_id\n\n\tat org.apache.spark.api.python.BasePythonRunner$ReaderIterator.handlePythonException(PythonRunner.scala:298)\n\tat org.apache.spark.api.python.PythonRunner$$anon$1.read(PythonRunner.scala:438)\n\tat org.apache.spark.api.python.PythonRunner$$anon$1.read(PythonRunner.scala:421)\n\tat org.apache.spark.api.python.BasePythonRunner$ReaderIterator.hasNext(PythonRunner.scala:252)\n\tat org.apache.spark.InterruptibleIterator.hasNext(InterruptibleIterator.scala:37)\n\tat scala.collection.Iterator$GroupedIterator.fill(Iterator.scala:1126)\n\tat scala.collection.Iterator$GroupedIterator.hasNext(Iterator.scala:1132)\n\tat scala.collection.Iterator$$anon$11.hasNext(Iterator.scala:408)\n\tat org.apache.spark.shuffle.sort.BypassMergeSortShuffleWriter.write(BypassMergeSortShuffleWriter.java:125)\n\tat org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:96)\n\tat org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:53)\n\tat org.apache.spark.scheduler.Task.run(Task.scala:109)\n\tat org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:345)\n\tat java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1142)\n\tat java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:617)\n\t... 1 more\n" + "\u001b[0;32m\u001b[0m in \u001b[0;36m\u001b[0;34m()\u001b[0m\n\u001b[1;32m 1\u001b[0m \u001b[0;31m# Collect the (similarity, candidate pair) RDD, printing to the console\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m----> 2\u001b[0;31m \u001b[0mcandidate_pairs_with_jaccard_index\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msortByKey\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;32mFalse\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcollect\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m", + "\u001b[0;32m~/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\u001b[0m in \u001b[0;36mcollect\u001b[0;34m(self)\u001b[0m\n\u001b[1;32m 832\u001b[0m \"\"\"\n\u001b[1;32m 833\u001b[0m \u001b[0;32mwith\u001b[0m \u001b[0mSCCallSiteSync\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcontext\u001b[0m\u001b[0;34m)\u001b[0m \u001b[0;32mas\u001b[0m \u001b[0mcss\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 834\u001b[0;31m \u001b[0msock_info\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mctx\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_jvm\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mPythonRDD\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcollectAndServe\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_jrdd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mrdd\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 835\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0mlist\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0m_load_from_socket\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0msock_info\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_jrdd_deserializer\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 836\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/py4j/java_gateway.py\u001b[0m in \u001b[0;36m__call__\u001b[0;34m(self, *args)\u001b[0m\n\u001b[1;32m 1255\u001b[0m \u001b[0manswer\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mgateway_client\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msend_command\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mcommand\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1256\u001b[0m return_value = get_return_value(\n\u001b[0;32m-> 1257\u001b[0;31m answer, self.gateway_client, self.target_id, self.name)\n\u001b[0m\u001b[1;32m 1258\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 1259\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mtemp_arg\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mtemp_args\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/sql/utils.py\u001b[0m in \u001b[0;36mdeco\u001b[0;34m(*a, **kw)\u001b[0m\n\u001b[1;32m 61\u001b[0m \u001b[0;32mdef\u001b[0m \u001b[0mdeco\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0ma\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkw\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 62\u001b[0m \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 63\u001b[0;31m \u001b[0;32mreturn\u001b[0m \u001b[0mf\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m*\u001b[0m\u001b[0ma\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m**\u001b[0m\u001b[0mkw\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 64\u001b[0m \u001b[0;32mexcept\u001b[0m \u001b[0mpy4j\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mprotocol\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mPy4JJavaError\u001b[0m \u001b[0;32mas\u001b[0m \u001b[0me\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 65\u001b[0m \u001b[0ms\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0me\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mjava_exception\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mtoString\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;32m~/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/py4j/protocol.py\u001b[0m in \u001b[0;36mget_return_value\u001b[0;34m(answer, gateway_client, target_id, name)\u001b[0m\n\u001b[1;32m 326\u001b[0m raise Py4JJavaError(\n\u001b[1;32m 327\u001b[0m \u001b[0;34m\"An error occurred while calling {0}{1}{2}.\\n\"\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 328\u001b[0;31m format(target_id, \".\", name), value)\n\u001b[0m\u001b[1;32m 329\u001b[0m \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 330\u001b[0m raise Py4JError(\n", + "\u001b[0;31mPy4JJavaError\u001b[0m: An error occurred while calling z:org.apache.spark.api.python.PythonRDD.collectAndServe.\n: org.apache.spark.SparkException: Job aborted due to stage failure: Task 0 in stage 1.0 failed 1 times, most recent failure: Lost task 0.0 in stage 1.0 (TID 1, localhost, executor driver): org.apache.spark.api.python.PythonException: Traceback (most recent call last):\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/sql/types.py\", line 1556, in __getattr__\n idx = self.__fields__.index(item)\nValueError: 'cand_id' is not in list\n\nDuring handling of the above exception, another exception occurred:\n\nTraceback (most recent call last):\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/worker.py\", line 230, in main\n process()\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/worker.py\", line 225, in process\n serializer.dump_stream(func(split_index, iterator), outfile)\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 2457, in pipeline_func\n return func(split, prev_func(split, iterator))\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 2457, in pipeline_func\n return func(split, prev_func(split, iterator))\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 370, in func\n return f(iterator)\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 1876, in combineLocally\n merger.mergeValues(iterator)\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/shuffle.py\", line 237, in mergeValues\n for k, v in iterator:\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/util.py\", line 55, in wrapper\n return f(*args, **kwargs)\n File \"\", line 11, in \n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/sql/types.py\", line 1561, in __getattr__\n raise AttributeError(item)\nAttributeError: cand_id\n\n\tat org.apache.spark.api.python.BasePythonRunner$ReaderIterator.handlePythonException(PythonRunner.scala:298)\n\tat org.apache.spark.api.python.PythonRunner$$anon$1.read(PythonRunner.scala:438)\n\tat org.apache.spark.api.python.PythonRunner$$anon$1.read(PythonRunner.scala:421)\n\tat org.apache.spark.api.python.BasePythonRunner$ReaderIterator.hasNext(PythonRunner.scala:252)\n\tat org.apache.spark.InterruptibleIterator.hasNext(InterruptibleIterator.scala:37)\n\tat scala.collection.Iterator$GroupedIterator.fill(Iterator.scala:1126)\n\tat scala.collection.Iterator$GroupedIterator.hasNext(Iterator.scala:1132)\n\tat scala.collection.Iterator$$anon$11.hasNext(Iterator.scala:408)\n\tat org.apache.spark.shuffle.sort.BypassMergeSortShuffleWriter.write(BypassMergeSortShuffleWriter.java:125)\n\tat org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:96)\n\tat org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:53)\n\tat org.apache.spark.scheduler.Task.run(Task.scala:109)\n\tat org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:345)\n\tat java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1142)\n\tat java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:617)\n\tat java.lang.Thread.run(Thread.java:745)\n\nDriver stacktrace:\n\tat org.apache.spark.scheduler.DAGScheduler.org$apache$spark$scheduler$DAGScheduler$$failJobAndIndependentStages(DAGScheduler.scala:1602)\n\tat org.apache.spark.scheduler.DAGScheduler$$anonfun$abortStage$1.apply(DAGScheduler.scala:1590)\n\tat org.apache.spark.scheduler.DAGScheduler$$anonfun$abortStage$1.apply(DAGScheduler.scala:1589)\n\tat scala.collection.mutable.ResizableArray$class.foreach(ResizableArray.scala:59)\n\tat scala.collection.mutable.ArrayBuffer.foreach(ArrayBuffer.scala:48)\n\tat org.apache.spark.scheduler.DAGScheduler.abortStage(DAGScheduler.scala:1589)\n\tat org.apache.spark.scheduler.DAGScheduler$$anonfun$handleTaskSetFailed$1.apply(DAGScheduler.scala:831)\n\tat org.apache.spark.scheduler.DAGScheduler$$anonfun$handleTaskSetFailed$1.apply(DAGScheduler.scala:831)\n\tat scala.Option.foreach(Option.scala:257)\n\tat org.apache.spark.scheduler.DAGScheduler.handleTaskSetFailed(DAGScheduler.scala:831)\n\tat org.apache.spark.scheduler.DAGSchedulerEventProcessLoop.doOnReceive(DAGScheduler.scala:1823)\n\tat org.apache.spark.scheduler.DAGSchedulerEventProcessLoop.onReceive(DAGScheduler.scala:1772)\n\tat org.apache.spark.scheduler.DAGSchedulerEventProcessLoop.onReceive(DAGScheduler.scala:1761)\n\tat org.apache.spark.util.EventLoop$$anon$1.run(EventLoop.scala:48)\n\tat org.apache.spark.scheduler.DAGScheduler.runJob(DAGScheduler.scala:642)\n\tat org.apache.spark.SparkContext.runJob(SparkContext.scala:2034)\n\tat org.apache.spark.SparkContext.runJob(SparkContext.scala:2055)\n\tat org.apache.spark.SparkContext.runJob(SparkContext.scala:2074)\n\tat org.apache.spark.SparkContext.runJob(SparkContext.scala:2099)\n\tat org.apache.spark.rdd.RDD$$anonfun$collect$1.apply(RDD.scala:939)\n\tat org.apache.spark.rdd.RDDOperationScope$.withScope(RDDOperationScope.scala:151)\n\tat org.apache.spark.rdd.RDDOperationScope$.withScope(RDDOperationScope.scala:112)\n\tat org.apache.spark.rdd.RDD.withScope(RDD.scala:363)\n\tat org.apache.spark.rdd.RDD.collect(RDD.scala:938)\n\tat org.apache.spark.api.python.PythonRDD$.collectAndServe(PythonRDD.scala:162)\n\tat org.apache.spark.api.python.PythonRDD.collectAndServe(PythonRDD.scala)\n\tat sun.reflect.NativeMethodAccessorImpl.invoke0(Native Method)\n\tat sun.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:62)\n\tat sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)\n\tat java.lang.reflect.Method.invoke(Method.java:498)\n\tat py4j.reflection.MethodInvoker.invoke(MethodInvoker.java:244)\n\tat py4j.reflection.ReflectionEngine.invoke(ReflectionEngine.java:357)\n\tat py4j.Gateway.invoke(Gateway.java:282)\n\tat py4j.commands.AbstractCommand.invokeMethod(AbstractCommand.java:132)\n\tat py4j.commands.CallCommand.execute(CallCommand.java:79)\n\tat py4j.GatewayConnection.run(GatewayConnection.java:238)\n\tat java.lang.Thread.run(Thread.java:745)\nCaused by: org.apache.spark.api.python.PythonException: Traceback (most recent call last):\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/sql/types.py\", line 1556, in __getattr__\n idx = self.__fields__.index(item)\nValueError: 'cand_id' is not in list\n\nDuring handling of the above exception, another exception occurred:\n\nTraceback (most recent call last):\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/worker.py\", line 230, in main\n process()\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/worker.py\", line 225, in process\n serializer.dump_stream(func(split_index, iterator), outfile)\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 2457, in pipeline_func\n return func(split, prev_func(split, iterator))\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 2457, in pipeline_func\n return func(split, prev_func(split, iterator))\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 370, in func\n return f(iterator)\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/rdd.py\", line 1876, in combineLocally\n merger.mergeValues(iterator)\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/shuffle.py\", line 237, in mergeValues\n for k, v in iterator:\n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/util.py\", line 55, in wrapper\n return f(*args, **kwargs)\n File \"\", line 11, in \n File \"/Users/Dan/Desktop/git/FEC_data_notebooks/FEC_data_notebook/lib/python3.6/site-packages/pyspark/python/lib/pyspark.zip/pyspark/sql/types.py\", line 1561, in __getattr__\n raise AttributeError(item)\nAttributeError: cand_id\n\n\tat org.apache.spark.api.python.BasePythonRunner$ReaderIterator.handlePythonException(PythonRunner.scala:298)\n\tat org.apache.spark.api.python.PythonRunner$$anon$1.read(PythonRunner.scala:438)\n\tat org.apache.spark.api.python.PythonRunner$$anon$1.read(PythonRunner.scala:421)\n\tat org.apache.spark.api.python.BasePythonRunner$ReaderIterator.hasNext(PythonRunner.scala:252)\n\tat org.apache.spark.InterruptibleIterator.hasNext(InterruptibleIterator.scala:37)\n\tat scala.collection.Iterator$GroupedIterator.fill(Iterator.scala:1126)\n\tat scala.collection.Iterator$GroupedIterator.hasNext(Iterator.scala:1132)\n\tat scala.collection.Iterator$$anon$11.hasNext(Iterator.scala:408)\n\tat org.apache.spark.shuffle.sort.BypassMergeSortShuffleWriter.write(BypassMergeSortShuffleWriter.java:125)\n\tat org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:96)\n\tat org.apache.spark.scheduler.ShuffleMapTask.runTask(ShuffleMapTask.scala:53)\n\tat org.apache.spark.scheduler.Task.run(Task.scala:109)\n\tat org.apache.spark.executor.Executor$TaskRunner.run(Executor.scala:345)\n\tat java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1142)\n\tat java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:617)\n\t... 1 more\n" ] } ], diff --git a/start.sh b/start.sh new file mode 100755 index 0000000..abe119c --- /dev/null +++ b/start.sh @@ -0,0 +1,3 @@ +#!/bin/bash +source ./activate && export FEC_data_path=./data && cd ./src && jupyter notebook +