{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "### Ok Ok, lets start with the reference-data\n" ] }, { "cell_type": "code", "execution_count": 59, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:37:27.990889Z", "start_time": "2018-06-07T10:37:27.973219Z" } }, "outputs": [ { "data": { "text/plain": [ "{2009: ['pre-school-data-0910-3.xlsx',\n", " 'post-primary-schools-data-0910-supp-2.xlsx',\n", " 'primary-schools-data-0910-supp-r.xlsx',\n", " 'special-school-data-0910-supp-3.xlsx',\n", " 'nursery-schools-data-0910-supp-3.xlsx'],\n", " 2010: ['special-school-data-1011-supp-2.xlsx',\n", " 'primary-schools-data-1011-supp-inc-unfilled-r.xlsx',\n", " 'post-primary-schools-data-10-11-supp-inc-unfilled.xlsx',\n", " 'pre-school-data-1011-3.xlsx',\n", " 'nursery-schools-data-2010-11-supp-inc-unfilled.xlsx'],\n", " 2011: ['post-primary-schools-data-11-12-supp-inc-unfilled-2.xlsx',\n", " 'nursery-schools-data-2011-12-supp-inc-unfilled-2.xlsx',\n", " 'primary-schools-data-11-12-supp-inc-unfilled-places-r.xlsx',\n", " 'special-school-data-11-12-supp.xlsx',\n", " 'pre-school-data-2011-12.xlsx'],\n", " 2012: ['nursery-schools-data-2012-13-supp-inc-unfilled-places.xlsx',\n", " 'post-primary-schools-data-2012-13-supp-inc-unfilled-places.xlsx',\n", " 'primary-schools-data-2012-13-supp-inc-unfilled-places-2.xlsx',\n", " 'pre-school-data-2012-13.xlsx',\n", " 'special-school-data-2012-13-supp.xlsx'],\n", " 2013: ['nursery-schools-data-13-14-supp-incl-unfilled-places.xlsx',\n", " 'post-primary-schools-data-13-14-supp-inc-unfilled-places.xlsx',\n", " 'special-school-data-2013-14-supp.xlsx',\n", " 'primary-schools-data-2013-14-supp-inc-unfilled-places.xlsx',\n", " 'pre-school-data-2013-14.xlsx'],\n", " 2014: ['School%20level%20-%20nursery%20schools%20data%201415%20supp%20-%20unfilled%20places.XLS',\n", " 'post-primary-schools-data-1415-supp-with-unfilled-places.xlsx',\n", " 'School%20level%20-%20pre%20school%20data%201415.XLS',\n", " 'special-school-data-1415-supp.xlsx',\n", " 'primary-schools-data-1415-supp-with-unfilled-places.xlsx'],\n", " 2015: ['School%20level%20-%20nursery%20schools%20data%201516%20supp.XLS',\n", " 'School%20level%20-%20pre%20school%20data%201516%20supp.XLSX',\n", " 'School%20level%20-%20primary%20schools%20data%201516%20supp_0.XLSX',\n", " 'School%20level%20-%20special_school_data%201516%20supp.XLSX',\n", " 'School-level-post-primary-schools-data-1516_1.XLS'],\n", " 2016: ['School%20level%20-%20special_school_data%201617%20supp_0.XLSX',\n", " 'School%20level%20-%20post%20primary%20schools%20data%201617%20supp_0.XLS',\n", " 'School%20level%20-%20nursery%20schools%20data%201617%20supp.XLS',\n", " 'available%20places%20-%20post-primary%201617%20supp.XLSX',\n", " 'available%20places%20-%20primary%201617%20supp.XLSX',\n", " 'available%20places%20-%20nursery%201617%20supp%20final.XLSX',\n", " 'School%20level%20-%20pre%20school%20data%201617%20supp.XLSX',\n", " 'School%20level%20-%20primary%20schools%20data%201617%20supp.XLSX'],\n", " 2017: ['School%20level%20-%20pre%20school%20data%201718%20supp.xlsx',\n", " 'available%20places%20-%20primary%201718%20supp.xlsx',\n", " 'available%20places%20-%20post-primary%201718%20supp.xlsx',\n", " 'School%20level%20-%20post%20primary%20schools%20data%20supp%201718.xls',\n", " 'School%20level%20-%20nursery%20schools%20data%201718%20supp.xlsx',\n", " 'available%20places%20-%20nursery%201718%20supp.xlsx',\n", " 'School%20level%20-%20special%20school%20data%202017-18_0.xlsx',\n", " 'School%20level%20-%20primary%20schools%20data%20supp%201718.xlsx']}" ] }, "execution_count": 59, "metadata": {}, "output_type": "execute_result" } ], "source": [ "from pathlib import Path\n", "from collections import defaultdict\n", "import pandas as pd\n", "\n", "year_files = defaultdict(list)\n", "dest = Path('./data/education-ni/')\n", "for year_p in dest.iterdir():\n", " try:\n", " year=int(year_p.parts[-1])\n", " for file in year_p.iterdir():\n", " year_files[year].append(file.parts[-1])\n", " except ValueError:\n", " pass\n", " \n", "import warnings\n", "warnings.filterwarnings(\"ignore\", category=DeprecationWarning) \n", "\n", "year_files = dict(sorted(year_files.items()))\n", "year_files" ] }, { "cell_type": "code", "execution_count": 60, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:37:46.434793Z", "start_time": "2018-06-07T10:37:46.430904Z" } }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "2009\n", "2010\n", "2011\n", "2012\n", "2013\n", "2014\n", "2015\n", "2016\n", "2017\n" ] } ], "source": [ "for year, files in year_files.items():\n", " print(year)" ] }, { "cell_type": "code", "execution_count": 46, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:36:11.343390Z", "start_time": "2018-06-07T10:36:11.338041Z" } }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "post-primary-schools-data-13-14-supp-inc-unfilled-places.xlsx\n", "post-primary-schools-data-1415-supp-with-unfilled-places.xlsx\n", "School-level-post-primary-schools-data-1516_1.XLS\n", "post-primary-schools-data-2012-13-supp-inc-unfilled-places.xlsx\n", "post-primary-schools-data-0910-supp-2.xlsx\n", "available%20places%20-%20post-primary%201718%20supp.xlsx\n", "School%20level%20-%20post%20primary%20schools%20data%20supp%201718.xls\n", "post-primary-schools-data-10-11-supp-inc-unfilled.xlsx\n", "post-primary-schools-data-11-12-supp-inc-unfilled-2.xlsx\n", "School%20level%20-%20post%20primary%20schools%20data%201617%20supp_0.XLS\n", "available%20places%20-%20post-primary%201617%20supp.XLSX\n" ] } ], "source": [ "sheets = defaultdict(list)\n", "for year, files in year_files.items():\n", " for file in files:\n", " if 'post' in file:\n", " print(file)" ] }, { "cell_type": "code", "execution_count": 47, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:36:11.409905Z", "start_time": "2018-06-07T10:36:11.345299Z" } }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
0123456789
0Data on Pupils attending post primary schools ...NaNNaNNaNNaNNaNNaNNaNNaNNaN
1NaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
2NaNNaNNaNNaNNaNNaNschoolparliamentarydistricturban/
3De refschool nameaddress 1townpostcodeschool typemanagement typeconstituencycouncilrural
41210014Ashfield Girls' High School397 HOLYWOOD ROADBELFASTBT42LYNon-grammarControlledBELFAST EASTBELFASTUrban
\n", "
" ], "text/plain": [ " 0 \\\n", "0 Data on Pupils attending post primary schools ... \n", "1 NaN \n", "2 NaN \n", "3 De ref \n", "4 1210014 \n", "\n", " 1 2 3 4 \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 school name address 1 town postcode \n", "4 Ashfield Girls' High School 397 HOLYWOOD ROAD BELFAST BT42LY \n", "\n", " 5 6 7 8 9 \n", "0 NaN NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN NaN \n", "2 NaN school parliamentary district urban/ \n", "3 school type management type constituency council rural \n", "4 Non-grammar Controlled BELFAST EAST BELFAST Urban " ] }, "execution_count": 47, "metadata": {}, "output_type": "execute_result" } ], "source": [ "xls = pd.ExcelFile(f'data/education-ni/2017/School%20level%20-%20post%20primary%20schools%20data%20supp%201718.xls')\n", "df = pd.read_excel(xls, 'reference data', header=None)\n", "df.head()" ] }, { "cell_type": "code", "execution_count": 48, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:36:11.421145Z", "start_time": "2018-06-07T10:36:11.411773Z" } }, "outputs": [ { "data": { "text/plain": [ "0 De ref\n", "1 school name\n", "2 address 1\n", "3 town\n", "4 postcode\n", "5 school type\n", "6 school management type\n", "7 parliamentary constituency\n", "8 district council\n", "9 urban/ rural\n", "dtype: object" ] }, "execution_count": 48, "metadata": {}, "output_type": "execute_result" } ], "source": [ "join_n_strip = lambda l: ' '.join(l).strip()\n", "\n", "df.ix[1:3].fillna('').apply(join_n_strip, axis=0)" ] }, { "cell_type": "code", "execution_count": 49, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:36:11.464415Z", "start_time": "2018-06-07T10:36:11.423291Z" } }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
De refschool nameaddress 1townpostcodeschool typeschool management typeparliamentary constituencydistrict councilurban/ rural
0Data on Pupils attending post primary schools ...NaNNaNNaNNaNNaNNaNNaNNaNNaN
1NaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
2NaNNaNNaNNaNNaNNaNschoolparliamentarydistricturban/
3De refschool nameaddress 1townpostcodeschool typemanagement typeconstituencycouncilrural
41210014Ashfield Girls' High School397 HOLYWOOD ROADBELFASTBT42LYNon-grammarControlledBELFAST EASTBELFASTUrban
51210015Ashfield Boys' High School395 HOLYWOOD ROADBELFASTBT42LYNon-grammarControlledBELFAST EASTBELFASTUrban
61210021Belfast Model School For Girls35 DUNOWEN GARDENSBELFASTBT146NQNon-grammarControlledBELFAST NORTHBELFASTUrban
71210022Belfast Boys' Model SchoolBALLYSILLAN ROADBELFASTBT146RBNon-grammarControlledBELFAST NORTHBELFASTUrban
81230053St Louise's Comprehensive College468 FALLS ROADBELFASTBT126ENNon-grammarCatholic MaintainedBELFAST WESTBELFASTUrban
91230104Mercy College BelfastBALLYSILLAN ROADBELFASTBT147QRNon-grammarCatholic MaintainedBELFAST NORTHBELFASTUrban
101230130St Rose’s Dominican College65 BEECHMOUNT AVENUEBELFASTBT127NANon-grammarCatholic MaintainedBELFAST WESTBELFASTUrban
111230146Christian Brothers School, BelfastGLEN ROADBELFASTBT118BWNon-grammarCatholic MaintainedBELFAST WESTBELFASTUrban
121230155St Genevieve's High SchoolTRENCH HOUSEBELFASTBT119JPNon-grammarCatholic MaintainedBELFAST WESTBELFASTUrban
131230182De La Salle College36 EDENMORE DRIVEBELFASTBT118LTNon-grammarCatholic MaintainedBELFAST WESTBELFASTUrban
141230262Corpus Christi CollegeARD NA VA ROADBELFASTBT126FFNon-grammarCatholic MaintainedBELFAST WESTBELFASTUrban
151230275St Joseph's College, Belfast518-572 RAVENHILL ROADBELFASTBT60BYNon-grammarCatholic MaintainedBELFAST SOUTHBELFASTUrban
161230321Blessed Trinity College619 ANTRIM ROADBELFASTBT154DZNon-grammarCatholic MaintainedBELFAST NORTHBELFASTUrban
171240291Colaiste Feirste7 BEECHVIEW PARKBELFASTBT127PYNon-grammarOther MaintainedBELFAST WESTBELFASTUrban
181260269Hazelwood College70 WHITEWELL ROADNEWTOWNABBEYBT367ESNon-grammarGMIBELFAST NORTHBELFASTUrban
191260294Malone Integrated College45 FINAGHY ROAD NORTHBELFASTBT100JBNon-grammarGMIBELFAST SOUTHBELFASTUrban
201410079Grosvenor Grammar School50 MARINA PARKBELFASTBT56BAGrammarControlledBELFAST EASTBELFASTUrban
211410270Wellington College18 CAROLAN ROADBELFASTBT73HEGrammarControlledBELFAST SOUTHBELFASTUrban
221410315Bloomfield Collegiate8 ASTORIA GARDENSBELFASTBT56HWGrammarControlledBELFAST EASTBELFASTUrban
231420020Campbell CollegeBELMONT ROADBELFASTBT42NDGrammarVoluntaryBELFAST EASTBELFASTUrban
241420021St Mary's Christian Brothers' Grammar, Belfast147A GLEN ROADBELFASTBT118NRGrammarVoluntaryBELFAST WESTBELFASTUrban
251420022Methodist College1 MALONE ROADBELFASTBT96BYGrammarVoluntaryBELFAST SOUTHBELFASTUrban
261420027The Royal Belfast Academical InstitutionCOLLEGE SQUARE EASTBELFASTBT16DLGrammarVoluntaryBELFAST SOUTHBELFASTUrban
271420028Belfast Royal Academy5-17 CLIFTONVILLE ROADBELFASTBT146JLGrammarVoluntaryBELFAST NORTHBELFASTUrban
281420029St Dominic's High School, Belfast135-137 FALLS ROADBELFASTBT126AEGrammarVoluntaryBELFAST WESTBELFASTUrban
291420030St Malachy's College, Belfast36 ANTRIM ROADBELFASTBT152AEGrammarVoluntaryBELFAST NORTHBELFASTUrban
.................................
1735230076St Patrick's College, Banbridge38 SCARVA ROADBANBRIDGEBT323ASNon-grammarCatholic MaintainedUPPER BANNARMAGH CITY, BANBRIDGE AND CRAIGAVONUrban
1745230108St Mary's High School, NewryUPPER CHAPEL STREETNEWRYBT342DTNon-grammarCatholic MaintainedNEWRY AND ARMAGHNEWRY MOURNE AND DOWNUrban
1755230135St Mark's High SchoolUPPER DROMORE ROADNEWRYBT343PNNon-grammarCatholic MaintainedSOUTH DOWNNEWRY MOURNE AND DOWNUrban
1765230152St Ciaran's High School15 TULLYBRYAN ROADDUNGANNONBT702LYNon-grammarCatholic MaintainedFERMANAGH AND SOUTH TYRONEMID ULSTERRural
1775230157St Paul's High School, Bessbrook108 CAMLOUGH ROADNEWRYBT357EENon-grammarCatholic MaintainedNEWRY AND ARMAGHNEWRY MOURNE AND DOWNRural
1785230167St Joseph's High School, Crossmaglen77 DUNDALK ROADNEWRYBT359HLNon-grammarCatholic MaintainedNEWRY AND ARMAGHNEWRY MOURNE AND DOWNRural
1795230187St Patrick's High School, KeadyMIDDLETOWN ROADKEADYBT603THNon-grammarCatholic MaintainedNEWRY AND ARMAGHARMAGH CITY, BANBRIDGE AND CRAIGAVONRural
1805230192St Joseph's College, Coalisland29 SCHOOL LANEDUNGANNONBT714NWNon-grammarCatholic MaintainedMID ULSTERMID ULSTERUrban
1815230213Lismore Comprehensive SchoolDRUMGASKCRAIGAVONBT655DUNon-grammarCatholic MaintainedUPPER BANNARMAGH CITY, BANBRIDGE AND CRAIGAVONUrban
1825230218St Catherine's College2A CONVENT ROADARMAGHBT604BGNon-grammarCatholic MaintainedNEWRY AND ARMAGHARMAGH CITY, BANBRIDGE AND CRAIGAVONUrban
1835230278Holy Trinity CollegeCHAPEL STREETCOOKSTOWNBT808QBNon-grammarCatholic MaintainedMID ULSTERMID ULSTERUrban
1845230293St Patrick's College, Dungannon41 KILLYMEAL ROADDUNGANNONBT716LJNon-grammarCatholic MaintainedFERMANAGH AND SOUTH TYRONEMID ULSTERUrban
1855230321St John The Baptist College4 MOY ROADPORTADOWNBT621QQSecondaryCatholic MaintainedUPPER BANNARMAGH CITY, BANBRIDGE AND CRAIGAVONUrban
1865250216Brownlow Int CollegeTULLYGALLY ROADCRAIGAVONBT655BSNon-grammarControlled IntegratedUPPER BANNARMAGH CITY, BANBRIDGE AND CRAIGAVONUrban
1875260285New-Bridge Integrated College25 DONARD VIEW ROADBANBRIDGEBT323LNNon-grammarGMIUPPER BANNARMAGH CITY, BANBRIDGE AND CRAIGAVONRural
1885260286Integrated College Dungannon21 GORTMERRON LINK ROADDUNGANNONBT716LSNon-grammarGMIFERMANAGH AND SOUTH TYRONEMID ULSTERUrban
1895410013Banbridge AcademyLURGAN ROADBANBRIDGEBT324AQGrammarControlledUPPER BANNARMAGH CITY, BANBRIDGE AND CRAIGAVONUrban
1905410057Lurgan College9 COLLEGE WALKCRAIGAVONBT666JWGrammarControlledUPPER BANNARMAGH CITY, BANBRIDGE AND CRAIGAVONUrban
1915410067Portadown College4 KILLYCOMAINE ROADCRAIGAVONBT635BUGrammarControlledUPPER BANNARMAGH CITY, BANBRIDGE AND CRAIGAVONUrban
1925420045St Louis Grammar School, Kilkeel151 NEWRY ROADKILKEELBT344EUGrammarVoluntarySOUTH DOWNNEWRY MOURNE AND DOWNUrban
1935420059Abbey Christian Brothers Grammar School77A ASHGROVE ROADNEWRYBT342QNGrammarVoluntarySOUTH DOWNNEWRY MOURNE AND DOWNUrban
1945420060Our Lady's Grammar SchoolCHEQUER HILLNEWRYBT356DYGrammarVoluntaryNEWRY AND ARMAGHNEWRY MOURNE AND DOWNUrban
1955420062St Colman's College, Newry46 ARMAGH ROADNEWRYBT356PPGrammarVoluntaryNEWRY AND ARMAGHNEWRY MOURNE AND DOWNUrban
1965420073St Joseph's Convent Grammar School, Donaghmore58 CASTLECAULFIELD ROADDUNGANNONBT703HEGrammarVoluntaryMID ULSTERMID ULSTERRural
1975420076Sacred Heart Grammar School, Newry10 ASHGROVE AVENUENEWRYBT341PRGrammarVoluntarySOUTH DOWNNEWRY MOURNE AND DOWNUrban
1985420260The Royal School, Dungannon2 RANFURLEY ROADDUNGANNONBT716APGrammarVoluntaryFERMANAGH AND SOUTH TYRONEMID ULSTERUrban
1995420263The Royal School, ArmaghCOLLEGE HILLARMAGHBT619DHGrammarVoluntaryNEWRY AND ARMAGHARMAGH CITY, BANBRIDGE AND CRAIGAVONUrban
2005420268St Patrick's Grammar School, ArmaghCATHEDRAL ROADARMAGHBT617QZGrammarVoluntaryNEWRY AND ARMAGHARMAGH CITY, BANBRIDGE AND CRAIGAVONUrban
2015420304St Patrick's Academy, Dungannon37 KILLYMEAL ROADDUNGANNONBT716DSGrammarVoluntaryFERMANAGH AND SOUTH TYRONEMID ULSTERUrban
2025420314St Ronan’s College12 CORNAKINEGAR ROADLURGANBT679JWGrammarVoluntaryUPPER BANNARMAGH CITY, BANBRIDGE AND CRAIGAVONUrban
\n", "

203 rows × 10 columns

\n", "
" ], "text/plain": [ " De ref \\\n", "0 Data on Pupils attending post primary schools ... \n", "1 NaN \n", "2 NaN \n", "3 De ref \n", "4 1210014 \n", "5 1210015 \n", "6 1210021 \n", "7 1210022 \n", "8 1230053 \n", "9 1230104 \n", "10 1230130 \n", "11 1230146 \n", "12 1230155 \n", "13 1230182 \n", "14 1230262 \n", "15 1230275 \n", "16 1230321 \n", "17 1240291 \n", "18 1260269 \n", "19 1260294 \n", "20 1410079 \n", "21 1410270 \n", "22 1410315 \n", "23 1420020 \n", "24 1420021 \n", "25 1420022 \n", "26 1420027 \n", "27 1420028 \n", "28 1420029 \n", "29 1420030 \n", ".. ... \n", "173 5230076 \n", "174 5230108 \n", "175 5230135 \n", "176 5230152 \n", "177 5230157 \n", "178 5230167 \n", "179 5230187 \n", "180 5230192 \n", "181 5230213 \n", "182 5230218 \n", "183 5230278 \n", "184 5230293 \n", "185 5230321 \n", "186 5250216 \n", "187 5260285 \n", "188 5260286 \n", "189 5410013 \n", "190 5410057 \n", "191 5410067 \n", "192 5420045 \n", "193 5420059 \n", "194 5420060 \n", "195 5420062 \n", "196 5420073 \n", "197 5420076 \n", "198 5420260 \n", "199 5420263 \n", "200 5420268 \n", "201 5420304 \n", "202 5420314 \n", "\n", " school name address 1 \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 NaN NaN \n", "3 school name address 1 \n", "4 Ashfield Girls' High School 397 HOLYWOOD ROAD \n", "5 Ashfield Boys' High School 395 HOLYWOOD ROAD \n", "6 Belfast Model School For Girls 35 DUNOWEN GARDENS \n", "7 Belfast Boys' Model School BALLYSILLAN ROAD \n", "8 St Louise's Comprehensive College 468 FALLS ROAD \n", "9 Mercy College Belfast BALLYSILLAN ROAD \n", "10 St Rose’s Dominican College 65 BEECHMOUNT AVENUE \n", "11 Christian Brothers School, Belfast GLEN ROAD \n", "12 St Genevieve's High School TRENCH HOUSE \n", "13 De La Salle College 36 EDENMORE DRIVE \n", "14 Corpus Christi College ARD NA VA ROAD \n", "15 St Joseph's College, Belfast 518-572 RAVENHILL ROAD \n", "16 Blessed Trinity College 619 ANTRIM ROAD \n", "17 Colaiste Feirste 7 BEECHVIEW PARK \n", "18 Hazelwood College 70 WHITEWELL ROAD \n", "19 Malone Integrated College 45 FINAGHY ROAD NORTH \n", "20 Grosvenor Grammar School 50 MARINA PARK \n", "21 Wellington College 18 CAROLAN ROAD \n", "22 Bloomfield Collegiate 8 ASTORIA GARDENS \n", "23 Campbell College BELMONT ROAD \n", "24 St Mary's Christian Brothers' Grammar, Belfast 147A GLEN ROAD \n", "25 Methodist College 1 MALONE ROAD \n", "26 The Royal Belfast Academical Institution COLLEGE SQUARE EAST \n", "27 Belfast Royal Academy 5-17 CLIFTONVILLE ROAD \n", "28 St Dominic's High School, Belfast 135-137 FALLS ROAD \n", "29 St Malachy's College, Belfast 36 ANTRIM ROAD \n", ".. ... ... \n", "173 St Patrick's College, Banbridge 38 SCARVA ROAD \n", "174 St Mary's High School, Newry UPPER CHAPEL STREET \n", "175 St Mark's High School UPPER DROMORE ROAD \n", "176 St Ciaran's High School 15 TULLYBRYAN ROAD \n", "177 St Paul's High School, Bessbrook 108 CAMLOUGH ROAD \n", "178 St Joseph's High School, Crossmaglen 77 DUNDALK ROAD \n", "179 St Patrick's High School, Keady MIDDLETOWN ROAD \n", "180 St Joseph's College, Coalisland 29 SCHOOL LANE \n", "181 Lismore Comprehensive School DRUMGASK \n", "182 St Catherine's College 2A CONVENT ROAD \n", "183 Holy Trinity College CHAPEL STREET \n", "184 St Patrick's College, Dungannon 41 KILLYMEAL ROAD \n", "185 St John The Baptist College 4 MOY ROAD \n", "186 Brownlow Int College TULLYGALLY ROAD \n", "187 New-Bridge Integrated College 25 DONARD VIEW ROAD \n", "188 Integrated College Dungannon 21 GORTMERRON LINK ROAD \n", "189 Banbridge Academy LURGAN ROAD \n", "190 Lurgan College 9 COLLEGE WALK \n", "191 Portadown College 4 KILLYCOMAINE ROAD \n", "192 St Louis Grammar School, Kilkeel 151 NEWRY ROAD \n", "193 Abbey Christian Brothers Grammar School 77A ASHGROVE ROAD \n", "194 Our Lady's Grammar School CHEQUER HILL \n", "195 St Colman's College, Newry 46 ARMAGH ROAD \n", "196 St Joseph's Convent Grammar School, Donaghmore 58 CASTLECAULFIELD ROAD \n", "197 Sacred Heart Grammar School, Newry 10 ASHGROVE AVENUE \n", "198 The Royal School, Dungannon 2 RANFURLEY ROAD \n", "199 The Royal School, Armagh COLLEGE HILL \n", "200 St Patrick's Grammar School, Armagh CATHEDRAL ROAD \n", "201 St Patrick's Academy, Dungannon 37 KILLYMEAL ROAD \n", "202 St Ronan’s College 12 CORNAKINEGAR ROAD \n", "\n", " town postcode school type school management type \\\n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN school \n", "3 town postcode school type management type \n", "4 BELFAST BT42LY Non-grammar Controlled \n", "5 BELFAST BT42LY Non-grammar Controlled \n", "6 BELFAST BT146NQ Non-grammar Controlled \n", "7 BELFAST BT146RB Non-grammar Controlled \n", "8 BELFAST BT126EN Non-grammar Catholic Maintained \n", "9 BELFAST BT147QR Non-grammar Catholic Maintained \n", "10 BELFAST BT127NA Non-grammar Catholic Maintained \n", "11 BELFAST BT118BW Non-grammar Catholic Maintained \n", "12 BELFAST BT119JP Non-grammar Catholic Maintained \n", "13 BELFAST BT118LT Non-grammar Catholic Maintained \n", "14 BELFAST BT126FF Non-grammar Catholic Maintained \n", "15 BELFAST BT60BY Non-grammar Catholic Maintained \n", "16 BELFAST BT154DZ Non-grammar Catholic Maintained \n", "17 BELFAST BT127PY Non-grammar Other Maintained \n", "18 NEWTOWNABBEY BT367ES Non-grammar GMI \n", "19 BELFAST BT100JB Non-grammar GMI \n", "20 BELFAST BT56BA Grammar Controlled \n", "21 BELFAST BT73HE Grammar Controlled \n", "22 BELFAST BT56HW Grammar Controlled \n", "23 BELFAST BT42ND Grammar Voluntary \n", "24 BELFAST BT118NR Grammar Voluntary \n", "25 BELFAST BT96BY Grammar Voluntary \n", "26 BELFAST BT16DL Grammar Voluntary \n", "27 BELFAST BT146JL Grammar Voluntary \n", "28 BELFAST BT126AE Grammar Voluntary \n", "29 BELFAST BT152AE Grammar Voluntary \n", ".. ... ... ... ... \n", "173 BANBRIDGE BT323AS Non-grammar Catholic Maintained \n", "174 NEWRY BT342DT Non-grammar Catholic Maintained \n", "175 NEWRY BT343PN Non-grammar Catholic Maintained \n", "176 DUNGANNON BT702LY Non-grammar Catholic Maintained \n", "177 NEWRY BT357EE Non-grammar Catholic Maintained \n", "178 NEWRY BT359HL Non-grammar Catholic Maintained \n", "179 KEADY BT603TH Non-grammar Catholic Maintained \n", "180 DUNGANNON BT714NW Non-grammar Catholic Maintained \n", "181 CRAIGAVON BT655DU Non-grammar Catholic Maintained \n", "182 ARMAGH BT604BG Non-grammar Catholic Maintained \n", "183 COOKSTOWN BT808QB Non-grammar Catholic Maintained \n", "184 DUNGANNON BT716LJ Non-grammar Catholic Maintained \n", "185 PORTADOWN BT621QQ Secondary Catholic Maintained \n", "186 CRAIGAVON BT655BS Non-grammar Controlled Integrated \n", "187 BANBRIDGE BT323LN Non-grammar GMI \n", "188 DUNGANNON BT716LS Non-grammar GMI \n", "189 BANBRIDGE BT324AQ Grammar Controlled \n", "190 CRAIGAVON BT666JW Grammar Controlled \n", "191 CRAIGAVON BT635BU Grammar Controlled \n", "192 KILKEEL BT344EU Grammar Voluntary \n", "193 NEWRY BT342QN Grammar Voluntary \n", "194 NEWRY BT356DY Grammar Voluntary \n", "195 NEWRY BT356PP Grammar Voluntary \n", "196 DUNGANNON BT703HE Grammar Voluntary \n", "197 NEWRY BT341PR Grammar Voluntary \n", "198 DUNGANNON BT716AP Grammar Voluntary \n", "199 ARMAGH BT619DH Grammar Voluntary \n", "200 ARMAGH BT617QZ Grammar Voluntary \n", "201 DUNGANNON BT716DS Grammar Voluntary \n", "202 LURGAN BT679JW Grammar Voluntary \n", "\n", " parliamentary constituency district council \\\n", "0 NaN NaN \n", "1 NaN NaN \n", "2 parliamentary district \n", "3 constituency council \n", "4 BELFAST EAST BELFAST \n", "5 BELFAST EAST BELFAST \n", "6 BELFAST NORTH BELFAST \n", "7 BELFAST NORTH BELFAST \n", "8 BELFAST WEST BELFAST \n", "9 BELFAST NORTH BELFAST \n", "10 BELFAST WEST BELFAST \n", "11 BELFAST WEST BELFAST \n", "12 BELFAST WEST BELFAST \n", "13 BELFAST WEST BELFAST \n", "14 BELFAST WEST BELFAST \n", "15 BELFAST SOUTH BELFAST \n", "16 BELFAST NORTH BELFAST \n", "17 BELFAST WEST BELFAST \n", "18 BELFAST NORTH BELFAST \n", "19 BELFAST SOUTH BELFAST \n", "20 BELFAST EAST BELFAST \n", "21 BELFAST SOUTH BELFAST \n", "22 BELFAST EAST BELFAST \n", "23 BELFAST EAST BELFAST \n", "24 BELFAST WEST BELFAST \n", "25 BELFAST SOUTH BELFAST \n", "26 BELFAST SOUTH BELFAST \n", "27 BELFAST NORTH BELFAST \n", "28 BELFAST WEST BELFAST \n", "29 BELFAST NORTH BELFAST \n", ".. ... ... \n", "173 UPPER BANN ARMAGH CITY, BANBRIDGE AND CRAIGAVON \n", "174 NEWRY AND ARMAGH NEWRY MOURNE AND DOWN \n", "175 SOUTH DOWN NEWRY MOURNE AND DOWN \n", "176 FERMANAGH AND SOUTH TYRONE MID ULSTER \n", "177 NEWRY AND ARMAGH NEWRY MOURNE AND DOWN \n", "178 NEWRY AND ARMAGH NEWRY MOURNE AND DOWN \n", "179 NEWRY AND ARMAGH ARMAGH CITY, BANBRIDGE AND CRAIGAVON \n", "180 MID ULSTER MID ULSTER \n", "181 UPPER BANN ARMAGH CITY, BANBRIDGE AND CRAIGAVON \n", "182 NEWRY AND ARMAGH ARMAGH CITY, BANBRIDGE AND CRAIGAVON \n", "183 MID ULSTER MID ULSTER \n", "184 FERMANAGH AND SOUTH TYRONE MID ULSTER \n", "185 UPPER BANN ARMAGH CITY, BANBRIDGE AND CRAIGAVON \n", "186 UPPER BANN ARMAGH CITY, BANBRIDGE AND CRAIGAVON \n", "187 UPPER BANN ARMAGH CITY, BANBRIDGE AND CRAIGAVON \n", "188 FERMANAGH AND SOUTH TYRONE MID ULSTER \n", "189 UPPER BANN ARMAGH CITY, BANBRIDGE AND CRAIGAVON \n", "190 UPPER BANN ARMAGH CITY, BANBRIDGE AND CRAIGAVON \n", "191 UPPER BANN ARMAGH CITY, BANBRIDGE AND CRAIGAVON \n", "192 SOUTH DOWN NEWRY MOURNE AND DOWN \n", "193 SOUTH DOWN NEWRY MOURNE AND DOWN \n", "194 NEWRY AND ARMAGH NEWRY MOURNE AND DOWN \n", "195 NEWRY AND ARMAGH NEWRY MOURNE AND DOWN \n", "196 MID ULSTER MID ULSTER \n", "197 SOUTH DOWN NEWRY MOURNE AND DOWN \n", "198 FERMANAGH AND SOUTH TYRONE MID ULSTER \n", "199 NEWRY AND ARMAGH ARMAGH CITY, BANBRIDGE AND CRAIGAVON \n", "200 NEWRY AND ARMAGH ARMAGH CITY, BANBRIDGE AND CRAIGAVON \n", "201 FERMANAGH AND SOUTH TYRONE MID ULSTER \n", "202 UPPER BANN ARMAGH CITY, BANBRIDGE AND CRAIGAVON \n", "\n", " urban/ rural \n", "0 NaN \n", "1 NaN \n", "2 urban/ \n", "3 rural \n", "4 Urban \n", "5 Urban \n", "6 Urban \n", "7 Urban \n", "8 Urban \n", "9 Urban \n", "10 Urban \n", "11 Urban \n", "12 Urban \n", "13 Urban \n", "14 Urban \n", "15 Urban \n", "16 Urban \n", "17 Urban \n", "18 Urban \n", "19 Urban \n", "20 Urban \n", "21 Urban \n", "22 Urban \n", "23 Urban \n", "24 Urban \n", "25 Urban \n", "26 Urban \n", "27 Urban \n", "28 Urban \n", "29 Urban \n", ".. ... \n", "173 Urban \n", "174 Urban \n", "175 Urban \n", "176 Rural \n", "177 Rural \n", "178 Rural \n", "179 Rural \n", "180 Urban \n", "181 Urban \n", "182 Urban \n", "183 Urban \n", "184 Urban \n", "185 Urban \n", "186 Urban \n", "187 Rural \n", "188 Urban \n", "189 Urban \n", "190 Urban \n", "191 Urban \n", "192 Urban \n", "193 Urban \n", "194 Urban \n", "195 Urban \n", "196 Rural \n", "197 Urban \n", "198 Urban \n", "199 Urban \n", "200 Urban \n", "201 Urban \n", "202 Urban \n", "\n", "[203 rows x 10 columns]" ] }, "execution_count": 49, "metadata": {}, "output_type": "execute_result" } ], "source": [ "df.columns=df.ix[1:3].fillna('').apply(join_n_strip, axis=0).values\n", "df" ] }, { "cell_type": "code", "execution_count": 50, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:36:11.517739Z", "start_time": "2018-06-07T10:36:11.466841Z" } }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
De refschool nameaddress 1townpostcodeschool typeschool management typeparliamentary constituencydistrict councilurban/ rural
01210014Ashfield Girls' High School397 HOLYWOOD ROADBELFASTBT42LYNon-grammarControlledBELFAST EASTBELFASTUrban
11210015Ashfield Boys' High School395 HOLYWOOD ROADBELFASTBT42LYNon-grammarControlledBELFAST EASTBELFASTUrban
21210021Belfast Model School For Girls35 DUNOWEN GARDENSBELFASTBT146NQNon-grammarControlledBELFAST NORTHBELFASTUrban
31210022Belfast Boys' Model SchoolBALLYSILLAN ROADBELFASTBT146RBNon-grammarControlledBELFAST NORTHBELFASTUrban
41230053St Louise's Comprehensive College468 FALLS ROADBELFASTBT126ENNon-grammarCatholic MaintainedBELFAST WESTBELFASTUrban
51230104Mercy College BelfastBALLYSILLAN ROADBELFASTBT147QRNon-grammarCatholic MaintainedBELFAST NORTHBELFASTUrban
61230130St Rose’s Dominican College65 BEECHMOUNT AVENUEBELFASTBT127NANon-grammarCatholic MaintainedBELFAST WESTBELFASTUrban
71230146Christian Brothers School, BelfastGLEN ROADBELFASTBT118BWNon-grammarCatholic MaintainedBELFAST WESTBELFASTUrban
81230155St Genevieve's High SchoolTRENCH HOUSEBELFASTBT119JPNon-grammarCatholic MaintainedBELFAST WESTBELFASTUrban
91230182De La Salle College36 EDENMORE DRIVEBELFASTBT118LTNon-grammarCatholic MaintainedBELFAST WESTBELFASTUrban
101230262Corpus Christi CollegeARD NA VA ROADBELFASTBT126FFNon-grammarCatholic MaintainedBELFAST WESTBELFASTUrban
111230275St Joseph's College, Belfast518-572 RAVENHILL ROADBELFASTBT60BYNon-grammarCatholic MaintainedBELFAST SOUTHBELFASTUrban
121230321Blessed Trinity College619 ANTRIM ROADBELFASTBT154DZNon-grammarCatholic MaintainedBELFAST NORTHBELFASTUrban
131240291Colaiste Feirste7 BEECHVIEW PARKBELFASTBT127PYNon-grammarOther MaintainedBELFAST WESTBELFASTUrban
141260269Hazelwood College70 WHITEWELL ROADNEWTOWNABBEYBT367ESNon-grammarGMIBELFAST NORTHBELFASTUrban
151260294Malone Integrated College45 FINAGHY ROAD NORTHBELFASTBT100JBNon-grammarGMIBELFAST SOUTHBELFASTUrban
161410079Grosvenor Grammar School50 MARINA PARKBELFASTBT56BAGrammarControlledBELFAST EASTBELFASTUrban
171410270Wellington College18 CAROLAN ROADBELFASTBT73HEGrammarControlledBELFAST SOUTHBELFASTUrban
181410315Bloomfield Collegiate8 ASTORIA GARDENSBELFASTBT56HWGrammarControlledBELFAST EASTBELFASTUrban
191420020Campbell CollegeBELMONT ROADBELFASTBT42NDGrammarVoluntaryBELFAST EASTBELFASTUrban
201420021St Mary's Christian Brothers' Grammar, Belfast147A GLEN ROADBELFASTBT118NRGrammarVoluntaryBELFAST WESTBELFASTUrban
211420022Methodist College1 MALONE ROADBELFASTBT96BYGrammarVoluntaryBELFAST SOUTHBELFASTUrban
221420027The Royal Belfast Academical InstitutionCOLLEGE SQUARE EASTBELFASTBT16DLGrammarVoluntaryBELFAST SOUTHBELFASTUrban
231420028Belfast Royal Academy5-17 CLIFTONVILLE ROADBELFASTBT146JLGrammarVoluntaryBELFAST NORTHBELFASTUrban
241420029St Dominic's High School, Belfast135-137 FALLS ROADBELFASTBT126AEGrammarVoluntaryBELFAST WESTBELFASTUrban
251420030St Malachy's College, Belfast36 ANTRIM ROADBELFASTBT152AEGrammarVoluntaryBELFAST NORTHBELFASTUrban
261420082Dominican College, Belfast38 FORTWILLIAM PARKBELFASTBT154AQGrammarVoluntaryBELFAST NORTHBELFASTUrban
271420089Strathearn School, Belfast188 BELMONT ROADBELFASTBT42AUGrammarVoluntaryBELFAST EASTBELFASTUrban
281420095Rathmore Grammar SchoolKINGSWAYBELFASTBT100LFGrammarVoluntaryBELFAST SOUTHBELFASTUrban
291420264Victoria CollegeCRANMORE PARKBELFASTBT96JAGrammarVoluntaryBELFAST SOUTHBELFASTUrban
.................................
1695230076St Patrick's College, Banbridge38 SCARVA ROADBANBRIDGEBT323ASNon-grammarCatholic MaintainedUPPER BANNARMAGH CITY, BANBRIDGE AND CRAIGAVONUrban
1705230108St Mary's High School, NewryUPPER CHAPEL STREETNEWRYBT342DTNon-grammarCatholic MaintainedNEWRY AND ARMAGHNEWRY MOURNE AND DOWNUrban
1715230135St Mark's High SchoolUPPER DROMORE ROADNEWRYBT343PNNon-grammarCatholic MaintainedSOUTH DOWNNEWRY MOURNE AND DOWNUrban
1725230152St Ciaran's High School15 TULLYBRYAN ROADDUNGANNONBT702LYNon-grammarCatholic MaintainedFERMANAGH AND SOUTH TYRONEMID ULSTERRural
1735230157St Paul's High School, Bessbrook108 CAMLOUGH ROADNEWRYBT357EENon-grammarCatholic MaintainedNEWRY AND ARMAGHNEWRY MOURNE AND DOWNRural
1745230167St Joseph's High School, Crossmaglen77 DUNDALK ROADNEWRYBT359HLNon-grammarCatholic MaintainedNEWRY AND ARMAGHNEWRY MOURNE AND DOWNRural
1755230187St Patrick's High School, KeadyMIDDLETOWN ROADKEADYBT603THNon-grammarCatholic MaintainedNEWRY AND ARMAGHARMAGH CITY, BANBRIDGE AND CRAIGAVONRural
1765230192St Joseph's College, Coalisland29 SCHOOL LANEDUNGANNONBT714NWNon-grammarCatholic MaintainedMID ULSTERMID ULSTERUrban
1775230213Lismore Comprehensive SchoolDRUMGASKCRAIGAVONBT655DUNon-grammarCatholic MaintainedUPPER BANNARMAGH CITY, BANBRIDGE AND CRAIGAVONUrban
1785230218St Catherine's College2A CONVENT ROADARMAGHBT604BGNon-grammarCatholic MaintainedNEWRY AND ARMAGHARMAGH CITY, BANBRIDGE AND CRAIGAVONUrban
1795230278Holy Trinity CollegeCHAPEL STREETCOOKSTOWNBT808QBNon-grammarCatholic MaintainedMID ULSTERMID ULSTERUrban
1805230293St Patrick's College, Dungannon41 KILLYMEAL ROADDUNGANNONBT716LJNon-grammarCatholic MaintainedFERMANAGH AND SOUTH TYRONEMID ULSTERUrban
1815230321St John The Baptist College4 MOY ROADPORTADOWNBT621QQSecondaryCatholic MaintainedUPPER BANNARMAGH CITY, BANBRIDGE AND CRAIGAVONUrban
1825250216Brownlow Int CollegeTULLYGALLY ROADCRAIGAVONBT655BSNon-grammarControlled IntegratedUPPER BANNARMAGH CITY, BANBRIDGE AND CRAIGAVONUrban
1835260285New-Bridge Integrated College25 DONARD VIEW ROADBANBRIDGEBT323LNNon-grammarGMIUPPER BANNARMAGH CITY, BANBRIDGE AND CRAIGAVONRural
1845260286Integrated College Dungannon21 GORTMERRON LINK ROADDUNGANNONBT716LSNon-grammarGMIFERMANAGH AND SOUTH TYRONEMID ULSTERUrban
1855410013Banbridge AcademyLURGAN ROADBANBRIDGEBT324AQGrammarControlledUPPER BANNARMAGH CITY, BANBRIDGE AND CRAIGAVONUrban
1865410057Lurgan College9 COLLEGE WALKCRAIGAVONBT666JWGrammarControlledUPPER BANNARMAGH CITY, BANBRIDGE AND CRAIGAVONUrban
1875410067Portadown College4 KILLYCOMAINE ROADCRAIGAVONBT635BUGrammarControlledUPPER BANNARMAGH CITY, BANBRIDGE AND CRAIGAVONUrban
1885420045St Louis Grammar School, Kilkeel151 NEWRY ROADKILKEELBT344EUGrammarVoluntarySOUTH DOWNNEWRY MOURNE AND DOWNUrban
1895420059Abbey Christian Brothers Grammar School77A ASHGROVE ROADNEWRYBT342QNGrammarVoluntarySOUTH DOWNNEWRY MOURNE AND DOWNUrban
1905420060Our Lady's Grammar SchoolCHEQUER HILLNEWRYBT356DYGrammarVoluntaryNEWRY AND ARMAGHNEWRY MOURNE AND DOWNUrban
1915420062St Colman's College, Newry46 ARMAGH ROADNEWRYBT356PPGrammarVoluntaryNEWRY AND ARMAGHNEWRY MOURNE AND DOWNUrban
1925420073St Joseph's Convent Grammar School, Donaghmore58 CASTLECAULFIELD ROADDUNGANNONBT703HEGrammarVoluntaryMID ULSTERMID ULSTERRural
1935420076Sacred Heart Grammar School, Newry10 ASHGROVE AVENUENEWRYBT341PRGrammarVoluntarySOUTH DOWNNEWRY MOURNE AND DOWNUrban
1945420260The Royal School, Dungannon2 RANFURLEY ROADDUNGANNONBT716APGrammarVoluntaryFERMANAGH AND SOUTH TYRONEMID ULSTERUrban
1955420263The Royal School, ArmaghCOLLEGE HILLARMAGHBT619DHGrammarVoluntaryNEWRY AND ARMAGHARMAGH CITY, BANBRIDGE AND CRAIGAVONUrban
1965420268St Patrick's Grammar School, ArmaghCATHEDRAL ROADARMAGHBT617QZGrammarVoluntaryNEWRY AND ARMAGHARMAGH CITY, BANBRIDGE AND CRAIGAVONUrban
1975420304St Patrick's Academy, Dungannon37 KILLYMEAL ROADDUNGANNONBT716DSGrammarVoluntaryFERMANAGH AND SOUTH TYRONEMID ULSTERUrban
1985420314St Ronan’s College12 CORNAKINEGAR ROADLURGANBT679JWGrammarVoluntaryUPPER BANNARMAGH CITY, BANBRIDGE AND CRAIGAVONUrban
\n", "

199 rows × 10 columns

\n", "
" ], "text/plain": [ " De ref school name \\\n", "0 1210014 Ashfield Girls' High School \n", "1 1210015 Ashfield Boys' High School \n", "2 1210021 Belfast Model School For Girls \n", "3 1210022 Belfast Boys' Model School \n", "4 1230053 St Louise's Comprehensive College \n", "5 1230104 Mercy College Belfast \n", "6 1230130 St Rose’s Dominican College \n", "7 1230146 Christian Brothers School, Belfast \n", "8 1230155 St Genevieve's High School \n", "9 1230182 De La Salle College \n", "10 1230262 Corpus Christi College \n", "11 1230275 St Joseph's College, Belfast \n", "12 1230321 Blessed Trinity College \n", "13 1240291 Colaiste Feirste \n", "14 1260269 Hazelwood College \n", "15 1260294 Malone Integrated College \n", "16 1410079 Grosvenor Grammar School \n", "17 1410270 Wellington College \n", "18 1410315 Bloomfield Collegiate \n", "19 1420020 Campbell College \n", "20 1420021 St Mary's Christian Brothers' Grammar, Belfast \n", "21 1420022 Methodist College \n", "22 1420027 The Royal Belfast Academical Institution \n", "23 1420028 Belfast Royal Academy \n", "24 1420029 St Dominic's High School, Belfast \n", "25 1420030 St Malachy's College, Belfast \n", "26 1420082 Dominican College, Belfast \n", "27 1420089 Strathearn School, Belfast \n", "28 1420095 Rathmore Grammar School \n", "29 1420264 Victoria College \n", ".. ... ... \n", "169 5230076 St Patrick's College, Banbridge \n", "170 5230108 St Mary's High School, Newry \n", "171 5230135 St Mark's High School \n", "172 5230152 St Ciaran's High School \n", "173 5230157 St Paul's High School, Bessbrook \n", "174 5230167 St Joseph's High School, Crossmaglen \n", "175 5230187 St Patrick's High School, Keady \n", "176 5230192 St Joseph's College, Coalisland \n", "177 5230213 Lismore Comprehensive School \n", "178 5230218 St Catherine's College \n", "179 5230278 Holy Trinity College \n", "180 5230293 St Patrick's College, Dungannon \n", "181 5230321 St John The Baptist College \n", "182 5250216 Brownlow Int College \n", "183 5260285 New-Bridge Integrated College \n", "184 5260286 Integrated College Dungannon \n", "185 5410013 Banbridge Academy \n", "186 5410057 Lurgan College \n", "187 5410067 Portadown College \n", "188 5420045 St Louis Grammar School, Kilkeel \n", "189 5420059 Abbey Christian Brothers Grammar School \n", "190 5420060 Our Lady's Grammar School \n", "191 5420062 St Colman's College, Newry \n", "192 5420073 St Joseph's Convent Grammar School, Donaghmore \n", "193 5420076 Sacred Heart Grammar School, Newry \n", "194 5420260 The Royal School, Dungannon \n", "195 5420263 The Royal School, Armagh \n", "196 5420268 St Patrick's Grammar School, Armagh \n", "197 5420304 St Patrick's Academy, Dungannon \n", "198 5420314 St Ronan’s College \n", "\n", " address 1 town postcode school type \\\n", "0 397 HOLYWOOD ROAD BELFAST BT42LY Non-grammar \n", "1 395 HOLYWOOD ROAD BELFAST BT42LY Non-grammar \n", "2 35 DUNOWEN GARDENS BELFAST BT146NQ Non-grammar \n", "3 BALLYSILLAN ROAD BELFAST BT146RB Non-grammar \n", "4 468 FALLS ROAD BELFAST BT126EN Non-grammar \n", "5 BALLYSILLAN ROAD BELFAST BT147QR Non-grammar \n", "6 65 BEECHMOUNT AVENUE BELFAST BT127NA Non-grammar \n", "7 GLEN ROAD BELFAST BT118BW Non-grammar \n", "8 TRENCH HOUSE BELFAST BT119JP Non-grammar \n", "9 36 EDENMORE DRIVE BELFAST BT118LT Non-grammar \n", "10 ARD NA VA ROAD BELFAST BT126FF Non-grammar \n", "11 518-572 RAVENHILL ROAD BELFAST BT60BY Non-grammar \n", "12 619 ANTRIM ROAD BELFAST BT154DZ Non-grammar \n", "13 7 BEECHVIEW PARK BELFAST BT127PY Non-grammar \n", "14 70 WHITEWELL ROAD NEWTOWNABBEY BT367ES Non-grammar \n", "15 45 FINAGHY ROAD NORTH BELFAST BT100JB Non-grammar \n", "16 50 MARINA PARK BELFAST BT56BA Grammar \n", "17 18 CAROLAN ROAD BELFAST BT73HE Grammar \n", "18 8 ASTORIA GARDENS BELFAST BT56HW Grammar \n", "19 BELMONT ROAD BELFAST BT42ND Grammar \n", "20 147A GLEN ROAD BELFAST BT118NR Grammar \n", "21 1 MALONE ROAD BELFAST BT96BY Grammar \n", "22 COLLEGE SQUARE EAST BELFAST BT16DL Grammar \n", "23 5-17 CLIFTONVILLE ROAD BELFAST BT146JL Grammar \n", "24 135-137 FALLS ROAD BELFAST BT126AE Grammar \n", "25 36 ANTRIM ROAD BELFAST BT152AE Grammar \n", "26 38 FORTWILLIAM PARK BELFAST BT154AQ Grammar \n", "27 188 BELMONT ROAD BELFAST BT42AU Grammar \n", "28 KINGSWAY BELFAST BT100LF Grammar \n", "29 CRANMORE PARK BELFAST BT96JA Grammar \n", ".. ... ... ... ... \n", "169 38 SCARVA ROAD BANBRIDGE BT323AS Non-grammar \n", "170 UPPER CHAPEL STREET NEWRY BT342DT Non-grammar \n", "171 UPPER DROMORE ROAD NEWRY BT343PN Non-grammar \n", "172 15 TULLYBRYAN ROAD DUNGANNON BT702LY Non-grammar \n", "173 108 CAMLOUGH ROAD NEWRY BT357EE Non-grammar \n", "174 77 DUNDALK ROAD NEWRY BT359HL Non-grammar \n", "175 MIDDLETOWN ROAD KEADY BT603TH Non-grammar \n", "176 29 SCHOOL LANE DUNGANNON BT714NW Non-grammar \n", "177 DRUMGASK CRAIGAVON BT655DU Non-grammar \n", "178 2A CONVENT ROAD ARMAGH BT604BG Non-grammar \n", "179 CHAPEL STREET COOKSTOWN BT808QB Non-grammar \n", "180 41 KILLYMEAL ROAD DUNGANNON BT716LJ Non-grammar \n", "181 4 MOY ROAD PORTADOWN BT621QQ Secondary \n", "182 TULLYGALLY ROAD CRAIGAVON BT655BS Non-grammar \n", "183 25 DONARD VIEW ROAD BANBRIDGE BT323LN Non-grammar \n", "184 21 GORTMERRON LINK ROAD DUNGANNON BT716LS Non-grammar \n", "185 LURGAN ROAD BANBRIDGE BT324AQ Grammar \n", "186 9 COLLEGE WALK CRAIGAVON BT666JW Grammar \n", "187 4 KILLYCOMAINE ROAD CRAIGAVON BT635BU Grammar \n", "188 151 NEWRY ROAD KILKEEL BT344EU Grammar \n", "189 77A ASHGROVE ROAD NEWRY BT342QN Grammar \n", "190 CHEQUER HILL NEWRY BT356DY Grammar \n", "191 46 ARMAGH ROAD NEWRY BT356PP Grammar \n", "192 58 CASTLECAULFIELD ROAD DUNGANNON BT703HE Grammar \n", "193 10 ASHGROVE AVENUE NEWRY BT341PR Grammar \n", "194 2 RANFURLEY ROAD DUNGANNON BT716AP Grammar \n", "195 COLLEGE HILL ARMAGH BT619DH Grammar \n", "196 CATHEDRAL ROAD ARMAGH BT617QZ Grammar \n", "197 37 KILLYMEAL ROAD DUNGANNON BT716DS Grammar \n", "198 12 CORNAKINEGAR ROAD LURGAN BT679JW Grammar \n", "\n", " school management type parliamentary constituency \\\n", "0 Controlled BELFAST EAST \n", "1 Controlled BELFAST EAST \n", "2 Controlled BELFAST NORTH \n", "3 Controlled BELFAST NORTH \n", "4 Catholic Maintained BELFAST WEST \n", "5 Catholic Maintained BELFAST NORTH \n", "6 Catholic Maintained BELFAST WEST \n", "7 Catholic Maintained BELFAST WEST \n", "8 Catholic Maintained BELFAST WEST \n", "9 Catholic Maintained BELFAST WEST \n", "10 Catholic Maintained BELFAST WEST \n", "11 Catholic Maintained BELFAST SOUTH \n", "12 Catholic Maintained BELFAST NORTH \n", "13 Other Maintained BELFAST WEST \n", "14 GMI BELFAST NORTH \n", "15 GMI BELFAST SOUTH \n", "16 Controlled BELFAST EAST \n", "17 Controlled BELFAST SOUTH \n", "18 Controlled BELFAST EAST \n", "19 Voluntary BELFAST EAST \n", "20 Voluntary BELFAST WEST \n", "21 Voluntary BELFAST SOUTH \n", "22 Voluntary BELFAST SOUTH \n", "23 Voluntary BELFAST NORTH \n", "24 Voluntary BELFAST WEST \n", "25 Voluntary BELFAST NORTH \n", "26 Voluntary BELFAST NORTH \n", "27 Voluntary BELFAST EAST \n", "28 Voluntary BELFAST SOUTH \n", "29 Voluntary BELFAST SOUTH \n", ".. ... ... \n", "169 Catholic Maintained UPPER BANN \n", "170 Catholic Maintained NEWRY AND ARMAGH \n", "171 Catholic Maintained SOUTH DOWN \n", "172 Catholic Maintained FERMANAGH AND SOUTH TYRONE \n", "173 Catholic Maintained NEWRY AND ARMAGH \n", "174 Catholic Maintained NEWRY AND ARMAGH \n", "175 Catholic Maintained NEWRY AND ARMAGH \n", "176 Catholic Maintained MID ULSTER \n", "177 Catholic Maintained UPPER BANN \n", "178 Catholic Maintained NEWRY AND ARMAGH \n", "179 Catholic Maintained MID ULSTER \n", "180 Catholic Maintained FERMANAGH AND SOUTH TYRONE \n", "181 Catholic Maintained UPPER BANN \n", "182 Controlled Integrated UPPER BANN \n", "183 GMI UPPER BANN \n", "184 GMI FERMANAGH AND SOUTH TYRONE \n", "185 Controlled UPPER BANN \n", "186 Controlled UPPER BANN \n", "187 Controlled UPPER BANN \n", "188 Voluntary SOUTH DOWN \n", "189 Voluntary SOUTH DOWN \n", "190 Voluntary NEWRY AND ARMAGH \n", "191 Voluntary NEWRY AND ARMAGH \n", "192 Voluntary MID ULSTER \n", "193 Voluntary SOUTH DOWN \n", "194 Voluntary FERMANAGH AND SOUTH TYRONE \n", "195 Voluntary NEWRY AND ARMAGH \n", "196 Voluntary NEWRY AND ARMAGH \n", "197 Voluntary FERMANAGH AND SOUTH TYRONE \n", "198 Voluntary UPPER BANN \n", "\n", " district council urban/ rural \n", "0 BELFAST Urban \n", "1 BELFAST Urban \n", "2 BELFAST Urban \n", "3 BELFAST Urban \n", "4 BELFAST Urban \n", "5 BELFAST Urban \n", "6 BELFAST Urban \n", "7 BELFAST Urban \n", "8 BELFAST Urban \n", "9 BELFAST Urban \n", "10 BELFAST Urban \n", "11 BELFAST Urban \n", "12 BELFAST Urban \n", "13 BELFAST Urban \n", "14 BELFAST Urban \n", "15 BELFAST Urban \n", "16 BELFAST Urban \n", "17 BELFAST Urban \n", "18 BELFAST Urban \n", "19 BELFAST Urban \n", "20 BELFAST Urban \n", "21 BELFAST Urban \n", "22 BELFAST Urban \n", "23 BELFAST Urban \n", "24 BELFAST Urban \n", "25 BELFAST Urban \n", "26 BELFAST Urban \n", "27 BELFAST Urban \n", "28 BELFAST Urban \n", "29 BELFAST Urban \n", ".. ... ... \n", "169 ARMAGH CITY, BANBRIDGE AND CRAIGAVON Urban \n", "170 NEWRY MOURNE AND DOWN Urban \n", "171 NEWRY MOURNE AND DOWN Urban \n", "172 MID ULSTER Rural \n", "173 NEWRY MOURNE AND DOWN Rural \n", "174 NEWRY MOURNE AND DOWN Rural \n", "175 ARMAGH CITY, BANBRIDGE AND CRAIGAVON Rural \n", "176 MID ULSTER Urban \n", "177 ARMAGH CITY, BANBRIDGE AND CRAIGAVON Urban \n", "178 ARMAGH CITY, BANBRIDGE AND CRAIGAVON Urban \n", "179 MID ULSTER Urban \n", "180 MID ULSTER Urban \n", "181 ARMAGH CITY, BANBRIDGE AND CRAIGAVON Urban \n", "182 ARMAGH CITY, BANBRIDGE AND CRAIGAVON Urban \n", "183 ARMAGH CITY, BANBRIDGE AND CRAIGAVON Rural \n", "184 MID ULSTER Urban \n", "185 ARMAGH CITY, BANBRIDGE AND CRAIGAVON Urban \n", "186 ARMAGH CITY, BANBRIDGE AND CRAIGAVON Urban \n", "187 ARMAGH CITY, BANBRIDGE AND CRAIGAVON Urban \n", "188 NEWRY MOURNE AND DOWN Urban \n", "189 NEWRY MOURNE AND DOWN Urban \n", "190 NEWRY MOURNE AND DOWN Urban \n", "191 NEWRY MOURNE AND DOWN Urban \n", "192 MID ULSTER Rural \n", "193 NEWRY MOURNE AND DOWN Urban \n", "194 MID ULSTER Urban \n", "195 ARMAGH CITY, BANBRIDGE AND CRAIGAVON Urban \n", "196 ARMAGH CITY, BANBRIDGE AND CRAIGAVON Urban \n", "197 MID ULSTER Urban \n", "198 ARMAGH CITY, BANBRIDGE AND CRAIGAVON Urban \n", "\n", "[199 rows x 10 columns]" ] }, "execution_count": 50, "metadata": {}, "output_type": "execute_result" } ], "source": [ "df = df.drop(df.index[0:4]).reset_index(drop=True)\n", "df" ] }, { "cell_type": "code", "execution_count": 51, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:36:11.803125Z", "start_time": "2018-06-07T10:36:11.520592Z" } }, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 51, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "df['district council'].value_counts().plot.pie(autopct='%1.0f%%')" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "![](img/itshappening.webp)" ] }, { "cell_type": "code", "execution_count": 61, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:37:57.306292Z", "start_time": "2018-06-07T10:37:57.083205Z" } }, "outputs": [ { "ename": "TypeError", "evalue": "('sequence item 2: expected str instance, int found', 'occurred at index 0')", "output_type": "error", "traceback": [ "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", "\u001b[0;31mTypeError\u001b[0m Traceback (most recent call last)", "\u001b[0;32m\u001b[0m in \u001b[0;36m\u001b[0;34m()\u001b[0m\n\u001b[1;32m 13\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0;34m'post'\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mfile\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 14\u001b[0m \u001b[0mxls\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mpd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mExcelFile\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34mf'data/education-ni/{year}/{file}'\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 15\u001b[0;31m \u001b[0mdf\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mparse_reference_table\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mxls\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 16\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0mdf\u001b[0m \u001b[0;32mis\u001b[0m \u001b[0;32mnot\u001b[0m \u001b[0;32mNone\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 17\u001b[0m \u001b[0mprint\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34mf'Got reference data for {year}'\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;32m\u001b[0m in \u001b[0;36mparse_reference_table\u001b[0;34m(xls)\u001b[0m\n\u001b[1;32m 3\u001b[0m \u001b[0mdf\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mpd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mread_excel\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mxls\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m'reference data'\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mheader\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mNone\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 4\u001b[0m \u001b[0mjoin_n_strip\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mlambda\u001b[0m \u001b[0ml\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0;34m' '\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mjoin\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0ml\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mstrip\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m----> 5\u001b[0;31m \u001b[0mdf\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcolumns\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mdf\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mix\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m1\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;36m3\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mfillna\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m''\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mapply\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mjoin_n_strip\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0maxis\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mvalues\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 6\u001b[0m \u001b[0mdf\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mdf\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mdrop\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mdf\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mindex\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;36m4\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mreset_index\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mdrop\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mTrue\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 7\u001b[0m \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;32m~/anaconda3/lib/python3.6/site-packages/pandas/core/frame.py\u001b[0m in \u001b[0;36mapply\u001b[0;34m(self, func, axis, broadcast, raw, reduce, args, **kwds)\u001b[0m\n\u001b[1;32m 4875\u001b[0m \u001b[0mf\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0maxis\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 4876\u001b[0m \u001b[0mreduce\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mreduce\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 4877\u001b[0;31m ignore_failures=ignore_failures)\n\u001b[0m\u001b[1;32m 4878\u001b[0m \u001b[0;32melse\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 4879\u001b[0m \u001b[0;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0m_apply_broadcast\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mf\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0maxis\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;32m~/anaconda3/lib/python3.6/site-packages/pandas/core/frame.py\u001b[0m in \u001b[0;36m_apply_standard\u001b[0;34m(self, func, axis, ignore_failures, reduce)\u001b[0m\n\u001b[1;32m 4971\u001b[0m \u001b[0;32mtry\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 4972\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mi\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mv\u001b[0m \u001b[0;32min\u001b[0m \u001b[0menumerate\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mseries_gen\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m-> 4973\u001b[0;31m \u001b[0mresults\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mi\u001b[0m\u001b[0;34m]\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mfunc\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mv\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 4974\u001b[0m \u001b[0mkeys\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mappend\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mv\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mname\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 4975\u001b[0m \u001b[0;32mexcept\u001b[0m \u001b[0mException\u001b[0m \u001b[0;32mas\u001b[0m \u001b[0me\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;32m\u001b[0m in \u001b[0;36m\u001b[0;34m(l)\u001b[0m\n\u001b[1;32m 2\u001b[0m \u001b[0;32mif\u001b[0m \u001b[0;34m'reference data'\u001b[0m \u001b[0;32min\u001b[0m \u001b[0mxls\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0msheet_names\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 3\u001b[0m \u001b[0mdf\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mpd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mread_excel\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mxls\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0;34m'reference data'\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mheader\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mNone\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m----> 4\u001b[0;31m \u001b[0mjoin_n_strip\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;32mlambda\u001b[0m \u001b[0ml\u001b[0m\u001b[0;34m:\u001b[0m \u001b[0;34m' '\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mjoin\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0ml\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mstrip\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 5\u001b[0m \u001b[0mdf\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mcolumns\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mdf\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mix\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m1\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;36m3\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mfillna\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m''\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mapply\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mjoin_n_strip\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0maxis\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mvalues\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 6\u001b[0m \u001b[0mdf\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mdf\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mdrop\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mdf\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mindex\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;36m4\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mreset_index\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mdrop\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;32mTrue\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n", "\u001b[0;31mTypeError\u001b[0m: ('sequence item 2: expected str instance, int found', 'occurred at index 0')" ] } ], "source": [ "def parse_reference_table(xls):\n", " if 'reference data' in xls.sheet_names:\n", " df = pd.read_excel(xls, 'reference data', header=None)\n", " join_n_strip = lambda l: ' '.join(l).strip()\n", " df.columns=df.ix[1:3].fillna('').apply(join_n_strip, axis=0).values\n", " df = df.drop(df.index[0:4]).reset_index(drop=True)\n", " else:\n", " df=None\n", " return df\n", "\n", "for year, files in year_files.items():\n", " for file in files:\n", " if 'post' in file:\n", " xls = pd.ExcelFile(f'data/education-ni/{year}/{file}')\n", " df = parse_reference_table(xls)\n", " if df is not None:\n", " print(f'Got reference data for {year}')\n" ] }, { "cell_type": "code", "execution_count": 62, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:01.143690Z", "start_time": "2018-06-07T10:38:00.550724Z" } }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "('sequence item 2: expected str instance, int found', 'occurred at index 0')\n", "Got reference data for 2009\n", "('sequence item 2: expected str instance, int found', 'occurred at index 0')\n", "Got reference data for 2010\n", "('sequence item 2: expected str instance, int found', 'occurred at index 0')\n", "Got reference data for 2011\n", "('sequence item 2: expected str instance, int found', 'occurred at index 0')\n", "Got reference data for 2012\n", "('sequence item 2: expected str instance, int found', 'occurred at index 0')\n", "Got reference data for 2013\n", "Got reference data for 2014\n", "Got reference data for 2015\n", "Got reference data for 2016\n", "Got reference data for 2017\n" ] } ], "source": [ "def parse_reference_table(xls):\n", " if 'reference data' in xls.sheet_names:\n", " df = pd.read_excel(xls, 'reference data', header=None)\n", " join_n_strip = lambda l: ' '.join(l).strip()\n", " try:\n", " df.columns=df.ix[1:3].fillna('').apply(join_n_strip, axis=0).values\n", " df = df.drop(df.index[0:4]).reset_index(drop=True)\n", " except TypeError as e:\n", " print(e)\n", " else:\n", " df=None\n", " return df\n", "\n", "for year, files in year_files.items():\n", " for file in files:\n", " if 'post' in file:\n", " xls = pd.ExcelFile(f'data/education-ni/{year}/{file}')\n", " df = parse_reference_table(xls)\n", " if df is not None:\n", " print(f'Got reference data for {year}')\n" ] }, { "cell_type": "code", "execution_count": 63, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:05.217935Z", "start_time": "2018-06-07T10:38:05.203057Z" } }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
De refschool nameaddress 1townpostcodeschool typeschool management typeparliamentary constituencydistrict councilurban/ rural
01210014Ashfield Girls' High School397 HOLYWOOD ROADBELFASTBT42LYNon-grammarControlledBELFAST EASTBELFASTUrban
11210015Ashfield Boys' High School395 HOLYWOOD ROADBELFASTBT42LYNon-grammarControlledBELFAST EASTBELFASTUrban
21210021Belfast Model School For Girls35 DUNOWEN GARDENSBELFASTBT146NQNon-grammarControlledBELFAST NORTHBELFASTUrban
31210022Belfast Boys' Model SchoolBALLYSILLAN ROADBELFASTBT146RBNon-grammarControlledBELFAST NORTHBELFASTUrban
41230053St Louise's Comprehensive College468 FALLS ROADBELFASTBT126ENNon-grammarCatholic MaintainedBELFAST WESTBELFASTUrban
\n", "
" ], "text/plain": [ " De ref school name address 1 town \\\n", "0 1210014 Ashfield Girls' High School 397 HOLYWOOD ROAD BELFAST \n", "1 1210015 Ashfield Boys' High School 395 HOLYWOOD ROAD BELFAST \n", "2 1210021 Belfast Model School For Girls 35 DUNOWEN GARDENS BELFAST \n", "3 1210022 Belfast Boys' Model School BALLYSILLAN ROAD BELFAST \n", "4 1230053 St Louise's Comprehensive College 468 FALLS ROAD BELFAST \n", "\n", " postcode school type school management type parliamentary constituency \\\n", "0 BT42LY Non-grammar Controlled BELFAST EAST \n", "1 BT42LY Non-grammar Controlled BELFAST EAST \n", "2 BT146NQ Non-grammar Controlled BELFAST NORTH \n", "3 BT146RB Non-grammar Controlled BELFAST NORTH \n", "4 BT126EN Non-grammar Catholic Maintained BELFAST WEST \n", "\n", " district council urban/ rural \n", "0 BELFAST Urban \n", "1 BELFAST Urban \n", "2 BELFAST Urban \n", "3 BELFAST Urban \n", "4 BELFAST Urban " ] }, "execution_count": 63, "metadata": {}, "output_type": "execute_result" } ], "source": [ "df.head()" ] }, { "cell_type": "code", "execution_count": 64, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:08.482150Z", "start_time": "2018-06-07T10:38:07.824536Z" } }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Got reference data for 2009\n", "Got reference data for 2010\n", "Got reference data for 2011\n", "Got reference data for 2012\n", "Got reference data for 2013\n", "Got reference data for 2014\n", "Got reference data for 2015\n", "Got reference data for 2016\n", "Got reference data for 2017\n" ] } ], "source": [ "join_n_strip_n_lower = lambda l: ' '.join(l).strip().lower()\n", "\n", "def parse_reference_table(xls):\n", " if 'reference data' in xls.sheet_names:\n", " df = pd.read_excel(xls, 'reference data', header=None)\n", " h_range = 2 if isinstance(df.ix[3,0], int) else 3\n", " try:\n", " df.columns=df.ix[1:h_range].fillna('').apply(join_n_strip_n_lower, axis=0).values\n", " df = df.drop(df.index[0:h_range+1]).reset_index(drop=True)\n", " except TypeError as e:\n", " print(e)\n", " else:\n", " df=None\n", " return df\n", "\n", "dfs = {}\n", "for year, files in year_files.items():\n", " for file in files:\n", " if 'post' in file:\n", " xls = pd.ExcelFile(f'data/education-ni/{year}/{file}')\n", " df = parse_reference_table(xls)\n", " if df is not None:\n", " print(f'Got reference data for {year}')\n", " dfs[year]=df\n" ] }, { "cell_type": "code", "execution_count": 65, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:10.816632Z", "start_time": "2018-06-07T10:38:10.520347Z" }, "code_folding": [] }, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 65, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "import seaborn as sns \n", "\n", "all_keys = set([k for df in dfs.values() for k in df.keys() ])\n", "df = pd.DataFrame.from_dict({\n", " year: [k in df.keys() for k in all_keys]\n", " for year, df in dfs.items()\n", "}, orient='index')\n", "df.columns=all_keys\n", "sns.heatmap(df.T)" ] }, { "cell_type": "code", "execution_count": 66, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:19.595005Z", "start_time": "2018-06-07T10:38:19.579726Z" } }, "outputs": [], "source": [ "ref_key_map={\n", " 'denino':'de ref',\n", " 'urban/ rural': 'urban_rural',\n", " 'schoolname': 'school name'\n", "}\n", "join_n_strip_n_lower = lambda l: ' '.join(l).strip().lower()\n", "\n", "def parse_reference_table(xls):\n", " if 'reference data' in xls.sheet_names:\n", " df = pd.read_excel(xls, 'reference data', header=None)\n", " h_range = 2 if isinstance(df.ix[3,0], int) else 3\n", " try:\n", " df.columns=df.ix[1:h_range].fillna('').apply(join_n_strip_n_lower, axis=0).values\n", " df.rename(columns=ref_key_map, inplace=True)\n", " df = df.drop(df.index[0:h_range+1]).reset_index(drop=True)\n", " except TypeError as e:\n", " print(e)\n", " else:\n", " df=None\n", " return df" ] }, { "cell_type": "code", "execution_count": 67, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:21.667359Z", "start_time": "2018-06-07T10:38:20.761431Z" } }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Got reference data for 2009\n", "Got reference data for 2010\n", "Got reference data for 2011\n", "Got reference data for 2012\n", "Got reference data for 2013\n", "Got reference data for 2014\n", "Got reference data for 2015\n", "Got reference data for 2016\n", "Got reference data for 2017\n" ] }, { "data": { "text/plain": [ "" ] }, "execution_count": 67, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "dfs = {}\n", "for year, files in year_files.items():\n", " for file in files:\n", " if 'post' in file:\n", " xls = pd.ExcelFile(f'data/education-ni/{year}/{file}')\n", " df = parse_reference_table(xls)\n", " if df is not None:\n", " print(f'Got reference data for {year}')\n", " dfs[year]=df\n", " \n", "all_keys = set([k for df in dfs.values() for k in df.keys() ])\n", "df = pd.DataFrame.from_dict({\n", " year: [k in df.keys() for k in all_keys]\n", " for year, df in dfs.items()\n", "}, orient='index')\n", "df.columns=all_keys\n", "sns.heatmap(df.T)" ] }, { "cell_type": "code", "execution_count": 68, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:24.375280Z", "start_time": "2018-06-07T10:38:24.369998Z" } }, "outputs": [ { "data": { "text/plain": [ "['parliamentary constituency',\n", " 'urban_rural',\n", " 'school name',\n", " 'school type',\n", " 'address 1',\n", " 'town',\n", " 'postcode',\n", " 'school management type',\n", " 'de ref',\n", " 'district council']" ] }, "execution_count": 68, "metadata": {}, "output_type": "execute_result" } ], "source": [ "cols = [k for k,v in zip(df.columns, df.all()) if v]\n", "cols" ] }, { "cell_type": "code", "execution_count": 69, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:26.047670Z", "start_time": "2018-06-07T10:38:25.115912Z" } }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Got reference data for 2009\n", "Got reference data for 2010\n", "Got reference data for 2011\n", "Got reference data for 2012\n", "Got reference data for 2013\n", "Got reference data for 2014\n", "Got reference data for 2015\n", "Got reference data for 2016\n", "Got reference data for 2017\n" ] }, { "data": { "text/plain": [ "" ] }, "execution_count": 69, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "\n", "\n", "def parse_reference_table(xls):\n", " cols = [\n", " 'de ref',\n", " 'school name',\n", " 'school type',\n", " 'address 1',\n", " 'postcode',\n", " 'urban_rural',\n", " 'school management type',\n", " 'district council',\n", " 'parliamentary constituency',\n", " 'town'\n", " ]\n", "\n", " ref_key_map={\n", " 'denino':'de ref',\n", " 'urban/ rural': 'urban_rural',\n", " 'schoolname': 'school name'\n", " }\n", " join_n_strip_n_lower = lambda l: ' '.join(l).strip().lower()\n", " \n", " if 'reference data' in xls.sheet_names:\n", " df = pd.read_excel(xls, 'reference data', header=None)\n", " h_range = 2 if isinstance(df.ix[3,0], int) else 3\n", " try:\n", " df.columns=df.ix[1:h_range].fillna('').apply(join_n_strip_n_lower, axis=0).values\n", " df.rename(columns=ref_key_map, inplace=True)\n", " df = df.drop(df.index[0:h_range+1]).reset_index(drop=True)\n", " df = df[cols]\n", " except TypeError as e:\n", " print(e)\n", " else:\n", " df=None\n", " return df\n", "\n", "dfs = {}\n", "for year, files in year_files.items():\n", " for file in files:\n", " if 'post' in file:\n", " xls = pd.ExcelFile(f'data/education-ni/{year}/{file}')\n", " df = parse_reference_table(xls)\n", " if df is not None:\n", " print(f'Got reference data for {year}')\n", " dfs[year]=df\n", " \n", "all_keys = set([k for df in dfs.values() for k in df.keys() ])\n", "df = pd.DataFrame.from_dict({\n", " year: [k in df.keys() for k in all_keys]\n", " for year, df in dfs.items()\n", "}, orient='index')\n", "df.columns=all_keys\n", "sns.heatmap(df.T)" ] }, { "cell_type": "code", "execution_count": 70, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:30.420856Z", "start_time": "2018-06-07T10:38:29.605434Z" } }, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 70, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "sheets = defaultdict(list)\n", "for year, files in year_files.items():\n", " for file in files:\n", " if 'post' in file:\n", " xls = pd.ExcelFile(f'data/education-ni/{year}/{file}')\n", " sheets[year].extend(xls.sheet_names)\n", "\n", "all_sheet_names = set([_ for d in sheets.values() for _ in d])\n", "df = pd.DataFrame.from_dict({\n", " year: [sn in sheet_names for sn in all_sheet_names] \n", " for year, sheet_names in sheets.items()\n", "}, orient='index')\n", "df.columns=all_sheet_names\n", "sns.heatmap(df.T)" ] }, { "cell_type": "code", "execution_count": 71, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:35.401268Z", "start_time": "2018-06-07T10:38:35.395496Z" } }, "outputs": [ { "data": { "text/plain": [ "Index(['meta data', 'gender', 'unfilled places', 'SEN', 'enrolments',\n", " 'School level data', 'Overall', 'newcomers', 'religion',\n", " 'free school meals', 'reference data'],\n", " dtype='object')" ] }, "execution_count": 71, "metadata": {}, "output_type": "execute_result" } ], "source": [ "df.keys()" ] }, { "cell_type": "markdown", "metadata": { "ExecuteTime": { "end_time": "2018-06-06T15:33:48.284478Z", "start_time": "2018-06-06T15:33:48.155990Z" } }, "source": [ "![](img/enrolements_2017.png)" ] }, { "cell_type": "code", "execution_count": 72, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:37.961073Z", "start_time": "2018-06-07T10:38:37.910934Z" } }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
0123456789
0Data on Pupils attending post primary schools ...NaNNaNNaNNaNNaNNaNNaNNaNNaN
1NaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
2NaNNaNyear of enrolmentNaNNaNNaNNaNNaNNaNNaN
3DE refSchoolnameyear 8year 9year 10year 11year 12year 13year 14total pupils
41210014Ashfield Girls' High School1241141191111136050691
\n", "
" ], "text/plain": [ " 0 \\\n", "0 Data on Pupils attending post primary schools ... \n", "1 NaN \n", "2 NaN \n", "3 DE ref \n", "4 1210014 \n", "\n", " 1 2 3 4 5 \\\n", "0 NaN NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN NaN \n", "2 NaN year of enrolment NaN NaN NaN \n", "3 Schoolname year 8 year 9 year 10 year 11 \n", "4 Ashfield Girls' High School 124 114 119 111 \n", "\n", " 6 7 8 9 \n", "0 NaN NaN NaN NaN \n", "1 NaN NaN NaN NaN \n", "2 NaN NaN NaN NaN \n", "3 year 12 year 13 year 14 total pupils \n", "4 113 60 50 691 " ] }, "execution_count": 72, "metadata": {}, "output_type": "execute_result" } ], "source": [ "xls = pd.ExcelFile(f'data/education-ni/2017/School%20level%20-%20post%20primary%20schools%20data%20supp%201718.xls')\n", "df = pd.read_excel(xls, 'enrolments', header=None)\n", "df.head()" ] }, { "cell_type": "code", "execution_count": 73, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:41.099926Z", "start_time": "2018-06-07T10:38:41.051310Z" } }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
de refschoolnameyear of enrolment year 8year 9year 10year 11year 12year 13year 14total pupils
01210014Ashfield Girls' High School1241141191111136050691
11210015Ashfield Boys' High School1261211171211118460740
21210021Belfast Model School For Girls16716016213912112770946
31210022Belfast Boys' Model School1741791651541608976997
41230053St Louise's Comprehensive College2361941892062641601861435
51230104Mercy College Belfast76667176737117450
61230130St Rose’s Dominican College16253237377224243
71230146Christian Brothers School, Belfast107709547408779525
81230155St Genevieve's High School164161152152165138901022
91230182De La Salle College10916516416117311967958
101230262Corpus Christi College24234540383726233
111230275St Joseph's College, Belfast1231121251111044736658
121230321Blessed Trinity College204204216178191189891271
131240291Colaiste Feirste102119102112977148651
141260269Hazelwood College1701711531471449475954
151260294Malone Integrated College69698863857437485
161410079Grosvenor Grammar School1601581621631541501331080
171410270Wellington College1121191141171228573742
181410315Bloomfield Collegiate1011101011101079378700
191420020Campbell College13414314714814796107922
201420021St Mary's Christian Brothers' Grammar, Belfast1781851821741651571241165
211420022Methodist College2412472562552532662581776
221420027The Royal Belfast Academical Institution1521601601641461141161012
231420028Belfast Royal Academy2072112092162092211881461
241420029St Dominic's High School, Belfast1411471451441561491301012
251420030St Malachy's College, Belfast1591611651711661511211094
261420082Dominican College, Belfast152148151153147152981001
271420089Strathearn School, Belfast111116121110111103106778
281420095Rathmore Grammar School1841861861861841831611270
291420264Victoria College132138141136127120103897
.................................
1785230218St Catherine's College1731731591571891251281104
1795230278Holy Trinity College159163171169160112871021
1805230293St Patrick's College, Dungannon10610998921014935590
1815230321St John The Baptist College7750375100170
1825250216Brownlow Int College626243526600285
1835260285New-Bridge Integrated College1091071011061045236615
1845260286Integrated College Dungannon119999794934149592
1855410013Banbridge Academy1851871931961961841601301
1865410057Lurgan College000122116115102455
1875410067Portadown College000205207171161744
1885420045St Louis Grammar School, Kilkeel82838481848169564
1895420059Abbey Christian Brothers Grammar School128130129132136115115885
1905420060Our Lady's Grammar School126124124126125117111853
1915420062St Colman's College, Newry127126131130125118128885
1925420073St Joseph's Convent Grammar School, Donaghmore991021059210210680686
1935420076Sacred Heart Grammar School, Newry123123120120119122116843
1945420260The Royal School, Dungannon9396107931057470638
1955420263The Royal School, Armagh10310399108106103113735
1965420268St Patrick's Grammar School, Armagh126164132155156126108967
1975420304St Patrick's Academy, Dungannon1971981981892001761821340
1985420314St Ronan’s College2852432071822491571461469
199NaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
200NaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
201NaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
202NaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
203Source: NI school censusNaNNaNNaNNaNNaNNaNNaNNaNNaN
204NaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
205Notes:NaNNaNNaNNaNNaNNaNNaNNaNNaN
2061. Year groups refer to the level of study of ...NaNNaNNaNNaNNaNNaNNaNNaNNaN
2072. Pupils aged 16+ that are not studying level...NaNNaNNaNNaNNaNNaNNaNNaNNaN
\n", "

208 rows × 10 columns

\n", "
" ], "text/plain": [ " de ref \\\n", "0 1210014 \n", "1 1210015 \n", "2 1210021 \n", "3 1210022 \n", "4 1230053 \n", "5 1230104 \n", "6 1230130 \n", "7 1230146 \n", "8 1230155 \n", "9 1230182 \n", "10 1230262 \n", "11 1230275 \n", "12 1230321 \n", "13 1240291 \n", "14 1260269 \n", "15 1260294 \n", "16 1410079 \n", "17 1410270 \n", "18 1410315 \n", "19 1420020 \n", "20 1420021 \n", "21 1420022 \n", "22 1420027 \n", "23 1420028 \n", "24 1420029 \n", "25 1420030 \n", "26 1420082 \n", "27 1420089 \n", "28 1420095 \n", "29 1420264 \n", ".. ... \n", "178 5230218 \n", "179 5230278 \n", "180 5230293 \n", "181 5230321 \n", "182 5250216 \n", "183 5260285 \n", "184 5260286 \n", "185 5410013 \n", "186 5410057 \n", "187 5410067 \n", "188 5420045 \n", "189 5420059 \n", "190 5420060 \n", "191 5420062 \n", "192 5420073 \n", "193 5420076 \n", "194 5420260 \n", "195 5420263 \n", "196 5420268 \n", "197 5420304 \n", "198 5420314 \n", "199 NaN \n", "200 NaN \n", "201 NaN \n", "202 NaN \n", "203 Source: NI school census \n", "204 NaN \n", "205 Notes: \n", "206 1. Year groups refer to the level of study of ... \n", "207 2. Pupils aged 16+ that are not studying level... \n", "\n", " schoolname year of enrolment year 8 \\\n", "0 Ashfield Girls' High School 124 \n", "1 Ashfield Boys' High School 126 \n", "2 Belfast Model School For Girls 167 \n", "3 Belfast Boys' Model School 174 \n", "4 St Louise's Comprehensive College 236 \n", "5 Mercy College Belfast 76 \n", "6 St Rose’s Dominican College 16 \n", "7 Christian Brothers School, Belfast 107 \n", "8 St Genevieve's High School 164 \n", "9 De La Salle College 109 \n", "10 Corpus Christi College 24 \n", "11 St Joseph's College, Belfast 123 \n", "12 Blessed Trinity College 204 \n", "13 Colaiste Feirste 102 \n", "14 Hazelwood College 170 \n", "15 Malone Integrated College 69 \n", "16 Grosvenor Grammar School 160 \n", "17 Wellington College 112 \n", "18 Bloomfield Collegiate 101 \n", "19 Campbell College 134 \n", "20 St Mary's Christian Brothers' Grammar, Belfast 178 \n", "21 Methodist College 241 \n", "22 The Royal Belfast Academical Institution 152 \n", "23 Belfast Royal Academy 207 \n", "24 St Dominic's High School, Belfast 141 \n", "25 St Malachy's College, Belfast 159 \n", "26 Dominican College, Belfast 152 \n", "27 Strathearn School, Belfast 111 \n", "28 Rathmore Grammar School 184 \n", "29 Victoria College 132 \n", ".. ... ... \n", "178 St Catherine's College 173 \n", "179 Holy Trinity College 159 \n", "180 St Patrick's College, Dungannon 106 \n", "181 St John The Baptist College 77 \n", "182 Brownlow Int College 62 \n", "183 New-Bridge Integrated College 109 \n", "184 Integrated College Dungannon 119 \n", "185 Banbridge Academy 185 \n", "186 Lurgan College 0 \n", "187 Portadown College 0 \n", "188 St Louis Grammar School, Kilkeel 82 \n", "189 Abbey Christian Brothers Grammar School 128 \n", "190 Our Lady's Grammar School 126 \n", "191 St Colman's College, Newry 127 \n", "192 St Joseph's Convent Grammar School, Donaghmore 99 \n", "193 Sacred Heart Grammar School, Newry 123 \n", "194 The Royal School, Dungannon 93 \n", "195 The Royal School, Armagh 103 \n", "196 St Patrick's Grammar School, Armagh 126 \n", "197 St Patrick's Academy, Dungannon 197 \n", "198 St Ronan’s College 285 \n", "199 NaN NaN \n", "200 NaN NaN \n", "201 NaN NaN \n", "202 NaN NaN \n", "203 NaN NaN \n", "204 NaN NaN \n", "205 NaN NaN \n", "206 NaN NaN \n", "207 NaN NaN \n", "\n", " year 9 year 10 year 11 year 12 year 13 year 14 total pupils \n", "0 114 119 111 113 60 50 691 \n", "1 121 117 121 111 84 60 740 \n", "2 160 162 139 121 127 70 946 \n", "3 179 165 154 160 89 76 997 \n", "4 194 189 206 264 160 186 1435 \n", "5 66 71 76 73 71 17 450 \n", "6 25 32 37 37 72 24 243 \n", "7 70 95 47 40 87 79 525 \n", "8 161 152 152 165 138 90 1022 \n", "9 165 164 161 173 119 67 958 \n", "10 23 45 40 38 37 26 233 \n", "11 112 125 111 104 47 36 658 \n", "12 204 216 178 191 189 89 1271 \n", "13 119 102 112 97 71 48 651 \n", "14 171 153 147 144 94 75 954 \n", "15 69 88 63 85 74 37 485 \n", "16 158 162 163 154 150 133 1080 \n", "17 119 114 117 122 85 73 742 \n", "18 110 101 110 107 93 78 700 \n", "19 143 147 148 147 96 107 922 \n", "20 185 182 174 165 157 124 1165 \n", "21 247 256 255 253 266 258 1776 \n", "22 160 160 164 146 114 116 1012 \n", "23 211 209 216 209 221 188 1461 \n", "24 147 145 144 156 149 130 1012 \n", "25 161 165 171 166 151 121 1094 \n", "26 148 151 153 147 152 98 1001 \n", "27 116 121 110 111 103 106 778 \n", "28 186 186 186 184 183 161 1270 \n", "29 138 141 136 127 120 103 897 \n", ".. ... ... ... ... ... ... ... \n", "178 173 159 157 189 125 128 1104 \n", "179 163 171 169 160 112 87 1021 \n", "180 109 98 92 101 49 35 590 \n", "181 50 37 5 1 0 0 170 \n", "182 62 43 52 66 0 0 285 \n", "183 107 101 106 104 52 36 615 \n", "184 99 97 94 93 41 49 592 \n", "185 187 193 196 196 184 160 1301 \n", "186 0 0 122 116 115 102 455 \n", "187 0 0 205 207 171 161 744 \n", "188 83 84 81 84 81 69 564 \n", "189 130 129 132 136 115 115 885 \n", "190 124 124 126 125 117 111 853 \n", "191 126 131 130 125 118 128 885 \n", "192 102 105 92 102 106 80 686 \n", "193 123 120 120 119 122 116 843 \n", "194 96 107 93 105 74 70 638 \n", "195 103 99 108 106 103 113 735 \n", "196 164 132 155 156 126 108 967 \n", "197 198 198 189 200 176 182 1340 \n", "198 243 207 182 249 157 146 1469 \n", "199 NaN NaN NaN NaN NaN NaN NaN \n", "200 NaN NaN NaN NaN NaN NaN NaN \n", "201 NaN NaN NaN NaN NaN NaN NaN \n", "202 NaN NaN NaN NaN NaN NaN NaN \n", "203 NaN NaN NaN NaN NaN NaN NaN \n", "204 NaN NaN NaN NaN NaN NaN NaN \n", "205 NaN NaN NaN NaN NaN NaN NaN \n", "206 NaN NaN NaN NaN NaN NaN NaN \n", "207 NaN NaN NaN NaN NaN NaN NaN \n", "\n", "[208 rows x 10 columns]" ] }, "execution_count": 73, "metadata": {}, "output_type": "execute_result" } ], "source": [ "def parse_enrolments_table(xls):\n", " join_n_strip_n_lower = lambda l: ' '.join(l).strip().lower()\n", " \n", " if 'enrolments' in xls.sheet_names:\n", " df = pd.read_excel(xls, 'enrolments', header=None)\n", " h_range = 2 if isinstance(df.ix[3,0], int) else 3\n", " try:\n", " df.columns=df.ix[1:h_range].fillna('').apply(join_n_strip_n_lower, axis=0).values\n", " df = df.drop(df.index[0:h_range+1]).reset_index(drop=True)\n", " except TypeError as e:\n", " print(e)\n", " else:\n", " df=None\n", " return df\n", "df= parse_enrolments_table(xls)\n", "df" ] }, { "cell_type": "code", "execution_count": 74, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:41.870545Z", "start_time": "2018-06-07T10:38:41.833695Z" } }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
schoolnameyear of enrolment year 8year 9year 10year 11year 12year 13year 14total pupils
de ref
1210014Ashfield Girls' High School1241141191111136050691
1210015Ashfield Boys' High School1261211171211118460740
1210021Belfast Model School For Girls16716016213912112770946
1210022Belfast Boys' Model School1741791651541608976997
1230053St Louise's Comprehensive College2361941892062641601861435
1230104Mercy College Belfast76667176737117450
1230130St Rose’s Dominican College16253237377224243
1230146Christian Brothers School, Belfast107709547408779525
1230155St Genevieve's High School164161152152165138901022
1230182De La Salle College10916516416117311967958
1230262Corpus Christi College24234540383726233
1230275St Joseph's College, Belfast1231121251111044736658
1230321Blessed Trinity College204204216178191189891271
1240291Colaiste Feirste102119102112977148651
1260269Hazelwood College1701711531471449475954
1260294Malone Integrated College69698863857437485
1410079Grosvenor Grammar School1601581621631541501331080
1410270Wellington College1121191141171228573742
1410315Bloomfield Collegiate1011101011101079378700
1420020Campbell College13414314714814796107922
1420021St Mary's Christian Brothers' Grammar, Belfast1781851821741651571241165
1420022Methodist College2412472562552532662581776
1420027The Royal Belfast Academical Institution1521601601641461141161012
1420028Belfast Royal Academy2072112092162092211881461
1420029St Dominic's High School, Belfast1411471451441561491301012
1420030St Malachy's College, Belfast1591611651711661511211094
1420082Dominican College, Belfast152148151153147152981001
1420089Strathearn School, Belfast111116121110111103106778
1420095Rathmore Grammar School1841861861861841831611270
1420264Victoria College132138141136127120103897
..............................
5230218St Catherine's College1731731591571891251281104
5230278Holy Trinity College159163171169160112871021
5230293St Patrick's College, Dungannon10610998921014935590
5230321St John The Baptist College7750375100170
5250216Brownlow Int College626243526600285
5260285New-Bridge Integrated College1091071011061045236615
5260286Integrated College Dungannon119999794934149592
5410013Banbridge Academy1851871931961961841601301
5410057Lurgan College000122116115102455
5410067Portadown College000205207171161744
5420045St Louis Grammar School, Kilkeel82838481848169564
5420059Abbey Christian Brothers Grammar School128130129132136115115885
5420060Our Lady's Grammar School126124124126125117111853
5420062St Colman's College, Newry127126131130125118128885
5420073St Joseph's Convent Grammar School, Donaghmore991021059210210680686
5420076Sacred Heart Grammar School, Newry123123120120119122116843
5420260The Royal School, Dungannon9396107931057470638
5420263The Royal School, Armagh10310399108106103113735
5420268St Patrick's Grammar School, Armagh126164132155156126108967
5420304St Patrick's Academy, Dungannon1971981981892001761821340
5420314St Ronan’s College2852432071822491571461469
NaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
NaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
NaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
NaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
Source: NI school censusNaNNaNNaNNaNNaNNaNNaNNaNNaN
NaNNaNNaNNaNNaNNaNNaNNaNNaNNaN
Notes:NaNNaNNaNNaNNaNNaNNaNNaNNaN
1. Year groups refer to the level of study of pupils i.e. Pupils in their final year of GCSEs (including those repeating are in year 12)NaNNaNNaNNaNNaNNaNNaNNaNNaN
2. Pupils aged 16+ that are not studying level 2 or 3 qualifications have been recorded as year 12 pupilsNaNNaNNaNNaNNaNNaNNaNNaNNaN
\n", "

208 rows × 9 columns

\n", "
" ], "text/plain": [ " schoolname \\\n", "de ref \n", "1210014 Ashfield Girls' High School \n", "1210015 Ashfield Boys' High School \n", "1210021 Belfast Model School For Girls \n", "1210022 Belfast Boys' Model School \n", "1230053 St Louise's Comprehensive College \n", "1230104 Mercy College Belfast \n", "1230130 St Rose’s Dominican College \n", "1230146 Christian Brothers School, Belfast \n", "1230155 St Genevieve's High School \n", "1230182 De La Salle College \n", "1230262 Corpus Christi College \n", "1230275 St Joseph's College, Belfast \n", "1230321 Blessed Trinity College \n", "1240291 Colaiste Feirste \n", "1260269 Hazelwood College \n", "1260294 Malone Integrated College \n", "1410079 Grosvenor Grammar School \n", "1410270 Wellington College \n", "1410315 Bloomfield Collegiate \n", "1420020 Campbell College \n", "1420021 St Mary's Christian Brothers' Grammar, Belfast \n", "1420022 Methodist College \n", "1420027 The Royal Belfast Academical Institution \n", "1420028 Belfast Royal Academy \n", "1420029 St Dominic's High School, Belfast \n", "1420030 St Malachy's College, Belfast \n", "1420082 Dominican College, Belfast \n", "1420089 Strathearn School, Belfast \n", "1420095 Rathmore Grammar School \n", "1420264 Victoria College \n", "... ... \n", "5230218 St Catherine's College \n", "5230278 Holy Trinity College \n", "5230293 St Patrick's College, Dungannon \n", "5230321 St John The Baptist College \n", "5250216 Brownlow Int College \n", "5260285 New-Bridge Integrated College \n", "5260286 Integrated College Dungannon \n", "5410013 Banbridge Academy \n", "5410057 Lurgan College \n", "5410067 Portadown College \n", "5420045 St Louis Grammar School, Kilkeel \n", "5420059 Abbey Christian Brothers Grammar School \n", "5420060 Our Lady's Grammar School \n", "5420062 St Colman's College, Newry \n", "5420073 St Joseph's Convent Grammar School, Donaghmore \n", "5420076 Sacred Heart Grammar School, Newry \n", "5420260 The Royal School, Dungannon \n", "5420263 The Royal School, Armagh \n", "5420268 St Patrick's Grammar School, Armagh \n", "5420304 St Patrick's Academy, Dungannon \n", "5420314 St Ronan’s College \n", "NaN NaN \n", "NaN NaN \n", "NaN NaN \n", "NaN NaN \n", "Source: NI school census NaN \n", "NaN NaN \n", "Notes: NaN \n", "1. Year groups refer to the level of study of p... NaN \n", "2. Pupils aged 16+ that are not studying level ... NaN \n", "\n", " year of enrolment year 8 \\\n", "de ref \n", "1210014 124 \n", "1210015 126 \n", "1210021 167 \n", "1210022 174 \n", "1230053 236 \n", "1230104 76 \n", "1230130 16 \n", "1230146 107 \n", "1230155 164 \n", "1230182 109 \n", "1230262 24 \n", "1230275 123 \n", "1230321 204 \n", "1240291 102 \n", "1260269 170 \n", "1260294 69 \n", "1410079 160 \n", "1410270 112 \n", "1410315 101 \n", "1420020 134 \n", "1420021 178 \n", "1420022 241 \n", "1420027 152 \n", "1420028 207 \n", "1420029 141 \n", "1420030 159 \n", "1420082 152 \n", "1420089 111 \n", "1420095 184 \n", "1420264 132 \n", "... ... \n", "5230218 173 \n", "5230278 159 \n", "5230293 106 \n", "5230321 77 \n", "5250216 62 \n", "5260285 109 \n", "5260286 119 \n", "5410013 185 \n", "5410057 0 \n", "5410067 0 \n", "5420045 82 \n", "5420059 128 \n", "5420060 126 \n", "5420062 127 \n", "5420073 99 \n", "5420076 123 \n", "5420260 93 \n", "5420263 103 \n", "5420268 126 \n", "5420304 197 \n", "5420314 285 \n", "NaN NaN \n", "NaN NaN \n", "NaN NaN \n", "NaN NaN \n", "Source: NI school census NaN \n", "NaN NaN \n", "Notes: NaN \n", "1. Year groups refer to the level of study of p... NaN \n", "2. Pupils aged 16+ that are not studying level ... NaN \n", "\n", " year 9 year 10 year 11 \\\n", "de ref \n", "1210014 114 119 111 \n", "1210015 121 117 121 \n", "1210021 160 162 139 \n", "1210022 179 165 154 \n", "1230053 194 189 206 \n", "1230104 66 71 76 \n", "1230130 25 32 37 \n", "1230146 70 95 47 \n", "1230155 161 152 152 \n", "1230182 165 164 161 \n", "1230262 23 45 40 \n", "1230275 112 125 111 \n", "1230321 204 216 178 \n", "1240291 119 102 112 \n", "1260269 171 153 147 \n", "1260294 69 88 63 \n", "1410079 158 162 163 \n", "1410270 119 114 117 \n", "1410315 110 101 110 \n", "1420020 143 147 148 \n", "1420021 185 182 174 \n", "1420022 247 256 255 \n", "1420027 160 160 164 \n", "1420028 211 209 216 \n", "1420029 147 145 144 \n", "1420030 161 165 171 \n", "1420082 148 151 153 \n", "1420089 116 121 110 \n", "1420095 186 186 186 \n", "1420264 138 141 136 \n", "... ... ... ... \n", "5230218 173 159 157 \n", "5230278 163 171 169 \n", "5230293 109 98 92 \n", "5230321 50 37 5 \n", "5250216 62 43 52 \n", "5260285 107 101 106 \n", "5260286 99 97 94 \n", "5410013 187 193 196 \n", "5410057 0 0 122 \n", "5410067 0 0 205 \n", "5420045 83 84 81 \n", "5420059 130 129 132 \n", "5420060 124 124 126 \n", "5420062 126 131 130 \n", "5420073 102 105 92 \n", "5420076 123 120 120 \n", "5420260 96 107 93 \n", "5420263 103 99 108 \n", "5420268 164 132 155 \n", "5420304 198 198 189 \n", "5420314 243 207 182 \n", "NaN NaN NaN NaN \n", "NaN NaN NaN NaN \n", "NaN NaN NaN NaN \n", "NaN NaN NaN NaN \n", "Source: NI school census NaN NaN NaN \n", "NaN NaN NaN NaN \n", "Notes: NaN NaN NaN \n", "1. Year groups refer to the level of study of p... NaN NaN NaN \n", "2. Pupils aged 16+ that are not studying level ... NaN NaN NaN \n", "\n", " year 12 year 13 year 14 \\\n", "de ref \n", "1210014 113 60 50 \n", "1210015 111 84 60 \n", "1210021 121 127 70 \n", "1210022 160 89 76 \n", "1230053 264 160 186 \n", "1230104 73 71 17 \n", "1230130 37 72 24 \n", "1230146 40 87 79 \n", "1230155 165 138 90 \n", "1230182 173 119 67 \n", "1230262 38 37 26 \n", "1230275 104 47 36 \n", "1230321 191 189 89 \n", "1240291 97 71 48 \n", "1260269 144 94 75 \n", "1260294 85 74 37 \n", "1410079 154 150 133 \n", "1410270 122 85 73 \n", "1410315 107 93 78 \n", "1420020 147 96 107 \n", "1420021 165 157 124 \n", "1420022 253 266 258 \n", "1420027 146 114 116 \n", "1420028 209 221 188 \n", "1420029 156 149 130 \n", "1420030 166 151 121 \n", "1420082 147 152 98 \n", "1420089 111 103 106 \n", "1420095 184 183 161 \n", "1420264 127 120 103 \n", "... ... ... ... \n", "5230218 189 125 128 \n", "5230278 160 112 87 \n", "5230293 101 49 35 \n", "5230321 1 0 0 \n", "5250216 66 0 0 \n", "5260285 104 52 36 \n", "5260286 93 41 49 \n", "5410013 196 184 160 \n", "5410057 116 115 102 \n", "5410067 207 171 161 \n", "5420045 84 81 69 \n", "5420059 136 115 115 \n", "5420060 125 117 111 \n", "5420062 125 118 128 \n", "5420073 102 106 80 \n", "5420076 119 122 116 \n", "5420260 105 74 70 \n", "5420263 106 103 113 \n", "5420268 156 126 108 \n", "5420304 200 176 182 \n", "5420314 249 157 146 \n", "NaN NaN NaN NaN \n", "NaN NaN NaN NaN \n", "NaN NaN NaN NaN \n", "NaN NaN NaN NaN \n", "Source: NI school census NaN NaN NaN \n", "NaN NaN NaN NaN \n", "Notes: NaN NaN NaN \n", "1. Year groups refer to the level of study of p... NaN NaN NaN \n", "2. Pupils aged 16+ that are not studying level ... NaN NaN NaN \n", "\n", " total pupils \n", "de ref \n", "1210014 691 \n", "1210015 740 \n", "1210021 946 \n", "1210022 997 \n", "1230053 1435 \n", "1230104 450 \n", "1230130 243 \n", "1230146 525 \n", "1230155 1022 \n", "1230182 958 \n", "1230262 233 \n", "1230275 658 \n", "1230321 1271 \n", "1240291 651 \n", "1260269 954 \n", "1260294 485 \n", "1410079 1080 \n", "1410270 742 \n", "1410315 700 \n", "1420020 922 \n", "1420021 1165 \n", "1420022 1776 \n", "1420027 1012 \n", "1420028 1461 \n", "1420029 1012 \n", "1420030 1094 \n", "1420082 1001 \n", "1420089 778 \n", "1420095 1270 \n", "1420264 897 \n", "... ... \n", "5230218 1104 \n", "5230278 1021 \n", "5230293 590 \n", "5230321 170 \n", "5250216 285 \n", "5260285 615 \n", "5260286 592 \n", "5410013 1301 \n", "5410057 455 \n", "5410067 744 \n", "5420045 564 \n", "5420059 885 \n", "5420060 853 \n", "5420062 885 \n", "5420073 686 \n", "5420076 843 \n", "5420260 638 \n", "5420263 735 \n", "5420268 967 \n", "5420304 1340 \n", "5420314 1469 \n", "NaN NaN \n", "NaN NaN \n", "NaN NaN \n", "NaN NaN \n", "Source: NI school census NaN \n", "NaN NaN \n", "Notes: NaN \n", "1. Year groups refer to the level of study of p... NaN \n", "2. Pupils aged 16+ that are not studying level ... NaN \n", "\n", "[208 rows x 9 columns]" ] }, "execution_count": 74, "metadata": {}, "output_type": "execute_result" } ], "source": [ "df.set_index('de ref')" ] }, { "cell_type": "code", "execution_count": 75, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:42.352573Z", "start_time": "2018-06-07T10:38:42.315910Z" } }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
de refschoolnameyear 8year 9year 10year 11year 12year 13year 14total pupils
1945420260The Royal School, Dungannon9396107931057470638
1955420263The Royal School, Armagh10310399108106103113735
1965420268St Patrick's Grammar School, Armagh126164132155156126108967
1975420304St Patrick's Academy, Dungannon1971981981892001761821340
1985420314St Ronan’s College2852432071822491571461469
\n", "
" ], "text/plain": [ " de ref schoolname year 8 year 9 year 10 \\\n", "194 5420260 The Royal School, Dungannon 93 96 107 \n", "195 5420263 The Royal School, Armagh 103 103 99 \n", "196 5420268 St Patrick's Grammar School, Armagh 126 164 132 \n", "197 5420304 St Patrick's Academy, Dungannon 197 198 198 \n", "198 5420314 St Ronan’s College 285 243 207 \n", "\n", " year 11 year 12 year 13 year 14 total pupils \n", "194 93 105 74 70 638 \n", "195 108 106 103 113 735 \n", "196 155 156 126 108 967 \n", "197 189 200 176 182 1340 \n", "198 182 249 157 146 1469 " ] }, "execution_count": 75, "metadata": {}, "output_type": "execute_result" } ], "source": [ "def parse_enrolments_table(xls):\n", " join_n_strip_n_lower = lambda l: ' '.join(l).strip().lower()\n", " strip_n_lower = lambda s: s.strip().lower()\n", " \n", " if 'enrolments' in xls.sheet_names:\n", " df = pd.read_excel(xls, 'enrolments', header=None, skip_footer=5)\n", " h_range = 2 if isinstance(df.ix[3,0], int) else 3\n", " try:\n", " df.columns=df.ix[3].fillna('').apply(strip_n_lower).values\n", " df = df.drop(df.index[0:h_range+1]).reset_index(drop=True)\n", " df.dropna(how='all', inplace=True, axis=0)\n", " \n", " except TypeError as e:\n", " print(e)\n", " else:\n", " df=None\n", " return df\n", "parse_enrolments_table(xls).tail()" ] }, { "cell_type": "code", "execution_count": 76, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:42.926747Z", "start_time": "2018-06-07T10:38:42.889118Z" } }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
year 8year 9year 10year 11year 12year 13year 14total pupils
de ref
12100141241141191111136050691
12100151261211171211118460740
121002116716016213912112770946
12100221741791651541608976997
12300532361941892062641601861435
123010476667176737117450
123013016253237377224243
1230146107709547408779525
1230155164161152152165138901022
123018210916516416117311967958
123026224234540383726233
12302751231121251111044736658
1230321204204216178191189891271
1240291102119102112977148651
12602691701711531471449475954
126029469698863857437485
14100791601581621631541501331080
14102701121191141171228573742
14103151011101011101079378700
142002013414314714814796107922
14200211781851821741651571241165
14200222412472562552532662581776
14200271521601601641461141161012
14200282072112092162092211881461
14200291411471451441561491301012
14200301591611651711661511211094
1420082152148151153147152981001
1420089111116121110111103106778
14200951841861861861841831611270
1420264132138141136127120103897
...........................
523007610574775648918387
5230108981029993874552576
52301351431231391381426169815
52301521281311191141347396795
52301572442382862542481531371560
5230167114117105931084038615
52301871611611501701721181001032
5230192829079595200362
523021318219318722119696671142
52302181731731591571891251281104
5230278159163171169160112871021
523029310610998921014935590
52303217750375100170
5250216626243526600285
52602851091071011061045236615
5260286119999794934149592
54100131851871931961961841601301
5410057000122116115102455
5410067000205207171161744
542004582838481848169564
5420059128130129132136115115885
5420060126124124126125117111853
5420062127126131130125118128885
5420073991021059210210680686
5420076123123120120119122116843
54202609396107931057470638
542026310310399108106103113735
5420268126164132155156126108967
54203041971981981892001761821340
54203142852432071822491571461469
\n", "

199 rows × 8 columns

\n", "
" ], "text/plain": [ " year 8 year 9 year 10 year 11 year 12 year 13 year 14 total pupils\n", "de ref \n", "1210014 124 114 119 111 113 60 50 691\n", "1210015 126 121 117 121 111 84 60 740\n", "1210021 167 160 162 139 121 127 70 946\n", "1210022 174 179 165 154 160 89 76 997\n", "1230053 236 194 189 206 264 160 186 1435\n", "1230104 76 66 71 76 73 71 17 450\n", "1230130 16 25 32 37 37 72 24 243\n", "1230146 107 70 95 47 40 87 79 525\n", "1230155 164 161 152 152 165 138 90 1022\n", "1230182 109 165 164 161 173 119 67 958\n", "1230262 24 23 45 40 38 37 26 233\n", "1230275 123 112 125 111 104 47 36 658\n", "1230321 204 204 216 178 191 189 89 1271\n", "1240291 102 119 102 112 97 71 48 651\n", "1260269 170 171 153 147 144 94 75 954\n", "1260294 69 69 88 63 85 74 37 485\n", "1410079 160 158 162 163 154 150 133 1080\n", "1410270 112 119 114 117 122 85 73 742\n", "1410315 101 110 101 110 107 93 78 700\n", "1420020 134 143 147 148 147 96 107 922\n", "1420021 178 185 182 174 165 157 124 1165\n", "1420022 241 247 256 255 253 266 258 1776\n", "1420027 152 160 160 164 146 114 116 1012\n", "1420028 207 211 209 216 209 221 188 1461\n", "1420029 141 147 145 144 156 149 130 1012\n", "1420030 159 161 165 171 166 151 121 1094\n", "1420082 152 148 151 153 147 152 98 1001\n", "1420089 111 116 121 110 111 103 106 778\n", "1420095 184 186 186 186 184 183 161 1270\n", "1420264 132 138 141 136 127 120 103 897\n", "... ... ... ... ... ... ... ... ...\n", "5230076 105 74 77 56 48 9 18 387\n", "5230108 98 102 99 93 87 45 52 576\n", "5230135 143 123 139 138 142 61 69 815\n", "5230152 128 131 119 114 134 73 96 795\n", "5230157 244 238 286 254 248 153 137 1560\n", "5230167 114 117 105 93 108 40 38 615\n", "5230187 161 161 150 170 172 118 100 1032\n", "5230192 82 90 79 59 52 0 0 362\n", "5230213 182 193 187 221 196 96 67 1142\n", "5230218 173 173 159 157 189 125 128 1104\n", "5230278 159 163 171 169 160 112 87 1021\n", "5230293 106 109 98 92 101 49 35 590\n", "5230321 77 50 37 5 1 0 0 170\n", "5250216 62 62 43 52 66 0 0 285\n", "5260285 109 107 101 106 104 52 36 615\n", "5260286 119 99 97 94 93 41 49 592\n", "5410013 185 187 193 196 196 184 160 1301\n", "5410057 0 0 0 122 116 115 102 455\n", "5410067 0 0 0 205 207 171 161 744\n", "5420045 82 83 84 81 84 81 69 564\n", "5420059 128 130 129 132 136 115 115 885\n", "5420060 126 124 124 126 125 117 111 853\n", "5420062 127 126 131 130 125 118 128 885\n", "5420073 99 102 105 92 102 106 80 686\n", "5420076 123 123 120 120 119 122 116 843\n", "5420260 93 96 107 93 105 74 70 638\n", "5420263 103 103 99 108 106 103 113 735\n", "5420268 126 164 132 155 156 126 108 967\n", "5420304 197 198 198 189 200 176 182 1340\n", "5420314 285 243 207 182 249 157 146 1469\n", "\n", "[199 rows x 8 columns]" ] }, "execution_count": 76, "metadata": {}, "output_type": "execute_result" } ], "source": [ "df = parse_enrolments_table(xls).set_index('de ref').drop('schoolname', axis=1)\n", "df" ] }, { "cell_type": "code", "execution_count": 77, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:43.497926Z", "start_time": "2018-06-07T10:38:43.467190Z" } }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
year 8year 9year 10year 11year 12year 13year 14
de ref
12100141241141191111136050
12100151261211171211118460
121002116716016213912112770
12100221741791651541608976
1230053236194189206264160186
123010476667176737117
123013016253237377224
1230146107709547408779
123015516416115215216513890
123018210916516416117311967
123026224234540383726
12302751231121251111044736
123032120420421617819118989
1240291102119102112977148
12602691701711531471449475
126029469698863857437
1410079160158162163154150133
14102701121191141171228573
14103151011101011101079378
142002013414314714814796107
1420021178185182174165157124
1420022241247256255253266258
1420027152160160164146114116
1420028207211209216209221188
1420029141147145144156149130
1420030159161165171166151121
142008215214815115314715298
1420089111116121110111103106
1420095184186186186184183161
1420264132138141136127120103
........................
523007610574775648918
5230108981029993874552
52301351431231391381426169
52301521281311191141347396
5230157244238286254248153137
5230167114117105931084038
5230187161161150170172118100
5230192829079595200
52302131821931872211969667
5230218173173159157189125128
523027815916317116916011287
523029310610998921014935
52303217750375100
5250216626243526600
52602851091071011061045236
5260286119999794934149
5410013185187193196196184160
5410057000122116115102
5410067000205207171161
542004582838481848169
5420059128130129132136115115
5420060126124124126125117111
5420062127126131130125118128
5420073991021059210210680
5420076123123120120119122116
54202609396107931057470
542026310310399108106103113
5420268126164132155156126108
5420304197198198189200176182
5420314285243207182249157146
\n", "

199 rows × 7 columns

\n", "
" ], "text/plain": [ " year 8 year 9 year 10 year 11 year 12 year 13 year 14\n", "de ref \n", "1210014 124 114 119 111 113 60 50\n", "1210015 126 121 117 121 111 84 60\n", "1210021 167 160 162 139 121 127 70\n", "1210022 174 179 165 154 160 89 76\n", "1230053 236 194 189 206 264 160 186\n", "1230104 76 66 71 76 73 71 17\n", "1230130 16 25 32 37 37 72 24\n", "1230146 107 70 95 47 40 87 79\n", "1230155 164 161 152 152 165 138 90\n", "1230182 109 165 164 161 173 119 67\n", "1230262 24 23 45 40 38 37 26\n", "1230275 123 112 125 111 104 47 36\n", "1230321 204 204 216 178 191 189 89\n", "1240291 102 119 102 112 97 71 48\n", "1260269 170 171 153 147 144 94 75\n", "1260294 69 69 88 63 85 74 37\n", "1410079 160 158 162 163 154 150 133\n", "1410270 112 119 114 117 122 85 73\n", "1410315 101 110 101 110 107 93 78\n", "1420020 134 143 147 148 147 96 107\n", "1420021 178 185 182 174 165 157 124\n", "1420022 241 247 256 255 253 266 258\n", "1420027 152 160 160 164 146 114 116\n", "1420028 207 211 209 216 209 221 188\n", "1420029 141 147 145 144 156 149 130\n", "1420030 159 161 165 171 166 151 121\n", "1420082 152 148 151 153 147 152 98\n", "1420089 111 116 121 110 111 103 106\n", "1420095 184 186 186 186 184 183 161\n", "1420264 132 138 141 136 127 120 103\n", "... ... ... ... ... ... ... ...\n", "5230076 105 74 77 56 48 9 18\n", "5230108 98 102 99 93 87 45 52\n", "5230135 143 123 139 138 142 61 69\n", "5230152 128 131 119 114 134 73 96\n", "5230157 244 238 286 254 248 153 137\n", "5230167 114 117 105 93 108 40 38\n", "5230187 161 161 150 170 172 118 100\n", "5230192 82 90 79 59 52 0 0\n", "5230213 182 193 187 221 196 96 67\n", "5230218 173 173 159 157 189 125 128\n", "5230278 159 163 171 169 160 112 87\n", "5230293 106 109 98 92 101 49 35\n", "5230321 77 50 37 5 1 0 0\n", "5250216 62 62 43 52 66 0 0\n", "5260285 109 107 101 106 104 52 36\n", "5260286 119 99 97 94 93 41 49\n", "5410013 185 187 193 196 196 184 160\n", "5410057 0 0 0 122 116 115 102\n", "5410067 0 0 0 205 207 171 161\n", "5420045 82 83 84 81 84 81 69\n", "5420059 128 130 129 132 136 115 115\n", "5420060 126 124 124 126 125 117 111\n", "5420062 127 126 131 130 125 118 128\n", "5420073 99 102 105 92 102 106 80\n", "5420076 123 123 120 120 119 122 116\n", "5420260 93 96 107 93 105 74 70\n", "5420263 103 103 99 108 106 103 113\n", "5420268 126 164 132 155 156 126 108\n", "5420304 197 198 198 189 200 176 182\n", "5420314 285 243 207 182 249 157 146\n", "\n", "[199 rows x 7 columns]" ] }, "execution_count": 77, "metadata": {}, "output_type": "execute_result" } ], "source": [ "df[[c for c in df if c.startswith('year')]]" ] }, { "cell_type": "code", "execution_count": 78, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:44.183563Z", "start_time": "2018-06-07T10:38:44.034416Z" } }, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 78, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "iVBORw0KGgoAAAANSUhEUgAAAYcAAAEYCAYAAAC3LjroAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADl0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uIDIuMi4yLCBodHRwOi8vbWF0cGxvdGxpYi5vcmcvhp/UCwAAEu1JREFUeJzt3X+w5XV93/HnC5DoaJQlbIlhMWt0ayBaEVegrW1VkmWxTsCYWvlDNkbZRCE1iTMVnUwXtXaIGZMJM8aEyFaoaSiTRKUpZt0SpzbJkO6iUUDU3RAJS0HWLNE0lBDk3T/O53ZP9nMv9+y9e/Z7Tvb5mDlzzvl8f5zX2bm7r/1+v59zbqoKSZLGHTd0AEnS7LEcJEkdy0GS1LEcJEkdy0GS1LEcJEkdy0GS1LEcJEkdy0GS1Dlh6AArdcopp9T69euHjiFJc+X222//RlWtXW69uS2H9evXs3v37qFjSNJcSXLvJOt5WkmS1LEcJEkdy0GS1LEcJEkdy0GS1LEcJEkdy0GS1LEcJEkdy0GS1JnbT0gfrvVX/rep7v9rV//Lqe5fko6mY6Yc5tpVz5ry/r853f1LmjueVpIkdSwHSVLH00qauhdd/6Kp7v+OLXdMdf/SscgjB0lSxyMHaRl3f/8ZU93/GV++e6r7/9BP/v5U93/5r75qqvvXMDxykCR1LAdJUsdykCR1LAdJUsdykCR1LAdJUsdykCR1LAdJUsdykCR1LAdJUsdykCR1LAdJUsdykCR1LAdJUsdykCR1li2HJKcn+UySLyW5K8nb2/jJSXYm2dPu17TxJLkmyd4kX0xy9ti+trT19yTZMjb+0iR3tG2uSZJpvFlJ0mQmOXJ4HHhHVZ0JnAdcnuRM4Erg1qraANzangNcCGxot63Ah2FUJsA24FzgHGDbQqG0dS4b227z6t+aJGmlli2Hqnqgqj7XHv8VcDdwGnARcH1b7Xrg4vb4IuCGGrkNOCnJs4ELgJ1VdaCqHgZ2ApvbsmdW1W1VVcANY/uSJA3gsK45JFkPvAT4Y+DUqnqgLXoQOLU9Pg24b2yzfW3sycb3LTK+2OtvTbI7ye79+/cfTnRJ0mGYuBySPAP4beCnq+pb48va//jrCGfrVNW1VbWxqjauXbt22i8nScesicohyVMYFcNvVNXvtOGvt1NCtPuH2vj9wOljm69rY082vm6RcUnSQCaZrRTgOuDuqvrFsUU3AwszjrYAnxwbv7TNWjoP+GY7/bQD2JRkTbsQvQnY0ZZ9K8l57bUuHduXJGkAJ0ywzj8F3gjckeRP2ti7gauBm5K8GbgXeH1bdgvwamAv8AjwJoCqOpDkfcCutt57q+pAe/w24KPA04BPtZskaSDLlkNV/QGw1OcOzl9k/QIuX2Jf24Hti4zvBl64XBZJ0tHhJ6QlSR3LQZLUsRwkSR3LQZLUsRwkSR3LQZLUsRwkSR3LQZLUsRwkSR3LQZLUsRwkSR3LQZLUsRwkSR3LQZLUsRwkSR3LQZLUsRwkSR3LQZLUsRwkSR3LQZLUsRwkSR3LQZLUsRwkSR3LQZLUsRwkSR3LQZLUsRwkSR3LQZLUsRwkSR3LQZLUsRwkSR3LQZLUsRwkSR3LQZLUsRwkSR3LQZLUOWG5FZJsB14DPFRVL2xjVwGXAfvbau+uqlvasncBbwa+DfybqtrRxjcDvwwcD3ykqq5u488FbgS+C7gdeGNVPXak3qCk+fbBf/2aqe7/Hf/ld6e6/3k1yZHDR4HNi4z/UlWd1W4LxXAm8AbgB9o2v5Lk+CTHAx8CLgTOBC5p6wL8fNvX84GHGRWLJGlAy5ZDVX0WODDh/i4Cbqyqv6mqPwP2Aue0296quqcdFdwIXJQkwKuA32rbXw9cfJjvQZJ0hK3mmsMVSb6YZHuSNW3sNOC+sXX2tbGlxr8L+MuqevyQcUnSgFZaDh8GngecBTwAfPCIJXoSSbYm2Z1k9/79+5ffQJK0Iisqh6r6elV9u6qeAH6d0WkjgPuB08dWXdfGlhr/C+CkJCccMr7U615bVRurauPatWtXEl2SNIEVlUOSZ489fS1wZ3t8M/CGJN/RZiFtAP4XsAvYkOS5SU5kdNH65qoq4DPAj7bttwCfXEkmSdKRM8lU1t8EXgGckmQfsA14RZKzgAK+BvwEQFXdleQm4EvA48DlVfXttp8rgB2MprJur6q72ku8E7gxyb8HPg9cd8TenSRpRZYth6q6ZJHhJf8Br6r3A+9fZPwW4JZFxu/h4GkpSdIM8BPSkqSO5SBJ6lgOkqSO5SBJ6lgOkqSO5SBJ6lgOkqSO5SBJ6lgOkqSO5SBJ6lgOkqTOst+tJElauX1X/s+p7n/d1f9sKvv1yEGS1LEcJEkdy0GS1LEcJEkdy0GS1LEcJEkdy0GS1LEcJEkdy0GS1LEcJEkdy0GS1LEcJEkdy0GS1LEcJEkdy0GS1LEcJEkdy0GS1LEcJEkdy0GS1LEcJEkdy0GS1LEcJEkdy0GS1LEcJEmdZcshyfYkDyW5c2zs5CQ7k+xp92vaeJJck2Rvki8mOXtsmy1t/T1JtoyNvzTJHW2ba5LkSL9JSdLhmeTI4aPA5kPGrgRuraoNwK3tOcCFwIZ22wp8GEZlAmwDzgXOAbYtFEpb57Kx7Q59LUnSUbZsOVTVZ4EDhwxfBFzfHl8PXDw2fkON3AaclOTZwAXAzqo6UFUPAzuBzW3ZM6vqtqoq4IaxfUmSBrLSaw6nVtUD7fGDwKnt8WnAfWPr7WtjTza+b5FxSdKAVn1Buv2Pv45AlmUl2Zpkd5Ld+/fvPxovKUnHpJWWw9fbKSHa/UNt/H7g9LH11rWxJxtft8j4oqrq2qraWFUb165du8LokqTlrLQcbgYWZhxtAT45Nn5pm7V0HvDNdvppB7ApyZp2IXoTsKMt+1aS89ospUvH9iVJGsgJy62Q5DeBVwCnJNnHaNbR1cBNSd4M3Au8vq1+C/BqYC/wCPAmgKo6kOR9wK623nurauEi99sYzYh6GvCpdpMkDWjZcqiqS5ZYdP4i6xZw+RL72Q5sX2R8N/DC5XJIko4ePyEtSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSeqsqhySfC3JHUn+JMnuNnZykp1J9rT7NW08Sa5JsjfJF5OcPbafLW39PUm2rO4tSZJW60gcObyyqs6qqo3t+ZXArVW1Abi1PQe4ENjQbluBD8OoTIBtwLnAOcC2hUKRJA1jGqeVLgKub4+vBy4eG7+hRm4DTkrybOACYGdVHaiqh4GdwOYp5JIkTWi15VDAp5PcnmRrGzu1qh5ojx8ETm2PTwPuG9t2XxtbaryTZGuS3Ul279+/f5XRJUlLOWGV27+8qu5P8g+AnUm+PL6wqipJrfI1xvd3LXAtwMaNG4/YfiVJf9eqjhyq6v52/xDwcUbXDL7eThfR7h9qq98PnD62+bo2ttS4JGkgKy6HJE9P8p0Lj4FNwJ3AzcDCjKMtwCfb45uBS9uspfOAb7bTTzuATUnWtAvRm9qYJGkgqzmtdCrw8SQL+/nPVfV7SXYBNyV5M3Av8Pq2/i3Aq4G9wCPAmwCq6kCS9wG72nrvraoDq8glSVqlFZdDVd0DvHiR8b8Azl9kvIDLl9jXdmD7SrNIko4sPyEtSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkjuUgSepYDpKkzsyUQ5LNSb6SZG+SK4fOI0nHspkohyTHAx8CLgTOBC5JcuawqSTp2DUT5QCcA+ytqnuq6jHgRuCigTNJ0jFrVsrhNOC+sef72pgkaQCpqqEzkORHgc1V9Zb2/I3AuVV1xSHrbQW2tqcvAL4yxVinAN+Y4v6naZ6zg/mHZv5hTTv/91bV2uVWOmGKAQ7H/cDpY8/XtbG/o6quBa49GoGS7K6qjUfjtY60ec4O5h+a+Yc1K/ln5bTSLmBDkucmORF4A3DzwJkk6Zg1E0cOVfV4kiuAHcDxwPaqumvgWJJ0zJqJcgCoqluAW4bOMeaonL6aknnODuYfmvmHNRP5Z+KCtCRptszKNQdJ0gyxHCRJHctBg8rIuUl+pN3OTZKhc61Wku8fOsOkkjxlkbFThshyuJIcl+S49vjEJGcnOXnoXCuV5G1DZ1gwMxekh5JkI/ALjD5X8S5gO6Ov8/gqsLWqPj9gvCeV5BnAvwVex+izIY8Bfwr8alV9dMBoE0myCfgVYA8HP9eyDnh+krdV1acHC7d6nwaeM3SIJ5PklcB/Ap6a5HOMft6/1hZ/Gjh7qGyTSHIx8GvAE0l+Eng38H+AFyR5a1X910EDLiPJzx46BLwryVMBquoXj36qg475cmD0j9M24CTgj4CfqaofSnJ+W/aPhwy3jN8APg5cALweeDqj76X6uST/sKrePWS4Cfwy8INj/yABkOS5jGaunTFEqEkluWapRYx+nmbdB4ALququ9i0FO5O8sapuY/QeZt024MXA04AvAC+rqq8k+V7gt4GZLgfgPYx+zu/i4J/38cB3DpZozDE/WynJ56vqJe3xn1fVcxZbNouSfKGqXjz2fFdVvawdZn+pqmb61EaSPcAZVfX4IeMnMsr//GGSTSbJXwHvAP5mkcUfrKqZPjWzyM/PDwC/A7wT+HdVNetHDuN/d++sqheOLfvcHOR/DvBB4B7gPVX1SJJ7qur7Bo4GeOQA8Gg7vfEsoJJcXFWfSPIvgG8PnG05f53k5VX1B0l+GDgAUFVPzMl5++3AriQ3cvCLF09n9An56wZLNbldwJ1V9UeHLkhy1dGPc9j+Nsl3V9WDAO0I4nzgd4HnDRttMkmOq6ongB8fGzseOHG4VJOpqj8H/lWSixgdtf3S0JnGeeSQvJjR4fUTwM8AbwW2MDoHftlif/FnRZJ/BHwE2MDo0PTHq+qrSdYCl1TVUqc9ZkaSMxh9PfvCt/DeD9xcVV8aLtVk2oXPR6vqkaGzrESSHwT2V9UXDhl/FnBFVb1/mGSTSfIy4I6qevSQ8fXAy6vqY0PkWokkTweuYvSFo/984DiA5SBJWoRTWTWTknxq6AyrYf5hmX/1vOagwSRZ6oJhgLOOZpaVMP+wzD9dlgOji1rAebN8fWEp85yd0QXd/8Hi0ybnYSqo+Ydl/inymkMz69NWn8y8Zk9yJ/DaqtqzyLL7qur0RTabGeYflvmny2sOB92a5HVzMgX0UPOa/SqW/hn8qaOYY6WuwvxDugrzT41HDk37QNPTgceBRxkd6lVVPXPQYBOY5+ySZpPlIEnqeEF6TJI1jD5Q9tSFsar67HCJJjfP2SXNHq85NEneAnyW0e+xfk+7v2rITJOa8+zHJfknQ+dYKfMPy/zTYzkc9HbgZcC9VfVK4CXAXw4baWJzm719L86Hhs6xUuYflvmnx3I46NGF72hJ8h1V9WXgBQNnmtQ8Z4f5nW21wPzDMv8UeEG6SfJx4E3ATwOvAh4GnlJVrx402ATmOTvM/2wr8w/L/FPKZTn02td1Pwv4vap6bOg8h2Oes0uaHZbDmCQvBzZU1X9sX3v9jKr6s6FzTWKes8P8z7Yy/7DMPwVV5W1UkNsY/VrBr7bn3wP84dC5/r5nb3nfAtzB6HTYZ4D/C/z+0LnMP3w28w9384L0Qa8Ffhj4a4Cq+t/MyO9yncA8Z4c5nm3VmH9Y5p8Cy+Ggx2pU4wX//zczzYt5zg7zP9vK/MMy/xT4CemDbkrya8BJSS5j9Dtpf33gTJOa5+wA+5KcBHyC0e/SfRi4d+BMh8P8wzL/FHhBekySHwI2MZpKtqOqdg4caWLznH3cvM+2Mv+wzH8Es1gOI0l+CvhYVT08dJbDNc/ZF/w9mG1l/gGZ/8jzmsNBpwK7ktyUZPOsfVpxGfOcnSTbgHcC72pDTwE+Nlyiw2P+YZl/OiyHpqp+jtE84+uAHwP2JPkPSZ43aLAJzHP2Zt5nW5l/WOafAsthTJvx82C7PQ6sAX4ryQcGDTaBec7O/M+2Mv+wzD8FlkOT5O1Jbgc+APwh8KKqeivwUuB1g4Zbxjxnbw6dbfXfma/ZVuYflvmnwAvSTZL3ANurqptCluSMqrp7gFgTmefsC+Z9tpX5h2X+I89y0ODmfbaV+Ydl/unwtJJmwVzPtsL8QzP/FHjkoJnQ/kJsYvR7KTYCNwHXVdWfDhpsQuYflvmPPI8cNBPmfLaV+Qdm/iPPIwcNLsnbgUuBbwAfAT5RVX+b5DhgT1XN9Oc1zD8s80+HX7ynWXAy8COHzraqqieSvGagTIfD/MMy/xR45CBJ6njNQZLUsRwkSR3LQZLUsRwkSR3LQZLU+X+Tm7+4y3s0YwAAAABJRU5ErkJggg==\n", "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "df[[c for c in df if c.startswith('year')]].sum().plot.bar()" ] }, { "cell_type": "code", "execution_count": 79, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:44.903497Z", "start_time": "2018-06-07T10:38:44.896726Z" } }, "outputs": [ { "data": { "text/plain": [ "False" ] }, "execution_count": 79, "metadata": {}, "output_type": "execute_result" } ], "source": [ "my_totals = df[[c for c in df if c.startswith('year')]].sum(axis=1)\n", "their_totals = df['total pupils']\n", "any(my_totals!=their_totals)" ] }, { "cell_type": "code", "execution_count": 80, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:46.271140Z", "start_time": "2018-06-07T10:38:45.493049Z" } }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Got enrolement data for 2009\n", "Got enrolement data for 2010\n", "Got enrolement data for 2011\n", "Got enrolement data for 2012\n", "Got enrolement data for 2013\n", "Got enrolement data for 2014\n", "Got enrolement data for 2015\n", "Got enrolement data for 2016\n", "Got enrolement data for 2017\n" ] } ], "source": [ "dfs = {}\n", "for year, files in year_files.items():\n", " for file in files:\n", " if 'post' in file:\n", " xls = pd.ExcelFile(f'data/education-ni/{year}/{file}')\n", " df = parse_enrolments_table(xls)\n", " if df is not None:\n", " print(f'Got enrolement data for {year}')\n", " dfs[year]=df" ] }, { "cell_type": "code", "execution_count": 81, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:46.791083Z", "start_time": "2018-06-07T10:38:46.782093Z" } }, "outputs": [ { "data": { "text/plain": [ "{1210014,\n", " 1210015,\n", " 1210021,\n", " 1210022,\n", " 1210266,\n", " 1230026,\n", " 1230053,\n", " 1230089,\n", " 1230104,\n", " 1230130,\n", " 1230146,\n", " '1230155',\n", " 1230155,\n", " '1230155 ',\n", " 1230173,\n", " '1230173',\n", " '1230173 ',\n", " 1230182,\n", " '1230182',\n", " '1230182 ',\n", " 1230262,\n", " '1230275',\n", " 1230275,\n", " '1230275 ',\n", " 1230321,\n", " 1240291,\n", " 1260269,\n", " 1260294,\n", " 1410079,\n", " 1410270,\n", " 1410315,\n", " 1420018,\n", " 1420020,\n", " 1420021,\n", " 1420022,\n", " 1420027,\n", " 1420028,\n", " 1420029,\n", " 1420030,\n", " 1420082,\n", " 1420089,\n", " 1420095,\n", " 1420264,\n", " 1420265,\n", " 1420277,\n", " 2210065,\n", " 2210080,\n", " 2210125,\n", " 2210164,\n", " 2210302,\n", " 2210305,\n", " 2210306,\n", " 2210312,\n", " 2230077,\n", " 2230081,\n", " 2230085,\n", " 2230099,\n", " 2230100,\n", " 2230109,\n", " 2230111,\n", " 2230122,\n", " 2230131,\n", " 2230138,\n", " 2230144,\n", " 2230148,\n", " 2230166,\n", " 2230180,\n", " 2230181,\n", " 2230188,\n", " 2230190,\n", " 2230225,\n", " 2230254,\n", " 2230298,\n", " 2230301,\n", " 2230322,\n", " 2240319,\n", " 2260276,\n", " 2260280,\n", " 2260283,\n", " 2410040,\n", " 2410048,\n", " 2410066,\n", " 2410096,\n", " 2410311,\n", " 2420041,\n", " 2420042,\n", " 2420043,\n", " 2420052,\n", " 2420054,\n", " 2420064,\n", " 2420065,\n", " 2420229,\n", " 2420287,\n", " 2420320,\n", " 3210013,\n", " 3210035,\n", " 3210038,\n", " 3210091,\n", " 3210124,\n", " 3210133,\n", " 3210134,\n", " 3210172,\n", " 3210200,\n", " 3210202,\n", " 3210208,\n", " 3210222,\n", " 3210232,\n", " 3210233,\n", " 3210279,\n", " 3210300,\n", " 3210313,\n", " 3230019,\n", " 3230066,\n", " 3230075,\n", " 3230084,\n", " 3230110,\n", " 3230132,\n", " 3230142,\n", " 3230151,\n", " 3230168,\n", " 3230203,\n", " 3230227,\n", " 3230234,\n", " 3230308,\n", " 3230310,\n", " 3250149,\n", " 3250207,\n", " 3260289,\n", " 3260290,\n", " 3260299,\n", " 3260303,\n", " 3410008,\n", " 3410033,\n", " 3410098,\n", " 3410209,\n", " 3410297,\n", " 3420010,\n", " 3420011,\n", " 3420012,\n", " 3420032,\n", " 3420034,\n", " 3420046,\n", " 3420058,\n", " 3420068,\n", " 3420077,\n", " 3420080,\n", " 3420094,\n", " 3420317,\n", " 4210012,\n", " 4210029,\n", " 4210045,\n", " 4210046,\n", " 4210051,\n", " 4210063,\n", " 4210086,\n", " 4210183,\n", " 4210194,\n", " 4210201,\n", " 4210262,\n", " 4210296,\n", " 4210316,\n", " 4230023,\n", " 4230067,\n", " 4230102,\n", " 4230107,\n", " 4230161,\n", " 4230165,\n", " 4230211,\n", " 4230223,\n", " 4230224,\n", " 4250024,\n", " 4250072,\n", " 4260255,\n", " 4260281,\n", " 4260295,\n", " 4260309,\n", " 4410063,\n", " 4410085,\n", " 4410097,\n", " 4420015,\n", " 4420044,\n", " 4420050,\n", " 4420051,\n", " 4420086,\n", " 4420088,\n", " 4420259,\n", " 5210016,\n", " 5210025,\n", " 5210043,\n", " 5210047,\n", " 5210054,\n", " 5210064,\n", " 5210083,\n", " 5210097,\n", " 5210121,\n", " 5210127,\n", " 5210143,\n", " 5210153,\n", " 5210186,\n", " 5210230,\n", " 5210231,\n", " 5210271,\n", " 5210282,\n", " 5230056,\n", " 5230059,\n", " 5230070,\n", " 5230076,\n", " 5230088,\n", " 5230108,\n", " 5230135,\n", " 5230152,\n", " 5230157,\n", " 5230160,\n", " 5230167,\n", " 5230187,\n", " 5230192,\n", " 5230213,\n", " 5230218,\n", " 5230256,\n", " 5230278,\n", " 5230293,\n", " 5230321,\n", " 5250216,\n", " 5260285,\n", " 5260286,\n", " 5410013,\n", " 5410057,\n", " 5410067,\n", " 5420045,\n", " 5420056,\n", " 5420059,\n", " 5420060,\n", " 5420062,\n", " 5420073,\n", " 5420076,\n", " 5420260,\n", " 5420263,\n", " 5420268,\n", " 5420304,\n", " 5420314}" ] }, "execution_count": 81, "metadata": {}, "output_type": "execute_result" } ], "source": [ "all_de_refs = set([_ for d in dfs.values() for _ in d['de ref'].values])\n", "all_de_refs" ] }, { "cell_type": "code", "execution_count": 82, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:47.755895Z", "start_time": "2018-06-07T10:38:47.748919Z" } }, "outputs": [ { "data": { "text/plain": [ "{1210014,\n", " 1210015,\n", " 1210021,\n", " 1210022,\n", " 1210266,\n", " 1230026,\n", " 1230053,\n", " 1230089,\n", " 1230104,\n", " 1230130,\n", " 1230146,\n", " 1230155,\n", " 1230173,\n", " 1230182,\n", " 1230262,\n", " 1230275,\n", " 1230321,\n", " 1240291,\n", " 1260269,\n", " 1260294,\n", " 1410079,\n", " 1410270,\n", " 1410315,\n", " 1420018,\n", " 1420020,\n", " 1420021,\n", " 1420022,\n", " 1420027,\n", " 1420028,\n", " 1420029,\n", " 1420030,\n", " 1420082,\n", " 1420089,\n", " 1420095,\n", " 1420264,\n", " 1420265,\n", " 1420277,\n", " 2210065,\n", " 2210080,\n", " 2210125,\n", " 2210164,\n", " 2210302,\n", " 2210305,\n", " 2210306,\n", " 2210312,\n", " 2230077,\n", " 2230081,\n", " 2230085,\n", " 2230099,\n", " 2230100,\n", " 2230109,\n", " 2230111,\n", " 2230122,\n", " 2230131,\n", " 2230138,\n", " 2230144,\n", " 2230148,\n", " 2230166,\n", " 2230180,\n", " 2230181,\n", " 2230188,\n", " 2230190,\n", " 2230225,\n", " 2230254,\n", " 2230298,\n", " 2230301,\n", " 2230322,\n", " 2240319,\n", " 2260276,\n", " 2260280,\n", " 2260283,\n", " 2410040,\n", " 2410048,\n", " 2410066,\n", " 2410096,\n", " 2410311,\n", " 2420041,\n", " 2420042,\n", " 2420043,\n", " 2420052,\n", " 2420054,\n", " 2420064,\n", " 2420065,\n", " 2420229,\n", " 2420287,\n", " 2420320,\n", " 3210013,\n", " 3210035,\n", " 3210038,\n", " 3210091,\n", " 3210124,\n", " 3210133,\n", " 3210134,\n", " 3210172,\n", " 3210200,\n", " 3210202,\n", " 3210208,\n", " 3210222,\n", " 3210232,\n", " 3210233,\n", " 3210279,\n", " 3210300,\n", " 3210313,\n", " 3230019,\n", " 3230066,\n", " 3230075,\n", " 3230084,\n", " 3230110,\n", " 3230132,\n", " 3230142,\n", " 3230151,\n", " 3230168,\n", " 3230203,\n", " 3230227,\n", " 3230234,\n", " 3230308,\n", " 3230310,\n", " 3250149,\n", " 3250207,\n", " 3260289,\n", " 3260290,\n", " 3260299,\n", " 3260303,\n", " 3410008,\n", " 3410033,\n", " 3410098,\n", " 3410209,\n", " 3410297,\n", " 3420010,\n", " 3420011,\n", " 3420012,\n", " 3420032,\n", " 3420034,\n", " 3420046,\n", " 3420058,\n", " 3420068,\n", " 3420077,\n", " 3420080,\n", " 3420094,\n", " 3420317,\n", " 4210012,\n", " 4210029,\n", " 4210045,\n", " 4210046,\n", " 4210051,\n", " 4210063,\n", " 4210086,\n", " 4210183,\n", " 4210194,\n", " 4210201,\n", " 4210262,\n", " 4210296,\n", " 4210316,\n", " 4230023,\n", " 4230067,\n", " 4230102,\n", " 4230107,\n", " 4230161,\n", " 4230165,\n", " 4230211,\n", " 4230223,\n", " 4230224,\n", " 4250024,\n", " 4250072,\n", " 4260255,\n", " 4260281,\n", " 4260295,\n", " 4260309,\n", " 4410063,\n", " 4410085,\n", " 4410097,\n", " 4420015,\n", " 4420044,\n", " 4420050,\n", " 4420051,\n", " 4420086,\n", " 4420088,\n", " 4420259,\n", " 5210016,\n", " 5210025,\n", " 5210043,\n", " 5210047,\n", " 5210054,\n", " 5210064,\n", " 5210083,\n", " 5210097,\n", " 5210121,\n", " 5210127,\n", " 5210143,\n", " 5210153,\n", " 5210186,\n", " 5210230,\n", " 5210231,\n", " 5210271,\n", " 5210282,\n", " 5230056,\n", " 5230059,\n", " 5230070,\n", " 5230076,\n", " 5230088,\n", " 5230108,\n", " 5230135,\n", " 5230152,\n", " 5230157,\n", " 5230160,\n", " 5230167,\n", " 5230187,\n", " 5230192,\n", " 5230213,\n", " 5230218,\n", " 5230256,\n", " 5230278,\n", " 5230293,\n", " 5230321,\n", " 5250216,\n", " 5260285,\n", " 5260286,\n", " 5410013,\n", " 5410057,\n", " 5410067,\n", " 5420045,\n", " 5420056,\n", " 5420059,\n", " 5420060,\n", " 5420062,\n", " 5420073,\n", " 5420076,\n", " 5420260,\n", " 5420263,\n", " 5420268,\n", " 5420304,\n", " 5420314}" ] }, "execution_count": 82, "metadata": {}, "output_type": "execute_result" } ], "source": [ "all_de_refs = set([int(_) for d in dfs.values() for _ in d['de ref'].values])\n", "all_de_refs" ] }, { "cell_type": "code", "execution_count": 83, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:48.793652Z", "start_time": "2018-06-07T10:38:48.493937Z" } }, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 83, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "df = pd.DataFrame.from_dict({\n", " year: [dr in df['de ref'].values for dr in all_de_refs] \n", " for year, df in dfs.items()\n", "}, orient='index')\n", "df.columns=all_de_refs\n", "sns.heatmap(df.T)" ] }, { "cell_type": "code", "execution_count": 84, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:49.433620Z", "start_time": "2018-06-07T10:38:49.429249Z" } }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "2009:['de ref' 'schoolname' 'year 8' 'year 9' 'year 10' 'year 11' 'year 12'\n", " 'year 13' 'year 14' 'year 15' 'total pupils']\n", "2010:['de ref' 'schoolname' 'year 8' 'year 9' 'year 10' 'year 11' 'year 12'\n", " 'year 13' 'year 14' 'year 15' 'total pupils']\n", "2011:['de ref' 'schoolname' 'year 8' 'year 9' 'year 10' 'year 11' 'year 12'\n", " 'year 13' 'year 14' 'year 15' 'total pupils']\n", "2012:['de ref' 'schoolname' 'year 8' 'year 9' 'year 10' 'year 11' 'year 12'\n", " 'year 13' 'year 14' 'year 15' 'total pupils']\n", "2013:['de ref' 'schoolname' 'year 8' 'year 9' 'year 10' 'year 11' 'year 12'\n", " 'year 13' 'year 14' 'year 15' 'total pupils']\n", "2014:['de ref' 'schoolname' 'year 8' 'year 9' 'year 10' 'year 11' 'year 12'\n", " 'year 13' 'year 14' 'year 15' 'total pupils']\n", "2015:['de ref' 'schoolname' 'year 8' 'year 9' 'year 10' 'year 11' 'year 12'\n", " 'year 13' 'year 14' 'year 15' 'total pupils']\n", "2016:['de ref' 'schoolname' 'year 8' 'year 9' 'year 10' 'year 11' 'year 12'\n", " 'year 13' 'year 14' 'total pupils']\n", "2017:['de ref' 'schoolname' 'year 8' 'year 9' 'year 10' 'year 11' 'year 12'\n", " 'year 13' 'year 14' 'total pupils']\n" ] } ], "source": [ "for year, df in dfs.items():\n", " print(f\"{year}:{df.keys().values}\")" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## Grand pivot\n" ] }, { "cell_type": "code", "execution_count": 85, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:51.359399Z", "start_time": "2018-06-07T10:38:50.653976Z" } }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Got enrolement data for 2009\n", "Got enrolement data for 2010\n", "Got enrolement data for 2011\n", "Got enrolement data for 2012\n", "Got enrolement data for 2013\n", "Got enrolement data for 2014\n", "Got enrolement data for 2015\n", "Got enrolement data for 2016\n", "Got enrolement data for 2017\n" ] } ], "source": [ "def parse_enrolments_table(xls):\n", " join_n_strip_n_lower = lambda l: ' '.join(l).strip().lower()\n", " strip_n_lower = lambda s: s.strip().lower()\n", " unyearify = lambda s: int(s.replace('year ',''))\n", " \n", " if 'enrolments' in xls.sheet_names:\n", " df = pd.read_excel(xls, 'enrolments', header=None, skip_footer=5)\n", " h_range = 2 if isinstance(df.ix[3,0], int) else 3\n", " try:\n", " df.columns=df.ix[3].fillna('').apply(strip_n_lower).values\n", " df = df.drop(df.index[0:h_range+1]).reset_index(drop=True)\n", " df.dropna(how='all', inplace=True, axis=0)\n", " df['de ref'] = df['de ref'].astype(int)\n", " df.drop('schoolname',axis=1, inplace=True)\n", " df.drop('total pupils',axis=1, inplace=True)\n", " df.set_index('de ref', inplace=True)\n", " df.rename(columns=unyearify, inplace=True)\n", " df=df.astype(float)\n", " except TypeError as e:\n", " print(e)\n", " else:\n", " df=None\n", " return df\n", "\n", "dfs = {}\n", "for year, files in year_files.items():\n", " for file in files:\n", " if 'post' in file:\n", " xls = pd.ExcelFile(f'data/education-ni/{year}/{file}')\n", " df = parse_enrolments_table(xls)\n", " if df is not None:\n", " print(f'Got enrolement data for {year}')\n", " dfs[year]=df\n" ] }, { "cell_type": "code", "execution_count": 86, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:52.466173Z", "start_time": "2018-06-07T10:38:52.453566Z" } }, "outputs": [ { "data": { "text/plain": [ "\n", "Dimensions: 9 (items) x 232 (major_axis) x 8 (minor_axis)\n", "Items axis: 2009 to 2017\n", "Major_axis axis: 1210014 to 5420314\n", "Minor_axis axis: 8 to 15" ] }, "execution_count": 86, "metadata": {}, "output_type": "execute_result" } ], "source": [ "panel = pd.Panel(dfs)\n", "panel" ] }, { "cell_type": "code", "execution_count": 87, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:53.218395Z", "start_time": "2018-06-07T10:38:53.203711Z" } }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
200920102011201220132014201520162017
823116.023113.021770.021322.021418.021367.021792.022571.022817.0
923859.023403.022925.021928.021425.021481.021422.022284.022650.0
1022954.024155.023245.023101.021971.021527.021443.021864.022381.0
1123521.023277.024094.023524.023299.022092.021601.022118.022102.0
1223808.023656.022967.024027.023353.023166.021864.022091.022099.0
1314912.015652.015421.015892.016567.016208.015912.015667.015347.0
1412607.013097.013274.013482.013554.014174.013922.013818.013149.0
15100.0154.0154.0196.0201.0275.0365.00.00.0
\n", "
" ], "text/plain": [ " 2009 2010 2011 2012 2013 2014 2015 2016 \\\n", "8 23116.0 23113.0 21770.0 21322.0 21418.0 21367.0 21792.0 22571.0 \n", "9 23859.0 23403.0 22925.0 21928.0 21425.0 21481.0 21422.0 22284.0 \n", "10 22954.0 24155.0 23245.0 23101.0 21971.0 21527.0 21443.0 21864.0 \n", "11 23521.0 23277.0 24094.0 23524.0 23299.0 22092.0 21601.0 22118.0 \n", "12 23808.0 23656.0 22967.0 24027.0 23353.0 23166.0 21864.0 22091.0 \n", "13 14912.0 15652.0 15421.0 15892.0 16567.0 16208.0 15912.0 15667.0 \n", "14 12607.0 13097.0 13274.0 13482.0 13554.0 14174.0 13922.0 13818.0 \n", "15 100.0 154.0 154.0 196.0 201.0 275.0 365.0 0.0 \n", "\n", " 2017 \n", "8 22817.0 \n", "9 22650.0 \n", "10 22381.0 \n", "11 22102.0 \n", "12 22099.0 \n", "13 15347.0 \n", "14 13149.0 \n", "15 0.0 " ] }, "execution_count": 87, "metadata": {}, "output_type": "execute_result" } ], "source": [ "panel.sum(axis=1)\n" ] }, { "cell_type": "code", "execution_count": 88, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:54.215940Z", "start_time": "2018-06-07T10:38:53.918588Z" } }, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 88, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "sns.heatmap(panel.sum(axis=2))\n" ] }, { "cell_type": "code", "execution_count": 89, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:55.336585Z", "start_time": "2018-06-07T10:38:55.189210Z" } }, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 89, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "panel.sum().sum().plot()" ] }, { "cell_type": "markdown", "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:38:56.389044Z", "start_time": "2018-06-07T10:38:56.386530Z" } }, "source": [ "## Now to start bringing these together!\n", "\n" ] }, { "cell_type": "code", "execution_count": 91, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:39:03.162277Z", "start_time": "2018-06-07T10:39:02.461754Z" } }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Got enrolement data for 2009\n", "Got enrolement data for 2010\n", "Got enrolement data for 2011\n", "Got enrolement data for 2012\n", "Got enrolement data for 2013\n", "Got enrolement data for 2014\n", "Got enrolement data for 2015\n", "Got enrolement data for 2016\n", "Got enrolement data for 2017\n" ] } ], "source": [ "def parse_enrolments_table(xls):\n", " join_n_strip_n_lower = lambda l: ' '.join(l).strip().lower()\n", " strip_n_lower = lambda s: s.strip().lower()\n", " unyearify = lambda s: int(s.replace('year ',''))\n", " \n", " if 'enrolments' in xls.sheet_names:\n", " df = pd.read_excel(xls, 'enrolments', header=None, skip_footer=5)\n", " h_range = 2 if isinstance(df.ix[3,0], int) else 3\n", " try:\n", " df.columns=df.ix[3].fillna('').apply(strip_n_lower).values\n", " df = df.drop(df.index[0:h_range+1]).reset_index(drop=True)\n", " df.dropna(how='all', inplace=True, axis=0)\n", " df['de ref'] = df['de ref'].astype(int)\n", " df.drop('schoolname',axis=1, inplace=True)\n", " df.drop('total pupils',axis=1, inplace=True)\n", " df.set_index('de ref', inplace=True)\n", " df.rename(columns=unyearify, inplace=True)\n", " df=df.astype(float)\n", " except TypeError as e:\n", " print(e)\n", " else:\n", " df=None\n", " return df\n", "\n", "dfs = {}\n", "for year, files in year_files.items():\n", " for file in files:\n", " if 'post' in file:\n", " xls = pd.ExcelFile(f'data/education-ni/{year}/{file}')\n", " df = parse_enrolments_table(xls)\n", " if df is not None:\n", " print(f'Got enrolement data for {year}')\n", " dfs[year]=df\n", "enrolements = pd.Panel(dfs)" ] }, { "cell_type": "code", "execution_count": 92, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:39:05.953855Z", "start_time": "2018-06-07T10:39:04.638737Z" } }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Got reference data for 2009\n", "Got reference data for 2010\n", "Got reference data for 2011\n", "Got reference data for 2012\n", "Got reference data for 2013\n", "Got reference data for 2014\n", "Got reference data for 2015\n", "Got reference data for 2016\n", "Got reference data for 2017\n" ] } ], "source": [ "def parse_reference_table(xls):\n", " cols = [\n", " 'de ref',\n", " 'school name',\n", " 'school type',\n", " 'address 1',\n", " 'postcode',\n", " 'urban_rural',\n", " 'school management type',\n", " 'district council',\n", " 'parliamentary constituency',\n", " 'town'\n", " ]\n", " \n", " categories = [\n", " 'school type',\n", " 'urban_rural',\n", " 'school management type',\n", " 'district council',\n", " 'parliamentary constituency',\n", " 'town'\n", " ]\n", "\n", " ref_key_map={\n", " 'denino':'de ref',\n", " 'urban/ rural': 'urban_rural',\n", " 'schoolname': 'school name'\n", " }\n", " join_n_strip_n_lower = lambda l: ' '.join(l).strip().lower()\n", " \n", " if 'reference data' in xls.sheet_names:\n", " df = pd.read_excel(xls, 'reference data', header=None)\n", " h_range = 2 if isinstance(df.ix[3,0], int) else 3\n", " try:\n", " df.columns=df.ix[1:h_range].fillna('').apply(join_n_strip_n_lower, axis=0).values\n", " df.rename(columns=ref_key_map, inplace=True)\n", " df = df.drop(df.index[0:h_range+1]).reset_index(drop=True)\n", " df = df[cols]\n", " df['de ref'] = df['de ref'].astype(int)\n", " df.set_index('de ref', inplace=True)\n", " for c in df:\n", " df[c]=df[c].str.lower().str.strip()\n", " for c in categories:\n", " df[c] = df[c].astype('category')\n", " except TypeError as e:\n", " print(e)\n", " else:\n", " df=None\n", " return df\n", "\n", "dfs = {}\n", "for year, files in year_files.items():\n", " for file in files:\n", " if 'post' in file:\n", " xls = pd.ExcelFile(f'data/education-ni/{year}/{file}')\n", " df = parse_reference_table(xls)\n", " if df is not None:\n", " print(f'Got reference data for {year}')\n", " dfs[year]=df\n", "reference = pd.Panel(dfs)" ] }, { "cell_type": "code", "execution_count": 93, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:39:08.413228Z", "start_time": "2018-06-07T10:39:08.367923Z" } }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
200920102011201220132014201520162017
de refminor
1210014school nameashfield girls' high schoolashfield girls' high schoolashfield girls' high schoolashfield girls' high schoolashfield girls' high schoolashfield girls' high schoolashfield girls' high schoolashfield girls' high schoolashfield girls' high school
school typesecondarysecondarysecondarysecondarysecondarysecondarysecondarysecondarynon-grammar
address 1holywood roadholywood roadholywood roadholywood roadholywood roadholywood road397 holywood road397 holywood road397 holywood road
postcodebt4 2lybt42lybt42lybt42lybt42lybt42lybt4 2lybt42lybt42ly
urban_ruralurbanurbanurbanurbanurbanurbanurbanurbanurban
school management typecontrolledcontrolledcontrolledcontrolledcontrolledcontrolledcontrolledcontrolledcontrolled
district councilbelfastbelfastbelfastbelfastbelfastbelfastbelfastbelfastbelfast
parliamentary constituencybelfast eastbelfast eastbelfast eastbelfast eastbelfast eastbelfast eastbelfast eastbelfast eastbelfast east
townbelfastbelfastbelfastbelfastbelfastbelfastbelfastbelfastbelfast
1210015school nameashfield boys' high schoolashfield boys' high schoolashfield boys' high schoolashfield boys' high schoolashfield boys' high schoolashfield boys' high schoolashfield boys' high schoolashfield boys' high schoolashfield boys' high school
school typesecondarysecondarysecondarysecondarysecondarysecondarysecondarysecondarynon-grammar
address 1holywood roadholywood roadholywood roadholywood roadholywood roadholywood road395 holywood road395 holywood road395 holywood road
postcodebt4 2lybt42lybt42lybt42lybt42lybt42lybt4 2lybt42lybt42ly
urban_ruralurbanurbanurbanurbanurbanurbanurbanurbanurban
school management typecontrolledcontrolledcontrolledcontrolledcontrolledcontrolledcontrolledcontrolledcontrolled
district councilbelfastbelfastbelfastbelfastbelfastbelfastbelfastbelfastbelfast
parliamentary constituencybelfast eastbelfast eastbelfast eastbelfast eastbelfast eastbelfast eastbelfast eastbelfast eastbelfast east
townbelfastbelfastbelfastbelfastbelfastbelfastbelfastbelfastbelfast
1210021school namebelfast model school for girlsbelfast model school for girlsbelfast model school for girlsbelfast model school for girlsbelfast model school for girlsbelfast model school for girlsbelfast model school for girlsbelfast model school for girlsbelfast model school for girls
school typesecondarysecondarysecondarysecondarysecondarysecondarysecondarysecondarynon-grammar
address 1dunkeld gardensdunkeld gardensdunkeld gardensdunkeld gardensdunkeld gardensdunkeld gardens35 dunowen gardens35 dunowen gardens35 dunowen gardens
postcodebt14 6ntbt146ntbt146ntbt146ntbt146ntbt146ntbt14 6nqbt146nqbt146nq
urban_ruralurbanurbanurbanurbanurbanurbanurbanurbanurban
school management typecontrolledcontrolledcontrolledcontrolledcontrolledcontrolledcontrolledcontrolledcontrolled
district councilbelfastbelfastbelfastbelfastbelfastbelfastbelfastbelfastbelfast
parliamentary constituencybelfast northbelfast northbelfast northbelfast northbelfast northbelfast northbelfast northbelfast northbelfast north
townbelfastbelfastbelfastbelfastbelfastbelfastbelfastbelfastbelfast
1210022school namebelfast boys' model schoolbelfast boys' model schoolbelfast boys' model schoolbelfast boys' model schoolbelfast boys' model schoolbelfast boys' model schoolbelfast boys' model schoolbelfast boys' model schoolbelfast boys' model school
school typesecondarysecondarysecondarysecondarysecondarysecondarysecondarysecondarynon-grammar
address 1ballysillan roadballysillan roadballysillan roadballysillan roadballysillan roadballysillan roadballysillan roadballysillan roadballysillan road
.................................
5420260district councildungannondungannondungannondungannondungannondungannonmid ulstermid ulstermid ulster
parliamentary constituencyfermanagh and south tyronefermanagh and south tyronefermanagh and south tyronefermanagh and south tyronefermanagh and south tyronefermanagh and south tyronefermanagh and south tyronefermanagh and south tyronefermanagh and south tyrone
towndungannondungannondungannondungannondungannondungannondungannondungannondungannon
5420263school namethe royal school armaghthe royal school armaghthe royal school armaghthe royal school armaghthe royal school armaghthe royal school, armaghthe royal school, armaghthe royal school, armaghthe royal school, armagh
school typegrammargrammargrammargrammargrammargrammargrammargrammargrammar
address 1college hillcollege hillcollege hillcollege hillcollege hillcollege hillcollege hillcollege hillcollege hill
postcodebt61 9dhbt619dhbt619dhbt619dhbt619dhbt619dhbt61 9dhbt619dhbt619dh
urban_ruralurbanurbanurbanurbanurbanurbanurbanurbanurban
school management typevoluntaryvoluntaryvoluntary - other managedvoluntary - other managedvoluntary - other managedvoluntaryvoluntaryvoluntaryvoluntary
district councilarmagharmagharmagharmagharmagharmagharmagh city, banbridge and craigavonarmagh city, banbridge and craigavonarmagh city, banbridge and craigavon
parliamentary constituencynewry and armaghnewry and armaghnewry and armaghnewry and armaghnewry and armaghnewry and armaghnewry and armaghnewry and armaghnewry and armagh
townarmagharmagharmagharmagharmagharmagharmagharmagharmagh
5420268school namest patrick's grammar schoolst patrick's grammar schoolst patrick's grammar schoolst patrick's grammar schoolst patrick's grammar schoolst patrick's grammar school, armaghst patrick's grammar school, armaghst patrick's grammar school, armaghst patrick's grammar school, armagh
school typegrammargrammargrammargrammargrammargrammargrammargrammargrammar
address 1cathedral roadcathedral roadcathedral roadcathedral roadcathedral roadcathedral roadcathedral roadcathedral roadcathedral road
postcodebt61 7qzbt617qzbt617qzbt617qzbt617qzbt617qzbt61 7qzbt617qzbt617qz
urban_ruralurbanurbanurbanurbanurbanurbanurbanurbanurban
school management typevoluntaryvoluntaryvoluntary - rc managedvoluntary - rc managedvoluntary - rc managedvoluntaryvoluntaryvoluntaryvoluntary
district councilarmagharmagharmagharmagharmagharmagharmagh city, banbridge and craigavonarmagh city, banbridge and craigavonarmagh city, banbridge and craigavon
parliamentary constituencynewry and armaghnewry and armaghnewry and armaghnewry and armaghnewry and armaghnewry and armaghnewry and armaghnewry and armaghnewry and armagh
townarmagharmagharmagharmagharmagharmagharmagharmagharmagh
5420304school namest patrick's academyst patrick's academyst patrick's academyst patrick's academyst patrick's academyst patrick's academy, dungannonst patrick's academy, dungannonst patrick's academy, dungannonst patrick's academy, dungannon
school typegrammargrammargrammargrammargrammargrammargrammargrammargrammar
address 137 killymeal road37 killymeal road37 killymeal road37 killymeal road37 killymeal road37 killymeal road37 killymeal road37 killymeal road37 killymeal road
postcodebt71 6dsbt716dsbt716dsbt716dsbt716dsbt716dsbt71 6dsbt716dsbt716ds
urban_ruralurbanurbanurbanurbanurbanurbanurbanurbanurban
school management typevoluntaryvoluntaryvoluntary - rc managedvoluntary - rc managedvoluntary - rc managedvoluntaryvoluntaryvoluntaryvoluntary
district councildungannondungannondungannondungannondungannondungannonmid ulstermid ulstermid ulster
parliamentary constituencyfermanagh and south tyronefermanagh and south tyronefermanagh and south tyronefermanagh and south tyronefermanagh and south tyronefermanagh and south tyronefermanagh and south tyronefermanagh and south tyronefermanagh and south tyrone
towndungannondungannondungannondungannondungannondungannondungannondungannondungannon
\n", "

1673 rows × 9 columns

\n", "
" ], "text/plain": [ " 2009 \\\n", "de ref minor \n", "1210014 school name ashfield girls' high school \n", " school type secondary \n", " address 1 holywood road \n", " postcode bt4 2ly \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast east \n", " town belfast \n", "1210015 school name ashfield boys' high school \n", " school type secondary \n", " address 1 holywood road \n", " postcode bt4 2ly \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast east \n", " town belfast \n", "1210021 school name belfast model school for girls \n", " school type secondary \n", " address 1 dunkeld gardens \n", " postcode bt14 6nt \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast north \n", " town belfast \n", "1210022 school name belfast boys' model school \n", " school type secondary \n", " address 1 ballysillan road \n", "... ... \n", "5420260 district council dungannon \n", " parliamentary constituency fermanagh and south tyrone \n", " town dungannon \n", "5420263 school name the royal school armagh \n", " school type grammar \n", " address 1 college hill \n", " postcode bt61 9dh \n", " urban_rural urban \n", " school management type voluntary \n", " district council armagh \n", " parliamentary constituency newry and armagh \n", " town armagh \n", "5420268 school name st patrick's grammar school \n", " school type grammar \n", " address 1 cathedral road \n", " postcode bt61 7qz \n", " urban_rural urban \n", " school management type voluntary \n", " district council armagh \n", " parliamentary constituency newry and armagh \n", " town armagh \n", "5420304 school name st patrick's academy \n", " school type grammar \n", " address 1 37 killymeal road \n", " postcode bt71 6ds \n", " urban_rural urban \n", " school management type voluntary \n", " district council dungannon \n", " parliamentary constituency fermanagh and south tyrone \n", " town dungannon \n", "\n", " 2010 \\\n", "de ref minor \n", "1210014 school name ashfield girls' high school \n", " school type secondary \n", " address 1 holywood road \n", " postcode bt42ly \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast east \n", " town belfast \n", "1210015 school name ashfield boys' high school \n", " school type secondary \n", " address 1 holywood road \n", " postcode bt42ly \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast east \n", " town belfast \n", "1210021 school name belfast model school for girls \n", " school type secondary \n", " address 1 dunkeld gardens \n", " postcode bt146nt \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast north \n", " town belfast \n", "1210022 school name belfast boys' model school \n", " school type secondary \n", " address 1 ballysillan road \n", "... ... \n", "5420260 district council dungannon \n", " parliamentary constituency fermanagh and south tyrone \n", " town dungannon \n", "5420263 school name the royal school armagh \n", " school type grammar \n", " address 1 college hill \n", " postcode bt619dh \n", " urban_rural urban \n", " school management type voluntary \n", " district council armagh \n", " parliamentary constituency newry and armagh \n", " town armagh \n", "5420268 school name st patrick's grammar school \n", " school type grammar \n", " address 1 cathedral road \n", " postcode bt617qz \n", " urban_rural urban \n", " school management type voluntary \n", " district council armagh \n", " parliamentary constituency newry and armagh \n", " town armagh \n", "5420304 school name st patrick's academy \n", " school type grammar \n", " address 1 37 killymeal road \n", " postcode bt716ds \n", " urban_rural urban \n", " school management type voluntary \n", " district council dungannon \n", " parliamentary constituency fermanagh and south tyrone \n", " town dungannon \n", "\n", " 2011 \\\n", "de ref minor \n", "1210014 school name ashfield girls' high school \n", " school type secondary \n", " address 1 holywood road \n", " postcode bt42ly \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast east \n", " town belfast \n", "1210015 school name ashfield boys' high school \n", " school type secondary \n", " address 1 holywood road \n", " postcode bt42ly \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast east \n", " town belfast \n", "1210021 school name belfast model school for girls \n", " school type secondary \n", " address 1 dunkeld gardens \n", " postcode bt146nt \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast north \n", " town belfast \n", "1210022 school name belfast boys' model school \n", " school type secondary \n", " address 1 ballysillan road \n", "... ... \n", "5420260 district council dungannon \n", " parliamentary constituency fermanagh and south tyrone \n", " town dungannon \n", "5420263 school name the royal school armagh \n", " school type grammar \n", " address 1 college hill \n", " postcode bt619dh \n", " urban_rural urban \n", " school management type voluntary - other managed \n", " district council armagh \n", " parliamentary constituency newry and armagh \n", " town armagh \n", "5420268 school name st patrick's grammar school \n", " school type grammar \n", " address 1 cathedral road \n", " postcode bt617qz \n", " urban_rural urban \n", " school management type voluntary - rc managed \n", " district council armagh \n", " parliamentary constituency newry and armagh \n", " town armagh \n", "5420304 school name st patrick's academy \n", " school type grammar \n", " address 1 37 killymeal road \n", " postcode bt716ds \n", " urban_rural urban \n", " school management type voluntary - rc managed \n", " district council dungannon \n", " parliamentary constituency fermanagh and south tyrone \n", " town dungannon \n", "\n", " 2012 \\\n", "de ref minor \n", "1210014 school name ashfield girls' high school \n", " school type secondary \n", " address 1 holywood road \n", " postcode bt42ly \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast east \n", " town belfast \n", "1210015 school name ashfield boys' high school \n", " school type secondary \n", " address 1 holywood road \n", " postcode bt42ly \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast east \n", " town belfast \n", "1210021 school name belfast model school for girls \n", " school type secondary \n", " address 1 dunkeld gardens \n", " postcode bt146nt \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast north \n", " town belfast \n", "1210022 school name belfast boys' model school \n", " school type secondary \n", " address 1 ballysillan road \n", "... ... \n", "5420260 district council dungannon \n", " parliamentary constituency fermanagh and south tyrone \n", " town dungannon \n", "5420263 school name the royal school armagh \n", " school type grammar \n", " address 1 college hill \n", " postcode bt619dh \n", " urban_rural urban \n", " school management type voluntary - other managed \n", " district council armagh \n", " parliamentary constituency newry and armagh \n", " town armagh \n", "5420268 school name st patrick's grammar school \n", " school type grammar \n", " address 1 cathedral road \n", " postcode bt617qz \n", " urban_rural urban \n", " school management type voluntary - rc managed \n", " district council armagh \n", " parliamentary constituency newry and armagh \n", " town armagh \n", "5420304 school name st patrick's academy \n", " school type grammar \n", " address 1 37 killymeal road \n", " postcode bt716ds \n", " urban_rural urban \n", " school management type voluntary - rc managed \n", " district council dungannon \n", " parliamentary constituency fermanagh and south tyrone \n", " town dungannon \n", "\n", " 2013 \\\n", "de ref minor \n", "1210014 school name ashfield girls' high school \n", " school type secondary \n", " address 1 holywood road \n", " postcode bt42ly \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast east \n", " town belfast \n", "1210015 school name ashfield boys' high school \n", " school type secondary \n", " address 1 holywood road \n", " postcode bt42ly \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast east \n", " town belfast \n", "1210021 school name belfast model school for girls \n", " school type secondary \n", " address 1 dunkeld gardens \n", " postcode bt146nt \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast north \n", " town belfast \n", "1210022 school name belfast boys' model school \n", " school type secondary \n", " address 1 ballysillan road \n", "... ... \n", "5420260 district council dungannon \n", " parliamentary constituency fermanagh and south tyrone \n", " town dungannon \n", "5420263 school name the royal school armagh \n", " school type grammar \n", " address 1 college hill \n", " postcode bt619dh \n", " urban_rural urban \n", " school management type voluntary - other managed \n", " district council armagh \n", " parliamentary constituency newry and armagh \n", " town armagh \n", "5420268 school name st patrick's grammar school \n", " school type grammar \n", " address 1 cathedral road \n", " postcode bt617qz \n", " urban_rural urban \n", " school management type voluntary - rc managed \n", " district council armagh \n", " parliamentary constituency newry and armagh \n", " town armagh \n", "5420304 school name st patrick's academy \n", " school type grammar \n", " address 1 37 killymeal road \n", " postcode bt716ds \n", " urban_rural urban \n", " school management type voluntary - rc managed \n", " district council dungannon \n", " parliamentary constituency fermanagh and south tyrone \n", " town dungannon \n", "\n", " 2014 \\\n", "de ref minor \n", "1210014 school name ashfield girls' high school \n", " school type secondary \n", " address 1 holywood road \n", " postcode bt42ly \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast east \n", " town belfast \n", "1210015 school name ashfield boys' high school \n", " school type secondary \n", " address 1 holywood road \n", " postcode bt42ly \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast east \n", " town belfast \n", "1210021 school name belfast model school for girls \n", " school type secondary \n", " address 1 dunkeld gardens \n", " postcode bt146nt \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast north \n", " town belfast \n", "1210022 school name belfast boys' model school \n", " school type secondary \n", " address 1 ballysillan road \n", "... ... \n", "5420260 district council dungannon \n", " parliamentary constituency fermanagh and south tyrone \n", " town dungannon \n", "5420263 school name the royal school, armagh \n", " school type grammar \n", " address 1 college hill \n", " postcode bt619dh \n", " urban_rural urban \n", " school management type voluntary \n", " district council armagh \n", " parliamentary constituency newry and armagh \n", " town armagh \n", "5420268 school name st patrick's grammar school, armagh \n", " school type grammar \n", " address 1 cathedral road \n", " postcode bt617qz \n", " urban_rural urban \n", " school management type voluntary \n", " district council armagh \n", " parliamentary constituency newry and armagh \n", " town armagh \n", "5420304 school name st patrick's academy, dungannon \n", " school type grammar \n", " address 1 37 killymeal road \n", " postcode bt716ds \n", " urban_rural urban \n", " school management type voluntary \n", " district council dungannon \n", " parliamentary constituency fermanagh and south tyrone \n", " town dungannon \n", "\n", " 2015 \\\n", "de ref minor \n", "1210014 school name ashfield girls' high school \n", " school type secondary \n", " address 1 397 holywood road \n", " postcode bt4 2ly \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast east \n", " town belfast \n", "1210015 school name ashfield boys' high school \n", " school type secondary \n", " address 1 395 holywood road \n", " postcode bt4 2ly \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast east \n", " town belfast \n", "1210021 school name belfast model school for girls \n", " school type secondary \n", " address 1 35 dunowen gardens \n", " postcode bt14 6nq \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast north \n", " town belfast \n", "1210022 school name belfast boys' model school \n", " school type secondary \n", " address 1 ballysillan road \n", "... ... \n", "5420260 district council mid ulster \n", " parliamentary constituency fermanagh and south tyrone \n", " town dungannon \n", "5420263 school name the royal school, armagh \n", " school type grammar \n", " address 1 college hill \n", " postcode bt61 9dh \n", " urban_rural urban \n", " school management type voluntary \n", " district council armagh city, banbridge and craigavon \n", " parliamentary constituency newry and armagh \n", " town armagh \n", "5420268 school name st patrick's grammar school, armagh \n", " school type grammar \n", " address 1 cathedral road \n", " postcode bt61 7qz \n", " urban_rural urban \n", " school management type voluntary \n", " district council armagh city, banbridge and craigavon \n", " parliamentary constituency newry and armagh \n", " town armagh \n", "5420304 school name st patrick's academy, dungannon \n", " school type grammar \n", " address 1 37 killymeal road \n", " postcode bt71 6ds \n", " urban_rural urban \n", " school management type voluntary \n", " district council mid ulster \n", " parliamentary constituency fermanagh and south tyrone \n", " town dungannon \n", "\n", " 2016 \\\n", "de ref minor \n", "1210014 school name ashfield girls' high school \n", " school type secondary \n", " address 1 397 holywood road \n", " postcode bt42ly \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast east \n", " town belfast \n", "1210015 school name ashfield boys' high school \n", " school type secondary \n", " address 1 395 holywood road \n", " postcode bt42ly \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast east \n", " town belfast \n", "1210021 school name belfast model school for girls \n", " school type secondary \n", " address 1 35 dunowen gardens \n", " postcode bt146nq \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast north \n", " town belfast \n", "1210022 school name belfast boys' model school \n", " school type secondary \n", " address 1 ballysillan road \n", "... ... \n", "5420260 district council mid ulster \n", " parliamentary constituency fermanagh and south tyrone \n", " town dungannon \n", "5420263 school name the royal school, armagh \n", " school type grammar \n", " address 1 college hill \n", " postcode bt619dh \n", " urban_rural urban \n", " school management type voluntary \n", " district council armagh city, banbridge and craigavon \n", " parliamentary constituency newry and armagh \n", " town armagh \n", "5420268 school name st patrick's grammar school, armagh \n", " school type grammar \n", " address 1 cathedral road \n", " postcode bt617qz \n", " urban_rural urban \n", " school management type voluntary \n", " district council armagh city, banbridge and craigavon \n", " parliamentary constituency newry and armagh \n", " town armagh \n", "5420304 school name st patrick's academy, dungannon \n", " school type grammar \n", " address 1 37 killymeal road \n", " postcode bt716ds \n", " urban_rural urban \n", " school management type voluntary \n", " district council mid ulster \n", " parliamentary constituency fermanagh and south tyrone \n", " town dungannon \n", "\n", " 2017 \n", "de ref minor \n", "1210014 school name ashfield girls' high school \n", " school type non-grammar \n", " address 1 397 holywood road \n", " postcode bt42ly \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast east \n", " town belfast \n", "1210015 school name ashfield boys' high school \n", " school type non-grammar \n", " address 1 395 holywood road \n", " postcode bt42ly \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast east \n", " town belfast \n", "1210021 school name belfast model school for girls \n", " school type non-grammar \n", " address 1 35 dunowen gardens \n", " postcode bt146nq \n", " urban_rural urban \n", " school management type controlled \n", " district council belfast \n", " parliamentary constituency belfast north \n", " town belfast \n", "1210022 school name belfast boys' model school \n", " school type non-grammar \n", " address 1 ballysillan road \n", "... ... \n", "5420260 district council mid ulster \n", " parliamentary constituency fermanagh and south tyrone \n", " town dungannon \n", "5420263 school name the royal school, armagh \n", " school type grammar \n", " address 1 college hill \n", " postcode bt619dh \n", " urban_rural urban \n", " school management type voluntary \n", " district council armagh city, banbridge and craigavon \n", " parliamentary constituency newry and armagh \n", " town armagh \n", "5420268 school name st patrick's grammar school, armagh \n", " school type grammar \n", " address 1 cathedral road \n", " postcode bt617qz \n", " urban_rural urban \n", " school management type voluntary \n", " district council armagh city, banbridge and craigavon \n", " parliamentary constituency newry and armagh \n", " town armagh \n", "5420304 school name st patrick's academy, dungannon \n", " school type grammar \n", " address 1 37 killymeal road \n", " postcode bt716ds \n", " urban_rural urban \n", " school management type voluntary \n", " district council mid ulster \n", " parliamentary constituency fermanagh and south tyrone \n", " town dungannon \n", "\n", "[1673 rows x 9 columns]" ] }, "execution_count": 93, "metadata": {}, "output_type": "execute_result" } ], "source": [ "reference.to_frame()" ] }, { "cell_type": "code", "execution_count": 94, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:39:09.561567Z", "start_time": "2018-06-07T10:39:09.318581Z" } }, "outputs": [ { "data": { "text/plain": [ "de ref minor \n", "1210014 school name False\n", " school type True\n", " address 1 True\n", " postcode True\n", " urban_rural False\n", " school management type False\n", " district council False\n", " parliamentary constituency False\n", " town False\n", "1210015 school name False\n", " school type True\n", " address 1 True\n", " postcode True\n", " urban_rural False\n", " school management type False\n", " district council False\n", " parliamentary constituency False\n", " town False\n", "1210021 school name False\n", " school type True\n", " address 1 True\n", " postcode True\n", " urban_rural False\n", " school management type False\n", " district council False\n", " parliamentary constituency False\n", " town False\n", "1210022 school name False\n", " school type True\n", " address 1 False\n", " ... \n", "5420260 district council True\n", " parliamentary constituency False\n", " town False\n", "5420263 school name True\n", " school type False\n", " address 1 False\n", " postcode True\n", " urban_rural False\n", " school management type True\n", " district council True\n", " parliamentary constituency False\n", " town False\n", "5420268 school name True\n", " school type False\n", " address 1 False\n", " postcode True\n", " urban_rural False\n", " school management type True\n", " district council True\n", " parliamentary constituency False\n", " town False\n", "5420304 school name True\n", " school type False\n", " address 1 False\n", " postcode True\n", " urban_rural False\n", " school management type True\n", " district council True\n", " parliamentary constituency False\n", " town False\n", "Length: 1673, dtype: bool" ] }, "execution_count": 94, "metadata": {}, "output_type": "execute_result" } ], "source": [ "reference.to_frame().apply(pd.Series.nunique, axis=1)!=1" ] }, { "cell_type": "code", "execution_count": 95, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:39:14.189085Z", "start_time": "2018-06-07T10:39:13.924233Z" } }, "outputs": [ { "data": { "text/plain": [ "minor\n", "school name 252.0\n", "school type 311.0\n", "address 1 241.0\n", "postcode 408.0\n", "urban_rural 195.0\n", "school management type 364.0\n", "district council 365.0\n", "parliamentary constituency 198.0\n", "town 187.0\n", "dtype: float64" ] }, "execution_count": 95, "metadata": {}, "output_type": "execute_result" } ], "source": [ "reference.to_frame().apply(pd.Series.nunique, axis=1).unstack('minor').sum()" ] }, { "cell_type": "code", "execution_count": 96, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:39:14.615892Z", "start_time": "2018-06-07T10:39:14.346792Z" } }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
200920102011201220132014201520162017
de refminor
1210014school typesecondarysecondarysecondarysecondarysecondarysecondarysecondarysecondarynon-grammar
address 1holywood roadholywood roadholywood roadholywood roadholywood roadholywood road397 holywood road397 holywood road397 holywood road
postcodebt4 2lybt42lybt42lybt42lybt42lybt42lybt4 2lybt42lybt42ly
1210015school typesecondarysecondarysecondarysecondarysecondarysecondarysecondarysecondarynon-grammar
address 1holywood roadholywood roadholywood roadholywood roadholywood roadholywood road395 holywood road395 holywood road395 holywood road
postcodebt4 2lybt42lybt42lybt42lybt42lybt42lybt4 2lybt42lybt42ly
1210021school typesecondarysecondarysecondarysecondarysecondarysecondarysecondarysecondarynon-grammar
address 1dunkeld gardensdunkeld gardensdunkeld gardensdunkeld gardensdunkeld gardensdunkeld gardens35 dunowen gardens35 dunowen gardens35 dunowen gardens
postcodebt14 6ntbt146ntbt146ntbt146ntbt146ntbt146ntbt14 6nqbt146nqbt146nq
1210022school typesecondarysecondarysecondarysecondarysecondarysecondarysecondarysecondarynon-grammar
postcodebt14 6rbbt146rbbt146rbbt146rbbt146rbbt146rbbt14 6rbbt146rbbt146rb
1230053school typesecondarysecondarysecondarysecondarysecondarysecondarysecondarysecondarynon-grammar
postcodebt12 6enbt126enbt126enbt126enbt126enbt126enbt12 6enbt126enbt126en
school management typerc maintainedroman catholic maintainedrc maintainedrc maintainedrc maintainedcatholic maintainedcatholic maintainedcatholic maintainedcatholic maintained
1230104school nameour lady of mercy girls' schoolour lady of mercy girls' schoolour lady of mercy girls' schoolour lady of mercy girls' schoolour lady of mercy girls' schoolmercy collegemercy collegemercy collegemercy college belfast
school typesecondarysecondarysecondarysecondarysecondarysecondarysecondarysecondarynon-grammar
postcodebt14 7qrbt147qrbt147qrbt147qrbt147qrbt147qrbt14 7qrbt147qrbt147qr
school management typerc maintainedroman catholic maintainedrc maintainedrc maintainedrc maintainedcatholic maintainedcatholic maintainedcatholic maintainedcatholic maintained
1230130school namest rose's high schoolst rose's high schoolst rose's high schoolst rose's high schoolst rose's high schoolst rose’s dominican collegest rose’s dominican collegest rose’s dominican collegest rose’s dominican college
school typesecondarysecondarysecondarysecondarysecondarysecondarysecondarysecondarynon-grammar
address 1beechmount avenuebeechmount avenuebeechmount avenuebeechmount avenuebeechmount avenuebeechmount avenue65 beechmount avenue65 beechmount avenue65 beechmount avenue
postcodebt12 7nabt127nabt127nabt127nabt127nabt127nabt12 7nabt127nabt127na
school management typerc maintainedroman catholic maintainedrc maintainedrc maintainedrc maintainedcatholic maintainedcatholic maintainedcatholic maintainedcatholic maintained
1230146school namechristian brothers schoolchristian brothers schoolchristian brothers schoolchristian brothers schoolchristian brothers schoolchristian brothers school, belfastchristian brothers school, belfastchristian brothers school, belfastchristian brothers school, belfast
school typesecondarysecondarysecondarysecondarysecondarysecondarysecondarysecondarynon-grammar
postcodebt11 8bwbt118bwbt118bwbt118bwbt118bwbt118bwbt11 8bwbt118bwbt118bw
school management typerc maintainedroman catholic maintainedrc maintainedrc maintainedrc maintainedcatholic maintainedcatholic maintainedcatholic maintainedcatholic maintained
1230155school typesecondarysecondarysecondarysecondarysecondarysecondarysecondarysecondarynon-grammar
postcodebt11 9jpbt119jpbt119jpbt119jpbt119jpbt119jpbt11 9jpbt119jpbt119jp
school management typerc maintainedroman catholic maintainedrc maintainedrc maintainedrc maintainedcatholic maintainedcatholic maintainedcatholic maintainedcatholic maintained
.................................
5420062school namest colman's collegest colman's collegest colman's collegest colman's collegest colman's collegest colman's college, newryst colman's college, newryst colman's college, newryst colman's college, newry
postcodebt35 6ppbt356ppbt356ppbt356ppbt356ppbt356ppbt35 6ppbt356ppbt356pp
school management typevoluntaryvoluntaryvoluntary - rc managedvoluntary - rc managedvoluntary - rc managedvoluntaryvoluntaryvoluntaryvoluntary
district councilnewry & mournenewry & mournenewry and mournenewry and mournenewry and mournenewry and mournenewry mourne and downnewry mourne and downnewry mourne and down
5420073school namest joseph's grammar schoolst joseph's grammar schoolst joseph's grammar schoolst joseph's grammar schoolst joseph's grammar schoolst joseph's convent grammar school, donaghmorest joseph's convent grammar school, donaghmorest joseph's convent grammar school, donaghmorest joseph's convent grammar school, donaghmore
postcodebt70 3hebt703hebt703hebt703hebt703hebt703hebt70 3hebt703hebt703he
school management typevoluntaryvoluntaryvoluntary - rc managedvoluntary - rc managedvoluntary - rc managedvoluntaryvoluntaryvoluntaryvoluntary
district councildungannondungannondungannondungannondungannondungannonmid ulstermid ulstermid ulster
5420076school namesacred heart grammar schoolsacred heart grammar schoolsacred heart grammar schoolsacred heart grammar schoolsacred heart grammar schoolsacred heart grammar school, newrysacred heart grammar school, newrysacred heart grammar school, newrysacred heart grammar school, newry
postcodebt34 1prbt341prbt341prbt341prbt341prbt341prbt34 1prbt341prbt341pr
school management typevoluntaryvoluntaryvoluntary - rc managedvoluntary - rc managedvoluntary - rc managedvoluntaryvoluntaryvoluntaryvoluntary
district councilnewry & mournenewry & mournenewry and mournenewry and mournenewry and mournenewry and mournenewry mourne and downnewry mourne and downnewry mourne and down
parliamentary constituencynewry and armaghnewry and armaghsouth downsouth downsouth downsouth downsouth downsouth downsouth down
5420260school namethe royal school dungannonthe royal school dungannonthe royal school dungannonthe royal school dungannonthe royal school dungannonthe royal school, dungannonthe royal school, dungannonthe royal school, dungannonthe royal school, dungannon
address 11 ranfurley road1 ranfurley road1 ranfurley road1 ranfurley road1 ranfurley road1 ranfurley road2 ranfurley road2 ranfurley road2 ranfurley road
postcodebt71 6apbt716apbt716apbt716apbt716apbt716apbt71 6apbt716apbt716ap
school management typevoluntaryvoluntaryvoluntary - other managedvoluntary - other managedvoluntary - other managedvoluntaryvoluntaryvoluntaryvoluntary
district councildungannondungannondungannondungannondungannondungannonmid ulstermid ulstermid ulster
5420263school namethe royal school armaghthe royal school armaghthe royal school armaghthe royal school armaghthe royal school armaghthe royal school, armaghthe royal school, armaghthe royal school, armaghthe royal school, armagh
postcodebt61 9dhbt619dhbt619dhbt619dhbt619dhbt619dhbt61 9dhbt619dhbt619dh
school management typevoluntaryvoluntaryvoluntary - other managedvoluntary - other managedvoluntary - other managedvoluntaryvoluntaryvoluntaryvoluntary
district councilarmagharmagharmagharmagharmagharmagharmagh city, banbridge and craigavonarmagh city, banbridge and craigavonarmagh city, banbridge and craigavon
5420268school namest patrick's grammar schoolst patrick's grammar schoolst patrick's grammar schoolst patrick's grammar schoolst patrick's grammar schoolst patrick's grammar school, armaghst patrick's grammar school, armaghst patrick's grammar school, armaghst patrick's grammar school, armagh
postcodebt61 7qzbt617qzbt617qzbt617qzbt617qzbt617qzbt61 7qzbt617qzbt617qz
school management typevoluntaryvoluntaryvoluntary - rc managedvoluntary - rc managedvoluntary - rc managedvoluntaryvoluntaryvoluntaryvoluntary
district councilarmagharmagharmagharmagharmagharmagharmagh city, banbridge and craigavonarmagh city, banbridge and craigavonarmagh city, banbridge and craigavon
5420304school namest patrick's academyst patrick's academyst patrick's academyst patrick's academyst patrick's academyst patrick's academy, dungannonst patrick's academy, dungannonst patrick's academy, dungannonst patrick's academy, dungannon
postcodebt71 6dsbt716dsbt716dsbt716dsbt716dsbt716dsbt71 6dsbt716dsbt716ds
school management typevoluntaryvoluntaryvoluntary - rc managedvoluntary - rc managedvoluntary - rc managedvoluntaryvoluntaryvoluntaryvoluntary
district councildungannondungannondungannondungannondungannondungannonmid ulstermid ulstermid ulster
\n", "

723 rows × 9 columns

\n", "
" ], "text/plain": [ " 2009 \\\n", "de ref minor \n", "1210014 school type secondary \n", " address 1 holywood road \n", " postcode bt4 2ly \n", "1210015 school type secondary \n", " address 1 holywood road \n", " postcode bt4 2ly \n", "1210021 school type secondary \n", " address 1 dunkeld gardens \n", " postcode bt14 6nt \n", "1210022 school type secondary \n", " postcode bt14 6rb \n", "1230053 school type secondary \n", " postcode bt12 6en \n", " school management type rc maintained \n", "1230104 school name our lady of mercy girls' school \n", " school type secondary \n", " postcode bt14 7qr \n", " school management type rc maintained \n", "1230130 school name st rose's high school \n", " school type secondary \n", " address 1 beechmount avenue \n", " postcode bt12 7na \n", " school management type rc maintained \n", "1230146 school name christian brothers school \n", " school type secondary \n", " postcode bt11 8bw \n", " school management type rc maintained \n", "1230155 school type secondary \n", " postcode bt11 9jp \n", " school management type rc maintained \n", "... ... \n", "5420062 school name st colman's college \n", " postcode bt35 6pp \n", " school management type voluntary \n", " district council newry & mourne \n", "5420073 school name st joseph's grammar school \n", " postcode bt70 3he \n", " school management type voluntary \n", " district council dungannon \n", "5420076 school name sacred heart grammar school \n", " postcode bt34 1pr \n", " school management type voluntary \n", " district council newry & mourne \n", " parliamentary constituency newry and armagh \n", "5420260 school name the royal school dungannon \n", " address 1 1 ranfurley road \n", " postcode bt71 6ap \n", " school management type voluntary \n", " district council dungannon \n", "5420263 school name the royal school armagh \n", " postcode bt61 9dh \n", " school management type voluntary \n", " district council armagh \n", "5420268 school name st patrick's grammar school \n", " postcode bt61 7qz \n", " school management type voluntary \n", " district council armagh \n", "5420304 school name st patrick's academy \n", " postcode bt71 6ds \n", " school management type voluntary \n", " district council dungannon \n", "\n", " 2010 \\\n", "de ref minor \n", "1210014 school type secondary \n", " address 1 holywood road \n", " postcode bt42ly \n", "1210015 school type secondary \n", " address 1 holywood road \n", " postcode bt42ly \n", "1210021 school type secondary \n", " address 1 dunkeld gardens \n", " postcode bt146nt \n", "1210022 school type secondary \n", " postcode bt146rb \n", "1230053 school type secondary \n", " postcode bt126en \n", " school management type roman catholic maintained \n", "1230104 school name our lady of mercy girls' school \n", " school type secondary \n", " postcode bt147qr \n", " school management type roman catholic maintained \n", "1230130 school name st rose's high school \n", " school type secondary \n", " address 1 beechmount avenue \n", " postcode bt127na \n", " school management type roman catholic maintained \n", "1230146 school name christian brothers school \n", " school type secondary \n", " postcode bt118bw \n", " school management type roman catholic maintained \n", "1230155 school type secondary \n", " postcode bt119jp \n", " school management type roman catholic maintained \n", "... ... \n", "5420062 school name st colman's college \n", " postcode bt356pp \n", " school management type voluntary \n", " district council newry & mourne \n", "5420073 school name st joseph's grammar school \n", " postcode bt703he \n", " school management type voluntary \n", " district council dungannon \n", "5420076 school name sacred heart grammar school \n", " postcode bt341pr \n", " school management type voluntary \n", " district council newry & mourne \n", " parliamentary constituency newry and armagh \n", "5420260 school name the royal school dungannon \n", " address 1 1 ranfurley road \n", " postcode bt716ap \n", " school management type voluntary \n", " district council dungannon \n", "5420263 school name the royal school armagh \n", " postcode bt619dh \n", " school management type voluntary \n", " district council armagh \n", "5420268 school name st patrick's grammar school \n", " postcode bt617qz \n", " school management type voluntary \n", " district council armagh \n", "5420304 school name st patrick's academy \n", " postcode bt716ds \n", " school management type voluntary \n", " district council dungannon \n", "\n", " 2011 \\\n", "de ref minor \n", "1210014 school type secondary \n", " address 1 holywood road \n", " postcode bt42ly \n", "1210015 school type secondary \n", " address 1 holywood road \n", " postcode bt42ly \n", "1210021 school type secondary \n", " address 1 dunkeld gardens \n", " postcode bt146nt \n", "1210022 school type secondary \n", " postcode bt146rb \n", "1230053 school type secondary \n", " postcode bt126en \n", " school management type rc maintained \n", "1230104 school name our lady of mercy girls' school \n", " school type secondary \n", " postcode bt147qr \n", " school management type rc maintained \n", "1230130 school name st rose's high school \n", " school type secondary \n", " address 1 beechmount avenue \n", " postcode bt127na \n", " school management type rc maintained \n", "1230146 school name christian brothers school \n", " school type secondary \n", " postcode bt118bw \n", " school management type rc maintained \n", "1230155 school type secondary \n", " postcode bt119jp \n", " school management type rc maintained \n", "... ... \n", "5420062 school name st colman's college \n", " postcode bt356pp \n", " school management type voluntary - rc managed \n", " district council newry and mourne \n", "5420073 school name st joseph's grammar school \n", " postcode bt703he \n", " school management type voluntary - rc managed \n", " district council dungannon \n", "5420076 school name sacred heart grammar school \n", " postcode bt341pr \n", " school management type voluntary - rc managed \n", " district council newry and mourne \n", " parliamentary constituency south down \n", "5420260 school name the royal school dungannon \n", " address 1 1 ranfurley road \n", " postcode bt716ap \n", " school management type voluntary - other managed \n", " district council dungannon \n", "5420263 school name the royal school armagh \n", " postcode bt619dh \n", " school management type voluntary - other managed \n", " district council armagh \n", "5420268 school name st patrick's grammar school \n", " postcode bt617qz \n", " school management type voluntary - rc managed \n", " district council armagh \n", "5420304 school name st patrick's academy \n", " postcode bt716ds \n", " school management type voluntary - rc managed \n", " district council dungannon \n", "\n", " 2012 \\\n", "de ref minor \n", "1210014 school type secondary \n", " address 1 holywood road \n", " postcode bt42ly \n", "1210015 school type secondary \n", " address 1 holywood road \n", " postcode bt42ly \n", "1210021 school type secondary \n", " address 1 dunkeld gardens \n", " postcode bt146nt \n", "1210022 school type secondary \n", " postcode bt146rb \n", "1230053 school type secondary \n", " postcode bt126en \n", " school management type rc maintained \n", "1230104 school name our lady of mercy girls' school \n", " school type secondary \n", " postcode bt147qr \n", " school management type rc maintained \n", "1230130 school name st rose's high school \n", " school type secondary \n", " address 1 beechmount avenue \n", " postcode bt127na \n", " school management type rc maintained \n", "1230146 school name christian brothers school \n", " school type secondary \n", " postcode bt118bw \n", " school management type rc maintained \n", "1230155 school type secondary \n", " postcode bt119jp \n", " school management type rc maintained \n", "... ... \n", "5420062 school name st colman's college \n", " postcode bt356pp \n", " school management type voluntary - rc managed \n", " district council newry and mourne \n", "5420073 school name st joseph's grammar school \n", " postcode bt703he \n", " school management type voluntary - rc managed \n", " district council dungannon \n", "5420076 school name sacred heart grammar school \n", " postcode bt341pr \n", " school management type voluntary - rc managed \n", " district council newry and mourne \n", " parliamentary constituency south down \n", "5420260 school name the royal school dungannon \n", " address 1 1 ranfurley road \n", " postcode bt716ap \n", " school management type voluntary - other managed \n", " district council dungannon \n", "5420263 school name the royal school armagh \n", " postcode bt619dh \n", " school management type voluntary - other managed \n", " district council armagh \n", "5420268 school name st patrick's grammar school \n", " postcode bt617qz \n", " school management type voluntary - rc managed \n", " district council armagh \n", "5420304 school name st patrick's academy \n", " postcode bt716ds \n", " school management type voluntary - rc managed \n", " district council dungannon \n", "\n", " 2013 \\\n", "de ref minor \n", "1210014 school type secondary \n", " address 1 holywood road \n", " postcode bt42ly \n", "1210015 school type secondary \n", " address 1 holywood road \n", " postcode bt42ly \n", "1210021 school type secondary \n", " address 1 dunkeld gardens \n", " postcode bt146nt \n", "1210022 school type secondary \n", " postcode bt146rb \n", "1230053 school type secondary \n", " postcode bt126en \n", " school management type rc maintained \n", "1230104 school name our lady of mercy girls' school \n", " school type secondary \n", " postcode bt147qr \n", " school management type rc maintained \n", "1230130 school name st rose's high school \n", " school type secondary \n", " address 1 beechmount avenue \n", " postcode bt127na \n", " school management type rc maintained \n", "1230146 school name christian brothers school \n", " school type secondary \n", " postcode bt118bw \n", " school management type rc maintained \n", "1230155 school type secondary \n", " postcode bt119jp \n", " school management type rc maintained \n", "... ... \n", "5420062 school name st colman's college \n", " postcode bt356pp \n", " school management type voluntary - rc managed \n", " district council newry and mourne \n", "5420073 school name st joseph's grammar school \n", " postcode bt703he \n", " school management type voluntary - rc managed \n", " district council dungannon \n", "5420076 school name sacred heart grammar school \n", " postcode bt341pr \n", " school management type voluntary - rc managed \n", " district council newry and mourne \n", " parliamentary constituency south down \n", "5420260 school name the royal school dungannon \n", " address 1 1 ranfurley road \n", " postcode bt716ap \n", " school management type voluntary - other managed \n", " district council dungannon \n", "5420263 school name the royal school armagh \n", " postcode bt619dh \n", " school management type voluntary - other managed \n", " district council armagh \n", "5420268 school name st patrick's grammar school \n", " postcode bt617qz \n", " school management type voluntary - rc managed \n", " district council armagh \n", "5420304 school name st patrick's academy \n", " postcode bt716ds \n", " school management type voluntary - rc managed \n", " district council dungannon \n", "\n", " 2014 \\\n", "de ref minor \n", "1210014 school type secondary \n", " address 1 holywood road \n", " postcode bt42ly \n", "1210015 school type secondary \n", " address 1 holywood road \n", " postcode bt42ly \n", "1210021 school type secondary \n", " address 1 dunkeld gardens \n", " postcode bt146nt \n", "1210022 school type secondary \n", " postcode bt146rb \n", "1230053 school type secondary \n", " postcode bt126en \n", " school management type catholic maintained \n", "1230104 school name mercy college \n", " school type secondary \n", " postcode bt147qr \n", " school management type catholic maintained \n", "1230130 school name st rose’s dominican college \n", " school type secondary \n", " address 1 beechmount avenue \n", " postcode bt127na \n", " school management type catholic maintained \n", "1230146 school name christian brothers school, belfast \n", " school type secondary \n", " postcode bt118bw \n", " school management type catholic maintained \n", "1230155 school type secondary \n", " postcode bt119jp \n", " school management type catholic maintained \n", "... ... \n", "5420062 school name st colman's college, newry \n", " postcode bt356pp \n", " school management type voluntary \n", " district council newry and mourne \n", "5420073 school name st joseph's convent grammar school, donaghmore \n", " postcode bt703he \n", " school management type voluntary \n", " district council dungannon \n", "5420076 school name sacred heart grammar school, newry \n", " postcode bt341pr \n", " school management type voluntary \n", " district council newry and mourne \n", " parliamentary constituency south down \n", "5420260 school name the royal school, dungannon \n", " address 1 1 ranfurley road \n", " postcode bt716ap \n", " school management type voluntary \n", " district council dungannon \n", "5420263 school name the royal school, armagh \n", " postcode bt619dh \n", " school management type voluntary \n", " district council armagh \n", "5420268 school name st patrick's grammar school, armagh \n", " postcode bt617qz \n", " school management type voluntary \n", " district council armagh \n", "5420304 school name st patrick's academy, dungannon \n", " postcode bt716ds \n", " school management type voluntary \n", " district council dungannon \n", "\n", " 2015 \\\n", "de ref minor \n", "1210014 school type secondary \n", " address 1 397 holywood road \n", " postcode bt4 2ly \n", "1210015 school type secondary \n", " address 1 395 holywood road \n", " postcode bt4 2ly \n", "1210021 school type secondary \n", " address 1 35 dunowen gardens \n", " postcode bt14 6nq \n", "1210022 school type secondary \n", " postcode bt14 6rb \n", "1230053 school type secondary \n", " postcode bt12 6en \n", " school management type catholic maintained \n", "1230104 school name mercy college \n", " school type secondary \n", " postcode bt14 7qr \n", " school management type catholic maintained \n", "1230130 school name st rose’s dominican college \n", " school type secondary \n", " address 1 65 beechmount avenue \n", " postcode bt12 7na \n", " school management type catholic maintained \n", "1230146 school name christian brothers school, belfast \n", " school type secondary \n", " postcode bt11 8bw \n", " school management type catholic maintained \n", "1230155 school type secondary \n", " postcode bt11 9jp \n", " school management type catholic maintained \n", "... ... \n", "5420062 school name st colman's college, newry \n", " postcode bt35 6pp \n", " school management type voluntary \n", " district council newry mourne and down \n", "5420073 school name st joseph's convent grammar school, donaghmore \n", " postcode bt70 3he \n", " school management type voluntary \n", " district council mid ulster \n", "5420076 school name sacred heart grammar school, newry \n", " postcode bt34 1pr \n", " school management type voluntary \n", " district council newry mourne and down \n", " parliamentary constituency south down \n", "5420260 school name the royal school, dungannon \n", " address 1 2 ranfurley road \n", " postcode bt71 6ap \n", " school management type voluntary \n", " district council mid ulster \n", "5420263 school name the royal school, armagh \n", " postcode bt61 9dh \n", " school management type voluntary \n", " district council armagh city, banbridge and craigavon \n", "5420268 school name st patrick's grammar school, armagh \n", " postcode bt61 7qz \n", " school management type voluntary \n", " district council armagh city, banbridge and craigavon \n", "5420304 school name st patrick's academy, dungannon \n", " postcode bt71 6ds \n", " school management type voluntary \n", " district council mid ulster \n", "\n", " 2016 \\\n", "de ref minor \n", "1210014 school type secondary \n", " address 1 397 holywood road \n", " postcode bt42ly \n", "1210015 school type secondary \n", " address 1 395 holywood road \n", " postcode bt42ly \n", "1210021 school type secondary \n", " address 1 35 dunowen gardens \n", " postcode bt146nq \n", "1210022 school type secondary \n", " postcode bt146rb \n", "1230053 school type secondary \n", " postcode bt126en \n", " school management type catholic maintained \n", "1230104 school name mercy college \n", " school type secondary \n", " postcode bt147qr \n", " school management type catholic maintained \n", "1230130 school name st rose’s dominican college \n", " school type secondary \n", " address 1 65 beechmount avenue \n", " postcode bt127na \n", " school management type catholic maintained \n", "1230146 school name christian brothers school, belfast \n", " school type secondary \n", " postcode bt118bw \n", " school management type catholic maintained \n", "1230155 school type secondary \n", " postcode bt119jp \n", " school management type catholic maintained \n", "... ... \n", "5420062 school name st colman's college, newry \n", " postcode bt356pp \n", " school management type voluntary \n", " district council newry mourne and down \n", "5420073 school name st joseph's convent grammar school, donaghmore \n", " postcode bt703he \n", " school management type voluntary \n", " district council mid ulster \n", "5420076 school name sacred heart grammar school, newry \n", " postcode bt341pr \n", " school management type voluntary \n", " district council newry mourne and down \n", " parliamentary constituency south down \n", "5420260 school name the royal school, dungannon \n", " address 1 2 ranfurley road \n", " postcode bt716ap \n", " school management type voluntary \n", " district council mid ulster \n", "5420263 school name the royal school, armagh \n", " postcode bt619dh \n", " school management type voluntary \n", " district council armagh city, banbridge and craigavon \n", "5420268 school name st patrick's grammar school, armagh \n", " postcode bt617qz \n", " school management type voluntary \n", " district council armagh city, banbridge and craigavon \n", "5420304 school name st patrick's academy, dungannon \n", " postcode bt716ds \n", " school management type voluntary \n", " district council mid ulster \n", "\n", " 2017 \n", "de ref minor \n", "1210014 school type non-grammar \n", " address 1 397 holywood road \n", " postcode bt42ly \n", "1210015 school type non-grammar \n", " address 1 395 holywood road \n", " postcode bt42ly \n", "1210021 school type non-grammar \n", " address 1 35 dunowen gardens \n", " postcode bt146nq \n", "1210022 school type non-grammar \n", " postcode bt146rb \n", "1230053 school type non-grammar \n", " postcode bt126en \n", " school management type catholic maintained \n", "1230104 school name mercy college belfast \n", " school type non-grammar \n", " postcode bt147qr \n", " school management type catholic maintained \n", "1230130 school name st rose’s dominican college \n", " school type non-grammar \n", " address 1 65 beechmount avenue \n", " postcode bt127na \n", " school management type catholic maintained \n", "1230146 school name christian brothers school, belfast \n", " school type non-grammar \n", " postcode bt118bw \n", " school management type catholic maintained \n", "1230155 school type non-grammar \n", " postcode bt119jp \n", " school management type catholic maintained \n", "... ... \n", "5420062 school name st colman's college, newry \n", " postcode bt356pp \n", " school management type voluntary \n", " district council newry mourne and down \n", "5420073 school name st joseph's convent grammar school, donaghmore \n", " postcode bt703he \n", " school management type voluntary \n", " district council mid ulster \n", "5420076 school name sacred heart grammar school, newry \n", " postcode bt341pr \n", " school management type voluntary \n", " district council newry mourne and down \n", " parliamentary constituency south down \n", "5420260 school name the royal school, dungannon \n", " address 1 2 ranfurley road \n", " postcode bt716ap \n", " school management type voluntary \n", " district council mid ulster \n", "5420263 school name the royal school, armagh \n", " postcode bt619dh \n", " school management type voluntary \n", " district council armagh city, banbridge and craigavon \n", "5420268 school name st patrick's grammar school, armagh \n", " postcode bt617qz \n", " school management type voluntary \n", " district council armagh city, banbridge and craigavon \n", "5420304 school name st patrick's academy, dungannon \n", " postcode bt716ds \n", " school management type voluntary \n", " district council mid ulster \n", "\n", "[723 rows x 9 columns]" ] }, "execution_count": 96, "metadata": {}, "output_type": "execute_result" } ], "source": [ "reference.to_frame()[reference.to_frame().apply(pd.Series.nunique, axis=1)!=1]" ] }, { "cell_type": "code", "execution_count": 97, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:39:15.036158Z", "start_time": "2018-06-07T10:39:15.030307Z" }, "scrolled": true }, "outputs": [ { "data": { "text/plain": [ "Counter({'catholic maintained': 258,\n", " 'controlled': 628,\n", " 'controlled integrated': 45,\n", " 'gmi': 120,\n", " 'grant maintained integrated': 15,\n", " nan: 201,\n", " 'other maintained': 12,\n", " 'rc maintained': 282,\n", " 'roman catholic maintained': 71,\n", " 'voluntary': 303,\n", " 'voluntary - other managed': 66,\n", " 'voluntary - rc managed': 87})" ] }, "execution_count": 97, "metadata": {}, "output_type": "execute_result" } ], "source": [ "from collections import Counter\n", "Counter(reference[:,:,'school management type'].values.ravel('k'))" ] }, { "cell_type": "code", "execution_count": 98, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:39:19.901133Z", "start_time": "2018-06-07T10:39:19.897349Z" } }, "outputs": [], "source": [ "reference_value_rename = {\n", " 'school management type':{\n", " 'controlled integrated':'integrated',\n", " 'roman catholic maintained':'rc maintained',\n", " 'grant maintained integrated':'gmi',\n", " 'voluntary - other managed':'other maintained',\n", " 'voluntary - rc managed':'rc maintained',\n", " 'catholic maintained':'rc maintained'\n", " }\n", "}" ] }, { "cell_type": "code", "execution_count": 99, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:39:22.743993Z", "start_time": "2018-06-07T10:39:21.417598Z" }, "code_folding": [] }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Got reference data for 2009\n", "Got reference data for 2010\n", "Got reference data for 2011\n", "Got reference data for 2012\n", "Got reference data for 2013\n", "Got reference data for 2014\n", "Got reference data for 2015\n", "Got reference data for 2016\n", "Got reference data for 2017\n" ] } ], "source": [ "\n", "import numpy as np\n", "def parse_reference_table(xls):\n", " cols = [\n", " 'de ref',\n", " 'school name',\n", " 'school type',\n", " 'address 1',\n", " 'postcode',\n", " 'urban_rural',\n", " 'school management type',\n", " 'district council',\n", " 'parliamentary constituency',\n", " 'town'\n", " ]\n", " \n", " categories = [\n", " 'school type',\n", " 'urban_rural',\n", " 'school management type',\n", " 'district council',\n", " 'parliamentary constituency',\n", " 'town'\n", " ]\n", "\n", " ref_key_map={\n", " 'denino':'de ref',\n", " 'urban/ rural': 'urban_rural',\n", " 'schoolname': 'school name'\n", " }\n", " \n", " reference_value_rename = {\n", " 'school management type':{\n", " 'gmi':'integrated',\n", " 'controlled integrated':'integrated',\n", " 'roman catholic maintained':'rc maintained',\n", " 'grant maintained integrated':'integrated',\n", " 'voluntary - other managed':'voluntary',\n", " 'voluntary - rc managed':'voluntary',\n", " 'catholic maintained':'rc maintained'\n", " }\n", " }\n", " join_n_strip_n_lower = lambda l: ' '.join(l).strip().lower()\n", " \n", " if 'reference data' in xls.sheet_names:\n", " df = pd.read_excel(xls, 'reference data', header=None)\n", " h_range = 2 if isinstance(df.ix[3,0], int) else 3\n", " try:\n", " df.columns=df.ix[1:h_range].fillna('').apply(join_n_strip_n_lower, axis=0).values\n", " df.rename(columns=ref_key_map, inplace=True)\n", " df = df.drop(df.index[0:h_range+1]).reset_index(drop=True)\n", " df = df[cols]\n", " df['de ref'] = df['de ref'].astype(int)\n", " df.set_index('de ref', inplace=True)\n", " for c in df:\n", " df[c]=df[c].str.lower().str.strip() \n", " df.replace(reference_value_rename, inplace=True)\n", " for c in categories:\n", " df[c].fillna('NA', inplace=True)\n", " df[c] = df[c].astype('category')\n", " except TypeError as e:\n", " print(e)\n", " else:\n", " df=None\n", " return df\n", "\n", "dfs = {}\n", "for year, files in year_files.items():\n", " for file in files:\n", " if 'post' in file:\n", " xls = pd.ExcelFile(f'data/education-ni/{year}/{file}')\n", " df = parse_reference_table(xls)\n", " if df is not None:\n", " print(f'Got reference data for {year}')\n", " dfs[year]=df\n", "reference = pd.Panel(dfs)" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## Parse Available" ] }, { "cell_type": "code", "execution_count": 203, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T13:31:25.360872Z", "start_time": "2018-06-07T13:31:24.310106Z" } }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Got available data for 2010\n", "Got available data for 2011\n", "Got available data for 2012\n", "Got available data for 2013\n", "Got available data for 2014\n", "Got available data for 2015\n", "Got available data for 2016\n", "Got available data for 2017\n" ] }, { "data": { "text/plain": [ "\n", "Dimensions: 8 (items) x 229 (major_axis) x 5 (minor_axis)\n", "Items axis: 2010 to 2017\n", "Major_axis axis: 1210014 to 5420314\n", "Minor_axis axis: actual enrolments to supernumerary pupils" ] }, "execution_count": 203, "metadata": {}, "output_type": "execute_result" } ], "source": [ "\"\"\"School level data\"\"\"\n", "\n", "def parse_available_table(xls):\n", " ref_key_map={\n", " 'schoolname': 'school name',\n", " 'total unfilled places': 'available places',\n", " 'unfilled places': 'available places',\n", " 'total approved enrolment number': 'approved enrolments'\n", " }\n", " \n", " join_n_strip_n_lower = lambda l: ' '.join(l).strip().lower()\n", " \n", " if 'School level data' in xls.sheet_names:\n", " df = pd.read_excel(xls, 'School level data', header=None)\n", " h_range = 2 if isinstance(df.ix[3,0], int) else 3\n", " elif 'unfilled places' in xls.sheet_names:\n", " df = pd.read_excel(xls, 'unfilled places', header=None)\n", " h_range = 2 if isinstance(df.ix[3,0], int) else 3\n", " else:\n", " df=None\n", " \n", " if df is not None:\n", " try:\n", " df.columns=df.ix[1:h_range].fillna('').apply(join_n_strip_n_lower, axis=0).values\n", " df.rename(columns=ref_key_map, inplace=True)\n", " df = df.drop(df.index[0:h_range+1]).reset_index(drop=True)\n", " df=df.applymap(lambda x: np.nan if isinstance(x, str) and x.isspace() else x)\n", " df.dropna(how='all', axis=1, inplace=True)\n", " df.dropna(how='any', axis=0, inplace=True)\n", " if df.shape[1] == 6: # recent doesn't have fecking headers\n", " cols = list(df.columns)\n", " cols[0] = 'de ref'\n", " cols[1] = 'school name'\n", " df.columns=cols\n", " df.drop('school name', axis=1, inplace=True)\n", " df['de ref'] = df['de ref'].astype(int)\n", " df.set_index('de ref', inplace=True)\n", " df.replace('*',2.0, inplace=True) # * == < 5\n", " df.replace('!',1, inplace=True) # ! avoid identification, so it's prob one or two\n", " df.dropna(how='all', inplace=True, axis=1)\n", " df.astype(int, inplace=True)\n", " \n", "\n", " \n", " except TypeError as e:\n", " print(e)\n", "\n", " return df\n", "dfs={}\n", "for year, files in year_files.items():\n", " for file in files:\n", " if 'post' in file:\n", " xls = pd.ExcelFile(f'data/education-ni/{year}/{file}')\n", " df = parse_available_table(xls)\n", " if df is not None:\n", " print(f'Got available data for {year}')\n", " dfs[year]=df\n", " \n", "available = pd.Panel(dfs)\n", "available" ] }, { "cell_type": "code", "execution_count": 205, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T13:31:32.471950Z", "start_time": "2018-06-07T13:31:32.441846Z" } }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
actual enrolmentsapproved admissionsapproved enrolmentsavailable placessupernumerary pupils
de ref
1210014NaNNaN660.00.0NaN
1210015NaNNaN600.00.0NaN
1210021NaNNaN950.056.0NaN
1210022NaNNaN905.012.0NaN
1210266NaNNaN548.02.0NaN
1230026NaNNaN780.0111.0NaN
1230053NaNNaN2280.0787.0NaN
1230089NaNNaN650.00.0NaN
1230104NaNNaN650.0238.0NaN
1230130NaNNaN575.0237.0NaN
1230146NaNNaN750.0305.0NaN
1230155NaNNaN1000.00.0NaN
1230173NaNNaNNaNNaNNaN
1230182NaNNaN1025.09.0NaN
1230262NaNNaN600.0232.0NaN
1230275NaNNaN664.0143.0NaN
1230321NaNNaNNaNNaNNaN
1240291NaNNaN600.060.0NaN
1260269NaNNaN850.014.0NaN
1260294NaNNaN800.0189.0NaN
1410079NaNNaN1075.00.0NaN
1410270NaNNaN770.00.0NaN
1410315NaNNaNNaNNaNNaN
1420018NaNNaN710.02.0NaN
1420020NaNNaN950.073.0NaN
1420021NaNNaN1180.00.0NaN
1420022NaNNaN1810.074.0NaN
1420027NaNNaN1050.032.0NaN
1420028NaNNaN1410.019.0NaN
1420029NaNNaN966.00.0NaN
..................
5230152NaNNaN760.00.0NaN
5230157NaNNaN1355.00.0NaN
5230160NaNNaN450.0291.0NaN
5230167NaNNaN600.017.0NaN
5230187NaNNaN1000.037.0NaN
5230192NaNNaN680.0403.0NaN
5230213NaNNaN1200.088.0NaN
5230218NaNNaN1029.00.0NaN
5230256NaNNaN800.0646.0NaN
5230278NaNNaN960.043.0NaN
5230293NaNNaN575.00.0NaN
5230321NaNNaNNaNNaNNaN
5250216NaNNaN450.0149.0NaN
5260285NaNNaN500.00.0NaN
5260286NaNNaN500.00.0NaN
5410013NaNNaN1320.05.0NaN
5410057NaNNaN440.02.0NaN
5410067NaNNaN780.00.0NaN
5420045NaNNaN570.00.0NaN
5420056NaNNaN570.00.0NaN
5420059NaNNaN850.00.0NaN
5420060NaNNaN860.08.0NaN
5420062NaNNaN860.00.0NaN
5420073NaNNaN575.00.0NaN
5420076NaNNaN875.025.0NaN
5420260NaNNaN650.05.0NaN
5420263NaNNaN650.00.0NaN
5420268NaNNaN750.00.0NaN
5420304NaNNaN1400.031.0NaN
5420314NaNNaNNaNNaNNaN
\n", "

229 rows × 5 columns

\n", "
" ], "text/plain": [ " actual enrolments approved admissions approved enrolments \\\n", "de ref \n", "1210014 NaN NaN 660.0 \n", "1210015 NaN NaN 600.0 \n", "1210021 NaN NaN 950.0 \n", "1210022 NaN NaN 905.0 \n", "1210266 NaN NaN 548.0 \n", "1230026 NaN NaN 780.0 \n", "1230053 NaN NaN 2280.0 \n", "1230089 NaN NaN 650.0 \n", "1230104 NaN NaN 650.0 \n", "1230130 NaN NaN 575.0 \n", "1230146 NaN NaN 750.0 \n", "1230155 NaN NaN 1000.0 \n", "1230173 NaN NaN NaN \n", "1230182 NaN NaN 1025.0 \n", "1230262 NaN NaN 600.0 \n", "1230275 NaN NaN 664.0 \n", "1230321 NaN NaN NaN \n", "1240291 NaN NaN 600.0 \n", "1260269 NaN NaN 850.0 \n", "1260294 NaN NaN 800.0 \n", "1410079 NaN NaN 1075.0 \n", "1410270 NaN NaN 770.0 \n", "1410315 NaN NaN NaN \n", "1420018 NaN NaN 710.0 \n", "1420020 NaN NaN 950.0 \n", "1420021 NaN NaN 1180.0 \n", "1420022 NaN NaN 1810.0 \n", "1420027 NaN NaN 1050.0 \n", "1420028 NaN NaN 1410.0 \n", "1420029 NaN NaN 966.0 \n", "... ... ... ... \n", "5230152 NaN NaN 760.0 \n", "5230157 NaN NaN 1355.0 \n", "5230160 NaN NaN 450.0 \n", "5230167 NaN NaN 600.0 \n", "5230187 NaN NaN 1000.0 \n", "5230192 NaN NaN 680.0 \n", "5230213 NaN NaN 1200.0 \n", "5230218 NaN NaN 1029.0 \n", "5230256 NaN NaN 800.0 \n", "5230278 NaN NaN 960.0 \n", "5230293 NaN NaN 575.0 \n", "5230321 NaN NaN NaN \n", "5250216 NaN NaN 450.0 \n", "5260285 NaN NaN 500.0 \n", "5260286 NaN NaN 500.0 \n", "5410013 NaN NaN 1320.0 \n", "5410057 NaN NaN 440.0 \n", "5410067 NaN NaN 780.0 \n", "5420045 NaN NaN 570.0 \n", "5420056 NaN NaN 570.0 \n", "5420059 NaN NaN 850.0 \n", "5420060 NaN NaN 860.0 \n", "5420062 NaN NaN 860.0 \n", "5420073 NaN NaN 575.0 \n", "5420076 NaN NaN 875.0 \n", "5420260 NaN NaN 650.0 \n", "5420263 NaN NaN 650.0 \n", "5420268 NaN NaN 750.0 \n", "5420304 NaN NaN 1400.0 \n", "5420314 NaN NaN NaN \n", "\n", " available places supernumerary pupils \n", "de ref \n", "1210014 0.0 NaN \n", "1210015 0.0 NaN \n", "1210021 56.0 NaN \n", "1210022 12.0 NaN \n", "1210266 2.0 NaN \n", "1230026 111.0 NaN \n", "1230053 787.0 NaN \n", "1230089 0.0 NaN \n", "1230104 238.0 NaN \n", "1230130 237.0 NaN \n", "1230146 305.0 NaN \n", "1230155 0.0 NaN \n", "1230173 NaN NaN \n", "1230182 9.0 NaN \n", "1230262 232.0 NaN \n", "1230275 143.0 NaN \n", "1230321 NaN NaN \n", "1240291 60.0 NaN \n", "1260269 14.0 NaN \n", "1260294 189.0 NaN \n", "1410079 0.0 NaN \n", "1410270 0.0 NaN \n", "1410315 NaN NaN \n", "1420018 2.0 NaN \n", "1420020 73.0 NaN \n", "1420021 0.0 NaN \n", "1420022 74.0 NaN \n", "1420027 32.0 NaN \n", "1420028 19.0 NaN \n", "1420029 0.0 NaN \n", "... ... ... \n", "5230152 0.0 NaN \n", "5230157 0.0 NaN \n", "5230160 291.0 NaN \n", "5230167 17.0 NaN \n", "5230187 37.0 NaN \n", "5230192 403.0 NaN \n", "5230213 88.0 NaN \n", "5230218 0.0 NaN \n", "5230256 646.0 NaN \n", "5230278 43.0 NaN \n", "5230293 0.0 NaN \n", "5230321 NaN NaN \n", "5250216 149.0 NaN \n", "5260285 0.0 NaN \n", "5260286 0.0 NaN \n", "5410013 5.0 NaN \n", "5410057 2.0 NaN \n", "5410067 0.0 NaN \n", "5420045 0.0 NaN \n", "5420056 0.0 NaN \n", "5420059 0.0 NaN \n", "5420060 8.0 NaN \n", "5420062 0.0 NaN \n", "5420073 0.0 NaN \n", "5420076 25.0 NaN \n", "5420260 5.0 NaN \n", "5420263 0.0 NaN \n", "5420268 0.0 NaN \n", "5420304 31.0 NaN \n", "5420314 NaN NaN \n", "\n", "[229 rows x 5 columns]" ] }, "execution_count": 205, "metadata": {}, "output_type": "execute_result" } ], "source": [ "available[2013]" ] }, { "cell_type": "code", "execution_count": 200, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T13:30:34.788395Z", "start_time": "2018-06-07T13:30:34.564355Z" } }, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 200, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "all_ = set([_ for df in dfs.values() for _ in df.keys()])\n", "df = pd.DataFrame.from_dict({\n", " year: [sn in these_ for sn in all_] \n", " for year, these_ in dfs.items()\n", "}, orient='index')\n", "df.columns=all_\n", "sns.heatmap(df.T)" ] }, { "cell_type": "code", "execution_count": 201, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T13:30:34.985452Z", "start_time": "2018-06-07T13:30:34.981525Z" } }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "2010:(217, 2):approved enrolments,available places\n", "2011:(216, 2):approved enrolments,available places\n", "2012:(215, 2):available places,approved enrolments\n", "2013:(210, 2):available places,approved enrolments\n", "2014:(208, 1):available places\n", "2015:(202, 3):approved admissions,approved enrolments,available places\n", "2016:(201, 4):approved enrolments,actual enrolments,supernumerary pupils,available places\n", "2017:(199, 4):approved enrolments,actual enrolments,supernumerary pupils,available places\n" ] } ], "source": [ "for year,df in dfs.items():\n", " print(f\"{year}:{df.shape}:{','.join(df.keys())}\")" ] }, { "cell_type": "code", "execution_count": 178, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T11:28:49.631140Z", "start_time": "2018-06-07T11:28:49.624851Z" } }, "outputs": [ { "data": { "text/plain": [ "Counter({'actual enrolments': 2,\n", " 'approved admissions': 1,\n", " 'approved enrolments': 7,\n", " 'available places': 8,\n", " 'supernumerary pupils': 2})" ] }, "execution_count": 178, "metadata": {}, "output_type": "execute_result" } ], "source": [ "Counter([_ for df in dfs.values() for _ in df.keys()])" ] }, { "cell_type": "code", "execution_count": 179, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T11:28:59.421960Z", "start_time": "2018-06-07T11:28:59.417040Z" } }, "outputs": [ { "data": { "text/plain": [ "approved enrolments float64\n", "actual enrolments float64\n", "supernumerary pupils float64\n", "available places float64\n", "dtype: object" ] }, "execution_count": 179, "metadata": {}, "output_type": "execute_result" } ], "source": [ "dfs[2017].dtypes" ] }, { "cell_type": "code", "execution_count": 186, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T11:30:08.689101Z", "start_time": "2018-06-07T11:30:08.678874Z" } }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
approved enrolmentsavailable places
2010159503.017780.0
2011159793.019473.0
2012158906.020256.0
2013156996.019599.0
20140.021151.0
2015153916.020186.0
2016154131.020946.0
2017154098.021022.0
\n", "
" ], "text/plain": [ " approved enrolments available places\n", "2010 159503.0 17780.0\n", "2011 159793.0 19473.0\n", "2012 158906.0 20256.0\n", "2013 156996.0 19599.0\n", "2014 0.0 21151.0\n", "2015 153916.0 20186.0\n", "2016 154131.0 20946.0\n", "2017 154098.0 21022.0" ] }, "execution_count": 186, "metadata": {}, "output_type": "execute_result" } ], "source": [ "available.sum().ix[['approved enrolments','available places']].T" ] }, { "cell_type": "markdown", "metadata": { "ExecuteTime": { "end_time": "2018-06-07T11:22:55.956810Z", "start_time": "2018-06-07T11:22:55.826546Z" } }, "source": [ "![](img/starman.png)" ] }, { "cell_type": "code", "execution_count": 19, "metadata": { "ExecuteTime": { "end_time": "2018-06-08T11:43:11.883408Z", "start_time": "2018-06-08T11:43:11.072285Z" } }, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "/Users/andrew.bolster/anaconda3/lib/python3.6/site-packages/ipykernel/__main__.py:29: DeprecationWarning: \n", ".ix is deprecated. Please use\n", ".loc for label based indexing or\n", ".iloc for positional indexing\n", "\n", "See the documentation here:\n", "http://pandas.pydata.org/pandas-docs/stable/indexing.html#ix-indexer-is-deprecated\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "Got fsm data for 2009\n", "Got fsm data for 2010\n", "Got fsm data for 2011\n", "Got fsm data for 2012\n", "Got fsm data for 2013\n", "Got fsm data for 2014\n", "Got fsm data for 2015\n", "Got fsm data for 2016\n", "Got fsm data for 2017\n" ] } ], "source": [ "from collections import defaultdict\n", "import numpy as np\n", "from pathlib import Path\n", "import pandas as pd\n", "\n", "## Initialisation and re-walking already extracted\n", "## Datasets.\n", "\n", "year_files = defaultdict(list)\n", "dest = Path('./data/education-ni/')\n", "for year_p in dest.iterdir():\n", " try:\n", " year=int(year_p.parts[-1])\n", " for file in year_p.iterdir():\n", " year_files[year].append(file.parts[-1])\n", " except ValueError:\n", " pass\n", " \n", "year_files = dict(sorted(year_files.items()))\n", "year_files\n", "\n", "def parse_fsm_table(xls):\n", " join_n_strip_n_lower = lambda l: ' '.join(l).strip().lower()\n", " strip_n_lower = lambda s: s.strip().lower()\n", " unyearify = lambda s: int(s.replace('year ',''))\n", " \n", " if 'free school meals' in xls.sheet_names:\n", " df = pd.read_excel(xls, 'free school meals', header=None, skip_footer=5)\n", " h_range = 2 if isinstance(df.ix[3,0], int) else 3\n", " try:\n", " df.columns=df.ix[3].fillna('').apply(strip_n_lower).values\n", " df = df.drop(df.index[0:h_range+1]).reset_index(drop=True)\n", " df.dropna(how='all', inplace=True, axis=0)\n", " df['de ref'] = df['de ref'].astype(int)\n", " df.drop('schoolname',axis=1, inplace=True)\n", " df.drop('free school meals', axis=1, inplace=True)\n", " df.set_index('de ref', inplace=True)\n", " df.replace('#',pd.np.nan, inplace=True) # # = Undisclosed\n", " df.replace('*',2.0, inplace=True) # * == < 5\n", " df.replace('!',1, inplace=True) # ! avoid identification, so it's prob one or two\n", " \n", " df=df.astype(float)\n", " except TypeError as e:\n", " print(e)\n", " else:\n", " df=None\n", " return df\n", "\n", "dfs = {}\n", "for year, files in year_files.items():\n", " for file in files:\n", " if 'post' in file:\n", " xls = pd.ExcelFile(f'data/education-ni/{year}/{file}')\n", " df = parse_fsm_table(xls)\n", " if df is not None:\n", " print(f'Got fsm data for {year}')\n", " dfs[year]=df\n", "fsm = pd.Panel(dfs)" ] }, { "cell_type": "code", "execution_count": 17, "metadata": { "ExecuteTime": { "end_time": "2018-06-08T11:41:44.452740Z", "start_time": "2018-06-08T11:41:44.413255Z" } }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
200920102011201220132014201520162017
de refminor
1210014pupils672.000000688.000000703.000000708.000000704.000000697.000000704.000000696.000000691.000000
fsme132.000000153.000000170.000000183.000000171.000000241.000000277.000000301.000000310.000000
free school meals0.1964290.2223840.2418210.2584750.2428980.3457680.3934660.4324710.448625
1210015pupils647.000000650.000000649.000000666.000000709.000000737.000000744.000000728.000000740.000000
fsme127.000000141.000000157.000000177.000000173.000000270.000000312.000000332.000000326.000000
free school meals0.1962910.2169230.2419110.2657660.2440060.3663500.4193550.4560440.440541
1210021pupils963.000000929.000000899.000000930.000000916.000000884.000000910.000000954.000000946.000000
fsme376.000000359.000000367.000000379.000000368.000000452.000000522.000000572.000000580.000000
free school meals0.3904470.3864370.4082310.4075270.4017470.5113120.5736260.5995810.613108
1210022pupils907.000000932.000000913.000000930.000000943.000000969.000000968.000000991.000000997.000000
fsme363.000000392.000000384.000000390.000000380.000000522.000000548.000000575.000000588.000000
free school meals0.4002210.4206010.4205910.4193550.4029690.5387000.5661160.5802220.589769
1230053pupils1547.0000001530.0000001530.0000001521.0000001516.0000001518.0000001474.0000001420.0000001435.000000
fsme546.000000551.000000578.000000618.000000563.000000821.000000834.000000847.000000860.000000
free school meals0.3529410.3601310.3777780.4063120.3713720.5408430.5658070.5964790.599303
1230104pupils438.000000429.000000384.000000367.000000423.000000433.000000446.000000452.000000450.000000
fsme184.000000188.000000184.000000192.000000217.000000337.000000333.000000323.000000315.000000
free school meals0.4200910.4382280.4791670.5231610.5130020.7782910.7466370.7146020.700000
1230130pupils468.000000440.000000406.000000388.000000352.000000316.000000273.000000240.000000243.000000
fsme272.000000244.000000239.000000214.000000183.000000217.000000187.000000171.000000166.000000
free school meals0.5811970.5545450.5886700.5515460.5198860.6867090.6849820.7125000.683128
1230146pupils508.000000513.000000528.000000529.000000490.000000490.000000498.000000500.000000525.000000
fsme242.000000237.000000245.000000286.000000236.000000270.000000317.000000326.000000329.000000
free school meals0.4763780.4619880.4640150.5406430.4816330.5510200.6365460.6520000.626667
1230155pupils1011.0000001027.0000001043.0000001069.0000001078.0000001061.0000001070.0000001059.0000001022.000000
fsme327.000000349.000000401.000000417.000000409.000000539.000000584.000000591.000000559.000000
free school meals0.3234420.3398250.3844680.3900840.3794060.5080110.5457940.5580740.546967
1230182pupils1116.0000001088.0000001088.0000001098.0000001093.0000001116.0000001117.0000001104.000000958.000000
fsme348.000000348.000000359.000000386.000000345.000000535.000000562.000000588.000000508.000000
free school meals0.3118280.3198530.3299630.3515480.3156450.4793910.5031330.5326090.530271
.................................
5410013pupils1311.0000001325.0000001324.0000001331.0000001327.0000001324.0000001320.0000001312.0000001301.000000
fsme38.00000046.00000048.00000056.00000048.00000067.00000076.00000083.00000086.000000
free school meals0.0289860.0347170.0362540.0420740.0361720.0506040.0575760.0632620.066103
5410057pupils432.000000438.000000455.000000457.000000451.000000453.000000455.000000451.000000455.000000
fsme20.00000027.00000024.00000021.00000025.00000037.00000038.00000041.00000050.000000
free school meals0.0462960.0616440.0527470.0459520.0554320.0816780.0835160.0909090.109890
5410067pupils789.000000788.000000780.000000778.000000798.000000791.000000788.000000778.000000744.000000
fsme27.00000035.00000031.00000034.00000037.00000046.00000058.00000073.00000064.000000
free school meals0.0342210.0444160.0397440.0437020.0463660.0581540.0736040.0938300.086022
5420045pupils586.000000587.000000585.000000587.000000586.000000591.000000588.000000564.000000564.000000
fsme76.00000079.00000071.00000085.00000073.000000135.000000131.000000131.000000126.000000
free school meals0.1296930.1345830.1213680.1448040.1245730.2284260.2227890.2322700.223404
5420059pupils880.000000887.000000894.000000907.000000900.000000911.000000902.000000882.000000885.000000
fsme77.00000088.00000085.00000087.00000084.000000141.000000155.000000149.000000125.000000
free school meals0.0875000.0992110.0950780.0959210.0933330.1547750.1718400.1689340.141243
5420060pupils861.000000861.000000864.000000861.000000858.000000845.000000853.000000854.000000853.000000
fsme71.00000077.00000080.00000084.00000081.000000129.000000123.000000124.000000116.000000
free school meals0.0824620.0894310.0925930.0975610.0944060.1526630.1441970.1451990.135991
5420062pupils919.000000940.000000942.000000920.000000900.000000904.000000897.000000903.000000885.000000
fsme57.00000070.00000072.00000082.00000083.000000135.000000132.000000140.000000134.000000
free school meals0.0620240.0744680.0764330.0891300.0922220.1493360.1471570.1550390.151412
5420073pupils527.000000555.000000579.000000604.000000635.000000678.000000707.000000709.000000686.000000
fsme82.00000081.00000089.00000095.00000088.000000155.000000170.000000195.000000168.000000
free school meals0.1555980.1459460.1537130.1572850.1385830.2286140.2404530.2750350.244898
5420076pupils836.000000846.000000845.000000849.000000855.000000853.000000854.000000852.000000843.000000
fsme56.00000068.00000079.00000078.00000074.000000122.000000131.000000130.000000131.000000
free school meals0.0669860.0803780.0934910.0918730.0865500.1430250.1533960.1525820.155397
5420260pupils646.000000658.000000665.000000652.000000653.000000660.000000650.000000652.000000638.000000
fsme29.00000031.00000031.00000031.00000028.00000058.00000064.00000062.00000061.000000
free school meals0.0448920.0471120.0466170.0475460.0428790.0878790.0984620.0950920.095611
\n", "

547 rows × 9 columns

\n", "
" ], "text/plain": [ " 2009 2010 2011 2012 \\\n", "de ref minor \n", "1210014 pupils 672.000000 688.000000 703.000000 708.000000 \n", " fsme 132.000000 153.000000 170.000000 183.000000 \n", " free school meals 0.196429 0.222384 0.241821 0.258475 \n", "1210015 pupils 647.000000 650.000000 649.000000 666.000000 \n", " fsme 127.000000 141.000000 157.000000 177.000000 \n", " free school meals 0.196291 0.216923 0.241911 0.265766 \n", "1210021 pupils 963.000000 929.000000 899.000000 930.000000 \n", " fsme 376.000000 359.000000 367.000000 379.000000 \n", " free school meals 0.390447 0.386437 0.408231 0.407527 \n", "1210022 pupils 907.000000 932.000000 913.000000 930.000000 \n", " fsme 363.000000 392.000000 384.000000 390.000000 \n", " free school meals 0.400221 0.420601 0.420591 0.419355 \n", "1230053 pupils 1547.000000 1530.000000 1530.000000 1521.000000 \n", " fsme 546.000000 551.000000 578.000000 618.000000 \n", " free school meals 0.352941 0.360131 0.377778 0.406312 \n", "1230104 pupils 438.000000 429.000000 384.000000 367.000000 \n", " fsme 184.000000 188.000000 184.000000 192.000000 \n", " free school meals 0.420091 0.438228 0.479167 0.523161 \n", "1230130 pupils 468.000000 440.000000 406.000000 388.000000 \n", " fsme 272.000000 244.000000 239.000000 214.000000 \n", " free school meals 0.581197 0.554545 0.588670 0.551546 \n", "1230146 pupils 508.000000 513.000000 528.000000 529.000000 \n", " fsme 242.000000 237.000000 245.000000 286.000000 \n", " free school meals 0.476378 0.461988 0.464015 0.540643 \n", "1230155 pupils 1011.000000 1027.000000 1043.000000 1069.000000 \n", " fsme 327.000000 349.000000 401.000000 417.000000 \n", " free school meals 0.323442 0.339825 0.384468 0.390084 \n", "1230182 pupils 1116.000000 1088.000000 1088.000000 1098.000000 \n", " fsme 348.000000 348.000000 359.000000 386.000000 \n", " free school meals 0.311828 0.319853 0.329963 0.351548 \n", "... ... ... ... ... \n", "5410013 pupils 1311.000000 1325.000000 1324.000000 1331.000000 \n", " fsme 38.000000 46.000000 48.000000 56.000000 \n", " free school meals 0.028986 0.034717 0.036254 0.042074 \n", "5410057 pupils 432.000000 438.000000 455.000000 457.000000 \n", " fsme 20.000000 27.000000 24.000000 21.000000 \n", " free school meals 0.046296 0.061644 0.052747 0.045952 \n", "5410067 pupils 789.000000 788.000000 780.000000 778.000000 \n", " fsme 27.000000 35.000000 31.000000 34.000000 \n", " free school meals 0.034221 0.044416 0.039744 0.043702 \n", "5420045 pupils 586.000000 587.000000 585.000000 587.000000 \n", " fsme 76.000000 79.000000 71.000000 85.000000 \n", " free school meals 0.129693 0.134583 0.121368 0.144804 \n", "5420059 pupils 880.000000 887.000000 894.000000 907.000000 \n", " fsme 77.000000 88.000000 85.000000 87.000000 \n", " free school meals 0.087500 0.099211 0.095078 0.095921 \n", "5420060 pupils 861.000000 861.000000 864.000000 861.000000 \n", " fsme 71.000000 77.000000 80.000000 84.000000 \n", " free school meals 0.082462 0.089431 0.092593 0.097561 \n", "5420062 pupils 919.000000 940.000000 942.000000 920.000000 \n", " fsme 57.000000 70.000000 72.000000 82.000000 \n", " free school meals 0.062024 0.074468 0.076433 0.089130 \n", "5420073 pupils 527.000000 555.000000 579.000000 604.000000 \n", " fsme 82.000000 81.000000 89.000000 95.000000 \n", " free school meals 0.155598 0.145946 0.153713 0.157285 \n", "5420076 pupils 836.000000 846.000000 845.000000 849.000000 \n", " fsme 56.000000 68.000000 79.000000 78.000000 \n", " free school meals 0.066986 0.080378 0.093491 0.091873 \n", "5420260 pupils 646.000000 658.000000 665.000000 652.000000 \n", " fsme 29.000000 31.000000 31.000000 31.000000 \n", " free school meals 0.044892 0.047112 0.046617 0.047546 \n", "\n", " 2013 2014 2015 2016 \\\n", "de ref minor \n", "1210014 pupils 704.000000 697.000000 704.000000 696.000000 \n", " fsme 171.000000 241.000000 277.000000 301.000000 \n", " free school meals 0.242898 0.345768 0.393466 0.432471 \n", "1210015 pupils 709.000000 737.000000 744.000000 728.000000 \n", " fsme 173.000000 270.000000 312.000000 332.000000 \n", " free school meals 0.244006 0.366350 0.419355 0.456044 \n", "1210021 pupils 916.000000 884.000000 910.000000 954.000000 \n", " fsme 368.000000 452.000000 522.000000 572.000000 \n", " free school meals 0.401747 0.511312 0.573626 0.599581 \n", "1210022 pupils 943.000000 969.000000 968.000000 991.000000 \n", " fsme 380.000000 522.000000 548.000000 575.000000 \n", " free school meals 0.402969 0.538700 0.566116 0.580222 \n", "1230053 pupils 1516.000000 1518.000000 1474.000000 1420.000000 \n", " fsme 563.000000 821.000000 834.000000 847.000000 \n", " free school meals 0.371372 0.540843 0.565807 0.596479 \n", "1230104 pupils 423.000000 433.000000 446.000000 452.000000 \n", " fsme 217.000000 337.000000 333.000000 323.000000 \n", " free school meals 0.513002 0.778291 0.746637 0.714602 \n", "1230130 pupils 352.000000 316.000000 273.000000 240.000000 \n", " fsme 183.000000 217.000000 187.000000 171.000000 \n", " free school meals 0.519886 0.686709 0.684982 0.712500 \n", "1230146 pupils 490.000000 490.000000 498.000000 500.000000 \n", " fsme 236.000000 270.000000 317.000000 326.000000 \n", " free school meals 0.481633 0.551020 0.636546 0.652000 \n", "1230155 pupils 1078.000000 1061.000000 1070.000000 1059.000000 \n", " fsme 409.000000 539.000000 584.000000 591.000000 \n", " free school meals 0.379406 0.508011 0.545794 0.558074 \n", "1230182 pupils 1093.000000 1116.000000 1117.000000 1104.000000 \n", " fsme 345.000000 535.000000 562.000000 588.000000 \n", " free school meals 0.315645 0.479391 0.503133 0.532609 \n", "... ... ... ... ... \n", "5410013 pupils 1327.000000 1324.000000 1320.000000 1312.000000 \n", " fsme 48.000000 67.000000 76.000000 83.000000 \n", " free school meals 0.036172 0.050604 0.057576 0.063262 \n", "5410057 pupils 451.000000 453.000000 455.000000 451.000000 \n", " fsme 25.000000 37.000000 38.000000 41.000000 \n", " free school meals 0.055432 0.081678 0.083516 0.090909 \n", "5410067 pupils 798.000000 791.000000 788.000000 778.000000 \n", " fsme 37.000000 46.000000 58.000000 73.000000 \n", " free school meals 0.046366 0.058154 0.073604 0.093830 \n", "5420045 pupils 586.000000 591.000000 588.000000 564.000000 \n", " fsme 73.000000 135.000000 131.000000 131.000000 \n", " free school meals 0.124573 0.228426 0.222789 0.232270 \n", "5420059 pupils 900.000000 911.000000 902.000000 882.000000 \n", " fsme 84.000000 141.000000 155.000000 149.000000 \n", " free school meals 0.093333 0.154775 0.171840 0.168934 \n", "5420060 pupils 858.000000 845.000000 853.000000 854.000000 \n", " fsme 81.000000 129.000000 123.000000 124.000000 \n", " free school meals 0.094406 0.152663 0.144197 0.145199 \n", "5420062 pupils 900.000000 904.000000 897.000000 903.000000 \n", " fsme 83.000000 135.000000 132.000000 140.000000 \n", " free school meals 0.092222 0.149336 0.147157 0.155039 \n", "5420073 pupils 635.000000 678.000000 707.000000 709.000000 \n", " fsme 88.000000 155.000000 170.000000 195.000000 \n", " free school meals 0.138583 0.228614 0.240453 0.275035 \n", "5420076 pupils 855.000000 853.000000 854.000000 852.000000 \n", " fsme 74.000000 122.000000 131.000000 130.000000 \n", " free school meals 0.086550 0.143025 0.153396 0.152582 \n", "5420260 pupils 653.000000 660.000000 650.000000 652.000000 \n", " fsme 28.000000 58.000000 64.000000 62.000000 \n", " free school meals 0.042879 0.087879 0.098462 0.095092 \n", "\n", " 2017 \n", "de ref minor \n", "1210014 pupils 691.000000 \n", " fsme 310.000000 \n", " free school meals 0.448625 \n", "1210015 pupils 740.000000 \n", " fsme 326.000000 \n", " free school meals 0.440541 \n", "1210021 pupils 946.000000 \n", " fsme 580.000000 \n", " free school meals 0.613108 \n", "1210022 pupils 997.000000 \n", " fsme 588.000000 \n", " free school meals 0.589769 \n", "1230053 pupils 1435.000000 \n", " fsme 860.000000 \n", " free school meals 0.599303 \n", "1230104 pupils 450.000000 \n", " fsme 315.000000 \n", " free school meals 0.700000 \n", "1230130 pupils 243.000000 \n", " fsme 166.000000 \n", " free school meals 0.683128 \n", "1230146 pupils 525.000000 \n", " fsme 329.000000 \n", " free school meals 0.626667 \n", "1230155 pupils 1022.000000 \n", " fsme 559.000000 \n", " free school meals 0.546967 \n", "1230182 pupils 958.000000 \n", " fsme 508.000000 \n", " free school meals 0.530271 \n", "... ... \n", "5410013 pupils 1301.000000 \n", " fsme 86.000000 \n", " free school meals 0.066103 \n", "5410057 pupils 455.000000 \n", " fsme 50.000000 \n", " free school meals 0.109890 \n", "5410067 pupils 744.000000 \n", " fsme 64.000000 \n", " free school meals 0.086022 \n", "5420045 pupils 564.000000 \n", " fsme 126.000000 \n", " free school meals 0.223404 \n", "5420059 pupils 885.000000 \n", " fsme 125.000000 \n", " free school meals 0.141243 \n", "5420060 pupils 853.000000 \n", " fsme 116.000000 \n", " free school meals 0.135991 \n", "5420062 pupils 885.000000 \n", " fsme 134.000000 \n", " free school meals 0.151412 \n", "5420073 pupils 686.000000 \n", " fsme 168.000000 \n", " free school meals 0.244898 \n", "5420076 pupils 843.000000 \n", " fsme 131.000000 \n", " free school meals 0.155397 \n", "5420260 pupils 638.000000 \n", " fsme 61.000000 \n", " free school meals 0.095611 \n", "\n", "[547 rows x 9 columns]" ] }, "execution_count": 17, "metadata": {}, "output_type": "execute_result" } ], "source": [ "fsm.to_frame()" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## New heading" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:36:11.972386Z", "start_time": "2018-06-07T10:36:11.946Z" } }, "outputs": [], "source": [ "dfs[2016]" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:36:11.973678Z", "start_time": "2018-06-07T10:36:11.949Z" } }, "outputs": [], "source": [ "Counter(reference[:,:,'school management type'].values.ravel('k'))" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:36:11.974946Z", "start_time": "2018-06-07T10:36:11.954Z" } }, "outputs": [], "source": [ "reference[:,:,'school management type'].apply(Counter, axis=0)" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:36:11.975973Z", "start_time": "2018-06-07T10:36:11.960Z" } }, "outputs": [], "source": [ "categories=pd.DataFrame.from_dict({\n", " year: dict(c)\n", " for year,c in reference[:,:,'school management type'].apply(Counter, axis=0).iteritems()\n", "})\n", "categories.plot.bar()" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:36:11.977774Z", "start_time": "2018-06-07T10:36:11.963Z" } }, "outputs": [], "source": [ "pd.DataFrame.from_dict({\n", " category:\n", " enrolements[:,(reference.minor_xs('school management type')==category).any(axis=1),:].sum().sum()\n", " for category in categories.drop(np.nan).index\n", "}).plot()" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:36:11.983348Z", "start_time": "2018-06-07T10:36:11.968Z" } }, "outputs": [], "source": [ "enrolements.sum().sum().plot()" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:36:11.989380Z", "start_time": "2018-06-07T10:36:11.971Z" } }, "outputs": [], "source": [ "\n", "Counter(reference.minor_xs('town').values.ravel('k'))" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:36:11.995484Z", "start_time": "2018-06-07T10:36:11.975Z" } }, "outputs": [], "source": [ "gazetteer = \"45341066-1998-4116-b234-6223e7e19397\"\n", "gztr = pd.DataFrame.from_records(dataset_generator(gazetteer))\n", "gztr" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:36:12.002026Z", "start_time": "2018-06-07T10:36:11.979Z" } }, "outputs": [], "source": [ "gztr['town'] = gztr['PLACENAME'].str.lower()\n", "town_lookup = gztr.set_index('town')[['X','Y']]\n", "town_lookup" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:36:12.007460Z", "start_time": "2018-06-07T10:36:11.981Z" } }, "outputs": [], "source": [ "for town, n in Counter(reference.minor_xs('town').values.ravel('k')).items():\n", " if town not in town_lookup.index:\n", " print(f\"{town}:{n}\")" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:36:12.013210Z", "start_time": "2018-06-07T10:36:11.985Z" } }, "outputs": [], "source": [ "from shapely.geometry import Point\n", "from pyproj import Proj, transform\n", "prj_wgs = Proj(proj='latlong',datum='WGS84')\n", "prj_itm = Proj(init='EPSG:29903')\n", "\n", "def apply_itm_to_wgs(row, e='eastings', n='northings'):\n", " eastings, northings = row[e], row[n]\n", " if eastings is not None and northings is not None: \n", " long,lat = transform(prj_itm, prj_wgs, eastings, northings)\n", " else:\n", " long,lat = None,None\n", " \n", " return pd.Series({'latitude':lat,'longitude':long})\n", "town_lookup = gpd.GeoDataFrame(town_lookup, crs={'init': 'epsg:4326'},\n", " geometry=town_lookup.apply(lambda r: Point(apply_itm_to_wgs(r, e='Y',n='X')), axis=1))\n", "town_lookup.plot()" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:36:12.019400Z", "start_time": "2018-06-07T10:36:11.987Z" } }, "outputs": [], "source": [ "categories = set(reference.minor_xs('town').values.ravel('k'))\n", "df= pd.DataFrame.from_dict({\n", " category:\n", " enrolements[:,(reference.minor_xs('town')==category).any(axis=1),:].sum().sum()\n", " for category in categories\n", "}).T.drop(np.nan)\n" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:36:12.025399Z", "start_time": "2018-06-07T10:36:11.991Z" } }, "outputs": [], "source": [ "town_stats = gpd.GeoDataFrame(geometry=town_lookup.apply(lambda r: Point(apply_itm_to_wgs(r, e='Y',n='X')), axis=1))\n", "town_stats['mean_enrolment'] = df.mean(axis=1)\n", "town_stats['2017_change'] = (-1+df[2017]/df.mean(axis=1))\n", "town_stats.plot(column='2017_change')" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:36:12.030985Z", "start_time": "2018-06-07T10:36:11.993Z" }, "code_folding": [] }, "outputs": [], "source": [ "constituency_shp = 'http://osni-spatial-ni.opendata.arcgis.com/datasets/563dc2ec3d9943428e3fe68966d40deb_3.zip'\n", "urllib.request.urlretrieve(constituency_shp, 'data/constituency.zip')\n", "import zipfile\n", "with zipfile.ZipFile('data/constituency.zip','r') as z:\n", " z.extractall('data/')" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "ExecuteTime": { "end_time": "2018-06-07T10:36:12.036793Z", "start_time": "2018-06-07T10:36:11.997Z" } }, "outputs": [], "source": [ "import geopandas as gpd\n", "df = gpd.GeoDataFrame.from_file('data/OSNI_Open_Data_Largescale_Boundaries__Parliamentary_Constituencies_2008.shp')\n", "df" ] } ], "metadata": { "kernelspec": { "display_name": "Python [conda root]", "language": "python", "name": "conda-root-py" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.6.4" }, "toc": { "base_numbering": 1, "nav_menu": {}, "number_sections": true, "sideBar": true, "skip_h1_title": false, "title_cell": "Table of Contents", "title_sidebar": "Contents", "toc_cell": false, "toc_position": {}, "toc_section_display": true, "toc_window_display": false } }, "nbformat": 4, "nbformat_minor": 2 }