{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# Getting Started" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "This module provides cached loading of open datasets from Faculty. To view\n", "the available datasets:" ] }, { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [], "source": [ "from faculty_extras import opendata" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "['higgs_boson/README.md',\n", " 'higgs_boson/higgs.csv',\n", " 'higgs_boson/higgs_test.csv',\n", " 'higgs_boson/higgs_train.csv',\n", " 'higgs_boson/higgs_validate.csv',\n", " 'tutorials/supermarkets/.ipynb_checkpoints/modify-checkpoint.ipynb',\n", " 'tutorials/supermarkets/README.md',\n", " 'tutorials/supermarkets/lidl.csv',\n", " 'tutorials/supermarkets/waitrose.csv',\n", " 'uk_2011_census/census_by_outputarea.csv',\n", " 'uk_2011_census/census_variable_info.csv',\n", " 'uk_2011_census/outputarea_localauthority_mapping.csv',\n", " 'uk_2011_census/outputarea_lsoa_msoa_mapping.csv',\n", " 'uk_2011_census/outputarea_parliamentaryconstituency_mapping.csv',\n", " 'uk_2011_census/postcode_outputarea_mapping.csv',\n", " 'uk_2011_census/ukpostcodes.csv',\n", " 'uk_statistical_boundaries/geojson/local_authorities.json',\n", " 'uk_statistical_boundaries/geojson/lower_super_output_areas.json',\n", " 'uk_statistical_boundaries/geojson/middle_super_output_areas.json',\n", " 'uk_statistical_boundaries/geojson/output_areas.json',\n", " 'uk_statistical_boundaries/geojson/parliamentary_constituencies.json',\n", " 'uk_statistical_boundaries/topojson/uk_statistical_boundaries.json',\n", " 'us_flights/README.md',\n", " 'us_flights/us_flights_1987.csv',\n", " 'us_flights/us_flights_1988.csv',\n", " 'us_flights/us_flights_1989.csv',\n", " 'us_flights/us_flights_1990.csv',\n", " 'us_flights/us_flights_1991.csv',\n", " 'us_flights/us_flights_1992.csv',\n", " 'us_flights/us_flights_1993.csv',\n", " 'us_flights/us_flights_1994.csv',\n", " 'us_flights/us_flights_1995.csv',\n", " 'us_flights/us_flights_1996.csv',\n", " 'us_flights/us_flights_1997.csv',\n", " 'us_flights/us_flights_1998.csv',\n", " 'us_flights/us_flights_1999.csv',\n", " 'us_flights/us_flights_2000.csv',\n", " 'us_flights/us_flights_2001.csv',\n", " 'us_flights/us_flights_2002.csv',\n", " 'us_flights/us_flights_2003.csv',\n", " 'us_flights/us_flights_2004.csv',\n", " 'us_flights/us_flights_2005.csv',\n", " 'us_flights/us_flights_2006.csv',\n", " 'us_flights/us_flights_2007.csv',\n", " 'us_flights/us_flights_2008.csv',\n", " 'us_flights/us_flights_dtypes.json']" ] }, "execution_count": 2, "metadata": {}, "output_type": "execute_result" } ], "source": [ "opendata.ls()" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "To load one of the datasets into a pandas DataFrame:" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [], "source": [ "df = opendata.load(\"uk_2011_census/census_by_outputarea.csv\")" ] }, { "cell_type": "code", "execution_count": 4, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
| \n", " | OA | \n", "Total_Population | \n", "Total_Households | \n", "Total_Dwellings | \n", "Total_Household_Spaces | \n", "Total_Population_16_and_over | \n", "Total_Population_16_to_74 | \n", "Total_Pop_No_NI_Students_16_to_74 | \n", "Total_Employment_16_to_74 | \n", "Total_Pop_in_Housesholds_16_and_over | \n", "... | \n", "u158 | \n", "u159 | \n", "u160 | \n", "u161 | \n", "u162 | \n", "u163 | \n", "u164 | \n", "u165 | \n", "u166 | \n", "u167 | \n", "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", "E00000001 | \n", "194 | \n", "99 | \n", "115 | \n", "115 | \n", "173 | \n", "148 | \n", "148 | \n", "102 | \n", "173 | \n", "... | \n", "6 | \n", "18 | \n", "57 | \n", "14 | \n", "9 | \n", "2 | \n", "2 | \n", "0 | \n", "0 | \n", "0 | \n", "
| 1 | \n", "E00000003 | \n", "250 | \n", "112 | \n", "125 | \n", "125 | \n", "218 | \n", "199 | \n", "199 | \n", "147 | \n", "218 | \n", "... | \n", "10 | \n", "24 | \n", "74 | \n", "32 | \n", "6 | \n", "2 | \n", "1 | \n", "2 | \n", "1 | \n", "5 | \n", "
| 2 | \n", "E00000005 | \n", "367 | \n", "217 | \n", "241 | \n", "241 | \n", "337 | \n", "304 | \n", "304 | \n", "241 | \n", "337 | \n", "... | \n", "16 | \n", "37 | \n", "117 | \n", "52 | \n", "12 | \n", "7 | \n", "9 | \n", "3 | \n", "0 | \n", "4 | \n", "
| 3 | \n", "E00000007 | \n", "123 | \n", "83 | \n", "103 | \n", "103 | \n", "113 | \n", "111 | \n", "111 | \n", "86 | \n", "113 | \n", "... | \n", "4 | \n", "18 | \n", "36 | \n", "20 | \n", "9 | \n", "0 | \n", "2 | \n", "0 | \n", "0 | \n", "1 | \n", "
| 4 | \n", "E00000010 | \n", "102 | \n", "78 | \n", "79 | \n", "79 | \n", "97 | \n", "86 | \n", "86 | \n", "59 | \n", "97 | \n", "... | \n", "12 | \n", "11 | \n", "16 | \n", "16 | \n", "6 | \n", "0 | \n", "5 | \n", "0 | \n", "0 | \n", "5 | \n", "
5 rows × 178 columns
\n", "