{ "cells": [ { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [], "source": [ "import itertools\n", "import collections\n", "import json\n", "import pandas as pd\n", "import numpy as np\n", "from scipy.stats import gmean\n", "import datetime\n", "\n", "import matplotlib as mpl\n", "import matplotlib.pyplot as plt\n", "%matplotlib inline" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ " % Total % Received % Xferd Average Speed Time Time Time Current\n", " Dload Upload Total Spent Left Speed\n", "100 1292 0 1292 0 0 1196 0 --:--:-- 0:00:01 --:--:-- 1196\n" ] } ], "source": [ "# Download UK-wide daily hospital admissions as CSV; the response is piped through gunzip before being saved.\n", "# --fail makes curl exit on an HTTP error status instead of handing the error body to gunzip.\n", "# NOTE(review): `%2520` is a doubly percent-encoded space; the recorded run succeeded with it, so it is left unchanged.\n", "!curl --fail \"https://api.coronavirus-staging.data.gov.uk/v1/data?filters=areaName=United%2520Kingdom;areaType=overview&structure=%7B%22date%22:%22date%22,%22areaName%22:%22areaName%22,%22areaType%22:%22areaType%22,%22newAdmissions%22:%22newAdmissions%22,%22cumAdmissions%22:%22cumAdmissions%22%7D&format=csv\" | gunzip > hospital_admissions.csv" ] }, { "cell_type": "code", "execution_count": 4, "metadata": {}, "outputs": [], "source": [ "# Read the downloaded file, parsing the `date` column (named explicitly rather than by position).\n", "# NOTE(review): `dayfirst=True` was dropped on the assumption that the API emits ISO YYYY-MM-DD dates - confirm against the CSV.\n", "raw_data = pd.read_csv('hospital_admissions.csv', parse_dates=['date'])" ] }, { "cell_type": "code", "execution_count": 5, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "date datetime64[ns]\n", "areaName object\n", "areaType object\n", "newAdmissions int64\n", "cumAdmissions int64\n", "dtype: object" ] }, "execution_count": 5, "metadata": {}, "output_type": "execute_result" } ], "source": [ "raw_data.dtypes" ] }, { "cell_type": "code", "execution_count": 6, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | areaName | \n", "areaType | \n", "newAdmissions | \n", "cumAdmissions | \n", "
---|---|---|---|---|
date | \n", "\n", " | \n", " | \n", " | \n", " |
2020-03-23 | \n", "United Kingdom | \n", "overview | \n", "1687 | \n", "6794 | \n", "
2020-03-24 | \n", "United Kingdom | \n", "overview | \n", "1931 | \n", "8725 | \n", "
2020-03-25 | \n", "United Kingdom | \n", "overview | \n", "1968 | \n", "10693 | \n", "
2020-03-26 | \n", "United Kingdom | \n", "overview | \n", "2222 | \n", "12915 | \n", "
2020-03-27 | \n", "United Kingdom | \n", "overview | \n", "2165 | \n", "15080 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
2020-08-01 | \n", "United Kingdom | \n", "overview | \n", "133 | \n", "132672 | \n", "
2020-08-02 | \n", "United Kingdom | \n", "overview | \n", "109 | \n", "132781 | \n", "
2020-08-03 | \n", "United Kingdom | \n", "overview | \n", "89 | \n", "132870 | \n", "
2020-08-04 | \n", "United Kingdom | \n", "overview | \n", "126 | \n", "132996 | \n", "
2020-08-05 | \n", "United Kingdom | \n", "overview | \n", "128 | \n", "133124 | \n", "
136 rows × 4 columns
\n", "\n", " | cases | \n", "deaths | \n", "cases_culm | \n", "deaths_culm | \n", "cases_diff | \n", "deaths_diff | \n", "
---|---|---|---|---|---|---|
dateRep | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
2019-12-31 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "NaN | \n", "NaN | \n", "
2020-01-01 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0.0 | \n", "
2020-01-02 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0.0 | \n", "
2020-01-03 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0.0 | \n", "
2020-01-04 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0.0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
2020-08-14 | \n", "1129 | \n", "-5359 | \n", "314927 | \n", "41347 | \n", "120.0 | \n", "-5539.0 | \n", "
2020-08-15 | \n", "1440 | \n", "10 | \n", "316367 | \n", "41357 | \n", "311.0 | \n", "5369.0 | \n", "
2020-08-16 | \n", "1077 | \n", "4 | \n", "317444 | \n", "41361 | \n", "-363.0 | \n", "-6.0 | \n", "
2020-08-17 | \n", "1040 | \n", "5 | \n", "318484 | \n", "41366 | \n", "-37.0 | \n", "1.0 | \n", "
2020-08-18 | \n", "713 | \n", "3 | \n", "319197 | \n", "41369 | \n", "-327.0 | \n", "-2.0 | \n", "
232 rows × 6 columns
\n", "\n", " | cases | \n", "deaths | \n", "cases_culm | \n", "deaths_culm | \n", "cases_diff | \n", "deaths_diff | \n", "
---|---|---|---|---|---|---|
dateRep | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
2019-12-31 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "NaN | \n", "NaN | \n", "
2020-01-01 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0.0 | \n", "
2020-01-02 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0.0 | \n", "
2020-01-03 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0.0 | \n", "
2020-01-04 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0.0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
2020-08-14 | \n", "1129 | \n", "-5359 | \n", "314927 | \n", "41347 | \n", "120.0 | \n", "-5539.0 | \n", "
2020-08-15 | \n", "1440 | \n", "10 | \n", "316367 | \n", "41357 | \n", "311.0 | \n", "5369.0 | \n", "
2020-08-16 | \n", "1077 | \n", "4 | \n", "317444 | \n", "41361 | \n", "-363.0 | \n", "-6.0 | \n", "
2020-08-17 | \n", "1040 | \n", "5 | \n", "318484 | \n", "41366 | \n", "-37.0 | \n", "1.0 | \n", "
2020-08-18 | \n", "713 | \n", "3 | \n", "319197 | \n", "41369 | \n", "-327.0 | \n", "-2.0 | \n", "
232 rows × 6 columns
\n", "\n", " | cases | \n", "deaths | \n", "cases_culm | \n", "deaths_culm | \n", "cases_diff | \n", "deaths_diff | \n", "newAdmissions | \n", "cumAdmissions | \n", "deaths_m7 | \n", "cases_m7 | \n", "admissions_m7 | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|
2019-12-31 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.000000 | \n", "0.000000 | \n", "NaN | \n", "
2020-01-01 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0.0 | \n", "NaN | \n", "NaN | \n", "0.000000 | \n", "0.000000 | \n", "NaN | \n", "
2020-01-02 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0.0 | \n", "NaN | \n", "NaN | \n", "0.000000 | \n", "0.000000 | \n", "NaN | \n", "
2020-01-03 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0.0 | \n", "NaN | \n", "NaN | \n", "0.000000 | \n", "0.000000 | \n", "NaN | \n", "
2020-01-04 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0.0 | \n", "NaN | \n", "NaN | \n", "0.000000 | \n", "0.000000 | \n", "NaN | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
2020-08-14 | \n", "1129 | \n", "-5359 | \n", "314927 | \n", "41347 | \n", "120.0 | \n", "-5539.0 | \n", "NaN | \n", "NaN | \n", "-723.714286 | \n", "970.428571 | \n", "NaN | \n", "
2020-08-15 | \n", "1440 | \n", "10 | \n", "316367 | \n", "41357 | \n", "311.0 | \n", "5369.0 | \n", "NaN | \n", "NaN | \n", "-736.285714 | \n", "1051.714286 | \n", "NaN | \n", "
2020-08-16 | \n", "1077 | \n", "4 | \n", "317444 | \n", "41361 | \n", "-363.0 | \n", "-6.0 | \n", "NaN | \n", "NaN | \n", "-743.571429 | \n", "1097.285714 | \n", "NaN | \n", "
2020-08-17 | \n", "1040 | \n", "5 | \n", "318484 | \n", "41366 | \n", "-37.0 | \n", "1.0 | \n", "NaN | \n", "NaN | \n", "-744.000000 | \n", "1094.142857 | \n", "NaN | \n", "
2020-08-18 | \n", "713 | \n", "3 | \n", "319197 | \n", "41369 | \n", "-327.0 | \n", "-2.0 | \n", "NaN | \n", "NaN | \n", "-736.714286 | \n", "1079.428571 | \n", "NaN | \n", "
232 rows × 11 columns
\n", "\n", " | cases | \n", "deaths | \n", "cases_culm | \n", "deaths_culm | \n", "cases_diff | \n", "deaths_diff | \n", "newAdmissions | \n", "cumAdmissions | \n", "deaths_m7 | \n", "cases_m7 | \n", "admissions_m7 | \n", "cases_m7n | \n", "deaths_m7n | \n", "admissions_m7n | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
2019-12-31 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "NaN | \n", "0.000000 | \n", "0.000000 | \n", "NaN | \n", "0.000000 | \n", "0.000000 | \n", "NaN | \n", "
2020-01-01 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0.0 | \n", "NaN | \n", "NaN | \n", "0.000000 | \n", "0.000000 | \n", "NaN | \n", "0.000000 | \n", "0.000000 | \n", "NaN | \n", "
2020-01-02 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0.0 | \n", "NaN | \n", "NaN | \n", "0.000000 | \n", "0.000000 | \n", "NaN | \n", "0.000000 | \n", "0.000000 | \n", "NaN | \n", "
2020-01-03 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0.0 | \n", "NaN | \n", "NaN | \n", "0.000000 | \n", "0.000000 | \n", "NaN | \n", "0.000000 | \n", "0.000000 | \n", "NaN | \n", "
2020-01-04 | \n", "0 | \n", "0 | \n", "0 | \n", "0 | \n", "0.0 | \n", "0.0 | \n", "NaN | \n", "NaN | \n", "0.000000 | \n", "0.000000 | \n", "NaN | \n", "0.000000 | \n", "0.000000 | \n", "NaN | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
2020-08-14 | \n", "1129 | \n", "-5359 | \n", "314927 | \n", "41347 | \n", "120.0 | \n", "-5539.0 | \n", "NaN | \n", "NaN | \n", "-723.714286 | \n", "970.428571 | \n", "NaN | \n", "0.200248 | \n", "-0.766067 | \n", "NaN | \n", "
2020-08-15 | \n", "1440 | \n", "10 | \n", "316367 | \n", "41357 | \n", "311.0 | \n", "5369.0 | \n", "NaN | \n", "NaN | \n", "-736.285714 | \n", "1051.714286 | \n", "NaN | \n", "0.217021 | \n", "-0.779374 | \n", "NaN | \n", "
2020-08-16 | \n", "1077 | \n", "4 | \n", "317444 | \n", "41361 | \n", "-363.0 | \n", "-6.0 | \n", "NaN | \n", "NaN | \n", "-743.571429 | \n", "1097.285714 | \n", "NaN | \n", "0.226425 | \n", "-0.787086 | \n", "NaN | \n", "
2020-08-17 | \n", "1040 | \n", "5 | \n", "318484 | \n", "41366 | \n", "-37.0 | \n", "1.0 | \n", "NaN | \n", "NaN | \n", "-744.000000 | \n", "1094.142857 | \n", "NaN | \n", "0.225776 | \n", "-0.787540 | \n", "NaN | \n", "
2020-08-18 | \n", "713 | \n", "3 | \n", "319197 | \n", "41369 | \n", "-327.0 | \n", "-2.0 | \n", "NaN | \n", "NaN | \n", "-736.714286 | \n", "1079.428571 | \n", "NaN | \n", "0.222740 | \n", "-0.779828 | \n", "NaN | \n", "
232 rows × 14 columns
\n", "\n", " | cases | \n", "cases_culm | \n", "deaths | \n", "deaths_culm | \n", "newAdmissions | \n", "cumAdmissions | \n", "deaths_m7 | \n", "cases_m7 | \n", "admissions_m7 | \n", "cases_m7n | \n", "deaths_m7n | \n", "admissions_m7n | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|
2019-12-31 | \n", "0.0 | \n", "0.0 | \n", "0 | \n", "0 | \n", "NaN | \n", "NaN | \n", "0.000000 | \n", "0.0 | \n", "NaN | \n", "0.0 | \n", "0.000000 | \n", "NaN | \n", "
2020-01-01 | \n", "0.0 | \n", "0.0 | \n", "0 | \n", "0 | \n", "NaN | \n", "NaN | \n", "0.000000 | \n", "0.0 | \n", "NaN | \n", "0.0 | \n", "0.000000 | \n", "NaN | \n", "
2020-01-02 | \n", "0.0 | \n", "0.0 | \n", "0 | \n", "0 | \n", "NaN | \n", "NaN | \n", "0.000000 | \n", "0.0 | \n", "NaN | \n", "0.0 | \n", "0.000000 | \n", "NaN | \n", "
2020-01-03 | \n", "0.0 | \n", "0.0 | \n", "0 | \n", "0 | \n", "NaN | \n", "NaN | \n", "0.000000 | \n", "0.0 | \n", "NaN | \n", "0.0 | \n", "0.000000 | \n", "NaN | \n", "
2020-01-04 | \n", "0.0 | \n", "0.0 | \n", "0 | \n", "0 | \n", "NaN | \n", "NaN | \n", "0.000000 | \n", "0.0 | \n", "NaN | \n", "0.0 | \n", "0.000000 | \n", "NaN | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
2020-08-14 | \n", "NaN | \n", "NaN | \n", "-5359 | \n", "41347 | \n", "NaN | \n", "NaN | \n", "-723.714286 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "-1.685296 | \n", "NaN | \n", "
2020-08-15 | \n", "NaN | \n", "NaN | \n", "10 | \n", "41357 | \n", "NaN | \n", "NaN | \n", "-736.285714 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "-1.714571 | \n", "NaN | \n", "
2020-08-16 | \n", "NaN | \n", "NaN | \n", "4 | \n", "41361 | \n", "NaN | \n", "NaN | \n", "-743.571429 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "-1.731537 | \n", "NaN | \n", "
2020-08-17 | \n", "NaN | \n", "NaN | \n", "5 | \n", "41366 | \n", "NaN | \n", "NaN | \n", "-744.000000 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "-1.732535 | \n", "NaN | \n", "
2020-08-18 | \n", "NaN | \n", "NaN | \n", "3 | \n", "41369 | \n", "NaN | \n", "NaN | \n", "-736.714286 | \n", "NaN | \n", "NaN | \n", "NaN | \n", "-1.715569 | \n", "NaN | \n", "
232 rows × 12 columns
\n", "\n", " | areaType | \n", "areaName | \n", "newCasesByPublishDate | \n", "cumCasesByPublishDate | \n", "
---|---|---|---|---|
date | \n", "\n", " | \n", " | \n", " | \n", " |
2020-03-10 | \n", "overview | \n", "United Kingdom | \n", "NaN | \n", "373 | \n", "
2020-03-11 | \n", "overview | \n", "United Kingdom | \n", "83.0 | \n", "456 | \n", "
2020-03-12 | \n", "overview | \n", "United Kingdom | \n", "134.0 | \n", "590 | \n", "
2020-03-13 | \n", "overview | \n", "United Kingdom | \n", "207.0 | \n", "797 | \n", "
2020-03-14 | \n", "overview | \n", "United Kingdom | \n", "264.0 | \n", "1061 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
2020-06-29 | \n", "overview | \n", "United Kingdom | \n", "815.0 | \n", "311965 | \n", "
2020-06-30 | \n", "overview | \n", "United Kingdom | \n", "689.0 | \n", "312654 | \n", "
2020-07-01 | \n", "overview | \n", "United Kingdom | \n", "829.0 | \n", "313483 | \n", "
2020-07-02 | \n", "overview | \n", "United Kingdom | \n", "576.0 | \n", "283757 | \n", "
2020-07-03 | \n", "overview | \n", "United Kingdom | \n", "544.0 | \n", "284276 | \n", "
116 rows × 4 columns
\n", "