{ "cells": [ { "cell_type": "markdown", "id": "740a2d15", "metadata": {}, "source": [ "# KNN imputation " ] }, { "cell_type": "code", "execution_count": 1, "id": "bfae286d", "metadata": {}, "outputs": [], "source": [ "import os\n", "import pandas as pd\n", "import numpy as np\n", "\n", "from sklearn.experimental import enable_iterative_imputer\n", "from sklearn.impute import IterativeImputer\n", "from sklearn.impute import KNNImputer" ] }, { "cell_type": "code", "execution_count": 3, "id": "f65f7221", "metadata": {}, "outputs": [], "source": [ "# CSV hosted in the CharlotteJames/ed-forecast GitHub repository (main branch).\n", "MASTER_CSV_URL = 'https://raw.githubusercontent.com/CharlotteJames/ed-forecast/main/data/master_scaled_impute.csv'\n", "\n", "# The first CSV column is used as the DataFrame index.\n", "master = pd.read_csv(MASTER_CSV_URL, index_col=0)" ] }, { "cell_type": "code", "execution_count": 4, "id": "6ab9ea01", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | ccg | \n", "month | \n", "111_111_offered | \n", "111_111_answered | \n", "amb_sys_made | \n", "amb_sys_answered | \n", "gp_appt_attended | \n", "gp_appt_available | \n", "ae_attendances_attendances | \n", "population | \n", "People | \n", "Places | \n", "Lives | \n", "year | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "00N | \n", "Jan | \n", "568.479362 | \n", "459.899870 | \n", "216.450677 | \n", "148.439545 | \n", "4338.335607 | \n", "4738.295678 | \n", "385.585466 | \n", "15.0265 | \n", "94.8 | \n", "101.7 | \n", "96.8 | \n", "2018 | \n", "
1 | \n", "00N | \n", "Feb | \n", "472.022555 | \n", "395.194004 | \n", "204.869142 | \n", "147.335865 | \n", "3704.655109 | \n", "4074.002595 | \n", "347.519382 | \n", "15.0265 | \n", "94.8 | \n", "101.7 | \n", "96.8 | \n", "2018 | \n", "
2 | \n", "00N | \n", "Mar | \n", "541.224032 | \n", "453.863381 | \n", "233.092813 | \n", "168.121234 | \n", "3907.696403 | \n", "4321.498686 | \n", "383.389345 | \n", "15.0265 | \n", "94.8 | \n", "101.7 | \n", "96.8 | \n", "2018 | \n", "
3 | \n", "00N | \n", "Apr | \n", "506.059962 | \n", "438.172926 | \n", "210.990836 | \n", "149.848422 | \n", "3721.092736 | \n", "4089.042691 | \n", "396.299870 | \n", "15.0265 | \n", "94.8 | \n", "101.7 | \n", "96.8 | \n", "2018 | \n", "
4 | \n", "00N | \n", "May | \n", "517.326603 | \n", "452.985246 | \n", "223.273261 | \n", "164.595494 | \n", "3848.800453 | \n", "4224.337005 | \n", "422.187469 | \n", "15.0265 | \n", "94.8 | \n", "101.7 | \n", "96.8 | \n", "2018 | \n", "