{
 "cells": [
  {
   "attachments": {},
   "cell_type": "markdown",
   "id": "4c9be1ce",
   "metadata": {},
   "source": [
    "Basic Statistics\n",
    "================\n",
    "\n",
    "This notebook shows how to use `pandas` to find\n",
    "basic quantitative descriptions of our data.\n",
    "\n",
    "Topics in this Notebook:\n",
    "\n",
    "- dropping columns\n",
    "- minimum and maximum ranges\n",
    "- averages\n",
    "- counts\n",
    "- sorting data\n",
    "- correlations with `corr()`\n",
    "- `describe()`"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "98a332e1",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>dbn</th>\n",
       "      <th>district</th>\n",
       "      <th>boro</th>\n",
       "      <th>school_name</th>\n",
       "      <th>total_enrollment</th>\n",
       "      <th>asian_pct</th>\n",
       "      <th>black_pct</th>\n",
       "      <th>hispanic_pct</th>\n",
       "      <th>white_pct</th>\n",
       "      <th>swd_pct</th>\n",
       "      <th>ell_pct</th>\n",
       "      <th>poverty_pct</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>01M015</td>\n",
       "      <td>1</td>\n",
       "      <td>Manhattan</td>\n",
       "      <td>P.S. 015 Roberto Clemente</td>\n",
       "      <td>193</td>\n",
       "      <td>0.135</td>\n",
       "      <td>0.275</td>\n",
       "      <td>0.528</td>\n",
       "      <td>0.057</td>\n",
       "      <td>0.223</td>\n",
       "      <td>0.109</td>\n",
       "      <td>0.819</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>01M019</td>\n",
       "      <td>1</td>\n",
       "      <td>Manhattan</td>\n",
       "      <td>P.S. 019 Asher Levy</td>\n",
       "      <td>212</td>\n",
       "      <td>0.061</td>\n",
       "      <td>0.193</td>\n",
       "      <td>0.613</td>\n",
       "      <td>0.080</td>\n",
       "      <td>0.392</td>\n",
       "      <td>0.042</td>\n",
       "      <td>0.712</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>01M020</td>\n",
       "      <td>1</td>\n",
       "      <td>Manhattan</td>\n",
       "      <td>P.S. 020 Anna Silver</td>\n",
       "      <td>412</td>\n",
       "      <td>0.248</td>\n",
       "      <td>0.133</td>\n",
       "      <td>0.522</td>\n",
       "      <td>0.073</td>\n",
       "      <td>0.218</td>\n",
       "      <td>0.119</td>\n",
       "      <td>0.709</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>01M034</td>\n",
       "      <td>1</td>\n",
       "      <td>Manhattan</td>\n",
       "      <td>P.S. 034 Franklin D. Roosevelt</td>\n",
       "      <td>273</td>\n",
       "      <td>0.026</td>\n",
       "      <td>0.381</td>\n",
       "      <td>0.557</td>\n",
       "      <td>0.029</td>\n",
       "      <td>0.392</td>\n",
       "      <td>0.062</td>\n",
       "      <td>0.960</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>01M063</td>\n",
       "      <td>1</td>\n",
       "      <td>Manhattan</td>\n",
       "      <td>The STAR Academy - P.S.63</td>\n",
       "      <td>208</td>\n",
       "      <td>0.029</td>\n",
       "      <td>0.192</td>\n",
       "      <td>0.635</td>\n",
       "      <td>0.091</td>\n",
       "      <td>0.279</td>\n",
       "      <td>0.014</td>\n",
       "      <td>0.769</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "       dbn  district       boro                     school_name  \\\n",
       "4   01M015         1  Manhattan       P.S. 015 Roberto Clemente   \n",
       "9   01M019         1  Manhattan             P.S. 019 Asher Levy   \n",
       "14  01M020         1  Manhattan            P.S. 020 Anna Silver   \n",
       "19  01M034         1  Manhattan  P.S. 034 Franklin D. Roosevelt   \n",
       "24  01M063         1  Manhattan       The STAR Academy - P.S.63   \n",
       "\n",
       "    total_enrollment  asian_pct  black_pct  hispanic_pct  white_pct  swd_pct  \\\n",
       "4                193      0.135      0.275         0.528      0.057    0.223   \n",
       "9                212      0.061      0.193         0.613      0.080    0.392   \n",
       "14               412      0.248      0.133         0.522      0.073    0.218   \n",
       "19               273      0.026      0.381         0.557      0.029    0.392   \n",
       "24               208      0.029      0.192         0.635      0.091    0.279   \n",
       "\n",
       "    ell_pct  poverty_pct  \n",
       "4     0.109        0.819  \n",
       "9     0.042        0.712  \n",
       "14    0.119        0.709  \n",
       "19    0.062        0.960  \n",
       "24    0.014        0.769  "
      ]
     },
     "execution_count": 1,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# import schools from the nycschools package\n",
    "from nycschools import schools\n",
    "\n",
    "# the subset of columns we will use in this notebook\n",
    "cols = [\n",
    "    'dbn',\n",
    "    'district',\n",
    "    'boro',\n",
    "    'school_name',\n",
    "    'total_enrollment',\n",
    "    'asian_pct',\n",
    "    'black_pct',\n",
    "    'hispanic_pct',\n",
    "    'white_pct',\n",
    "    'swd_pct',\n",
    "    'ell_pct',\n",
    "    'poverty_pct'\n",
    "]\n",
    "\n",
    "# load the demographic data into a `DataFrame` called df\n",
    "df = schools.load_school_demographics()\n",
    "\n",
    "# keep just one year of data (rows where ay is 2020)\n",
    "# and only the columns listed above\n",
    "df = df.loc[df.ay == 2020, cols]\n",
    "\n",
    "# show the first few rows\n",
    "df.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "dcec0f0c",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>dbn</th>\n",
       "      <th>district</th>\n",
       "      <th>boro</th>\n",
       "      <th>school_name</th>\n",
       "      <th>total_enrollment</th>\n",
       "      <th>asian_pct</th>\n",
       "      <th>black_pct</th>\n",
       "      <th>hispanic_pct</th>\n",
       "      <th>white_pct</th>\n",
       "      <th>swd_pct</th>\n",
       "      <th>ell_pct</th>\n",
       "      <th>poverty_pct</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>3723</th>\n",
       "      <td>13K430</td>\n",
       "      <td>13</td>\n",
       "      <td>Brooklyn</td>\n",
       "      <td>Brooklyn Technical High School</td>\n",
       "      <td>5921</td>\n",
       "      <td>0.599</td>\n",
       "      <td>0.056</td>\n",
       "      <td>0.066</td>\n",
       "      <td>0.237</td>\n",
       "      <td>0.016</td>\n",
       "      <td>0.001</td>\n",
       "      <td>0.590</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5310</th>\n",
       "      <td>20K490</td>\n",
       "      <td>20</td>\n",
       "      <td>Brooklyn</td>\n",
       "      <td>Fort Hamilton High School</td>\n",
       "      <td>4678</td>\n",
       "      <td>0.290</td>\n",
       "      <td>0.025</td>\n",
       "      <td>0.317</td>\n",
       "      <td>0.347</td>\n",
       "      <td>0.153</td>\n",
       "      <td>0.162</td>\n",
       "      <td>0.706</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6686</th>\n",
       "      <td>26Q430</td>\n",
       "      <td>26</td>\n",
       "      <td>Queens</td>\n",
       "      <td>Francis Lewis High School</td>\n",
       "      <td>4424</td>\n",
       "      <td>0.577</td>\n",
       "      <td>0.047</td>\n",
       "      <td>0.210</td>\n",
       "      <td>0.150</td>\n",
       "      <td>0.150</td>\n",
       "      <td>0.115</td>\n",
       "      <td>0.690</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5802</th>\n",
       "      <td>22K405</td>\n",
       "      <td>22</td>\n",
       "      <td>Brooklyn</td>\n",
       "      <td>Midwood High School</td>\n",
       "      <td>4109</td>\n",
       "      <td>0.354</td>\n",
       "      <td>0.255</td>\n",
       "      <td>0.133</td>\n",
       "      <td>0.225</td>\n",
       "      <td>0.138</td>\n",
       "      <td>0.036</td>\n",
       "      <td>0.723</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5807</th>\n",
       "      <td>22K425</td>\n",
       "      <td>22</td>\n",
       "      <td>Brooklyn</td>\n",
       "      <td>James Madison High School</td>\n",
       "      <td>3851</td>\n",
       "      <td>0.209</td>\n",
       "      <td>0.128</td>\n",
       "      <td>0.175</td>\n",
       "      <td>0.472</td>\n",
       "      <td>0.154</td>\n",
       "      <td>0.121</td>\n",
       "      <td>0.758</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7279</th>\n",
       "      <td>28Q440</td>\n",
       "      <td>28</td>\n",
       "      <td>Queens</td>\n",
       "      <td>Forest Hills High School</td>\n",
       "      <td>3775</td>\n",
       "      <td>0.247</td>\n",
       "      <td>0.065</td>\n",
       "      <td>0.381</td>\n",
       "      <td>0.272</td>\n",
       "      <td>0.164</td>\n",
       "      <td>0.093</td>\n",
       "      <td>0.702</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8199</th>\n",
       "      <td>31R455</td>\n",
       "      <td>31</td>\n",
       "      <td>Staten Island</td>\n",
       "      <td>Tottenville High School</td>\n",
       "      <td>3726</td>\n",
       "      <td>0.072</td>\n",
       "      <td>0.014</td>\n",
       "      <td>0.132</td>\n",
       "      <td>0.761</td>\n",
       "      <td>0.227</td>\n",
       "      <td>0.023</td>\n",
       "      <td>0.416</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5557</th>\n",
       "      <td>21K525</td>\n",
       "      <td>21</td>\n",
       "      <td>Brooklyn</td>\n",
       "      <td>Edward R. Murrow High School</td>\n",
       "      <td>3691</td>\n",
       "      <td>0.274</td>\n",
       "      <td>0.176</td>\n",
       "      <td>0.193</td>\n",
       "      <td>0.308</td>\n",
       "      <td>0.178</td>\n",
       "      <td>0.125</td>\n",
       "      <td>0.670</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5300</th>\n",
       "      <td>20K445</td>\n",
       "      <td>20</td>\n",
       "      <td>Brooklyn</td>\n",
       "      <td>New Utrecht High School</td>\n",
       "      <td>3572</td>\n",
       "      <td>0.391</td>\n",
       "      <td>0.030</td>\n",
       "      <td>0.336</td>\n",
       "      <td>0.234</td>\n",
       "      <td>0.165</td>\n",
       "      <td>0.218</td>\n",
       "      <td>0.796</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6681</th>\n",
       "      <td>26Q415</td>\n",
       "      <td>26</td>\n",
       "      <td>Queens</td>\n",
       "      <td>Benjamin N. Cardozo High School</td>\n",
       "      <td>3405</td>\n",
       "      <td>0.423</td>\n",
       "      <td>0.214</td>\n",
       "      <td>0.223</td>\n",
       "      <td>0.120</td>\n",
       "      <td>0.145</td>\n",
       "      <td>0.051</td>\n",
       "      <td>0.668</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "         dbn  district           boro                      school_name  \\\n",
       "3723  13K430        13       Brooklyn   Brooklyn Technical High School   \n",
       "5310  20K490        20       Brooklyn        Fort Hamilton High School   \n",
       "6686  26Q430        26         Queens        Francis Lewis High School   \n",
       "5802  22K405        22       Brooklyn              Midwood High School   \n",
       "5807  22K425        22       Brooklyn        James Madison High School   \n",
       "7279  28Q440        28         Queens         Forest Hills High School   \n",
       "8199  31R455        31  Staten Island          Tottenville High School   \n",
       "5557  21K525        21       Brooklyn     Edward R. Murrow High School   \n",
       "5300  20K445        20       Brooklyn          New Utrecht High School   \n",
       "6681  26Q415        26         Queens  Benjamin N. Cardozo High School   \n",
       "\n",
       "      total_enrollment  asian_pct  black_pct  hispanic_pct  white_pct  \\\n",
       "3723              5921      0.599      0.056         0.066      0.237   \n",
       "5310              4678      0.290      0.025         0.317      0.347   \n",
       "6686              4424      0.577      0.047         0.210      0.150   \n",
       "5802              4109      0.354      0.255         0.133      0.225   \n",
       "5807              3851      0.209      0.128         0.175      0.472   \n",
       "7279              3775      0.247      0.065         0.381      0.272   \n",
       "8199              3726      0.072      0.014         0.132      0.761   \n",
       "5557              3691      0.274      0.176         0.193      0.308   \n",
       "5300              3572      0.391      0.030         0.336      0.234   \n",
       "6681              3405      0.423      0.214         0.223      0.120   \n",
       "\n",
       "      swd_pct  ell_pct  poverty_pct  \n",
       "3723    0.016    0.001        0.590  \n",
       "5310    0.153    0.162        0.706  \n",
       "6686    0.150    0.115        0.690  \n",
       "5802    0.138    0.036        0.723  \n",
       "5807    0.154    0.121        0.758  \n",
       "7279    0.164    0.093        0.702  \n",
       "8199    0.227    0.023        0.416  \n",
       "5557    0.178    0.125        0.670  \n",
       "5300    0.165    0.218        0.796  \n",
       "6681    0.145    0.051        0.668  "
      ]
     },
     "execution_count": 2,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# order the schools by enrollment in descending order\n",
    "# (biggest --> smallest)\n",
    "data = df.sort_values(\"total_enrollment\", ascending=False)\n",
    "\n",
    "# the 10 largest schools are now the first 10 rows\n",
    "data.head(10)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "2386fe42",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The largest school: 5921\n",
      "The smallest school: 7\n",
      "Avg (mean) school size: 560.79296875\n",
      "Avg (median) school size: 460.5\n",
      "Avg (mode, can return multiple values) school size: [479, 714]\n"
     ]
    }
   ],
   "source": [
    "# get just the total_enrollment column, called a Series in pandas\n",
    "enrollment = df[\"total_enrollment\"]\n",
    "\n",
    "# the range of school sizes\n",
    "print(\"The largest school:\", enrollment.max())\n",
    "print(\"The smallest school:\", enrollment.min())\n",
    "\n",
    "# three different kinds of \"average\"\n",
    "print(\"Avg (mean) school size:\", enrollment.mean())\n",
    "print(\"Avg (median) school size:\", enrollment.median())\n",
    "\n",
    "# mode() returns a Series because several values can tie for most common;\n",
    "# tolist() turns it into a list of plain Python numbers so it prints the\n",
    "# same way regardless of the installed NumPy version\n",
    "print(\"Avg (mode, can return multiple values) school size:\", enrollment.mode().tolist())"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "2cf28566",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>district</th>\n",
       "      <th>total_enrollment</th>\n",
       "      <th>asian_pct</th>\n",
       "      <th>black_pct</th>\n",
       "      <th>hispanic_pct</th>\n",
       "      <th>white_pct</th>\n",
       "      <th>swd_pct</th>\n",
       "      <th>ell_pct</th>\n",
       "      <th>poverty_pct</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>count</th>\n",
       "      <td>2048.00000</td>\n",
       "      <td>2048.000000</td>\n",
       "      <td>2048.000000</td>\n",
       "      <td>2048.000000</td>\n",
       "      <td>2048.000000</td>\n",
       "      <td>2048.000000</td>\n",
       "      <td>2048.000000</td>\n",
       "      <td>2048.000000</td>\n",
       "      <td>2048.000000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>mean</th>\n",
       "      <td>27.62207</td>\n",
       "      <td>560.792969</td>\n",
       "      <td>0.117710</td>\n",
       "      <td>0.302644</td>\n",
       "      <td>0.431721</td>\n",
       "      <td>0.118602</td>\n",
       "      <td>0.237641</td>\n",
       "      <td>0.141212</td>\n",
       "      <td>0.766560</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>std</th>\n",
       "      <td>26.68098</td>\n",
       "      <td>461.014510</td>\n",
       "      <td>0.166804</td>\n",
       "      <td>0.256375</td>\n",
       "      <td>0.246118</td>\n",
       "      <td>0.168041</td>\n",
       "      <td>0.160780</td>\n",
       "      <td>0.143127</td>\n",
       "      <td>0.194297</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>min</th>\n",
       "      <td>1.00000</td>\n",
       "      <td>7.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.015000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.000000</td>\n",
       "      <td>0.050000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25%</th>\n",
       "      <td>10.00000</td>\n",
       "      <td>304.000000</td>\n",
       "      <td>0.015000</td>\n",
       "      <td>0.081474</td>\n",
       "      <td>0.206000</td>\n",
       "      <td>0.016000</td>\n",
       "      <td>0.163000</td>\n",
       "      <td>0.049000</td>\n",
       "      <td>0.711000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50%</th>\n",
       "      <td>19.00000</td>\n",
       "      <td>460.500000</td>\n",
       "      <td>0.046000</td>\n",
       "      <td>0.245000</td>\n",
       "      <td>0.405000</td>\n",
       "      <td>0.036000</td>\n",
       "      <td>0.208000</td>\n",
       "      <td>0.100000</td>\n",
       "      <td>0.827000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>75%</th>\n",
       "      <td>30.00000</td>\n",
       "      <td>663.250000</td>\n",
       "      <td>0.148000</td>\n",
       "      <td>0.472250</td>\n",
       "      <td>0.631250</td>\n",
       "      <td>0.145250</td>\n",
       "      <td>0.261000</td>\n",
       "      <td>0.187250</td>\n",
       "      <td>0.903000</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>max</th>\n",
       "      <td>84.00000</td>\n",
       "      <td>5921.000000</td>\n",
       "      <td>0.926000</td>\n",
       "      <td>0.935000</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.945000</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.960000</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "         district  total_enrollment    asian_pct    black_pct  hispanic_pct  \\\n",
       "count  2048.00000       2048.000000  2048.000000  2048.000000   2048.000000   \n",
       "mean     27.62207        560.792969     0.117710     0.302644      0.431721   \n",
       "std      26.68098        461.014510     0.166804     0.256375      0.246118   \n",
       "min       1.00000          7.000000     0.000000     0.000000      0.015000   \n",
       "25%      10.00000        304.000000     0.015000     0.081474      0.206000   \n",
       "50%      19.00000        460.500000     0.046000     0.245000      0.405000   \n",
       "75%      30.00000        663.250000     0.148000     0.472250      0.631250   \n",
       "max      84.00000       5921.000000     0.926000     0.935000      1.000000   \n",
       "\n",
       "         white_pct      swd_pct      ell_pct  poverty_pct  \n",
       "count  2048.000000  2048.000000  2048.000000  2048.000000  \n",
       "mean      0.118602     0.237641     0.141212     0.766560  \n",
       "std       0.168041     0.160780     0.143127     0.194297  \n",
       "min       0.000000     0.000000     0.000000     0.050000  \n",
       "25%       0.016000     0.163000     0.049000     0.711000  \n",
       "50%       0.036000     0.208000     0.100000     0.827000  \n",
       "75%       0.145250     0.261000     0.187250     0.903000  \n",
       "max       0.945000     1.000000     1.000000     0.960000  "
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# describe() is built in to pandas: it calculates several descriptive statistics\n",
    "# for each numeric column in the data frame and returns them as a new data frame\n",
    "df.describe()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "ee9e8328",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "count    2048.000000\n",
       "mean        0.237641\n",
       "std         0.160780\n",
       "min         0.000000\n",
       "25%         0.163000\n",
       "50%         0.208000\n",
       "75%         0.261000\n",
       "max         1.000000\n",
       "Name: swd_pct, dtype: float64"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# describe() also works on a single column (a Series):\n",
    "df[\"swd_pct\"].describe()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "4cdd0f0d",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_4218/792112253.py:8: FutureWarning: The default value of numeric_only in DataFrame.corr is deprecated. In a future version, it will default to False. Select only valid columns or specify the value of numeric_only to silence this warning.\n",
      "  data.corr()\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>total_enrollment</th>\n",
       "      <th>asian_pct</th>\n",
       "      <th>black_pct</th>\n",
       "      <th>hispanic_pct</th>\n",
       "      <th>white_pct</th>\n",
       "      <th>swd_pct</th>\n",
       "      <th>ell_pct</th>\n",
       "      <th>poverty_pct</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>total_enrollment</th>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.350881</td>\n",
       "      <td>-0.242553</td>\n",
       "      <td>-0.111551</td>\n",
       "      <td>0.179056</td>\n",
       "      <td>-0.175962</td>\n",
       "      <td>-0.018582</td>\n",
       "      <td>-0.155614</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>asian_pct</th>\n",
       "      <td>0.350881</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>-0.452366</td>\n",
       "      <td>-0.370264</td>\n",
       "      <td>0.210809</td>\n",
       "      <td>-0.210489</td>\n",
       "      <td>0.138261</td>\n",
       "      <td>-0.287675</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>black_pct</th>\n",
       "      <td>-0.242553</td>\n",
       "      <td>-0.452366</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>-0.416505</td>\n",
       "      <td>-0.450801</td>\n",
       "      <td>0.138008</td>\n",
       "      <td>-0.362794</td>\n",
       "      <td>0.299685</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>hispanic_pct</th>\n",
       "      <td>-0.111551</td>\n",
       "      <td>-0.370264</td>\n",
       "      <td>-0.416505</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>-0.396739</td>\n",
       "      <td>0.070421</td>\n",
       "      <td>0.441878</td>\n",
       "      <td>0.490632</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>white_pct</th>\n",
       "      <td>0.179056</td>\n",
       "      <td>0.210809</td>\n",
       "      <td>-0.450801</td>\n",
       "      <td>-0.396739</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>-0.083534</td>\n",
       "      <td>-0.177996</td>\n",
       "      <td>-0.795595</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>swd_pct</th>\n",
       "      <td>-0.175962</td>\n",
       "      <td>-0.210489</td>\n",
       "      <td>0.138008</td>\n",
       "      <td>0.070421</td>\n",
       "      <td>-0.083534</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.000117</td>\n",
       "      <td>0.233832</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>ell_pct</th>\n",
       "      <td>-0.018582</td>\n",
       "      <td>0.138261</td>\n",
       "      <td>-0.362794</td>\n",
       "      <td>0.441878</td>\n",
       "      <td>-0.177996</td>\n",
       "      <td>0.000117</td>\n",
       "      <td>1.000000</td>\n",
       "      <td>0.359285</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>poverty_pct</th>\n",
       "      <td>-0.155614</td>\n",
       "      <td>-0.287675</td>\n",
       "      <td>0.299685</td>\n",
       "      <td>0.490632</td>\n",
       "      <td>-0.795595</td>\n",
       "      <td>0.233832</td>\n",
       "      <td>0.359285</td>\n",
       "      <td>1.000000</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                  total_enrollment  asian_pct  black_pct  hispanic_pct  \\\n",
       "total_enrollment          1.000000   0.350881  -0.242553     -0.111551   \n",
       "asian_pct                 0.350881   1.000000  -0.452366     -0.370264   \n",
       "black_pct                -0.242553  -0.452366   1.000000     -0.416505   \n",
       "hispanic_pct             -0.111551  -0.370264  -0.416505      1.000000   \n",
       "white_pct                 0.179056   0.210809  -0.450801     -0.396739   \n",
       "swd_pct                  -0.175962  -0.210489   0.138008      0.070421   \n",
       "ell_pct                  -0.018582   0.138261  -0.362794      0.441878   \n",
       "poverty_pct              -0.155614  -0.287675   0.299685      0.490632   \n",
       "\n",
       "                  white_pct   swd_pct   ell_pct  poverty_pct  \n",
       "total_enrollment   0.179056 -0.175962 -0.018582    -0.155614  \n",
       "asian_pct          0.210809 -0.210489  0.138261    -0.287675  \n",
       "black_pct         -0.450801  0.138008 -0.362794     0.299685  \n",
       "hispanic_pct      -0.396739  0.070421  0.441878     0.490632  \n",
       "white_pct          1.000000 -0.083534 -0.177996    -0.795595  \n",
       "swd_pct           -0.083534  1.000000  0.000117     0.233832  \n",
       "ell_pct           -0.177996  0.000117  1.000000     0.359285  \n",
       "poverty_pct       -0.795595  0.233832  0.359285     1.000000  "
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# we can also call the corr() method to show correlations between columns\n",
    "# we will take out \"district\" from this data because the district number\n",
    "# is categorical -- not the measure of a value\n",
    "\n",
    "# correlations close to 1 or -1 show high correlations;\n",
    "# the closer to zero, the less closely the columns are correlated\n",
    "data = df.drop(columns=[\"district\"])\n",
    "\n",
    "# numeric_only=True leaves out the text columns (dbn, boro, school_name);\n",
    "# relying on the default is deprecated and newer versions of pandas\n",
    "# no longer skip those columns automatically\n",
    "data.corr(numeric_only=True)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "2b796861",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/tmp/ipykernel_4218/143913075.py:3: FutureWarning: The default value of numeric_only in DataFrame.corr is deprecated. In a future version, it will default to False. Select only valid columns or specify the value of numeric_only to silence this warning.\n",
      "  corr = data.corr()\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<style type=\"text/css\">\n",
       "#T_3ecfa_row0_col0, #T_3ecfa_row1_col1, #T_3ecfa_row2_col2, #T_3ecfa_row3_col3, #T_3ecfa_row4_col4, #T_3ecfa_row5_col5, #T_3ecfa_row6_col6, #T_3ecfa_row7_col7 {\n",
       "  background-color: #b40426;\n",
       "  color: #f1f1f1;\n",
       "}\n",
       "#T_3ecfa_row0_col1 {\n",
       "  background-color: #ead5c9;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row0_col2 {\n",
       "  background-color: #6788ee;\n",
       "  color: #f1f1f1;\n",
       "}\n",
       "#T_3ecfa_row0_col3 {\n",
       "  background-color: #81a4fb;\n",
       "  color: #f1f1f1;\n",
       "}\n",
       "#T_3ecfa_row0_col4 {\n",
       "  background-color: #e7d7ce;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row0_col5 {\n",
       "  background-color: #4358cb;\n",
       "  color: #f1f1f1;\n",
       "}\n",
       "#T_3ecfa_row0_col6 {\n",
       "  background-color: #8db0fe;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row0_col7 {\n",
       "  background-color: #b2ccfb;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row1_col0 {\n",
       "  background-color: #d7dce3;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row1_col2, #T_3ecfa_row1_col5, #T_3ecfa_row2_col0, #T_3ecfa_row2_col1, #T_3ecfa_row2_col3, #T_3ecfa_row2_col6, #T_3ecfa_row4_col2, #T_3ecfa_row4_col7, #T_3ecfa_row7_col4 {\n",
       "  background-color: #3b4cc0;\n",
       "  color: #f1f1f1;\n",
       "}\n",
       "#T_3ecfa_row1_col3 {\n",
       "  background-color: #445acc;\n",
       "  color: #f1f1f1;\n",
       "}\n",
       "#T_3ecfa_row1_col4 {\n",
       "  background-color: #ebd3c6;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row1_col6 {\n",
       "  background-color: #b6cefa;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row1_col7 {\n",
       "  background-color: #98b9ff;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row2_col4 {\n",
       "  background-color: #799cf8;\n",
       "  color: #f1f1f1;\n",
       "}\n",
       "#T_3ecfa_row2_col5 {\n",
       "  background-color: #9abbff;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row2_col7 {\n",
       "  background-color: #f3c8b2;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row3_col0, #T_3ecfa_row4_col5 {\n",
       "  background-color: #5a78e4;\n",
       "  color: #f1f1f1;\n",
       "}\n",
       "#T_3ecfa_row3_col1 {\n",
       "  background-color: #4b64d5;\n",
       "  color: #f1f1f1;\n",
       "}\n",
       "#T_3ecfa_row3_col2 {\n",
       "  background-color: #4257c9;\n",
       "  color: #f1f1f1;\n",
       "}\n",
       "#T_3ecfa_row3_col4 {\n",
       "  background-color: #82a6fb;\n",
       "  color: #f1f1f1;\n",
       "}\n",
       "#T_3ecfa_row3_col5 {\n",
       "  background-color: #86a9fc;\n",
       "  color: #f1f1f1;\n",
       "}\n",
       "#T_3ecfa_row3_col6 {\n",
       "  background-color: #f1cdba;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row3_col7 {\n",
       "  background-color: #f7a688;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row4_col0 {\n",
       "  background-color: #abc8fd;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row4_col1 {\n",
       "  background-color: #d1dae9;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row4_col3 {\n",
       "  background-color: #3e51c5;\n",
       "  color: #f1f1f1;\n",
       "}\n",
       "#T_3ecfa_row4_col6 {\n",
       "  background-color: #6485ec;\n",
       "  color: #f1f1f1;\n",
       "}\n",
       "#T_3ecfa_row5_col0 {\n",
       "  background-color: #4a63d3;\n",
       "  color: #f1f1f1;\n",
       "}\n",
       "#T_3ecfa_row5_col1 {\n",
       "  background-color: #6f92f3;\n",
       "  color: #f1f1f1;\n",
       "}\n",
       "#T_3ecfa_row5_col2, #T_3ecfa_row6_col1 {\n",
       "  background-color: #c3d5f4;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row5_col3, #T_3ecfa_row6_col4 {\n",
       "  background-color: #aec9fc;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row5_col4 {\n",
       "  background-color: #bfd3f6;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row5_col6 {\n",
       "  background-color: #93b5fe;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row5_col7 {\n",
       "  background-color: #edd1c2;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row6_col0 {\n",
       "  background-color: #7597f6;\n",
       "  color: #f1f1f1;\n",
       "}\n",
       "#T_3ecfa_row6_col2 {\n",
       "  background-color: #4c66d6;\n",
       "  color: #f1f1f1;\n",
       "}\n",
       "#T_3ecfa_row6_col3 {\n",
       "  background-color: #f2c9b4;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row6_col5 {\n",
       "  background-color: #7295f4;\n",
       "  color: #f1f1f1;\n",
       "}\n",
       "#T_3ecfa_row6_col7 {\n",
       "  background-color: #f6bfa6;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row7_col0 {\n",
       "  background-color: #4f69d9;\n",
       "  color: #f1f1f1;\n",
       "}\n",
       "#T_3ecfa_row7_col1 {\n",
       "  background-color: #5e7de7;\n",
       "  color: #f1f1f1;\n",
       "}\n",
       "#T_3ecfa_row7_col2 {\n",
       "  background-color: #e1dad6;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row7_col3 {\n",
       "  background-color: #f5c0a7;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row7_col5 {\n",
       "  background-color: #b5cdfa;\n",
       "  color: #000000;\n",
       "}\n",
       "#T_3ecfa_row7_col6 {\n",
       "  background-color: #e4d9d2;\n",
       "  color: #000000;\n",
       "}\n",
       "</style>\n",
       "<table id=\"T_3ecfa\">\n",
       "  <thead>\n",
       "    <tr>\n",
       "      <th class=\"blank level0\" >&nbsp;</th>\n",
       "      <th id=\"T_3ecfa_level0_col0\" class=\"col_heading level0 col0\" >total_enrollment</th>\n",
       "      <th id=\"T_3ecfa_level0_col1\" class=\"col_heading level0 col1\" >asian_pct</th>\n",
       "      <th id=\"T_3ecfa_level0_col2\" class=\"col_heading level0 col2\" >black_pct</th>\n",
       "      <th id=\"T_3ecfa_level0_col3\" class=\"col_heading level0 col3\" >hispanic_pct</th>\n",
       "      <th id=\"T_3ecfa_level0_col4\" class=\"col_heading level0 col4\" >white_pct</th>\n",
       "      <th id=\"T_3ecfa_level0_col5\" class=\"col_heading level0 col5\" >swd_pct</th>\n",
       "      <th id=\"T_3ecfa_level0_col6\" class=\"col_heading level0 col6\" >ell_pct</th>\n",
       "      <th id=\"T_3ecfa_level0_col7\" class=\"col_heading level0 col7\" >poverty_pct</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th id=\"T_3ecfa_level0_row0\" class=\"row_heading level0 row0\" >total_enrollment</th>\n",
       "      <td id=\"T_3ecfa_row0_col0\" class=\"data row0 col0\" >1.000000</td>\n",
       "      <td id=\"T_3ecfa_row0_col1\" class=\"data row0 col1\" >0.350881</td>\n",
       "      <td id=\"T_3ecfa_row0_col2\" class=\"data row0 col2\" >-0.242553</td>\n",
       "      <td id=\"T_3ecfa_row0_col3\" class=\"data row0 col3\" >-0.111551</td>\n",
       "      <td id=\"T_3ecfa_row0_col4\" class=\"data row0 col4\" >0.179056</td>\n",
       "      <td id=\"T_3ecfa_row0_col5\" class=\"data row0 col5\" >-0.175962</td>\n",
       "      <td id=\"T_3ecfa_row0_col6\" class=\"data row0 col6\" >-0.018582</td>\n",
       "      <td id=\"T_3ecfa_row0_col7\" class=\"data row0 col7\" >-0.155614</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th id=\"T_3ecfa_level0_row1\" class=\"row_heading level0 row1\" >asian_pct</th>\n",
       "      <td id=\"T_3ecfa_row1_col0\" class=\"data row1 col0\" >0.350881</td>\n",
       "      <td id=\"T_3ecfa_row1_col1\" class=\"data row1 col1\" >1.000000</td>\n",
       "      <td id=\"T_3ecfa_row1_col2\" class=\"data row1 col2\" >-0.452366</td>\n",
       "      <td id=\"T_3ecfa_row1_col3\" class=\"data row1 col3\" >-0.370264</td>\n",
       "      <td id=\"T_3ecfa_row1_col4\" class=\"data row1 col4\" >0.210809</td>\n",
       "      <td id=\"T_3ecfa_row1_col5\" class=\"data row1 col5\" >-0.210489</td>\n",
       "      <td id=\"T_3ecfa_row1_col6\" class=\"data row1 col6\" >0.138261</td>\n",
       "      <td id=\"T_3ecfa_row1_col7\" class=\"data row1 col7\" >-0.287675</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th id=\"T_3ecfa_level0_row2\" class=\"row_heading level0 row2\" >black_pct</th>\n",
       "      <td id=\"T_3ecfa_row2_col0\" class=\"data row2 col0\" >-0.242553</td>\n",
       "      <td id=\"T_3ecfa_row2_col1\" class=\"data row2 col1\" >-0.452366</td>\n",
       "      <td id=\"T_3ecfa_row2_col2\" class=\"data row2 col2\" >1.000000</td>\n",
       "      <td id=\"T_3ecfa_row2_col3\" class=\"data row2 col3\" >-0.416505</td>\n",
       "      <td id=\"T_3ecfa_row2_col4\" class=\"data row2 col4\" >-0.450801</td>\n",
       "      <td id=\"T_3ecfa_row2_col5\" class=\"data row2 col5\" >0.138008</td>\n",
       "      <td id=\"T_3ecfa_row2_col6\" class=\"data row2 col6\" >-0.362794</td>\n",
       "      <td id=\"T_3ecfa_row2_col7\" class=\"data row2 col7\" >0.299685</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th id=\"T_3ecfa_level0_row3\" class=\"row_heading level0 row3\" >hispanic_pct</th>\n",
       "      <td id=\"T_3ecfa_row3_col0\" class=\"data row3 col0\" >-0.111551</td>\n",
       "      <td id=\"T_3ecfa_row3_col1\" class=\"data row3 col1\" >-0.370264</td>\n",
       "      <td id=\"T_3ecfa_row3_col2\" class=\"data row3 col2\" >-0.416505</td>\n",
       "      <td id=\"T_3ecfa_row3_col3\" class=\"data row3 col3\" >1.000000</td>\n",
       "      <td id=\"T_3ecfa_row3_col4\" class=\"data row3 col4\" >-0.396739</td>\n",
       "      <td id=\"T_3ecfa_row3_col5\" class=\"data row3 col5\" >0.070421</td>\n",
       "      <td id=\"T_3ecfa_row3_col6\" class=\"data row3 col6\" >0.441878</td>\n",
       "      <td id=\"T_3ecfa_row3_col7\" class=\"data row3 col7\" >0.490632</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th id=\"T_3ecfa_level0_row4\" class=\"row_heading level0 row4\" >white_pct</th>\n",
       "      <td id=\"T_3ecfa_row4_col0\" class=\"data row4 col0\" >0.179056</td>\n",
       "      <td id=\"T_3ecfa_row4_col1\" class=\"data row4 col1\" >0.210809</td>\n",
       "      <td id=\"T_3ecfa_row4_col2\" class=\"data row4 col2\" >-0.450801</td>\n",
       "      <td id=\"T_3ecfa_row4_col3\" class=\"data row4 col3\" >-0.396739</td>\n",
       "      <td id=\"T_3ecfa_row4_col4\" class=\"data row4 col4\" >1.000000</td>\n",
       "      <td id=\"T_3ecfa_row4_col5\" class=\"data row4 col5\" >-0.083534</td>\n",
       "      <td id=\"T_3ecfa_row4_col6\" class=\"data row4 col6\" >-0.177996</td>\n",
       "      <td id=\"T_3ecfa_row4_col7\" class=\"data row4 col7\" >-0.795595</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th id=\"T_3ecfa_level0_row5\" class=\"row_heading level0 row5\" >swd_pct</th>\n",
       "      <td id=\"T_3ecfa_row5_col0\" class=\"data row5 col0\" >-0.175962</td>\n",
       "      <td id=\"T_3ecfa_row5_col1\" class=\"data row5 col1\" >-0.210489</td>\n",
       "      <td id=\"T_3ecfa_row5_col2\" class=\"data row5 col2\" >0.138008</td>\n",
       "      <td id=\"T_3ecfa_row5_col3\" class=\"data row5 col3\" >0.070421</td>\n",
       "      <td id=\"T_3ecfa_row5_col4\" class=\"data row5 col4\" >-0.083534</td>\n",
       "      <td id=\"T_3ecfa_row5_col5\" class=\"data row5 col5\" >1.000000</td>\n",
       "      <td id=\"T_3ecfa_row5_col6\" class=\"data row5 col6\" >0.000117</td>\n",
       "      <td id=\"T_3ecfa_row5_col7\" class=\"data row5 col7\" >0.233832</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th id=\"T_3ecfa_level0_row6\" class=\"row_heading level0 row6\" >ell_pct</th>\n",
       "      <td id=\"T_3ecfa_row6_col0\" class=\"data row6 col0\" >-0.018582</td>\n",
       "      <td id=\"T_3ecfa_row6_col1\" class=\"data row6 col1\" >0.138261</td>\n",
       "      <td id=\"T_3ecfa_row6_col2\" class=\"data row6 col2\" >-0.362794</td>\n",
       "      <td id=\"T_3ecfa_row6_col3\" class=\"data row6 col3\" >0.441878</td>\n",
       "      <td id=\"T_3ecfa_row6_col4\" class=\"data row6 col4\" >-0.177996</td>\n",
       "      <td id=\"T_3ecfa_row6_col5\" class=\"data row6 col5\" >0.000117</td>\n",
       "      <td id=\"T_3ecfa_row6_col6\" class=\"data row6 col6\" >1.000000</td>\n",
       "      <td id=\"T_3ecfa_row6_col7\" class=\"data row6 col7\" >0.359285</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th id=\"T_3ecfa_level0_row7\" class=\"row_heading level0 row7\" >poverty_pct</th>\n",
       "      <td id=\"T_3ecfa_row7_col0\" class=\"data row7 col0\" >-0.155614</td>\n",
       "      <td id=\"T_3ecfa_row7_col1\" class=\"data row7 col1\" >-0.287675</td>\n",
       "      <td id=\"T_3ecfa_row7_col2\" class=\"data row7 col2\" >0.299685</td>\n",
       "      <td id=\"T_3ecfa_row7_col3\" class=\"data row7 col3\" >0.490632</td>\n",
       "      <td id=\"T_3ecfa_row7_col4\" class=\"data row7 col4\" >-0.795595</td>\n",
       "      <td id=\"T_3ecfa_row7_col5\" class=\"data row7 col5\" >0.233832</td>\n",
       "      <td id=\"T_3ecfa_row7_col6\" class=\"data row7 col6\" >0.359285</td>\n",
       "      <td id=\"T_3ecfa_row7_col7\" class=\"data row7 col7\" >1.000000</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n"
      ],
      "text/plain": [
       "<pandas.io.formats.style.Styler at 0x7fb5bc75efb0>"
      ]
     },
     "execution_count": 7,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# last, we can use styles to make the correlation table easier to read\n",
    "# note: you may need to re-run this cell to see the colors -- some static\n",
    "# notebook viewers show the saved output without the styling\n",
    "#\n",
    "# numeric_only=True restricts the correlation to the numeric columns; relying\n",
    "# on the default is deprecated (pandas emits a FutureWarning) and a future\n",
    "# pandas version defaults to False\n",
    "corr = data.corr(numeric_only=True)\n",
    "# a coolwarm color map shows values in a gradient; pinning vmin/vmax to the\n",
    "# full correlation range makes -1 the deepest blue and 1 the deepest red in\n",
    "# every column (by default each column is scaled to its own min and max, so\n",
    "# the same color would mean different values in different columns)\n",
    "corr.style.background_gradient(cmap='coolwarm', vmin=-1, vmax=1)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "school-data",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.6"
  },
  "vscode": {
   "interpreter": {
    "hash": "c853444e20c489e5b96d8e1a4533affead1d94f1ba40ff9ef08cffb9c8ee794e"
   }
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}