4555 lines
470 KiB
Plaintext
4555 lines
470 KiB
Plaintext
|
{
|
|||
|
"cells": [
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"# 1. Основные возможности работы с библиотекой pandas"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 27,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [],
|
|||
|
"source": [
|
|||
|
"import pandas as pd"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"## Загрузка и сохранение данных"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 28,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [],
|
|||
|
"source": [
|
|||
|
"df = pd.read_csv(\"./datasets/2022/heart_2022_no_nans.csv\")"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 58,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"text/html": [
|
|||
|
"<div>\n",
|
|||
|
"<style scoped>\n",
|
|||
|
" .dataframe tbody tr th:only-of-type {\n",
|
|||
|
" vertical-align: middle;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe tbody tr th {\n",
|
|||
|
" vertical-align: top;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe thead th {\n",
|
|||
|
" text-align: right;\n",
|
|||
|
" }\n",
|
|||
|
"</style>\n",
|
|||
|
"<table border=\"1\" class=\"dataframe\">\n",
|
|||
|
" <thead>\n",
|
|||
|
" <tr style=\"text-align: right;\">\n",
|
|||
|
" <th></th>\n",
|
|||
|
" <th>State</th>\n",
|
|||
|
" <th>Sex</th>\n",
|
|||
|
" <th>GeneralHealth</th>\n",
|
|||
|
" <th>PhysicalHealthDays</th>\n",
|
|||
|
" <th>MentalHealthDays</th>\n",
|
|||
|
" <th>LastCheckupTime</th>\n",
|
|||
|
" <th>PhysicalActivities</th>\n",
|
|||
|
" <th>SleepHours</th>\n",
|
|||
|
" <th>RemovedTeeth</th>\n",
|
|||
|
" <th>HadHeartAttack</th>\n",
|
|||
|
" <th>...</th>\n",
|
|||
|
" <th>WeightInKilograms</th>\n",
|
|||
|
" <th>BMI</th>\n",
|
|||
|
" <th>AlcoholDrinkers</th>\n",
|
|||
|
" <th>HIVTesting</th>\n",
|
|||
|
" <th>FluVaxLast12</th>\n",
|
|||
|
" <th>PneumoVaxEver</th>\n",
|
|||
|
" <th>TetanusLast10Tdap</th>\n",
|
|||
|
" <th>HighRiskLastYear</th>\n",
|
|||
|
" <th>CovidPos</th>\n",
|
|||
|
" <th>SleepHours-HeightInMeters</th>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </thead>\n",
|
|||
|
" <tbody>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246012</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Fair</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>30.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>4.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>117.93</td>\n",
|
|||
|
" <td>33.38</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>2.12</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246013</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Excellent</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>4.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>49.90</td>\n",
|
|||
|
" <td>18.30</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>2.35</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246014</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>12.0</td>\n",
|
|||
|
" <td>1 to 5</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>52.16</td>\n",
|
|||
|
" <td>19.14</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes, received Tdap</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>10.35</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246015</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>1 to 5</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>77.11</td>\n",
|
|||
|
" <td>28.29</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>5.35</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246016</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>6.0</td>\n",
|
|||
|
" <td>1 to 5</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>118.84</td>\n",
|
|||
|
" <td>36.54</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>4.20</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246017</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past 2 years (1 year but less than 2 ye...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>6.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>102.06</td>\n",
|
|||
|
" <td>32.28</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>4.22</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246018</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Fair</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>90.72</td>\n",
|
|||
|
" <td>24.34</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>5.07</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246019</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>15.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>1 to 5</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>83.91</td>\n",
|
|||
|
" <td>29.86</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>5.32</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246020</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Excellent</td>\n",
|
|||
|
" <td>2.0</td>\n",
|
|||
|
" <td>2.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>83.01</td>\n",
|
|||
|
" <td>28.66</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>5.30</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246021</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>5.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>108.86</td>\n",
|
|||
|
" <td>32.55</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>3.17</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </tbody>\n",
|
|||
|
"</table>\n",
|
|||
|
"<p>10 rows × 41 columns</p>\n",
|
|||
|
"</div>"
|
|||
|
],
|
|||
|
"text/plain": [
|
|||
|
" State Sex GeneralHealth PhysicalHealthDays \\\n",
|
|||
|
"246012 Virgin Islands Male Fair 7.0 \n",
|
|||
|
"246013 Virgin Islands Male Excellent 0.0 \n",
|
|||
|
"246014 Virgin Islands Female Good 0.0 \n",
|
|||
|
"246015 Virgin Islands Female Very good 0.0 \n",
|
|||
|
"246016 Virgin Islands Male Good 0.0 \n",
|
|||
|
"246017 Virgin Islands Male Very good 0.0 \n",
|
|||
|
"246018 Virgin Islands Female Fair 0.0 \n",
|
|||
|
"246019 Virgin Islands Male Good 0.0 \n",
|
|||
|
"246020 Virgin Islands Female Excellent 2.0 \n",
|
|||
|
"246021 Virgin Islands Male Very good 0.0 \n",
|
|||
|
"\n",
|
|||
|
" MentalHealthDays LastCheckupTime \\\n",
|
|||
|
"246012 30.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246013 7.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246014 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246015 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246016 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246017 0.0 Within past 2 years (1 year but less than 2 ye... \n",
|
|||
|
"246018 7.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246019 15.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246020 2.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246021 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"\n",
|
|||
|
" PhysicalActivities SleepHours RemovedTeeth HadHeartAttack ... \\\n",
|
|||
|
"246012 No 4.0 None of them Yes ... \n",
|
|||
|
"246013 No 4.0 None of them No ... \n",
|
|||
|
"246014 Yes 12.0 1 to 5 No ... \n",
|
|||
|
"246015 Yes 7.0 1 to 5 No ... \n",
|
|||
|
"246016 No 6.0 1 to 5 Yes ... \n",
|
|||
|
"246017 Yes 6.0 None of them No ... \n",
|
|||
|
"246018 Yes 7.0 None of them No ... \n",
|
|||
|
"246019 Yes 7.0 1 to 5 No ... \n",
|
|||
|
"246020 Yes 7.0 None of them No ... \n",
|
|||
|
"246021 No 5.0 None of them Yes ... \n",
|
|||
|
"\n",
|
|||
|
" WeightInKilograms BMI AlcoholDrinkers HIVTesting FluVaxLast12 \\\n",
|
|||
|
"246012 117.93 33.38 Yes Yes No \n",
|
|||
|
"246013 49.90 18.30 Yes No No \n",
|
|||
|
"246014 52.16 19.14 No No No \n",
|
|||
|
"246015 77.11 28.29 Yes Yes No \n",
|
|||
|
"246016 118.84 36.54 Yes Yes Yes \n",
|
|||
|
"246017 102.06 32.28 Yes No No \n",
|
|||
|
"246018 90.72 24.34 No No No \n",
|
|||
|
"246019 83.91 29.86 Yes Yes Yes \n",
|
|||
|
"246020 83.01 28.66 No Yes Yes \n",
|
|||
|
"246021 108.86 32.55 No Yes Yes \n",
|
|||
|
"\n",
|
|||
|
" PneumoVaxEver TetanusLast10Tdap \\\n",
|
|||
|
"246012 No No, did not receive any tetanus shot in the pa... \n",
|
|||
|
"246013 No No, did not receive any tetanus shot in the pa... \n",
|
|||
|
"246014 Yes Yes, received Tdap \n",
|
|||
|
"246015 No No, did not receive any tetanus shot in the pa... \n",
|
|||
|
"246016 No Yes, received tetanus shot but not sure what type \n",
|
|||
|
"246017 No Yes, received tetanus shot but not sure what type \n",
|
|||
|
"246018 No No, did not receive any tetanus shot in the pa... \n",
|
|||
|
"246019 Yes Yes, received tetanus shot but not sure what type \n",
|
|||
|
"246020 No Yes, received tetanus shot but not sure what type \n",
|
|||
|
"246021 Yes No, did not receive any tetanus shot in the pa... \n",
|
|||
|
"\n",
|
|||
|
" HighRiskLastYear CovidPos SleepHours-HeightInMeters \n",
|
|||
|
"246012 No Yes 2.12 \n",
|
|||
|
"246013 No No 2.35 \n",
|
|||
|
"246014 No No 10.35 \n",
|
|||
|
"246015 No No 5.35 \n",
|
|||
|
"246016 No No 4.20 \n",
|
|||
|
"246017 No No 4.22 \n",
|
|||
|
"246018 No Yes 5.07 \n",
|
|||
|
"246019 No Yes 5.32 \n",
|
|||
|
"246020 No No 5.30 \n",
|
|||
|
"246021 No Yes 3.17 \n",
|
|||
|
"\n",
|
|||
|
"[10 rows x 41 columns]"
|
|||
|
]
|
|||
|
},
|
|||
|
"execution_count": 58,
|
|||
|
"metadata": {},
|
|||
|
"output_type": "execute_result"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"df.tail(10)"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 57,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"text/html": [
|
|||
|
"<div>\n",
|
|||
|
"<style scoped>\n",
|
|||
|
" .dataframe tbody tr th:only-of-type {\n",
|
|||
|
" vertical-align: middle;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe tbody tr th {\n",
|
|||
|
" vertical-align: top;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe thead th {\n",
|
|||
|
" text-align: right;\n",
|
|||
|
" }\n",
|
|||
|
"</style>\n",
|
|||
|
"<table border=\"1\" class=\"dataframe\">\n",
|
|||
|
" <thead>\n",
|
|||
|
" <tr style=\"text-align: right;\">\n",
|
|||
|
" <th></th>\n",
|
|||
|
" <th>State</th>\n",
|
|||
|
" <th>Sex</th>\n",
|
|||
|
" <th>GeneralHealth</th>\n",
|
|||
|
" <th>PhysicalHealthDays</th>\n",
|
|||
|
" <th>MentalHealthDays</th>\n",
|
|||
|
" <th>LastCheckupTime</th>\n",
|
|||
|
" <th>PhysicalActivities</th>\n",
|
|||
|
" <th>SleepHours</th>\n",
|
|||
|
" <th>RemovedTeeth</th>\n",
|
|||
|
" <th>HadHeartAttack</th>\n",
|
|||
|
" <th>...</th>\n",
|
|||
|
" <th>WeightInKilograms</th>\n",
|
|||
|
" <th>BMI</th>\n",
|
|||
|
" <th>AlcoholDrinkers</th>\n",
|
|||
|
" <th>HIVTesting</th>\n",
|
|||
|
" <th>FluVaxLast12</th>\n",
|
|||
|
" <th>PneumoVaxEver</th>\n",
|
|||
|
" <th>TetanusLast10Tdap</th>\n",
|
|||
|
" <th>HighRiskLastYear</th>\n",
|
|||
|
" <th>CovidPos</th>\n",
|
|||
|
" <th>SleepHours-HeightInMeters</th>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </thead>\n",
|
|||
|
" <tbody>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>0</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>4.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>9.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>71.67</td>\n",
|
|||
|
" <td>27.99</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes, received Tdap</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>7.40</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>1</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>6.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>95.25</td>\n",
|
|||
|
" <td>30.13</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>4.22</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>2</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>8.0</td>\n",
|
|||
|
" <td>6 or more, but not all</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>108.86</td>\n",
|
|||
|
" <td>31.66</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>6.15</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>3</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Fair</td>\n",
|
|||
|
" <td>5.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>9.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>90.72</td>\n",
|
|||
|
" <td>31.32</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.30</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>4</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>3.0</td>\n",
|
|||
|
" <td>15.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>5.0</td>\n",
|
|||
|
" <td>1 to 5</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>79.38</td>\n",
|
|||
|
" <td>33.07</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>3.45</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>5</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>120.20</td>\n",
|
|||
|
" <td>34.96</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>5.15</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>6</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>3.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>8.0</td>\n",
|
|||
|
" <td>6 or more, but not all</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>88.00</td>\n",
|
|||
|
" <td>33.30</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>6.37</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>7</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Fair</td>\n",
|
|||
|
" <td>5.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>8.0</td>\n",
|
|||
|
" <td>1 to 5</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>74.84</td>\n",
|
|||
|
" <td>24.37</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>6.25</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>8</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>2.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>5 or more years ago</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>6.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>78.02</td>\n",
|
|||
|
" <td>26.94</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>4.30</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>9</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>63.50</td>\n",
|
|||
|
" <td>22.60</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>5.32</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </tbody>\n",
|
|||
|
"</table>\n",
|
|||
|
"<p>10 rows × 41 columns</p>\n",
|
|||
|
"</div>"
|
|||
|
],
|
|||
|
"text/plain": [
|
|||
|
" State Sex GeneralHealth PhysicalHealthDays MentalHealthDays \\\n",
|
|||
|
"0 Alabama Female Very good 4.0 0.0 \n",
|
|||
|
"1 Alabama Male Very good 0.0 0.0 \n",
|
|||
|
"2 Alabama Male Very good 0.0 0.0 \n",
|
|||
|
"3 Alabama Female Fair 5.0 0.0 \n",
|
|||
|
"4 Alabama Female Good 3.0 15.0 \n",
|
|||
|
"5 Alabama Male Good 0.0 0.0 \n",
|
|||
|
"6 Alabama Female Good 3.0 0.0 \n",
|
|||
|
"7 Alabama Male Fair 5.0 0.0 \n",
|
|||
|
"8 Alabama Male Good 2.0 0.0 \n",
|
|||
|
"9 Alabama Female Very good 0.0 0.0 \n",
|
|||
|
"\n",
|
|||
|
" LastCheckupTime PhysicalActivities \\\n",
|
|||
|
"0 Within past year (anytime less than 12 months ... Yes \n",
|
|||
|
"1 Within past year (anytime less than 12 months ... Yes \n",
|
|||
|
"2 Within past year (anytime less than 12 months ... No \n",
|
|||
|
"3 Within past year (anytime less than 12 months ... Yes \n",
|
|||
|
"4 Within past year (anytime less than 12 months ... Yes \n",
|
|||
|
"5 Within past year (anytime less than 12 months ... Yes \n",
|
|||
|
"6 Within past year (anytime less than 12 months ... Yes \n",
|
|||
|
"7 Within past year (anytime less than 12 months ... Yes \n",
|
|||
|
"8 5 or more years ago No \n",
|
|||
|
"9 Within past year (anytime less than 12 months ... Yes \n",
|
|||
|
"\n",
|
|||
|
" SleepHours RemovedTeeth HadHeartAttack ... WeightInKilograms \\\n",
|
|||
|
"0 9.0 None of them No ... 71.67 \n",
|
|||
|
"1 6.0 None of them No ... 95.25 \n",
|
|||
|
"2 8.0 6 or more, but not all No ... 108.86 \n",
|
|||
|
"3 9.0 None of them No ... 90.72 \n",
|
|||
|
"4 5.0 1 to 5 No ... 79.38 \n",
|
|||
|
"5 7.0 None of them No ... 120.20 \n",
|
|||
|
"6 8.0 6 or more, but not all No ... 88.00 \n",
|
|||
|
"7 8.0 1 to 5 Yes ... 74.84 \n",
|
|||
|
"8 6.0 None of them No ... 78.02 \n",
|
|||
|
"9 7.0 None of them No ... 63.50 \n",
|
|||
|
"\n",
|
|||
|
" BMI AlcoholDrinkers HIVTesting FluVaxLast12 PneumoVaxEver \\\n",
|
|||
|
"0 27.99 No No Yes Yes \n",
|
|||
|
"1 30.13 No No Yes Yes \n",
|
|||
|
"2 31.66 Yes No No Yes \n",
|
|||
|
"3 31.32 No No Yes Yes \n",
|
|||
|
"4 33.07 No No Yes Yes \n",
|
|||
|
"5 34.96 Yes Yes Yes No \n",
|
|||
|
"6 33.30 No No Yes Yes \n",
|
|||
|
"7 24.37 No Yes Yes Yes \n",
|
|||
|
"8 26.94 No No No No \n",
|
|||
|
"9 22.60 No No Yes Yes \n",
|
|||
|
"\n",
|
|||
|
" TetanusLast10Tdap HighRiskLastYear \\\n",
|
|||
|
"0 Yes, received Tdap No \n",
|
|||
|
"1 Yes, received tetanus shot but not sure what type No \n",
|
|||
|
"2 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"3 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"4 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"5 Yes, received tetanus shot but not sure what type No \n",
|
|||
|
"6 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"7 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"8 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"9 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"\n",
|
|||
|
" CovidPos SleepHours-HeightInMeters \n",
|
|||
|
"0 No 7.40 \n",
|
|||
|
"1 No 4.22 \n",
|
|||
|
"2 Yes 6.15 \n",
|
|||
|
"3 Yes 7.30 \n",
|
|||
|
"4 No 3.45 \n",
|
|||
|
"5 No 5.15 \n",
|
|||
|
"6 No 6.37 \n",
|
|||
|
"7 Yes 6.25 \n",
|
|||
|
"8 Yes 4.30 \n",
|
|||
|
"9 No 5.32 \n",
|
|||
|
"\n",
|
|||
|
"[10 rows x 41 columns]"
|
|||
|
]
|
|||
|
},
|
|||
|
"execution_count": 57,
|
|||
|
"metadata": {},
|
|||
|
"output_type": "execute_result"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"df.head(10)"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 30,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [],
|
|||
|
"source": [
|
|||
|
"df.to_csv(\"new.csv\", index=False)"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"## Получение сведений о датафрейме с данными"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 31,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"text/html": [
|
|||
|
"<div>\n",
|
|||
|
"<style scoped>\n",
|
|||
|
" .dataframe tbody tr th:only-of-type {\n",
|
|||
|
" vertical-align: middle;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe tbody tr th {\n",
|
|||
|
" vertical-align: top;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe thead th {\n",
|
|||
|
" text-align: right;\n",
|
|||
|
" }\n",
|
|||
|
"</style>\n",
|
|||
|
"<table border=\"1\" class=\"dataframe\">\n",
|
|||
|
" <thead>\n",
|
|||
|
" <tr style=\"text-align: right;\">\n",
|
|||
|
" <th></th>\n",
|
|||
|
" <th>PhysicalHealthDays</th>\n",
|
|||
|
" <th>MentalHealthDays</th>\n",
|
|||
|
" <th>SleepHours</th>\n",
|
|||
|
" <th>HeightInMeters</th>\n",
|
|||
|
" <th>WeightInKilograms</th>\n",
|
|||
|
" <th>BMI</th>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </thead>\n",
|
|||
|
" <tbody>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>count</th>\n",
|
|||
|
" <td>246022.000000</td>\n",
|
|||
|
" <td>246022.000000</td>\n",
|
|||
|
" <td>246022.000000</td>\n",
|
|||
|
" <td>246022.000000</td>\n",
|
|||
|
" <td>246022.000000</td>\n",
|
|||
|
" <td>246022.000000</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>mean</th>\n",
|
|||
|
" <td>4.119026</td>\n",
|
|||
|
" <td>4.167140</td>\n",
|
|||
|
" <td>7.021331</td>\n",
|
|||
|
" <td>1.705150</td>\n",
|
|||
|
" <td>83.615179</td>\n",
|
|||
|
" <td>28.668136</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>std</th>\n",
|
|||
|
" <td>8.405844</td>\n",
|
|||
|
" <td>8.102687</td>\n",
|
|||
|
" <td>1.440681</td>\n",
|
|||
|
" <td>0.106654</td>\n",
|
|||
|
" <td>21.323156</td>\n",
|
|||
|
" <td>6.513973</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>min</th>\n",
|
|||
|
" <td>0.000000</td>\n",
|
|||
|
" <td>0.000000</td>\n",
|
|||
|
" <td>1.000000</td>\n",
|
|||
|
" <td>0.910000</td>\n",
|
|||
|
" <td>28.120000</td>\n",
|
|||
|
" <td>12.020000</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>25%</th>\n",
|
|||
|
" <td>0.000000</td>\n",
|
|||
|
" <td>0.000000</td>\n",
|
|||
|
" <td>6.000000</td>\n",
|
|||
|
" <td>1.630000</td>\n",
|
|||
|
" <td>68.040000</td>\n",
|
|||
|
" <td>24.270000</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>50%</th>\n",
|
|||
|
" <td>0.000000</td>\n",
|
|||
|
" <td>0.000000</td>\n",
|
|||
|
" <td>7.000000</td>\n",
|
|||
|
" <td>1.700000</td>\n",
|
|||
|
" <td>81.650000</td>\n",
|
|||
|
" <td>27.460000</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>75%</th>\n",
|
|||
|
" <td>3.000000</td>\n",
|
|||
|
" <td>4.000000</td>\n",
|
|||
|
" <td>8.000000</td>\n",
|
|||
|
" <td>1.780000</td>\n",
|
|||
|
" <td>95.250000</td>\n",
|
|||
|
" <td>31.890000</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>max</th>\n",
|
|||
|
" <td>30.000000</td>\n",
|
|||
|
" <td>30.000000</td>\n",
|
|||
|
" <td>24.000000</td>\n",
|
|||
|
" <td>2.410000</td>\n",
|
|||
|
" <td>292.570000</td>\n",
|
|||
|
" <td>97.650000</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </tbody>\n",
|
|||
|
"</table>\n",
|
|||
|
"</div>"
|
|||
|
],
|
|||
|
"text/plain": [
|
|||
|
" PhysicalHealthDays MentalHealthDays SleepHours HeightInMeters \\\n",
|
|||
|
"count 246022.000000 246022.000000 246022.000000 246022.000000 \n",
|
|||
|
"mean 4.119026 4.167140 7.021331 1.705150 \n",
|
|||
|
"std 8.405844 8.102687 1.440681 0.106654 \n",
|
|||
|
"min 0.000000 0.000000 1.000000 0.910000 \n",
|
|||
|
"25% 0.000000 0.000000 6.000000 1.630000 \n",
|
|||
|
"50% 0.000000 0.000000 7.000000 1.700000 \n",
|
|||
|
"75% 3.000000 4.000000 8.000000 1.780000 \n",
|
|||
|
"max 30.000000 30.000000 24.000000 2.410000 \n",
|
|||
|
"\n",
|
|||
|
" WeightInKilograms BMI \n",
|
|||
|
"count 246022.000000 246022.000000 \n",
|
|||
|
"mean 83.615179 28.668136 \n",
|
|||
|
"std 21.323156 6.513973 \n",
|
|||
|
"min 28.120000 12.020000 \n",
|
|||
|
"25% 68.040000 24.270000 \n",
|
|||
|
"50% 81.650000 27.460000 \n",
|
|||
|
"75% 95.250000 31.890000 \n",
|
|||
|
"max 292.570000 97.650000 "
|
|||
|
]
|
|||
|
},
|
|||
|
"execution_count": 31,
|
|||
|
"metadata": {},
|
|||
|
"output_type": "execute_result"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"df.describe()"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 32,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"name": "stdout",
|
|||
|
"output_type": "stream",
|
|||
|
"text": [
|
|||
|
"<class 'pandas.core.frame.DataFrame'>\n",
|
|||
|
"RangeIndex: 246022 entries, 0 to 246021\n",
|
|||
|
"Data columns (total 40 columns):\n",
|
|||
|
" # Column Non-Null Count Dtype \n",
|
|||
|
"--- ------ -------------- ----- \n",
|
|||
|
" 0 State 246022 non-null object \n",
|
|||
|
" 1 Sex 246022 non-null object \n",
|
|||
|
" 2 GeneralHealth 246022 non-null object \n",
|
|||
|
" 3 PhysicalHealthDays 246022 non-null float64\n",
|
|||
|
" 4 MentalHealthDays 246022 non-null float64\n",
|
|||
|
" 5 LastCheckupTime 246022 non-null object \n",
|
|||
|
" 6 PhysicalActivities 246022 non-null object \n",
|
|||
|
" 7 SleepHours 246022 non-null float64\n",
|
|||
|
" 8 RemovedTeeth 246022 non-null object \n",
|
|||
|
" 9 HadHeartAttack 246022 non-null object \n",
|
|||
|
" 10 HadAngina 246022 non-null object \n",
|
|||
|
" 11 HadStroke 246022 non-null object \n",
|
|||
|
" 12 HadAsthma 246022 non-null object \n",
|
|||
|
" 13 HadSkinCancer 246022 non-null object \n",
|
|||
|
" 14 HadCOPD 246022 non-null object \n",
|
|||
|
" 15 HadDepressiveDisorder 246022 non-null object \n",
|
|||
|
" 16 HadKidneyDisease 246022 non-null object \n",
|
|||
|
" 17 HadArthritis 246022 non-null object \n",
|
|||
|
" 18 HadDiabetes 246022 non-null object \n",
|
|||
|
" 19 DeafOrHardOfHearing 246022 non-null object \n",
|
|||
|
" 20 BlindOrVisionDifficulty 246022 non-null object \n",
|
|||
|
" 21 DifficultyConcentrating 246022 non-null object \n",
|
|||
|
" 22 DifficultyWalking 246022 non-null object \n",
|
|||
|
" 23 DifficultyDressingBathing 246022 non-null object \n",
|
|||
|
" 24 DifficultyErrands 246022 non-null object \n",
|
|||
|
" 25 SmokerStatus 246022 non-null object \n",
|
|||
|
" 26 ECigaretteUsage 246022 non-null object \n",
|
|||
|
" 27 ChestScan 246022 non-null object \n",
|
|||
|
" 28 RaceEthnicityCategory 246022 non-null object \n",
|
|||
|
" 29 AgeCategory 246022 non-null object \n",
|
|||
|
" 30 HeightInMeters 246022 non-null float64\n",
|
|||
|
" 31 WeightInKilograms 246022 non-null float64\n",
|
|||
|
" 32 BMI 246022 non-null float64\n",
|
|||
|
" 33 AlcoholDrinkers 246022 non-null object \n",
|
|||
|
" 34 HIVTesting 246022 non-null object \n",
|
|||
|
" 35 FluVaxLast12 246022 non-null object \n",
|
|||
|
" 36 PneumoVaxEver 246022 non-null object \n",
|
|||
|
" 37 TetanusLast10Tdap 246022 non-null object \n",
|
|||
|
" 38 HighRiskLastYear 246022 non-null object \n",
|
|||
|
" 39 CovidPos 246022 non-null object \n",
|
|||
|
"dtypes: float64(6), object(34)\n",
|
|||
|
"memory usage: 75.1+ MB\n"
|
|||
|
]
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"df.info()"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"Получение сведений о колонках датафрейма"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 33,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"text/plain": [
|
|||
|
"Index(['State', 'Sex', 'GeneralHealth', 'PhysicalHealthDays',\n",
|
|||
|
" 'MentalHealthDays', 'LastCheckupTime', 'PhysicalActivities',\n",
|
|||
|
" 'SleepHours', 'RemovedTeeth', 'HadHeartAttack', 'HadAngina',\n",
|
|||
|
" 'HadStroke', 'HadAsthma', 'HadSkinCancer', 'HadCOPD',\n",
|
|||
|
" 'HadDepressiveDisorder', 'HadKidneyDisease', 'HadArthritis',\n",
|
|||
|
" 'HadDiabetes', 'DeafOrHardOfHearing', 'BlindOrVisionDifficulty',\n",
|
|||
|
" 'DifficultyConcentrating', 'DifficultyWalking',\n",
|
|||
|
" 'DifficultyDressingBathing', 'DifficultyErrands', 'SmokerStatus',\n",
|
|||
|
" 'ECigaretteUsage', 'ChestScan', 'RaceEthnicityCategory', 'AgeCategory',\n",
|
|||
|
" 'HeightInMeters', 'WeightInKilograms', 'BMI', 'AlcoholDrinkers',\n",
|
|||
|
" 'HIVTesting', 'FluVaxLast12', 'PneumoVaxEver', 'TetanusLast10Tdap',\n",
|
|||
|
" 'HighRiskLastYear', 'CovidPos'],\n",
|
|||
|
" dtype='object')"
|
|||
|
]
|
|||
|
},
|
|||
|
"execution_count": 33,
|
|||
|
"metadata": {},
|
|||
|
"output_type": "execute_result"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"df.columns"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"Вывод отдельных строк и столбцов из датафрейма"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 34,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"text/html": [
|
|||
|
"<div>\n",
|
|||
|
"<style scoped>\n",
|
|||
|
" .dataframe tbody tr th:only-of-type {\n",
|
|||
|
" vertical-align: middle;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe tbody tr th {\n",
|
|||
|
" vertical-align: top;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe thead th {\n",
|
|||
|
" text-align: right;\n",
|
|||
|
" }\n",
|
|||
|
"</style>\n",
|
|||
|
"<table border=\"1\" class=\"dataframe\">\n",
|
|||
|
" <thead>\n",
|
|||
|
" <tr style=\"text-align: right;\">\n",
|
|||
|
" <th></th>\n",
|
|||
|
" <th>Sex</th>\n",
|
|||
|
" <th>HadHeartAttack</th>\n",
|
|||
|
" <th>WeightInKilograms</th>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </thead>\n",
|
|||
|
" <tbody>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>0</th>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>71.67</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>1</th>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>95.25</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>2</th>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>108.86</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>3</th>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>90.72</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>4</th>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>79.38</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>...</th>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246017</th>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>102.06</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246018</th>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>90.72</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246019</th>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>83.91</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246020</th>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>83.01</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246021</th>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>108.86</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </tbody>\n",
|
|||
|
"</table>\n",
|
|||
|
"<p>246022 rows × 3 columns</p>\n",
|
|||
|
"</div>"
|
|||
|
],
|
|||
|
"text/plain": [
|
|||
|
" Sex HadHeartAttack WeightInKilograms\n",
|
|||
|
"0 Female No 71.67\n",
|
|||
|
"1 Male No 95.25\n",
|
|||
|
"2 Male No 108.86\n",
|
|||
|
"3 Female No 90.72\n",
|
|||
|
"4 Female No 79.38\n",
|
|||
|
"... ... ... ...\n",
|
|||
|
"246017 Male No 102.06\n",
|
|||
|
"246018 Female No 90.72\n",
|
|||
|
"246019 Male No 83.91\n",
|
|||
|
"246020 Female No 83.01\n",
|
|||
|
"246021 Male Yes 108.86\n",
|
|||
|
"\n",
|
|||
|
"[246022 rows x 3 columns]"
|
|||
|
]
|
|||
|
},
|
|||
|
"execution_count": 34,
|
|||
|
"metadata": {},
|
|||
|
"output_type": "execute_result"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"df[[\"Sex\", \"HadHeartAttack\", \"WeightInKilograms\"]]"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 35,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"text/html": [
|
|||
|
"<div>\n",
|
|||
|
"<style scoped>\n",
|
|||
|
" .dataframe tbody tr th:only-of-type {\n",
|
|||
|
" vertical-align: middle;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe tbody tr th {\n",
|
|||
|
" vertical-align: top;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe thead th {\n",
|
|||
|
" text-align: right;\n",
|
|||
|
" }\n",
|
|||
|
"</style>\n",
|
|||
|
"<table border=\"1\" class=\"dataframe\">\n",
|
|||
|
" <thead>\n",
|
|||
|
" <tr style=\"text-align: right;\">\n",
|
|||
|
" <th></th>\n",
|
|||
|
" <th>State</th>\n",
|
|||
|
" <th>Sex</th>\n",
|
|||
|
" <th>GeneralHealth</th>\n",
|
|||
|
" <th>PhysicalHealthDays</th>\n",
|
|||
|
" <th>MentalHealthDays</th>\n",
|
|||
|
" <th>LastCheckupTime</th>\n",
|
|||
|
" <th>PhysicalActivities</th>\n",
|
|||
|
" <th>SleepHours</th>\n",
|
|||
|
" <th>RemovedTeeth</th>\n",
|
|||
|
" <th>HadHeartAttack</th>\n",
|
|||
|
" <th>...</th>\n",
|
|||
|
" <th>HeightInMeters</th>\n",
|
|||
|
" <th>WeightInKilograms</th>\n",
|
|||
|
" <th>BMI</th>\n",
|
|||
|
" <th>AlcoholDrinkers</th>\n",
|
|||
|
" <th>HIVTesting</th>\n",
|
|||
|
" <th>FluVaxLast12</th>\n",
|
|||
|
" <th>PneumoVaxEver</th>\n",
|
|||
|
" <th>TetanusLast10Tdap</th>\n",
|
|||
|
" <th>HighRiskLastYear</th>\n",
|
|||
|
" <th>CovidPos</th>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </thead>\n",
|
|||
|
" <tbody>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>3</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Fair</td>\n",
|
|||
|
" <td>5.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>9.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.70</td>\n",
|
|||
|
" <td>90.72</td>\n",
|
|||
|
" <td>31.32</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>4</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>3.0</td>\n",
|
|||
|
" <td>15.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>5.0</td>\n",
|
|||
|
" <td>1 to 5</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.55</td>\n",
|
|||
|
" <td>79.38</td>\n",
|
|||
|
" <td>33.07</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>5</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.85</td>\n",
|
|||
|
" <td>120.20</td>\n",
|
|||
|
" <td>34.96</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </tbody>\n",
|
|||
|
"</table>\n",
|
|||
|
"<p>3 rows × 40 columns</p>\n",
|
|||
|
"</div>"
|
|||
|
],
|
|||
|
"text/plain": [
|
|||
|
" State Sex GeneralHealth PhysicalHealthDays MentalHealthDays \\\n",
|
|||
|
"3 Alabama Female Fair 5.0 0.0 \n",
|
|||
|
"4 Alabama Female Good 3.0 15.0 \n",
|
|||
|
"5 Alabama Male Good 0.0 0.0 \n",
|
|||
|
"\n",
|
|||
|
" LastCheckupTime PhysicalActivities \\\n",
|
|||
|
"3 Within past year (anytime less than 12 months ... Yes \n",
|
|||
|
"4 Within past year (anytime less than 12 months ... Yes \n",
|
|||
|
"5 Within past year (anytime less than 12 months ... Yes \n",
|
|||
|
"\n",
|
|||
|
" SleepHours RemovedTeeth HadHeartAttack ... HeightInMeters \\\n",
|
|||
|
"3 9.0 None of them No ... 1.70 \n",
|
|||
|
"4 5.0 1 to 5 No ... 1.55 \n",
|
|||
|
"5 7.0 None of them No ... 1.85 \n",
|
|||
|
"\n",
|
|||
|
" WeightInKilograms BMI AlcoholDrinkers HIVTesting FluVaxLast12 \\\n",
|
|||
|
"3 90.72 31.32 No No Yes \n",
|
|||
|
"4 79.38 33.07 No No Yes \n",
|
|||
|
"5 120.20 34.96 Yes Yes Yes \n",
|
|||
|
"\n",
|
|||
|
" PneumoVaxEver TetanusLast10Tdap \\\n",
|
|||
|
"3 Yes No, did not receive any tetanus shot in the pa... \n",
|
|||
|
"4 Yes No, did not receive any tetanus shot in the pa... \n",
|
|||
|
"5 No Yes, received tetanus shot but not sure what type \n",
|
|||
|
"\n",
|
|||
|
" HighRiskLastYear CovidPos \n",
|
|||
|
"3 No Yes \n",
|
|||
|
"4 No No \n",
|
|||
|
"5 No No \n",
|
|||
|
"\n",
|
|||
|
"[3 rows x 40 columns]"
|
|||
|
]
|
|||
|
},
|
|||
|
"execution_count": 35,
|
|||
|
"metadata": {},
|
|||
|
"output_type": "execute_result"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"df.iloc[3:6]"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 36,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"text/html": [
|
|||
|
"<div>\n",
|
|||
|
"<style scoped>\n",
|
|||
|
" .dataframe tbody tr th:only-of-type {\n",
|
|||
|
" vertical-align: middle;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe tbody tr th {\n",
|
|||
|
" vertical-align: top;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe thead th {\n",
|
|||
|
" text-align: right;\n",
|
|||
|
" }\n",
|
|||
|
"</style>\n",
|
|||
|
"<table border=\"1\" class=\"dataframe\">\n",
|
|||
|
" <thead>\n",
|
|||
|
" <tr style=\"text-align: right;\">\n",
|
|||
|
" <th></th>\n",
|
|||
|
" <th>State</th>\n",
|
|||
|
" <th>Sex</th>\n",
|
|||
|
" <th>GeneralHealth</th>\n",
|
|||
|
" <th>PhysicalHealthDays</th>\n",
|
|||
|
" <th>MentalHealthDays</th>\n",
|
|||
|
" <th>LastCheckupTime</th>\n",
|
|||
|
" <th>PhysicalActivities</th>\n",
|
|||
|
" <th>SleepHours</th>\n",
|
|||
|
" <th>RemovedTeeth</th>\n",
|
|||
|
" <th>HadHeartAttack</th>\n",
|
|||
|
" <th>...</th>\n",
|
|||
|
" <th>HeightInMeters</th>\n",
|
|||
|
" <th>WeightInKilograms</th>\n",
|
|||
|
" <th>BMI</th>\n",
|
|||
|
" <th>AlcoholDrinkers</th>\n",
|
|||
|
" <th>HIVTesting</th>\n",
|
|||
|
" <th>FluVaxLast12</th>\n",
|
|||
|
" <th>PneumoVaxEver</th>\n",
|
|||
|
" <th>TetanusLast10Tdap</th>\n",
|
|||
|
" <th>HighRiskLastYear</th>\n",
|
|||
|
" <th>CovidPos</th>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </thead>\n",
|
|||
|
" <tbody>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>2</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>8.0</td>\n",
|
|||
|
" <td>6 or more, but not all</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.85</td>\n",
|
|||
|
" <td>108.86</td>\n",
|
|||
|
" <td>31.66</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>5</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.85</td>\n",
|
|||
|
" <td>120.20</td>\n",
|
|||
|
" <td>34.96</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>10</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>8.0</td>\n",
|
|||
|
" <td>1 to 5</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.83</td>\n",
|
|||
|
" <td>122.47</td>\n",
|
|||
|
" <td>36.62</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes, received Tdap</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>11</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>3.0</td>\n",
|
|||
|
" <td>4.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>5.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.52</td>\n",
|
|||
|
" <td>108.86</td>\n",
|
|||
|
" <td>46.87</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received tetanus shot, but not Tdap</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>12</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>5.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>5.0</td>\n",
|
|||
|
" <td>6 or more, but not all</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.88</td>\n",
|
|||
|
" <td>115.67</td>\n",
|
|||
|
" <td>32.74</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>...</th>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246002</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>6.0</td>\n",
|
|||
|
" <td>1 to 5</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.88</td>\n",
|
|||
|
" <td>106.59</td>\n",
|
|||
|
" <td>30.17</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Tested positive using home test without a heal...</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246012</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Fair</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>30.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>4.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.88</td>\n",
|
|||
|
" <td>117.93</td>\n",
|
|||
|
" <td>33.38</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246016</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>6.0</td>\n",
|
|||
|
" <td>1 to 5</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.80</td>\n",
|
|||
|
" <td>118.84</td>\n",
|
|||
|
" <td>36.54</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246017</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past 2 years (1 year but less than 2 ye...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>6.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.78</td>\n",
|
|||
|
" <td>102.06</td>\n",
|
|||
|
" <td>32.28</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246021</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>5.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.83</td>\n",
|
|||
|
" <td>108.86</td>\n",
|
|||
|
" <td>32.55</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </tbody>\n",
|
|||
|
"</table>\n",
|
|||
|
"<p>44646 rows × 40 columns</p>\n",
|
|||
|
"</div>"
|
|||
|
],
|
|||
|
"text/plain": [
|
|||
|
" State Sex GeneralHealth PhysicalHealthDays \\\n",
|
|||
|
"2 Alabama Male Very good 0.0 \n",
|
|||
|
"5 Alabama Male Good 0.0 \n",
|
|||
|
"10 Alabama Male Very good 0.0 \n",
|
|||
|
"11 Alabama Female Good 3.0 \n",
|
|||
|
"12 Alabama Male Good 5.0 \n",
|
|||
|
"... ... ... ... ... \n",
|
|||
|
"246002 Virgin Islands Male Good 0.0 \n",
|
|||
|
"246012 Virgin Islands Male Fair 7.0 \n",
|
|||
|
"246016 Virgin Islands Male Good 0.0 \n",
|
|||
|
"246017 Virgin Islands Male Very good 0.0 \n",
|
|||
|
"246021 Virgin Islands Male Very good 0.0 \n",
|
|||
|
"\n",
|
|||
|
" MentalHealthDays LastCheckupTime \\\n",
|
|||
|
"2 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"5 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"10 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"11 4.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"12 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"... ... ... \n",
|
|||
|
"246002 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246012 30.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246016 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246017 0.0 Within past 2 years (1 year but less than 2 ye... \n",
|
|||
|
"246021 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"\n",
|
|||
|
" PhysicalActivities SleepHours RemovedTeeth HadHeartAttack \\\n",
|
|||
|
"2 No 8.0 6 or more, but not all No \n",
|
|||
|
"5 Yes 7.0 None of them No \n",
|
|||
|
"10 Yes 8.0 1 to 5 No \n",
|
|||
|
"11 Yes 5.0 None of them No \n",
|
|||
|
"12 Yes 5.0 6 or more, but not all Yes \n",
|
|||
|
"... ... ... ... ... \n",
|
|||
|
"246002 Yes 6.0 1 to 5 No \n",
|
|||
|
"246012 No 4.0 None of them Yes \n",
|
|||
|
"246016 No 6.0 1 to 5 Yes \n",
|
|||
|
"246017 Yes 6.0 None of them No \n",
|
|||
|
"246021 No 5.0 None of them Yes \n",
|
|||
|
"\n",
|
|||
|
" ... HeightInMeters WeightInKilograms BMI AlcoholDrinkers \\\n",
|
|||
|
"2 ... 1.85 108.86 31.66 Yes \n",
|
|||
|
"5 ... 1.85 120.20 34.96 Yes \n",
|
|||
|
"10 ... 1.83 122.47 36.62 Yes \n",
|
|||
|
"11 ... 1.52 108.86 46.87 No \n",
|
|||
|
"12 ... 1.88 115.67 32.74 No \n",
|
|||
|
"... ... ... ... ... ... \n",
|
|||
|
"246002 ... 1.88 106.59 30.17 Yes \n",
|
|||
|
"246012 ... 1.88 117.93 33.38 Yes \n",
|
|||
|
"246016 ... 1.80 118.84 36.54 Yes \n",
|
|||
|
"246017 ... 1.78 102.06 32.28 Yes \n",
|
|||
|
"246021 ... 1.83 108.86 32.55 No \n",
|
|||
|
"\n",
|
|||
|
" HIVTesting FluVaxLast12 PneumoVaxEver \\\n",
|
|||
|
"2 No No Yes \n",
|
|||
|
"5 Yes Yes No \n",
|
|||
|
"10 No Yes Yes \n",
|
|||
|
"11 No No No \n",
|
|||
|
"12 No Yes Yes \n",
|
|||
|
"... ... ... ... \n",
|
|||
|
"246002 No No No \n",
|
|||
|
"246012 Yes No No \n",
|
|||
|
"246016 Yes Yes No \n",
|
|||
|
"246017 No No No \n",
|
|||
|
"246021 Yes Yes Yes \n",
|
|||
|
"\n",
|
|||
|
" TetanusLast10Tdap HighRiskLastYear \\\n",
|
|||
|
"2 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"5 Yes, received tetanus shot but not sure what type No \n",
|
|||
|
"10 Yes, received Tdap No \n",
|
|||
|
"11 Yes, received tetanus shot, but not Tdap No \n",
|
|||
|
"12 Yes, received tetanus shot but not sure what type No \n",
|
|||
|
"... ... ... \n",
|
|||
|
"246002 Yes, received tetanus shot but not sure what type No \n",
|
|||
|
"246012 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"246016 Yes, received tetanus shot but not sure what type No \n",
|
|||
|
"246017 Yes, received tetanus shot but not sure what type No \n",
|
|||
|
"246021 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"\n",
|
|||
|
" CovidPos \n",
|
|||
|
"2 Yes \n",
|
|||
|
"5 No \n",
|
|||
|
"10 No \n",
|
|||
|
"11 Yes \n",
|
|||
|
"12 No \n",
|
|||
|
"... ... \n",
|
|||
|
"246002 Tested positive using home test without a heal... \n",
|
|||
|
"246012 Yes \n",
|
|||
|
"246016 No \n",
|
|||
|
"246017 No \n",
|
|||
|
"246021 Yes \n",
|
|||
|
"\n",
|
|||
|
"[44646 rows x 40 columns]"
|
|||
|
]
|
|||
|
},
|
|||
|
"execution_count": 36,
|
|||
|
"metadata": {},
|
|||
|
"output_type": "execute_result"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"df[df['WeightInKilograms'] > 100]\n"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"Группировка и агрегация данных в датафрейме"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 37,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"text/html": [
|
|||
|
"<div>\n",
|
|||
|
"<style scoped>\n",
|
|||
|
" .dataframe tbody tr th:only-of-type {\n",
|
|||
|
" vertical-align: middle;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe tbody tr th {\n",
|
|||
|
" vertical-align: top;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe thead th {\n",
|
|||
|
" text-align: right;\n",
|
|||
|
" }\n",
|
|||
|
"</style>\n",
|
|||
|
"<table border=\"1\" class=\"dataframe\">\n",
|
|||
|
" <thead>\n",
|
|||
|
" <tr style=\"text-align: right;\">\n",
|
|||
|
" <th></th>\n",
|
|||
|
" <th>WeightInKilograms</th>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>State</th>\n",
|
|||
|
" <th></th>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </thead>\n",
|
|||
|
" <tbody>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Alabama</th>\n",
|
|||
|
" <td>85.225899</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Alaska</th>\n",
|
|||
|
" <td>83.937201</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Arizona</th>\n",
|
|||
|
" <td>82.626862</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Arkansas</th>\n",
|
|||
|
" <td>85.361796</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>California</th>\n",
|
|||
|
" <td>81.334135</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Colorado</th>\n",
|
|||
|
" <td>80.805505</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Connecticut</th>\n",
|
|||
|
" <td>82.192881</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Delaware</th>\n",
|
|||
|
" <td>84.224436</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>District of Columbia</th>\n",
|
|||
|
" <td>78.593038</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Florida</th>\n",
|
|||
|
" <td>83.155785</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Georgia</th>\n",
|
|||
|
" <td>84.332240</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Guam</th>\n",
|
|||
|
" <td>77.294261</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Hawaii</th>\n",
|
|||
|
" <td>76.419335</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Idaho</th>\n",
|
|||
|
" <td>84.648567</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Illinois</th>\n",
|
|||
|
" <td>83.459467</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Indiana</th>\n",
|
|||
|
" <td>85.703237</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Iowa</th>\n",
|
|||
|
" <td>86.970651</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Kansas</th>\n",
|
|||
|
" <td>85.864583</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Kentucky</th>\n",
|
|||
|
" <td>86.781960</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Louisiana</th>\n",
|
|||
|
" <td>85.162787</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Maine</th>\n",
|
|||
|
" <td>82.949232</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Maryland</th>\n",
|
|||
|
" <td>83.543344</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Massachusetts</th>\n",
|
|||
|
" <td>80.591010</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Michigan</th>\n",
|
|||
|
" <td>83.629868</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Minnesota</th>\n",
|
|||
|
" <td>84.954303</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Mississippi</th>\n",
|
|||
|
" <td>88.322797</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Missouri</th>\n",
|
|||
|
" <td>85.836119</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Montana</th>\n",
|
|||
|
" <td>84.231140</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Nebraska</th>\n",
|
|||
|
" <td>85.961696</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Nevada</th>\n",
|
|||
|
" <td>82.784771</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>New Hampshire</th>\n",
|
|||
|
" <td>80.702764</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>New Jersey</th>\n",
|
|||
|
" <td>81.270844</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>New Mexico</th>\n",
|
|||
|
" <td>80.529087</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>New York</th>\n",
|
|||
|
" <td>80.960180</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>North Carolina</th>\n",
|
|||
|
" <td>83.730953</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>North Dakota</th>\n",
|
|||
|
" <td>85.924972</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Ohio</th>\n",
|
|||
|
" <td>86.938279</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Oklahoma</th>\n",
|
|||
|
" <td>85.517429</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Oregon</th>\n",
|
|||
|
" <td>83.802043</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Pennsylvania</th>\n",
|
|||
|
" <td>83.831872</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Puerto Rico</th>\n",
|
|||
|
" <td>79.152187</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Rhode Island</th>\n",
|
|||
|
" <td>80.675832</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>South Carolina</th>\n",
|
|||
|
" <td>84.046443</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>South Dakota</th>\n",
|
|||
|
" <td>86.868195</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Tennessee</th>\n",
|
|||
|
" <td>86.237325</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Texas</th>\n",
|
|||
|
" <td>84.894035</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Utah</th>\n",
|
|||
|
" <td>83.888474</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Vermont</th>\n",
|
|||
|
" <td>80.557657</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Virgin Islands</th>\n",
|
|||
|
" <td>82.131440</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Virginia</th>\n",
|
|||
|
" <td>83.822634</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Washington</th>\n",
|
|||
|
" <td>83.077369</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>West Virginia</th>\n",
|
|||
|
" <td>86.697505</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Wisconsin</th>\n",
|
|||
|
" <td>86.167571</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>Wyoming</th>\n",
|
|||
|
" <td>83.844357</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </tbody>\n",
|
|||
|
"</table>\n",
|
|||
|
"</div>"
|
|||
|
],
|
|||
|
"text/plain": [
|
|||
|
" WeightInKilograms\n",
|
|||
|
"State \n",
|
|||
|
"Alabama 85.225899\n",
|
|||
|
"Alaska 83.937201\n",
|
|||
|
"Arizona 82.626862\n",
|
|||
|
"Arkansas 85.361796\n",
|
|||
|
"California 81.334135\n",
|
|||
|
"Colorado 80.805505\n",
|
|||
|
"Connecticut 82.192881\n",
|
|||
|
"Delaware 84.224436\n",
|
|||
|
"District of Columbia 78.593038\n",
|
|||
|
"Florida 83.155785\n",
|
|||
|
"Georgia 84.332240\n",
|
|||
|
"Guam 77.294261\n",
|
|||
|
"Hawaii 76.419335\n",
|
|||
|
"Idaho 84.648567\n",
|
|||
|
"Illinois 83.459467\n",
|
|||
|
"Indiana 85.703237\n",
|
|||
|
"Iowa 86.970651\n",
|
|||
|
"Kansas 85.864583\n",
|
|||
|
"Kentucky 86.781960\n",
|
|||
|
"Louisiana 85.162787\n",
|
|||
|
"Maine 82.949232\n",
|
|||
|
"Maryland 83.543344\n",
|
|||
|
"Massachusetts 80.591010\n",
|
|||
|
"Michigan 83.629868\n",
|
|||
|
"Minnesota 84.954303\n",
|
|||
|
"Mississippi 88.322797\n",
|
|||
|
"Missouri 85.836119\n",
|
|||
|
"Montana 84.231140\n",
|
|||
|
"Nebraska 85.961696\n",
|
|||
|
"Nevada 82.784771\n",
|
|||
|
"New Hampshire 80.702764\n",
|
|||
|
"New Jersey 81.270844\n",
|
|||
|
"New Mexico 80.529087\n",
|
|||
|
"New York 80.960180\n",
|
|||
|
"North Carolina 83.730953\n",
|
|||
|
"North Dakota 85.924972\n",
|
|||
|
"Ohio 86.938279\n",
|
|||
|
"Oklahoma 85.517429\n",
|
|||
|
"Oregon 83.802043\n",
|
|||
|
"Pennsylvania 83.831872\n",
|
|||
|
"Puerto Rico 79.152187\n",
|
|||
|
"Rhode Island 80.675832\n",
|
|||
|
"South Carolina 84.046443\n",
|
|||
|
"South Dakota 86.868195\n",
|
|||
|
"Tennessee 86.237325\n",
|
|||
|
"Texas 84.894035\n",
|
|||
|
"Utah 83.888474\n",
|
|||
|
"Vermont 80.557657\n",
|
|||
|
"Virgin Islands 82.131440\n",
|
|||
|
"Virginia 83.822634\n",
|
|||
|
"Washington 83.077369\n",
|
|||
|
"West Virginia 86.697505\n",
|
|||
|
"Wisconsin 86.167571\n",
|
|||
|
"Wyoming 83.844357"
|
|||
|
]
|
|||
|
},
|
|||
|
"execution_count": 37,
|
|||
|
"metadata": {},
|
|||
|
"output_type": "execute_result"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"group = df.groupby(['State'])['WeightInKilograms'].mean()\n",
|
|||
|
"group.to_frame()"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"Сортировка данных в датафрейме"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 38,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"text/html": [
|
|||
|
"<div>\n",
|
|||
|
"<style scoped>\n",
|
|||
|
" .dataframe tbody tr th:only-of-type {\n",
|
|||
|
" vertical-align: middle;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe tbody tr th {\n",
|
|||
|
" vertical-align: top;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe thead th {\n",
|
|||
|
" text-align: right;\n",
|
|||
|
" }\n",
|
|||
|
"</style>\n",
|
|||
|
"<table border=\"1\" class=\"dataframe\">\n",
|
|||
|
" <thead>\n",
|
|||
|
" <tr style=\"text-align: right;\">\n",
|
|||
|
" <th></th>\n",
|
|||
|
" <th>State</th>\n",
|
|||
|
" <th>Sex</th>\n",
|
|||
|
" <th>GeneralHealth</th>\n",
|
|||
|
" <th>PhysicalHealthDays</th>\n",
|
|||
|
" <th>MentalHealthDays</th>\n",
|
|||
|
" <th>LastCheckupTime</th>\n",
|
|||
|
" <th>PhysicalActivities</th>\n",
|
|||
|
" <th>SleepHours</th>\n",
|
|||
|
" <th>RemovedTeeth</th>\n",
|
|||
|
" <th>HadHeartAttack</th>\n",
|
|||
|
" <th>...</th>\n",
|
|||
|
" <th>HeightInMeters</th>\n",
|
|||
|
" <th>WeightInKilograms</th>\n",
|
|||
|
" <th>BMI</th>\n",
|
|||
|
" <th>AlcoholDrinkers</th>\n",
|
|||
|
" <th>HIVTesting</th>\n",
|
|||
|
" <th>FluVaxLast12</th>\n",
|
|||
|
" <th>PneumoVaxEver</th>\n",
|
|||
|
" <th>TetanusLast10Tdap</th>\n",
|
|||
|
" <th>HighRiskLastYear</th>\n",
|
|||
|
" <th>CovidPos</th>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </thead>\n",
|
|||
|
" <tbody>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>9060</th>\n",
|
|||
|
" <td>Arizona</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Fair</td>\n",
|
|||
|
" <td>15.0</td>\n",
|
|||
|
" <td>15.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>8.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.85</td>\n",
|
|||
|
" <td>292.57</td>\n",
|
|||
|
" <td>85.10</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received Tdap</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>48969</th>\n",
|
|||
|
" <td>Hawaii</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Poor</td>\n",
|
|||
|
" <td>30.0</td>\n",
|
|||
|
" <td>30.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>4.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.93</td>\n",
|
|||
|
" <td>276.24</td>\n",
|
|||
|
" <td>74.13</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>75697</th>\n",
|
|||
|
" <td>Kentucky</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>5 or more years ago</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.91</td>\n",
|
|||
|
" <td>273.52</td>\n",
|
|||
|
" <td>75.37</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>143147</th>\n",
|
|||
|
" <td>New York</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>3.0</td>\n",
|
|||
|
" <td>1.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>8.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.88</td>\n",
|
|||
|
" <td>273.06</td>\n",
|
|||
|
" <td>77.29</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>76244</th>\n",
|
|||
|
" <td>Kentucky</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.83</td>\n",
|
|||
|
" <td>272.16</td>\n",
|
|||
|
" <td>81.37</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>...</th>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>203695</th>\n",
|
|||
|
" <td>Vermont</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Poor</td>\n",
|
|||
|
" <td>30.0</td>\n",
|
|||
|
" <td>3.0</td>\n",
|
|||
|
" <td>Within past 2 years (1 year but less than 2 ye...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>18.0</td>\n",
|
|||
|
" <td>All</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.60</td>\n",
|
|||
|
" <td>30.84</td>\n",
|
|||
|
" <td>12.05</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>242632</th>\n",
|
|||
|
" <td>Puerto Rico</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Fair</td>\n",
|
|||
|
" <td>30.0</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>6 or more, but not all</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.35</td>\n",
|
|||
|
" <td>30.39</td>\n",
|
|||
|
" <td>16.77</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>11614</th>\n",
|
|||
|
" <td>Arkansas</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Poor</td>\n",
|
|||
|
" <td>30.0</td>\n",
|
|||
|
" <td>30.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>8.0</td>\n",
|
|||
|
" <td>All</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.52</td>\n",
|
|||
|
" <td>29.48</td>\n",
|
|||
|
" <td>12.69</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>127404</th>\n",
|
|||
|
" <td>Nebraska</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Poor</td>\n",
|
|||
|
" <td>30.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>6.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.52</td>\n",
|
|||
|
" <td>29.48</td>\n",
|
|||
|
" <td>12.69</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>179326</th>\n",
|
|||
|
" <td>South Carolina</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>5 or more years ago</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>8.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.52</td>\n",
|
|||
|
" <td>28.12</td>\n",
|
|||
|
" <td>12.11</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </tbody>\n",
|
|||
|
"</table>\n",
|
|||
|
"<p>246022 rows × 40 columns</p>\n",
|
|||
|
"</div>"
|
|||
|
],
|
|||
|
"text/plain": [
|
|||
|
" State Sex GeneralHealth PhysicalHealthDays \\\n",
|
|||
|
"9060 Arizona Male Fair 15.0 \n",
|
|||
|
"48969 Hawaii Male Poor 30.0 \n",
|
|||
|
"75697 Kentucky Male Very good 0.0 \n",
|
|||
|
"143147 New York Male Very good 3.0 \n",
|
|||
|
"76244 Kentucky Male Very good 0.0 \n",
|
|||
|
"... ... ... ... ... \n",
|
|||
|
"203695 Vermont Female Poor 30.0 \n",
|
|||
|
"242632 Puerto Rico Female Fair 30.0 \n",
|
|||
|
"11614 Arkansas Female Poor 30.0 \n",
|
|||
|
"127404 Nebraska Female Poor 30.0 \n",
|
|||
|
"179326 South Carolina Female Very good 0.0 \n",
|
|||
|
"\n",
|
|||
|
" MentalHealthDays LastCheckupTime \\\n",
|
|||
|
"9060 15.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"48969 30.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"75697 0.0 5 or more years ago \n",
|
|||
|
"143147 1.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"76244 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"... ... ... \n",
|
|||
|
"203695 3.0 Within past 2 years (1 year but less than 2 ye... \n",
|
|||
|
"242632 7.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"11614 30.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"127404 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"179326 0.0 5 or more years ago \n",
|
|||
|
"\n",
|
|||
|
" PhysicalActivities SleepHours RemovedTeeth HadHeartAttack \\\n",
|
|||
|
"9060 No 8.0 None of them No \n",
|
|||
|
"48969 Yes 4.0 None of them No \n",
|
|||
|
"75697 No 7.0 None of them No \n",
|
|||
|
"143147 Yes 8.0 None of them No \n",
|
|||
|
"76244 Yes 7.0 None of them No \n",
|
|||
|
"... ... ... ... ... \n",
|
|||
|
"203695 No 18.0 All No \n",
|
|||
|
"242632 No 7.0 6 or more, but not all No \n",
|
|||
|
"11614 No 8.0 All No \n",
|
|||
|
"127404 Yes 6.0 None of them No \n",
|
|||
|
"179326 No 8.0 None of them No \n",
|
|||
|
"\n",
|
|||
|
" ... HeightInMeters WeightInKilograms BMI AlcoholDrinkers \\\n",
|
|||
|
"9060 ... 1.85 292.57 85.10 No \n",
|
|||
|
"48969 ... 1.93 276.24 74.13 No \n",
|
|||
|
"75697 ... 1.91 273.52 75.37 No \n",
|
|||
|
"143147 ... 1.88 273.06 77.29 Yes \n",
|
|||
|
"76244 ... 1.83 272.16 81.37 No \n",
|
|||
|
"... ... ... ... ... ... \n",
|
|||
|
"203695 ... 1.60 30.84 12.05 No \n",
|
|||
|
"242632 ... 1.35 30.39 16.77 No \n",
|
|||
|
"11614 ... 1.52 29.48 12.69 No \n",
|
|||
|
"127404 ... 1.52 29.48 12.69 No \n",
|
|||
|
"179326 ... 1.52 28.12 12.11 No \n",
|
|||
|
"\n",
|
|||
|
" HIVTesting FluVaxLast12 PneumoVaxEver \\\n",
|
|||
|
"9060 No No No \n",
|
|||
|
"48969 No No No \n",
|
|||
|
"75697 No No No \n",
|
|||
|
"143147 No No No \n",
|
|||
|
"76244 Yes No No \n",
|
|||
|
"... ... ... ... \n",
|
|||
|
"203695 No No No \n",
|
|||
|
"242632 No Yes Yes \n",
|
|||
|
"11614 No Yes Yes \n",
|
|||
|
"127404 No No Yes \n",
|
|||
|
"179326 No No No \n",
|
|||
|
"\n",
|
|||
|
" TetanusLast10Tdap HighRiskLastYear \\\n",
|
|||
|
"9060 Yes, received Tdap No \n",
|
|||
|
"48969 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"75697 Yes, received tetanus shot but not sure what type No \n",
|
|||
|
"143147 Yes, received tetanus shot but not sure what type No \n",
|
|||
|
"76244 Yes, received tetanus shot but not sure what type No \n",
|
|||
|
"... ... ... \n",
|
|||
|
"203695 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"242632 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"11614 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"127404 Yes, received tetanus shot but not sure what type No \n",
|
|||
|
"179326 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"\n",
|
|||
|
" CovidPos \n",
|
|||
|
"9060 No \n",
|
|||
|
"48969 Yes \n",
|
|||
|
"75697 No \n",
|
|||
|
"143147 No \n",
|
|||
|
"76244 Yes \n",
|
|||
|
"... ... \n",
|
|||
|
"203695 No \n",
|
|||
|
"242632 No \n",
|
|||
|
"11614 Yes \n",
|
|||
|
"127404 No \n",
|
|||
|
"179326 No \n",
|
|||
|
"\n",
|
|||
|
"[246022 rows x 40 columns]"
|
|||
|
]
|
|||
|
},
|
|||
|
"execution_count": 38,
|
|||
|
"metadata": {},
|
|||
|
"output_type": "execute_result"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"sorted_df = df.sort_values(by='WeightInKilograms', ascending = False)\n",
|
|||
|
"sorted_df"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"Удаление строк/столбцов"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 39,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [],
|
|||
|
"source": [
|
|||
|
"df_dropped_columns = df.drop(columns=['AlcoholDrinkers', 'BMI']) # Удаление столбцов 'AlcoholDrinkers' и 'BMI'"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 40,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"text/html": [
|
|||
|
"<div>\n",
|
|||
|
"<style scoped>\n",
|
|||
|
" .dataframe tbody tr th:only-of-type {\n",
|
|||
|
" vertical-align: middle;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe tbody tr th {\n",
|
|||
|
" vertical-align: top;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe thead th {\n",
|
|||
|
" text-align: right;\n",
|
|||
|
" }\n",
|
|||
|
"</style>\n",
|
|||
|
"<table border=\"1\" class=\"dataframe\">\n",
|
|||
|
" <thead>\n",
|
|||
|
" <tr style=\"text-align: right;\">\n",
|
|||
|
" <th></th>\n",
|
|||
|
" <th>State</th>\n",
|
|||
|
" <th>Sex</th>\n",
|
|||
|
" <th>GeneralHealth</th>\n",
|
|||
|
" <th>PhysicalHealthDays</th>\n",
|
|||
|
" <th>MentalHealthDays</th>\n",
|
|||
|
" <th>LastCheckupTime</th>\n",
|
|||
|
" <th>PhysicalActivities</th>\n",
|
|||
|
" <th>SleepHours</th>\n",
|
|||
|
" <th>RemovedTeeth</th>\n",
|
|||
|
" <th>HadHeartAttack</th>\n",
|
|||
|
" <th>...</th>\n",
|
|||
|
" <th>RaceEthnicityCategory</th>\n",
|
|||
|
" <th>AgeCategory</th>\n",
|
|||
|
" <th>HeightInMeters</th>\n",
|
|||
|
" <th>WeightInKilograms</th>\n",
|
|||
|
" <th>HIVTesting</th>\n",
|
|||
|
" <th>FluVaxLast12</th>\n",
|
|||
|
" <th>PneumoVaxEver</th>\n",
|
|||
|
" <th>TetanusLast10Tdap</th>\n",
|
|||
|
" <th>HighRiskLastYear</th>\n",
|
|||
|
" <th>CovidPos</th>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </thead>\n",
|
|||
|
" <tbody>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>0</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>4.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>9.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>White only, Non-Hispanic</td>\n",
|
|||
|
" <td>Age 65 to 69</td>\n",
|
|||
|
" <td>1.60</td>\n",
|
|||
|
" <td>71.67</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes, received Tdap</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>1</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>6.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>White only, Non-Hispanic</td>\n",
|
|||
|
" <td>Age 70 to 74</td>\n",
|
|||
|
" <td>1.78</td>\n",
|
|||
|
" <td>95.25</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>2</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>8.0</td>\n",
|
|||
|
" <td>6 or more, but not all</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>White only, Non-Hispanic</td>\n",
|
|||
|
" <td>Age 75 to 79</td>\n",
|
|||
|
" <td>1.85</td>\n",
|
|||
|
" <td>108.86</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>3</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Fair</td>\n",
|
|||
|
" <td>5.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>9.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>White only, Non-Hispanic</td>\n",
|
|||
|
" <td>Age 80 or older</td>\n",
|
|||
|
" <td>1.70</td>\n",
|
|||
|
" <td>90.72</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>4</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>3.0</td>\n",
|
|||
|
" <td>15.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>5.0</td>\n",
|
|||
|
" <td>1 to 5</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>White only, Non-Hispanic</td>\n",
|
|||
|
" <td>Age 80 or older</td>\n",
|
|||
|
" <td>1.55</td>\n",
|
|||
|
" <td>79.38</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>...</th>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246017</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past 2 years (1 year but less than 2 ye...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>6.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>White only, Non-Hispanic</td>\n",
|
|||
|
" <td>Age 60 to 64</td>\n",
|
|||
|
" <td>1.78</td>\n",
|
|||
|
" <td>102.06</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246018</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Fair</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>Black only, Non-Hispanic</td>\n",
|
|||
|
" <td>Age 25 to 29</td>\n",
|
|||
|
" <td>1.93</td>\n",
|
|||
|
" <td>90.72</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246019</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>15.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>1 to 5</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>Multiracial, Non-Hispanic</td>\n",
|
|||
|
" <td>Age 65 to 69</td>\n",
|
|||
|
" <td>1.68</td>\n",
|
|||
|
" <td>83.91</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246020</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Excellent</td>\n",
|
|||
|
" <td>2.0</td>\n",
|
|||
|
" <td>2.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>Black only, Non-Hispanic</td>\n",
|
|||
|
" <td>Age 50 to 54</td>\n",
|
|||
|
" <td>1.70</td>\n",
|
|||
|
" <td>83.01</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246021</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>5.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>Black only, Non-Hispanic</td>\n",
|
|||
|
" <td>Age 70 to 74</td>\n",
|
|||
|
" <td>1.83</td>\n",
|
|||
|
" <td>108.86</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </tbody>\n",
|
|||
|
"</table>\n",
|
|||
|
"<p>246022 rows × 38 columns</p>\n",
|
|||
|
"</div>"
|
|||
|
],
|
|||
|
"text/plain": [
|
|||
|
" State Sex GeneralHealth PhysicalHealthDays \\\n",
|
|||
|
"0 Alabama Female Very good 4.0 \n",
|
|||
|
"1 Alabama Male Very good 0.0 \n",
|
|||
|
"2 Alabama Male Very good 0.0 \n",
|
|||
|
"3 Alabama Female Fair 5.0 \n",
|
|||
|
"4 Alabama Female Good 3.0 \n",
|
|||
|
"... ... ... ... ... \n",
|
|||
|
"246017 Virgin Islands Male Very good 0.0 \n",
|
|||
|
"246018 Virgin Islands Female Fair 0.0 \n",
|
|||
|
"246019 Virgin Islands Male Good 0.0 \n",
|
|||
|
"246020 Virgin Islands Female Excellent 2.0 \n",
|
|||
|
"246021 Virgin Islands Male Very good 0.0 \n",
|
|||
|
"\n",
|
|||
|
" MentalHealthDays LastCheckupTime \\\n",
|
|||
|
"0 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"1 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"2 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"3 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"4 15.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"... ... ... \n",
|
|||
|
"246017 0.0 Within past 2 years (1 year but less than 2 ye... \n",
|
|||
|
"246018 7.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246019 15.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246020 2.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246021 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"\n",
|
|||
|
" PhysicalActivities SleepHours RemovedTeeth HadHeartAttack \\\n",
|
|||
|
"0 Yes 9.0 None of them No \n",
|
|||
|
"1 Yes 6.0 None of them No \n",
|
|||
|
"2 No 8.0 6 or more, but not all No \n",
|
|||
|
"3 Yes 9.0 None of them No \n",
|
|||
|
"4 Yes 5.0 1 to 5 No \n",
|
|||
|
"... ... ... ... ... \n",
|
|||
|
"246017 Yes 6.0 None of them No \n",
|
|||
|
"246018 Yes 7.0 None of them No \n",
|
|||
|
"246019 Yes 7.0 1 to 5 No \n",
|
|||
|
"246020 Yes 7.0 None of them No \n",
|
|||
|
"246021 No 5.0 None of them Yes \n",
|
|||
|
"\n",
|
|||
|
" ... RaceEthnicityCategory AgeCategory HeightInMeters \\\n",
|
|||
|
"0 ... White only, Non-Hispanic Age 65 to 69 1.60 \n",
|
|||
|
"1 ... White only, Non-Hispanic Age 70 to 74 1.78 \n",
|
|||
|
"2 ... White only, Non-Hispanic Age 75 to 79 1.85 \n",
|
|||
|
"3 ... White only, Non-Hispanic Age 80 or older 1.70 \n",
|
|||
|
"4 ... White only, Non-Hispanic Age 80 or older 1.55 \n",
|
|||
|
"... ... ... ... ... \n",
|
|||
|
"246017 ... White only, Non-Hispanic Age 60 to 64 1.78 \n",
|
|||
|
"246018 ... Black only, Non-Hispanic Age 25 to 29 1.93 \n",
|
|||
|
"246019 ... Multiracial, Non-Hispanic Age 65 to 69 1.68 \n",
|
|||
|
"246020 ... Black only, Non-Hispanic Age 50 to 54 1.70 \n",
|
|||
|
"246021 ... Black only, Non-Hispanic Age 70 to 74 1.83 \n",
|
|||
|
"\n",
|
|||
|
" WeightInKilograms HIVTesting FluVaxLast12 PneumoVaxEver \\\n",
|
|||
|
"0 71.67 No Yes Yes \n",
|
|||
|
"1 95.25 No Yes Yes \n",
|
|||
|
"2 108.86 No No Yes \n",
|
|||
|
"3 90.72 No Yes Yes \n",
|
|||
|
"4 79.38 No Yes Yes \n",
|
|||
|
"... ... ... ... ... \n",
|
|||
|
"246017 102.06 No No No \n",
|
|||
|
"246018 90.72 No No No \n",
|
|||
|
"246019 83.91 Yes Yes Yes \n",
|
|||
|
"246020 83.01 Yes Yes No \n",
|
|||
|
"246021 108.86 Yes Yes Yes \n",
|
|||
|
"\n",
|
|||
|
" TetanusLast10Tdap HighRiskLastYear \\\n",
|
|||
|
"0 Yes, received Tdap No \n",
|
|||
|
"1 Yes, received tetanus shot but not sure what type No \n",
|
|||
|
"2 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"3 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"4 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"... ... ... \n",
|
|||
|
"246017 Yes, received tetanus shot but not sure what type No \n",
|
|||
|
"246018 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"246019 Yes, received tetanus shot but not sure what type No \n",
|
|||
|
"246020 Yes, received tetanus shot but not sure what type No \n",
|
|||
|
"246021 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"\n",
|
|||
|
" CovidPos \n",
|
|||
|
"0 No \n",
|
|||
|
"1 No \n",
|
|||
|
"2 Yes \n",
|
|||
|
"3 Yes \n",
|
|||
|
"4 No \n",
|
|||
|
"... ... \n",
|
|||
|
"246017 No \n",
|
|||
|
"246018 Yes \n",
|
|||
|
"246019 Yes \n",
|
|||
|
"246020 No \n",
|
|||
|
"246021 Yes \n",
|
|||
|
"\n",
|
|||
|
"[246022 rows x 38 columns]"
|
|||
|
]
|
|||
|
},
|
|||
|
"execution_count": 40,
|
|||
|
"metadata": {},
|
|||
|
"output_type": "execute_result"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"df_dropped_columns"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 41,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"text/html": [
|
|||
|
"<div>\n",
|
|||
|
"<style scoped>\n",
|
|||
|
" .dataframe tbody tr th:only-of-type {\n",
|
|||
|
" vertical-align: middle;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe tbody tr th {\n",
|
|||
|
" vertical-align: top;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe thead th {\n",
|
|||
|
" text-align: right;\n",
|
|||
|
" }\n",
|
|||
|
"</style>\n",
|
|||
|
"<table border=\"1\" class=\"dataframe\">\n",
|
|||
|
" <thead>\n",
|
|||
|
" <tr style=\"text-align: right;\">\n",
|
|||
|
" <th></th>\n",
|
|||
|
" <th>State</th>\n",
|
|||
|
" <th>Sex</th>\n",
|
|||
|
" <th>GeneralHealth</th>\n",
|
|||
|
" <th>PhysicalHealthDays</th>\n",
|
|||
|
" <th>MentalHealthDays</th>\n",
|
|||
|
" <th>LastCheckupTime</th>\n",
|
|||
|
" <th>PhysicalActivities</th>\n",
|
|||
|
" <th>SleepHours</th>\n",
|
|||
|
" <th>RemovedTeeth</th>\n",
|
|||
|
" <th>HadHeartAttack</th>\n",
|
|||
|
" <th>...</th>\n",
|
|||
|
" <th>HeightInMeters</th>\n",
|
|||
|
" <th>WeightInKilograms</th>\n",
|
|||
|
" <th>BMI</th>\n",
|
|||
|
" <th>AlcoholDrinkers</th>\n",
|
|||
|
" <th>HIVTesting</th>\n",
|
|||
|
" <th>FluVaxLast12</th>\n",
|
|||
|
" <th>PneumoVaxEver</th>\n",
|
|||
|
" <th>TetanusLast10Tdap</th>\n",
|
|||
|
" <th>HighRiskLastYear</th>\n",
|
|||
|
" <th>CovidPos</th>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </thead>\n",
|
|||
|
" <tbody>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>2</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>8.0</td>\n",
|
|||
|
" <td>6 or more, but not all</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.85</td>\n",
|
|||
|
" <td>108.86</td>\n",
|
|||
|
" <td>31.66</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>3</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Fair</td>\n",
|
|||
|
" <td>5.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>9.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.70</td>\n",
|
|||
|
" <td>90.72</td>\n",
|
|||
|
" <td>31.32</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>4</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>3.0</td>\n",
|
|||
|
" <td>15.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>5.0</td>\n",
|
|||
|
" <td>1 to 5</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.55</td>\n",
|
|||
|
" <td>79.38</td>\n",
|
|||
|
" <td>33.07</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>5</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.85</td>\n",
|
|||
|
" <td>120.20</td>\n",
|
|||
|
" <td>34.96</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>6</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>3.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>8.0</td>\n",
|
|||
|
" <td>6 or more, but not all</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.63</td>\n",
|
|||
|
" <td>88.00</td>\n",
|
|||
|
" <td>33.30</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>...</th>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246017</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past 2 years (1 year but less than 2 ye...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>6.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.78</td>\n",
|
|||
|
" <td>102.06</td>\n",
|
|||
|
" <td>32.28</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246018</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Fair</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.93</td>\n",
|
|||
|
" <td>90.72</td>\n",
|
|||
|
" <td>24.34</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246019</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>15.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>1 to 5</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.68</td>\n",
|
|||
|
" <td>83.91</td>\n",
|
|||
|
" <td>29.86</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246020</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Excellent</td>\n",
|
|||
|
" <td>2.0</td>\n",
|
|||
|
" <td>2.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.70</td>\n",
|
|||
|
" <td>83.01</td>\n",
|
|||
|
" <td>28.66</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246021</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>5.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>1.83</td>\n",
|
|||
|
" <td>108.86</td>\n",
|
|||
|
" <td>32.55</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </tbody>\n",
|
|||
|
"</table>\n",
|
|||
|
"<p>246020 rows × 40 columns</p>\n",
|
|||
|
"</div>"
|
|||
|
],
|
|||
|
"text/plain": [
|
|||
|
" State Sex GeneralHealth PhysicalHealthDays \\\n",
|
|||
|
"2 Alabama Male Very good 0.0 \n",
|
|||
|
"3 Alabama Female Fair 5.0 \n",
|
|||
|
"4 Alabama Female Good 3.0 \n",
|
|||
|
"5 Alabama Male Good 0.0 \n",
|
|||
|
"6 Alabama Female Good 3.0 \n",
|
|||
|
"... ... ... ... ... \n",
|
|||
|
"246017 Virgin Islands Male Very good 0.0 \n",
|
|||
|
"246018 Virgin Islands Female Fair 0.0 \n",
|
|||
|
"246019 Virgin Islands Male Good 0.0 \n",
|
|||
|
"246020 Virgin Islands Female Excellent 2.0 \n",
|
|||
|
"246021 Virgin Islands Male Very good 0.0 \n",
|
|||
|
"\n",
|
|||
|
" MentalHealthDays LastCheckupTime \\\n",
|
|||
|
"2 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"3 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"4 15.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"5 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"6 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"... ... ... \n",
|
|||
|
"246017 0.0 Within past 2 years (1 year but less than 2 ye... \n",
|
|||
|
"246018 7.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246019 15.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246020 2.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246021 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"\n",
|
|||
|
" PhysicalActivities SleepHours RemovedTeeth HadHeartAttack \\\n",
|
|||
|
"2 No 8.0 6 or more, but not all No \n",
|
|||
|
"3 Yes 9.0 None of them No \n",
|
|||
|
"4 Yes 5.0 1 to 5 No \n",
|
|||
|
"5 Yes 7.0 None of them No \n",
|
|||
|
"6 Yes 8.0 6 or more, but not all No \n",
|
|||
|
"... ... ... ... ... \n",
|
|||
|
"246017 Yes 6.0 None of them No \n",
|
|||
|
"246018 Yes 7.0 None of them No \n",
|
|||
|
"246019 Yes 7.0 1 to 5 No \n",
|
|||
|
"246020 Yes 7.0 None of them No \n",
|
|||
|
"246021 No 5.0 None of them Yes \n",
|
|||
|
"\n",
|
|||
|
" ... HeightInMeters WeightInKilograms BMI AlcoholDrinkers \\\n",
|
|||
|
"2 ... 1.85 108.86 31.66 Yes \n",
|
|||
|
"3 ... 1.70 90.72 31.32 No \n",
|
|||
|
"4 ... 1.55 79.38 33.07 No \n",
|
|||
|
"5 ... 1.85 120.20 34.96 Yes \n",
|
|||
|
"6 ... 1.63 88.00 33.30 No \n",
|
|||
|
"... ... ... ... ... ... \n",
|
|||
|
"246017 ... 1.78 102.06 32.28 Yes \n",
|
|||
|
"246018 ... 1.93 90.72 24.34 No \n",
|
|||
|
"246019 ... 1.68 83.91 29.86 Yes \n",
|
|||
|
"246020 ... 1.70 83.01 28.66 No \n",
|
|||
|
"246021 ... 1.83 108.86 32.55 No \n",
|
|||
|
"\n",
|
|||
|
" HIVTesting FluVaxLast12 PneumoVaxEver \\\n",
|
|||
|
"2 No No Yes \n",
|
|||
|
"3 No Yes Yes \n",
|
|||
|
"4 No Yes Yes \n",
|
|||
|
"5 Yes Yes No \n",
|
|||
|
"6 No Yes Yes \n",
|
|||
|
"... ... ... ... \n",
|
|||
|
"246017 No No No \n",
|
|||
|
"246018 No No No \n",
|
|||
|
"246019 Yes Yes Yes \n",
|
|||
|
"246020 Yes Yes No \n",
|
|||
|
"246021 Yes Yes Yes \n",
|
|||
|
"\n",
|
|||
|
" TetanusLast10Tdap HighRiskLastYear \\\n",
|
|||
|
"2 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"3 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"4 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"5 Yes, received tetanus shot but not sure what type No \n",
|
|||
|
"6 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"... ... ... \n",
|
|||
|
"246017 Yes, received tetanus shot but not sure what type No \n",
|
|||
|
"246018 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"246019 Yes, received tetanus shot but not sure what type No \n",
|
|||
|
"246020 Yes, received tetanus shot but not sure what type No \n",
|
|||
|
"246021 No, did not receive any tetanus shot in the pa... No \n",
|
|||
|
"\n",
|
|||
|
" CovidPos \n",
|
|||
|
"2 Yes \n",
|
|||
|
"3 Yes \n",
|
|||
|
"4 No \n",
|
|||
|
"5 No \n",
|
|||
|
"6 No \n",
|
|||
|
"... ... \n",
|
|||
|
"246017 No \n",
|
|||
|
"246018 Yes \n",
|
|||
|
"246019 Yes \n",
|
|||
|
"246020 No \n",
|
|||
|
"246021 Yes \n",
|
|||
|
"\n",
|
|||
|
"[246020 rows x 40 columns]"
|
|||
|
]
|
|||
|
},
|
|||
|
"execution_count": 41,
|
|||
|
"metadata": {},
|
|||
|
"output_type": "execute_result"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"df_dropped_rows = df.drop([0, 1]) # Удаление строк с индексами 0 и 1\n",
|
|||
|
"df_dropped_rows"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"Создание новых столбцов на основе данных из существующих столбцов датафрейма"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 42,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [],
|
|||
|
"source": [
|
|||
|
"df['SleepHours-HeightInMeters'] = df['SleepHours'] - df['HeightInMeters']"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 43,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"text/html": [
|
|||
|
"<div>\n",
|
|||
|
"<style scoped>\n",
|
|||
|
" .dataframe tbody tr th:only-of-type {\n",
|
|||
|
" vertical-align: middle;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe tbody tr th {\n",
|
|||
|
" vertical-align: top;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe thead th {\n",
|
|||
|
" text-align: right;\n",
|
|||
|
" }\n",
|
|||
|
"</style>\n",
|
|||
|
"<table border=\"1\" class=\"dataframe\">\n",
|
|||
|
" <thead>\n",
|
|||
|
" <tr style=\"text-align: right;\">\n",
|
|||
|
" <th></th>\n",
|
|||
|
" <th>State</th>\n",
|
|||
|
" <th>Sex</th>\n",
|
|||
|
" <th>GeneralHealth</th>\n",
|
|||
|
" <th>PhysicalHealthDays</th>\n",
|
|||
|
" <th>MentalHealthDays</th>\n",
|
|||
|
" <th>LastCheckupTime</th>\n",
|
|||
|
" <th>PhysicalActivities</th>\n",
|
|||
|
" <th>SleepHours</th>\n",
|
|||
|
" <th>RemovedTeeth</th>\n",
|
|||
|
" <th>HadHeartAttack</th>\n",
|
|||
|
" <th>...</th>\n",
|
|||
|
" <th>WeightInKilograms</th>\n",
|
|||
|
" <th>BMI</th>\n",
|
|||
|
" <th>AlcoholDrinkers</th>\n",
|
|||
|
" <th>HIVTesting</th>\n",
|
|||
|
" <th>FluVaxLast12</th>\n",
|
|||
|
" <th>PneumoVaxEver</th>\n",
|
|||
|
" <th>TetanusLast10Tdap</th>\n",
|
|||
|
" <th>HighRiskLastYear</th>\n",
|
|||
|
" <th>CovidPos</th>\n",
|
|||
|
" <th>SleepHours-HeightInMeters</th>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </thead>\n",
|
|||
|
" <tbody>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>0</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>4.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>9.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>71.67</td>\n",
|
|||
|
" <td>27.99</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes, received Tdap</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>7.40</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>1</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>6.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>95.25</td>\n",
|
|||
|
" <td>30.13</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>4.22</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>2</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>8.0</td>\n",
|
|||
|
" <td>6 or more, but not all</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>108.86</td>\n",
|
|||
|
" <td>31.66</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>6.15</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>3</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Fair</td>\n",
|
|||
|
" <td>5.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>9.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>90.72</td>\n",
|
|||
|
" <td>31.32</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.30</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>4</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>3.0</td>\n",
|
|||
|
" <td>15.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>5.0</td>\n",
|
|||
|
" <td>1 to 5</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>79.38</td>\n",
|
|||
|
" <td>33.07</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>3.45</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>...</th>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246017</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past 2 years (1 year but less than 2 ye...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>6.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>102.06</td>\n",
|
|||
|
" <td>32.28</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>4.22</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246018</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Fair</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>90.72</td>\n",
|
|||
|
" <td>24.34</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>5.07</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246019</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>15.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>1 to 5</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>83.91</td>\n",
|
|||
|
" <td>29.86</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>5.32</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246020</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Excellent</td>\n",
|
|||
|
" <td>2.0</td>\n",
|
|||
|
" <td>2.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>83.01</td>\n",
|
|||
|
" <td>28.66</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>5.30</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246021</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>5.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>108.86</td>\n",
|
|||
|
" <td>32.55</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>3.17</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </tbody>\n",
|
|||
|
"</table>\n",
|
|||
|
"<p>246022 rows × 41 columns</p>\n",
|
|||
|
"</div>"
|
|||
|
],
|
|||
|
"text/plain": [
|
|||
|
" State Sex GeneralHealth PhysicalHealthDays \\\n",
|
|||
|
"0 Alabama Female Very good 4.0 \n",
|
|||
|
"1 Alabama Male Very good 0.0 \n",
|
|||
|
"2 Alabama Male Very good 0.0 \n",
|
|||
|
"3 Alabama Female Fair 5.0 \n",
|
|||
|
"4 Alabama Female Good 3.0 \n",
|
|||
|
"... ... ... ... ... \n",
|
|||
|
"246017 Virgin Islands Male Very good 0.0 \n",
|
|||
|
"246018 Virgin Islands Female Fair 0.0 \n",
|
|||
|
"246019 Virgin Islands Male Good 0.0 \n",
|
|||
|
"246020 Virgin Islands Female Excellent 2.0 \n",
|
|||
|
"246021 Virgin Islands Male Very good 0.0 \n",
|
|||
|
"\n",
|
|||
|
" MentalHealthDays LastCheckupTime \\\n",
|
|||
|
"0 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"1 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"2 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"3 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"4 15.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"... ... ... \n",
|
|||
|
"246017 0.0 Within past 2 years (1 year but less than 2 ye... \n",
|
|||
|
"246018 7.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246019 15.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246020 2.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246021 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"\n",
|
|||
|
" PhysicalActivities SleepHours RemovedTeeth HadHeartAttack \\\n",
|
|||
|
"0 Yes 9.0 None of them No \n",
|
|||
|
"1 Yes 6.0 None of them No \n",
|
|||
|
"2 No 8.0 6 or more, but not all No \n",
|
|||
|
"3 Yes 9.0 None of them No \n",
|
|||
|
"4 Yes 5.0 1 to 5 No \n",
|
|||
|
"... ... ... ... ... \n",
|
|||
|
"246017 Yes 6.0 None of them No \n",
|
|||
|
"246018 Yes 7.0 None of them No \n",
|
|||
|
"246019 Yes 7.0 1 to 5 No \n",
|
|||
|
"246020 Yes 7.0 None of them No \n",
|
|||
|
"246021 No 5.0 None of them Yes \n",
|
|||
|
"\n",
|
|||
|
" ... WeightInKilograms BMI AlcoholDrinkers HIVTesting FluVaxLast12 \\\n",
|
|||
|
"0 ... 71.67 27.99 No No Yes \n",
|
|||
|
"1 ... 95.25 30.13 No No Yes \n",
|
|||
|
"2 ... 108.86 31.66 Yes No No \n",
|
|||
|
"3 ... 90.72 31.32 No No Yes \n",
|
|||
|
"4 ... 79.38 33.07 No No Yes \n",
|
|||
|
"... ... ... ... ... ... ... \n",
|
|||
|
"246017 ... 102.06 32.28 Yes No No \n",
|
|||
|
"246018 ... 90.72 24.34 No No No \n",
|
|||
|
"246019 ... 83.91 29.86 Yes Yes Yes \n",
|
|||
|
"246020 ... 83.01 28.66 No Yes Yes \n",
|
|||
|
"246021 ... 108.86 32.55 No Yes Yes \n",
|
|||
|
"\n",
|
|||
|
" PneumoVaxEver TetanusLast10Tdap \\\n",
|
|||
|
"0 Yes Yes, received Tdap \n",
|
|||
|
"1 Yes Yes, received tetanus shot but not sure what type \n",
|
|||
|
"2 Yes No, did not receive any tetanus shot in the pa... \n",
|
|||
|
"3 Yes No, did not receive any tetanus shot in the pa... \n",
|
|||
|
"4 Yes No, did not receive any tetanus shot in the pa... \n",
|
|||
|
"... ... ... \n",
|
|||
|
"246017 No Yes, received tetanus shot but not sure what type \n",
|
|||
|
"246018 No No, did not receive any tetanus shot in the pa... \n",
|
|||
|
"246019 Yes Yes, received tetanus shot but not sure what type \n",
|
|||
|
"246020 No Yes, received tetanus shot but not sure what type \n",
|
|||
|
"246021 Yes No, did not receive any tetanus shot in the pa... \n",
|
|||
|
"\n",
|
|||
|
" HighRiskLastYear CovidPos SleepHours-HeightInMeters \n",
|
|||
|
"0 No No 7.40 \n",
|
|||
|
"1 No No 4.22 \n",
|
|||
|
"2 No Yes 6.15 \n",
|
|||
|
"3 No Yes 7.30 \n",
|
|||
|
"4 No No 3.45 \n",
|
|||
|
"... ... ... ... \n",
|
|||
|
"246017 No No 4.22 \n",
|
|||
|
"246018 No Yes 5.07 \n",
|
|||
|
"246019 No Yes 5.32 \n",
|
|||
|
"246020 No No 5.30 \n",
|
|||
|
"246021 No Yes 3.17 \n",
|
|||
|
"\n",
|
|||
|
"[246022 rows x 41 columns]"
|
|||
|
]
|
|||
|
},
|
|||
|
"execution_count": 43,
|
|||
|
"metadata": {},
|
|||
|
"output_type": "execute_result"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"df"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"Удаление строк с пустыми значениями"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 44,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"name": "stdout",
|
|||
|
"output_type": "stream",
|
|||
|
"text": [
|
|||
|
"State 0\n",
|
|||
|
"Sex 0\n",
|
|||
|
"GeneralHealth 0\n",
|
|||
|
"PhysicalHealthDays 0\n",
|
|||
|
"MentalHealthDays 0\n",
|
|||
|
"LastCheckupTime 0\n",
|
|||
|
"PhysicalActivities 0\n",
|
|||
|
"SleepHours 0\n",
|
|||
|
"RemovedTeeth 0\n",
|
|||
|
"HadHeartAttack 0\n",
|
|||
|
"HadAngina 0\n",
|
|||
|
"HadStroke 0\n",
|
|||
|
"HadAsthma 0\n",
|
|||
|
"HadSkinCancer 0\n",
|
|||
|
"HadCOPD 0\n",
|
|||
|
"HadDepressiveDisorder 0\n",
|
|||
|
"HadKidneyDisease 0\n",
|
|||
|
"HadArthritis 0\n",
|
|||
|
"HadDiabetes 0\n",
|
|||
|
"DeafOrHardOfHearing 0\n",
|
|||
|
"BlindOrVisionDifficulty 0\n",
|
|||
|
"DifficultyConcentrating 0\n",
|
|||
|
"DifficultyWalking 0\n",
|
|||
|
"DifficultyDressingBathing 0\n",
|
|||
|
"DifficultyErrands 0\n",
|
|||
|
"SmokerStatus 0\n",
|
|||
|
"ECigaretteUsage 0\n",
|
|||
|
"ChestScan 0\n",
|
|||
|
"RaceEthnicityCategory 0\n",
|
|||
|
"AgeCategory 0\n",
|
|||
|
"HeightInMeters 0\n",
|
|||
|
"WeightInKilograms 0\n",
|
|||
|
"BMI 0\n",
|
|||
|
"AlcoholDrinkers 0\n",
|
|||
|
"HIVTesting 0\n",
|
|||
|
"FluVaxLast12 0\n",
|
|||
|
"PneumoVaxEver 0\n",
|
|||
|
"TetanusLast10Tdap 0\n",
|
|||
|
"HighRiskLastYear 0\n",
|
|||
|
"CovidPos 0\n",
|
|||
|
"SleepHours-HeightInMeters 0\n",
|
|||
|
"dtype: int64\n"
|
|||
|
]
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"print(df.isna().sum())"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 45,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"text/html": [
|
|||
|
"<div>\n",
|
|||
|
"<style scoped>\n",
|
|||
|
" .dataframe tbody tr th:only-of-type {\n",
|
|||
|
" vertical-align: middle;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe tbody tr th {\n",
|
|||
|
" vertical-align: top;\n",
|
|||
|
" }\n",
|
|||
|
"\n",
|
|||
|
" .dataframe thead th {\n",
|
|||
|
" text-align: right;\n",
|
|||
|
" }\n",
|
|||
|
"</style>\n",
|
|||
|
"<table border=\"1\" class=\"dataframe\">\n",
|
|||
|
" <thead>\n",
|
|||
|
" <tr style=\"text-align: right;\">\n",
|
|||
|
" <th></th>\n",
|
|||
|
" <th>State</th>\n",
|
|||
|
" <th>Sex</th>\n",
|
|||
|
" <th>GeneralHealth</th>\n",
|
|||
|
" <th>PhysicalHealthDays</th>\n",
|
|||
|
" <th>MentalHealthDays</th>\n",
|
|||
|
" <th>LastCheckupTime</th>\n",
|
|||
|
" <th>PhysicalActivities</th>\n",
|
|||
|
" <th>SleepHours</th>\n",
|
|||
|
" <th>RemovedTeeth</th>\n",
|
|||
|
" <th>HadHeartAttack</th>\n",
|
|||
|
" <th>...</th>\n",
|
|||
|
" <th>WeightInKilograms</th>\n",
|
|||
|
" <th>BMI</th>\n",
|
|||
|
" <th>AlcoholDrinkers</th>\n",
|
|||
|
" <th>HIVTesting</th>\n",
|
|||
|
" <th>FluVaxLast12</th>\n",
|
|||
|
" <th>PneumoVaxEver</th>\n",
|
|||
|
" <th>TetanusLast10Tdap</th>\n",
|
|||
|
" <th>HighRiskLastYear</th>\n",
|
|||
|
" <th>CovidPos</th>\n",
|
|||
|
" <th>SleepHours-HeightInMeters</th>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </thead>\n",
|
|||
|
" <tbody>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>0</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>4.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>9.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>71.67</td>\n",
|
|||
|
" <td>27.99</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes, received Tdap</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>7.40</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>1</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>6.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>95.25</td>\n",
|
|||
|
" <td>30.13</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>4.22</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>2</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>8.0</td>\n",
|
|||
|
" <td>6 or more, but not all</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>108.86</td>\n",
|
|||
|
" <td>31.66</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>6.15</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>3</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Fair</td>\n",
|
|||
|
" <td>5.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>9.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>90.72</td>\n",
|
|||
|
" <td>31.32</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.30</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>4</th>\n",
|
|||
|
" <td>Alabama</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>3.0</td>\n",
|
|||
|
" <td>15.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>5.0</td>\n",
|
|||
|
" <td>1 to 5</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>79.38</td>\n",
|
|||
|
" <td>33.07</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>3.45</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>...</th>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246017</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past 2 years (1 year but less than 2 ye...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>6.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>102.06</td>\n",
|
|||
|
" <td>32.28</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>4.22</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246018</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Fair</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>90.72</td>\n",
|
|||
|
" <td>24.34</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>5.07</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246019</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>15.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>1 to 5</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>83.91</td>\n",
|
|||
|
" <td>29.86</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>5.32</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246020</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Female</td>\n",
|
|||
|
" <td>Excellent</td>\n",
|
|||
|
" <td>2.0</td>\n",
|
|||
|
" <td>2.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>7.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>83.01</td>\n",
|
|||
|
" <td>28.66</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes, received tetanus shot but not sure what type</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>5.30</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" <tr>\n",
|
|||
|
" <th>246021</th>\n",
|
|||
|
" <td>Virgin Islands</td>\n",
|
|||
|
" <td>Male</td>\n",
|
|||
|
" <td>Very good</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>0.0</td>\n",
|
|||
|
" <td>Within past year (anytime less than 12 months ...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>5.0</td>\n",
|
|||
|
" <td>None of them</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>...</td>\n",
|
|||
|
" <td>108.86</td>\n",
|
|||
|
" <td>32.55</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>No, did not receive any tetanus shot in the pa...</td>\n",
|
|||
|
" <td>No</td>\n",
|
|||
|
" <td>Yes</td>\n",
|
|||
|
" <td>3.17</td>\n",
|
|||
|
" </tr>\n",
|
|||
|
" </tbody>\n",
|
|||
|
"</table>\n",
|
|||
|
"<p>246022 rows × 41 columns</p>\n",
|
|||
|
"</div>"
|
|||
|
],
|
|||
|
"text/plain": [
|
|||
|
" State Sex GeneralHealth PhysicalHealthDays \\\n",
|
|||
|
"0 Alabama Female Very good 4.0 \n",
|
|||
|
"1 Alabama Male Very good 0.0 \n",
|
|||
|
"2 Alabama Male Very good 0.0 \n",
|
|||
|
"3 Alabama Female Fair 5.0 \n",
|
|||
|
"4 Alabama Female Good 3.0 \n",
|
|||
|
"... ... ... ... ... \n",
|
|||
|
"246017 Virgin Islands Male Very good 0.0 \n",
|
|||
|
"246018 Virgin Islands Female Fair 0.0 \n",
|
|||
|
"246019 Virgin Islands Male Good 0.0 \n",
|
|||
|
"246020 Virgin Islands Female Excellent 2.0 \n",
|
|||
|
"246021 Virgin Islands Male Very good 0.0 \n",
|
|||
|
"\n",
|
|||
|
" MentalHealthDays LastCheckupTime \\\n",
|
|||
|
"0 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"1 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"2 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"3 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"4 15.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"... ... ... \n",
|
|||
|
"246017 0.0 Within past 2 years (1 year but less than 2 ye... \n",
|
|||
|
"246018 7.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246019 15.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246020 2.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"246021 0.0 Within past year (anytime less than 12 months ... \n",
|
|||
|
"\n",
|
|||
|
" PhysicalActivities SleepHours RemovedTeeth HadHeartAttack \\\n",
|
|||
|
"0 Yes 9.0 None of them No \n",
|
|||
|
"1 Yes 6.0 None of them No \n",
|
|||
|
"2 No 8.0 6 or more, but not all No \n",
|
|||
|
"3 Yes 9.0 None of them No \n",
|
|||
|
"4 Yes 5.0 1 to 5 No \n",
|
|||
|
"... ... ... ... ... \n",
|
|||
|
"246017 Yes 6.0 None of them No \n",
|
|||
|
"246018 Yes 7.0 None of them No \n",
|
|||
|
"246019 Yes 7.0 1 to 5 No \n",
|
|||
|
"246020 Yes 7.0 None of them No \n",
|
|||
|
"246021 No 5.0 None of them Yes \n",
|
|||
|
"\n",
|
|||
|
" ... WeightInKilograms BMI AlcoholDrinkers HIVTesting FluVaxLast12 \\\n",
|
|||
|
"0 ... 71.67 27.99 No No Yes \n",
|
|||
|
"1 ... 95.25 30.13 No No Yes \n",
|
|||
|
"2 ... 108.86 31.66 Yes No No \n",
|
|||
|
"3 ... 90.72 31.32 No No Yes \n",
|
|||
|
"4 ... 79.38 33.07 No No Yes \n",
|
|||
|
"... ... ... ... ... ... ... \n",
|
|||
|
"246017 ... 102.06 32.28 Yes No No \n",
|
|||
|
"246018 ... 90.72 24.34 No No No \n",
|
|||
|
"246019 ... 83.91 29.86 Yes Yes Yes \n",
|
|||
|
"246020 ... 83.01 28.66 No Yes Yes \n",
|
|||
|
"246021 ... 108.86 32.55 No Yes Yes \n",
|
|||
|
"\n",
|
|||
|
" PneumoVaxEver TetanusLast10Tdap \\\n",
|
|||
|
"0 Yes Yes, received Tdap \n",
|
|||
|
"1 Yes Yes, received tetanus shot but not sure what type \n",
|
|||
|
"2 Yes No, did not receive any tetanus shot in the pa... \n",
|
|||
|
"3 Yes No, did not receive any tetanus shot in the pa... \n",
|
|||
|
"4 Yes No, did not receive any tetanus shot in the pa... \n",
|
|||
|
"... ... ... \n",
|
|||
|
"246017 No Yes, received tetanus shot but not sure what type \n",
|
|||
|
"246018 No No, did not receive any tetanus shot in the pa... \n",
|
|||
|
"246019 Yes Yes, received tetanus shot but not sure what type \n",
|
|||
|
"246020 No Yes, received tetanus shot but not sure what type \n",
|
|||
|
"246021 Yes No, did not receive any tetanus shot in the pa... \n",
|
|||
|
"\n",
|
|||
|
" HighRiskLastYear CovidPos SleepHours-HeightInMeters \n",
|
|||
|
"0 No No 7.40 \n",
|
|||
|
"1 No No 4.22 \n",
|
|||
|
"2 No Yes 6.15 \n",
|
|||
|
"3 No Yes 7.30 \n",
|
|||
|
"4 No No 3.45 \n",
|
|||
|
"... ... ... ... \n",
|
|||
|
"246017 No No 4.22 \n",
|
|||
|
"246018 No Yes 5.07 \n",
|
|||
|
"246019 No Yes 5.32 \n",
|
|||
|
"246020 No No 5.30 \n",
|
|||
|
"246021 No Yes 3.17 \n",
|
|||
|
"\n",
|
|||
|
"[246022 rows x 41 columns]"
|
|||
|
]
|
|||
|
},
|
|||
|
"execution_count": 45,
|
|||
|
"metadata": {},
|
|||
|
"output_type": "execute_result"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"df.dropna()  # Т.к. пропущенных значений нет, ни одна строка не удалена"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 46,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [],
|
|||
|
"source": [
|
|||
|
"#df.fillna(df.mean(), inplace=True)\n",
|
|||
|
"#df.fillna(df.median(), inplace=True)"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"Мы обрабатываем пустые значения для каждого столбца отдельно\n",
|
|||
|
"\n",
|
|||
|
"Мы можем заполнить пропуски средним или медианой, если это числовой столбец\n",
|
|||
|
"\n",
|
|||
|
"Мы заполняем средним, если в колонке нет выбросов; если выбросы есть, используем медиану, так как она к ним устойчива\n",
|
|||
|
"\n",
|
|||
|
"Если столбец категориальный, то мы можем заполнить пропуски модой (самым часто встречающимся значением)\n",
|
|||
|
"\n",
|
|||
|
"Если пропусков мало, то их можно просто удалить."
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"2. Возможности визуализации"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 47,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [],
|
|||
|
"source": [
|
|||
|
"import matplotlib.pyplot as plt"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 48,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"image/png": "iVBORw0KGgoAAAANSUhEUgAAA0EAAAHDCAYAAADiGhEjAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjkuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8hTgPZAAAACXBIWXMAAA9hAAAPYQGoP6dpAACDAElEQVR4nO3dd3wT9f8H8Fe6KV0U6GDvvVcpILMyRRTcyPCL4AAXiooiU4a4QEXw5wBFAUUZCsho2VBWZY9CoWzaAqV7N/f7oyQkzU4uuST3ej4efUCSy90nl8vdvT/j/VEIgiCAiIiIiIhIJjykLgAREREREZEjMQgiIiIiIiJZYRBERERERESywiCIiIiIiIhkhUEQERERERHJCoMgIiIiIiKSFQZBREREREQkKwyCiIiIiIhIVhgEERERERGRrDAIIiJZu3z5MhQKBZYtWyZ1UQxatmwZFAoFLl++7JDt5eTkICwsDL/99ptDtqepZ8+e6Nmzp9XvbdGihbgFshN936ktn93dvP/++4iKipK6GETkxhgEEZHbUt1oHjlyROqi6DV9+nQoFAr1n7+/P5o1a4YpU6YgKytLlG2sWLECCxYssOg9CxcuRGBgIJ555hkAwPz586FQKHD06FGt5QRBQKVKlaBQKJCcnKz1WkFBAXx9ffHcc8/ZVH57uHnzJqZPn45jx47pvDZ69GgEBARYtd6dO3dCoVDgzz//1Hq+qKgIjzzyCDw8PPDTTz9ZtW65efPNN3H8+HH8/fffUheFiNwUgyAikrXatWsjPz8fI0aMkKwMixcvxvLly/HFF1+gSZMmmD17Nvr37w9BEGxet6VBUHFxMRYuXIgXX3wRnp6eAIBu3boBAPbu3au17OnTp5GRkQEvLy/s27dP67XDhw+jqKhI/V5zbd26FVu3brXoPZa6efMmZsyYoTcIEltxcTGeeOIJbNq0Cd9//z3+97//AQBGjBiB/Px81K5d2+5lcEUREREYMmQIPvvsM6mLQkRuikEQEcmaQqGAn5+f+oZfCk888QSef/55vPzyy1izZg2GDh2K+Ph4HDhwwOFl2bBhA27fvo2nnnpK/VyHDh3g5+enEwTt27cPlStXRp8+fXReUz22NAjy8fGBj4+PlaV3LsXFxXjqqaewYcMGfPfddxgzZoz6NU9PT/j5+UGhUEhYwjK5ublSF0Gvp556Cnv37sWlS5ekLgoRuSEGQUQka/rGBKm6RN24cQOPPfYYAgICULVqVbzzzjsoLS3Ver9SqcSCBQvQvHlz+Pn5ITw8HC+99BLu3btndZl69+4NADpdzMr79ttv0bx5c/j6+qJatWoYP348MjIy1K/37NkTGzduxJUrV9Rd7urUqWN0nevWrUOdOnVQv3599XM+Pj7o2LGjTmvPvn37EB0dja5du+p9LSQkRD1Gx9z9pG9czJUrV/Doo4+iYsWKCAsLw1tvvYUtW7ZAoVBg586dOp/hzJkz6NWrF/z9/VG9enXMnz9f/drOnTvRsWNHAMALL7yg3i/GxoTVqVMHjzzyCPbu3YtOnTrBz88P9erVwy+//GLwPSUlJXjmmWewfv16LF68GGPHjtV63dxxXmlpaRgzZgzCw8Ph5+eH1q1b4+eff9ZZ7u7duxgxYgSCgoIQEhKCUaNG4fjx4waP7YsXL2LgwIEIDAzE8OHDAQB79uzBk08+iVq1asHX1xc1a9bEW2+9hfz8fK1tqdZx9epVPPLIIwgICED16tWxaNEiAMDJkyfRu3dvVKxYEbVr18aKFSu03l9cXIwZM2agYcOG8PPzQ+XKldGtWzds27ZNa7mYmBgAwPr1643uIyIiazAIIiLSo7S0FP369UPlypXx2WefoUePHvj888/xf//3f1rLvfTSS5g0aRK6du2KhQsX4oUXXsBvv/2Gfv36obi42KptX7x4EQBQuXJlg8tMnz4d48ePR7Vq1fD5559j2LBh+O6779C3b1/1dj/88EO0ad
MGVapUwfLly7F8+XKTXeP279+Pdu3a6TzfrVs33LhxQ+umfd++fejSpQu6dOmi7hoHlI0V2r9/P6Kjo+HhUXaZsXY/5ebmonfv3oiNjcXrr7+ODz/8EPv378d7772nd/l79+6hf//+aN26NT7//HM0adIE7733Hv79918AQNOmTTFz5kwAwLhx49T7pXv37kb3S1JSEp544gk8/PDD+Pzzz1GpUiWMHj0ap0+f1lm2pKQEzz77LNauXYtFixbhpZdeMrpuQ/Lz89GzZ08sX74cw4cPx6efforg4GCMHj0aCxcuVC+nVCoxePBgrFy5EqNGjcLs2bNx69YtjBo1Su96S0pK0K9fP4SFheGzzz7DsGHDAACrV69GXl4eXnnlFXz99dfo168fvv76a4wcOVJnHaWlpRgwYABq1qyJ+fPno06dOpgwYQKWLVuG/v37o0OHDvjkk08QGBiIkSNHagX006dPx4wZM9CrVy988803+PDDD1GrVi38999/WtsIDg5G/fr1dQJsIiJRCEREbmrp0qUCAOHw4cMGl0lOThYACEuXLlU/N2rUKAGAMHPmTK1l27ZtK7Rv3179eM+ePQIA4bffftNabvPmzXqfL2/atGkCACExMVG4ffu2kJycLHz33XeCr6+vEB4eLuTm5mp9juTkZEEQBCEtLU3w8fER+vbtK5SWlqrX98033wgAhJ9++kn93KBBg4TatWsbLYdKcXGxoFAohLffflvntY0bNwoAhOXLlwuCIAi3bt0SAAi7du0SsrOzBU9PT2Hjxo2CIAjCqVOnBADC7NmzLd5PPXr0EHr06KF+/PnnnwsAhHXr1qmfy8/PF5o0aSIAEHbs2KH1XgDCL7/8on6usLBQiIiIEIYNG6Z+7vDhwzrfucqoUaOEihUraj1Xu3ZtAYCwe/du9XNpaWmCr6+v1r7asWOHAEC9/KJFi3TWr1L+O9X32RcsWCAAEH799Vf1c0VFRUJ0dLQQEBAgZGVlCYIgCH/99ZcAQFiwYIF6udLSUqF3794Gj+33339fp0x5eXk6z82dO1dQKBTClStXdNYxZ84c9XP37t0TKlSoICgUCmHVqlXq58+dOycAEKZNm6Z+rnXr1sKgQYMM7htNffv2FZo2bWrWskRElmBLEBGRAS+//LLW44ceekhrfMLq1asRHByMhx9+GHfu3FH/tW/fHgEBAdixY4dZ22ncuDGqVq2KunXr4qWXXkKDBg2wceNG+Pv7610+NjYWRUVFePPNN9UtLQAwduxYBAUFYePGjVZ8WiA9PV2d8a28Ll26wMPDQz3WZ9++ffD29kbHjh0REBCAVq1aqWvsVf+qxgPZsp82b96M6tWr49FHH1U/5+fnp9O9TCUgIADPP/+8+rGPjw86depk87iSZs2a4aGHHlI/rlq1Kho3bqx3vampqfDy8kLdunVt2uamTZsQERGBZ599Vv2ct7c3Xn/9deTk5GDXrl0AyvaRt7e31j7x8PDA+PHjDa77lVde0XmuQoUK6v/n5ubizp076NKlCwRB0MkMCAAvvvii+v8hISFo3LgxKlasqDWerHHjxggJCdHaTyEhITh9+jQuXLhgahegUqVKuHPnjsnliIgs5SV1AYiInJGfnx+qVq2q9VylSpW0xrBcuHABmZmZCAsL07uOtLQ0s7b1119/ISgoCN7e3qhRo4bWeBx9rly5AqDsBlOTj48P6tWrp37dWoKerHQhISFo3ry5VqDTtm1b9Y1zly5dtF5TBR+AbfvpypUrqF+/vk4CgQYNGuhdvkaNGjrLVqpUCSdOnDC4DXPUqlVL57nyx4PK/PnzsWDBAjzxxBPYunUrunbtatU2r1y5goYNG2oFukBZlz7V66p/IyMjdYJmQ/vIy8sLNWrU0Hn+6tWrmDp1Kv7++2+dz5WZman1WN/vIzg4WO/+Dw4O1lrfzJkzMWTIEDRq1AgtWrRA//79MWLECLRq1UqnTIIgOEXyCCJyPwyCiIj0MCdbnF
KpNDqpaPmbREO6d++OKlWqWFQ+ewgNDYVCoTCY1KFbt25YsmQJMjIy1OOBVLp06YKffvoJxcXF2Lt3L9q3bw8/Pz8
|
|||
|
"text/plain": [
|
|||
|
"<Figure size 1000x500 with 1 Axes>"
|
|||
|
]
|
|||
|
},
|
|||
|
"metadata": {},
|
|||
|
"output_type": "display_data"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"#Линейная диаграмма\n",
|
|||
|
"plt.figure(figsize=(10, 5))\n",
|
|||
|
"df['WeightInKilograms'].plot(title='Line Plot (WeightInKilograms)')\n",
|
|||
|
"plt.show()"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 49,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"text/plain": [
|
|||
|
"<Figure size 800x500 with 0 Axes>"
|
|||
|
]
|
|||
|
},
|
|||
|
"metadata": {},
|
|||
|
"output_type": "display_data"
|
|||
|
},
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAlIAAAGhCAYAAACqMVpZAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjkuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8hTgPZAAAACXBIWXMAAA9hAAAPYQGoP6dpAABB0ElEQVR4nO3de1xVdb7/8TcXuahsEA2QEZXSVPKWmEhTnRxJVOpoUkfNipTslwdNZfLWGJo1o+Hx1nihphLnpJP6OOaUJsZgapPkBSUvKWOmYaMbnRS2UlyE9fujwzpuoYtLdAO+no/Hejzc6/vZ3/XZe7EfvF2stbabYRiGAAAAcNXcXd0AAABAfUWQAgAAsIggBQAAYBFBCgAAwCKCFAAAgEUEKQAAAIsIUgAAABYRpAAAACwiSAEAAFhEkAIAALDIpUGqoqJCL774osLDw+Xr66vbbrtNL7/8si7/1hrDMJSSkqKWLVvK19dXMTExOnr0qNM8586d04gRI2Sz2RQQEKDExERdvHjRqWb//v2699575ePjo7CwMKWmplbrZ+3aterYsaN8fHzUpUsXffjhh9fnhQMAgAbBpUHq1Vdf1bJly7R48WIdPnxYr776qlJTU/XHP/7RrElNTdVrr72mtLQ07dy5U02aNFFsbKxKSkrMmhEjRujQoUPKzMzUhg0btH37dj3zzDPmuMPhUL9+/dSmTRvl5ORo7ty5mjlzpt544w2zZseOHRo+fLgSExO1b98+DR48WIMHD9bBgwdvzJsBAADqHTdXfmnxgw8+qODgYL311lvmuvj4ePn6+uqdd96RYRgKDQ3Vb3/7Wz3//POSpKKiIgUHBys9PV3Dhg3T4cOHFRERod27d6tnz56SpIyMDA0cOFDffPONQkNDtWzZMv3ud7+T3W6Xl5eXJGnq1Klav369jhw5IkkaOnSoiouLtWHDBrOX3r17q3v37kpLS/vZ11JZWalTp07Jz89Pbm5utfYeAQCA68cwDF24cEGhoaFyd7dwfMlwod///vdGmzZtjLy8PMMwDCM3N9cICgoy3nnnHcMwDOPYsWOGJGPfvn1Oz7vvvvuM5557zjAMw3jrrbeMgIAAp/Hy8nLDw8PDWLdunWEYhvHEE08YgwYNcqrZsmWLIck4d+6cYRiGERYWZixYsMCpJiUlxejatWuNvZeUlBhFRUXm8sUXXxiSWFhYWFhYWOrhcvLkyavOMYZhGJ5yoalTp8rhcKhjx47y8PBQRUWFfv/732vEiBGSJLvdLkkKDg52el5wcLA5ZrfbFRQU5DTu6empwMBAp5rw8PBqc1SNNWvWTHa7/Se3c6XZs2frpZdeqrb+5MmTstlsv+j1AwAA13I4HAoLC5Ofn5+l57s0SK1Zs0YrV67UqlWrdMcddyg3N1cTJkxQaGioEhISXNnaz5o2bZqSk5PNx1U7wmazEaQAAKhnrJ6W49IgNWnSJE2dOlXDhg2TJHXp0kVff/21Zs+erYSEBIWEhEiSCgoK1LJlS/N5BQUF6t69uyQpJCREZ86ccZr30qVLOnfunPn8kJAQFRQUONVUPf65mqrxK3l7e8vb29vKywYAAA2ES6/a++6776qd2OXh4aHKykpJUnh4uEJCQpSVlWWOOxwO7dy5U9HR0ZKk6OhoFRYWKicnx6zZsmWLKisrFRUVZdZs375d5eXlZk1mZqY6dOigZs2amTWXb6eqpmo7AAAA1Vg6s6qWJCQkGL/61a+MDRs2GMePHzfWrVtntGjRwpg8ebJZM2fOHCMgIMD461//auzfv98YNGiQER4ebnz//fdmTf/+/Y0777zT2Llzp/H3v//daN++vTF8+HBzvLCw0AgODjaeeOIJ4+DBg8a7775rNG7c2Hj99dfNmk8//dTw9PQ0/uu//ss4fPiwMWPGDKNRo0bGgQMHftFrKSoqMiQZRUVFtfDOAACAG+Faf3+79PYHFy5c0Isvvqj33ntPZ86cUWhoqI
YPH66UlBTzNgWGYWjGjBl64403VFhYqHvuuUdLly7V7bffbs5z7tw5jR07Vh988IHc3d0VHx+v1157TU2bNjVr9u/fr6SkJO3evVstWrTQuHHjNGXKFKd+1q5dq+nTp+vEiRNq3769UlNTNXDgwF/0WhwOh/z9/VVUVMQ5UgBQBxmGoUuXLqmiosLVreAG8vDwkKen54+eA3Wtv79dGqQaEoIUANRdZWVlOn36tL777jtXtwIXaNy4sVq2bGkepLnctf7+dunJ5gAAXG+VlZU6fvy4PDw8FBoaKi8vL26cfJMwDENlZWU6e/asjh8/rvbt21u76eZPIEgBABq0srIyVVZWKiwsTI0bN3Z1O7jBfH191ahRI3399dcqKyuTj49Prc7v0qv2AAC4UWr7SATqj+u57/mpAgAAsIggBQAAYBHnSAEAblptp268ods7MSeu1ud0c3PTe++9p8GDB9f63Ph5HJECAKAOO3v2rMaMGaPWrVvL29tbISEhio2N1aeffuqynk6cOCE3Nzfl5uZWG7v//vs1YcKEG96Tq3BECgCAOiw+Pl5lZWVasWKFbr31VhUUFCgrK0vffvutq1tzmbKyshrvCeUKHJECAKCOKiws1CeffKJXX31Vffr0UZs2bdSrVy9NmzZN//7v/17jc06ePKn/+I//UEBAgAIDAzVo0CCdOHHCqebNN99Up06d5OPjo44dO2rp0qXmWNXRpnfffVd33323fHx81LlzZ23bts3Sazh//ryefPJJNWvWTI0bN9aAAQN09OhRc3zmzJnq3r2703MWLlyotm3bmo+feuopDR48WL///e8VGhqqDh06SJKWLl2q9u3by8fHR8HBwXrkkUcs9XgtOCIF3AA/dh7G9ThfAkDD0bRpUzVt2lTr169X79695e3t/ZP15eXlio2NVXR0tD755BN5enrqlVdeUf/+/bV//355eXlp5cqVSklJ0eLFi3XnnXdq3759Gj16tJo0aaKEhARzrkmTJmnhwoWKiIjQ/Pnz9dBDD+n48eNq3rz5Vb2Gp556SkePHtX7778vm82mKVOmaODAgfriiy/UqFGjXzxPVlaWbDabMjMzJUl79uzRc889p//+7//W3XffrXPnzumTTz65qt5qA0EKAIA6ytPTU+np6Ro9erTS0tLUo0cP/du//ZuGDRumrl27VqtfvXq1Kisr9eabb5p3b1++fLkCAgK0detW9evXTzNmzNC8efM0ZMgQSVJ4eLi++OILvf76605BauzYsYqPj5ckLVu2TBkZGXrrrbc0efJks+buu++udo+m77//3jzCVBWgPv30U919992SpJUrVyosLEzr16/Xo48++ovfiyZNmujNN980/6S3bt06NWnSRA8++KD8/PzUpk0b3Xnnnb94vtrCn/YAAKjD4uPjderUKb3//vvq37+/tm7dqh49eig9Pb1a7eeff64vv/xSfn5+5tGswMBAlZSU6NixYyouLtaxY8eUmJhojjdt2lSvvPKKjh075jRXdHS0+W9PT0/17NlThw8fdqpZvXq1cnNznZaePXua44cPH5anp6eioqLMdc2bN1eHDh2qzfVzunTp4nRe1AMPPKA2bdro1ltv1RNPPKGVK1e65LsUOSIFAEAd5+PjowceeEAPPPCAXnzxRT399NOaMWOGnnrqKae6ixcvKjIyUitXrqw2xy233KKLFy9Kkv70pz85hRtJ8vDwuOq+wsLC1K5dO6d1vr6+VzWHu7u7DMNwWldeXl6trkmTJk6P/fz8tHfvXm3dulUfffSRUlJSNHPmTO3evVsBAQFX1cO14IgUAAD1TEREhIqLi6ut79Gjh44ePaqgoCC1a9fOafH391dwcLBCQ0P11VdfVRsPDw93muuzzz4z/33p0iXl5OSoU6dOV9Vnp06ddOnSJe3cudNc9+233yovL08RERGSfgh4drvdKUzVdFuFmnh6eiomJkapqanav3+/Tpw4oS1btlxVj9eKI1IAAN
RR3377rR599FGNGjVKXbt2lZ+fn/bs2aPU1FQNGjSoWv2IESM0d+5cDRo0SLNmzVKrVq309ddfa926dZo8ebJatWq
|
|||
|
"text/plain": [
|
|||
|
"<Figure size 640x480 with 1 Axes>"
|
|||
|
]
|
|||
|
},
|
|||
|
"metadata": {},
|
|||
|
"output_type": "display_data"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"#Гистограмма\n",
|
|||
|
"plt.figure(figsize=(8, 5))\n",
|
|||
|
"df.plot.hist(column=[\"SleepHours\"], bins=80)\n",
|
|||
|
"plt.show()"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 50,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"image/png": "iVBORw0KGgoAAAANSUhEUgAAArUAAAIzCAYAAAAeSeGEAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjkuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8hTgPZAAAACXBIWXMAAA9hAAAPYQGoP6dpAABlD0lEQVR4nO3dd3gU5cL+8XuTkAoJUpIQCL0XKUEwoHQJigJWRFRAEOGACnhQsNAtR0GFQ1MpsQCCKKAgvUqRXgQhFEFQTGhCKNKS5/eHv+zLmgQSSJg8nO/nuvZ63Xmenb13Mu/JzWRm1mWMMQIAAAAs5uV0AAAAAOBGUWoBAABgPUotAAAArEepBQAAgPUotQAAALAepRYAAADWo9QCAADAepRaAAAAWI9SCwAAAOtRagFAUvv27VW8ePGb9n7r1q2Tr6+vfv3115v2nsg6ly5dUmRkpEaPHu10FAD/H6UWQLaIjY2Vy+XyeISGhqphw4aaO3fuTcvRoEEDjwz58uXTHXfcoQkTJig5OTlL3uOtt97SzJkzM/Wa1157TW3atFGxYsXSHK9Vq5ZcLpfGjBmTBQkzZ9myZXrooYcUHh4uX19fhYaG6oEHHtA333yT6XWdO3dOAwYM0LJly7I+qINy5cqlXr166c0339T58+edjgNAlFoA2WzQoEH6/PPP9dlnn+nll1/W0aNHdd9992n27Nk3LUORIkX0+eef6/PPP9cbb7yhy5cvq2PHjnr11VezZP2ZLbVbtmzRokWL1KVLlzTH9+zZo/Xr16t48eKaNGlSlmTMqP79+6thw4bavn27nnvuOY0dO1a9e/fWmTNn9PDDD2vy5MmZWt+5c+c0cODAW67USlKHDh107NixTG8TANnDx+kAAG5t9957r2rWrOl+3rFjR4WFhWnKlCm6//77b3j9ycnJunjxovz9/dOdExISoieffNL9/LnnnlO5cuU0cuRIDR48WLly5brhHJkxceJEFS1aVHfeeWea41988YVCQ0M1bNgwPfLIIzpw4MBNOTVi+vTpGjRokB555BFNnjzZY7v07t1b8+fP16VLl7I9h1POnTunwMDADM/PmzevmjZtqtjYWD3zzDPZmAxARnCkFsBNlTdvXgUEBMjHx/Pf1EOHDlWdOnWUP39+BQQEKCoqStOnT0/1epfLpe7du2vSpEmqVKmS/Pz8NG/evExlCAwM1J133qmzZ8/q6NGj6c47e/asXnrpJUVGRsrPz0/lypXT0KFDZYzxyHP27Fl9+umn7lMc2rdvf9X3nzlzpho1aiSXy5Xm+OTJk/XII4/o/vvvV0hISLpHApctW6aaNWvK399fpUqV0kcffaQBAwakud4vvvhCUVFRCggIUL58+fT444/r0KFDHnPeeOMN5cuXTxMmTEiz6MfExLj/IXLx4kX169dPUVFRCgkJUVBQkO6++24tXbrUPf/AgQMqWLCgJGngwIHu7TNgwAD3nF27dumRRx5Rvnz55O/vr5o1a+rbb79N9d7btm1T/fr1FRAQoCJFimjIkCGaOHGiXC6XDhw44DF39OjR7n0jIiJC3bp108mTJz3mNGjQQJUrV9bGjRtVr149BQYG6tVXX1W7du1UoECBNMt706ZNVa5cOY9l99xzj1auXKkTJ06kmg/g5uJILYBsderUKR07dkzGGB05ckT//e9/debMGY8jp5I0fPhwtWjRQm3bttXFixf15Zdf6tFHH9Xs2bPVvHlzj7lLlizRtGnT1L17dxUoUOC6jmL+8ssv8vb2Vt68edMcN8aoRYsWWrp0qTp27Khq1app/vz56t27t37//Xd98MEHkqTPP/9cnTp1Uq1atdS5c2dJUqlSpdJ9399//10HDx5UjRo10hxfu3at9u7dq4kTJ8rX11cPPfSQJk2alOpUic2bN6tZs2YqVKiQBg4cqKSkJA0aNMhdIq/05ptv6o033tBjjz2mTp066ejRo/rvf/+revXqafPmzc
qbN6/27NmjXbt26ZlnnlGePHmuuf0SExM1btw4tWnTRs8++6xOnz6t8ePHKyYmRuvWrVO1atVUsGBBjRkzRl27dtWDDz6ohx56SJJ0++23S5J27NihunXrqnDhwurTp4+CgoI0bdo0tWrVSl9//bUefPBB9zZr2LChXC6X+vbtq6CgII0bN05+fn6pcg0YMEADBw5UkyZN1LVrV8XFxWnMmDFav369Vq1a5VHWjx8/rnvvvVePP/64nnzySYWFhSkoKEifffaZ5s+f7/GXhPj4eC1ZskT9+/f3eL+oqCgZY7R69eos+csDgBtgACAbTJw40UhK9fDz8zOxsbGp5p87d87j+cWLF03lypVNo0aNPJZLMl5eXmbHjh0ZylG/fn1Tvnx5c/ToUXP06FGzc+dO88ILLxhJ5oEHHnDPa9eunSlWrJj7+cyZM40kM2TIEI/1PfLII8blcpm9e/e6lwUFBZl27dplKM+iRYuMJPPdd9+lOd69e3cTGRlpkpOTjTHGLFiwwEgymzdv9pj3wAMPmMDAQPP777+7l+3Zs8f4+PiYK/+n/cCBA8bb29u8+eabHq//6aefjI+Pj3v5rFmzjCTzwQcfZOhzXL582Vy4cMFj2Z9//mnCwsLMM88841529OhRI8n0798/1ToaN25sqlSpYs6fP+9elpycbOrUqWPKlCnjXvb8888bl8vlsQ2OHz9u8uXLZySZ/fv3G2OMOXLkiPH19TVNmzY1SUlJ7rkjR440ksyECRPcy+rXr28kmbFjx3pkSkpKMkWKFDGtW7f2WP7+++8bl8tlfvnlF4/lhw8fNpLMf/7zn3S2FICbhdMPAGSrUaNGaeHChVq4cKG++OILNWzYUJ06dUp1JX1AQID7v//880+dOnVKd999tzZt2pRqnfXr11fFihUznGHXrl0qWLCgChYsqAoVKui///2vmjdvrgkTJqT7mu+//17e3t564YUXPJa/9NJLMsZc9x0cjh8/Lkm67bbbUo1dvnxZU6dOVevWrd2nEDRq1EihoaEeF4wlJSVp0aJFatWqlSIiItzLS5curXvvvddjnd98842Sk5P12GOP6dixY+5HeHi4ypQp4z5dIDExUZIydJRWkry9veXr6yvp7/OaT5w4ocuXL6tmzZpp/sz+6cSJE1qyZIkee+wxnT592p3r+PHjiomJ0Z49e/T7779LkubNm6fo6GhVq1bN/fp8+fKpbdu2HutctGiRLl68qB49esjL6/9+vT377LMKDg7WnDlzPOb7+fmpQ4cOHsu8vLzUtm1bffvttzp9+rR7+aRJk1SnTh2VKFHCY37Kz/HYsWPX/MwAshenHwDIVrVq1fK4UKxNmzaqXr26unfvrvvvv99djGbPnq0hQ4Zoy5YtunDhgnt+WueH/rNYXEvx4sX1ySefyOVyyd/fX2XKlFFoaOhVX/Prr78qIiIiVcmrUKGCe/xGmCvOy02xYMECHT16VLVq1dLevXvdyxs2bKgpU6boP//5j7y8vHTkyBH99ddfKl26dKp1/HPZnj17ZIxRmTJl0syR8uf44OBgSfIoctfy6aefatiwYdq1a5fHOagZ+fns3btXxhi98cYbeuONN9Kcc+TIERUuXFi//vqroqOjU43/87Om/Ez+ed6rr6+vSpYsmepnVrhwYff+d6Wnn35a//nPfzRjxgw9/fTTiouL08aNGzV27NhUc1N+jumdHw3g5qHUAripvLy81LBhQw0fPlx79uxRpUqV9MMPP6hFixaqV6+eRo8erUKFCilXrlyaOHFimhdJXXlUNyOCgoLUpEmTrPoINyR//vyS/j4a/U8pR2Mfe+yxNF+7fPlyNWzYMFPvl5ycLJfLpblz58rb2zvVeO7cuSVJ5cuXlyT99NNPGVrvF198ofbt26tVq1bq3bu3QkND5e3trbffflv79u3LUC5J+ve//62YmJg056RV2rNSevtRxYoVFRUVpS+++EJPP/20vvjiC/n6+qb5c0n5OR
YoUCBbswK4NkotgJvu8uXLkqQzZ85Ikr7++mv5+/tr/vz5Hhf/TJw40ZF8klSsWDEtWrRIp0+f9jhau2vXLvd4isw
|
|||
|
"text/plain": [
|
|||
|
"<Figure size 800x500 with 1 Axes>"
|
|||
|
]
|
|||
|
},
|
|||
|
"metadata": {},
|
|||
|
"output_type": "display_data"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"plt.figure(figsize=(8, 5))\n",
|
|||
|
"df['AgeCategory'].value_counts().plot(kind='bar', title='Bar Plot (AgeCategory)')\n",
|
|||
|
"plt.show()"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 53,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAqQAAAHDCAYAAADyXwjWAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjkuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8hTgPZAAAACXBIWXMAAA9hAAAPYQGoP6dpAAAt9klEQVR4nO3deXhU5d3/8c8kIYsJmSxmhQB5gBYVFKsWAVGQXAYECyVqqbhAsFoBFRQoUFGxShRFBIvwyEMBFZdHBAStEUWCUcIilVbUB5GdbICQGRKzMZnfH/wYGbYQPcmdmbxf1zWXM/f5zjnf+Mf48T73OcfmdrvdAgAAAAwJMN0AAAAAmjYCKQAAAIwikAIAAMAoAikAAACMIpACAADAKAIpAAAAjCKQAgAAwCgCKQAAAIwikAIAAMAoAikAAACMIpACaPSKi4t1zz33qFWrVmrWrJlsNpvn1aZNG9PtAQB+oSDTDQDAuVRUVOjaa6/Vjh07NGzYMHXp0kWhoaGSpOnTp+vIkSOGOwQA/FIEUgCN2vLly/Xdd99p4sSJmjp1qte2N998k0AKAH6AU/YAGrUdO3ZIkq655przqrfZbBo1apTXWP/+/U87tb9kyRLZbDbl5OR4xhYuXCibzabdu3d7xmpqanTppZfKZrNp4cKFnvGhQ4eets/XXntNAQEBevrpp2vts6SkRGPGjFGbNm0UEhKili1b6s4779ShQ4fO+p3rrrtOl1122Rm3/frXv1Z6erpX3zNnzlSnTp0UGhqquLg49enTR1988YWnZsGCBbr++usVHx+vkJAQXXzxxZozZ85p+27Tpo1sNptGjx592rb09HTZbDb179/fM5aTk3Pav1tJ6tevn2w2mx5//PGz/o0AmiYCKYBGLSYmRpK8QmJDevXVV/XVV1/VWrdq1SplZmZq1KhRmjBhwjlrS0tL1aNHD7344ou64YYbNHPmTP35z3/W//3f/2n//v1n/d4dd9yh//znP9q6davX+KZNm/Tdd9/p9ttv94wNHz5co0ePVkpKip555hlNmDBBoaGhWr9+vadmzpw5at26tSZNmqTp06crJSVFI0aM0OzZs087dmhoqBYvXqzq6mrP2P79+7V69WrPEopz+fTTT/XPf/6z1joATROn7AE0agMGDNCECRP0xBNPKCEhwWsN6cnhqD5UVlbq0UcfVd++ffXBBx+ctW7z5s3KyMjQwIED9cILL9S632effVZbt27V0qVL9fvf/94z/sgjj8jtdp/1e7fccovuv/9+vfbaa16zsK+99prCw8M1aNAgSdKaNWu0cOFCPfDAA5o5c6an7uGHH/ba/9q1axUWFub5PGrUKPXp00fPP/+8Ro4c6XXsHj166Msvv9SKFSuUkZEh6fiMcpcuXZSfn1/r3zx+/Pha/z0CaLqYIQXQqCUnJ2vdunXq1KmTbr75ZqWkpCguLk5xcXFatWpVvR579uzZ+uGHH/TYY4+dtWbnzp3q16+fOnfurFdffVUBAbX/rL7zzju67LLLvMLoCTab7azfs9vtGjBggN544w1PsHS5XHrrrbc0cOBAhYeHe/Zvs9nO2PfJ+z85jDocDh06dEjXXXeddu7cKYfD4fW94OBgDRkyRAsWLPCMLVy4UMOGDav17126dKk2bdp0XksZADRNBFIAjd4ll1yiDz74QG3btlXLli310Ucf6aOPPlKXLl3q7ZgOh0NTp07VQw89pISEhDPWlJWVKT09XcXFxTp8+PA5w+TJduzYoY4dO/6svu68807t3btXubm5kqSPP/5YxcXFuuOOO7z2n5yc7FnucDaff/650tLSFB4erqioKMXFxWnSpEmSdFoglaRhw4YpOztbhYWFWrt2rQoLC3Xrrbee8xgul0uTJk3SkCFDdOmll9b1zwXQRBBIAfiEuXPnaseOHcrKylJaWprS0tJ04YUX1tvxnnnmGQUEBGjcuHFnrTl06JCqq6u1cuVKbdu2TV
lZWfXWzwnp6elKSEjQa6+9Jun46frExESlpaXVaT87duxQ7969dejQIT3//PN6//339dFHH2nMmDGSjl8UdarLLrtMl112mV555RUtWLBAGRkZioyMPOdx5s+fr927d+tvf/tbnfoD0LQQSAE0eg6HQ1OmTNFVV12lIUOG1PvxCgoKNHPmTD3yyCNq3rz5WesuuOACZWdnq3///hozZoymTp2qb7/9ttb9t23b9rQLk85XYGCgbrvtNi1ZskRHjhzR8uXL9cc//lGBgYFe+y8oKNDhw4fPup+VK1eqsrJSK1as0L333qsbb7xRaWlpXqfxzyQzM1Pz5s3TkiVLaj1d/+OPP2rKlCkaMWKEWrduXbc/FECTQiAF0OhNnTpVhw4d0owZM877tPgvMWXKFCUkJOjPf/7zOevi4uLUoUMHSdITTzyhli1b6k9/+tM5L0ySpIyMDP373//WsmXLTttW23el41fbHzlyRPfee69KS0u9rq4/sX+3260pU6acdf8nAuzJx3M4HF5rRM/ktttuU35+vuLj49WzZ89z1s6cOVNlZWX661//WuvfBKBp4yp7AI3anj17NGvWLN16663q3r37eX1n7969ys7O9nw+ePCgysvLvca2bNkiSdq4caPat2+vFi1aeLatWrVKixcvVnBw8Hn3GRYWppdffllpaWmaM2eORowYcdbacePGacmSJbrllluUmZmpK664QocPH9aKFSs0d+7cs95r9ITLL79cHTt21Ntvv62LLrpIv/nNb7y29+rVS3fccYdmzZql7du3q0+fPqqpqVFubq569eqlUaNG6YYbblBwcLBuuukmT7CdN2+e4uPjVVhYeNZjR0dHq7CwUIGBgbX+z8GqVav01FNPKTY29px1AEAgBdCoTZo0SW63W88888x5f2flypVauXLlaeN9+/Y9bewvf/mL4uPjNXToUM9Y586d9cc//rHOvfbu3VvDhg3TxIkTNWDAAK+Qe7KIiAjl5ubqscce07Jly7Ro0SLFx8erd+/eatmy5Xkd684779T48eO9LmY62YIFC3TppZdq/vz5GjdunOx2u6688kp169ZN0vEb6S9ZskSPPPKIxo4dq8TERN13332Ki4tTZmbmOY8dFRV1Xj0mJSWd8Wb6AHAqm/t8zg8BgJ/q2bOnhg4d6hVIfcHMmTM1ZswY7d69W61atTLdDgD8IqwhBQAf43a7NX/+fF133XWEUQB+gVP2AJq03/72t2c9td7YlJWVacWKFVqzZo2++uorvfvuu6ZbAgBLcMoeAHzE7t27lZqaqqioKI0YMUJPPfWU6ZYAwBIEUgAAABjFGlIAAAAYRSAFAACAUT55UVNNTY0KCgrUvHnzBnlqCwAAAOrG7Xbr6NGjSk5OVkDAuedAfTKQFhQUKCUlxXQbAAAAqMW+fftqfeiHTwbS5s2bSzr+B0ZGRhruBgAAAKdyOp1KSUnx5LZz8clAeuI0fWRkJIEUAACgETuf5ZVc1AQAAACj6hxIP/30U910001KTk6WzWbT8uXLvba73W49+uijSkpKUlhYmNLS0rR9+3avmsOHD2vIkCGKjIxUVFSUhg8frtLS0l/0hwAAAMA31TmQlpWV6bLLLtPs2bPPuH3atGmaNWuW5s6dqw0bNig8PFzp6emqqKjw1AwZMkRff/21PvroI7333nv69NNPdc899/z8vwIAAAA+6xc9qclms2nZsmUaOHCgpOOzo8nJyXr44Yc1duxYSZLD4VBCQoIWLlyowYMH69tvv9XFF1+sTZs26corr5QkZWdn68Ybb9T+/fuVnJxc63GdTqfsdrscDgdrSAEAABqhuuQ1S9eQ7tq1S0VFRUpLS/OM2e12denSRXl5eZKkvLw8RUVFecKoJKWlpSkgIEAbNmw4434rKyvldDq9XgAAAPAPlgbSoqIiSVJCQoLXeEJCgmdbUVGR4uPjvbYHBQUpJibGU3OqrKws2e12z4t7kAIAAPgPn7jKfuLEiX
I4HJ7Xvn37TLcEAAAAi1gaSBMTEyVJxcXFXuPFxcWebYmJiTpw4IDX9mPHjunw4cOemlOFhIR47jnKvUcBAAD8i6W
|
|||
|
"text/plain": [
|
|||
|
"<Figure size 800x500 with 1 Axes>"
|
|||
|
]
|
|||
|
},
|
|||
|
"metadata": {},
|
|||
|
"output_type": "display_data"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"plt.figure(figsize=(8, 5))\n",
|
|||
|
"df[\"BMI\"].plot(kind = \"box\", title='Ящик с усами')\n",
|
|||
|
"plt.show()"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": null,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"text/plain": [
|
|||
|
"<Figure size 800x500 with 0 Axes>"
|
|||
|
]
|
|||
|
},
|
|||
|
"metadata": {},
|
|||
|
"output_type": "display_data"
|
|||
|
},
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAjMAAAGzCAYAAADaCpaHAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjkuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8hTgPZAAAACXBIWXMAAA9hAAAPYQGoP6dpAAC+CElEQVR4nO2deZwkRZn3f1nVXdX3NUf3zDAXw8g5cgw6DijgMsshKAguIIiACq4LKqKC7Csg6Iqi6+KB4AmogyiuILrKLnKpOJxyH8MMcx993911V7x/VGVmRGTkVZV1dT/f+fRUVWZkxBMRTzzxxJGZGmOMgSAIgiAIokYJVVoAgiAIgiCIYiBnhiAIgiCImoacGYIgCIIgahpyZgiCIAiCqGnImSEIgiAIoqYhZ4YgCIIgiJqGnBmCIAiCIGoacmYIgiAIgqhpyJkhCIIgCKKmIWeGIKqI4447Dscdd1zZ0vv1r3+Nrq4uTE5Oli1NYvbxjne8A1deeWWlxSBmMOTMEDXP97//fWiahjVr1lRaFFuWLVsGTdOMv/nz5+Nd73oX7r333kDin56expe+9CU8+uijnq/JZDK47rrr8MlPfhItLS3K8wsXLoSmafjTn/4UiJx+uPfee3HyySdj7ty5iEQiWLhwIc466yw8/PDDvuPas2cPvvSlL+H5558PXtAa4Y477hB0UNfDd7/73cr61cN87GMfU8b3//7f/zPCDA4OGscvvPBCiz5dddVVuOWWW9Db2xtspggiDzkzRM2zfv16LFu2DE899RQ2b95caXFsOeyww/Dzn/8cP//5z/G5z30Oe/bswRlnnIHbbrut6Linp6dx/fXX+3Jmfv/732Pjxo245JJLlOcffvhh7N27F8uWLcP69euLltErjDFcdNFFOOOMM9DX14crrrgCt912Gy699FJs2bIFxx9/PP7+97/7inPPnj24/vrrZ7Uzo3PDDTfg5z//OX72s5/hyiuvxMDAAN7znvfgD3/4gyVsQ0MD/vu//xvJZNJy7pe//CUaGho8pXnaaaehra0N3//+94uWnyCUMIKoYbZs2cIAsN/+9rds3rx57Etf+pKn61KpFEskEiWWzmTp0qXslFNOEY7t3buXNTc3s7e85S3GsWOPPZYde+yxvuMfGBhgANh1113n+Zr3ve997J3vfKft+Q9/+MPsiCOOYN/+9rdZc3Mzm5yc9C1XIXzjG99gANjll1/Ostms5fzPfvYz9uSTT/qK8+mnn2YA2O233x6QlKUhm82y6enpksR9++23MwDs6aefFo4PDw+z+vp6du655wrHAbDTTz+dhUIhdt999wnnHn/8cQaAnXnmmQwAGxgYMM5dcMEFrLm52ZL+ZZddxpYuXaqsU4IoFpqZIWqa9evXo7OzE6eccgo+8IEPKGcQtm3bBk3T8M1vfhM333wzVqxYgWg0ildffRUA8Prrr+MDH/gAurq60NDQgCOPPBL333+/EMfw8DA+97nPYdWqVWhpaUFbWxtOPvlkvPDCCwXL3tPTgwMPPBBbt251DNff34+PfvSj6O7uRkNDAw499FDceeedQv7mzZsHALj++uuNqf8vfelLtnHG43E88MADWLdunfJ8LBbDvffei3POOQdnnXUWYrEYfve73ynD3nPPPTjooIPQ0NCAQw45BPfeey8uvPBCLFu2TAiXzWZx88034+CDD0ZDQwO6u7vx8Y9/HCMjI0K6N954Iw444AB885vfhKZplvTOP/98vP3tbwfgrV4effRRvO1tbwMAXHTRRUb53HHHHUaYJ598EieddBLa29vR1NSEY489Fo8//rgl7UcffRRHHnkkGhoasGLFCvzgBz/Al770JYuc6XQaX/7ylw1dW7ZsGf793/8diURCCLds2TKceuqp+N///V8ceeSRaGxsxA9+8AMce+yxOPTQQ5Xlvf/+++PEE09UniuEjo4ONDY2oq6uznJu0aJFOOaYY3DXXXcJx9evX4
9Vq1bhkEMO8ZzOP//zP2P79u00O0aUBKv2EkQNsX79epxxxhmIRCL44Ac/iFtvvRVPP/200Xnx3H777YjH47jkkksQjUbR1dWFV155BUcffTQWLVqEL3zhC2hubsavf/1rnH766fjv//5vvP/97wcAbNmyBffddx/+5V/+BcuXL0dfX5/R6bz66qtYuHChb9lTqRR27tyJOXPm2IaJxWI47rjjsHnzZlx22WVYvnw57rnnHlx44YUYHR3Fpz/9acybNw+33norPvGJT+D9738/zjjjDADAW9/6Vtt4n332WSSTSRxxxBHK8/fffz8mJydxzjnnoKenB8cddxzWr1+Pc889Vwj3P//zPzj77LOxatUq3HjjjRgZGcFHP/pRLFq0yBLnxz/+cdxxxx246KKL8KlPfQpbt27F9773PTz33HN4/PHHUV9fj7/97W8YHh7G5ZdfjnA47FqGXurlwAMPxA033IBrr70Wl1xyCd71rncBAI466igAueW0k08+GatXr8Z1112HUCiE22+/Hf/0T/+Ev/71r4bj9Nxzz+Gkk07CggULcP311yOTyeCGG24wHEmej33sY7jzzjvxgQ98AJ/97Gfx5JNP4sYbb8Rrr71m2Se1ceNGfPCDH8THP/5xXHzxxdh///3R0tKCiy++GC+//LLgMDz99NN444038MUvftG1bOwYGxvD4OAgGGPo7+/Hd7/7XUxOTuJDH/qQMvy5556LT3/605icnERLSwvS6TTuueceXHHFFYjH457TXb16NQDg8ccfx+GHH16w/AShpNJTQwRRKM888wwDwB588EHGWG6Kfp999mGf/vSnhXBbt25lAFhbWxvr7+8Xzh1//PFs1apVLB6PG8ey2Sw76qij2MqVK41j8XicZTIZS7zRaJTdcMMNrrIuXbqUnXDCCWxgYIANDAywF154gZ1zzjkMAPvkJz9phJOXmW6++WYGgP3iF78wjiWTSbZ27VrW0tLCxsfHGWP+l5l+/OMfMwDspZdeUp4/9dRT2dFHH238/uEPf8jq6uos5bdq1Sq2zz77sImJCePYo48+ygCwpUuXGsf++te/MgBs/fr1wvUPPPCAcPzb3/42A8DuvfdeT/nwWi92y0zZbJatXLmSnXjiicLyx/T0NFu+fDn753/+Z+PYe9/7XtbU1MR2795tHNu0aROrq6tjvCl9/vnnGQD2sY99TEjrc5/7HAPAHn74YePY0qVLGQD2wAMPCGFHR0dZQ0MDu+qqq4Tjn/rUpwpe8tOXmeS/aDTK7rjjDkt4AOzSSy9lw8PDLBKJsJ///OeMMcb+53/+h2maxrZt28auu+46z8tMjDEWiUTYJz7xCd+yE4QbtMxE1Czr169Hd3c33v3udwPI3X1x9tln4+6770Ymk7GEP/PMM4VR9PDwMB5++GGcddZZmJiYwODgIAYHBzE0NIQTTzwRmzZtwu7duwEA0WgUoVCuuWQyGQwNDaGlpQX7778//vGPf3iS9//+7/8wb948zJs3D4ceeijuuecenH/++fj6179ue80f//hH9PT04IMf/KBxrL6+Hp/61KcwOTmJxx57zFPaMkNDQwCAzs5O5bn//d//FdI888wzoWkafv3rXxvH9uzZg5deegkf/vCHhbtXjj32WKxatUqI85577kF7ezv++Z//2SjnwcFBrF69Gi0tLXjkkUcAAOPj4wCA1tZWT/kotl6ef/55bNq0Ceeeey6GhoYMuaampnD88cfjL3/5C7LZLDKZDP785z/j9NNPF2bh9ttvP5x88slCnH/84x8BAFdccYVw/LOf/SyA3GwWz/Llyy3LRu3t7TjttNPwy1/+EowxI3+/+tWvcPrpp6O5udlL8Si55ZZb8OCDD+LBBx/EL37xC7z73e/Gxz72Mfz2t79Vhu/s7MRJJ52EX/7ylwCAu+66C0cddRSWLl3qO+3Ozk7hzieCCApaZiJqkkwmg7vvvhvvfve7hT0na9aswX/+53/ioYcewg
knnCBcs3z5cuH35s2bwRjDNddcg2uuuUaZTn9/PxYtWoRsNotvf/vb+P73v4+tW7cKzpLTMhHPmjVr8JWvfAWapqG
|
|||
|
"text/plain": [
|
|||
|
"<Figure size 640x480 with 1 Axes>"
|
|||
|
]
|
|||
|
},
|
|||
|
"metadata": {},
|
|||
|
"output_type": "display_data"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"plt.figure(figsize=(8, 5))\n",
|
|||
|
"df[['AgeCategory', 'BMI']].plot(kind='area', alpha=0.2, title='Area Plot (AgeCategory, BMI)')\n",
|
|||
|
"plt.show()"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": null,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"text/plain": [
|
|||
|
"<Axes: xlabel='BMI', ylabel='WeightInKilograms'>"
|
|||
|
]
|
|||
|
},
|
|||
|
"execution_count": 39,
|
|||
|
"metadata": {},
|
|||
|
"output_type": "execute_result"
|
|||
|
},
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAj4AAAGwCAYAAACpYG+ZAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjkuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8hTgPZAAAACXBIWXMAAA9hAAAPYQGoP6dpAAB9gElEQVR4nO3deXhTZfo38G+6UGihbbpRCoUWKJuAFClbESkwLAKKoK8yKIuoIwO44oLruOKCP2dElJkRURxBB1fElYFSZJEWCkoBS6GUAqW0lC60hdLlvH/UhCQ9OUvWk+T7uS6vGZKTkydN2nPnee7nvnWCIAggIiIi8gF+7h4AERERkasw8CEiIiKfwcCHiIiIfAYDHyIiIvIZDHyIiIjIZzDwISIiIp/BwIeIiIh8RoC7B6AFTU1NKCoqQrt27aDT6dw9HCIiIlJAEARcuHABcXFx8PNTNpfDwAdAUVER4uPj3T0MIiIissHJkyfRqVMnRccy8AHQrl07AM0/uNDQUDePhoiIiJSoqqpCfHy88TquBAMfwLi8FRoaysCHiIjIw6hJU2FyMxEREfkMtwY+7777Lvr372+caRk2bBi+//574/2XLl3CggULEBkZibZt22L69Ok4e/as2TkKCwsxadIkBAcHIyYmBo888ggaGhpc/VKIiIjIA7g18OnUqRNeeeUV7N27F3v27MHo0aNx44034uDBgwCABx98EN988w3Wr1+PjIwMFBUVYdq0acbHNzY2YtKkSbh8+TJ27tyJDz/8EB988AGeeeYZd70kIiIi0jCdIAiCuwdhKiIiAq+//jpuvvlmREdHY+3atbj55psBAL///jt69+6NXbt2YejQofj+++8xefJkFBUVoX379gCAlStX4rHHHkNpaSlatWol+hx1dXWoq6sz/tuQHFVZWckcHyIiIg9RVVWFsLAwVddvzeT4NDY24pNPPkFNTQ2GDRuGvXv3or6+HmPHjjUe06tXL3Tu3Bm7du0CAOzatQv9+vUzBj0AMH78eFRVVRlnjcQsXboUYWFhxv+4lZ2IiMg3uD3wOXDgANq2bYugoCDce++9+PLLL9GnTx8UFxejVatWCA8PNzu+ffv2KC4uBgAUFxebBT2G+w33WbNkyRJUVlYa/zt58qRjXxQRERFpktu3s/fs2RP79+9HZWUlPvvsM8yePRsZGRlOfc6goCAEBQU59TmIiIhIe9we+LRq1Qrdu3cHAFxzzTXIysrCP/7xD9x66624fPkyKioqzGZ9zp49i9jYWABAbGwsMjMzzc5n2PVlOIaIiIjIwO1LXZaamppQV1eHa665BoGBgdi8ebPxvtzcXBQWFmLYsGEAgGHDhuHAgQMoKSkxHrNp0yaEhoaiT58+Lh87ERERaZtbZ3yWLFmCiRMnonPnzrhw4QLWrl2LrVu34scff0RYWBjmzZuHhx56CBEREQgNDcWiRYswbNgwDB06FAAwbtw49OnTB3fccQdee+01FBcX46mnnsKCBQu4lEVEREQtuDXwKSkpwaxZs3DmzBmEhYWhf//++PHHH/GnP/0JAPDmm2/Cz88P06dPR11dHcaPH4933nnH+Hh/f39s3LgR8+fPx7BhwxASEoLZs2fj+eefd9dLIiIiAgDkl1bjxPlaJESGIDEqxN3DoT9oro6PO9hSB4CIiEhMRe1l3LduP7bllRpvG5kUjeUzkhEWHOjGkXkfj67jQ0RE5A3uW7cfO46eM7ttx9FzWLRun5tGRKYY+BARETlIfmk1tuWVotFiMaVRELAtrxTHz9W4aWRkwMCHiIjIQU6cr5W8v6CMgY+7MfAhIiJykC4RwZL3J0QyydndGPgQERE5SNfothiZFA1/nc7sdn+dDiOTorm7SwMY+BARETnQ8hnJSO0eZXZbavcoLJ+R7KYRkSm3t6wgIiLyJmHBgVgzbzCOn6tBQVkN6/hoDAMfIiIiJ0iMYsCjRVzqIiIiIp/BwIeIiIh8Bg
MfIiIi8hkMfIiIiMhnMPAhIiIin8HAh4iIiHwGAx8iIiLyGQx8iIiIyGcw8CEiIiKfwcCHiIiIfAYDHyIiIvIZ7NVFREQulV9ajRPna9m8k9yCgQ8REblERe1l3LduP7bllRpvG5kUjeUzkhEWHOjGkZEv4VIXERG5xH3r9mPH0XNmt+04eg6L1u1z04jIFzHwISIip8svrca2vFI0CoLZ7Y2CgG15pTh+rsZ4XHpuifHfRI7GpS4iInK6E+drJe/PKarEs18fVLwMxjwhshUDHyIicrouEcGS96/ZWYDsExVmtxmWwdbMG2y8zZl5QloNprQ6Lk/FwIeIiJyua3RbjEyKxo6j58yWu/x1OiR3DkdWQXmLx5gugxku+FJ5QqYBkhpaTbrW6rg8HXN8iIjIJZbPSEZq9yiz21K7R2Hu8ATJxxWUXcn/UZInpJZWk661Oi5PxxkfIiJyibDgQKyZNxjHz9WgoKzGuHSTX1ot+biEyObZHrk8oYKyGtVLQYZgypLYbJMraXVc3oAzPkRE5FKJUSFI6xljvHAblsH8dTqz4/x1OoxMijYeJ5cnZAiQ1FASTLmDVsflDRj4EBGR21lbBls+I9n4b6UBkhrOCKYcQavj8gZc6iIiIreztgxmafmMZCxat89sGcgyQFJDKuk6tXuU25aTtDoub6ATBIssMR9UVVWFsLAwVFZWIjQ01N3DISIiGXIBkhqVtfUtgikt7J7S6ri0xJbrNwMfMPAhIiLHBlOOpNVxaYEt128udRERkdtpoUhfYpQ2AwutjstTMfAhIiK3YZE+cjXu6iIin8ammO7liUX6+JnxbJzxISKfxJkG9/O0In38zHgHzvgQkU/yxJkGb+NpRfr4mfEODHyIyOc4q+cTqeNJRfr4mfEeDHyIyOd42kyDt3JGJWZn4WfGezDwISKf40kzDd5OSasKLeBnxnswuZmIfA7bAWiH0lYV7sbPjPfgjA8R+SRPmWnwFZYd27WInxnvwJYVYMsKIl+m9ZkG0h5+ZrSDLSuIiFRiOwBttIvwJPzMeDYGPkREPooF+cgXMceHiMhHsSAf+SIGPkREPogF+dRhfy7vwaUuIiIfpKQgH/NYuBzojTjjQ0Tkg1iQTxkuB3ofBj5ERD7Ik9pFuAuXA70TAx8iIh/FgnzS2J/LO7k18Fm6dClSUlLQrl07xMTEYOrUqcjNzTU7ZtSoUdDpdGb/3XvvvWbHFBYWYtKkSQgODkZMTAweeeQRNDQ0uPKlEBF5HEO7iPTFo7B6bgrSF4/CmnmDHZK74g3JwN60HOgN74ejuDW5OSMjAwsWLEBKSgoaGhrwxBNPYNy4cTh06BBCQq58oO6++248//zzxn8HB1/5MDY2NmLSpEmIjY3Fzp07cebMGcyaNQuBgYF4+eWXXfp6iIg8kSML8qlNBs7ILcH+UxUY2FmPa5OiHTIGwDFFGbXUn8vW1+Pu5GwtFsfUVMuK0tJSxMTEICMjAyNHjgTQPOMzYMAA/P3vfxd9zPfff4/JkyejqKgI7du3BwCsXLkSjz32GEpLS9GqVSvZ52XLCiIix5i1KtNqoLBm3mDjbSfKajB1xQ6U19Ybb9MHB2LDghGIj5SeaZHi6At9ZW09Fq3b57bAwd7Xo/T9cDRXBVy2XL81leNTWVkJAIiIiDC7/eOPP0ZUVBT69u2LJUuWoLb2yrrrrl270K9fP2PQAwDjx49HVVUVDh48KPo8dXV1qKqqMvuPiIjsoyYZ2DLoAYDy2nrcsGK7XWNw9C4sZy4HKmHP63FncraWd8NpJvBpamrCAw88gNTUVPTt29d4+5///Gf85z//QXp6OpYsWYKPPvoIt99+u/H+4uJis6AHgPHfxcXFos+1dOlShIWFGf+Lj493wisiIvItSpOBM3JLWgQ9BuW19fjZZJZADWde6N3RPd7e1+Ou5Gyt74bTTAHDBQsWICcnB9u3m0f799xzj/H/9+vXDx06dMCYMWNw7NgxdOvWza
bnWrJkCR566CHjv6uqqhj8EBHZSWky8P5TFZLHZReW25Tvo7WijPbmt9j7etyVnK2198GSJgKfhQsXYuPGjdi2bRs
|
|||
|
"text/plain": [
|
|||
|
"<Figure size 640x480 with 1 Axes>"
|
|||
|
]
|
|||
|
},
|
|||
|
"metadata": {},
|
|||
|
"output_type": "display_data"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"df.plot.scatter(x=\"BMI\", y=\"WeightInKilograms\")"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": null,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAhIAAAGrCAYAAACVEH6fAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjkuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8hTgPZAAAACXBIWXMAAA9hAAAPYQGoP6dpAADi/UlEQVR4nOzdd3xTVf/A8U/SlXSX7tKWUkYpe29kC4oIyh4KiiwZIqjIDxVRwcGD4kBALTJkiwgqKnuDZbWljG6ge7d0t0nu749KILalg7bpOO/nlddD7j33nG9i23xz7hkySZIkBEEQBEEQKkCu7wAEQRAEQai9RCIhCIIgCEKFiURCEARBEIQKE4mEIAiCIAgVJhIJQRAEQRAqTCQSgiAIgiBUmEgkBEEQBEGoMJFICIIgCIJQYSKREARBEAShwkQiIdRKU6dOxcPDQy9t3759G5lMxv/+9z+9tF8WGo2G1q1bs2LFCn2HIlTQ22+/Tbdu3fQdhiCUSiQSQo2yadMmZDKZ9qFQKGjevDlz584lPj6+ytv38/Nj8uTJuLm5YWJiQoMGDRg0aBA//vgjarW6ytsvzsGDB3n//ffLdc2OHTuIjIxk7ty5xZ7/9ttvkclkevmgio+P54033qBFixaYmppiZmZGp06d+Oijj0hLSyt3fdu3b2fNmjWVHqe+LViwAH9/fw4cOKDvUAThkQz1HYAgFOeDDz6gcePG5ObmcubMGdatW8fBgwcJDAzE1NSU77//Ho1GU6lt/vDDD8yaNQtHR0deeOEFmjVrRkZGBkePHmXatGnExsbyf//3f5XaZlkcPHiQtWvXliuZWLVqFePHj8fKyqrY89u2bcPDwwNfX19CQ0Np2rRpJUX7aBcvXuTpp58mMzOTyZMn06lTJwAuXbrEJ598wqlTpzh06FC56ty+fTuBgYEsWLCgCiLWHycnJ0aMGMH//vc/nn32WX2HIwglEomEUCM99dRTdO7cGYBXXnkFW1tbPv/8c/bv38+ECRMwMjKq1PYuXLjArFmz6NGjBwcPHsTCwkJ7bsGCBVy6dInAwMBKbbM0WVlZmJmZlfu6q1ev4u/vz+rVq4s9HxERwblz5/jll1+YOXMm27ZtY9myZY8bbqnS0tJ47rnnMDAw4OrVq7Ro0ULn/IoVK/j++++rPA59qch/z7FjxzJmzBjCw8Px9PSsosgE4fGIWxtCrTBgwACg8EMQih8jodFoWLNmDa1atUKhUODo6MjMmTNJTU0ttf7ly5cjk8nYtm2bThJxX+fOnZk6dWqR49999x1NmjTBxMSELl26cPHiRZ3zAQEBTJ06FU9PTxQKBU5OTrz88sskJyfrlHv//feRyWTcuHGDiRMnYmNjQ+/evZk6dSpr164F0Lnl8yi//vorxsbGPPHEE8We37ZtGzY2NgwbNozRo0ezbdu2YsslJyfzwgsvYGlpibW1NVOmTMHf3x+ZTMamTZt0yt66dYvRo0fToEEDFAoFnTt3LtIlv2HDBqKjo/n888+LJBEAjo6OvPPOO9rn+/fvZ9iwYbi4uGBiYkKTJk348MMPdW4x9evXjz/++IM7d+5o35uHfy7y8vJYtmwZTZs2xcTEBDc3N9566y3y8vJ02s7JyWH+/PnY2dlhYWHBs88+S3R0NDKZrEhP0NWrV3nqqaewtLTE3NycgQMHcuHCBZ0y92/RnTx5kldffRUHBwdcXV05fvw4MpmMffv2FXn927dvRyaTcf78ee2xQYMGad8LQaipRI+EUCuEhYUBYGtrW2KZmTNnsmnTJl566SXmz59PREQE33zzDVevXuXs2bMl9mJkZ2dz9OhRnnjiCdzd3csc0/bt28nIyGDmzJnIZDI+++wznn/+ecLDw7VtHT58mPDwcF566SWcnJy4fv063333HdevX+fChQtFkoIxY8bQrFkzVq5ciSRJdOjQgZiYGA4fPszWrVvLFNe5c+do3bp1ia9327ZtPP/88xgbGz
NhwgTWrVvHxYsX6dKli7aMRqNh+PDh+Pr6Mnv2bFq0aMH+/fuZMmVKkfquX79Or169aNiwIW+//TZmZmbs3r2bkSNHsnfvXp577jkADhw4gFKpZPTo0WV6HZs2bcLc3JyFCxdibm7OsWPHeO+997h37x6rVq0CYOnSpaSnpxMVFcUXX3wBgLm5ufY1PPvss5w5c4YZM2bg7e3NtWvX+OKLLwgODubXX3/VtjV16lR2797NCy+8QPfu3Tl58iTDhg0r9rX26dMHS0tL3nrrLYyMjNiwYQP9+vXj5MmTRcacvPrqq9jb2/Pee++RlZVFv379cHNzY9u2bdr35eH/Lk2aNKFHjx7aY1ZWVjRp0oSzZ8/y+uuvl+l9E4RqJwlCDfLjjz9KgHTkyBEpMTFRioyMlHbu3CnZ2tpKSqVSioqKkiRJkqZMmSI1atRIe93p06clQNq2bZtOfX/99Vexxx/m7+8vAdJrr71WphgjIiIkQLK1tZVSUlK0x/fv3y8B0m+//aY9lp2dXeT6HTt2SIB06tQp7bFly5ZJgDRhwoQi5efMmSOV51fV1dVVGjVqVLHnLl26JAHS4cOHJUmSJI1GI7m6uhZ57Xv37pUAac2aNdpjarVaGjBggARIP/74o/b4wIEDpTZt2ki5ubnaYxqNRurZs6fUrFkz7TEbGxupXbt2ZX4dxb13M2fOlExNTXXaGjZsmM7Pwn1bt26V5HK5dPr0aZ3j69evlwDp7NmzkiRJ0uXLlyVAWrBggU65qVOnSoC0bNky7bGRI0dKxsbGUlhYmPZYTEyMZGFhIT3xxBPaY/d/jnv37i2pVCqdepcsWSKZmJhIaWlp2mMJCQmSoaGhTlv3Pfnkk5K3t3eR44JQU4hbG0KNNGjQIOzt7XFzc2P8+PGYm5uzb98+GjZsWGz5PXv2YGVlxeDBg0lKStI+OnXqhLm5OcePHy+xrXv37gEUe0vjUcaNG4eNjY32eZ8+fQAIDw/XHlMqldp/5+bmkpSURPfu3QG4cuVKkTpnzZpVrhiKk5ycrBPXw7Zt24ajoyP9+/cHCm+XjBs3jp07d+rcMvjrr78wMjJi+vTp2mNyuZw5c+bo1JeSksKxY8cYO3YsGRkZ2vc9OTmZIUOGEBISQnR0NFD4PpfnPX74vbtfd58+fcjOzubWrVulXr9nzx68vb1p0aKFzs/E/dtk938m/vrrL6Cw9+Bh8+bN03muVqs5dOgQI0eO1Bmv4OzszMSJEzlz5oz2Z+m+6dOnY2BgoHPsxRdfJC8vj59//ll7bNeuXahUKiZPnlzkddjY2JCUlFTq6xUEfRG3NoQaae3atTRv3hxDQ0McHR3x8vJCLi857w0JCSE9PR0HB4dizyckJJR4raWlJVD4YVUe/70Ncv/D++ExGSkpKSxfvpydO3cWiSE9Pb1InY0bNy5XDCWRJKnIMbVazc6dO+nfv792rAlAt27dWL16NUePHuXJJ58E4M6dOzg7O2NqaqpTx39nd4SGhiJJEu+++y7vvvtusbEkJCTQsGFDLC0ty/UeX79+nXfeeYdjx44V+YAu7r37r5CQEG7evIm9vX2JcUHha5XL5UXe+/++1sTERLKzs/Hy8ipSl7e3NxqNhsjISFq1aqU9Xtx/zxYtWtClSxe2bdvGtGnTgMIEr3v37sXOnpEkqdRxMYKgTyKREGqkrl27amdtlIVGo8HBwaHEgYMlfZhA4QeGoaEh165dK1eM//2med/DH+Jjx47l3LlzvPnmm7Rv3x5zc3M0Gg1Dhw4tdvrqw9/CK8rW1rbYAabHjh0jNjaWnTt3snPnziLnt23bpk0kyur+a3jjjTcYMmRIsWXufzi2aNECPz8/8vPzMTY2fmS9aWlp9O3bF0tLSz744AOaNGmCQqHgypUrLF68uExTfzUaDW3atOHzzz8v9rybm1updTyukv57vvjii7z22mtERUWRl5fHhQsX+Oabb4otm5qaip2dXVWGKQiPRSQSQp3QpE
kTjhw5Qq9evcr9YWxqasqAAQM4duwYkZGRlfYBk5qaytGjR1m+fDnvvfee9nhISEi56invt9EWLVro9Djct23bNhw
|
|||
|
"text/plain": [
|
|||
|
"<Figure size 800x500 with 1 Axes>"
|
|||
|
]
|
|||
|
},
|
|||
|
"metadata": {},
|
|||
|
"output_type": "display_data"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"plt.figure(figsize=(8, 5))\n",
|
|||
|
"df['AgeCategory'].value_counts().plot(kind='pie', autopct='%1.1f%%', title='Pie Chart (AgeCategory)')\n",
|
|||
|
"plt.show()\n"
|
|||
|
]
|
|||
|
}
|
|||
|
],
|
|||
|
"metadata": {
|
|||
|
"kernelspec": {
|
|||
|
"display_name": "Python 3",
|
|||
|
"language": "python",
|
|||
|
"name": "python3"
|
|||
|
},
|
|||
|
"language_info": {
|
|||
|
"codemirror_mode": {
|
|||
|
"name": "ipython",
|
|||
|
"version": 3
|
|||
|
},
|
|||
|
"file_extension": ".py",
|
|||
|
"mimetype": "text/x-python",
|
|||
|
"name": "python",
|
|||
|
"nbconvert_exporter": "python",
|
|||
|
"pygments_lexer": "ipython3",
|
|||
|
"version": "3.12.6"
|
|||
|
}
|
|||
|
},
|
|||
|
"nbformat": 4,
|
|||
|
"nbformat_minor": 2
|
|||
|
}
|