714 lines
173 KiB
Plaintext
714 lines
173 KiB
Plaintext
|
{
|
|||
|
"cells": [
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"Работа с NumPy"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 1,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"name": "stdout",
|
|||
|
"output_type": "stream",
|
|||
|
"text": [
|
|||
|
"matrix = \n",
|
|||
|
" [[4 5 0]\n",
|
|||
|
" [9 9 9]] \n",
|
|||
|
"\n",
|
|||
|
"tmatrix = \n",
|
|||
|
" [[4 9]\n",
|
|||
|
" [5 9]\n",
|
|||
|
" [0 9]] \n",
|
|||
|
"\n",
|
|||
|
"vector = \n",
|
|||
|
" [4 5 0 9 9 9] \n",
|
|||
|
"\n",
|
|||
|
"tvector = \n",
|
|||
|
" [[4]\n",
|
|||
|
" [5]\n",
|
|||
|
" [0]\n",
|
|||
|
" [9]\n",
|
|||
|
" [9]\n",
|
|||
|
" [9]] \n",
|
|||
|
"\n",
|
|||
|
"list_matrix = \n",
|
|||
|
" [array([4, 5, 0]), array([9, 9, 9])] \n",
|
|||
|
"\n",
|
|||
|
"matrix as str = \n",
|
|||
|
" [[4 5 0]\n",
|
|||
|
" [9 9 9]] \n",
|
|||
|
"\n",
|
|||
|
"matrix type is <class 'numpy.ndarray'> \n",
|
|||
|
"\n",
|
|||
|
"vector type is <class 'numpy.ndarray'> \n",
|
|||
|
"\n",
|
|||
|
"list_matrix type is <class 'list'> \n",
|
|||
|
"\n",
|
|||
|
"str_matrix type is <class 'str'> \n",
|
|||
|
"\n",
|
|||
|
"formatted_vector = \n",
|
|||
|
" 4; 5; 0; 9; 9; 9 \n",
|
|||
|
"\n"
|
|||
|
]
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"import numpy as np\n",
|
|||
|
"\n",
|
|||
|
"matrix = np.array([[4, 5, 0], [9, 9, 9]])\n",
|
|||
|
"print(\"matrix = \\n\", matrix, \"\\n\")\n",
|
|||
|
"\n",
|
|||
|
"tmatrix = matrix.T\n",
|
|||
|
"print(\"tmatrix = \\n\", tmatrix, \"\\n\")\n",
|
|||
|
"\n",
|
|||
|
"vector = np.ravel(matrix)\n",
|
|||
|
"print(\"vector = \\n\", vector, \"\\n\")\n",
|
|||
|
"\n",
|
|||
|
"tvector = np.reshape(vector, (6, 1))\n",
|
|||
|
"print(\"tvector = \\n\", tvector, \"\\n\")\n",
|
|||
|
"\n",
|
|||
|
"list_matrix = list(matrix)\n",
|
|||
|
"print(\"list_matrix = \\n\", list_matrix, \"\\n\")\n",
|
|||
|
"\n",
|
|||
|
"str_matrix = str(matrix)\n",
|
|||
|
"print(\"matrix as str = \\n\", str_matrix, \"\\n\")\n",
|
|||
|
"\n",
|
|||
|
"print(\"matrix type is\", type(matrix), \"\\n\")\n",
|
|||
|
"\n",
|
|||
|
"print(\"vector type is\", type(vector), \"\\n\")\n",
|
|||
|
"\n",
|
|||
|
"print(\"list_matrix type is\", type(list_matrix), \"\\n\")\n",
|
|||
|
"\n",
|
|||
|
"print(\"str_matrix type is\", type(str_matrix), \"\\n\")\n",
|
|||
|
"\n",
|
|||
|
"formatted_vector = \"; \".join(map(str, vector))\n",
|
|||
|
"print(\"formatted_vector = \\n\", formatted_vector, \"\\n\")"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"Работа с Pandas DataFrame\n",
|
|||
|
"\n",
|
|||
|
"https://pandas.pydata.org/docs/user_guide/10min.html"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"Работа с данными - чтение и запись CSV"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 2,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [],
|
|||
|
"source": [
|
|||
|
"import pandas as pd\n",
|
|||
|
"\n",
|
|||
|
"df = pd.read_csv(\"data/titanic.csv\", index_col=\"PassengerId\")\n",
|
|||
|
"\n",
|
|||
|
"df.to_csv(\"test.csv\")"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"Работа с данными - основные команды"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 3,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"name": "stdout",
|
|||
|
"output_type": "stream",
|
|||
|
"text": [
|
|||
|
"<class 'pandas.core.frame.DataFrame'>\n",
|
|||
|
"Index: 891 entries, 1 to 891\n",
|
|||
|
"Data columns (total 11 columns):\n",
|
|||
|
" # Column Non-Null Count Dtype \n",
|
|||
|
"--- ------ -------------- ----- \n",
|
|||
|
" 0 Survived 891 non-null int64 \n",
|
|||
|
" 1 Pclass 891 non-null int64 \n",
|
|||
|
" 2 Name 891 non-null object \n",
|
|||
|
" 3 Sex 891 non-null object \n",
|
|||
|
" 4 Age 714 non-null float64\n",
|
|||
|
" 5 SibSp 891 non-null int64 \n",
|
|||
|
" 6 Parch 891 non-null int64 \n",
|
|||
|
" 7 Ticket 891 non-null object \n",
|
|||
|
" 8 Fare 891 non-null float64\n",
|
|||
|
" 9 Cabin 204 non-null object \n",
|
|||
|
" 10 Embarked 889 non-null object \n",
|
|||
|
"dtypes: float64(2), int64(4), object(5)\n",
|
|||
|
"memory usage: 83.5+ KB\n",
|
|||
|
" count mean std min 25% 50% 75% max\n",
|
|||
|
"Survived 891.0 0.383838 0.486592 0.00 0.0000 0.0000 1.0 1.0000\n",
|
|||
|
"Pclass 891.0 2.308642 0.836071 1.00 2.0000 3.0000 3.0 3.0000\n",
|
|||
|
"Age 714.0 29.699118 14.526497 0.42 20.1250 28.0000 38.0 80.0000\n",
|
|||
|
"SibSp 891.0 0.523008 1.102743 0.00 0.0000 0.0000 1.0 8.0000\n",
|
|||
|
"Parch 891.0 0.381594 0.806057 0.00 0.0000 0.0000 0.0 6.0000\n",
|
|||
|
"Fare 891.0 32.204208 49.693429 0.00 7.9104 14.4542 31.0 512.3292\n",
|
|||
|
" Survived Pclass Sex Age SibSp Parch Fare Cabin\n",
|
|||
|
"PassengerId \n",
|
|||
|
"1 0 3 male 22.0 1 0 7.2500 NaN\n",
|
|||
|
"2 1 1 female 38.0 1 0 71.2833 C85\n",
|
|||
|
"3 1 3 female 26.0 0 0 7.9250 NaN\n",
|
|||
|
"4 1 1 female 35.0 1 0 53.1000 C123\n",
|
|||
|
"5 0 3 male 35.0 0 0 8.0500 NaN\n",
|
|||
|
" Survived Pclass Sex Age SibSp Parch Fare Cabin\n",
|
|||
|
"PassengerId \n",
|
|||
|
"887 0 2 male 27.0 0 0 13.00 NaN\n",
|
|||
|
"888 1 1 female 19.0 0 0 30.00 B42\n",
|
|||
|
"889 0 3 female NaN 1 2 23.45 NaN\n",
|
|||
|
"890 1 1 male 26.0 0 0 30.00 C148\n",
|
|||
|
"891 0 3 male 32.0 0 0 7.75 NaN\n",
|
|||
|
" Survived Pclass Sex Age SibSp Parch Fare Cabin\n",
|
|||
|
"PassengerId \n",
|
|||
|
"804 1 3 male 0.42 0 1 8.5167 NaN\n",
|
|||
|
"756 1 2 male 0.67 1 1 14.5000 NaN\n",
|
|||
|
"470 1 3 female 0.75 2 1 19.2583 NaN\n",
|
|||
|
"645 1 3 female 0.75 2 1 19.2583 NaN\n",
|
|||
|
"79 1 2 male 0.83 0 2 29.0000 NaN\n",
|
|||
|
" Survived Pclass Sex Age SibSp Parch Fare Cabin\n",
|
|||
|
"PassengerId \n",
|
|||
|
"860 0 3 male NaN 0 0 7.2292 NaN\n",
|
|||
|
"864 0 3 female NaN 8 2 69.5500 NaN\n",
|
|||
|
"869 0 3 male NaN 0 0 9.5000 NaN\n",
|
|||
|
"879 0 3 male NaN 0 0 7.8958 NaN\n",
|
|||
|
"889 0 3 female NaN 1 2 23.4500 NaN\n"
|
|||
|
]
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"df.info()\n",
|
|||
|
"\n",
|
|||
|
"print(df.describe().transpose())\n",
|
|||
|
"\n",
|
|||
|
"cleared_df = df.drop([\"Name\", \"Ticket\", \"Embarked\"], axis=1)\n",
|
|||
|
"print(cleared_df.head())\n",
|
|||
|
"print(cleared_df.tail())\n",
|
|||
|
"\n",
|
|||
|
"sorted_df = cleared_df.sort_values(by=\"Age\")\n",
|
|||
|
"print(sorted_df.head())\n",
|
|||
|
"print(sorted_df.tail())"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"Работа с данными - работа с элементами"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 4,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"name": "stdout",
|
|||
|
"output_type": "stream",
|
|||
|
"text": [
|
|||
|
"PassengerId\n",
|
|||
|
"1 22.0\n",
|
|||
|
"2 38.0\n",
|
|||
|
"3 26.0\n",
|
|||
|
"4 35.0\n",
|
|||
|
"5 35.0\n",
|
|||
|
" ... \n",
|
|||
|
"887 27.0\n",
|
|||
|
"888 19.0\n",
|
|||
|
"889 NaN\n",
|
|||
|
"890 26.0\n",
|
|||
|
"891 32.0\n",
|
|||
|
"Name: Age, Length: 891, dtype: float64\n",
|
|||
|
"Survived 0\n",
|
|||
|
"Pclass 2\n",
|
|||
|
"Name Kantor, Mr. Sinai\n",
|
|||
|
"Sex male\n",
|
|||
|
"Age 34.0\n",
|
|||
|
"SibSp 1\n",
|
|||
|
"Parch 0\n",
|
|||
|
"Ticket 244367\n",
|
|||
|
"Fare 26.0\n",
|
|||
|
"Cabin NaN\n",
|
|||
|
"Embarked S\n",
|
|||
|
"Name: 100, dtype: object\n",
|
|||
|
"Kantor, Mr. Sinai\n",
|
|||
|
" Age Name\n",
|
|||
|
"PassengerId \n",
|
|||
|
"100 34.0 Kantor, Mr. Sinai\n",
|
|||
|
"101 28.0 Petranec, Miss. Matilda\n",
|
|||
|
"102 NaN Petroff, Mr. Pastcho (\"Pentcho\")\n",
|
|||
|
"103 21.0 White, Mr. Richard Frasar\n",
|
|||
|
"104 33.0 Johansson, Mr. Gustaf Joel\n",
|
|||
|
"... ... ...\n",
|
|||
|
"196 58.0 Lurette, Miss. Elise\n",
|
|||
|
"197 NaN Mernagh, Mr. Robert\n",
|
|||
|
"198 42.0 Olsen, Mr. Karl Siegwart Andreas\n",
|
|||
|
"199 NaN Madigan, Miss. Margaret \"Maggie\"\n",
|
|||
|
"200 24.0 Yrois, Miss. Henriette (\"Mrs Harbeck\")\n",
|
|||
|
"\n",
|
|||
|
"[101 rows x 2 columns]\n",
|
|||
|
" Survived Pclass \\\n",
|
|||
|
"PassengerId \n",
|
|||
|
"1 0 3 \n",
|
|||
|
"2 1 1 \n",
|
|||
|
"3 1 3 \n",
|
|||
|
"\n",
|
|||
|
" Name Sex Age \\\n",
|
|||
|
"PassengerId \n",
|
|||
|
"1 Braund, Mr. Owen Harris male 22.0 \n",
|
|||
|
"2 Cumings, Mrs. John Bradley (Florence Briggs Th... female 38.0 \n",
|
|||
|
"3 Heikkinen, Miss. Laina female 26.0 \n",
|
|||
|
"\n",
|
|||
|
" SibSp Parch Ticket Fare Cabin Embarked \n",
|
|||
|
"PassengerId \n",
|
|||
|
"1 1 0 A/5 21171 7.2500 NaN S \n",
|
|||
|
"2 1 0 PC 17599 71.2833 C85 C \n",
|
|||
|
"3 0 0 STON/O2. 3101282 7.9250 NaN S \n",
|
|||
|
"Survived 0\n",
|
|||
|
"Pclass 3\n",
|
|||
|
"Name Braund, Mr. Owen Harris\n",
|
|||
|
"Sex male\n",
|
|||
|
"Age 22.0\n",
|
|||
|
"SibSp 1\n",
|
|||
|
"Parch 0\n",
|
|||
|
"Ticket A/5 21171\n",
|
|||
|
"Fare 7.25\n",
|
|||
|
"Cabin NaN\n",
|
|||
|
"Embarked S\n",
|
|||
|
"Name: 1, dtype: object\n",
|
|||
|
" Survived Pclass\n",
|
|||
|
"PassengerId \n",
|
|||
|
"4 1 1\n",
|
|||
|
"5 0 3\n",
|
|||
|
" Survived Pclass\n",
|
|||
|
"PassengerId \n",
|
|||
|
"4 1 1\n",
|
|||
|
"5 0 3\n"
|
|||
|
]
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"print(df[\"Age\"])\n",
|
|||
|
"\n",
|
|||
|
"print(df.loc[100])\n",
|
|||
|
"\n",
|
|||
|
"print(df.loc[100, \"Name\"])\n",
|
|||
|
"\n",
|
|||
|
"print(df.loc[100:200, [\"Age\", \"Name\"]])\n",
|
|||
|
"\n",
|
|||
|
"print(df[0:3])\n",
|
|||
|
"\n",
|
|||
|
"print(df.iloc[0])\n",
|
|||
|
"\n",
|
|||
|
"print(df.iloc[3:5, 0:2])\n",
|
|||
|
"\n",
|
|||
|
"print(df.iloc[[3, 4], [0, 1]])"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"Работа с данными - отбор и группировка"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 12,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"name": "stdout",
|
|||
|
"output_type": "stream",
|
|||
|
"text": [
|
|||
|
"['male' 'female']\n",
|
|||
|
"male count = 577\n",
|
|||
|
"female count = 314\n",
|
|||
|
"Total count = 891\n",
|
|||
|
" Pclass Survived Count\n",
|
|||
|
"0 1 0 80\n",
|
|||
|
"1 1 1 136\n",
|
|||
|
"2 2 0 97\n",
|
|||
|
"3 2 1 87\n",
|
|||
|
"4 3 0 372\n",
|
|||
|
"5 3 1 119\n"
|
|||
|
]
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"s_values = df[\"Sex\"].unique()\n",
|
|||
|
"print(s_values)\n",
|
|||
|
"\n",
|
|||
|
"s_total = 0\n",
|
|||
|
"for s_value in s_values:\n",
|
|||
|
" count = df[df[\"Sex\"] == s_value].shape[0]\n",
|
|||
|
" s_total += count\n",
|
|||
|
" print(s_value, \"count =\", count)\n",
|
|||
|
"print(\"Total count = \", s_total)\n",
|
|||
|
"\n",
|
|||
|
"print(df.groupby([\"Pclass\", \"Survived\"]).size().reset_index(name=\"Count\")) # type: ignore"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"Визуализация - Исходные данные"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 6,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"name": "stdout",
|
|||
|
"output_type": "stream",
|
|||
|
"text": [
|
|||
|
" Pclass Survived Age\n",
|
|||
|
"PassengerId \n",
|
|||
|
"1 3 0 22.0\n",
|
|||
|
"2 1 1 38.0\n",
|
|||
|
"3 3 1 26.0\n",
|
|||
|
"4 1 1 35.0\n",
|
|||
|
"5 3 0 35.0\n",
|
|||
|
"... ... ... ...\n",
|
|||
|
"886 3 0 39.0\n",
|
|||
|
"887 2 0 27.0\n",
|
|||
|
"888 1 1 19.0\n",
|
|||
|
"890 1 1 26.0\n",
|
|||
|
"891 3 0 32.0\n",
|
|||
|
"\n",
|
|||
|
"[714 rows x 3 columns]\n"
|
|||
|
]
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"data = df[[\"Pclass\", \"Survived\", \"Age\"]].copy()\n",
|
|||
|
"data.dropna(subset=[\"Age\"], inplace=True)\n",
|
|||
|
"print(data)"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"Визуализация - Сводка пяти чисел\n",
|
|||
|
"\n",
|
|||
|
"<img src=\"assets/quantile.png\" width=\"400\" style=\"background-color: white\">"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 7,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"name": "stdout",
|
|||
|
"output_type": "stream",
|
|||
|
"text": [
|
|||
|
" Age \n",
|
|||
|
" min q1 q2 median q3 max\n",
|
|||
|
"Pclass \n",
|
|||
|
"1 0.92 27.0 37.0 37.0 49.0 80.0\n",
|
|||
|
"2 0.67 23.0 29.0 29.0 36.0 70.0\n",
|
|||
|
"3 0.42 18.0 24.0 24.0 32.0 74.0\n",
|
|||
|
" Age \n",
|
|||
|
" low_iqr iqr high_iqr\n",
|
|||
|
"Pclass \n",
|
|||
|
"1 0.0 22.0 82.0\n",
|
|||
|
"2 3.5 13.0 55.5\n",
|
|||
|
"3 0.0 14.0 53.0\n"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"text/plain": [
|
|||
|
"<Axes: title={'center': 'Age'}, xlabel='Pclass'>"
|
|||
|
]
|
|||
|
},
|
|||
|
"execution_count": 7,
|
|||
|
"metadata": {},
|
|||
|
"output_type": "execute_result"
|
|||
|
},
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAi8AAAHNCAYAAADWsJtQAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjkuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8hTgPZAAAACXBIWXMAAA9hAAAPYQGoP6dpAABQtklEQVR4nO3deVxU5f4H8M8Aw7AOiLJeQUkUVDDLErguuLCEShBQWfcWprdbiSvYgr9ya8Hcl1BbDCs1u3IVlVxAU9R0vEoXL5YaGC6JIG6ggOMwnN8fXs5tAo1BhpkDn/fr5QvnnOec8z3DgfnwnOecIxMEQQARERGRRJgZuwAiIiIifTC8EBERkaQwvBAREZGkMLwQERGRpDC8EBERkaQwvBAREZGkMLwQERGRpDC8EBERkaQwvBAREZGkMLwQmQiZTIZZs2YZu4w2b9++fZDJZNi3b999282aNQsymQxXrlxpncJaQH3NRG0dwwu1eWvWrIFMJtP55+LigqFDh2LHjh3GLu+B/fTTT5g1axbOnj1r7FKoGYYMGaJzbDo5OeHxxx/H559/jrq6OmOXR2SSLIxdAFFrmTNnDry9vSEIAsrKyrBmzRqMGDEC27Ztw6hRo4xdXrP99NNPmD17NoYMGYKuXbsauxxqhs6dOyM1NRUAUF5eji+//BLjxo3Dzz//jLlz5xq5OiLTw/BC7UZkZCQee+wx8fW4cePg6uqKr7/+WtLhpTXV1tairq4OlpaWxi6lTXFwcMBf//pX8fUrr7wCX19ffPTRR3j33Xchl8uNWB2R6eFpI2q3HB0dYW1tDQsL3QxfVVWF5ORkeHp6QqFQwNfXFwsWLED9A9hramrg5+cHPz8/1NTUiMtdu3YN7u7u+POf/wytVgsAGDNmDOzs7PDLL78gIiICtra28PDwwJw5c9CUB7r/+9//RmRkJJRKJezs7DB8+HCoVCpx/po1a/D0008DAIYOHSqeevij8RwbN25Er169YGVlBX9/f2zevBljxozR6bk5e/YsZDIZFixYgCVLlqBbt25QKBT46aefAADfffcdBg0aBFtbWzg6OiI6OhonT57U2c7v11mvsbEZMpkMEyZMwLp16+Dr6wsrKyv069cP+/fvb7D8xYsXMXbsWLi6ukKhUKB37974/PPPG7T79ddfERMTA1tbW7i4uGDq1KlQq9X3fW9+78qVK3jmmWegVCrRsWNHTJ48Gbdv3xbnh4SE4OGHH250WV9fX0REROi1PQCwsbFBUFAQqqqqUF5eLk4/cuQIRowYgQ4dOsDW1hZ9+vTB0qVL77uu9PR0DBs2DC4uLlAoFOjVqxdWrlzZoN2xY8cQERGBTp06wdraGt7e3hg7dqxOmw0bNqBfv36wt7eHUqlEQEDAH26fyBDY80LtRkVFBa5cuQJBEHD58mUsX74ct27d0vmLVxAEPPnkk9i7dy/GjRuHvn37YteuXXj99ddx8eJFLF68GNbW1vjiiy8wYMAA/N///R8WLVoEAEhMTERFRQXWrFkDc3NzcZ1arRZPPPEEgoKCMG/ePOzcuRMzZ85EbW0t5syZc896f/zxRwwaNAhKpRJvvPEG5HI5Pv74YwwZMgS5ubkIDAzE4MGDMWnSJCxbtgzTp09Hz549AUD82phvv/0Wzz77LAICApCamorr169j3Lhx+NOf/tRo+/T0dNy+fRt///vfoVAo4OTkhN27dyMyMhIPPfQQZs2ahZqaGixfvhwDBgzADz/80OzTV7m5ufjmm28wadIkKBQKrFixAk888QT+9a9/wd/fHwBQVlaGoKAgMew4Oztjx44dGDduHCorKzFlyhQAd0Pm8OHDcf78eUyaNAkeHh746quv8N133+lV0zPPPIOuXbsiNTUVKpUKy5Ytw/Xr1/Hll18CAF544QW8/PLLOHHihFgjABw9ehQ///wz3n777Wa9F7/88gvMzc3h6OgIAMjJycGoUaPg7u6OyZMnw83NDSdPnkRWVhYmT558z/WsXLkSvXv3xpNPPgkLCwts27YN48ePR11dHRITEwEAly9fRnh4OJydnfHWW2/B0dERZ8+exaZNm8T15OTk4LnnnsPw4cPx4YcfAgBOnjyJ77///r7bJzIIgaiNS09PFwA0+KdQKIQ1a9botM3MzBQACO+9957O9Pj4eEEmkwlFRUXitJSUFMHMzEzYv3+/sHHjRgGAsGTJEp3lEhISBADCxIkTxWl1dXXCyJEjBUtLS6G8vFycDkCYOXOm+DomJkawtLQUzpw5I04rKSkR7O3thcGDB4vT6re9d+/eJr0fAQEBQufOnYWbN2+K0/bt2ycAELp06SJOKy4uFgAISqVSuHz5ss46+vbtK7i4uAhXr14Vpx0/flwwMzMTXnzxRZ39/+06682cOVP4/a+f+u/LsWPHxGnnzp0TrKyshKeeekqcNm7cOMHd3V24cuWKzvKjR48WHBwchOrqakEQBGHJkiUCAOEf//iH2Kaqqkrw8fFp0vtVX+OTTz6pM338+PECAOH48eOCIAjCjRs3BCsrK+HNN9/UaTdp0iTB1tZWuHXr1n23ExISIvj5+Qnl5eVCeXm5cPLkSWHSpEkCACEqKkoQBEGora0VvL29hS5dugjXr1/XWb6urq5Bzb9V/378VkREhPDQQw+Jrzdv3iwAEI4ePXrPOidPniwolUqhtrb2vvtD1Bp42ojajbS0NOTk5CAnJwdr167F0KFD8be//U3nr8vt27fD3NwckyZN0lk2OTkZgiDoXJ00a9Ys9O7dGwkJCRg/fjxCQkIaLFdvwoQJ4v/rewzu3LmD3bt3N9peq9UiOzsbMTExeOihh8Tp7u7ueP7553Hw4EFUVlbq/R6UlJSgoKAAL774Iuzs7MTpISEhCAgIaHSZuLg4ODs7i68vXbqE/Px8jBkzBk5OTuL0Pn36ICwsDNu3b9e7rnrBwcHo16+f+NrLywvR0dHYtWsXtFotBEHAP//5T0RFRUEQBFy5ckX8FxERgYqKCvzwww8A7n4v3d3dER8fL67PxsYGf//73/Wqqb53ot7EiRPF9QN3x6tER0fj66+/Fk8FarVafPPNN+Ipqz9y6tQpODs7w9nZGT179sTy5csxcuRI8VTYv//9bxQXF2PKlCliT0y9P7o02traWvx/fe9jSEgIfvnlF1RUVACAuM6srCxoNJpG1+Po6Iiqqirk5OT84f4QGRrDC7Ub/fv3R2hoKEJDQ/GXv/wF3377LXr16iUGCQA4d+4cPDw8YG9vr7Ns/WmYc+fOidMsLS3x+eefo7i4GDdv3kR6enqjHyRmZmY6AQQAevToAQD3vLy5vLwc1dXV8PX1bTCvZ8+eqKurw4ULF5q+8/9VX7+Pj0+DeY1NAwBvb+9G13Gv2q5cuYKqqiq9awOA7t27N5jWo0cPVFdXo7y8HOXl5bhx4wY++eQT8cO+/t9LL70E4O4pkPo6fXx8GnxPGqtbn5q6desGMzMzne/diy++iPPnz+PAgQMAgN27d6OsrAwvvPBCk7bRtWtX5OTkYPfu3Th48CBKS0uRlZWFTp06AQDOnDkDADqnpZrq+++/R2hoqDg2ydnZGdOnTwcAMbyEhIQgLi4Os2fPRqdOnRAdHY309HSd8UHjx49Hjx49EBkZic6dO2Ps2LHYuXOn3vUQtQSOeaF2y8zMDEOHDsXSpUtRWFiI3r17672OXbt2AQBu376NwsLCBh/0bcFv/3LX1716BeoHNOur/r4nf/3rX5GQkNBomz59+jRr3U3V2D5FRETA1dUVa9euxeDBg7F27Vq4ubkhNDS0Seu0tbVtclt9nDlzBsOHD4efnx8WLVoET09PWFpaYvv27Vi8eLH4fspkMmRkZEClUmHbtm3YtWsXxo4di4ULF0KlUsHOzg4uLi7Iz8/Hrl27sGPHDuzYsQPp6el48cUX8cUXX7R47UT3w54Xatdqa2sBALdu3QIAdOnSBSUlJbh586ZOu1OnTonz6/3nP//BnDlz8NJLL+GRRx7B3/72N/Ev2d+qq6vDL7/8ojPt559/BoB7Dmx1dnaGjY0NTp8+3WDeqVOnYGZmBk9PTwB
|
|||
|
"text/plain": [
|
|||
|
"<Figure size 640x480 with 1 Axes>"
|
|||
|
]
|
|||
|
},
|
|||
|
"metadata": {},
|
|||
|
"output_type": "display_data"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"def q1(x):\n",
|
|||
|
" return x.quantile(0.25)\n",
|
|||
|
"\n",
|
|||
|
"\n",
|
|||
|
"# median = quantile(0.5)\n",
|
|||
|
"def q2(x):\n",
|
|||
|
" return x.quantile(0.5)\n",
|
|||
|
"\n",
|
|||
|
"\n",
|
|||
|
"def q3(x):\n",
|
|||
|
" return x.quantile(0.75)\n",
|
|||
|
"\n",
|
|||
|
"\n",
|
|||
|
"def iqr(x):\n",
|
|||
|
" return q3(x) - q1(x)\n",
|
|||
|
"\n",
|
|||
|
"\n",
|
|||
|
"def low_iqr(x):\n",
|
|||
|
" return max(0, q1(x) - 1.5 * iqr(x))\n",
|
|||
|
"\n",
|
|||
|
"\n",
|
|||
|
"def high_iqr(x):\n",
|
|||
|
" return q3(x) + 1.5 * iqr(x)\n",
|
|||
|
"\n",
|
|||
|
"\n",
|
|||
|
"quantiles = data[[\"Pclass\", \"Age\"]].groupby([\"Pclass\"]).aggregate([\"min\", q1, q2, \"median\", q3, \"max\"])\n",
|
|||
|
"print(quantiles)\n",
|
|||
|
"\n",
|
|||
|
"iqrs = data[[\"Pclass\", \"Age\"]].groupby([\"Pclass\"]).aggregate([low_iqr, iqr, high_iqr])\n",
|
|||
|
"print(iqrs)\n",
|
|||
|
"\n",
|
|||
|
"data.boxplot(column=\"Age\", by=\"Pclass\")"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"Визуализация - Гистограмма"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 8,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"text/plain": [
|
|||
|
"<Axes: ylabel='Frequency'>"
|
|||
|
]
|
|||
|
},
|
|||
|
"execution_count": 8,
|
|||
|
"metadata": {},
|
|||
|
"output_type": "execute_result"
|
|||
|
},
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAjIAAAGdCAYAAAAIbpn/AAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjkuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8hTgPZAAAACXBIWXMAAA9hAAAPYQGoP6dpAAAqDklEQVR4nO3de3RU5b3/8c+QG0FyETC3kkDkKkIoImDKpShUbktF8CxUOAalWm1QIFoBrSC1NFQWVDwi9JwDiR5FhC7wWkGIEEqLKGhA9Ge4GAFLuFQlIaEkkHl+f7CY5ZgLyTDJnmd4v9aatdjP3rPzfWabyce9n70flzHGCAAAwELNnC4AAADAVwQZAABgLYIMAACwFkEGAABYiyADAACsRZABAADWIsgAAABrEWQAAIC1Qp0uoLG53W4dOXJEUVFRcrlcTpcDAADqwRijU6dOKSkpSc2a1X7eJeiDzJEjR5ScnOx0GQAAwAeHDx9W27Zta10f9EEmKipK0vkPIjo62uFqAABAfZSWlio5Odnzd7w2QR9kLlxOio6OJsgAAGCZiw0LYbAvAACwFkEGAABYiyADAACsFfRjZAAAaErGGJ07d05VVVVOlxLQQkJCFBoaesmPRiHIAADgJ5WVlSouLtbp06edLsUKLVq0UGJiosLDw33eB0EGAAA/cLvdKioqUkhIiJKSkhQeHs6DWGthjFFlZaVOnDihoqIiderUqc6H3tWFIAMAgB9UVlbK7XYrOTlZLVq0cLqcgBcZGamwsDAdPHhQlZWVat68uU/7YbAvAAB+5OuZhcuRPz4rPm0AAGAtggwAALAWY2QAAGhk7We822Q/6+t5o3x+77Zt2zRgwAANHz5c777bdDVfCs7IAAAASdKyZcv08MMPa8uWLTpy5IjT5dQLQQYAAKisrEyvv/66HnroIY0aNUq5uble69966y116tRJzZs314033qiXXnpJLpdLJ0+e9GyzdetWDRw4UJGRkUpOTtYjjzyi8vLyRq2bIAMAALRq1Sp17dpVXbp00YQJE7R8+XIZYyRJRUVFuuOOOzR69Gjt2rVLv/rVr/Tkk096vf/AgQMaPny4xo4dq927d+v111/X1q1bNXny5EatmzEywCWq7dr3pVynBoCmtmzZMk2YMEGSNHz4cJWUlCg/P1+DBw/Wn//8Z3Xp0kXz58+XJHXp0kV79uzR3LlzPe/Pzs7W+PHjNXXqVElSp06d9Pzzz+vnP/+5lixZ4vNzYi6GMzIAAFzmCgsL9dFHH+muu+6SJIWGhmrcuHFatmyZZ32fPn283tO3b1+v5V27dik3N1ctW7b0vIYNG+Z54nFj4YwMAACXuWXLluncuXNKSkrytBljFBERoRdeeKFe+ygrK9OvfvUrPfLII9XWpaSk+K3WHyPIAABwGTt37pxefvllLViwQDfffLPXutGjR+u1115Tly5d9Ne//tVr3ccff+y1fN111+mLL75Qx44dG73mHyLIAABwGXvnnXf0/fffa9KkSYqJifFaN3bsWC1btkyrVq3SwoULNX36dE2aNEkFBQWeu5ouTIw5ffp03XDDDZo8ebJ++ctf6oorrtAXX3yhDRs21Pusji8YIwMAwGVs2bJlGjp0aLUQI50PMjt27NCpU6f0l7/8RWvWrFFaWpqWLFniuWspIiJCkpSWlqb8/Hzt3btXAwcOVK9evTRr1iyvy1WNgTMyAAA0skC+i/Htt9+udV3fvn09t2CnpaXp1ltv9aybO3eu2rZt63U3Up8+ffT+++83XrE1cPSMzJIlS5SWlqbo6GhFR0crPT1d7733nmf9mTNnlJmZqdatW6tly5YaO3asjh075mDFAABcnl588UV9/PHH+uqrr/R///d/mj9/vjIyMpwuy9kg07ZtW82bN087d+7Ujh07dNNNN+m2227T559/LkmaNm2a3n77ba1evVr5+fk6cuSIxowZ42TJAABclvbt26fbbrtN3bp10zPPPKNHH31UTz/9tNNlyWUunDMKEK1atdL8+fN1xx136KqrrtKKFSt0xx13SJK+/PJLXXPNNdq2bZtuuOGGeu2vtLRUMTExKikpUXR0dGOWjssUD8QDIJ2/ilBUVKTU1NRGe/hbsKnrM6vv3++AGexbVVWllStXqry8XOnp6dq5c6fOnj2roUOHerbp2rWrUlJStG3bNgcrBQAAgcLxwb6fffaZ0tPTdebMGbVs2VJr165Vt27dVFBQoPDwcMXGxnptHx8fr6NHj9a6v4qKClVUVHiWS0tLG6t0AADgMMfPyHTp0kUFBQXavn27HnroIWVkZOiLL77weX/Z2dmKiYnxvJKTk/1YLQAAdQuwERsBzR+fleNBJjw8XB07dlTv3r2VnZ2tnj17atGiRUpISFBlZaXX9OCSdOzYMSUkJNS6v5kzZ6qkpMTzOnz4cCP3AAAAKSwsTJJ0+vRphyuxx4XP6sJn5wvHLy39mNvtVkVFhXr37q2wsDDl5eVp7Nixks5PWnXo0CGlp6fX+v6IiAjPw3kAAGgqISEhio2N1fHjxyVJLVq08Dz1Ft6MMTp9+rSOHz+u2NhYhYSE+LwvR4PMzJkzNWLECKWkpOjUqVNasWKFNm/erPXr1ysmJkaTJk1SVlaWWrVqpejoaD388MNKT0+v9x1LAAA0pQtXDC6EGdQtNja2zqss9eFokDl+/LjuueceFRcXKyYmRmlpaVq/fr1+8YtfSJL+9Kc/qVmzZho7dqwqKio0bNgwvfjii06WDABArVwulxITExUXF6ezZ886XU5ACwsLu6QzMRcE3HNk/I3nyKCx8RwZAPA/654jAwAA0FAEGQAAYC2CDAAAsBZBBgAAWIsgAwAArEWQAQAA1iLIAAAAaxFkAACAtQgyAADAWgQZAABgLYIMAACwFkEGAABYiyADAACsRZABAADWIsgAAABrEWQAAIC1CDIAAMBaBBkAAGAtggwAALAWQQYAAFiLIAMAAKxFkAEAANYiyAAAAGsRZAAAgLUIMgAAwFoEGQAAYC2CDAAAsBZBBgAAWCvU6QKAQNR+xrvV2r6eN8qBSgAAdeGMDAAAsBZBBgAAWIsgAwAArEWQAQAA1iLIAAAAaxFkAACAtQgyAADAWgQZAABgLYIMAACwFkEGAABYiykKYK2aphGQmEoAAC4nnJEBAADWIsgAAABrEWQAAIC1CDIAAMBaBBkAAGAtggwAALCWo0EmOztbffr0UVRUlOLi4jR69GgVFhZ6bTN48GC5XC6v14MPPuhQxQAAIJA4GmTy8/OVmZmpDz/8UBs2bNDZs2d18803q7y83Gu7+++/X8XFxZ7Xs88+61DFAAAgkDj6QLx169Z5Lefm5iouLk47d+7UoEGDPO0tWrRQQkJCU5cHAAACXECNkSkpKZEktWrVyqv91VdfVZs2bdS9e3fNnDlTp0+frnUfFRUVKi0t9XoBAIDgFDBTFLjdbk2dOlX9+/dX9+7dPe1333232rVrp6SkJO3evVvTp09XYWGh1qxZU+N+srOzNWfOnKYqGwGoIVMX1LZtoKipvtqmYGDKBgCXo4AJMpmZmdqzZ4+2bt3q1f7AAw94/t2jRw8lJiZqyJAhOnDggDp06FBtPzNnzlRWVpZnubS0VMnJyY1XOAAAcExABJnJkyfrnXfe0ZYtW9S2bds6t+3Xr58kaf/+/TUGmYiICEVERDRKnQAAILA4GmSMMXr44Ye1du1abd68WampqRd9T0FBgSQpMTGxkasDAACBztEgk5mZqRUrVujNN99UVFSUjh49KkmKiYlRZGSkDhw4oBUrVmjkyJFq3bq1du/erWnTpmnQoEFKS0tzsnQAABAAHA0yS5YskXT+oXc/lJOTo4kTJyo8PFwbN27Uc889p/LyciUnJ2vs2LH67W9/60C1AAAg0Dh+aakuycnJys/Pb6JqAACAbQLqOTIAAAANQZABAADWIsgAAABrEWQAAIC1CDIAAMBaAfFkXyAYNWSeJACAbzgjAwAArEWQAQAA1iLIAAAAaxFkAACAtQgyAADAWgQZAABgLYIMAACwFkEGAABYiyADAACsRZABAADWIsg
|
|||
|
"text/plain": [
|
|||
|
"<Figure size 640x480 with 1 Axes>"
|
|||
|
]
|
|||
|
},
|
|||
|
"metadata": {},
|
|||
|
"output_type": "display_data"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"data.plot.hist(column=[\"Age\"], bins=80)"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"Визуализация - Точечная диаграмма"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 9,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"text/plain": [
|
|||
|
"<Axes: xlabel='Pclass', ylabel='Age'>"
|
|||
|
]
|
|||
|
},
|
|||
|
"execution_count": 9,
|
|||
|
"metadata": {},
|
|||
|
"output_type": "execute_result"
|
|||
|
},
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAlEAAAGwCAYAAACJjDBkAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjkuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8hTgPZAAAACXBIWXMAAA9hAAAPYQGoP6dpAAAw8UlEQVR4nO3deXRUVb728acyQghJIGEmgUAYRAwEAxIG0QZRRL04cmlEaBVbhRbQRkARnBB9udxmUnEAAbVlukLT0toiQhSkhQgBgRYCBIIyQwZIEITs9w+bMkVVhdQmsZL4/ayVtahdu3b9dp1zdj1UTp04jDFGAAAA8EmAvwsAAACoiAhRAAAAFghRAAAAFghRAAAAFghRAAAAFghRAAAAFghRAAAAFoL8XUBlVVhYqAMHDqh69epyOBz+LgcAAJSAMUYnT55U/fr1FRBQ/GdNhKgycuDAAcXGxvq7DAAAYGH//v1q2LBhsX0IUWWkevXqkn7eCBEREX6uBgAAlEReXp5iY2Od7+PFIUSVkQu/wouIiCBEAQBQwZTkVBxOLAcAALBAiAIAALBAiAIAALBAiAIAALBAiAIAALBAiAIAALBAiAIAALBAiAIAALBAiAIAALDg1xBljNFDDz2kmjVryuFwKD093S917N2716/PDwAAKh6//tmXTz75RHPmzNHq1avVpEkTxcTE+LOcCid1xxEtTf9BDkm3t2uors1qOe97YkG6vt57XClNYjTp7jbO/unf56hdXA2Xvs8v26av9hxTl4RaGntLK2f7jJUZWrv7mLo2q6VHr08odow9R09p34kCNY6upviYai41Xtzf07jFjeGt3dtr4qm+os95U+u62neiQF/uPKp/H8xzq8PTa+etveOEFTp88qzqRYTqq6d6OPs+NHeDvtmfrfaNamrmgORi6/PWt+vLK/VD7o+Kjaqq1FG/K3Z7JY7/RHlnzisyNFCbn7up2L7e2r3N21t9ntq7T1qlfdkFio+upjfuS3Zut4nLt3scY8H6LK3LPK7OTWN0daMa2neiQB98vU/bD+a51eFtv+n/5jptOZCrtg2j9O6DHYut2du+5Mvr4a3dU31F53d38i9/kNzbfuqpv7fn88aXY86XNcGXY9xbf2+vhy/Hvre+3sb2xJc1xVt/b/PGb4vDGGP89eQzZszQpEmTtG/fPn+VIOnnT6Li4+O1adMmtW3btlTGzMvLU2RkpHJzc0v9b+ftO56vW6evUd6P51zaI6oE6k/XJ2jCxzvcHhMW5FDBuV82dY2wYP35huZ6+m/b3PqO7NFMkz7LcGsPDw3UqTPnXcZ474EOeuWTnfoi46iz/dpmtfTkTc01YNZ6ZRf85GyvFhKg/LOFbuO+fV+y5q3b5zbGi31aa+zSrW7t0/slKTIs2O016fPqWpfnqxEWrHG3XKERC7e4PacnQ69tohlf7HFrv7d9Q7234fsSjdGuQXVt/OGkW/ufezbXrDWZLvWFBUoF5926KjkuQmlZeW7t1ybU1Be7TpSojsT64dpy4JRb+5Bu8Xo1NbNEY9yVVF+LNx1wa+/Tpq6Wbj5UojG8GXp9vGam7tW5wksvP0Oui9erq91r7t+hod5fX7LtMq53S63eedxtX7o9qV6J94/+1zTU+1+7P9/Qbk00I9V9vwl0SOeLTC8owKGZ/dtp5P9tcdtPJ92ZqIff3+jyejgkeXp1pvVtq9uSGri1ezoGLj5mL5h6Txs9+9F2tzpG3tBcT3lYE66sH6FtB37ZJ69tVktP3thcA2avdxvD05rQLjZSW37I1bkih39QgEPvPdBBr63eU6Jjv1PTaBkjrdtz3KXvI92aaMDs9S6vXVCAQ8uGdFarBpEu88gpOKvHPkgv0ZrirX+HxjW04/BJ5Z7+Zf2tERasZUO6KDY6zG0MVDy+vH/7LUQNGjRIc+fOdd5u1KiR9uzZo1deeUVvvvmmDh06pObNm+uZZ57RXXfdJUlavXq1rr/+en3yyScaPXq0vvvuO6WkpGj+/Pn65ptv9Pjjj+uHH37QLbfcorffflthYT/v0J988olefPFFbd26VYGBgUpJSdHUqVPVtGlTSZ5D1NatWzVy5Eh9+eWXqlatmnr27Km//OUvJf60rCxDVNLzn7osXP4UFOCQMdL5IrtRoMMhh0MleoMs+piLx4ioGqS80+fc2jsnxGjeAx1cHl+eXhOUT572sfP++z/kZdn7cm+3tl/zGCjuGPe0JlxqrJIc+yV57MV17HrpZpe2+2at19pdx0q0pnjr702NsGBtGtfzkv1Q/vny/u23c6KmTp2q559/Xg0bNtTBgwe1YcMGTZw4UfPmzdPMmTO1bds2jRgxQvfee69SU1NdHvvss89qxowZ+uqrr7R//37dc889mjJliv76179q+fLl+vTTTzV9+nRn//z8fD3++ONKS0vTypUrFRAQoNtvv12Fhe6fikhSTk6Ofve73ykpKUlpaWn65JNPdPjwYd1zzz1e53PmzBnl5eW5/JSF1B1HylVYOFdo3BaY88b4FKAuPObi29kFP3ls/yLjqDKP5TvbyttrgvLJ075UUY1ctNnl9q99DBR3jHtaEy411sW3PR37JXnsxXUsStvvvL3n6Cl9kXG0RGtKcf29yS74SV8W+cQKvw1+OycqMjJS1atXV2BgoOrWraszZ87opZde0meffaaUlBRJUpMmTbRmzRq98cYb6tatm/OxL774ojp37ixJeuCBBzRmzBjt3r1bTZo0kSTdddddWrVqlUaNGiVJuvPOO12ee/bs2apVq5a2b9+u1q1bu9U2Y8YMJSUl6aWXXnJ5TGxsrHbu3KnmzZu7PWbixIl67rnnLvNVubT073PK/Dkqgr3H853nJvCa4Ldm3Z5jLrc5Bjxbu/uY8/yofScKiu1bdE0pSX9PNmZlc37Ub0y5ucTBrl27VFBQoBtuuEHh4eHOn3nz5mn37t0ufRMTE53/rlOnjsLCwpwB6kLbkSNHnLczMjLUr18/NWnSRBEREWrcuLEkKSsry2Mtmzdv1qpVq1zqaNmypSS51XLBmDFjlJub6/zZv3+/x36Xq23DqDIZt6JpHP3LYsdrgt+alCaupxVwDHjWuekvr1OjmsWfr1R0TSlJf0/axdXw+TGo2Pz67byiTp36+STY5cuXq0ED15MmQ0NDXW4HB/9yAqDD4XC5faGt6K/qbr31VjVq1EhvvfWW6tevr8LCQrVu3Vpnz571Wsutt96qV155xe2+evXqeXxMaGioW51loVuL2qoRFlxufn3lr3Oiiv6Psby9JiifKtM5URd/S+/XPgYqyjlRRb+l16RWuK5tVsvrOVEXf0vPW39vaoQF8ynUb1C5+SSqVatWCg0NVVZWlhISElx+YmOL/7pqcY4fP64dO3Zo7Nix6t69u6644gplZ2cX+5h27dpp27Ztaty4sVst1apd+uuwZW3ZkC6KqOKefyOqBGpc7ys8PiYsyOFyu0ZYsF6+3f1XmZI0sqf7ryuln7/pc/EYy4Z0VucE1/8Vd06I0bIhnVXjom+7hId43t1m3ZfsZYwuHtun90tyG2PZkC5uz1cjLFjT+rb1+Jye/On6ph7b7+tY8v0vOdbzSYgjezZ3qy8s0GNXdWwc6bH9+ubRJa6jbYPqHtu9zdGTvsnu3wCTpNvbev6PhC/+dH1TBQU4Lt1RpbNdxvW+wuO+5Mv+4e35vNUXeNH0ggIcmnVfssf9dNZ9yW6vh7dXx1vNno6Bi4/ZomN4qsPbmnBlfdf92tsx7m1NaBcbpaCLDv+gAIcWDO5Y4mO/U9NopTSJduu7YHBHt9fuwrfzLja9X1KJ1xRv/Ts0rqnIqq7r74Vv5+G3x6+XOJgyZYqmTJmivXv3SpLGjh2rmTNnavLkyerSpYtyc3O1du1aRUREaODAgc5v52VnZysqKkqSNGfOHA0fPlw5OTnOcZ999lktXbpU6enpKiwsVO3atdWrVy+NHz9eWVlZGj16tDZs2KAlS5aoT58+bt/OO3DggNq2batu3brpySefVM2aNbVr1y7Nnz9fb7/9tgIDvbz7FVGW38674MuMo1qy8QdJxu0
|
|||
|
"text/plain": [
|
|||
|
"<Figure size 640x480 with 1 Axes>"
|
|||
|
]
|
|||
|
},
|
|||
|
"metadata": {},
|
|||
|
"output_type": "display_data"
|
|||
|
},
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAjIAAAGwCAYAAACzXI8XAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjkuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8hTgPZAAAACXBIWXMAAA9hAAAPYQGoP6dpAABLqUlEQVR4nO3dfVwVdfo//tfhHgQO9yDJrRLeJN5DqGkmRa5r+cvM/LRlZdtWaKt2s9Jv07XaoFtL09zM1G68yW01u9FuSDEV71BKswgEBUNuJOBwk4Aw3z+Ik0cOcxg4Z2aO83o+HuexMdecwzU7DueamWveb50gCAKIiIiI7JCD0gkQERERdRcLGSIiIrJbLGSIiIjIbrGQISIiIrvFQoaIiIjsFgsZIiIislssZIiIiMhuOSmdgK21traipKQEXl5e0Ol0SqdDREREXSAIAmpraxEaGgoHh86vu1zxhUxJSQnCwsKUToOIiIi6obi4GH369Ok0fsUXMl5eXgDa/o/w9vZWOBsiIiLqCoPBgLCwMOP3eGeu+EKm/XaSt7c3CxkiIiI7Y6kthM2+REREZLdYyBAREZHdYiFDREREdouFDBEREdktFjJERERkt1jIEBERkd1iIUNERER2i4UMERER2S0WMkRERGS3WMgQERGR3VK0kGlpacHTTz+NqKgouLu7o2/fvnj22WchCIJxHUEQsGjRIvTu3Rvu7u5ISkpCXl6eglm3Kaiow67cchSer1c6FSIiIs1SdK6lF154AW+++SbWr1+PQYMG4ciRI7jvvvug1+vx6KOPAgBefPFFLFu2DOvXr0dUVBSefvppJCcn4+TJk3Bzc5M95+qGJjy6MQd78iqMy8bFBGL5zGHQezjLng8REZGW6YRLL3/I7M9//jOCg4OxZs0a47Jp06bB3d0d77//PgRBQGhoKB577DE8/vjjAICamhoEBwdj3bp1uPPOOy3+DoPBAL1ej5qaGqtMGnnPmkPYl38eLZf83+ao02FMvwC8Ozu+x59PREREXf/+VvTW0ujRo5GRkYGff/4ZAPDdd99h7969mDRpEgCgsLAQpaWlSEpKMr5Hr9cjISEBWVlZZj+zsbERBoPB5GUtBRV12JNXYVLEAECLIGBPXgVvMxEREclM0VtLCxcuhMFgQP/+/eHo6IiWlhb8+9//xl133QUAKC0tBQAEBwebvC84ONgYu1xaWhqWLFlik3zP/NogGj9dWY+ogF42+d1ERETUkaJXZD788EN88MEH2LBhA44ePYr169fj5Zdfxvr167v9mampqaipqTG+iouLrZZvhJ+HaDzSn0UMERGRnBS9IvPEE09g4cKFxl6XwYMH48yZM0hLS8OsWbMQEhICACgrK0Pv3r2N7ysrK8PQoUPNfqarqytcXV1tkm90oCfGxQR22iPDqzFERETyUvSKTENDAxwcTFNwdHREa2srACAqKgohISHIyMgwxg0GAw4ePIjExERZc223fOYwjOkXYLJsTL8ALJ85TJF8iIiItEzRKzJTpkzBv//9b4SHh2PQoEE4duwYXn31Vdx///0AAJ1Oh3nz5uG5555DTEyM8fHr0NBQTJ06VZGc9R7OeHd2PArP1+N0ZT0i/XvxSgwREZFCFC1kli9fjqeffhqPPPIIysvLERoair/97W9YtGiRcZ0nn3wS9fX1ePDBB1FdXY2xY8di586diowhc6moABYwRERESlN0HBk5WHscGSIiIrI9uxhHhoiIiKgnWMgQERGR3WIhQ0RERHaLhQwRERHZLRYyREREZLdYyBAREZHdYiFDREREdouFDBEREdktFjJERERkt1jIEBERkd1iIUNERER2i4UMERER2S0WMkRERGS3WMgQERGR3XJSOgEiIiKyTwUVdTjzawMi/XshKqCXIjmwkCEiIiJJqhua8OjGHOzJqzAuGxcTiOUzh0Hv4SxrLry1RERERJI8ujEH+/LPmyzbl38eczcekz0XFjJERETUZQUVddiTV4EWQTBZ3iII2JNXgcLz9bLmw0KGiIiIuuzMrw2i8dOVLGSIiIhIpSL8PETjkf7yNv2ykCEiIqIuiw70xLiYQDjqdCbLHXU6jIsJlP3pJRYyREREJMnymcMwpl+AybIx/QKwfOYw2XPh49dEREQkid7DGe/Ojkfh+XqcrqznODJERERkf6IClCtg2vHWEhEREdktFjJERERkt1jIEBERkd1ij0w3ZeaWI+dsNYaH++K6mECl0yEiItIkFjISnamsx9QV+1DV0Gxc5uvhjO0pYxHmLz5IEBEREVkXby1JdHkRAwBVDc24ZcVehTIiIiJSRkFFHXbllss+v9KleEVGgszc8g5FTLuqhmZ8m1fB20xERHTFq25owqMbc7Anr8K4bFxMIJbPHAa9h7OsufCKjAQ5Z6tF40eLquRJhIgAqONskEiLHt2Yg335502W7cs/j7kbj8mei6KFTGRkJHQ6XYdXSkoKAODChQtISUmBv78/PD09MW3aNJSVlSmW79A+PqLx4eG+8iRCpHHVDU24Z80h3PBKJu5bexgTXt6Ne9YcQk0nV0yJyHoKKuqwJ68CLYJgsrxFELAnr0L2EwtFC5nDhw/j3LlzxtdXX30FAJg+fToAYP78+fjkk0+wZcsWZGZmoqSkBLfddpti+Y6PDYKTg85szMlBx9tKRDJR09kgkdac+bVBNH66Ut5CRtEemcBA0y/+9PR09O3bF+PHj0dNTQ3WrFmDDRs24IYbbgAArF27FgMGDMCBAwdw7bXXmv3MxsZGNDY2Gn82GAxWy7egog4XWwWzsYutAgrP1ys+VDPRla79bPByl54N8jgksp0IP/EndCP9NTr7dVNTE95//33cf//90Ol0yM7ORnNzM5KSkozr9O/fH+Hh4cjKyur0c9LS0qDX642vsLAwq+WotiqUSIt4HBIpKzrQE+NiAuGoM71D4ajTYVxMoOwnEqopZLZt24bq6mrce++9AIDS0lK4uLjAx8fHZL3g4GCUlpZ2+jmpqamoqakxvoqLi62Wo9qqUCIt4nFIpLzlM4dhTL8Ak2Vj+gVg+cxhsueimsev16xZg0mTJiE0NLRHn+Pq6gpXV1crZWWqvQrdl3/epMnJUafDmH4BvJxNJAMeh0TK03s4493Z8Sg8X4/TlfWI9FduFmxVXJE5c+YMvv76azzwwAPGZSEhIWhqakJ1dbXJumVlZQgJCZE5wz+oqQol0ioeh0TqEBXQCxNigxQ9gVDFFZm1a9ciKCgIkydPNi4bMWIEnJ2dkZGRgWnTpgEAcnNzUVRUhMTERKVSVVUVSqRVPA6JqJ3ihUxrayvWrl2LWbNmwcnpj3T0ej1mz56NBQsWwM/PD97e3pg7dy4SExM7fWJJTlEB/MNJpDQeh0SkeCHz9ddfo6ioCPfff3+H2NKlS+Hg4IBp06ahsbERycnJWLlypQJZEhERkRrpBEEwPzDKFcJgMECv16Ompgbe3t5Kp0NERERd0NXvb1U0+xIRERF1BwsZIiIislssZIiIiMhusZAhIiIiu8VChoiIiOyW4o9fExF1V0FFHc782sAB8Yg0jIUMEdmd6oYmPLoxB3vyKozLxsUEYvnMYdB7OCuYGRHJjbeWiMjuPLoxB/vyz5ss25d/HnM3HlMoIyJSCgsZIrIrBRV12JNXYTLzNQC0CAL25FWg8Hy9QpkRkRJYyHRTZm45Xs/4Gd9ecmmbiGzvzK8NovHTlSxkiORSUFGHXbnlip5AsEdGojOV9Zi6Yh+qGpqNy3w9nLE9ZSzC/D0UzIxIGyL8xI+zSH82/RLZmpr61HhFRqLLixgAqGpoxi0r9iqUEZG2RAd6YlxMIBx1OpPljjodxsUE8uklIhmoqU+NhYwEmbnlHYqYdlUNzbzNRCST5TOHYUy/AJNlY/oFYPnMYQplRKQdautT460lCXLOVovGjxZV4bqYQHmSIdIwvYcz3p0dj8Lz9ThdWc9xZIhk1JU+NTmPRxYyEgzt4yMaHx7uK08iRAQAiApgAUMkN7X1qfHWkgTjY4NE47waQ0REVzq19amxkJEgM7dcNM4eGSIi0gI19anx1pI
|
|||
|
"text/plain": [
|
|||
|
"<Figure size 640x480 with 1 Axes>"
|
|||
|
]
|
|||
|
},
|
|||
|
"metadata": {},
|
|||
|
"output_type": "display_data"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"df.plot.scatter(x=\"Age\", y=\"Sex\")\n",
|
|||
|
"\n",
|
|||
|
"df.plot.scatter(x=\"Pclass\", y=\"Age\")"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"Визуализация - Столбчатая диаграмма"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 10,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"text/plain": [
|
|||
|
"<matplotlib.legend.Legend at 0x1ac1cd1c6e0>"
|
|||
|
]
|
|||
|
},
|
|||
|
"execution_count": 10,
|
|||
|
"metadata": {},
|
|||
|
"output_type": "execute_result"
|
|||
|
},
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAigAAAGrCAYAAADqwWxuAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjkuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8hTgPZAAAACXBIWXMAAA9hAAAPYQGoP6dpAAAqnElEQVR4nO3deXhU5aHH8d8kIRtkJg2QTPKQsIrsaxAjiAgpIVhkVZZUiXLhyqKFWGlzryyCvUGuCkW223uvBIUIUgsCAkJZwhZQ0oKK7AWDDyThgsmwJYRk7h88TDslLIGEeRO+n+c5z+PMec+Zd2Da+XLOmRmL0+l0CgAAwCBenp4AAADAPyNQAACAcQgUAABgHAIFAAAYh0ABAADGIVAAAIBxCBQAAGAcH09P4F6UlJTo9OnTCgoKksVi8fR0AADAXXA6nbpw4YIiIiLk5XX7YySVMlBOnz6tyMhIT08DAADcg1OnTqlOnTq3HVMpAyUoKEjS9SdotVo9PBsAAHA3HA6HIiMjXe/jt1MpA+XGaR2r1UqgAABQydzN5RlcJAsAAIxDoAAAAOMQKAAAwDiV8hqUu1VcXKyioiJPTwOGqVatmry9vT09DQDAbVTJQHE6ncrOzlZeXp6npwJDBQcHy2638z06AGCoKhkoN+IkNDRUgYGBvAnBxel06vLly8rNzZUkhYeHe3hGAIDSVLlAKS4udsVJzZo1PT0dGCggIECSlJubq9DQUE73AICBqtxFsjeuOQkMDPTwTGCyG68PrlECADNVuUC5gdM6uB1eHwBgtiobKAAAoPIiUAAAgHGq3EWyt5W+98E91lPRD+6xKpGTJ0+qfv36+utf/6o2bdpU2ONMmTJFK1eu1L59+yrsMQAAFYcjKIZITEyUxWLR9OnT3e5fuXJlma+XqFevnmbNmlWOsys/kZGROnPmjFq0aOHpqQAADEagGMTf31/vvPOOfvrpJ09P5Z7czSdivL29Zbfb5ePzcB28AwCUDYFikNjYWNntdqWkpNx23GeffabmzZvLz89P9erV03vvveda17VrV/3www8aP368LBbLLY++OJ1OTZkyRVFRUfLz81NERIRee+0113qLxaKVK1e6bRMcHKzU1FRJ10/VWCwWLVu2TE899ZT8/f01f/58BQQEaN26dW7brVixQkFBQbp8+bJru3379qmkpER16tTR/Pnz3cb/9a9/lZeXl3744QdJUl5env7lX/5FtWvXltVqVbdu3bR//363baZPn66wsDAFBQVp+PDhKigouO2fIQDAbPwz1iDe3t76j//4Dw0dOlSvvfaa6tSpc9OYzMxMPf/885oyZYoGDRqkXbt2afTo0apZs6YSExP1pz/9Sa1bt9bIkSM1YsSIWz7WZ599ppkzZ2rp0qVq3ry5srOzb3rTvxu//e1v9d5776lt27by9/fX9u3blZaWpvj4eNeYJUuWqG/fvjd9N42Xl5eGDBmitLQ0jRo1ym18p06dVLduXUnSc8895wofm82m//qv/1L37t115MgRhYSE6NNPP9WUKVM0d+5cde7cWR9//LFmz56tBg0alPn5APCAB3l94L3iusIHjiMohunXr5/atGmjyZMnl7r+/fffV/fu3TVx4kQ1btxYiYmJGjt2rP7zP/9TkhQSEiJvb28FBQXJbrfLbreXup+srCzZ7XbFxsYqKipKjz322G2D5lbGjRun/v37q379+goPD1dCQoJWrlypy5cvS5IcDoe++OILJSQklLp9QkKCdu7cqaysLElSSUmJli5d6hq/Y8cOffXVV1q+fLmio6P1yCOP6N1331VwcLD++Mc/SpJmzZql4cOHa/jw4Xr00Uf19ttvq1mzZmV+LgAAcxAoBnrnnXe0aNEiHTx48KZ1Bw8eVKdOndzu69Spk44ePari4uK7foznnntOV65cUYMGDTRixAitWLFC165dK/Nco6Pd/1XRq1cvVatWTatWrZJ0/UiN1WpVbGxsqdu3adNGTZs2VVpamiQpPT1dubm5eu655yRJ+/fv18WLF1WzZk3VqFHDtZw4cULHjx+XdP3PpGPHjm77jYmJKfNzAQCYg0AxUJcuXRQXF6fk5OQKe4zIyEgdPnxY8+bNU0BAgEaPHq0uXbq4LnS1WCxyOp1u25R2EWz16tXdbvv6+mrgwIGu4EhLS9OgQYNue1FsQkKC2/iePXu6fkfp4sWLCg8P1759+9yWw4cP64033rj3PwAAgNEIFENNnz5dq1evVkZGhtv9TZs21c6dO93u27lzpxo3buz60TtfX9+7OpoSEBCg3r17a/bs2dq6dasyMjL07bffSpJq166tM2fOuMYePXrUddrmThISErR+/XodOHBAmzdvvuXpnRuGDh2q7777TpmZmfrjH//oNr5du3bKzs6Wj4+PGjVq5LbUqlXL9WeyZ88et33u3r37ruYKADATF8kaqmXLlkpISNDs2bPd7n/99dfVoUMHTZs2TYMGDVJGRobmzJmjefPmucbUq1dP27Zt0+DBg+Xn5+d6I/9HqampKi4uVseOHRUYGKjFixcrICDAdWFqt27dNGfOHMXExKi4uFi/+c1vVK1atbuae5cuXWS325WQkKD69evfdPrln9WrV09PPPGEhg8fruLiYj377LOudbGxsYqJiVHfvn01Y8YMNW7cWKdPn9YXX3yhfv36KTo6Wr/61a+UmJio6OhoderUSUuWLNGBAwe4SBYAKrGHK1Aq2VXYU6dO1bJly9zua9eunT799FNNmjRJ06ZNU3h4uKZOnarExES37f71X/9VDRs2VGFh4U2naqTrHxmePn26kpKSVFxcrJYtW2r16tWuUyvvvfeeXnrpJT355JOKiIjQ73//e2VmZt7VvC0Wi4YMGaIZM2Zo0qRJd7VNQkKCRo8erRdffFEBAQFu+1q7dq3+/d//XS+99JLOnj0ru92uLl26KCwsTJI0aNAgHT9+XBMmTFBBQYEGDBigUaNG6csvv7yrxwYAmMfiLO3dy3AOh0M2m035+fmyWq1u6woKCnTixAnVr19f/v7+HpohTMfrBDAIHzN+aNzu/fufcQ0KAAAwDoECAACMQ6AAAADjECgAAMA4BAoAADAOgQIAAIxDoAAAAOMQKAAAwDgECrR161ZZLBbl5eVV6OMkJiaqb9++FfoYAICq4aH6qnvLW5YH9ljOyWX/gt6zZ89q0qRJ+uKLL5STk6Of/exnat26tSZNmqROnTpVwCyve+KJJ3TmzBnZbLYKewwAAMrioQoU0w0YMEBXr17VokWL1KBBA+Xk5GjTpk06d+7cPe3P6XSquLhYPj63/2v29fWV3W6/p8cAAKAicIrHEHl5edq+fbveeecdPf3006pbt64ee+wxJScn69lnn9XJkydlsVi0b98+t20sFou2bt0q6e+natatW6f27dvLz89PH374oSwWiw4dOuT2eDNnzlTDhg3dtsvLy5PD4VBAQIDWrVvnNn7FihUKCgrS5cuXJUmnTp3S888/r+DgYIWEhKhPnz46efKka3xxcbGSkpIUHBysmjVrasKECaX+aCEAAKUhUAxRo0YN1ahRQytXrlRhYeF97eu3v/2tpk+froMHD2rgwIGKjo7WkiVL3MYsWbJEQ4cOvWlbq9WqX/ziF0pLS7tpfN++fRUYGKiioiLFxcUpKChI27dv186dO1WjRg317NlTV69elXT915BTU1P14YcfaseOHTp//rxWrFhxX88LAPDwIFAM4ePjo9TUVC1atEjBwcHq1KmT/u3f/k3ffPNNmfc1depU/fznP1fDhg0VEhKihIQEffLJJ671R44cUWZmphISEkrdPiEhQStXrnQdLXE4HPriiy9c45ctW6aSkhL9z//8j1q2bKmmTZtq4cKFysrKch3NmTVrlpKTk9W/f381bdpUCxYs4BoXAMBdK1OgpKSkqEOHDgoKClJoaKj69u2rw4cPu43p2rWrLBaL2/LKK6+4jcnKytIzzzyjwMBAhYaG6o033tC1a9fu/9lUcgMGDNDp06e1atUq9ezZU1u3blW7du2Umppapv1ER7v/LPjgwYN18uRJ7d69W9L
|
|||
|
"text/plain": [
|
|||
|
"<Figure size 640x480 with 1 Axes>"
|
|||
|
]
|
|||
|
},
|
|||
|
"metadata": {},
|
|||
|
"output_type": "display_data"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"plot = data.groupby([\"Pclass\", \"Survived\"]).size().unstack().plot.bar(color=[\"pink\", \"green\"])\n",
|
|||
|
"plot.legend([\"Not survived\", \"Survived\"])"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "markdown",
|
|||
|
"metadata": {},
|
|||
|
"source": [
|
|||
|
"Визуализация - Временные ряды"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"cell_type": "code",
|
|||
|
"execution_count": 11,
|
|||
|
"metadata": {},
|
|||
|
"outputs": [
|
|||
|
{
|
|||
|
"name": "stdout",
|
|||
|
"output_type": "stream",
|
|||
|
"text": [
|
|||
|
"<class 'pandas.core.frame.DataFrame'>\n",
|
|||
|
"RangeIndex: 243 entries, 0 to 242\n",
|
|||
|
"Data columns (total 6 columns):\n",
|
|||
|
" # Column Non-Null Count Dtype \n",
|
|||
|
"--- ------ -------------- ----- \n",
|
|||
|
" 0 my_date 243 non-null object \n",
|
|||
|
" 1 my_value 243 non-null float64 \n",
|
|||
|
" 2 bullet 2 non-null object \n",
|
|||
|
" 3 bulletClass 2 non-null object \n",
|
|||
|
" 4 label 2 non-null object \n",
|
|||
|
" 5 date 243 non-null datetime64[ns]\n",
|
|||
|
"dtypes: datetime64[ns](1), float64(1), object(4)\n",
|
|||
|
"memory usage: 11.5+ KB\n",
|
|||
|
" my_date my_value bullet bulletClass label date\n",
|
|||
|
"0 28.03.2023 76.5662 NaN NaN NaN 2023-03-28\n",
|
|||
|
"1 31.03.2023 77.0863 NaN NaN NaN 2023-03-31\n",
|
|||
|
"2 01.04.2023 77.3233 NaN NaN NaN 2023-04-01\n",
|
|||
|
"3 04.04.2023 77.9510 NaN NaN NaN 2023-04-04\n",
|
|||
|
"4 05.04.2023 79.3563 NaN NaN NaN 2023-04-05\n",
|
|||
|
".. ... ... ... ... ... ...\n",
|
|||
|
"238 20.03.2024 92.2243 NaN NaN NaN 2024-03-20\n",
|
|||
|
"239 21.03.2024 92.6861 NaN NaN NaN 2024-03-21\n",
|
|||
|
"240 22.03.2024 91.9499 NaN NaN NaN 2024-03-22\n",
|
|||
|
"241 23.03.2024 92.6118 NaN NaN NaN 2024-03-23\n",
|
|||
|
"242 26.03.2024 92.7761 NaN NaN NaN 2024-03-26\n",
|
|||
|
"\n",
|
|||
|
"[243 rows x 6 columns]\n"
|
|||
|
]
|
|||
|
},
|
|||
|
{
|
|||
|
"data": {
|
|||
|
"image/png": "iVBORw0KGgoAAAANSUhEUgAAAigAAAHGCAYAAABeq3DqAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjkuMiwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy8hTgPZAAAACXBIWXMAAA9hAAAPYQGoP6dpAAChdUlEQVR4nOzdd3xT9foH8M/JaNK994aWvRHKEhCZooBywYEyHCBe9aL3yhWvoIheRP2J4zq5iqgo6FVBVEAEWbIrlA2lLbRQ2tKZDrqS5/dHmkPTpOOkSXvSPu/Xqy9Ncs75PpyTnDz5ToGICIwxxhhjMqJo7QAYY4wxxuriBIUxxhhjssMJCmOMMcZkhxMUxhhjjMkOJyiMMcYYkx1OUBhjjDEmO5ygMMYYY0x2VK0dgC0MBgMyMzPh6ekJQRBaOxzGGGOMNQERobi4GGFhYVAoGq4jccoEJTMzE5GRka0dBmOMMcZskJGRgYiIiAa3ccoExdPTE4DxH+jl5dXK0TDGGGOsKXQ6HSIjI8Xv8YY4ZYJiatbx8vLiBIUxxhhzMk3pnsGdZBljjDEmO5ygMMYYY0x2OEFhjDHGmOw4ZR8UxhhjbY9er0dVVVVrh8GaQa1WQ6lU2uVYnKAwxhhrVUSErKwsFBYWtnYozA58fHwQEhLS7HnKOEFhjDHWqkzJSVBQENzc3HgCTidFRCgrK0NOTg4AIDQ0tFnH4wSFMcZYq9Hr9WJy4u/v39rhsGZydXUFAOTk5CAoKKhZzT3cSZYxxlirMfU5cXNza+VImL2YrmVz+xNxgsIYY6zVcbNO22Gva8kJCmOMMcZkhxMUxlibVF6lb+0QGGPNwAkKY6zNWbPvIros3oKd53JaOxTGZOPixYsQBAHHjh1r7VCahBMUxlibYjAQPtyVAgA4kJrfytEwxmzFCQpjrE05kJqHq0XlAIDCsspWjoYxZitOUBhzcuezi5F4qaC1w5CN7/68Iv5/AScoTomIUFZZ3Sp/RNTkOEeOHIknnngCCxYsgK+vL4KDg7Fq1SqUlpZizpw58PT0RFxcHDZv3gwiQlxcHN544w2zYxw7dgyCIODChQsNlnXffffh7rvvNnuuqqoKAQEB+PzzzwEAW7ZswbBhw+Dj4wN/f3/cfvvtSElJqfeYn332GXx8fMye27Bhg8UonI0bN6Jfv37QarXo0KEDli5diurq6sZOT7PxRG2MOTEiwn2rDqDoehUSF4+Bl1bd2iG1qrLKamw+eVV8XFDG67o4o+tVenRbsrVVyj790ji4uTT9q3HNmjVYuHAhDh06hPXr12P+/Pn44YcfcOedd+K5557DypUr8cADDyA9PR0PPvggVq9ejX/84x/i/qtXr8bw4cMRFxfXYDkzZszAtGnTUFJSAg8PDwDA1q1bUVZWhjvvvBMAUFpaiqeffhq9evVCSUkJlixZgjvvvBPHjh2DQmFbfcSePXswc+ZMvPPOO7j55puRkpKCuXPnAgBeeOEFm47ZVFyDwpgTKyirQm5JJar0hMJS/jLeeioLZZV6mH4AchMPc7TevXvj+eefR3x8PBYtWgStVouAgAA88sgjiI+Px5IlS5CXl4fjx49j9uzZOHfuHA4dOgTAWAPy1Vdf4cEHH2y0nHHjxsHd3R0//PCD+NxXX32FSZMmwdPTEwAwdepU3HXXXYiLi0OfPn3w6aef4sSJEzh9+rTN/76lS5fi2WefxaxZs9ChQweMGTMGy5Ytw0cffWTzMZuKa1AYc2KZhdfF/6+o5mG139c074zpGoxfT2dzDYqTclUrcfqlca1WthS9evUS/1+pVMLf3x89e/YUnwsODgZgnPp90KBBmDhxIj799FMMHDgQmzZtQkVFBaZNm9ZoOSqVCtOnT8fatWvxwAMPoLS0FBs3bsS6devEbZKTk7FkyRIcPHgQubm5MBgMAID09HT06NFD0r/LJCkpCX/88QdeeeUV8Tm9Xo/y8nKUlZU5dAZgTlAYc2KmzqAAUFFtaMVIWl9WUTn2XsgFADw4LBa/ns5GYVkliIhnKXUygiBIamZpTWq1ebOqIAhmz5nee6Zk4eGHH8YDDzyAlStXYvXq1bj77rub/CU/Y8YMjBgxAjk5Odi2bRtcXV0xfvx48fU77rgD0dHRWLVqFcLCwmAwGNCjRw9UVlqvSVQoFBZ9bupOT19SUoKlS5firrvusthfq9U2KW5bOcc7gDFm1dWi2jUo7TtB2XDsCoiAgTF+6BXhDQCo0hNKK/Xw0PCtjsnDbbfdBnd3d3zwwQfYsmULdu/e3eR9hwwZgsjISKxfvx6bN2/GtGnTxGQoLy8P586dw6pVq3DzzTcDAPbu3dvg8QIDA1FcXIzS0lK4u7sDgMUcKf369cO5c+ca7SPjCPypZcyJZRbWrkFpv008RITvEi8DAO7sFw5XtRIuKgUqqw0oKK3kBIXJhlKpxOzZs7Fo0SLEx8dj8ODBkva/77778OGHH+L8+fP4/fffxed9fX3h7++Pjz/+GKGhoUhPT8ezzz7b4LESEhLg5uaG5557Dk8++SQOHjyIzz77zGybJUuW4Pbbb0dUVBT+8pe/QKFQICkpCSdPnsTLL78sKXapuJMsY06sdg1KZTuuQTl9VYfknBK4qBS4rWcoBEGAr5vxlyUPNWZy89BDD6GyshJz5syRvO+MGTNw+vRphIeHY+jQoeLzCoUC69atQ2JiInr06IGnnnoKr7/+eoPH8vPzw5dffolffvkFPXv2xNdff40XX3zRbJtx48bhp59+wq+//ooBAwZg0KBBWLlyJaKjoyXHLhX/rGDMiV0t5D4oAHDichEAICHWD96uxsTE180F2boK7ijLHGbnzp0Wz128eNHiubr9PK5cuQK1Wo2ZM2dKLrNr1671ztUyevRoixE7tbeNiYmx2HfKlCmYMmWK2XOPPPKI2eNx48Zh3LiW77TMCQpjTiyTa1AAAOn5ZQCAGH938TlfNxcAPNSYyUdFRQWuXbuGF198EdOmTRNH+DDrJDfx7N69G3fccQfCwsIgCAI2bNhg9joRYcmSJQgNDYWrqytGjx6N5ORks23y8/MxY8YMeHl5wcfHBw899BBKSkqa9Q9hrL0xGAjZOq5BAYCMAmOiFunnKj7n617TxFPKCQqTh6+//hrR0dEoLCzEa6+9Zvba2rVr4eHhYfWve/furRRx65Jcg1JaWorevXvjwQcftDrs6LXXXsM777yDNWvWIDY2FosXL8a4ceNw+vRpcUjSjBkzcPXqVWzbtg1VVVWYM2cO5s6di6+++qr5/yLG2onckgpU6W9U17bnGpSMmhqUKL8bwzV9ampQuImHycXs2bMxe/Zsq69NmjQJCQkJVl+rO5S5vZCcoEyYMAETJkyw+hoR4a233sLzzz+PyZMnAwA+//xzBAcHY8OGDbjnnntw5swZbNmyBYcPH8ZNN90EAHj33Xdx22234Y033kBYWFgz/jmMtR+ZteZAAdr3KB5TghLheyNBqd1J1mAgKBQ8F4qcSVkDpy3y9PQUZ4R1dva6lnYdxZOWloasrCyMHj1afM7b2xsJCQnYv38/AGD//v3w8fERkxPA2LFHoVDg4MGDVo9bUVEBnU5n9sdYe3e11iyyQPutQSmtqEZeTTNOlH/tBMVYg/L5/ku4/xPr9xbW+ky1A2VlZa0cCbMX07Vsbs2PXTvJZmVlAYBFx5/g4GDxtaysLAQFBZkHoVLBz89P3Kau5cuXY+nSpfYMlTGnZ1mD0j4TlIwC483Q21VttlhisNeNWS73peS1eFysaZRKJXx8fJCTkwMAcHNz45l/nRQRoaysDDk5OfDx8YFSKW3ZgLqcYhTPokWL8PTTT4uPdTodIiMjWzEixlof16AYZeRbdpAFgDHdgvHXWzrivd+Ny83rDQQlN/PIUkhICACISQpzbj4+PuI1bQ67JiimgLKzsxEaGio+n52djT59+ojb1H0TVldXIz8/v95/kEajgUajsWeojDk90zo8GpUCFdWGdtsHJd1KB1kA0KqVePyWeDFBKa/Sw51nlJUlQRAQGhqKoKAgi7VgmHNRq9XNrjkxseunNTY2FiE
|
|||
|
"text/plain": [
|
|||
|
"<Figure size 640x480 with 1 Axes>"
|
|||
|
]
|
|||
|
},
|
|||
|
"metadata": {},
|
|||
|
"output_type": "display_data"
|
|||
|
}
|
|||
|
],
|
|||
|
"source": [
|
|||
|
"from datetime import datetime\n",
|
|||
|
"import matplotlib.dates as md\n",
|
|||
|
"\n",
|
|||
|
"ts = pd.read_csv(\"data/dollar.csv\")\n",
|
|||
|
"ts[\"date\"] = ts.apply(lambda row: datetime.strptime(row[\"my_date\"], \"%d.%m.%Y\"), axis=1)\n",
|
|||
|
"ts.info()\n",
|
|||
|
"\n",
|
|||
|
"print(ts)\n",
|
|||
|
"\n",
|
|||
|
"plot = ts.plot.line(x=\"date\", y=\"my_value\")\n",
|
|||
|
"plot.xaxis.set_major_locator(md.DayLocator(interval=10))\n",
|
|||
|
"plot.xaxis.set_major_formatter(md.DateFormatter(\"%d.%m.%Y\"))\n",
|
|||
|
"plot.tick_params(axis=\"x\", labelrotation=90)"
|
|||
|
]
|
|||
|
}
|
|||
|
],
|
|||
|
"metadata": {
|
|||
|
"kernelspec": {
|
|||
|
"display_name": ".venv",
|
|||
|
"language": "python",
|
|||
|
"name": "python3"
|
|||
|
},
|
|||
|
"language_info": {
|
|||
|
"codemirror_mode": {
|
|||
|
"name": "ipython",
|
|||
|
"version": 3
|
|||
|
},
|
|||
|
"file_extension": ".py",
|
|||
|
"mimetype": "text/x-python",
|
|||
|
"name": "python",
|
|||
|
"nbconvert_exporter": "python",
|
|||
|
"pygments_lexer": "ipython3",
|
|||
|
"version": "3.12.5"
|
|||
|
}
|
|||
|
},
|
|||
|
"nbformat": 4,
|
|||
|
"nbformat_minor": 2
|
|||
|
}
|