{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "#### Загрузка набора данных" ] }, { "cell_type": "code", "execution_count": 69, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | Price | \n", "Levy | \n", "Manufacturer | \n", "Model | \n", "Prod. year | \n", "Category | \n", "Leather interior | \n", "Fuel type | \n", "Engine volume | \n", "Mileage | \n", "Cylinders | \n", "Gear box type | \n", "Drive wheels | \n", "Doors | \n", "Wheel | \n", "Color | \n", "Airbags | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "13328 | \n", "1399 | \n", "LEXUS | \n", "RX 450 | \n", "2010 | \n", "Jeep | \n", "Yes | \n", "Hybrid | \n", "3.5 | \n", "186005 | \n", "6 | \n", "Automatic | \n", "4x4 | \n", "Четырехдверный | \n", "Left wheel | \n", "Silver | \n", "12 | \n", "
1 | \n", "16621 | \n", "1018 | \n", "CHEVROLET | \n", "Equinox | \n", "2011 | \n", "Jeep | \n", "No | \n", "Petrol | \n", "3.0 | \n", "192000 | \n", "6 | \n", "Tiptronic | \n", "4x4 | \n", "Четырехдверный | \n", "Left wheel | \n", "Black | \n", "8 | \n", "
2 | \n", "8467 | \n", "0 | \n", "HONDA | \n", "FIT | \n", "2006 | \n", "Hatchback | \n", "No | \n", "Petrol | \n", "1.3 | \n", "200000 | \n", "4 | \n", "Variator | \n", "Front | \n", "Четырехдверный | \n", "Right-hand drive | \n", "Black | \n", "2 | \n", "
3 | \n", "3607 | \n", "862 | \n", "FORD | \n", "Escape | \n", "2011 | \n", "Jeep | \n", "Yes | \n", "Hybrid | \n", "2.5 | \n", "168966 | \n", "4 | \n", "Automatic | \n", "4x4 | \n", "Четырехдверный | \n", "Left wheel | \n", "White | \n", "0 | \n", "
4 | \n", "11726 | \n", "446 | \n", "HONDA | \n", "FIT | \n", "2014 | \n", "Hatchback | \n", "Yes | \n", "Petrol | \n", "1.3 | \n", "91901 | \n", "4 | \n", "Automatic | \n", "Front | \n", "Четырехдверный | \n", "Left wheel | \n", "Silver | \n", "4 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
12592 | \n", "8781 | \n", "1107 | \n", "OPEL | \n", "Combo | \n", "2007 | \n", "Goods wagon | \n", "No | \n", "Diesel | \n", "1.7 | \n", "236000 | \n", "4 | \n", "Manual | \n", "Front | \n", "Четырехдверный | \n", "Left wheel | \n", "Beige | \n", "4 | \n", "
12593 | \n", "7840 | \n", "0 | \n", "NISSAN | \n", "Skyline | \n", "2003 | \n", "Sedan | \n", "Yes | \n", "Petrol | \n", "3.0 | \n", "220000 | \n", "6 | \n", "Tiptronic | \n", "Rear | \n", "Четырехдверный | \n", "Right-hand drive | \n", "White | \n", "0 | \n", "
12594 | \n", "8467 | \n", "0 | \n", "MERCEDES-BENZ | \n", "CLK 200 | \n", "1999 | \n", "Coupe | \n", "Yes | \n", "CNG | \n", "2.0 | \n", "300000 | \n", "4 | \n", "Manual | \n", "Rear | \n", "Двухдверный | \n", "Left wheel | \n", "Silver | \n", "5 | \n", "
12595 | \n", "15681 | \n", "831 | \n", "HYUNDAI | \n", "Sonata | \n", "2011 | \n", "Sedan | \n", "Yes | \n", "Petrol | \n", "2.4 | \n", "161600 | \n", "4 | \n", "Tiptronic | \n", "Front | \n", "Четырехдверный | \n", "Left wheel | \n", "Red | \n", "8 | \n", "
12596 | \n", "26108 | \n", "836 | \n", "HYUNDAI | \n", "Tucson | \n", "2010 | \n", "Jeep | \n", "Yes | \n", "Diesel | \n", "2.0 | \n", "116365 | \n", "4 | \n", "Automatic | \n", "Front | \n", "Четырехдверный | \n", "Left wheel | \n", "Grey | \n", "4 | \n", "
12597 rows × 17 columns
\n", "\n", " | Levy | \n", "Prod. year | \n", "Engine volume | \n", "Mileage | \n", "Cylinders | \n", "Airbags | \n", "Category_Coupe | \n", "Category_Goods wagon | \n", "Category_Hatchback | \n", "Category_Jeep | \n", "... | \n", "Fuel type_Petrol | \n", "Fuel type_Plug-in Hybrid | \n", "Gear box type_Manual | \n", "Gear box type_Tiptronic | \n", "Gear box type_Variator | \n", "Drive wheels_Front | \n", "Drive wheels_Rear | \n", "Doors_Многодверный | \n", "Doors_Четырехдверный | \n", "Wheel_Right-hand drive | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
10083 | \n", "-1.192982 | \n", "1.946936 | \n", "-0.479341 | \n", "-1.531744 | \n", "-0.403213 | \n", "-0.683755 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "... | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "
9482 | \n", "-1.192982 | \n", "-0.879266 | \n", "-0.887855 | \n", "-0.130245 | \n", "-0.403213 | \n", "-1.190217 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "... | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "1.0 | \n", "
6177 | \n", "0.081576 | \n", "0.642535 | \n", "-0.479341 | \n", "-0.651122 | \n", "-0.403213 | \n", "0.835631 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "... | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "
11756 | \n", "-1.192982 | \n", "-1.531466 | \n", "0.473858 | \n", "1.263152 | \n", "-0.403213 | \n", "-0.430524 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "
6557 | \n", "1.703146 | \n", "1.512135 | \n", "0.473858 | \n", "-0.739330 | \n", "-0.403213 | \n", "-0.683755 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
11964 | \n", "-1.192982 | \n", "-0.879266 | \n", "0.337687 | \n", "0.318018 | \n", "1.538421 | \n", "-0.683755 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "... | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "
5191 | \n", "0.476602 | \n", "0.859935 | \n", "-0.206998 | \n", "-0.011145 | \n", "-0.403213 | \n", "1.342092 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "... | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "
5390 | \n", "0.646834 | \n", "-0.661866 | \n", "-0.887855 | \n", "1.155137 | \n", "-0.403213 | \n", "0.329169 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "
860 | \n", "-1.192982 | \n", "1.077335 | \n", "-0.751684 | \n", "-0.697325 | \n", "-0.403213 | \n", "0.329169 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "... | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "
7270 | \n", "0.446048 | \n", "0.425135 | \n", "0.337687 | \n", "-0.465093 | \n", "7.363324 | \n", "0.329169 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "... | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "
8817 rows × 31 columns
\n", "\n", " | RMSE_train | \n", "RMSE_test | \n", "RMAE_test | \n", "R2_test | \n", "
---|---|---|---|---|
knn | \n", "5777.663053 | \n", "6607.095563 | \n", "67.047388 | \n", "0.632511 | \n", "
random_forest | \n", "6567.406346 | \n", "6852.474190 | \n", "70.119860 | \n", "0.604708 | \n", "
decision_tree | \n", "7022.066577 | \n", "7393.444466 | \n", "72.910390 | \n", "0.539832 | \n", "
linear | \n", "8399.752941 | \n", "8498.166215 | \n", "80.676781 | \n", "0.392042 | \n", "
ridge | \n", "8400.004465 | \n", "8498.452033 | \n", "80.683952 | \n", "0.392001 | \n", "
linear_poly | \n", "6880.451269 | \n", "3235067552304.437988 | \n", "267308.588962 | \n", "-88102783177967152.000000 | \n", "
linear_interact | \n", "7037.525048 | \n", "113842510019087.921875 | \n", "1576050.007127 | \n", "-109101782409976135680.000000 | \n", "