{ "cells": [ { "cell_type": "markdown", "metadata": { "vscode": { "languageId": "plaintext" } }, "source": [ "#### Загрузка набора данных" ] }, { "cell_type": "code", "execution_count": 732, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | Price | \n", "Levy | \n", "Manufacturer | \n", "Model | \n", "Prod. year | \n", "Category | \n", "Leather interior | \n", "Fuel type | \n", "Engine volume | \n", "Mileage | \n", "Cylinders | \n", "Gear box type | \n", "Drive wheels | \n", "Doors | \n", "Wheel | \n", "Color | \n", "Airbags | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "13328 | \n", "1399 | \n", "LEXUS | \n", "RX 450 | \n", "2010 | \n", "Jeep | \n", "Yes | \n", "Hybrid | \n", "3.5 | \n", "186005 km | \n", "6.0 | \n", "Automatic | \n", "4x4 | \n", "04-May | \n", "Left wheel | \n", "Silver | \n", "12 | \n", "
1 | \n", "16621 | \n", "1018 | \n", "CHEVROLET | \n", "Equinox | \n", "2011 | \n", "Jeep | \n", "No | \n", "Petrol | \n", "3 | \n", "192000 km | \n", "6.0 | \n", "Tiptronic | \n", "4x4 | \n", "04-May | \n", "Left wheel | \n", "Black | \n", "8 | \n", "
2 | \n", "8467 | \n", "- | \n", "HONDA | \n", "FIT | \n", "2006 | \n", "Hatchback | \n", "No | \n", "Petrol | \n", "1.3 | \n", "200000 km | \n", "4.0 | \n", "Variator | \n", "Front | \n", "04-May | \n", "Right-hand drive | \n", "Black | \n", "2 | \n", "
3 | \n", "3607 | \n", "862 | \n", "FORD | \n", "Escape | \n", "2011 | \n", "Jeep | \n", "Yes | \n", "Hybrid | \n", "2.5 | \n", "168966 km | \n", "4.0 | \n", "Automatic | \n", "4x4 | \n", "04-May | \n", "Left wheel | \n", "White | \n", "0 | \n", "
4 | \n", "11726 | \n", "446 | \n", "HONDA | \n", "FIT | \n", "2014 | \n", "Hatchback | \n", "Yes | \n", "Petrol | \n", "1.3 | \n", "91901 km | \n", "4.0 | \n", "Automatic | \n", "Front | \n", "04-May | \n", "Left wheel | \n", "Silver | \n", "4 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
19232 | \n", "8467 | \n", "- | \n", "MERCEDES-BENZ | \n", "CLK 200 | \n", "1999 | \n", "Coupe | \n", "Yes | \n", "CNG | \n", "2.0 Turbo | \n", "300000 km | \n", "4.0 | \n", "Manual | \n", "Rear | \n", "02-Mar | \n", "Left wheel | \n", "Silver | \n", "5 | \n", "
19233 | \n", "15681 | \n", "831 | \n", "HYUNDAI | \n", "Sonata | \n", "2011 | \n", "Sedan | \n", "Yes | \n", "Petrol | \n", "2.4 | \n", "161600 km | \n", "4.0 | \n", "Tiptronic | \n", "Front | \n", "04-May | \n", "Left wheel | \n", "Red | \n", "8 | \n", "
19234 | \n", "26108 | \n", "836 | \n", "HYUNDAI | \n", "Tucson | \n", "2010 | \n", "Jeep | \n", "Yes | \n", "Diesel | \n", "2 | \n", "116365 km | \n", "4.0 | \n", "Automatic | \n", "Front | \n", "04-May | \n", "Left wheel | \n", "Grey | \n", "4 | \n", "
19235 | \n", "5331 | \n", "1288 | \n", "CHEVROLET | \n", "Captiva | \n", "2007 | \n", "Jeep | \n", "Yes | \n", "Diesel | \n", "2 | \n", "51258 km | \n", "4.0 | \n", "Automatic | \n", "Front | \n", "04-May | \n", "Left wheel | \n", "Black | \n", "4 | \n", "
19236 | \n", "470 | \n", "753 | \n", "HYUNDAI | \n", "Sonata | \n", "2012 | \n", "Sedan | \n", "Yes | \n", "Hybrid | \n", "2.4 | \n", "186923 km | \n", "4.0 | \n", "Automatic | \n", "Front | \n", "04-May | \n", "Left wheel | \n", "White | \n", "12 | \n", "
19237 rows × 17 columns
\n", "\n", " | Price | \n", "Levy | \n", "Manufacturer | \n", "Model | \n", "Prod. year | \n", "Category | \n", "Leather interior | \n", "Fuel type | \n", "Engine volume | \n", "Mileage | \n", "Cylinders | \n", "Gear box type | \n", "Drive wheels | \n", "Doors | \n", "Wheel | \n", "Color | \n", "Airbags | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "13328 | \n", "1399 | \n", "LEXUS | \n", "RX 450 | \n", "2010 | \n", "Jeep | \n", "Yes | \n", "Hybrid | \n", "3.5 | \n", "186005 | \n", "6 | \n", "Automatic | \n", "4x4 | \n", "Четырехдверный | \n", "Left wheel | \n", "Silver | \n", "12 | \n", "
1 | \n", "16621 | \n", "1018 | \n", "CHEVROLET | \n", "Equinox | \n", "2011 | \n", "Jeep | \n", "No | \n", "Petrol | \n", "3.0 | \n", "192000 | \n", "6 | \n", "Tiptronic | \n", "4x4 | \n", "Четырехдверный | \n", "Left wheel | \n", "Black | \n", "8 | \n", "
2 | \n", "8467 | \n", "0 | \n", "HONDA | \n", "FIT | \n", "2006 | \n", "Hatchback | \n", "No | \n", "Petrol | \n", "1.3 | \n", "200000 | \n", "4 | \n", "Variator | \n", "Front | \n", "Четырехдверный | \n", "Right-hand drive | \n", "Black | \n", "2 | \n", "
3 | \n", "3607 | \n", "862 | \n", "FORD | \n", "Escape | \n", "2011 | \n", "Jeep | \n", "Yes | \n", "Hybrid | \n", "2.5 | \n", "168966 | \n", "4 | \n", "Automatic | \n", "4x4 | \n", "Четырехдверный | \n", "Left wheel | \n", "White | \n", "0 | \n", "
4 | \n", "11726 | \n", "446 | \n", "HONDA | \n", "FIT | \n", "2014 | \n", "Hatchback | \n", "Yes | \n", "Petrol | \n", "1.3 | \n", "91901 | \n", "4 | \n", "Automatic | \n", "Front | \n", "Четырехдверный | \n", "Left wheel | \n", "Silver | \n", "4 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
19231 | \n", "5802 | \n", "1055 | \n", "MERCEDES-BENZ | \n", "E 350 | \n", "2013 | \n", "Sedan | \n", "Yes | \n", "Diesel | \n", "3.5 | \n", "107800 | \n", "6 | \n", "Automatic | \n", "Rear | \n", "Четырехдверный | \n", "Left wheel | \n", "Grey | \n", "12 | \n", "
19232 | \n", "8467 | \n", "0 | \n", "MERCEDES-BENZ | \n", "CLK 200 | \n", "1999 | \n", "Coupe | \n", "Yes | \n", "CNG | \n", "2.0 | \n", "300000 | \n", "4 | \n", "Manual | \n", "Rear | \n", "Двухдверный | \n", "Left wheel | \n", "Silver | \n", "5 | \n", "
19233 | \n", "15681 | \n", "831 | \n", "HYUNDAI | \n", "Sonata | \n", "2011 | \n", "Sedan | \n", "Yes | \n", "Petrol | \n", "2.4 | \n", "161600 | \n", "4 | \n", "Tiptronic | \n", "Front | \n", "Четырехдверный | \n", "Left wheel | \n", "Red | \n", "8 | \n", "
19234 | \n", "26108 | \n", "836 | \n", "HYUNDAI | \n", "Tucson | \n", "2010 | \n", "Jeep | \n", "Yes | \n", "Diesel | \n", "2.0 | \n", "116365 | \n", "4 | \n", "Automatic | \n", "Front | \n", "Четырехдверный | \n", "Left wheel | \n", "Grey | \n", "4 | \n", "
19235 | \n", "5331 | \n", "1288 | \n", "CHEVROLET | \n", "Captiva | \n", "2007 | \n", "Jeep | \n", "Yes | \n", "Diesel | \n", "2.0 | \n", "51258 | \n", "4 | \n", "Automatic | \n", "Front | \n", "Четырехдверный | \n", "Left wheel | \n", "Black | \n", "4 | \n", "
17574 rows × 17 columns
\n", "\n", " | Leather interior_Yes | \n", "Category_Coupe | \n", "Category_Goods wagon | \n", "Category_Hatchback | \n", "Category_Jeep | \n", "Category_Limousine | \n", "Category_Microbus | \n", "Category_Minivan | \n", "Category_Pickup | \n", "Category_Sedan | \n", "... | \n", "Gear box type_Tiptronic | \n", "Gear box type_Variator | \n", "Drive wheels_Front | \n", "Drive wheels_Rear | \n", "Wheel_Right-hand drive | \n", "Price | \n", "Levy | \n", "Prod. year | \n", "Engine volume | \n", "Airbags | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "-0.332733 | \n", "1.851925 | \n", "-0.224219 | \n", "1.849443 | \n", "1.353782 | \n", "
1 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "... | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "-0.029023 | \n", "1.024150 | \n", "-0.007434 | \n", "1.162057 | \n", "0.340316 | \n", "
2 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "... | \n", "0.0 | \n", "1.0 | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "-0.781060 | \n", "-1.187596 | \n", "-1.091356 | \n", "-1.175055 | \n", "-1.179883 | \n", "
3 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "-1.229294 | \n", "0.685218 | \n", "-0.007434 | \n", "0.474671 | \n", "-1.686616 | \n", "
4 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "-0.480485 | \n", "-0.218599 | \n", "0.642919 | \n", "-1.175055 | \n", "-0.673150 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
19225 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "-0.752100 | \n", "1.217515 | \n", "-0.874572 | \n", "-0.625146 | \n", "-0.673150 | \n", "
19226 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "... | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "1.0 | \n", "-0.838888 | \n", "-1.187596 | \n", "-1.741709 | \n", "1.162057 | \n", "-1.686616 | \n", "
19232 | \n", "1.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "-0.781060 | \n", "-1.187596 | \n", "-2.608847 | \n", "-0.212715 | \n", "-0.419784 | \n", "
19233 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "... | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "-0.115718 | \n", "0.617867 | \n", "-0.007434 | \n", "0.337194 | \n", "0.340316 | \n", "
19234 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.845956 | \n", "0.628730 | \n", "-0.224219 | \n", "-0.212715 | \n", "-0.673150 | \n", "
12597 rows × 28 columns
\n", "\n", " | Leather interior_Yes | \n", "Category_Coupe | \n", "Category_Goods wagon | \n", "Category_Hatchback | \n", "Category_Jeep | \n", "Category_Limousine | \n", "Category_Microbus | \n", "Category_Minivan | \n", "Category_Pickup | \n", "Category_Sedan | \n", "... | \n", "Gear box type_Manual | \n", "Gear box type_Tiptronic | \n", "Gear box type_Variator | \n", "Drive wheels_Front | \n", "Drive wheels_Rear | \n", "Wheel_Right-hand drive | \n", "Levy | \n", "Prod. year | \n", "Engine volume | \n", "Airbags | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
15146 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "-1.187596 | \n", "1.943625 | \n", "-0.487669 | \n", "-0.673150 | \n", "
14145 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "... | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "-1.187596 | \n", "-0.874572 | \n", "-0.900100 | \n", "-1.179883 | \n", "
8943 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "... | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.081225 | \n", "0.642919 | \n", "-0.487669 | \n", "0.847049 | \n", "
17889 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "-1.187596 | \n", "-1.524925 | \n", "0.474671 | \n", "-0.419784 | \n", "
9515 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "1.695495 | \n", "1.510056 | \n", "0.474671 | \n", "-0.673150 | \n", "
... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "... | \n", "
18201 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "... | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "-1.187596 | \n", "-0.874572 | \n", "0.337194 | \n", "-0.673150 | \n", "
7436 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.474472 | \n", "0.859703 | \n", "-0.212715 | \n", "1.353782 | \n", "
7728 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.643938 | \n", "-0.657787 | \n", "-0.900100 | \n", "0.340316 | \n", "
1136 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "... | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "-1.187596 | \n", "1.076487 | \n", "-0.762623 | \n", "0.340316 | \n", "
10640 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "1.0 | \n", "... | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "1.0 | \n", "0.0 | \n", "0.0 | \n", "0.444055 | \n", "0.426134 | \n", "0.337194 | \n", "0.340316 | \n", "
8817 rows × 27 columns
\n", "\n", " | RMSE_train | \n", "RMSE_test | \n", "RMAE_test | \n", "R2_test | \n", "
---|---|---|---|---|
knn | \n", "0.536712 | \n", "0.602377 | \n", "0.643601 | \n", "0.640894 | \n", "
random_forest | \n", "0.610511 | \n", "0.634321 | \n", "0.675524 | \n", "0.601798 | \n", "
decision_tree | \n", "0.650704 | \n", "0.683437 | \n", "0.701393 | \n", "0.537743 | \n", "
ridge | \n", "0.779199 | \n", "0.788052 | \n", "0.776391 | \n", "0.385397 | \n", "
linear | \n", "0.779198 | \n", "0.788056 | \n", "0.776379 | \n", "0.385390 | \n", "