{ "cells": [ { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [ "# Install the third-party packages imported by this notebook (skip if already installed).\n", "# TODO: pin versions once the target environment is fixed.\n", "%pip install lightgbm scikit-learn pandas numpy" ] }, { "cell_type": "code", "execution_count": 1, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "/usr/local/lib/python3.7/site-packages/lightgbm/__init__.py:46: UserWarning: Starting from version 2.2.1, the library file in distribution wheels for macOS is built by the Apple Clang (Xcode_8.3.1) compiler.\n", "This means that in case of installing LightGBM from PyPI via the ``pip install lightgbm`` command, you don't need to install the gcc compiler anymore.\n", "Instead of that, you need to install the OpenMP library, which is required for running LightGBM on the system with the Apple Clang compiler.\n", "You can install the OpenMP library by the following command: ``brew install libomp``.\n", " \"You can install the OpenMP library by the following command: ``brew install libomp``.\", UserWarning)\n" ] } ], "source": [ "import pandas as pd\n", "import numpy as np\n", "# lightgbm swallows the raw data as-is and builds a regression model that shows the important features,\n", "# so that the rest of the lab can be done using only those features.\n", "# If you cannot install it, the important features are listed in cell [8].\n", "import lightgbm\n", "from sklearn.model_selection import train_test_split, GridSearchCV\n", "from sklearn.neighbors import KNeighborsRegressor" ] }, { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | bulk_id | \n", "spalen | \n", "date1 | \n", "start_square | \n", "value | \n", "price | \n", "mean_sq | \n", "mean_fl | \n", "plan_s | \n", "plan_m | \n", "... | \n", "До промки(км) | \n", "До парка(км) | \n", "До парка пешком(км) | \n", "Станций метро от кольца | \n", "Площадь двора | \n", "Курс | \n", "Cтавка по ипотеке | \n", "Вклады до 1 года | \n", "Вклады от 1 года до 3 лет | \n", "Вклады свыше 3 лет | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
id | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
0 | \n", "FF3814A9-9F7D-E711-8530-00505688958B | \n", "1 | \n", "2017-10-01 | \n", "13109.9 | \n", "1124.5 | \n", "135633.913043 | \n", "38.00 | \n", "8 | \n", "147 | \n", "198 | \n", "... | \n", "0.28 | \n", "0.58 | \n", "0.93 | \n", "8 | \n", "7640 | \n", "57.698052 | \n", "10.04 | \n", "5.74 | \n", "5.94 | \n", "6.03 | \n", "
1 | \n", "FF3814A9-9F7D-E711-8530-00505688958B | \n", "2 | \n", "2017-10-01 | \n", "19898.4 | \n", "1412.3 | \n", "128492.419825 | \n", "58.01 | \n", "9 | \n", "139 | \n", "120 | \n", "... | \n", "0.28 | \n", "0.58 | \n", "0.93 | \n", "8 | \n", "7640 | \n", "57.698052 | \n", "10.04 | \n", "5.74 | \n", "5.94 | \n", "6.03 | \n", "
2 | \n", "FF3814A9-9F7D-E711-8530-00505688958B | \n", "0 | \n", "2017-10-01 | \n", "2100.0 | \n", "345.0 | \n", "158237.634409 | \n", "22.58 | \n", "10 | \n", "78 | \n", "15 | \n", "... | \n", "0.28 | \n", "0.58 | \n", "0.93 | \n", "8 | \n", "7640 | \n", "57.698052 | \n", "10.04 | \n", "5.74 | \n", "5.94 | \n", "6.03 | \n", "
3 | \n", "FF3814A9-9F7D-E711-8530-00505688958B | \n", "3 | \n", "2017-10-01 | \n", "9614.9 | \n", "769.4 | \n", "123250.000000 | \n", "78.81 | \n", "8 | \n", "50 | \n", "0 | \n", "... | \n", "0.28 | \n", "0.58 | \n", "0.93 | \n", "8 | \n", "7640 | \n", "57.698052 | \n", "10.04 | \n", "5.74 | \n", "5.94 | \n", "6.03 | \n", "
4 | \n", "FF3814A9-9F7D-E711-8530-00505688958B | \n", "1 | \n", "2017-11-01 | \n", "11947.2 | \n", "526.7 | \n", "139420.634921 | \n", "37.93 | \n", "9 | \n", "140 | \n", "175 | \n", "... | \n", "0.28 | \n", "0.58 | \n", "0.93 | \n", "8 | \n", "7640 | \n", "58.926552 | \n", "9.87 | \n", "5.17 | \n", "7.07 | \n", "6.20 | \n", "
5 rows × 55 columns
\n", "\n", " | bulk_id | \n", "spalen | \n", "date1 | \n", "start_square | \n", "value | \n", "price | \n", "mean_sq | \n", "mean_fl | \n", "plan_s | \n", "plan_m | \n", "... | \n", "До промки(км) | \n", "До парка(км) | \n", "До парка пешком(км) | \n", "Станций метро от кольца | \n", "Площадь двора | \n", "Курс | \n", "Cтавка по ипотеке | \n", "Вклады до 1 года | \n", "Вклады от 1 года до 3 лет | \n", "Вклады свыше 3 лет | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
id | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
0 | \n", "NaN | \n", "1 | \n", "2017-10-01 | \n", "13109.9 | \n", "1124.5 | \n", "135633.913043 | \n", "NaN | \n", "8 | \n", "147 | \n", "198 | \n", "... | \n", "0.28 | \n", "0.58 | \n", "0.93 | \n", "8 | \n", "7640 | \n", "57.698052 | \n", "10.04 | \n", "5.74 | \n", "5.94 | \n", "6.03 | \n", "
1 | \n", "FF3814A9-9F7D-E711-8530-00505688958B | \n", "2 | \n", "2017-10-01 | \n", "19898.4 | \n", "1412.3 | \n", "128492.419825 | \n", "58.01 | \n", "9 | \n", "139 | \n", "120 | \n", "... | \n", "0.28 | \n", "0.58 | \n", "0.93 | \n", "8 | \n", "7640 | \n", "57.698052 | \n", "10.04 | \n", "5.74 | \n", "5.94 | \n", "6.03 | \n", "
2 | \n", "FF3814A9-9F7D-E711-8530-00505688958B | \n", "0 | \n", "2017-10-01 | \n", "2100.0 | \n", "345.0 | \n", "158237.634409 | \n", "22.58 | \n", "10 | \n", "78 | \n", "15 | \n", "... | \n", "0.28 | \n", "0.58 | \n", "0.93 | \n", "8 | \n", "7640 | \n", "57.698052 | \n", "10.04 | \n", "5.74 | \n", "5.94 | \n", "6.03 | \n", "
3 | \n", "FF3814A9-9F7D-E711-8530-00505688958B | \n", "3 | \n", "2017-10-01 | \n", "9614.9 | \n", "769.4 | \n", "123250.000000 | \n", "78.81 | \n", "8 | \n", "50 | \n", "0 | \n", "... | \n", "0.28 | \n", "0.58 | \n", "0.93 | \n", "8 | \n", "7640 | \n", "57.698052 | \n", "10.04 | \n", "5.74 | \n", "5.94 | \n", "6.03 | \n", "
4 | \n", "FF3814A9-9F7D-E711-8530-00505688958B | \n", "1 | \n", "2017-11-01 | \n", "11947.2 | \n", "526.7 | \n", "139420.634921 | \n", "37.93 | \n", "9 | \n", "140 | \n", "175 | \n", "... | \n", "0.28 | \n", "0.58 | \n", "0.93 | \n", "8 | \n", "7640 | \n", "58.926552 | \n", "9.87 | \n", "5.17 | \n", "7.07 | \n", "6.20 | \n", "
5 rows × 55 columns
\n", "