{ "cells": [ { "cell_type": "code", "execution_count": 2, "id": "e312113e", "metadata": {}, "outputs": [], "source": [ "# Third-party libraries for data handling and plotting.\n", "import pandas as pd\n", "# `plt` must alias the pyplot submodule: the top-level matplotlib package\n", "# does not expose plot()/subplots()/show().\n", "import matplotlib.pyplot as plt\n", "import seaborn as sns\n", "import numpy as np" ] }, { "cell_type": "markdown", "id": "de2c028d", "metadata": {}, "source": [ "# Загрузка и знакомство с данными" ] }, { "cell_type": "code", "execution_count": 3, "id": "5cd00195", "metadata": {}, "outputs": [], "source": [ "# Dataset source: https://www.kaggle.com/datasets/mrdaniilak/russia-real-estate-20182021/data\n", "\n", "# Load the CSV into a DataFrame; the path is relative to the working directory.\n", "df = pd.read_csv('data/all_v2.csv')\n" ] }, { "cell_type": "code", "execution_count": 5, "id": "05b57100", "metadata": {}, "outputs": [ { "data": { "text/html": [ "
\n", " | price | \n", "date | \n", "time | \n", "geo_lat | \n", "geo_lon | \n", "region | \n", "building_type | \n", "level | \n", "levels | \n", "rooms | \n", "area | \n", "kitchen_area | \n", "object_type | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "6050000 | \n", "2018-02-19 | \n", "20:00:21 | \n", "59.805808 | \n", "30.376141 | \n", "2661 | \n", "1 | \n", "8 | \n", "10 | \n", "3 | \n", "82.6 | \n", "10.8 | \n", "1 | \n", "
1 | \n", "8650000 | \n", "2018-02-27 | \n", "12:04:54 | \n", "55.683807 | \n", "37.297405 | \n", "81 | \n", "3 | \n", "5 | \n", "24 | \n", "2 | \n", "69.1 | \n", "12.0 | \n", "1 | \n", "
2 | \n", "4000000 | \n", "2018-02-28 | \n", "15:44:00 | \n", "56.295250 | \n", "44.061637 | \n", "2871 | \n", "1 | \n", "5 | \n", "9 | \n", "3 | \n", "66.0 | \n", "10.0 | \n", "1 | \n", "
3 | \n", "1850000 | \n", "2018-03-01 | \n", "11:24:52 | \n", "44.996132 | \n", "39.074783 | \n", "2843 | \n", "4 | \n", "12 | \n", "16 | \n", "2 | \n", "38.0 | \n", "5.0 | \n", "11 | \n", "
4 | \n", "5450000 | \n", "2018-03-01 | \n", "17:42:43 | \n", "55.918767 | \n", "37.984642 | \n", "81 | \n", "3 | \n", "13 | \n", "14 | \n", "2 | \n", "60.0 | \n", "10.0 | \n", "1 | \n", "
5 | \n", "3300000 | \n", "2018-03-02 | \n", "21:18:42 | \n", "55.908253 | \n", "37.726448 | \n", "81 | \n", "1 | \n", "4 | \n", "5 | \n", "1 | \n", "32.0 | \n", "6.0 | \n", "1 | \n", "
6 | \n", "4704280 | \n", "2018-03-04 | \n", "12:35:25 | \n", "55.621097 | \n", "37.431002 | \n", "3 | \n", "2 | \n", "1 | \n", "25 | \n", "1 | \n", "31.7 | \n", "6.0 | \n", "11 | \n", "
7 | \n", "3600000 | \n", "2018-03-04 | \n", "20:52:38 | \n", "59.875526 | \n", "30.395457 | \n", "2661 | \n", "1 | \n", "2 | \n", "5 | \n", "1 | \n", "31.1 | \n", "6.0 | \n", "1 | \n", "
8 | \n", "3390000 | \n", "2018-03-05 | \n", "07:07:05 | \n", "53.195031 | \n", "50.106952 | \n", "3106 | \n", "2 | \n", "4 | \n", "24 | \n", "2 | \n", "64.0 | \n", "13.0 | \n", "11 | \n", "
9 | \n", "2800000 | \n", "2018-03-06 | \n", "09:57:10 | \n", "55.736972 | \n", "38.846457 | \n", "81 | \n", "1 | \n", "9 | \n", "10 | \n", "2 | \n", "55.0 | \n", "8.0 | \n", "1 | \n", "