wrongmove/crawler/exploration.ipynb

2005 lines
77 KiB
Text
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"id": "f20bddee-1e7c-4c46-a17a-c7bb6c13f30c",
"metadata": {},
"outputs": [
{
"name": "stderr",
"output_type": "stream",
"text": [
"/Users/kadir/code/realestate/crawler/venv/lib/python3.12/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n",
" from .autonotebook import tqdm as notebook_tqdm\n"
]
}
],
"source": [
"from data_access import Listing\n",
"import pandas as pd"
]
},
{
"cell_type": "code",
"execution_count": 2,
"id": "b1101088-9613-465f-81fd-79801e0202b8",
"metadata": {},
"outputs": [],
"source": [
"# Fetch the listings via the data_access layer (presumably every stored one - confirm).\n",
"ls = Listing.get_all_listings()"
]
},
{
"cell_type": "code",
"execution_count": 3,
"id": "63e61601-7e3f-4d58-89f6-1794e4868cc3",
"metadata": {},
"outputs": [],
"source": [
"# One dict per listing, as produced by Listing.dict_nicely().\n",
"ds = [listing.dict_nicely() for listing in ls]"
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "1c222721-f426-42c0-9ac5-badc1f7a2034",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>sqm_ocr</th>\n",
" <th>price</th>\n",
" <th>price_per_sqm</th>\n",
" <th>url</th>\n",
" <th>bedrooms</th>\n",
" <th>travel_time_fastest</th>\n",
" <th>travel_time_second</th>\n",
" <th>lease_left</th>\n",
" <th>development</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>7.81</td>\n",
" <td>350000.0</td>\n",
" <td>44814.340589</td>\n",
" <td>https://www.rightmove.co.uk/properties/102360773</td>\n",
" <td>1</td>\n",
" <td>{'duration': 2695, 'distance': 6467, 'duration...</td>\n",
" <td>{'duration': 1682, 'distance': 6810, 'duration...</td>\n",
" <td>119.0</td>\n",
" <td>False</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>NaN</td>\n",
" <td>400000.0</td>\n",
" <td>NaN</td>\n",
" <td>https://www.rightmove.co.uk/properties/105836849</td>\n",
" <td>3</td>\n",
" <td>{'duration': 2565, 'distance': 14070, 'duratio...</td>\n",
" <td>{'duration': 2565, 'distance': 14070, 'duratio...</td>\n",
" <td>NaN</td>\n",
" <td>False</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>76.91</td>\n",
" <td>400000.0</td>\n",
" <td>5200.884150</td>\n",
" <td>https://www.rightmove.co.uk/properties/107233214</td>\n",
" <td>3</td>\n",
" <td>{'duration': 1714, 'distance': 9570, 'duration...</td>\n",
" <td>{'duration': 1774, 'distance': 9570, 'duration...</td>\n",
" <td>91.0</td>\n",
" <td>False</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>112.40</td>\n",
" <td>800000.0</td>\n",
" <td>7117.437722</td>\n",
" <td>https://www.rightmove.co.uk/properties/107976896</td>\n",
" <td>3</td>\n",
" <td>{'duration': 1862, 'distance': 8278, 'duration...</td>\n",
" <td>{'duration': 1862, 'distance': 8278, 'duration...</td>\n",
" <td>NaN</td>\n",
" <td>False</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>115.60</td>\n",
" <td>775000.0</td>\n",
" <td>6704.152249</td>\n",
" <td>https://www.rightmove.co.uk/properties/115499441</td>\n",
" <td>3</td>\n",
" <td>{'duration': 2943, 'distance': 7437, 'duration...</td>\n",
" <td>{'duration': 2167, 'distance': 9920, 'duration...</td>\n",
" <td>NaN</td>\n",
" <td>False</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2129</th>\n",
" <td>NaN</td>\n",
" <td>750000.0</td>\n",
" <td>NaN</td>\n",
" <td>https://www.rightmove.co.uk/properties/86813508</td>\n",
" <td>3</td>\n",
" <td>{'duration': 2400, 'distance': 13983, 'duratio...</td>\n",
" <td>{'duration': 2605, 'distance': 14702, 'duratio...</td>\n",
" <td>NaN</td>\n",
" <td>True</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2130</th>\n",
" <td>NaN</td>\n",
" <td>655000.0</td>\n",
" <td>NaN</td>\n",
" <td>https://www.rightmove.co.uk/properties/86813523</td>\n",
" <td>3</td>\n",
" <td>{'duration': 2400, 'distance': 13983, 'duratio...</td>\n",
" <td>{'duration': 2605, 'distance': 14702, 'duratio...</td>\n",
" <td>NaN</td>\n",
" <td>True</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2131</th>\n",
" <td>82.80</td>\n",
" <td>550000.0</td>\n",
" <td>6642.512077</td>\n",
" <td>https://www.rightmove.co.uk/properties/86814669</td>\n",
" <td>3</td>\n",
" <td>{'duration': 2310, 'distance': 12972, 'duratio...</td>\n",
" <td>{'duration': 2322, 'distance': 12104, 'duratio...</td>\n",
" <td>0.0</td>\n",
" <td>False</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2132</th>\n",
" <td>5.52</td>\n",
" <td>300000.0</td>\n",
" <td>54347.826087</td>\n",
" <td>https://www.rightmove.co.uk/properties/86955958</td>\n",
" <td>3</td>\n",
" <td>{'duration': 2332, 'distance': 6898, 'duration...</td>\n",
" <td>{'duration': 2248, 'distance': 6893, 'duration...</td>\n",
" <td>105.0</td>\n",
" <td>False</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2133</th>\n",
" <td>81.60</td>\n",
" <td>790000.0</td>\n",
" <td>9681.372549</td>\n",
" <td>https://www.rightmove.co.uk/properties/86972726</td>\n",
" <td>2</td>\n",
" <td>{'duration': 1393, 'distance': 6390, 'duration...</td>\n",
" <td>{'duration': 2733, 'distance': 6490, 'duration...</td>\n",
" <td>993.0</td>\n",
" <td>False</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>2134 rows × 9 columns</p>\n",
"</div>"
],
"text/plain": [
" sqm_ocr price price_per_sqm \\\n",
"0 7.81 350000.0 44814.340589 \n",
"1 NaN 400000.0 NaN \n",
"2 76.91 400000.0 5200.884150 \n",
"3 112.40 800000.0 7117.437722 \n",
"4 115.60 775000.0 6704.152249 \n",
"... ... ... ... \n",
"2129 NaN 750000.0 NaN \n",
"2130 NaN 655000.0 NaN \n",
"2131 82.80 550000.0 6642.512077 \n",
"2132 5.52 300000.0 54347.826087 \n",
"2133 81.60 790000.0 9681.372549 \n",
"\n",
" url bedrooms \\\n",
"0 https://www.rightmove.co.uk/properties/102360773 1 \n",
"1 https://www.rightmove.co.uk/properties/105836849 3 \n",
"2 https://www.rightmove.co.uk/properties/107233214 3 \n",
"3 https://www.rightmove.co.uk/properties/107976896 3 \n",
"4 https://www.rightmove.co.uk/properties/115499441 3 \n",
"... ... ... \n",
"2129 https://www.rightmove.co.uk/properties/86813508 3 \n",
"2130 https://www.rightmove.co.uk/properties/86813523 3 \n",
"2131 https://www.rightmove.co.uk/properties/86814669 3 \n",
"2132 https://www.rightmove.co.uk/properties/86955958 3 \n",
"2133 https://www.rightmove.co.uk/properties/86972726 2 \n",
"\n",
" travel_time_fastest \\\n",
"0 {'duration': 2695, 'distance': 6467, 'duration... \n",
"1 {'duration': 2565, 'distance': 14070, 'duratio... \n",
"2 {'duration': 1714, 'distance': 9570, 'duration... \n",
"3 {'duration': 1862, 'distance': 8278, 'duration... \n",
"4 {'duration': 2943, 'distance': 7437, 'duration... \n",
"... ... \n",
"2129 {'duration': 2400, 'distance': 13983, 'duratio... \n",
"2130 {'duration': 2400, 'distance': 13983, 'duratio... \n",
"2131 {'duration': 2310, 'distance': 12972, 'duratio... \n",
"2132 {'duration': 2332, 'distance': 6898, 'duration... \n",
"2133 {'duration': 1393, 'distance': 6390, 'duration... \n",
"\n",
" travel_time_second lease_left \\\n",
"0 {'duration': 1682, 'distance': 6810, 'duration... 119.0 \n",
"1 {'duration': 2565, 'distance': 14070, 'duratio... NaN \n",
"2 {'duration': 1774, 'distance': 9570, 'duration... 91.0 \n",
"3 {'duration': 1862, 'distance': 8278, 'duration... NaN \n",
"4 {'duration': 2167, 'distance': 9920, 'duration... NaN \n",
"... ... ... \n",
"2129 {'duration': 2605, 'distance': 14702, 'duratio... NaN \n",
"2130 {'duration': 2605, 'distance': 14702, 'duratio... NaN \n",
"2131 {'duration': 2322, 'distance': 12104, 'duratio... 0.0 \n",
"2132 {'duration': 2248, 'distance': 6893, 'duration... 105.0 \n",
"2133 {'duration': 2733, 'distance': 6490, 'duration... 993.0 \n",
"\n",
" development \n",
"0 False \n",
"1 False \n",
"2 False \n",
"3 False \n",
"4 False \n",
"... ... \n",
"2129 True \n",
"2130 True \n",
"2131 False \n",
"2132 False \n",
"2133 False \n",
"\n",
"[2134 rows x 9 columns]"
]
},
"execution_count": 4,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Build the working frame: one row per listing dict, columns taken from the dict keys.\n",
"df = pd.DataFrame(data=ds)\n",
"df"
]
},
{
"cell_type": "code",
"execution_count": 14,
"id": "387c48d9-26c6-4bed-8201-352735c06acb",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"0 1682.0\n",
"1 2565.0\n",
"2 1714.0\n",
"3 1862.0\n",
"4 2167.0\n",
" ... \n",
"2129 2400.0\n",
"2130 2400.0\n",
"2131 2310.0\n",
"2132 2248.0\n",
"2133 1393.0\n",
"Length: 2134, dtype: float64"
]
},
"execution_count": 14,
"metadata": {},
"output_type": "execute_result"
}
],
"source": []
},
{
"cell_type": "code",
"execution_count": 19,
"id": "7b37ad6b-9b0a-444e-b8c3-6fe4e43e42cb",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>sqm_ocr</th>\n",
" <th>price</th>\n",
" <th>price_per_sqm</th>\n",
" <th>url</th>\n",
" <th>bedrooms</th>\n",
" <th>lease_left</th>\n",
" <th>development</th>\n",
" <th>a_duration</th>\n",
" <th>a_duration_per_transit</th>\n",
" <th>a_number_of_transit_stops</th>\n",
" <th>b_duration</th>\n",
" <th>b_duration_per_transit</th>\n",
" <th>b_number_of_transit_stops</th>\n",
" <th>min_duration</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>7.81</td>\n",
" <td>350000.0</td>\n",
" <td>44814.340589</td>\n",
" <td>https://www.rightmove.co.uk/properties/102360773</td>\n",
" <td>1</td>\n",
" <td>119.0</td>\n",
" <td>False</td>\n",
" <td>2695</td>\n",
" <td>{'WALK': 414, 'TRANSIT': 2280}</td>\n",
" <td>1</td>\n",
" <td>1682.0</td>\n",
" <td>{'WALK': 608, 'TRANSIT': 804}</td>\n",
" <td>2.0</td>\n",
" <td>28.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>NaN</td>\n",
" <td>400000.0</td>\n",
" <td>NaN</td>\n",
" <td>https://www.rightmove.co.uk/properties/105836849</td>\n",
" <td>3</td>\n",
" <td>NaN</td>\n",
" <td>False</td>\n",
" <td>2565</td>\n",
" <td>{'WALK': 750, 'TRANSIT': 1800}</td>\n",
" <td>1</td>\n",
" <td>2565.0</td>\n",
" <td>{'WALK': 750, 'TRANSIT': 1800}</td>\n",
" <td>1.0</td>\n",
" <td>43.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>76.91</td>\n",
" <td>400000.0</td>\n",
" <td>5200.884150</td>\n",
" <td>https://www.rightmove.co.uk/properties/107233214</td>\n",
" <td>3</td>\n",
" <td>91.0</td>\n",
" <td>False</td>\n",
" <td>1714</td>\n",
" <td>{'WALK': 903, 'TRANSIT': 780}</td>\n",
" <td>1</td>\n",
" <td>1774.0</td>\n",
" <td>{'WALK': 903, 'TRANSIT': 840}</td>\n",
" <td>1.0</td>\n",
" <td>29.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>112.40</td>\n",
" <td>800000.0</td>\n",
" <td>7117.437722</td>\n",
" <td>https://www.rightmove.co.uk/properties/107976896</td>\n",
" <td>3</td>\n",
" <td>NaN</td>\n",
" <td>False</td>\n",
" <td>1862</td>\n",
" <td>{'WALK': 635, 'TRANSIT': 900}</td>\n",
" <td>2</td>\n",
" <td>1862.0</td>\n",
" <td>{'WALK': 635, 'TRANSIT': 960}</td>\n",
" <td>2.0</td>\n",
" <td>31.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>115.60</td>\n",
" <td>775000.0</td>\n",
" <td>6704.152249</td>\n",
" <td>https://www.rightmove.co.uk/properties/115499441</td>\n",
" <td>3</td>\n",
" <td>NaN</td>\n",
" <td>False</td>\n",
" <td>2943</td>\n",
" <td>{'WALK': 242, 'TRANSIT': 2700}</td>\n",
" <td>1</td>\n",
" <td>2167.0</td>\n",
" <td>{'WALK': 658, 'TRANSIT': 1200}</td>\n",
" <td>2.0</td>\n",
" <td>36.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2129</th>\n",
" <td>NaN</td>\n",
" <td>750000.0</td>\n",
" <td>NaN</td>\n",
" <td>https://www.rightmove.co.uk/properties/86813508</td>\n",
" <td>3</td>\n",
" <td>NaN</td>\n",
" <td>True</td>\n",
" <td>2400</td>\n",
" <td>{'WALK': 603, 'TRANSIT': 1524}</td>\n",
" <td>2</td>\n",
" <td>2605.0</td>\n",
" <td>{'WALK': 1467, 'TRANSIT': 1132}</td>\n",
" <td>1.0</td>\n",
" <td>40.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2130</th>\n",
" <td>NaN</td>\n",
" <td>655000.0</td>\n",
" <td>NaN</td>\n",
" <td>https://www.rightmove.co.uk/properties/86813523</td>\n",
" <td>3</td>\n",
" <td>NaN</td>\n",
" <td>True</td>\n",
" <td>2400</td>\n",
" <td>{'WALK': 603, 'TRANSIT': 1524}</td>\n",
" <td>2</td>\n",
" <td>2605.0</td>\n",
" <td>{'WALK': 1467, 'TRANSIT': 1132}</td>\n",
" <td>1.0</td>\n",
" <td>40.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2131</th>\n",
" <td>82.80</td>\n",
" <td>550000.0</td>\n",
" <td>6642.512077</td>\n",
" <td>https://www.rightmove.co.uk/properties/86814669</td>\n",
" <td>3</td>\n",
" <td>0.0</td>\n",
" <td>False</td>\n",
" <td>2310</td>\n",
" <td>{'WALK': 786, 'TRANSIT': 1277}</td>\n",
" <td>2</td>\n",
" <td>2322.0</td>\n",
" <td>{'WALK': 991, 'TRANSIT': 1080}</td>\n",
" <td>2.0</td>\n",
" <td>38.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2132</th>\n",
" <td>5.52</td>\n",
" <td>300000.0</td>\n",
" <td>54347.826087</td>\n",
" <td>https://www.rightmove.co.uk/properties/86955958</td>\n",
" <td>3</td>\n",
" <td>105.0</td>\n",
" <td>False</td>\n",
" <td>2332</td>\n",
" <td>{'WALK': 1671, 'TRANSIT': 660}</td>\n",
" <td>1</td>\n",
" <td>2248.0</td>\n",
" <td>{'WALK': 1671, 'TRANSIT': 576}</td>\n",
" <td>1.0</td>\n",
" <td>37.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2133</th>\n",
" <td>81.60</td>\n",
" <td>790000.0</td>\n",
" <td>9681.372549</td>\n",
" <td>https://www.rightmove.co.uk/properties/86972726</td>\n",
" <td>2</td>\n",
" <td>993.0</td>\n",
" <td>False</td>\n",
" <td>1393</td>\n",
" <td>{'WALK': 518, 'TRANSIT': 564}</td>\n",
" <td>2</td>\n",
" <td>2733.0</td>\n",
" <td>{'WALK': 451, 'TRANSIT': 2280}</td>\n",
" <td>1.0</td>\n",
" <td>23.0</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>2134 rows × 14 columns</p>\n",
"</div>"
],
"text/plain": [
" sqm_ocr price price_per_sqm \\\n",
"0 7.81 350000.0 44814.340589 \n",
"1 NaN 400000.0 NaN \n",
"2 76.91 400000.0 5200.884150 \n",
"3 112.40 800000.0 7117.437722 \n",
"4 115.60 775000.0 6704.152249 \n",
"... ... ... ... \n",
"2129 NaN 750000.0 NaN \n",
"2130 NaN 655000.0 NaN \n",
"2131 82.80 550000.0 6642.512077 \n",
"2132 5.52 300000.0 54347.826087 \n",
"2133 81.60 790000.0 9681.372549 \n",
"\n",
" url bedrooms lease_left \\\n",
"0 https://www.rightmove.co.uk/properties/102360773 1 119.0 \n",
"1 https://www.rightmove.co.uk/properties/105836849 3 NaN \n",
"2 https://www.rightmove.co.uk/properties/107233214 3 91.0 \n",
"3 https://www.rightmove.co.uk/properties/107976896 3 NaN \n",
"4 https://www.rightmove.co.uk/properties/115499441 3 NaN \n",
"... ... ... ... \n",
"2129 https://www.rightmove.co.uk/properties/86813508 3 NaN \n",
"2130 https://www.rightmove.co.uk/properties/86813523 3 NaN \n",
"2131 https://www.rightmove.co.uk/properties/86814669 3 0.0 \n",
"2132 https://www.rightmove.co.uk/properties/86955958 3 105.0 \n",
"2133 https://www.rightmove.co.uk/properties/86972726 2 993.0 \n",
"\n",
" development a_duration a_duration_per_transit \\\n",
"0 False 2695 {'WALK': 414, 'TRANSIT': 2280} \n",
"1 False 2565 {'WALK': 750, 'TRANSIT': 1800} \n",
"2 False 1714 {'WALK': 903, 'TRANSIT': 780} \n",
"3 False 1862 {'WALK': 635, 'TRANSIT': 900} \n",
"4 False 2943 {'WALK': 242, 'TRANSIT': 2700} \n",
"... ... ... ... \n",
"2129 True 2400 {'WALK': 603, 'TRANSIT': 1524} \n",
"2130 True 2400 {'WALK': 603, 'TRANSIT': 1524} \n",
"2131 False 2310 {'WALK': 786, 'TRANSIT': 1277} \n",
"2132 False 2332 {'WALK': 1671, 'TRANSIT': 660} \n",
"2133 False 1393 {'WALK': 518, 'TRANSIT': 564} \n",
"\n",
" a_number_of_transit_stops b_duration b_duration_per_transit \\\n",
"0 1 1682.0 {'WALK': 608, 'TRANSIT': 804} \n",
"1 1 2565.0 {'WALK': 750, 'TRANSIT': 1800} \n",
"2 1 1774.0 {'WALK': 903, 'TRANSIT': 840} \n",
"3 2 1862.0 {'WALK': 635, 'TRANSIT': 960} \n",
"4 1 2167.0 {'WALK': 658, 'TRANSIT': 1200} \n",
"... ... ... ... \n",
"2129 2 2605.0 {'WALK': 1467, 'TRANSIT': 1132} \n",
"2130 2 2605.0 {'WALK': 1467, 'TRANSIT': 1132} \n",
"2131 2 2322.0 {'WALK': 991, 'TRANSIT': 1080} \n",
"2132 1 2248.0 {'WALK': 1671, 'TRANSIT': 576} \n",
"2133 2 2733.0 {'WALK': 451, 'TRANSIT': 2280} \n",
"\n",
" b_number_of_transit_stops min_duration \n",
"0 2.0 28.0 \n",
"1 1.0 43.0 \n",
"2 1.0 29.0 \n",
"3 2.0 31.0 \n",
"4 2.0 36.0 \n",
"... ... ... \n",
"2129 1.0 40.0 \n",
"2130 1.0 40.0 \n",
"2131 2.0 38.0 \n",
"2132 1.0 37.0 \n",
"2133 1.0 23.0 \n",
"\n",
"[2134 rows x 14 columns]"
]
},
"execution_count": 19,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"dropcolumns = ['distance_per_transit', 'duration_static', 'distance']\n",
"\n",
"\n",
"def _expand_travel_time(frame, column, prefix, unwanted):\n",
"    \"\"\"Turn the dicts stored in frame[column] into one prefixed column per key.\n",
"\n",
"    Args:\n",
"        frame: DataFrame holding the dict-valued column.\n",
"        column: Name of the dict-valued column to expand.\n",
"        prefix: String prepended to every resulting column name.\n",
"        unwanted: Dict keys to discard after expansion.\n",
"\n",
"    Returns:\n",
"        A DataFrame aligned on frame's index with the prefixed columns.\n",
"    \"\"\"\n",
"    expanded = frame[column].apply(pd.Series).drop(unwanted, axis=1)\n",
"    return expanded.add_prefix(prefix)\n",
"\n",
"\n",
"# NOTE: reads the dict columns straight from `df`, so this cell has to run\n",
"# before anything that removes travel_time_fastest / travel_time_second from it.\n",
"s1 = _expand_travel_time(df, 'travel_time_fastest', 'a_', dropcolumns)\n",
"s2 = _expand_travel_time(df, 'travel_time_second', 'b_', dropcolumns)\n",
"\n",
"df2 = pd.concat([df.drop(['travel_time_fastest', 'travel_time_second'], axis=1), s1, s2], axis=1)\n",
"# Smaller of the two route durations per row; / 60 presumably converts seconds to minutes.\n",
"df2['min_duration'] = (df2[['a_duration', 'b_duration']].min(axis=1) / 60).round()\n",
"df2"
]
},
{
"cell_type": "code",
"execution_count": 21,
"id": "8c75aaa6-6113-482f-809b-11e405510184",
"metadata": {},
"outputs": [],
"source": [
"# Copy df2 to the system clipboard in the spreadsheet-friendly format (pandas' default).\n",
"df2.to_clipboard(excel=True)"
]
},
{
"cell_type": "code",
"execution_count": 12,
"id": "79f99692-91e8-4915-9b57-7b3a1efd7d3a",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>sqm_ocr</th>\n",
" <th>price</th>\n",
" <th>price_per_sqm</th>\n",
" <th>url</th>\n",
" <th>bedrooms</th>\n",
" <th>duration</th>\n",
" <th>distance</th>\n",
" <th>duration_static</th>\n",
" <th>duration_per_transit</th>\n",
" <th>distance_per_transit</th>\n",
" <th>number_of_transit_stops</th>\n",
" <th>duration</th>\n",
" <th>distance</th>\n",
" <th>duration_static</th>\n",
" <th>duration_per_transit</th>\n",
" <th>distance_per_transit</th>\n",
" <th>number_of_transit_stops</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>7.81</td>\n",
" <td>350000.0</td>\n",
" <td>44814.340589</td>\n",
" <td>https://www.rightmove.co.uk/properties/102360773</td>\n",
" <td>1</td>\n",
" <td>2695</td>\n",
" <td>6467</td>\n",
" <td>2695</td>\n",
" <td>{'WALK': 414, 'TRANSIT': 2280}</td>\n",
" <td>{'WALK': 465, 'TRANSIT': 6002}</td>\n",
" <td>1</td>\n",
" <td>1682.0</td>\n",
" <td>6810.0</td>\n",
" <td>1682.0</td>\n",
" <td>{'WALK': 608, 'TRANSIT': 804}</td>\n",
" <td>{'WALK': 582, 'TRANSIT': 6228}</td>\n",
" <td>2.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>NaN</td>\n",
" <td>400000.0</td>\n",
" <td>NaN</td>\n",
" <td>https://www.rightmove.co.uk/properties/105836849</td>\n",
" <td>3</td>\n",
" <td>2565</td>\n",
" <td>14070</td>\n",
" <td>2565</td>\n",
" <td>{'WALK': 750, 'TRANSIT': 1800}</td>\n",
" <td>{'WALK': 856, 'TRANSIT': 13214}</td>\n",
" <td>1</td>\n",
" <td>2565.0</td>\n",
" <td>14070.0</td>\n",
" <td>2565.0</td>\n",
" <td>{'WALK': 750, 'TRANSIT': 1800}</td>\n",
" <td>{'WALK': 856, 'TRANSIT': 13214}</td>\n",
" <td>1.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>76.91</td>\n",
" <td>400000.0</td>\n",
" <td>5200.884150</td>\n",
" <td>https://www.rightmove.co.uk/properties/107233214</td>\n",
" <td>3</td>\n",
" <td>1714</td>\n",
" <td>9570</td>\n",
" <td>1714</td>\n",
" <td>{'WALK': 903, 'TRANSIT': 780}</td>\n",
" <td>{'WALK': 1035, 'TRANSIT': 8535}</td>\n",
" <td>1</td>\n",
" <td>1774.0</td>\n",
" <td>9570.0</td>\n",
" <td>1774.0</td>\n",
" <td>{'WALK': 903, 'TRANSIT': 840}</td>\n",
" <td>{'WALK': 1035, 'TRANSIT': 8535}</td>\n",
" <td>1.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>112.40</td>\n",
" <td>800000.0</td>\n",
" <td>7117.437722</td>\n",
" <td>https://www.rightmove.co.uk/properties/107976896</td>\n",
" <td>3</td>\n",
" <td>1862</td>\n",
" <td>8278</td>\n",
" <td>1862</td>\n",
" <td>{'WALK': 635, 'TRANSIT': 900}</td>\n",
" <td>{'WALK': 710, 'TRANSIT': 7568}</td>\n",
" <td>2</td>\n",
" <td>1862.0</td>\n",
" <td>8278.0</td>\n",
" <td>1862.0</td>\n",
" <td>{'WALK': 635, 'TRANSIT': 960}</td>\n",
" <td>{'WALK': 710, 'TRANSIT': 7568}</td>\n",
" <td>2.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>115.60</td>\n",
" <td>775000.0</td>\n",
" <td>6704.152249</td>\n",
" <td>https://www.rightmove.co.uk/properties/115499441</td>\n",
" <td>3</td>\n",
" <td>2943</td>\n",
" <td>7437</td>\n",
" <td>2943</td>\n",
" <td>{'WALK': 242, 'TRANSIT': 2700}</td>\n",
" <td>{'WALK': 276, 'TRANSIT': 7161}</td>\n",
" <td>1</td>\n",
" <td>2167.0</td>\n",
" <td>9920.0</td>\n",
" <td>2167.0</td>\n",
" <td>{'WALK': 658, 'TRANSIT': 1200}</td>\n",
" <td>{'WALK': 720, 'TRANSIT': 9200}</td>\n",
" <td>2.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2046</th>\n",
" <td>NaN</td>\n",
" <td>750000.0</td>\n",
" <td>NaN</td>\n",
" <td>https://www.rightmove.co.uk/properties/86813508</td>\n",
" <td>3</td>\n",
" <td>2400</td>\n",
" <td>13983</td>\n",
" <td>2400</td>\n",
" <td>{'WALK': 603, 'TRANSIT': 1524}</td>\n",
" <td>{'WALK': 671, 'TRANSIT': 13312}</td>\n",
" <td>2</td>\n",
" <td>2605.0</td>\n",
" <td>14702.0</td>\n",
" <td>2605.0</td>\n",
" <td>{'WALK': 1467, 'TRANSIT': 1132}</td>\n",
" <td>{'WALK': 1698, 'TRANSIT': 13004}</td>\n",
" <td>1.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2047</th>\n",
" <td>NaN</td>\n",
" <td>655000.0</td>\n",
" <td>NaN</td>\n",
" <td>https://www.rightmove.co.uk/properties/86813523</td>\n",
" <td>3</td>\n",
" <td>2400</td>\n",
" <td>13983</td>\n",
" <td>2400</td>\n",
" <td>{'WALK': 603, 'TRANSIT': 1524}</td>\n",
" <td>{'WALK': 671, 'TRANSIT': 13312}</td>\n",
" <td>2</td>\n",
" <td>2605.0</td>\n",
" <td>14702.0</td>\n",
" <td>2605.0</td>\n",
" <td>{'WALK': 1467, 'TRANSIT': 1132}</td>\n",
" <td>{'WALK': 1698, 'TRANSIT': 13004}</td>\n",
" <td>1.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2048</th>\n",
" <td>82.80</td>\n",
" <td>550000.0</td>\n",
" <td>6642.512077</td>\n",
" <td>https://www.rightmove.co.uk/properties/86814669</td>\n",
" <td>3</td>\n",
" <td>2310</td>\n",
" <td>12972</td>\n",
" <td>2310</td>\n",
" <td>{'WALK': 786, 'TRANSIT': 1277}</td>\n",
" <td>{'WALK': 885, 'TRANSIT': 12087}</td>\n",
" <td>2</td>\n",
" <td>2322.0</td>\n",
" <td>12104.0</td>\n",
" <td>2322.0</td>\n",
" <td>{'WALK': 991, 'TRANSIT': 1080}</td>\n",
" <td>{'WALK': 1089, 'TRANSIT': 11015}</td>\n",
" <td>2.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2049</th>\n",
" <td>5.52</td>\n",
" <td>300000.0</td>\n",
" <td>54347.826087</td>\n",
" <td>https://www.rightmove.co.uk/properties/86955958</td>\n",
" <td>3</td>\n",
" <td>2332</td>\n",
" <td>6898</td>\n",
" <td>2332</td>\n",
" <td>{'WALK': 1671, 'TRANSIT': 660}</td>\n",
" <td>{'WALK': 1945, 'TRANSIT': 4953}</td>\n",
" <td>1</td>\n",
" <td>2248.0</td>\n",
" <td>6893.0</td>\n",
" <td>2248.0</td>\n",
" <td>{'WALK': 1671, 'TRANSIT': 576}</td>\n",
" <td>{'WALK': 1945, 'TRANSIT': 4948}</td>\n",
" <td>1.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2050</th>\n",
" <td>81.60</td>\n",
" <td>790000.0</td>\n",
" <td>9681.372549</td>\n",
" <td>https://www.rightmove.co.uk/properties/86972726</td>\n",
" <td>2</td>\n",
" <td>1393</td>\n",
" <td>6390</td>\n",
" <td>1393</td>\n",
" <td>{'WALK': 518, 'TRANSIT': 564}</td>\n",
" <td>{'WALK': 441, 'TRANSIT': 5949}</td>\n",
" <td>2</td>\n",
" <td>2733.0</td>\n",
" <td>6490.0</td>\n",
" <td>2733.0</td>\n",
" <td>{'WALK': 451, 'TRANSIT': 2280}</td>\n",
" <td>{'WALK': 488, 'TRANSIT': 6002}</td>\n",
" <td>1.0</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>2051 rows × 17 columns</p>\n",
"</div>"
],
"text/plain": [
" sqm_ocr price price_per_sqm \\\n",
"0 7.81 350000.0 44814.340589 \n",
"1 NaN 400000.0 NaN \n",
"2 76.91 400000.0 5200.884150 \n",
"3 112.40 800000.0 7117.437722 \n",
"4 115.60 775000.0 6704.152249 \n",
"... ... ... ... \n",
"2046 NaN 750000.0 NaN \n",
"2047 NaN 655000.0 NaN \n",
"2048 82.80 550000.0 6642.512077 \n",
"2049 5.52 300000.0 54347.826087 \n",
"2050 81.60 790000.0 9681.372549 \n",
"\n",
" url bedrooms duration \\\n",
"0 https://www.rightmove.co.uk/properties/102360773 1 2695 \n",
"1 https://www.rightmove.co.uk/properties/105836849 3 2565 \n",
"2 https://www.rightmove.co.uk/properties/107233214 3 1714 \n",
"3 https://www.rightmove.co.uk/properties/107976896 3 1862 \n",
"4 https://www.rightmove.co.uk/properties/115499441 3 2943 \n",
"... ... ... ... \n",
"2046 https://www.rightmove.co.uk/properties/86813508 3 2400 \n",
"2047 https://www.rightmove.co.uk/properties/86813523 3 2400 \n",
"2048 https://www.rightmove.co.uk/properties/86814669 3 2310 \n",
"2049 https://www.rightmove.co.uk/properties/86955958 3 2332 \n",
"2050 https://www.rightmove.co.uk/properties/86972726 2 1393 \n",
"\n",
" distance duration_static duration_per_transit \\\n",
"0 6467 2695 {'WALK': 414, 'TRANSIT': 2280} \n",
"1 14070 2565 {'WALK': 750, 'TRANSIT': 1800} \n",
"2 9570 1714 {'WALK': 903, 'TRANSIT': 780} \n",
"3 8278 1862 {'WALK': 635, 'TRANSIT': 900} \n",
"4 7437 2943 {'WALK': 242, 'TRANSIT': 2700} \n",
"... ... ... ... \n",
"2046 13983 2400 {'WALK': 603, 'TRANSIT': 1524} \n",
"2047 13983 2400 {'WALK': 603, 'TRANSIT': 1524} \n",
"2048 12972 2310 {'WALK': 786, 'TRANSIT': 1277} \n",
"2049 6898 2332 {'WALK': 1671, 'TRANSIT': 660} \n",
"2050 6390 1393 {'WALK': 518, 'TRANSIT': 564} \n",
"\n",
" distance_per_transit number_of_transit_stops duration \\\n",
"0 {'WALK': 465, 'TRANSIT': 6002} 1 1682.0 \n",
"1 {'WALK': 856, 'TRANSIT': 13214} 1 2565.0 \n",
"2 {'WALK': 1035, 'TRANSIT': 8535} 1 1774.0 \n",
"3 {'WALK': 710, 'TRANSIT': 7568} 2 1862.0 \n",
"4 {'WALK': 276, 'TRANSIT': 7161} 1 2167.0 \n",
"... ... ... ... \n",
"2046 {'WALK': 671, 'TRANSIT': 13312} 2 2605.0 \n",
"2047 {'WALK': 671, 'TRANSIT': 13312} 2 2605.0 \n",
"2048 {'WALK': 885, 'TRANSIT': 12087} 2 2322.0 \n",
"2049 {'WALK': 1945, 'TRANSIT': 4953} 1 2248.0 \n",
"2050 {'WALK': 441, 'TRANSIT': 5949} 2 2733.0 \n",
"\n",
" distance duration_static duration_per_transit \\\n",
"0 6810.0 1682.0 {'WALK': 608, 'TRANSIT': 804} \n",
"1 14070.0 2565.0 {'WALK': 750, 'TRANSIT': 1800} \n",
"2 9570.0 1774.0 {'WALK': 903, 'TRANSIT': 840} \n",
"3 8278.0 1862.0 {'WALK': 635, 'TRANSIT': 960} \n",
"4 9920.0 2167.0 {'WALK': 658, 'TRANSIT': 1200} \n",
"... ... ... ... \n",
"2046 14702.0 2605.0 {'WALK': 1467, 'TRANSIT': 1132} \n",
"2047 14702.0 2605.0 {'WALK': 1467, 'TRANSIT': 1132} \n",
"2048 12104.0 2322.0 {'WALK': 991, 'TRANSIT': 1080} \n",
"2049 6893.0 2248.0 {'WALK': 1671, 'TRANSIT': 576} \n",
"2050 6490.0 2733.0 {'WALK': 451, 'TRANSIT': 2280} \n",
"\n",
" distance_per_transit number_of_transit_stops \n",
"0 {'WALK': 582, 'TRANSIT': 6228} 2.0 \n",
"1 {'WALK': 856, 'TRANSIT': 13214} 1.0 \n",
"2 {'WALK': 1035, 'TRANSIT': 8535} 1.0 \n",
"3 {'WALK': 710, 'TRANSIT': 7568} 2.0 \n",
"4 {'WALK': 720, 'TRANSIT': 9200} 2.0 \n",
"... ... ... \n",
"2046 {'WALK': 1698, 'TRANSIT': 13004} 1.0 \n",
"2047 {'WALK': 1698, 'TRANSIT': 13004} 1.0 \n",
"2048 {'WALK': 1089, 'TRANSIT': 11015} 2.0 \n",
"2049 {'WALK': 1945, 'TRANSIT': 4948} 1.0 \n",
"2050 {'WALK': 488, 'TRANSIT': 6002} 1.0 \n",
"\n",
"[2051 rows x 17 columns]"
]
},
"execution_count": 12,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Replace each travel-time dict column on `df` with one column per dict key.\n",
"# The membership check keeps the cell re-runnable: once a column has been\n",
"# expanded it no longer exists on `df`, and an unguarded second run raises KeyError.\n",
"# NOTE(review): both dicts expand to the same key names, so `df` ends up with\n",
"# duplicate column labels (duration, distance, ...) - consider prefixing them.\n",
"for travel_col in ['travel_time_fastest', 'travel_time_second']:\n",
"    if travel_col in df.columns:\n",
"        df = pd.concat([df.drop([travel_col], axis=1), df[travel_col].apply(pd.Series)], axis=1)\n",
"df"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "abcbde40-7432-4449-957a-79ce2ca126eb",
"metadata": {},
"outputs": [],
"source": [
"\n"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "99c5b304-3d13-466b-a9f5-83a5db6311b5",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>sqm_ocr</th>\n",
" <th>price</th>\n",
" <th>price_per_sqm</th>\n",
" <th>url</th>\n",
" <th>bedrooms</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>953</th>\n",
" <td>74142.40</td>\n",
" <td>550000.0</td>\n",
" <td>7.418157</td>\n",
" <td>https://www.rightmove.co.uk/properties/145546538</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>249</th>\n",
" <td>21850.10</td>\n",
" <td>725000.0</td>\n",
" <td>33.180626</td>\n",
" <td>https://www.rightmove.co.uk/properties/140821736</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>177</th>\n",
" <td>137.50</td>\n",
" <td>695000.0</td>\n",
" <td>5054.545455</td>\n",
" <td>https://www.rightmove.co.uk/properties/139354259</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>352</th>\n",
" <td>85.50</td>\n",
" <td>475000.0</td>\n",
" <td>5555.555556</td>\n",
" <td>https://www.rightmove.co.uk/properties/142142348</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>36</th>\n",
" <td>82.90</td>\n",
" <td>475000.0</td>\n",
" <td>5729.794934</td>\n",
" <td>https://www.rightmove.co.uk/properties/128925950</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>700</th>\n",
" <td>101.00</td>\n",
" <td>650000.0</td>\n",
" <td>6435.643564</td>\n",
" <td>https://www.rightmove.co.uk/properties/144591572</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>823</th>\n",
" <td>80.40</td>\n",
" <td>525000.0</td>\n",
" <td>6529.850746</td>\n",
" <td>https://www.rightmove.co.uk/properties/145051769</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>214</th>\n",
" <td>91.51</td>\n",
" <td>650000.0</td>\n",
" <td>7103.048847</td>\n",
" <td>https://www.rightmove.co.uk/properties/140326307</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>171</th>\n",
" <td>91.10</td>\n",
" <td>650000.0</td>\n",
" <td>7135.016465</td>\n",
" <td>https://www.rightmove.co.uk/properties/139245428</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>598</th>\n",
" <td>109.40</td>\n",
" <td>795000.0</td>\n",
" <td>7266.910420</td>\n",
" <td>https://www.rightmove.co.uk/properties/144034655</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>146</th>\n",
" <td>93.78</td>\n",
" <td>700000.0</td>\n",
" <td>7464.278098</td>\n",
" <td>https://www.rightmove.co.uk/properties/138510395</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>711</th>\n",
" <td>100.31</td>\n",
" <td>750000.0</td>\n",
" <td>7476.821852</td>\n",
" <td>https://www.rightmove.co.uk/properties/144620303</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>592</th>\n",
" <td>86.49</td>\n",
" <td>650000.0</td>\n",
" <td>7515.319690</td>\n",
" <td>https://www.rightmove.co.uk/properties/143987669</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>624</th>\n",
" <td>101.35</td>\n",
" <td>775000.0</td>\n",
" <td>7646.768624</td>\n",
" <td>https://www.rightmove.co.uk/properties/144217922</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>55</th>\n",
" <td>97.60</td>\n",
" <td>750000.0</td>\n",
" <td>7684.426230</td>\n",
" <td>https://www.rightmove.co.uk/properties/132564737</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>851</th>\n",
" <td>81.01</td>\n",
" <td>625000.0</td>\n",
" <td>7715.096902</td>\n",
" <td>https://www.rightmove.co.uk/properties/145172504</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>356</th>\n",
" <td>89.00</td>\n",
" <td>695000.0</td>\n",
" <td>7808.988764</td>\n",
" <td>https://www.rightmove.co.uk/properties/142185623</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>748</th>\n",
" <td>85.90</td>\n",
" <td>675000.0</td>\n",
" <td>7857.974389</td>\n",
" <td>https://www.rightmove.co.uk/properties/144771281</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>204</th>\n",
" <td>82.40</td>\n",
" <td>650000.0</td>\n",
" <td>7888.349515</td>\n",
" <td>https://www.rightmove.co.uk/properties/140173319</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>654</th>\n",
" <td>83.33</td>\n",
" <td>665000.0</td>\n",
" <td>7980.319213</td>\n",
" <td>https://www.rightmove.co.uk/properties/144361100</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>514</th>\n",
" <td>87.50</td>\n",
" <td>700000.0</td>\n",
" <td>8000.000000</td>\n",
" <td>https://www.rightmove.co.uk/properties/143460365</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>762</th>\n",
" <td>92.90</td>\n",
" <td>750000.0</td>\n",
" <td>8073.196986</td>\n",
" <td>https://www.rightmove.co.uk/properties/144846725</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>963</th>\n",
" <td>92.90</td>\n",
" <td>750000.0</td>\n",
" <td>8073.196986</td>\n",
" <td>https://www.rightmove.co.uk/properties/145565252</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>938</th>\n",
" <td>86.10</td>\n",
" <td>699000.0</td>\n",
" <td>8118.466899</td>\n",
" <td>https://www.rightmove.co.uk/properties/145491137</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>403</th>\n",
" <td>90.60</td>\n",
" <td>750000.0</td>\n",
" <td>8278.145695</td>\n",
" <td>https://www.rightmove.co.uk/properties/142704416</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>302</th>\n",
" <td>93.30</td>\n",
" <td>795000.0</td>\n",
" <td>8520.900322</td>\n",
" <td>https://www.rightmove.co.uk/properties/141595433</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>671</th>\n",
" <td>93.27</td>\n",
" <td>800000.0</td>\n",
" <td>8577.248847</td>\n",
" <td>https://www.rightmove.co.uk/properties/144429140</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>349</th>\n",
" <td>80.57</td>\n",
" <td>695000.0</td>\n",
" <td>8626.039469</td>\n",
" <td>https://www.rightmove.co.uk/properties/142115918</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>224</th>\n",
" <td>90.10</td>\n",
" <td>800000.0</td>\n",
" <td>8879.023307</td>\n",
" <td>https://www.rightmove.co.uk/properties/140464481</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>740</th>\n",
" <td>81.70</td>\n",
" <td>735000.0</td>\n",
" <td>8996.328029</td>\n",
" <td>https://www.rightmove.co.uk/properties/144722414</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>326</th>\n",
" <td>87.30</td>\n",
" <td>800000.0</td>\n",
" <td>9163.802978</td>\n",
" <td>https://www.rightmove.co.uk/properties/141846023</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>319</th>\n",
" <td>81.57</td>\n",
" <td>750000.0</td>\n",
" <td>9194.556822</td>\n",
" <td>https://www.rightmove.co.uk/properties/141797357</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>558</th>\n",
" <td>86.77</td>\n",
" <td>800000.0</td>\n",
" <td>9219.776420</td>\n",
" <td>https://www.rightmove.co.uk/properties/143758763</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>712</th>\n",
" <td>86.30</td>\n",
" <td>800000.0</td>\n",
" <td>9269.988413</td>\n",
" <td>https://www.rightmove.co.uk/properties/144622157</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>473</th>\n",
" <td>86.00</td>\n",
" <td>800000.0</td>\n",
" <td>9302.325581</td>\n",
" <td>https://www.rightmove.co.uk/properties/143210102</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>105</th>\n",
" <td>80.40</td>\n",
" <td>750000.0</td>\n",
" <td>9328.358209</td>\n",
" <td>https://www.rightmove.co.uk/properties/136988726</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1003</th>\n",
" <td>80.27</td>\n",
" <td>750000.0</td>\n",
" <td>9343.465803</td>\n",
" <td>https://www.rightmove.co.uk/properties/86775291</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>235</th>\n",
" <td>82.80</td>\n",
" <td>775000.0</td>\n",
" <td>9359.903382</td>\n",
" <td>https://www.rightmove.co.uk/properties/140611055</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>65</th>\n",
" <td>85.10</td>\n",
" <td>800000.0</td>\n",
" <td>9400.705053</td>\n",
" <td>https://www.rightmove.co.uk/properties/134116232</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>30</th>\n",
" <td>83.70</td>\n",
" <td>795000.0</td>\n",
" <td>9498.207885</td>\n",
" <td>https://www.rightmove.co.uk/properties/127787960</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1025</th>\n",
" <td>81.60</td>\n",
" <td>790000.0</td>\n",
" <td>9681.372549</td>\n",
" <td>https://www.rightmove.co.uk/properties/86972726</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>88</th>\n",
" <td>81.75</td>\n",
" <td>800000.0</td>\n",
" <td>9785.932722</td>\n",
" <td>https://www.rightmove.co.uk/properties/136012193</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>454</th>\n",
" <td>80.80</td>\n",
" <td>800000.0</td>\n",
" <td>9900.990099</td>\n",
" <td>https://www.rightmove.co.uk/properties/143138867</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>343</th>\n",
" <td>80.64</td>\n",
" <td>800000.0</td>\n",
" <td>9920.634921</td>\n",
" <td>https://www.rightmove.co.uk/properties/142032935</td>\n",
" <td>2</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" sqm_ocr price price_per_sqm \\\n",
"953 74142.40 550000.0 7.418157 \n",
"249 21850.10 725000.0 33.180626 \n",
"177 137.50 695000.0 5054.545455 \n",
"352 85.50 475000.0 5555.555556 \n",
"36 82.90 475000.0 5729.794934 \n",
"700 101.00 650000.0 6435.643564 \n",
"823 80.40 525000.0 6529.850746 \n",
"214 91.51 650000.0 7103.048847 \n",
"171 91.10 650000.0 7135.016465 \n",
"598 109.40 795000.0 7266.910420 \n",
"146 93.78 700000.0 7464.278098 \n",
"711 100.31 750000.0 7476.821852 \n",
"592 86.49 650000.0 7515.319690 \n",
"624 101.35 775000.0 7646.768624 \n",
"55 97.60 750000.0 7684.426230 \n",
"851 81.01 625000.0 7715.096902 \n",
"356 89.00 695000.0 7808.988764 \n",
"748 85.90 675000.0 7857.974389 \n",
"204 82.40 650000.0 7888.349515 \n",
"654 83.33 665000.0 7980.319213 \n",
"514 87.50 700000.0 8000.000000 \n",
"762 92.90 750000.0 8073.196986 \n",
"963 92.90 750000.0 8073.196986 \n",
"938 86.10 699000.0 8118.466899 \n",
"403 90.60 750000.0 8278.145695 \n",
"302 93.30 795000.0 8520.900322 \n",
"671 93.27 800000.0 8577.248847 \n",
"349 80.57 695000.0 8626.039469 \n",
"224 90.10 800000.0 8879.023307 \n",
"740 81.70 735000.0 8996.328029 \n",
"326 87.30 800000.0 9163.802978 \n",
"319 81.57 750000.0 9194.556822 \n",
"558 86.77 800000.0 9219.776420 \n",
"712 86.30 800000.0 9269.988413 \n",
"473 86.00 800000.0 9302.325581 \n",
"105 80.40 750000.0 9328.358209 \n",
"1003 80.27 750000.0 9343.465803 \n",
"235 82.80 775000.0 9359.903382 \n",
"65 85.10 800000.0 9400.705053 \n",
"30 83.70 795000.0 9498.207885 \n",
"1025 81.60 790000.0 9681.372549 \n",
"88 81.75 800000.0 9785.932722 \n",
"454 80.80 800000.0 9900.990099 \n",
"343 80.64 800000.0 9920.634921 \n",
"\n",
" url bedrooms \n",
"953 https://www.rightmove.co.uk/properties/145546538 2 \n",
"249 https://www.rightmove.co.uk/properties/140821736 2 \n",
"177 https://www.rightmove.co.uk/properties/139354259 2 \n",
"352 https://www.rightmove.co.uk/properties/142142348 2 \n",
"36 https://www.rightmove.co.uk/properties/128925950 2 \n",
"700 https://www.rightmove.co.uk/properties/144591572 1 \n",
"823 https://www.rightmove.co.uk/properties/145051769 2 \n",
"214 https://www.rightmove.co.uk/properties/140326307 2 \n",
"171 https://www.rightmove.co.uk/properties/139245428 2 \n",
"598 https://www.rightmove.co.uk/properties/144034655 2 \n",
"146 https://www.rightmove.co.uk/properties/138510395 2 \n",
"711 https://www.rightmove.co.uk/properties/144620303 2 \n",
"592 https://www.rightmove.co.uk/properties/143987669 2 \n",
"624 https://www.rightmove.co.uk/properties/144217922 1 \n",
"55 https://www.rightmove.co.uk/properties/132564737 2 \n",
"851 https://www.rightmove.co.uk/properties/145172504 2 \n",
"356 https://www.rightmove.co.uk/properties/142185623 2 \n",
"748 https://www.rightmove.co.uk/properties/144771281 2 \n",
"204 https://www.rightmove.co.uk/properties/140173319 2 \n",
"654 https://www.rightmove.co.uk/properties/144361100 2 \n",
"514 https://www.rightmove.co.uk/properties/143460365 1 \n",
"762 https://www.rightmove.co.uk/properties/144846725 1 \n",
"963 https://www.rightmove.co.uk/properties/145565252 2 \n",
"938 https://www.rightmove.co.uk/properties/145491137 2 \n",
"403 https://www.rightmove.co.uk/properties/142704416 2 \n",
"302 https://www.rightmove.co.uk/properties/141595433 2 \n",
"671 https://www.rightmove.co.uk/properties/144429140 2 \n",
"349 https://www.rightmove.co.uk/properties/142115918 2 \n",
"224 https://www.rightmove.co.uk/properties/140464481 2 \n",
"740 https://www.rightmove.co.uk/properties/144722414 2 \n",
"326 https://www.rightmove.co.uk/properties/141846023 2 \n",
"319 https://www.rightmove.co.uk/properties/141797357 2 \n",
"558 https://www.rightmove.co.uk/properties/143758763 2 \n",
"712 https://www.rightmove.co.uk/properties/144622157 2 \n",
"473 https://www.rightmove.co.uk/properties/143210102 2 \n",
"105 https://www.rightmove.co.uk/properties/136988726 2 \n",
"1003 https://www.rightmove.co.uk/properties/86775291 2 \n",
"235 https://www.rightmove.co.uk/properties/140611055 2 \n",
"65 https://www.rightmove.co.uk/properties/134116232 2 \n",
"30 https://www.rightmove.co.uk/properties/127787960 1 \n",
"1025 https://www.rightmove.co.uk/properties/86972726 2 \n",
"88 https://www.rightmove.co.uk/properties/136012193 1 \n",
"454 https://www.rightmove.co.uk/properties/143138867 2 \n",
"343 https://www.rightmove.co.uk/properties/142032935 2 "
]
},
"execution_count": 5,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Keep rows whose sqm_ocr exceeds 80, then display them ordered by ascending price_per_sqm.\n",
"# NOTE(review): sqm_ocr has no upper bound here, so implausible readings\n",
"# (e.g. 74142.40 and 21850.10 sqm) pass the filter and rank first on price_per_sqm.\n",
"df2 = df.loc[df['sqm_ocr'] > 80]\n",
"df2.sort_values(by='price_per_sqm')"
]
},
{
"cell_type": "code",
"execution_count": 6,
"id": "52545cfa-0932-46fe-ba7e-961fd43f2786",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>sqm_ocr</th>\n",
" <th>price</th>\n",
" <th>price_per_sqm</th>\n",
" <th>url</th>\n",
" <th>bedrooms</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>359</th>\n",
" <td>73.40</td>\n",
" <td>400000.0</td>\n",
" <td>5449.591281</td>\n",
" <td>https://www.rightmove.co.uk/properties/142186991</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>293</th>\n",
" <td>77.00</td>\n",
" <td>425000.0</td>\n",
" <td>5519.480519</td>\n",
" <td>https://www.rightmove.co.uk/properties/141437783</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>352</th>\n",
" <td>85.50</td>\n",
" <td>475000.0</td>\n",
" <td>5555.555556</td>\n",
" <td>https://www.rightmove.co.uk/properties/142142348</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>685</th>\n",
" <td>76.03</td>\n",
" <td>425000.0</td>\n",
" <td>5589.898724</td>\n",
" <td>https://www.rightmove.co.uk/properties/144494012</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>36</th>\n",
" <td>82.90</td>\n",
" <td>475000.0</td>\n",
" <td>5729.794934</td>\n",
" <td>https://www.rightmove.co.uk/properties/128925950</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>491</th>\n",
" <td>71.68</td>\n",
" <td>450000.0</td>\n",
" <td>6277.901786</td>\n",
" <td>https://www.rightmove.co.uk/properties/143315840</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1020</th>\n",
" <td>73.67</td>\n",
" <td>495000.0</td>\n",
" <td>6719.152980</td>\n",
" <td>https://www.rightmove.co.uk/properties/86807916</td>\n",
" <td>2</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" sqm_ocr price price_per_sqm \\\n",
"359 73.40 400000.0 5449.591281 \n",
"293 77.00 425000.0 5519.480519 \n",
"352 85.50 475000.0 5555.555556 \n",
"685 76.03 425000.0 5589.898724 \n",
"36 82.90 475000.0 5729.794934 \n",
"491 71.68 450000.0 6277.901786 \n",
"1020 73.67 495000.0 6719.152980 \n",
"\n",
" url bedrooms \n",
"359 https://www.rightmove.co.uk/properties/142186991 2 \n",
"293 https://www.rightmove.co.uk/properties/141437783 2 \n",
"352 https://www.rightmove.co.uk/properties/142142348 2 \n",
"685 https://www.rightmove.co.uk/properties/144494012 2 \n",
"36 https://www.rightmove.co.uk/properties/128925950 2 \n",
"491 https://www.rightmove.co.uk/properties/143315840 2 \n",
"1020 https://www.rightmove.co.uk/properties/86807916 2 "
]
},
"execution_count": 6,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Keep rows with sqm_ocr above 70 and price strictly below 500000,\n",
"# then display them ordered by ascending price_per_sqm.\n",
"df2 = df.loc[df['sqm_ocr'].gt(70) & df['price'].lt(500_000)]\n",
"df2.sort_values(by='price_per_sqm')"
]
},
{
"cell_type": "code",
"execution_count": 7,
"id": "d0246926-13ef-4110-8e3a-fb676a55c2a6",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>sqm_ocr</th>\n",
" <th>price</th>\n",
" <th>price_per_sqm</th>\n",
" <th>url</th>\n",
" <th>bedrooms</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>953</th>\n",
" <td>74142.40</td>\n",
" <td>550000.0</td>\n",
" <td>7.418157</td>\n",
" <td>https://www.rightmove.co.uk/properties/145546538</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>823</th>\n",
" <td>80.40</td>\n",
" <td>525000.0</td>\n",
" <td>6529.850746</td>\n",
" <td>https://www.rightmove.co.uk/properties/145051769</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>492</th>\n",
" <td>73.90</td>\n",
" <td>525000.0</td>\n",
" <td>7104.194858</td>\n",
" <td>https://www.rightmove.co.uk/properties/143317361</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>561</th>\n",
" <td>76.70</td>\n",
" <td>550000.0</td>\n",
" <td>7170.795306</td>\n",
" <td>https://www.rightmove.co.uk/properties/143780789</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>69</th>\n",
" <td>73.10</td>\n",
" <td>525000.0</td>\n",
" <td>7181.942544</td>\n",
" <td>https://www.rightmove.co.uk/properties/134574563</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>988</th>\n",
" <td>72.40</td>\n",
" <td>525000.0</td>\n",
" <td>7251.381215</td>\n",
" <td>https://www.rightmove.co.uk/properties/86648925</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>272</th>\n",
" <td>77.89</td>\n",
" <td>575000.0</td>\n",
" <td>7382.205675</td>\n",
" <td>https://www.rightmove.co.uk/properties/141131297</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>521</th>\n",
" <td>70.88</td>\n",
" <td>525000.0</td>\n",
" <td>7406.884876</td>\n",
" <td>https://www.rightmove.co.uk/properties/143514149</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>324</th>\n",
" <td>76.10</td>\n",
" <td>575000.0</td>\n",
" <td>7555.847569</td>\n",
" <td>https://www.rightmove.co.uk/properties/141831353</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1018</th>\n",
" <td>71.80</td>\n",
" <td>550000.0</td>\n",
" <td>7660.167131</td>\n",
" <td>https://www.rightmove.co.uk/properties/86804832</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>526</th>\n",
" <td>78.00</td>\n",
" <td>600000.0</td>\n",
" <td>7692.307692</td>\n",
" <td>https://www.rightmove.co.uk/properties/143552156</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>817</th>\n",
" <td>71.17</td>\n",
" <td>550000.0</td>\n",
" <td>7727.975270</td>\n",
" <td>https://www.rightmove.co.uk/properties/145035929</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>843</th>\n",
" <td>77.50</td>\n",
" <td>600000.0</td>\n",
" <td>7741.935484</td>\n",
" <td>https://www.rightmove.co.uk/properties/145144988</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>337</th>\n",
" <td>70.60</td>\n",
" <td>550000.0</td>\n",
" <td>7790.368272</td>\n",
" <td>https://www.rightmove.co.uk/properties/141904286</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>233</th>\n",
" <td>75.70</td>\n",
" <td>600000.0</td>\n",
" <td>7926.023778</td>\n",
" <td>https://www.rightmove.co.uk/properties/140582213</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>763</th>\n",
" <td>75.00</td>\n",
" <td>600000.0</td>\n",
" <td>8000.000000</td>\n",
" <td>https://www.rightmove.co.uk/properties/144862070</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>315</th>\n",
" <td>71.30</td>\n",
" <td>590000.0</td>\n",
" <td>8274.894811</td>\n",
" <td>https://www.rightmove.co.uk/properties/141669686</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>899</th>\n",
" <td>71.47</td>\n",
" <td>595000.0</td>\n",
" <td>8325.171401</td>\n",
" <td>https://www.rightmove.co.uk/properties/145362911</td>\n",
" <td>2</td>\n",
" </tr>\n",
" <tr>\n",
" <th>147</th>\n",
" <td>71.50</td>\n",
" <td>600000.0</td>\n",
" <td>8391.608392</td>\n",
" <td>https://www.rightmove.co.uk/properties/138537527</td>\n",
" <td>1</td>\n",
" </tr>\n",
" <tr>\n",
" <th>973</th>\n",
" <td>70.89</td>\n",
" <td>595000.0</td>\n",
" <td>8393.285372</td>\n",
" <td>https://www.rightmove.co.uk/properties/86296491</td>\n",
" <td>2</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" sqm_ocr price price_per_sqm \\\n",
"953 74142.40 550000.0 7.418157 \n",
"823 80.40 525000.0 6529.850746 \n",
"492 73.90 525000.0 7104.194858 \n",
"561 76.70 550000.0 7170.795306 \n",
"69 73.10 525000.0 7181.942544 \n",
"988 72.40 525000.0 7251.381215 \n",
"272 77.89 575000.0 7382.205675 \n",
"521 70.88 525000.0 7406.884876 \n",
"324 76.10 575000.0 7555.847569 \n",
"1018 71.80 550000.0 7660.167131 \n",
"526 78.00 600000.0 7692.307692 \n",
"817 71.17 550000.0 7727.975270 \n",
"843 77.50 600000.0 7741.935484 \n",
"337 70.60 550000.0 7790.368272 \n",
"233 75.70 600000.0 7926.023778 \n",
"763 75.00 600000.0 8000.000000 \n",
"315 71.30 590000.0 8274.894811 \n",
"899 71.47 595000.0 8325.171401 \n",
"147 71.50 600000.0 8391.608392 \n",
"973 70.89 595000.0 8393.285372 \n",
"\n",
" url bedrooms \n",
"953 https://www.rightmove.co.uk/properties/145546538 2 \n",
"823 https://www.rightmove.co.uk/properties/145051769 2 \n",
"492 https://www.rightmove.co.uk/properties/143317361 2 \n",
"561 https://www.rightmove.co.uk/properties/143780789 2 \n",
"69 https://www.rightmove.co.uk/properties/134574563 2 \n",
"988 https://www.rightmove.co.uk/properties/86648925 2 \n",
"272 https://www.rightmove.co.uk/properties/141131297 2 \n",
"521 https://www.rightmove.co.uk/properties/143514149 2 \n",
"324 https://www.rightmove.co.uk/properties/141831353 2 \n",
"1018 https://www.rightmove.co.uk/properties/86804832 2 \n",
"526 https://www.rightmove.co.uk/properties/143552156 1 \n",
"817 https://www.rightmove.co.uk/properties/145035929 2 \n",
"843 https://www.rightmove.co.uk/properties/145144988 2 \n",
"337 https://www.rightmove.co.uk/properties/141904286 2 \n",
"233 https://www.rightmove.co.uk/properties/140582213 2 \n",
"763 https://www.rightmove.co.uk/properties/144862070 2 \n",
"315 https://www.rightmove.co.uk/properties/141669686 2 \n",
"899 https://www.rightmove.co.uk/properties/145362911 2 \n",
"147 https://www.rightmove.co.uk/properties/138537527 1 \n",
"973 https://www.rightmove.co.uk/properties/86296491 2 "
]
},
"execution_count": 7,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Keep rows with sqm_ocr above 70 and price in the half-open band (500000, 600000],\n",
"# then display them ordered by ascending price_per_sqm.\n",
"# NOTE(review): sqm_ocr has no upper bound here, so the implausible 74142.40 sqm\n",
"# reading passes the filter and ranks first on price_per_sqm.\n",
"df2 = df.loc[df['sqm_ocr'].gt(70) & df['price'].between(500_000, 600_000, inclusive='right')]\n",
"df2.sort_values(by='price_per_sqm')"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "b9f2ca7b-8476-47f1-a34f-7acdfbe84bd1",
"metadata": {},
"outputs": [],
"source": []
},
{
"cell_type": "code",
"execution_count": 10,
"id": "edd9fa24-cad2-4448-9b17-c6d514564f41",
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>sqm_ocr</th>\n",
" <th>price</th>\n",
" <th>price_per_sqm</th>\n",
" <th>url</th>\n",
" <th>bedrooms</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
"Empty DataFrame\n",
"Columns: [sqm_ocr, price, price_per_sqm, url, bedrooms]\n",
"Index: []"
]
},
"execution_count": 10,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Display the rows that list more than two bedrooms.\n",
"df.loc[df['bedrooms'].gt(2)]"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "002b2a3a-3ecc-45c1-8c2f-c143380ee0d5",
"metadata": {},
"outputs": [],
"source": [
"\n"
]
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.12.0"
}
},
"nbformat": 4,
"nbformat_minor": 5
}