diff --git a/crawler/.ipynb_checkpoints/exploration-checkpoint.ipynb b/crawler/.ipynb_checkpoints/exploration-checkpoint.ipynb index 363fcab..480a582 100644 --- a/crawler/.ipynb_checkpoints/exploration-checkpoint.ipynb +++ b/crawler/.ipynb_checkpoints/exploration-checkpoint.ipynb @@ -1,6 +1,1714 @@ { - "cells": [], - "metadata": {}, + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "id": "f20bddee-1e7c-4c46-a17a-c7bb6c13f30c", + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "/Users/kadir/code/realestate/crawler/venv/lib/python3.12/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n", + " from .autonotebook import tqdm as notebook_tqdm\n" + ] + } + ], + "source": [ + "from data_access import Listing\n", + "import pandas as pd" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "id": "b1101088-9613-465f-81fd-79801e0202b8", + "metadata": {}, + "outputs": [], + "source": [ + "ls = Listing.get_all_listings()" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "id": "63e61601-7e3f-4d58-89f6-1794e4868cc3", + "metadata": {}, + "outputs": [], + "source": [ + "ds = [l.dict_nicely() for l in ls]" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "1c222721-f426-42c0-9ac5-badc1f7a2034", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
| \n", + " | sqm_ocr | \n", + "price | \n", + "price_per_sqm | \n", + "url | \n", + "bedrooms | \n", + "travel_time_fastest | \n", + "travel_time_second | \n", + "lease_left | \n", + "development | \n", + "
|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", + "7.81 | \n", + "350000.0 | \n", + "44814.340589 | \n", + "https://www.rightmove.co.uk/properties/102360773 | \n", + "1 | \n", + "{'duration': 2695, 'distance': 6467, 'duration... | \n", + "{'duration': 1682, 'distance': 6810, 'duration... | \n", + "119.0 | \n", + "False | \n", + "
| 1 | \n", + "NaN | \n", + "400000.0 | \n", + "NaN | \n", + "https://www.rightmove.co.uk/properties/105836849 | \n", + "3 | \n", + "{'duration': 2565, 'distance': 14070, 'duratio... | \n", + "{'duration': 2565, 'distance': 14070, 'duratio... | \n", + "NaN | \n", + "False | \n", + "
| 2 | \n", + "76.91 | \n", + "400000.0 | \n", + "5200.884150 | \n", + "https://www.rightmove.co.uk/properties/107233214 | \n", + "3 | \n", + "{'duration': 1714, 'distance': 9570, 'duration... | \n", + "{'duration': 1774, 'distance': 9570, 'duration... | \n", + "91.0 | \n", + "False | \n", + "
| 3 | \n", + "112.40 | \n", + "800000.0 | \n", + "7117.437722 | \n", + "https://www.rightmove.co.uk/properties/107976896 | \n", + "3 | \n", + "{'duration': 1862, 'distance': 8278, 'duration... | \n", + "{'duration': 1862, 'distance': 8278, 'duration... | \n", + "NaN | \n", + "False | \n", + "
| 4 | \n", + "115.60 | \n", + "775000.0 | \n", + "6704.152249 | \n", + "https://www.rightmove.co.uk/properties/115499441 | \n", + "3 | \n", + "{'duration': 2943, 'distance': 7437, 'duration... | \n", + "{'duration': 2167, 'distance': 9920, 'duration... | \n", + "NaN | \n", + "False | \n", + "
| ... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
| 2129 | \n", + "NaN | \n", + "750000.0 | \n", + "NaN | \n", + "https://www.rightmove.co.uk/properties/86813508 | \n", + "3 | \n", + "{'duration': 2400, 'distance': 13983, 'duratio... | \n", + "{'duration': 2605, 'distance': 14702, 'duratio... | \n", + "NaN | \n", + "True | \n", + "
| 2130 | \n", + "NaN | \n", + "655000.0 | \n", + "NaN | \n", + "https://www.rightmove.co.uk/properties/86813523 | \n", + "3 | \n", + "{'duration': 2400, 'distance': 13983, 'duratio... | \n", + "{'duration': 2605, 'distance': 14702, 'duratio... | \n", + "NaN | \n", + "True | \n", + "
| 2131 | \n", + "82.80 | \n", + "550000.0 | \n", + "6642.512077 | \n", + "https://www.rightmove.co.uk/properties/86814669 | \n", + "3 | \n", + "{'duration': 2310, 'distance': 12972, 'duratio... | \n", + "{'duration': 2322, 'distance': 12104, 'duratio... | \n", + "0.0 | \n", + "False | \n", + "
| 2132 | \n", + "5.52 | \n", + "300000.0 | \n", + "54347.826087 | \n", + "https://www.rightmove.co.uk/properties/86955958 | \n", + "3 | \n", + "{'duration': 2332, 'distance': 6898, 'duration... | \n", + "{'duration': 2248, 'distance': 6893, 'duration... | \n", + "105.0 | \n", + "False | \n", + "
| 2133 | \n", + "81.60 | \n", + "790000.0 | \n", + "9681.372549 | \n", + "https://www.rightmove.co.uk/properties/86972726 | \n", + "2 | \n", + "{'duration': 1393, 'distance': 6390, 'duration... | \n", + "{'duration': 2733, 'distance': 6490, 'duration... | \n", + "993.0 | \n", + "False | \n", + "
2134 rows × 9 columns
\n", + "| \n", + " | sqm_ocr | \n", + "price | \n", + "price_per_sqm | \n", + "url | \n", + "bedrooms | \n", + "duration | \n", + "distance | \n", + "duration_static | \n", + "duration_per_transit | \n", + "distance_per_transit | \n", + "number_of_transit_stops | \n", + "duration | \n", + "distance | \n", + "duration_static | \n", + "duration_per_transit | \n", + "distance_per_transit | \n", + "number_of_transit_stops | \n", + "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", + "7.81 | \n", + "350000.0 | \n", + "44814.340589 | \n", + "https://www.rightmove.co.uk/properties/102360773 | \n", + "1 | \n", + "2695 | \n", + "6467 | \n", + "2695 | \n", + "{'WALK': 414, 'TRANSIT': 2280} | \n", + "{'WALK': 465, 'TRANSIT': 6002} | \n", + "1 | \n", + "1682.0 | \n", + "6810.0 | \n", + "1682.0 | \n", + "{'WALK': 608, 'TRANSIT': 804} | \n", + "{'WALK': 582, 'TRANSIT': 6228} | \n", + "2.0 | \n", + "
| 1 | \n", + "NaN | \n", + "400000.0 | \n", + "NaN | \n", + "https://www.rightmove.co.uk/properties/105836849 | \n", + "3 | \n", + "2565 | \n", + "14070 | \n", + "2565 | \n", + "{'WALK': 750, 'TRANSIT': 1800} | \n", + "{'WALK': 856, 'TRANSIT': 13214} | \n", + "1 | \n", + "2565.0 | \n", + "14070.0 | \n", + "2565.0 | \n", + "{'WALK': 750, 'TRANSIT': 1800} | \n", + "{'WALK': 856, 'TRANSIT': 13214} | \n", + "1.0 | \n", + "
| 2 | \n", + "76.91 | \n", + "400000.0 | \n", + "5200.884150 | \n", + "https://www.rightmove.co.uk/properties/107233214 | \n", + "3 | \n", + "1714 | \n", + "9570 | \n", + "1714 | \n", + "{'WALK': 903, 'TRANSIT': 780} | \n", + "{'WALK': 1035, 'TRANSIT': 8535} | \n", + "1 | \n", + "1774.0 | \n", + "9570.0 | \n", + "1774.0 | \n", + "{'WALK': 903, 'TRANSIT': 840} | \n", + "{'WALK': 1035, 'TRANSIT': 8535} | \n", + "1.0 | \n", + "
| 3 | \n", + "112.40 | \n", + "800000.0 | \n", + "7117.437722 | \n", + "https://www.rightmove.co.uk/properties/107976896 | \n", + "3 | \n", + "1862 | \n", + "8278 | \n", + "1862 | \n", + "{'WALK': 635, 'TRANSIT': 900} | \n", + "{'WALK': 710, 'TRANSIT': 7568} | \n", + "2 | \n", + "1862.0 | \n", + "8278.0 | \n", + "1862.0 | \n", + "{'WALK': 635, 'TRANSIT': 960} | \n", + "{'WALK': 710, 'TRANSIT': 7568} | \n", + "2.0 | \n", + "
| 4 | \n", + "115.60 | \n", + "775000.0 | \n", + "6704.152249 | \n", + "https://www.rightmove.co.uk/properties/115499441 | \n", + "3 | \n", + "2943 | \n", + "7437 | \n", + "2943 | \n", + "{'WALK': 242, 'TRANSIT': 2700} | \n", + "{'WALK': 276, 'TRANSIT': 7161} | \n", + "1 | \n", + "2167.0 | \n", + "9920.0 | \n", + "2167.0 | \n", + "{'WALK': 658, 'TRANSIT': 1200} | \n", + "{'WALK': 720, 'TRANSIT': 9200} | \n", + "2.0 | \n", + "
| ... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
| 2046 | \n", + "NaN | \n", + "750000.0 | \n", + "NaN | \n", + "https://www.rightmove.co.uk/properties/86813508 | \n", + "3 | \n", + "2400 | \n", + "13983 | \n", + "2400 | \n", + "{'WALK': 603, 'TRANSIT': 1524} | \n", + "{'WALK': 671, 'TRANSIT': 13312} | \n", + "2 | \n", + "2605.0 | \n", + "14702.0 | \n", + "2605.0 | \n", + "{'WALK': 1467, 'TRANSIT': 1132} | \n", + "{'WALK': 1698, 'TRANSIT': 13004} | \n", + "1.0 | \n", + "
| 2047 | \n", + "NaN | \n", + "655000.0 | \n", + "NaN | \n", + "https://www.rightmove.co.uk/properties/86813523 | \n", + "3 | \n", + "2400 | \n", + "13983 | \n", + "2400 | \n", + "{'WALK': 603, 'TRANSIT': 1524} | \n", + "{'WALK': 671, 'TRANSIT': 13312} | \n", + "2 | \n", + "2605.0 | \n", + "14702.0 | \n", + "2605.0 | \n", + "{'WALK': 1467, 'TRANSIT': 1132} | \n", + "{'WALK': 1698, 'TRANSIT': 13004} | \n", + "1.0 | \n", + "
| 2048 | \n", + "82.80 | \n", + "550000.0 | \n", + "6642.512077 | \n", + "https://www.rightmove.co.uk/properties/86814669 | \n", + "3 | \n", + "2310 | \n", + "12972 | \n", + "2310 | \n", + "{'WALK': 786, 'TRANSIT': 1277} | \n", + "{'WALK': 885, 'TRANSIT': 12087} | \n", + "2 | \n", + "2322.0 | \n", + "12104.0 | \n", + "2322.0 | \n", + "{'WALK': 991, 'TRANSIT': 1080} | \n", + "{'WALK': 1089, 'TRANSIT': 11015} | \n", + "2.0 | \n", + "
| 2049 | \n", + "5.52 | \n", + "300000.0 | \n", + "54347.826087 | \n", + "https://www.rightmove.co.uk/properties/86955958 | \n", + "3 | \n", + "2332 | \n", + "6898 | \n", + "2332 | \n", + "{'WALK': 1671, 'TRANSIT': 660} | \n", + "{'WALK': 1945, 'TRANSIT': 4953} | \n", + "1 | \n", + "2248.0 | \n", + "6893.0 | \n", + "2248.0 | \n", + "{'WALK': 1671, 'TRANSIT': 576} | \n", + "{'WALK': 1945, 'TRANSIT': 4948} | \n", + "1.0 | \n", + "
| 2050 | \n", + "81.60 | \n", + "790000.0 | \n", + "9681.372549 | \n", + "https://www.rightmove.co.uk/properties/86972726 | \n", + "2 | \n", + "1393 | \n", + "6390 | \n", + "1393 | \n", + "{'WALK': 518, 'TRANSIT': 564} | \n", + "{'WALK': 441, 'TRANSIT': 5949} | \n", + "2 | \n", + "2733.0 | \n", + "6490.0 | \n", + "2733.0 | \n", + "{'WALK': 451, 'TRANSIT': 2280} | \n", + "{'WALK': 488, 'TRANSIT': 6002} | \n", + "1.0 | \n", + "
2051 rows × 17 columns
\n", + "| \n", + " | sqm_ocr | \n", + "price | \n", + "price_per_sqm | \n", + "url | \n", + "bedrooms | \n", + "
|---|---|---|---|---|---|
| 953 | \n", + "74142.40 | \n", + "550000.0 | \n", + "7.418157 | \n", + "https://www.rightmove.co.uk/properties/145546538 | \n", + "2 | \n", + "
| 249 | \n", + "21850.10 | \n", + "725000.0 | \n", + "33.180626 | \n", + "https://www.rightmove.co.uk/properties/140821736 | \n", + "2 | \n", + "
| 177 | \n", + "137.50 | \n", + "695000.0 | \n", + "5054.545455 | \n", + "https://www.rightmove.co.uk/properties/139354259 | \n", + "2 | \n", + "
| 352 | \n", + "85.50 | \n", + "475000.0 | \n", + "5555.555556 | \n", + "https://www.rightmove.co.uk/properties/142142348 | \n", + "2 | \n", + "
| 36 | \n", + "82.90 | \n", + "475000.0 | \n", + "5729.794934 | \n", + "https://www.rightmove.co.uk/properties/128925950 | \n", + "2 | \n", + "
| 700 | \n", + "101.00 | \n", + "650000.0 | \n", + "6435.643564 | \n", + "https://www.rightmove.co.uk/properties/144591572 | \n", + "1 | \n", + "
| 823 | \n", + "80.40 | \n", + "525000.0 | \n", + "6529.850746 | \n", + "https://www.rightmove.co.uk/properties/145051769 | \n", + "2 | \n", + "
| 214 | \n", + "91.51 | \n", + "650000.0 | \n", + "7103.048847 | \n", + "https://www.rightmove.co.uk/properties/140326307 | \n", + "2 | \n", + "
| 171 | \n", + "91.10 | \n", + "650000.0 | \n", + "7135.016465 | \n", + "https://www.rightmove.co.uk/properties/139245428 | \n", + "2 | \n", + "
| 598 | \n", + "109.40 | \n", + "795000.0 | \n", + "7266.910420 | \n", + "https://www.rightmove.co.uk/properties/144034655 | \n", + "2 | \n", + "
| 146 | \n", + "93.78 | \n", + "700000.0 | \n", + "7464.278098 | \n", + "https://www.rightmove.co.uk/properties/138510395 | \n", + "2 | \n", + "
| 711 | \n", + "100.31 | \n", + "750000.0 | \n", + "7476.821852 | \n", + "https://www.rightmove.co.uk/properties/144620303 | \n", + "2 | \n", + "
| 592 | \n", + "86.49 | \n", + "650000.0 | \n", + "7515.319690 | \n", + "https://www.rightmove.co.uk/properties/143987669 | \n", + "2 | \n", + "
| 624 | \n", + "101.35 | \n", + "775000.0 | \n", + "7646.768624 | \n", + "https://www.rightmove.co.uk/properties/144217922 | \n", + "1 | \n", + "
| 55 | \n", + "97.60 | \n", + "750000.0 | \n", + "7684.426230 | \n", + "https://www.rightmove.co.uk/properties/132564737 | \n", + "2 | \n", + "
| 851 | \n", + "81.01 | \n", + "625000.0 | \n", + "7715.096902 | \n", + "https://www.rightmove.co.uk/properties/145172504 | \n", + "2 | \n", + "
| 356 | \n", + "89.00 | \n", + "695000.0 | \n", + "7808.988764 | \n", + "https://www.rightmove.co.uk/properties/142185623 | \n", + "2 | \n", + "
| 748 | \n", + "85.90 | \n", + "675000.0 | \n", + "7857.974389 | \n", + "https://www.rightmove.co.uk/properties/144771281 | \n", + "2 | \n", + "
| 204 | \n", + "82.40 | \n", + "650000.0 | \n", + "7888.349515 | \n", + "https://www.rightmove.co.uk/properties/140173319 | \n", + "2 | \n", + "
| 654 | \n", + "83.33 | \n", + "665000.0 | \n", + "7980.319213 | \n", + "https://www.rightmove.co.uk/properties/144361100 | \n", + "2 | \n", + "
| 514 | \n", + "87.50 | \n", + "700000.0 | \n", + "8000.000000 | \n", + "https://www.rightmove.co.uk/properties/143460365 | \n", + "1 | \n", + "
| 762 | \n", + "92.90 | \n", + "750000.0 | \n", + "8073.196986 | \n", + "https://www.rightmove.co.uk/properties/144846725 | \n", + "1 | \n", + "
| 963 | \n", + "92.90 | \n", + "750000.0 | \n", + "8073.196986 | \n", + "https://www.rightmove.co.uk/properties/145565252 | \n", + "2 | \n", + "
| 938 | \n", + "86.10 | \n", + "699000.0 | \n", + "8118.466899 | \n", + "https://www.rightmove.co.uk/properties/145491137 | \n", + "2 | \n", + "
| 403 | \n", + "90.60 | \n", + "750000.0 | \n", + "8278.145695 | \n", + "https://www.rightmove.co.uk/properties/142704416 | \n", + "2 | \n", + "
| 302 | \n", + "93.30 | \n", + "795000.0 | \n", + "8520.900322 | \n", + "https://www.rightmove.co.uk/properties/141595433 | \n", + "2 | \n", + "
| 671 | \n", + "93.27 | \n", + "800000.0 | \n", + "8577.248847 | \n", + "https://www.rightmove.co.uk/properties/144429140 | \n", + "2 | \n", + "
| 349 | \n", + "80.57 | \n", + "695000.0 | \n", + "8626.039469 | \n", + "https://www.rightmove.co.uk/properties/142115918 | \n", + "2 | \n", + "
| 224 | \n", + "90.10 | \n", + "800000.0 | \n", + "8879.023307 | \n", + "https://www.rightmove.co.uk/properties/140464481 | \n", + "2 | \n", + "
| 740 | \n", + "81.70 | \n", + "735000.0 | \n", + "8996.328029 | \n", + "https://www.rightmove.co.uk/properties/144722414 | \n", + "2 | \n", + "
| 326 | \n", + "87.30 | \n", + "800000.0 | \n", + "9163.802978 | \n", + "https://www.rightmove.co.uk/properties/141846023 | \n", + "2 | \n", + "
| 319 | \n", + "81.57 | \n", + "750000.0 | \n", + "9194.556822 | \n", + "https://www.rightmove.co.uk/properties/141797357 | \n", + "2 | \n", + "
| 558 | \n", + "86.77 | \n", + "800000.0 | \n", + "9219.776420 | \n", + "https://www.rightmove.co.uk/properties/143758763 | \n", + "2 | \n", + "
| 712 | \n", + "86.30 | \n", + "800000.0 | \n", + "9269.988413 | \n", + "https://www.rightmove.co.uk/properties/144622157 | \n", + "2 | \n", + "
| 473 | \n", + "86.00 | \n", + "800000.0 | \n", + "9302.325581 | \n", + "https://www.rightmove.co.uk/properties/143210102 | \n", + "2 | \n", + "
| 105 | \n", + "80.40 | \n", + "750000.0 | \n", + "9328.358209 | \n", + "https://www.rightmove.co.uk/properties/136988726 | \n", + "2 | \n", + "
| 1003 | \n", + "80.27 | \n", + "750000.0 | \n", + "9343.465803 | \n", + "https://www.rightmove.co.uk/properties/86775291 | \n", + "2 | \n", + "
| 235 | \n", + "82.80 | \n", + "775000.0 | \n", + "9359.903382 | \n", + "https://www.rightmove.co.uk/properties/140611055 | \n", + "2 | \n", + "
| 65 | \n", + "85.10 | \n", + "800000.0 | \n", + "9400.705053 | \n", + "https://www.rightmove.co.uk/properties/134116232 | \n", + "2 | \n", + "
| 30 | \n", + "83.70 | \n", + "795000.0 | \n", + "9498.207885 | \n", + "https://www.rightmove.co.uk/properties/127787960 | \n", + "1 | \n", + "
| 1025 | \n", + "81.60 | \n", + "790000.0 | \n", + "9681.372549 | \n", + "https://www.rightmove.co.uk/properties/86972726 | \n", + "2 | \n", + "
| 88 | \n", + "81.75 | \n", + "800000.0 | \n", + "9785.932722 | \n", + "https://www.rightmove.co.uk/properties/136012193 | \n", + "1 | \n", + "
| 454 | \n", + "80.80 | \n", + "800000.0 | \n", + "9900.990099 | \n", + "https://www.rightmove.co.uk/properties/143138867 | \n", + "2 | \n", + "
| 343 | \n", + "80.64 | \n", + "800000.0 | \n", + "9920.634921 | \n", + "https://www.rightmove.co.uk/properties/142032935 | \n", + "2 | \n", + "
| \n", + " | sqm_ocr | \n", + "price | \n", + "price_per_sqm | \n", + "url | \n", + "bedrooms | \n", + "
|---|---|---|---|---|---|
| 359 | \n", + "73.40 | \n", + "400000.0 | \n", + "5449.591281 | \n", + "https://www.rightmove.co.uk/properties/142186991 | \n", + "2 | \n", + "
| 293 | \n", + "77.00 | \n", + "425000.0 | \n", + "5519.480519 | \n", + "https://www.rightmove.co.uk/properties/141437783 | \n", + "2 | \n", + "
| 352 | \n", + "85.50 | \n", + "475000.0 | \n", + "5555.555556 | \n", + "https://www.rightmove.co.uk/properties/142142348 | \n", + "2 | \n", + "
| 685 | \n", + "76.03 | \n", + "425000.0 | \n", + "5589.898724 | \n", + "https://www.rightmove.co.uk/properties/144494012 | \n", + "2 | \n", + "
| 36 | \n", + "82.90 | \n", + "475000.0 | \n", + "5729.794934 | \n", + "https://www.rightmove.co.uk/properties/128925950 | \n", + "2 | \n", + "
| 491 | \n", + "71.68 | \n", + "450000.0 | \n", + "6277.901786 | \n", + "https://www.rightmove.co.uk/properties/143315840 | \n", + "2 | \n", + "
| 1020 | \n", + "73.67 | \n", + "495000.0 | \n", + "6719.152980 | \n", + "https://www.rightmove.co.uk/properties/86807916 | \n", + "2 | \n", + "
| \n", + " | sqm_ocr | \n", + "price | \n", + "price_per_sqm | \n", + "url | \n", + "bedrooms | \n", + "
|---|---|---|---|---|---|
| 953 | \n", + "74142.40 | \n", + "550000.0 | \n", + "7.418157 | \n", + "https://www.rightmove.co.uk/properties/145546538 | \n", + "2 | \n", + "
| 823 | \n", + "80.40 | \n", + "525000.0 | \n", + "6529.850746 | \n", + "https://www.rightmove.co.uk/properties/145051769 | \n", + "2 | \n", + "
| 492 | \n", + "73.90 | \n", + "525000.0 | \n", + "7104.194858 | \n", + "https://www.rightmove.co.uk/properties/143317361 | \n", + "2 | \n", + "
| 561 | \n", + "76.70 | \n", + "550000.0 | \n", + "7170.795306 | \n", + "https://www.rightmove.co.uk/properties/143780789 | \n", + "2 | \n", + "
| 69 | \n", + "73.10 | \n", + "525000.0 | \n", + "7181.942544 | \n", + "https://www.rightmove.co.uk/properties/134574563 | \n", + "2 | \n", + "
| 988 | \n", + "72.40 | \n", + "525000.0 | \n", + "7251.381215 | \n", + "https://www.rightmove.co.uk/properties/86648925 | \n", + "2 | \n", + "
| 272 | \n", + "77.89 | \n", + "575000.0 | \n", + "7382.205675 | \n", + "https://www.rightmove.co.uk/properties/141131297 | \n", + "2 | \n", + "
| 521 | \n", + "70.88 | \n", + "525000.0 | \n", + "7406.884876 | \n", + "https://www.rightmove.co.uk/properties/143514149 | \n", + "2 | \n", + "
| 324 | \n", + "76.10 | \n", + "575000.0 | \n", + "7555.847569 | \n", + "https://www.rightmove.co.uk/properties/141831353 | \n", + "2 | \n", + "
| 1018 | \n", + "71.80 | \n", + "550000.0 | \n", + "7660.167131 | \n", + "https://www.rightmove.co.uk/properties/86804832 | \n", + "2 | \n", + "
| 526 | \n", + "78.00 | \n", + "600000.0 | \n", + "7692.307692 | \n", + "https://www.rightmove.co.uk/properties/143552156 | \n", + "1 | \n", + "
| 817 | \n", + "71.17 | \n", + "550000.0 | \n", + "7727.975270 | \n", + "https://www.rightmove.co.uk/properties/145035929 | \n", + "2 | \n", + "
| 843 | \n", + "77.50 | \n", + "600000.0 | \n", + "7741.935484 | \n", + "https://www.rightmove.co.uk/properties/145144988 | \n", + "2 | \n", + "
| 337 | \n", + "70.60 | \n", + "550000.0 | \n", + "7790.368272 | \n", + "https://www.rightmove.co.uk/properties/141904286 | \n", + "2 | \n", + "
| 233 | \n", + "75.70 | \n", + "600000.0 | \n", + "7926.023778 | \n", + "https://www.rightmove.co.uk/properties/140582213 | \n", + "2 | \n", + "
| 763 | \n", + "75.00 | \n", + "600000.0 | \n", + "8000.000000 | \n", + "https://www.rightmove.co.uk/properties/144862070 | \n", + "2 | \n", + "
| 315 | \n", + "71.30 | \n", + "590000.0 | \n", + "8274.894811 | \n", + "https://www.rightmove.co.uk/properties/141669686 | \n", + "2 | \n", + "
| 899 | \n", + "71.47 | \n", + "595000.0 | \n", + "8325.171401 | \n", + "https://www.rightmove.co.uk/properties/145362911 | \n", + "2 | \n", + "
| 147 | \n", + "71.50 | \n", + "600000.0 | \n", + "8391.608392 | \n", + "https://www.rightmove.co.uk/properties/138537527 | \n", + "1 | \n", + "
| 973 | \n", + "70.89 | \n", + "595000.0 | \n", + "8393.285372 | \n", + "https://www.rightmove.co.uk/properties/86296491 | \n", + "2 | \n", + "
| \n", + " | sqm_ocr | \n", + "price | \n", + "price_per_sqm | \n", + "url | \n", + "bedrooms | \n", + "
|---|
1026 rows × 5 columns
\n", + "2134 rows × 9 columns
\n", "" ], "text/plain": [ " sqm_ocr price price_per_sqm \\\n", "0 7.81 350000.0 44814.340589 \n", - "1 5.88 695000.0 118197.278912 \n", - "2 64.74 575000.0 8881.680568 \n", - "3 52.80 790000.0 14962.121212 \n", - "4 4.56 425000.0 93201.754386 \n", + "1 NaN 400000.0 NaN \n", + "2 76.91 400000.0 5200.884150 \n", + "3 112.40 800000.0 7117.437722 \n", + "4 115.60 775000.0 6704.152249 \n", "... ... ... ... \n", - "1021 NaN 220000.0 NaN \n", - "1022 49.00 450000.0 9183.673469 \n", - "1023 58.20 550000.0 9450.171821 \n", - "1024 3.00 475000.0 158333.333333 \n", - "1025 81.60 790000.0 9681.372549 \n", + "2129 NaN 750000.0 NaN \n", + "2130 NaN 655000.0 NaN \n", + "2131 82.80 550000.0 6642.512077 \n", + "2132 5.52 300000.0 54347.826087 \n", + "2133 81.60 790000.0 9681.372549 \n", "\n", - " url bedrooms \n", - "0 https://www.rightmove.co.uk/properties/102360773 1 \n", - "1 https://www.rightmove.co.uk/properties/115530848 1 \n", - "2 https://www.rightmove.co.uk/properties/117095606 2 \n", - "3 https://www.rightmove.co.uk/properties/118752221 1 \n", - "4 https://www.rightmove.co.uk/properties/119578451 2 \n", - "... ... ... \n", - "1021 https://www.rightmove.co.uk/properties/86809926 1 \n", - "1022 https://www.rightmove.co.uk/properties/86811141 1 \n", - "1023 https://www.rightmove.co.uk/properties/86811177 2 \n", - "1024 https://www.rightmove.co.uk/properties/86812494 1 \n", - "1025 https://www.rightmove.co.uk/properties/86972726 2 \n", + " url bedrooms \\\n", + "0 https://www.rightmove.co.uk/properties/102360773 1 \n", + "1 https://www.rightmove.co.uk/properties/105836849 3 \n", + "2 https://www.rightmove.co.uk/properties/107233214 3 \n", + "3 https://www.rightmove.co.uk/properties/107976896 3 \n", + "4 https://www.rightmove.co.uk/properties/115499441 3 \n", + "... ... ... \n", + "2129 https://www.rightmove.co.uk/properties/86813508 3 \n", + "2130 https://www.rightmove.co.uk/properties/86813523 3 \n", + "2131 https://www.rightmove.co.uk/properties/86814669 3 \n", + "2132 https://www.rightmove.co.uk/properties/86955958 3 \n", + "2133 https://www.rightmove.co.uk/properties/86972726 2 \n", "\n", - "[1026 rows x 5 columns]" + " travel_time_fastest \\\n", + "0 {'duration': 2695, 'distance': 6467, 'duration... \n", + "1 {'duration': 2565, 'distance': 14070, 'duratio... \n", + "2 {'duration': 1714, 'distance': 9570, 'duration... \n", + "3 {'duration': 1862, 'distance': 8278, 'duration... \n", + "4 {'duration': 2943, 'distance': 7437, 'duration... \n", + "... ... \n", + "2129 {'duration': 2400, 'distance': 13983, 'duratio... \n", + "2130 {'duration': 2400, 'distance': 13983, 'duratio... \n", + "2131 {'duration': 2310, 'distance': 12972, 'duratio... \n", + "2132 {'duration': 2332, 'distance': 6898, 'duration... \n", + "2133 {'duration': 1393, 'distance': 6390, 'duration... \n", + "\n", + " travel_time_second lease_left \\\n", + "0 {'duration': 1682, 'distance': 6810, 'duration... 119.0 \n", + "1 {'duration': 2565, 'distance': 14070, 'duratio... NaN \n", + "2 {'duration': 1774, 'distance': 9570, 'duration... 91.0 \n", + "3 {'duration': 1862, 'distance': 8278, 'duration... NaN \n", + "4 {'duration': 2167, 'distance': 9920, 'duration... NaN \n", + "... ... ... \n", + "2129 {'duration': 2605, 'distance': 14702, 'duratio... NaN \n", + "2130 {'duration': 2605, 'distance': 14702, 'duratio... NaN \n", + "2131 {'duration': 2322, 'distance': 12104, 'duratio... 0.0 \n", + "2132 {'duration': 2248, 'distance': 6893, 'duration... 105.0 \n", + "2133 {'duration': 2733, 'distance': 6490, 'duration... 993.0 \n", + "\n", + " development \n", + "0 False \n", + "1 False \n", + "2 False \n", + "3 False \n", + "4 False \n", + "... ... \n", + "2129 True \n", + "2130 True \n", + "2131 False \n", + "2132 False \n", + "2133 False \n", + "\n", + "[2134 rows x 9 columns]" ] }, "execution_count": 4, @@ -208,6 +295,744 @@ "df" ] }, + { + "cell_type": "code", + "execution_count": 14, + "id": "387c48d9-26c6-4bed-8201-352735c06acb", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "0 1682.0\n", + "1 2565.0\n", + "2 1714.0\n", + "3 1862.0\n", + "4 2167.0\n", + " ... \n", + "2129 2400.0\n", + "2130 2400.0\n", + "2131 2310.0\n", + "2132 2248.0\n", + "2133 1393.0\n", + "Length: 2134, dtype: float64" + ] + }, + "execution_count": 14, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [] + }, + { + "cell_type": "code", + "execution_count": 19, + "id": "7b37ad6b-9b0a-444e-b8c3-6fe4e43e42cb", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "| \n", + " | sqm_ocr | \n", + "price | \n", + "price_per_sqm | \n", + "url | \n", + "bedrooms | \n", + "lease_left | \n", + "development | \n", + "a_duration | \n", + "a_duration_per_transit | \n", + "a_number_of_transit_stops | \n", + "b_duration | \n", + "b_duration_per_transit | \n", + "b_number_of_transit_stops | \n", + "min_duration | \n", + "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", + "7.81 | \n", + "350000.0 | \n", + "44814.340589 | \n", + "https://www.rightmove.co.uk/properties/102360773 | \n", + "1 | \n", + "119.0 | \n", + "False | \n", + "2695 | \n", + "{'WALK': 414, 'TRANSIT': 2280} | \n", + "1 | \n", + "1682.0 | \n", + "{'WALK': 608, 'TRANSIT': 804} | \n", + "2.0 | \n", + "28.0 | \n", + "
| 1 | \n", + "NaN | \n", + "400000.0 | \n", + "NaN | \n", + "https://www.rightmove.co.uk/properties/105836849 | \n", + "3 | \n", + "NaN | \n", + "False | \n", + "2565 | \n", + "{'WALK': 750, 'TRANSIT': 1800} | \n", + "1 | \n", + "2565.0 | \n", + "{'WALK': 750, 'TRANSIT': 1800} | \n", + "1.0 | \n", + "43.0 | \n", + "
| 2 | \n", + "76.91 | \n", + "400000.0 | \n", + "5200.884150 | \n", + "https://www.rightmove.co.uk/properties/107233214 | \n", + "3 | \n", + "91.0 | \n", + "False | \n", + "1714 | \n", + "{'WALK': 903, 'TRANSIT': 780} | \n", + "1 | \n", + "1774.0 | \n", + "{'WALK': 903, 'TRANSIT': 840} | \n", + "1.0 | \n", + "29.0 | \n", + "
| 3 | \n", + "112.40 | \n", + "800000.0 | \n", + "7117.437722 | \n", + "https://www.rightmove.co.uk/properties/107976896 | \n", + "3 | \n", + "NaN | \n", + "False | \n", + "1862 | \n", + "{'WALK': 635, 'TRANSIT': 900} | \n", + "2 | \n", + "1862.0 | \n", + "{'WALK': 635, 'TRANSIT': 960} | \n", + "2.0 | \n", + "31.0 | \n", + "
| 4 | \n", + "115.60 | \n", + "775000.0 | \n", + "6704.152249 | \n", + "https://www.rightmove.co.uk/properties/115499441 | \n", + "3 | \n", + "NaN | \n", + "False | \n", + "2943 | \n", + "{'WALK': 242, 'TRANSIT': 2700} | \n", + "1 | \n", + "2167.0 | \n", + "{'WALK': 658, 'TRANSIT': 1200} | \n", + "2.0 | \n", + "36.0 | \n", + "
| ... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
| 2129 | \n", + "NaN | \n", + "750000.0 | \n", + "NaN | \n", + "https://www.rightmove.co.uk/properties/86813508 | \n", + "3 | \n", + "NaN | \n", + "True | \n", + "2400 | \n", + "{'WALK': 603, 'TRANSIT': 1524} | \n", + "2 | \n", + "2605.0 | \n", + "{'WALK': 1467, 'TRANSIT': 1132} | \n", + "1.0 | \n", + "40.0 | \n", + "
| 2130 | \n", + "NaN | \n", + "655000.0 | \n", + "NaN | \n", + "https://www.rightmove.co.uk/properties/86813523 | \n", + "3 | \n", + "NaN | \n", + "True | \n", + "2400 | \n", + "{'WALK': 603, 'TRANSIT': 1524} | \n", + "2 | \n", + "2605.0 | \n", + "{'WALK': 1467, 'TRANSIT': 1132} | \n", + "1.0 | \n", + "40.0 | \n", + "
| 2131 | \n", + "82.80 | \n", + "550000.0 | \n", + "6642.512077 | \n", + "https://www.rightmove.co.uk/properties/86814669 | \n", + "3 | \n", + "0.0 | \n", + "False | \n", + "2310 | \n", + "{'WALK': 786, 'TRANSIT': 1277} | \n", + "2 | \n", + "2322.0 | \n", + "{'WALK': 991, 'TRANSIT': 1080} | \n", + "2.0 | \n", + "38.0 | \n", + "
| 2132 | \n", + "5.52 | \n", + "300000.0 | \n", + "54347.826087 | \n", + "https://www.rightmove.co.uk/properties/86955958 | \n", + "3 | \n", + "105.0 | \n", + "False | \n", + "2332 | \n", + "{'WALK': 1671, 'TRANSIT': 660} | \n", + "1 | \n", + "2248.0 | \n", + "{'WALK': 1671, 'TRANSIT': 576} | \n", + "1.0 | \n", + "37.0 | \n", + "
| 2133 | \n", + "81.60 | \n", + "790000.0 | \n", + "9681.372549 | \n", + "https://www.rightmove.co.uk/properties/86972726 | \n", + "2 | \n", + "993.0 | \n", + "False | \n", + "1393 | \n", + "{'WALK': 518, 'TRANSIT': 564} | \n", + "2 | \n", + "2733.0 | \n", + "{'WALK': 451, 'TRANSIT': 2280} | \n", + "1.0 | \n", + "23.0 | \n", + "
2134 rows × 14 columns
\n", + "| \n", + " | sqm_ocr | \n", + "price | \n", + "price_per_sqm | \n", + "url | \n", + "bedrooms | \n", + "duration | \n", + "distance | \n", + "duration_static | \n", + "duration_per_transit | \n", + "distance_per_transit | \n", + "number_of_transit_stops | \n", + "duration | \n", + "distance | \n", + "duration_static | \n", + "duration_per_transit | \n", + "distance_per_transit | \n", + "number_of_transit_stops | \n", + "
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 0 | \n", + "7.81 | \n", + "350000.0 | \n", + "44814.340589 | \n", + "https://www.rightmove.co.uk/properties/102360773 | \n", + "1 | \n", + "2695 | \n", + "6467 | \n", + "2695 | \n", + "{'WALK': 414, 'TRANSIT': 2280} | \n", + "{'WALK': 465, 'TRANSIT': 6002} | \n", + "1 | \n", + "1682.0 | \n", + "6810.0 | \n", + "1682.0 | \n", + "{'WALK': 608, 'TRANSIT': 804} | \n", + "{'WALK': 582, 'TRANSIT': 6228} | \n", + "2.0 | \n", + "
| 1 | \n", + "NaN | \n", + "400000.0 | \n", + "NaN | \n", + "https://www.rightmove.co.uk/properties/105836849 | \n", + "3 | \n", + "2565 | \n", + "14070 | \n", + "2565 | \n", + "{'WALK': 750, 'TRANSIT': 1800} | \n", + "{'WALK': 856, 'TRANSIT': 13214} | \n", + "1 | \n", + "2565.0 | \n", + "14070.0 | \n", + "2565.0 | \n", + "{'WALK': 750, 'TRANSIT': 1800} | \n", + "{'WALK': 856, 'TRANSIT': 13214} | \n", + "1.0 | \n", + "
| 2 | \n", + "76.91 | \n", + "400000.0 | \n", + "5200.884150 | \n", + "https://www.rightmove.co.uk/properties/107233214 | \n", + "3 | \n", + "1714 | \n", + "9570 | \n", + "1714 | \n", + "{'WALK': 903, 'TRANSIT': 780} | \n", + "{'WALK': 1035, 'TRANSIT': 8535} | \n", + "1 | \n", + "1774.0 | \n", + "9570.0 | \n", + "1774.0 | \n", + "{'WALK': 903, 'TRANSIT': 840} | \n", + "{'WALK': 1035, 'TRANSIT': 8535} | \n", + "1.0 | \n", + "
| 3 | \n", + "112.40 | \n", + "800000.0 | \n", + "7117.437722 | \n", + "https://www.rightmove.co.uk/properties/107976896 | \n", + "3 | \n", + "1862 | \n", + "8278 | \n", + "1862 | \n", + "{'WALK': 635, 'TRANSIT': 900} | \n", + "{'WALK': 710, 'TRANSIT': 7568} | \n", + "2 | \n", + "1862.0 | \n", + "8278.0 | \n", + "1862.0 | \n", + "{'WALK': 635, 'TRANSIT': 960} | \n", + "{'WALK': 710, 'TRANSIT': 7568} | \n", + "2.0 | \n", + "
| 4 | \n", + "115.60 | \n", + "775000.0 | \n", + "6704.152249 | \n", + "https://www.rightmove.co.uk/properties/115499441 | \n", + "3 | \n", + "2943 | \n", + "7437 | \n", + "2943 | \n", + "{'WALK': 242, 'TRANSIT': 2700} | \n", + "{'WALK': 276, 'TRANSIT': 7161} | \n", + "1 | \n", + "2167.0 | \n", + "9920.0 | \n", + "2167.0 | \n", + "{'WALK': 658, 'TRANSIT': 1200} | \n", + "{'WALK': 720, 'TRANSIT': 9200} | \n", + "2.0 | \n", + "
| ... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
| 2046 | \n", + "NaN | \n", + "750000.0 | \n", + "NaN | \n", + "https://www.rightmove.co.uk/properties/86813508 | \n", + "3 | \n", + "2400 | \n", + "13983 | \n", + "2400 | \n", + "{'WALK': 603, 'TRANSIT': 1524} | \n", + "{'WALK': 671, 'TRANSIT': 13312} | \n", + "2 | \n", + "2605.0 | \n", + "14702.0 | \n", + "2605.0 | \n", + "{'WALK': 1467, 'TRANSIT': 1132} | \n", + "{'WALK': 1698, 'TRANSIT': 13004} | \n", + "1.0 | \n", + "
| 2047 | \n", + "NaN | \n", + "655000.0 | \n", + "NaN | \n", + "https://www.rightmove.co.uk/properties/86813523 | \n", + "3 | \n", + "2400 | \n", + "13983 | \n", + "2400 | \n", + "{'WALK': 603, 'TRANSIT': 1524} | \n", + "{'WALK': 671, 'TRANSIT': 13312} | \n", + "2 | \n", + "2605.0 | \n", + "14702.0 | \n", + "2605.0 | \n", + "{'WALK': 1467, 'TRANSIT': 1132} | \n", + "{'WALK': 1698, 'TRANSIT': 13004} | \n", + "1.0 | \n", + "
| 2048 | \n", + "82.80 | \n", + "550000.0 | \n", + "6642.512077 | \n", + "https://www.rightmove.co.uk/properties/86814669 | \n", + "3 | \n", + "2310 | \n", + "12972 | \n", + "2310 | \n", + "{'WALK': 786, 'TRANSIT': 1277} | \n", + "{'WALK': 885, 'TRANSIT': 12087} | \n", + "2 | \n", + "2322.0 | \n", + "12104.0 | \n", + "2322.0 | \n", + "{'WALK': 991, 'TRANSIT': 1080} | \n", + "{'WALK': 1089, 'TRANSIT': 11015} | \n", + "2.0 | \n", + "
| 2049 | \n", + "5.52 | \n", + "300000.0 | \n", + "54347.826087 | \n", + "https://www.rightmove.co.uk/properties/86955958 | \n", + "3 | \n", + "2332 | \n", + "6898 | \n", + "2332 | \n", + "{'WALK': 1671, 'TRANSIT': 660} | \n", + "{'WALK': 1945, 'TRANSIT': 4953} | \n", + "1 | \n", + "2248.0 | \n", + "6893.0 | \n", + "2248.0 | \n", + "{'WALK': 1671, 'TRANSIT': 576} | \n", + "{'WALK': 1945, 'TRANSIT': 4948} | \n", + "1.0 | \n", + "
| 2050 | \n", + "81.60 | \n", + "790000.0 | \n", + "9681.372549 | \n", + "https://www.rightmove.co.uk/properties/86972726 | \n", + "2 | \n", + "1393 | \n", + "6390 | \n", + "1393 | \n", + "{'WALK': 518, 'TRANSIT': 564} | \n", + "{'WALK': 441, 'TRANSIT': 5949} | \n", + "2 | \n", + "2733.0 | \n", + "6490.0 | \n", + "2733.0 | \n", + "{'WALK': 451, 'TRANSIT': 2280} | \n", + "{'WALK': 488, 'TRANSIT': 6002} | \n", + "1.0 | \n", + "
2051 rows × 17 columns
\n", + "