|
43 | 43 | "outputs": [],
|
44 | 44 | "source": [
|
45 | 45 | "def read_detector_POI_join_file(detector_POI_join_shp):\n",
|
46 |
| - " detector_POI_join = gpd.read_file(\"../20211028_SCOOT_Data/SCOOT_data_points-shp/Spatial Join/\" + detector_POI_join_shp + \".shp\")\n", |
| 46 | + " detector_POI_join = gpd.read_file(\"../data/independent_variables/POI/\" + detector_POI_join_shp + \".shp\")\n", |
47 | 47 | " \n",
|
48 | 48 | " return detector_POI_join"
|
49 | 49 | ]
|
|
136 | 136 | "## 2. Implement"
|
137 | 137 | ]
|
138 | 138 | },
|
| 139 | + { |
| 140 | + "cell_type": "markdown", |
| 141 | + "metadata": {}, |
| 142 | + "source": [ |
| 143 | + "### Unzip the file" |
| 144 | + ] |
| 145 | + }, |
| 146 | + { |
| 147 | + "cell_type": "code", |
| 148 | + "execution_count": 2, |
| 149 | + "metadata": {}, |
| 150 | + "outputs": [], |
| 151 | + "source": [ |
| 152 | + "import zipfile\n", |
| 153 | + "import os" |
| 154 | + ] |
| 155 | + }, |
| 156 | + { |
| 157 | + "cell_type": "code", |
| 158 | + "execution_count": 3, |
| 159 | + "metadata": {}, |
| 160 | + "outputs": [], |
| 161 | + "source": [ |
| 162 | + "zip_file_path = '../data/independent_variables/POI.zip'\n", |
| 163 | + "extract_dir = '../data/independent_variables/'\n", |
| 164 | + "\n", |
| 165 | + "os.makedirs(extract_dir, exist_ok=True)\n", |
| 166 | + "\n", |
| 167 | + "# Unzip the file\n", |
| 168 | + "with zipfile.ZipFile(zip_file_path, 'r') as zip_ref:\n", |
| 169 | + " zip_ref.extractall(extract_dir)" |
| 170 | + ] |
| 171 | + }, |
139 | 172 | {
|
140 | 173 | "cell_type": "markdown",
|
141 | 174 | "metadata": {},
|
|
165 | 198 | "all_POI.insert(loc=0, column='siteId', value=site_list)\n",
|
166 | 199 | "all_POI\n",
|
167 | 200 | "\n",
|
168 |
| - "#all_POI.to_csv('all_buffer_POI_percent.csv', index = False)" |
| 201 | + "all_POI.to_csv('../data/independent_variables/POI/all_buffer_POI_percent.csv', index = False)" |
169 | 202 | ]
|
170 | 203 | },
|
171 | 204 | {
|
|
215 | 248 | "outputs": [],
|
216 | 249 | "source": [
|
217 | 250 | "def read_landcover_intersect_file(buffer_landcover_intersect_csv):\n",
|
218 |
| - " landcover_intersect = gpd.read_file(\"../20211028_SCOOT_Data/SCOOT_data_points-shp/Spatial Join/\" + buffer_landcover_intersect_csv + \".csv\")\n", |
| 251 | + " landcover_intersect = gpd.read_file(\"../data/independent_variables/landcover/\" + buffer_landcover_intersect_csv + \".csv\")\n", |
219 | 252 | " \n",
|
220 | 253 | " return landcover_intersect"
|
221 | 254 | ]
|
|
272 | 305 | "source": [
|
273 | 306 | "def merge_landcover_class(df_landcover_percent):\n",
|
274 | 307 | "\n",
|
275 |
| - " Landcover_osgb = gpd.read_file(\"Land_cover_shp/land_cover_osgb36.shp\")\n", |
| 308 | + " Landcover_osgb = gpd.read_file(\"../data/independent_variables/landcover/land_cover_osgb36.shp\")\n", |
276 | 309 | " landcover_class = sorted(list(set(Landcover_osgb.class_2018)))\n",
|
277 | 310 | "\n",
|
278 | 311 | " urban_residential_area = [landcover_class[2],landcover_class[3], landcover_class[4], landcover_class[5], landcover_class[6], landcover_class[12]]\n",
|
|
349 | 382 | " return landcover_sta"
|
350 | 383 | ]
|
351 | 384 | },
|
| 385 | + { |
| 386 | + "cell_type": "markdown", |
| 387 | + "metadata": {}, |
| 388 | + "source": [ |
| 389 | + "### Unzip the file" |
| 390 | + ] |
| 391 | + }, |
| 392 | + { |
| 393 | + "cell_type": "code", |
| 394 | + "execution_count": 4, |
| 395 | + "metadata": {}, |
| 396 | + "outputs": [], |
| 397 | + "source": [ |
| 398 | + "zip_file_path = '../data/independent_variables/landcover.zip'\n", |
| 399 | + "extract_dir = '../data/independent_variables/'\n", |
| 400 | + "\n", |
| 401 | + "os.makedirs(extract_dir, exist_ok=True)\n", |
| 402 | + "\n", |
| 403 | + "# Unzip the file\n", |
| 404 | + "with zipfile.ZipFile(zip_file_path, 'r') as zip_ref:\n", |
| 405 | + " zip_ref.extractall(extract_dir)" |
| 406 | + ] |
| 407 | + }, |
352 | 408 | {
|
353 | 409 | "cell_type": "markdown",
|
354 | 410 | "metadata": {},
|
|
386 | 442 | "all_landcover.insert(loc=0, column='siteId', value=site_list)\n",
|
387 | 443 | "all_landcover\n",
|
388 | 444 | "\n",
|
389 |
| - "#all_landcover.to_csv('all_buffer_landcover_percent_new.csv', index = False)" |
| 445 | + "all_landcover.to_csv('../data/independent_variables/landcover/all_buffer_landcover_percent_new.csv', index = False)" |
390 | 446 | ]
|
391 | 447 | },
|
392 | 448 | {
|
|
437 | 493 | "outputs": [],
|
438 | 494 | "source": [
|
439 | 495 | "def read_road_intersect_file(buffer_road_intersect_csv):\n",
|
440 |
| - " road_link_intersect = gpd.read_file(\"../20211028_SCOOT_Data/SCOOT_data_points-shp/Spatial Join/\" + buffer_road_intersect_csv + \".csv\")\n", |
| 496 | + " road_link_intersect = gpd.read_file(\"../data/independent_variables/road_link/\" + buffer_road_intersect_csv + \".csv\")\n", |
441 | 497 | " return road_link_intersect"
|
442 | 498 | ]
|
443 | 499 | },
|
|
506 | 562 | " return road_sta"
|
507 | 563 | ]
|
508 | 564 | },
|
| 565 | + { |
| 566 | + "cell_type": "markdown", |
| 567 | + "metadata": {}, |
| 568 | + "source": [ |
| 569 | + "### Unzip the file" |
| 570 | + ] |
| 571 | + }, |
| 572 | + { |
| 573 | + "cell_type": "code", |
| 574 | + "execution_count": 5, |
| 575 | + "metadata": {}, |
| 576 | + "outputs": [], |
| 577 | + "source": [ |
| 578 | + "zip_file_path = '../data/independent_variables/road_link.zip'\n", |
| 579 | + "extract_dir = '../data/independent_variables/'\n", |
| 580 | + "\n", |
| 581 | + "os.makedirs(extract_dir, exist_ok=True)\n", |
| 582 | + "\n", |
| 583 | + "# Unzip the file\n", |
| 584 | + "with zipfile.ZipFile(zip_file_path, 'r') as zip_ref:\n", |
| 585 | + " zip_ref.extractall(extract_dir)" |
| 586 | + ] |
| 587 | + }, |
509 | 588 | {
|
510 | 589 | "cell_type": "markdown",
|
511 | 590 | "metadata": {},
|
|
541 | 620 | "all_road.insert(loc=0, column='siteId', value=site_list)\n",
|
542 | 621 | "all_road\n",
|
543 | 622 | "\n",
|
544 |
| - "#all_road.to_csv('all_buffer_road_percent.csv', index = False)" |
| 623 | + "all_road.to_csv('../data/independent_variables/road_link/all_buffer_road_percent.csv', index = False)" |
545 | 624 | ]
|
546 | 625 | },
|
547 | 626 | {
|
|
670 | 749 | "outputs": [],
|
671 | 750 | "source": [
|
672 | 751 | "def read_OA_intersect_file(buffer_OA_intersect_csv):\n",
|
673 |
| - " OA_link_intersect = gpd.read_file(\"../20211028_SCOOT_Data/SCOOT_data_points-shp/Spatial Join/\" + buffer_OA_intersect_csv + \".csv\")\n", |
| 752 | + " OA_link_intersect = gpd.read_file(\"../data/independent_variables/census/\" + buffer_OA_intersect_csv + \".csv\")\n", |
674 | 753 | " return OA_link_intersect"
|
675 | 754 | ]
|
676 | 755 | },
|
|
742 | 821 | " return census_sta"
|
743 | 822 | ]
|
744 | 823 | },
|
| 824 | + { |
| 825 | + "cell_type": "markdown", |
| 826 | + "metadata": {}, |
| 827 | + "source": [ |
| 828 | + "### Unzip the file" |
| 829 | + ] |
| 830 | + }, |
| 831 | + { |
| 832 | + "cell_type": "code", |
| 833 | + "execution_count": 6, |
| 834 | + "metadata": {}, |
| 835 | + "outputs": [], |
| 836 | + "source": [ |
| 837 | + "zip_file_path = '../data/independent_variables/census.zip'\n", |
| 838 | + "extract_dir = '../data/independent_variables/'\n", |
| 839 | + "\n", |
| 840 | + "os.makedirs(extract_dir, exist_ok=True)\n", |
| 841 | + "\n", |
| 842 | + "# Unzip the file\n", |
| 843 | + "with zipfile.ZipFile(zip_file_path, 'r') as zip_ref:\n", |
| 844 | + " zip_ref.extractall(extract_dir)" |
| 845 | + ] |
| 846 | + }, |
745 | 847 | {
|
746 | 848 | "cell_type": "markdown",
|
747 | 849 | "metadata": {},
|
|
765 | 867 | "doc_list = ['100', '200', '300', '400']\n",
|
766 | 868 | "df_list = []\n",
|
767 | 869 | "\n",
|
768 |
| - "all_census_csv = reconstruct_census_csv('census2011_csv/useful_data/')\n", |
| 870 | + "all_census_csv = reconstruct_census_csv('../data/independent_variables/census/useful_data/')\n", |
769 | 871 | "useful_census_csv_area = get_useful_census(all_census_csv)\n",
|
770 | 872 | "\n",
|
771 | 873 | "for doc in doc_list:\n",
|
|
781 | 883 | "all_census.insert(loc=0, column='siteId', value=site_list)\n",
|
782 | 884 | "all_census\n",
|
783 | 885 | "\n",
|
784 |
| - "#all_census.to_csv('all_buffer_census_percent.csv', index = False)" |
| 886 | + "all_census.to_csv('../data/independent_variables/census/all_buffer_census_percent.csv', index = False)" |
785 | 887 | ]
|
786 | 888 | },
|
787 | 889 | {
|
|
812 | 914 | ],
|
813 | 915 | "metadata": {
|
814 | 916 | "kernelspec": {
|
815 |
| - "display_name": "Python 3", |
| 917 | + "display_name": "Python 3 (ipykernel)", |
816 | 918 | "language": "python",
|
817 | 919 | "name": "python3"
|
818 | 920 | },
|
|
826 | 928 | "name": "python",
|
827 | 929 | "nbconvert_exporter": "python",
|
828 | 930 | "pygments_lexer": "ipython3",
|
829 |
| - "version": "3.7.0" |
| 931 | + "version": "3.11.5" |
830 | 932 | }
|
831 | 933 | },
|
832 | 934 | "nbformat": 4,
|
|
0 commit comments