|
44 | 44 | }, |
45 | 45 | { |
46 | 46 | "cell_type": "code", |
47 | | - "execution_count": 5, |
| 47 | + "execution_count": null, |
48 | 48 | "id": "cell-3", |
49 | 49 | "metadata": { |
50 | 50 | "id": "cell-3" |
|
81 | 81 | }, |
82 | 82 | { |
83 | 83 | "cell_type": "code", |
84 | | - "execution_count": 6, |
| 84 | + "execution_count": null, |
85 | 85 | "id": "cell-5", |
86 | 86 | "metadata": { |
87 | 87 | "colab": { |
|
155 | 155 | }, |
156 | 156 | { |
157 | 157 | "cell_type": "code", |
158 | | - "execution_count": 7, |
| 158 | + "execution_count": null, |
159 | 159 | "id": "cell-8", |
160 | 160 | "metadata": { |
161 | 161 | "colab": { |
|
334 | 334 | }, |
335 | 335 | { |
336 | 336 | "cell_type": "code", |
337 | | - "execution_count": 8, |
| 337 | + "execution_count": null, |
338 | 338 | "id": "3981b6fb", |
339 | 339 | "metadata": { |
340 | 340 | "id": "3981b6fb" |
|
347 | 347 | }, |
348 | 348 | { |
349 | 349 | "cell_type": "code", |
350 | | - "execution_count": 9, |
| 350 | + "execution_count": null, |
351 | 351 | "id": "c9fczvktoyq", |
352 | 352 | "metadata": { |
353 | 353 | "colab": { |
|
394 | 394 | }, |
395 | 395 | { |
396 | 396 | "cell_type": "code", |
397 | | - "execution_count": 10, |
| 397 | + "execution_count": null, |
398 | 398 | "id": "o8froym44w", |
399 | 399 | "metadata": { |
400 | 400 | "colab": { |
|
450 | 450 | }, |
451 | 451 | { |
452 | 452 | "cell_type": "code", |
453 | | - "execution_count": 12, |
| 453 | + "execution_count": null, |
454 | 454 | "id": "cell-12", |
455 | 455 | "metadata": { |
456 | 456 | "colab": { |
|
670 | 670 | }, |
671 | 671 | { |
672 | 672 | "cell_type": "code", |
673 | | - "execution_count": 13, |
| 673 | + "execution_count": null, |
674 | 674 | "id": "14e27496", |
675 | 675 | "metadata": { |
676 | 676 | "colab": { |
|
881 | 881 | }, |
882 | 882 | { |
883 | 883 | "cell_type": "code", |
884 | | - "execution_count": 14, |
| 884 | + "execution_count": null, |
885 | 885 | "id": "78efc197", |
886 | 886 | "metadata": { |
887 | 887 | "colab": { |
|
915 | 915 | "source": [ |
916 | 916 | "## Duplicate Flood Event Detection\n", |
917 | 917 | "\n", |
918 | | - "One of the problems with the dataset is the presence of many duplicate records for the same flood event. While Google did perform some spatio-temporal aggregation, the dataset still has overlapping records from the same flood event that have different geographic extent (captured from different articles) and/or slightly varying dates. Our goal is to count the total unique flood events aggregated for each grid. Such duplicates would show up as spatially intersecting polygons with `start_date` values within a few days of each other. We use a vectorized `STRtree` bulk query to find all such candidate pairs efficiently." |
| 918 | + "One of the problems with aggregating this dataset over a grid is the presence of overlapping polygons for the same flood event. While Google did perform some spatio-temporal aggregation, the dataset still has overlapping records from the same flood event that have different geographic extents and slightly varying dates (one article may describe flooding across a city while another describes the same flood in a single neighborhood). Our goal is to count the total unique flood events aggregated for each grid, so each flood event must be counted only once. We apply a pre-processing step that finds all pairs of spatially intersecting polygons with `start_date` values within a few days of each other and assigns them the same `flood_event` id." |
919 | 919 | ] |
920 | 920 | }, |
921 | 921 | { |
|
980 | 980 | "outputId": "af1ac87d-96ca-4c43-9287-bab18c0be48c" |
981 | 981 | }, |
982 | 982 | "id": "6cjv4TsaBl_K", |
983 | | - "execution_count": 24, |
| 983 | + "execution_count": null, |
984 | 984 | "outputs": [ |
985 | 985 | { |
986 | 986 | "output_type": "stream", |
|
1187 | 1187 | }, |
1188 | 1188 | { |
1189 | 1189 | "cell_type": "code", |
1190 | | - "execution_count": 25, |
| 1190 | + "execution_count": null, |
1191 | 1191 | "id": "mqi2zhq5h4", |
1192 | 1192 | "metadata": { |
1193 | 1193 | "colab": { |
|
1227 | 1227 | }, |
1228 | 1228 | { |
1229 | 1229 | "cell_type": "code", |
1230 | | - "execution_count": 31, |
| 1230 | + "execution_count": null, |
1231 | 1231 | "id": "d89e6286", |
1232 | 1232 | "metadata": { |
1233 | 1233 | "colab": { |
|
1486 | 1486 | }, |
1487 | 1487 | { |
1488 | 1488 | "cell_type": "code", |
1489 | | - "execution_count": 32, |
| 1489 | + "execution_count": null, |
1490 | 1490 | "id": "76c29140", |
1491 | 1491 | "metadata": { |
1492 | 1492 | "id": "76c29140" |
|
1508 | 1508 | }, |
1509 | 1509 | { |
1510 | 1510 | "cell_type": "code", |
1511 | | - "execution_count": 33, |
| 1511 | + "execution_count": null, |
1512 | 1512 | "id": "86dbb465", |
1513 | 1513 | "metadata": { |
1514 | 1514 | "id": "86dbb465" |
|
1531 | 1531 | }, |
1532 | 1532 | { |
1533 | 1533 | "cell_type": "code", |
1534 | | - "execution_count": 34, |
| 1534 | + "execution_count": null, |
1535 | 1535 | "id": "2f8f25dc", |
1536 | 1536 | "metadata": { |
1537 | 1537 | "colab": { |
|
1709 | 1709 | }, |
1710 | 1710 | { |
1711 | 1711 | "cell_type": "code", |
1712 | | - "execution_count": 41, |
| 1712 | + "execution_count": null, |
1713 | 1713 | "id": "9fcba691", |
1714 | 1714 | "metadata": { |
1715 | 1715 | "colab": { |
|
1782 | 1782 | }, |
1783 | 1783 | { |
1784 | 1784 | "cell_type": "code", |
1785 | | - "execution_count": 37, |
| 1785 | + "execution_count": null, |
1786 | 1786 | "id": "2f53ca54", |
1787 | 1787 | "metadata": { |
1788 | 1788 | "id": "2f53ca54" |
|
0 commit comments