# Import modules, define directories

from pyhere import here
import pandas as pd
import geopandas as gpd
import folium
import matplotlib
import numpy as np
import rasterio
from rasterio.plot import show
import fiona
from rasterstats import zonal_stats
from matplotlib import pyplot as plt



# Shortcut keys for the project's data and results directories.
# Each entry is resolved through `here`, so the same keys work wherever the
# project is checked out.
path = {
    key: here(*parts)
    for key, parts in (
        ("dscr", ("data", "scratch")),
        ("drpub", ("data", "raw", "public")),
        ("drpriv", ("data", "raw", "private")),
        ("ddpub", ("data", "derived", "public")),
        ("ddpriv", ("data", "derived", "private")),
        ("rfig", ("results", "figures")),
        ("roth", ("results", "other")),
        ("rtab", ("results", "tables")),
        ("dmet", ("data", "metadata")),
    )
}

# Block-group polygons. `gpd.read_file` already returns a GeoDataFrame, so no
# re-wrapping is needed.
blockgroups = gpd.read_file(here(path["drpub"], "blockgroups.shp"))

blockgroups.head()

# Every CSV column is read as a string (dtype=str); the population counts are
# converted to numbers later, once the unused columns have been dropped.
blockgroup_demographic_data = pd.read_csv(
    here(path["drpub"], 'blockgroup_demographic_data.csv'),
    dtype=str,
    encoding='latin-1',
)

blockgroup_demographic_data.head()

# Preview band 1 of the flood raster. The dataset is opened in a context
# manager so the file handle is released as soon as the preview is drawn;
# later steps re-open the raster by path.
with rasterio.open(here(path["drpub"], 'actual_flood_10.tif')) as actual_flood_10:
    ax = show((actual_flood_10, 1))

# Left join keeps every block-group polygon even if it has no demographic row.
bg_merged = blockgroups.merge(blockgroup_demographic_data, on="GEOID", how="left")

bgData = gpd.GeoDataFrame(bg_merged)

# Give the ACS B03002 count columns used in the analysis readable names.
bgData = bgData.rename(
    columns={
        'B03002_001': 'Total',
        'B03002_003': 'White',
        'B03002_004': 'Black',
        'B03002_006': 'Asian',
        'B03002_012': 'Latinx',
    }
)

# Remove identifier/area fields and the B03002 columns that are not analysed.
unused_columns = [
    'STATEFP', 'COUNTYFP', 'TRACTCE', 'BLKGRPCE', 'AFFGEOID',
    'LSAD', 'ALAND', 'AWATER', 'GEONAME',
    'B03002_002', 'B03002_005', 'B03002_007', 'B03002_008',
    'B03002_009', 'B03002_010', 'B03002_011', 'B03002_013',
    'B03002_014', 'B03002_015', 'B03002_016', 'B03002_017',
    'B03002_018', 'B03002_019', 'B03002_020', 'B03002_021',
]
bgData = bgData.drop(columns=unused_columns)

# The counts were read from the CSV as strings; convert them to numbers.
for count_column in ['Total', 'White', 'Black', 'Asian', 'Latinx']:
    bgData[count_column] = pd.to_numeric(bgData[count_column])
print(bgData.dtypes)

GEOID         object
geometry    geometry
Total          int64
White          int64
Black          int64
Asian          int64
Latinx         int64
dtype: object

## Calculate each racial/ethnic group's share (in percent) of the block group's total population

percent_of_total = {
    'pctAsian': 'Asian',
    'pctBlack': 'Black',
    'pctLatinx': 'Latinx',
    'pctWhite': 'White',
}
for pct_column, count_column in percent_of_total.items():
    bgData[pct_column] = bgData[count_column].div(bgData['Total']).mul(100)

# Quick visual check of one of the new columns.
bgData.plot(column='pctLatinx', legend=True)

<Axes: >

## Create majority group field

def assign_major_group(row, threshold=60):
    """Return the majority-group label for one block-group row.

    Parameters
    ----------
    row : mapping-like
        Must provide 'pctAsian', 'pctBlack', 'pctLatinx' and 'pctWhite'
        (percent of total population). A pandas row or a plain dict works.
    threshold : float, optional
        Minimum percentage a group needs to be labelled the majority.
        Defaults to 60, the cut-off this analysis uses.

    Returns
    -------
    str
        'Asian', 'Black', 'Latinx' or 'White' for the first group (checked in
        that order) whose share is at least ``threshold``; 'Mixed' otherwise.
        Missing (NaN) shares never satisfy the comparison, so such rows fall
        through to 'Mixed'.
    """
    # Checked in a fixed order; with thresholds of 50 or below more than one
    # group could qualify, in which case the first one listed wins.
    for group in ('Asian', 'Black', 'Latinx', 'White'):
        if row['pct' + group] >= threshold:
            return group
    return 'Mixed'

# Label every block group (one call per row) with its majority group.
major_group_labels = bgData.apply(assign_major_group, axis=1)
bgData['majorGrp'] = major_group_labels

bgData.head(10)

## Group by majority groups and dissolve geometry

# Each block group contributes 1, so summing this column counts block groups.
bgData['blockGroups'] = 1

count_columns = ['blockGroups', 'Total', 'White', 'Black', 'Asian', 'Latinx']

# Non-spatial summary of the same totals per majority group.
group_sums = bgData.groupby('majorGrp')[count_columns].sum().reset_index()

# Dissolve only the geometry and the additive count columns.
# Summing the per-block-group percentage columns would give meaningless
# values (e.g. a "percentage" in the thousands), and summing string columns
# such as GEOID is what triggered the numeric_only FutureWarning.
geometry_column = bgData.geometry.name
dissolved = bgData[['majorGrp', geometry_column] + count_columns].dissolve(
    by='majorGrp', aggfunc='sum'
)

major_grps = gpd.GeoDataFrame(dissolved).rename(columns={'blockGroups': 'blockGrps'})

# Recompute each group's population share from the summed counts so the
# percentages describe the dissolved region as a whole.
major_grps['pctAsian'] = major_grps['Asian'] / major_grps['Total'] * 100
major_grps['pctBlack'] = major_grps['Black'] / major_grps['Total'] * 100
major_grps['pctLatinx'] = major_grps['Latinx'] / major_grps['Total'] * 100
major_grps['pctWhite'] = major_grps['White'] / major_grps['Total'] * 100

# Keep the column layout the downstream steps and exported files already use.
major_grps = major_grps[
    [
        geometry_column,
        'Total', 'White', 'Black', 'Asian', 'Latinx',
        'pctAsian', 'pctBlack', 'pctLatinx', 'pctWhite',
        'blockGrps',
    ]
]

major_grps.head()

/Users/colmanbashore/anaconda3/envs/flooding/lib/python3.9/site-packages/geopandas/geodataframe.py:1676: FutureWarning: The default value of numeric_only in DataFrameGroupBy.sum is deprecated. In a future version, numeric_only will default to False. Either specify numeric_only or select only columns which should be valid for the function.
  aggregated_data = data.groupby(**groupby_kwargs).agg(aggfunc)

# Zonal Statistics

# Filter out invalid geometries.
# NOTE(review): a majority group whose dissolved geometry is invalid is dropped
# entirely here and will be absent from every later table and map.
major_grps = major_grps[major_grps.geometry.is_valid]

# Write the dissolved regions to disk; both the zonal statistics and the
# result table below are read back from this one file, so row order matches.
major_grps_file = here(path["ddpub"], 'major_grps.shp')
major_grps.to_file(major_grps_file, driver='ESRI Shapefile')

# Specify the path to the raster file
raster_file = here(path["drpub"], 'actual_flood_10.tif')

# zonal_stats reads the raster from its path, so the band is not loaded into
# memory here. all_touched=True counts every pixel a polygon touches, not only
# pixels whose centre falls inside it.
with fiona.open(major_grps_file) as src:
    zs = zonal_stats(src, raster_file, stats="count", all_touched=True)

print(zs)

# One 'count' per zone, in feature order. Reading the key explicitly keeps the
# list aligned with the rows even if more statistics are requested later.
flood_pixels = [zone_stats['count'] for zone_stats in zs]

bgMajorFld = gpd.read_file(major_grps_file)

bgMajorFld['fl_count'] = flood_pixels

# Display the new pixel-count column
print(bgMajorFld['fl_count'])

/Users/colmanbashore/anaconda3/envs/flooding/lib/python3.9/site-packages/rasterstats/main.py:151: ShapelyDeprecationWarning: The 'type' attribute is deprecated, and will be removed in the future. You can use the 'geom_type' attribute instead.
  if 'Point' in geom.type:

[{'count': 2165}, {'count': 645888}, {'count': 3181885}, {'count': 11415356}, {'count': 4784908}]
0        2165
1      645888
2     3181885
3    11415356
4     4784908
Name: fl_count, dtype: int64

# Field Calculator Flooded Area
# Pixel count -> area. NOTE(review): assumes 10 x 10 map-unit pixels, as the
# raster file name suggests; confirm against the raster's resolution.
pixel_area = 10 * 10
bgMajorFld['flArea'] = bgMajorFld['fl_count'] * pixel_area
bgMajorFld['totArea'] = bgMajorFld.geometry.area.round(2)

flooded_share = bgMajorFld['flArea'] / bgMajorFld['totArea'] * 100
bgMajorFld['pctFlood'] = flooded_share.round(2)

bgMajorFld.head()

# Summary table for the results folder.
columns_to_export = ['majorGrp', 'blockGrps', 'flArea', 'totArea', 'pctFlood']
summary_csv = here(path["rtab"], 'MajGrpFld.csv')
bgMajorFld[columns_to_export].to_csv(summary_csv, index=False)

# Full attribute table (all columns) for the derived-data folder.
derived_csv = here(path["ddpub"], 'bgMajorFld.csv')
bgMajorFld.to_csv(derived_csv, index=False)

# Final Table
# Re-read the exported summary, with every column as a string, for display.
final_table_csv = here(path["rtab"], 'MajGrpFld.csv')
Final_Table = pd.read_csv(final_table_csv, dtype=str, encoding='latin-1')
Final_Table.head()

# Final Map
# Choropleth of percent flooded, classified with the Fisher-Jenks scheme.
Final_Map = bgMajorFld.plot(
    column='pctFlood',
    scheme='FisherJenks',
    cmap='Blues',
    legend=True,
)
print("Percent Flooded by Block Groups")

final_map_png = here(path["rfig"], 'bgMajorFld.png')
plt.savefig(final_map_png)

Percent Flooded by Block Groups

/Users/colmanbashore/anaconda3/envs/flooding/lib/python3.9/site-packages/mapclassify/classifiers.py:1860: UserWarning: Numba not installed. Using slow pure python version.
  warnings.warn(

# Map of Majority Groups
bgMajorFld.plot(column='majorGrp', legend=True)
plt.savefig(here(path["rfig"], 'majorGrps.png'))

# Map of Flooding Extent

# Read band 1 and close the dataset before plotting; only the array is needed.
with rasterio.open(here(path["drpub"], 'actual_flood_10.tif')) as src:
    raster_data = src.read(1)

# Draw the raster on its own figure. plt.imshow would otherwise reuse the
# current axes, which is the majority-group map above when this runs as a
# script or in the same cell.
fig, ax = plt.subplots()
ax.imshow(raster_data, cmap='Blues')
ax.set_title('Flooding Extent')

# Save the plot as a PNG file
fig.savefig(here(path["rfig"], 'actualFlood.png'))

# Show the plot (optional)
plt.show()

	STATEFP	COUNTYFP	TRACTCE	BLKGRPCE	AFFGEOID	GEOID	LSAD	ALAND	AWATER	GEONAME	geometry
0	48	201	311000	1	1500000US482013110001	482013110001	BG	616969.0	47009.0	Block Group 1, Census Tract 3110, Harris Count...	POLYGON ((958404.137 4217699.295, 958413.144 4...
1	48	201	311000	4	1500000US482013110004	482013110004	BG	408595.0	25333.0	Block Group 4, Census Tract 3110, Harris Count...	POLYGON ((957048.814 4217692.784, 957496.427 4...
2	48	201	311100	1	1500000US482013111001	482013111001	BG	1018525.0	213804.0	Block Group 1, Census Tract 3111, Harris Count...	POLYGON ((958975.179 4217311.881, 958892.738 4...
3	48	201	311100	3	1500000US482013111003	482013111003	BG	484061.0	36045.0	Block Group 3, Census Tract 3111, Harris Count...	POLYGON ((958773.280 4216120.376, 959779.865 4...
4	48	201	311100	4	1500000US482013111004	482013111004	BG	547376.0	0.0	Block Group 4, Census Tract 3111, Harris Count...	POLYGON ((958756.220 4216618.402, 959659.603 4...

Label	Alias	Definition	Type	Accuracy	Domain	Missing Data Value(s)	Missing Data Frequency
GEOID	GEOID	Unique identifier for each block group	Integer	N/A	482011000001 to 482019801001	N/A	None
B03002_001	Total Population	Number of people in the block group	Integer	See ACS	9-21758	N/A	None
B03002_003	White Population	Number of people in the White racial/ethnic group in the block group	Integer	See ACS	0-9199	N/A	None
B03002_004	Black Population	Number of people in the Black racial/ethnic group in the block group	Integer	See ACS	0-5258	N/A	None
B03002_006	Asian Population	Number of people in the Asian racial/ethnic group in the block group	Integer	See ACS	0-3418	N/A	None
B03002_012	Latinx Population	Number of people in the Latinx racial/ethnic group in the block group	Integer	See ACS	0-11408	N/A	None

	GEOID	B03002_001	B03002_002	B03002_003	B03002_004	B03002_006	...	B03002_012	B03002_013	B03002_014	B03002_015	B03002_018	B03002_019	B03002_020	B03002_021
0	482013110001	583	0	0	0	0	...	583	573	0	0	10	0	0	0
1	482013110004	1869	22	22	0	0	...	1847	1818	0	0	29	0	0	0
2	482013111001	1046	11	11	0	0	...	1035	895	4	0	136	0	0	0
3	482013111003	1639	112	112	0	0	...	1527	1192	0	0	315	20	0	20
4	482013111004	1759	48	0	16	32	...	1711	1476	11	7	173	44	44	0

	GEOID	geometry	Total	White	Black	Asian	Latinx	pctAsian	pctBlack	pctLatinx	pctWhite	majorGrp
0	482013110001	POLYGON ((958404.137 4217699.295, 958413.144 4...	583	0	0	0	583	0.000000	0.000000	100.000000	0.000000	Latinx
1	482013110004	POLYGON ((957048.814 4217692.784, 957496.427 4...	1869	22	0	0	1847	0.000000	0.000000	98.822900	1.177100	Latinx
2	482013111001	POLYGON ((958975.179 4217311.881, 958892.738 4...	1046	11	0	0	1035	0.000000	0.000000	98.948375	1.051625	Latinx
3	482013111003	POLYGON ((958773.280 4216120.376, 959779.865 4...	1639	112	0	0	1527	0.000000	0.000000	93.166565	6.833435	Latinx
4	482013111004	POLYGON ((958756.220 4216618.402, 959659.603 4...	1759	0	16	32	1711	1.819215	0.909608	97.271177	0.000000	Latinx
5	482013131001	POLYGON ((948490.088 4214006.390, 948838.150 4...	2744	1567	347	434	375	15.816327	12.645773	13.666181	57.106414	Mixed
6	482013111002	POLYGON ((958538.363 4215935.056, 958611.621 4...	1092	7	0	0	1085	0.000000	0.000000	99.358974	0.641026	Latinx
7	482013131002	POLYGON ((947852.561 4213019.383, 947966.900 4...	652	304	85	119	88	18.251534	13.036810	13.496933	46.625767	Mixed
8	482015431001	POLYGON ((896848.263 4250165.408, 897077.183 4...	3498	1442	322	19	1490	0.543168	9.205260	42.595769	41.223556	Mixed
9	482015502001	POLYGON ((943861.867 4241534.858, 944139.303 4...	2256	143	1368	0	745	0.000000	60.638298	33.023050	6.338652	Black

	geometry	Total	White	Black	Asian	Latinx	pctAsian	pctBlack	pctLatinx	pctWhite	blockGrps
majorGrp
Asian	MULTIPOLYGON (((926751.990 4209490.058, 926783...	3814	557	157	2431	637	192.226138	16.971301	47.205665	41.411103	3
Black	MULTIPOLYGON (((949698.842 4206031.461, 949639...	264578	10961	199801	3261	47251	180.146080	13451.646456	3023.093058	650.237696	175
Latinx	MULTIPOLYGON (((965411.937 4198913.656, 965055...	1219893	112180	109390	27012	962544	1195.685395	4933.749778	51520.813364	6210.126096	643
Mixed	MULTIPOLYGON (((970393.326 4194192.233, 969688...	2213832	661709	497957	224801	777050	8318.759023	19525.925998	30700.430404	25805.788462	864
White	MULTIPOLYGON (((978544.008 4193972.941, 978565...	823402	601169	30980	49604	123053	2669.432784	1483.902465	6311.791195	34404.114891	459

Reproduction of Hurricane Harvey Flooding GEOG120 Lab Problem

Authors

Abstract

Study metadata

Original study spatio-temporal metadata

Study design

Materials and procedure

Computational environment

Data and variables

blockgroups.shp

Import blockgroups.shp

blockgroup_demographic_data.csv

actual_flood_10.tif

Bias and threats to validity

Data transformations

Goal 1: Load census data into block groups

Goal 2: Create regions by majority groups

Analysis

Goal 3: Find flooded area in each group and calculate pct

Results

Percent Flooded by Block Groups

Majority Groups in Harris County, Texas

Flooding extent from Hurricane Harvey in Harris County, Texas

Discussion

Integrity Statement

Acknowledgements

References

	majorGrp	blockGrps	flArea	totArea	pctFlood
0	Asian	3	216500	952855.79	22.72
1	Black	175	64588800	206749828.71	31.24
2	Latinx	643	318188500	789346589.94	40.31
3	Mixed	864	1141535600	2477275416.41	46.08
4	White	459	478490800	1114263551.36	42.94