# Report the Python version and install the required packages.
# The "!" lines are IPython shell escapes, so this cell only works inside a
# Jupyter/IPython session. Set the condition to True for the first run, then
# switch it back to False once the packages have been installed.
if False:
    !python -V
    !pip install -r ../environment/requirements.txt


# Import modules, define directories
from pyhere import here
import pandas as pd
import geopandas as gpd
import folium as fm
from branca.colormap import LinearColormap
import matplotlib.pyplot as plt
from matplotlib.patches import Patch

# Short aliases for the project directories used throughout the notebook.
# Each value is resolved through `here`; add your own shortcuts as needed.
path = dict(
    dscr=here("data", "scratch"),
    drpub=here("data", "raw", "public"),
    drpriv=here("data", "raw", "private"),
    ddpub=here("data", "derived", "public"),
    ddpriv=here("data", "derived", "private"),
    rfig=here("results", "figures"),
    roth=here("results", "other"),
    rtab=here("results", "tables"),
    dmet=here("data", "metadata"),
)


# Load in tracts 2010
tracts2010 = gpd.read_file(here(path["drpub"], "tracts2010.shp"))
tracts2010 = gpd.GeoDataFrame(tracts2010)

# Create folium map
mtracts = fm.Map([41.88155337370558, -87.63007007169067], zoom_start=10, tiles="CartoDB Positron")

# Style for the tract polygons: 1px blue outline with a 40% opaque blue fill.
# 'weight' is the option that controls stroke width, so the unsupported
# 'lineweight' key was removed, and fillOpacity is passed as a number
# rather than a string.
style_function = lambda x: {'color': 'blue', 'weight': 1, 'fillColor': 'blue', 'fillOpacity': 0.4}

# Add the GeoJson layer to the map
fm.GeoJson(tracts2010, style_function=style_function).add_to(mtracts)

# Display map
mtracts


# Read the 2010 census blocks shapefile and wrap the result in a GeoDataFrame
blocks2010 = gpd.GeoDataFrame(
    gpd.read_file(here(path["drpub"], "blocks2010.shp"))
)


# Load in parks
parks = gpd.read_file(here(path["drpub"], "parks.shp"))
parks = gpd.GeoDataFrame(parks)

# Style for the park polygons: solid green outline and fill.
# fillOpacity is a number between 0 and 1, so "fully opaque" is 1
# (previously the out-of-range string '100').
style_function = lambda x: {'color': 'green', 'weight': 1, 'fillColor': 'green', 'fillOpacity': 1}

# Add the parks layer to the existing map
fm.GeoJson(parks, style_function=style_function).add_to(mtracts)

# Display map
mtracts


# Load in forest
forest = gpd.read_file(here(path["drpub"], "forest.shp"))
forest = gpd.GeoDataFrame(forest)

# Style for the forest polygons: solid dark-green outline and fill.
# fillOpacity is a number between 0 and 1, so "fully opaque" is 1
# (previously the out-of-range string '100').
style_function = lambda x: {'color': 'darkgreen', 'weight': 1, 'fillColor': 'darkgreen', 'fillOpacity': 1}

# Add the forest layer to the existing map
fm.GeoJson(forest, style_function=style_function).add_to(mtracts)

# Display map
mtracts


# Combine the parks and forest layers into one green space layer (union overlay)
greenspace = gpd.overlay(df1=parks, df2=forest, how="union")


# Calculate the majority group in each tract.
# A group is the majority when its share of the tract is at least `threshold`
# percent; tracts where no group reaches the threshold are labelled 'Mixed'.
threshold = 60.0

# (label, percentage column) pairs in priority order: when more than one
# column meets the threshold, the earliest entry wins.
group_columns = [
    ('White', 'pctWhite'),
    ('Black', 'pctBlack'),
    ('Asian', 'pctAsian'),
    ('Latinx', 'pctLatinx'),
]

# Start from the fallback label, then overwrite with whole-column masks
# instead of looping over rows. Going through the list in reverse lets the
# higher-priority groups be written last, so they take precedence.
# Missing percentages compare as False and therefore stay 'Mixed'.
tracts2010['majorGroup'] = 'Mixed'
for group, column in reversed(group_columns):
    tracts2010.loc[tracts2010[column] >= threshold, 'majorGroup'] = group


# Buffer by 0.25 miles converted to meters (1 mile ≈ 1609.34 meters)
# NOTE(review): this assumes the greenspace CRS uses meters as its unit — confirm.
bufferdist = 0.25  # in miles

greenspacebuffer = greenspace.buffer(bufferdist * 1609.34)

# Convert from multiple polygons into a single multi-part polygon
greenspacebuffer_single = greenspacebuffer.unary_union

# Turn buffered green space into a geodataframe. The buffer was computed in
# the greenspace layer's coordinates, so it is labelled with that layer's CRS;
# labelling it with the blocks' CRS would silently mislabel the geometry
# whenever the two layers differ.
bufferedgreen = gpd.GeoDataFrame(geometry=[greenspacebuffer_single], crs=greenspace.crs)

# Bring the buffer into the blocks' CRS so later spatial operations against
# the blocks compare like with like. Skipped when either CRS is undefined,
# because a reprojection is not possible in that case.
if greenspace.crs is not None and blocks2010.crs is not None:
    bufferedgreen = bufferedgreen.to_crs(blocks2010.crs)

# Create folium map
m = fm.Map([41.88155337370558, -87.63007007169067], zoom_start=10, tiles="CartoDB Positron")

# Style for the buffered green space: solid light green.
# fillOpacity is a number between 0 and 1, so "fully opaque" is 1
# (previously the out-of-range string '100').
style_function = lambda x: {'color': '#bbde93', 'weight': 1, 'fillColor': '#bbde93', 'fillOpacity': 1}

# Add the GeoJson layer to the map
fm.GeoJson(greenspacebuffer, style_function=style_function).add_to(m)

# Display map
m


# Create one centroid point per census block
centroids = blocks2010.geometry.centroid  

# Turn the centroids into a GeoDataFrame that uses the blocks' CRS
blockscentroids = gpd.GeoDataFrame(geometry=centroids, crs=blocks2010.crs)

# Select centroids that intersect the buffered green space; the inner join
# keeps only the centroids that have a match
greenaccessblocks = gpd.sjoin(blockscentroids, bufferedgreen, how="inner", predicate="intersects")

# Re-attach the original block attributes to the selected centroids by index.
# Both frames carry a 'geometry' column, so the merge will suffix the
# overlapping column names.
greenaccessblocks = greenaccessblocks.merge(blocks2010, left_index=True, right_index=True)


# Total the population (D001) of the green-access blocks within each tract
greenaccessPop = greenaccessblocks.groupby('TRACTCE10', as_index=False)['D001'].sum()

# Left-join the per-tract totals onto the tracts by TRACTCE10 (tracts without
# any matching block keep a missing D001) and make sure the result is a
# GeoDataFrame
greenaccesstracts = gpd.GeoDataFrame(
    tracts2010.merge(
        greenaccessPop[['TRACTCE10', 'D001']],
        how='left',
        on='TRACTCE10',
    )
)


# Dissolve the tracts by majority group: count the tracts in each group and
# sum the total population (PopTotal) and the population with access (D001).
# The tract count is then exposed under the column name 'Tracts'.
groupedgreenaccess = greenaccesstracts.dissolve(
    by='majorGroup',
    aggfunc={"majorGroup": "count", "PopTotal": 'sum', "D001": 'sum'},
).rename(columns={'majorGroup': 'Tracts'})


# Area of each majority group's dissolved tracts
groupedgreenaccess['area_sqm'] = groupedgreenaccess.geometry.area

# Clip the dissolved groups to the green space, so each group's geometry is
# reduced to the green space that falls inside it
majorGrnSpace = groupedgreenaccess.clip(greenspace)

# Derive the per-group metrics in one step:
#   areaGrn_sqm  - area of the clipped (green space) geometry
#   pctAccess    - population with access as a percentage of total population
#   GreenAreaPop - green space area per person
majorGrnSpace = majorGrnSpace.assign(
    areaGrn_sqm=majorGrnSpace.geometry.area,
    pctAccess=majorGrnSpace['D001'] / majorGrnSpace['PopTotal'] * 100,
    GreenAreaPop=lambda df: df['areaGrn_sqm'] / df['PopTotal'],
)

majorGrnSpace


# Label the index for presentation
table1 = majorGrnSpace.rename_axis('Majority Group')

# Add readable, rounded display columns: counts and areas as whole numbers,
# percentage and per-person values to one decimal place
table1 = table1.assign(**{
    'Population': table1['PopTotal'].round(0).astype(int),
    'Population with Access': table1['D001'].round(0).astype(int),
    'Area (sqm)': table1['area_sqm'].round(0).astype(int),
    'Green Space Area (sqm)': table1['areaGrn_sqm'].round(0).astype(int),
    'Percent Population with Access': table1['pctAccess'].round(1),
    'Green Space Per Person (sqm)': table1['GreenAreaPop'].round(1),
})

# Drop the geometry and the raw working columns the display columns came from
table1 = table1.drop(columns=[
    "geometry",
    "PopTotal",
    "D001",
    "area_sqm",
    "areaGrn_sqm",
    "pctAccess",
    "GreenAreaPop",
])

# Save the table as CSV
table1.to_csv(here(path["rtab"], "table1.csv"))

table1


# Load the original study's results for comparison.
# The file is a plain CSV without geometry, so it is read with pandas
# directly. Reading it through geopandas meant dropping a 'geometry' column
# afterwards.
# NOTE(review): that column may not exist, depending on the geopandas I/O
# engine, in which case the drop would fail — confirm.
# dtype=str keeps every value exactly as written in the file (for example
# numbers formatted with thousands separators).
original_results = pd.read_csv(here(path["ddpub"], "original_results.csv"), dtype=str)

original_results


# Start again from the tracts (which carry the majorGroup column) for mapping
greenaccesstracts = gpd.GeoDataFrame(tracts2010)


# Base folium map for the majority-group layer
mrace = fm.Map(
    location=[41.88155337370558, -87.63007007169067],
    zoom_start=10,
    tiles="CartoDB Positron",
)

def style_function(feature):
    """Return the map style for one tract feature, colored by majority group.

    Args:
        feature: GeoJSON-like feature mapping; the group label is read from
            ``feature['properties']['majorGroup']``.

    Returns:
        A style dict with the group's fill color (``'#ffff00'`` when the
        label is not one of the known groups), a thin dashed grey outline
        and a fully opaque fill.
    """
    group_colors = {
        'Asian': '#bf8282FF',
        'Black': '#bbafd0FF',
        'Latinx': '#e4b586FF',
        'Mixed': '#feffa6FF',
        'White': '#4468a8FF',
    }
    major_group = feature['properties']['majorGroup']

    return {
        # Default color if 'majorGroup' doesn't match any known group
        'fillColor': group_colors.get(major_group, '#ffff00'),
        'color': 'grey',
        'weight': 0.3,
        'dashArray': '5, 5',
        # Opacity is a number between 0 and 1; 1 means fully opaque
        # (previously the out-of-range string '100').
        'fillOpacity': 1,
    }
# Style for the green space layer: solid light green.
# fillOpacity is a number between 0 and 1, so "fully opaque" is 1
# (previously the out-of-range string '100').
green_style = lambda x: {'color': '#bbde93', 'weight': 1, 'fillColor': '#bbde93', 'fillOpacity': 1}

# Add the tract layer first, then the green space layer on top of it
fm.GeoJson(greenaccesstracts, style_function=style_function).add_to(mrace)
fm.GeoJson(greenspace, style_function=green_style).add_to(mrace)

# Display map
mrace


# Merge the tract geometries by racial majority group, then copy the group
# label (now the index) into a regular 'majorityGroup' column
greenaccesstracts = greenaccesstracts.dissolve(by='majorGroup')
greenaccesstracts = greenaccesstracts.assign(majorityGroup=greenaccesstracts.index)

# Create the 10x10 inch figure and axes that the layers are drawn on
fig, ax = plt.subplots(figsize=(10, 10))

# Pick the plot color for a row from its 'majorityGroup' value
def assign_color(feature):
    """Return the hex color for the row's majority group.

    Args:
        feature: Row-like mapping; the label is read from
            ``feature['majorityGroup']``.

    Returns:
        The group's hex color string, or ``'#ffff00'`` when the label is not
        one of the known groups.
    """
    palette = {
        'Asian': '#bf8282FF',
        'Black': '#bbafd0FF',
        'Latinx': '#e4b586FF',
        'Mixed': '#feffa6FF',
        'White': '#4468a8FF',
    }
    return palette.get(feature['majorityGroup'], '#ffff00')

# Draw the dissolved tracts, colored per row by assign_color, with thin grey outlines
greenaccesstracts.plot(
    ax=ax,
    color=greenaccesstracts.apply(assign_color, axis=1),
    edgecolor='grey',
    linewidth=0.3,
)

# Overlay the green space on the same axes
greenspace.plot(ax=ax, color='#bbde93', edgecolor='grey', linewidth=0.05, alpha=1)

plt.title('Racial Dimensions of Green Space in 2010 Chicago')

# Legend: one color patch per majority group, plus one for green space
legend_patches = [
    Patch(facecolor=swatch, label=name)
    for name, swatch in (
        ('Asian', '#bf8282FF'),
        ('Black', '#bbafd0FF'),
        ('Latinx', '#e4b586FF'),
        ('Mixed', '#feffa6FF'),
        ('White', '#4468a8FF'),
        ('Greenspace', '#bbde93'),
    )
]
plt.legend(handles=legend_patches)

plt.savefig(here(path["rfig"], 'fig1.png'))  # Save image

# Show the plot
plt.show()

Label	Alias	Definition	Type
fid	:--:	object id	int
STATEFP10	:--:	state id	int
COUNTYFP10	:--:	county id	int
TRACTCE10	:--:	tract id	int
GEOID10	:--:	geography id	int
NAME10	:--:	?	int
NAMELSAD10	:--:	census tract name	string
GISJOIN	:--:	uniquely identifies tracts for purpose of joining to geographic data	string
PopTotal	:--:	total population	int
Latinx	:--:	total Hispanic or Latino/Latina population	int
NotLatinx	:--:	total population that is not Hispanic or Latino/Latina	int
White	:--:	total non-Hispanic White population	int
Black	:--:	total non-Hispanic Black or African American population	int
Asian	:--:	total non-Hispanic Asian population	int
TwoOrMore	:--:	?	int
MedHouseVa	:--:	median house value for owner-occupied houses	int
MedGrossRe	:--:	median gross monthly rent (including utilities)	int
pctWhite	:--:	percent white population	double
pctBlack	:--:	percent black population	double
pctLatinx	:--:	percent latinx population	double
pctAsian	:--:	percent asian population	double

Label	Alias	Definition	Type	Accuracy	Domain	Missing Data Value(s)	Missing Data Frequency
GEO.id	...	Id	string	...	...	...	...
GEO.id2	...	Id2	string	...	...	...	...
GEO.display-label	...	Geography	geometry	...	...	...	...
D001	...	Total Population	int	...	...	...	...
D002	...	Hispanic or Latino	int	...	...	...	...
D003	...	Not Hispanic or Latino	int	...	...	...	...
D004	...	Not Hispanic or Latino: - Population of one race	int	...	...	...	...
D005	...	Not Hispanic or Latino: - White alone	int	...	...	...	...
D006	...	Not Hispanic or Latino: - Black or African American alone	int	...	...	...	...
D007	...	Not Hispanic or Latino: - American Indian and Alaska Native alone	int	...	...	...	...
D008	...	Not Hispanic or Latino: - Asian alone	int	...	...	...	...
D009	...	Not Hispanic or Latino: - Native Hawaiian and Other Pacific Islander alone	int	...	...	...	...
D010	...	Not Hispanic or Latino: - Some Other Race alone	int	...	...	...	...

	geometry	Tracts	PopTotal	D001	area_sqm	areaGrn_sqm	pctAccess	GreenAreaPop
majorGroup
Black	MULTIPOLYGON (((355481.444 561993.089, 355458....	269	755569.0	483672.0	1.964818e+08	1.349878e+07	64.014273	17.865712
Latinx	MULTIPOLYGON (((357408.653 576717.364, 357418....	146	579637.0	334119.0	9.621542e+07	2.667939e+06	57.642801	4.602775
Mixed	MULTIPOLYGON (((352328.568 566122.129, 352338....	178	669499.0	512778.0	1.453426e+08	8.965317e+06	76.591302	13.391083
White	MULTIPOLYGON (((347461.379 568394.469, 347367....	190	660728.0	487125.0	1.186064e+08	1.151111e+07	73.725497	17.421861
Asian	MULTIPOLYGON (((358470.236 575562.435, 358470....	4	13875.0	11248.0	1.983068e+06	2.768250e+04	81.066667	1.995135

	Tracts	Population	Population with Access	Area (sqm)	Green Space Area (sqm)	Percent Population with Access	Green Space Per Person (sqm)
Majority Group
Black	269	755569	483672	196481794	13498778	64.0	17.9
Latinx	146	579637	334119	96215420	2667939	57.6	4.6
Mixed	178	669499	512778	145342623	8965317	76.6	13.4
White	190	660728	487125	118606374	11511111	73.7	17.4
Asian	4	13875	11248	1983068	27683	81.1	2.0

	Majority Group	Tracts	Population	Population with Access	Area (sqm)	Green Space Area (sqm)	Percent Population with Access	Green Space Per Person (sqm)
0	Black	269	755,569	482,153	196,481,794	13,498,778	63.8	17.9
1	Latinx	146	579,637	332,655	96,215,420	2,667,939	57.4	4.6
2	Mixed	178	669,499	510,794	145,342,623	8,965,317	76.3	13.4
3	White	190	660,728	485,254	118,606,374	11,511,111	73.4	17.4
4	Asian	4	13,875	10,876	1,983,068	27,683	78.4	2.0

Jupyter Notebook¶

Reproduction of Urban Environmental Justice of Green Space Access in Chicago¶

Authors¶

Abstract¶

Study metadata¶

Original study spatio-temporal metadata¶

Study design¶

Materials and procedure¶

Computational environment¶

Data and variables¶

Tracts2010¶

Blocks2010¶

Parks¶

Forest¶

Bias and threats to validity¶

Data transformations¶

Analysis¶

Buffer green space¶

Calculate blocks with accessibility¶

Join to Tracts2010 by tract id¶

Final calculations by majority group¶

Results¶

Visualize racial majority group and greenspace map¶

Discussion¶

Integrity Statement¶

Acknowledgements¶

References¶