Social Vulnerability Milan - Calculate Vulnerability

Social Vulnerability Milan - Calculate Vulnerability#

Environment#

R Libraries#

The relvant R libraries are imported in to the kernal:

# Load R libraries
if(!require("pacman"))
    install.packages("pacman")

p_load("sf", "tidyverse")

print("Loaded Packages:")
p_loaded()

Loading required package: pacman

[1] "Loaded Packages:"

'lubridate'
'forcats'
'stringr'
'dplyr'
'purrr'
'readr'
'tidyr'
'tibble'
'ggplot2'
'tidyverse'
'sf'
'pacman'

Output directory#

# create the output directory if it does not exist
output_dir <- file.path("../..","3_outputs","Italy","Milan","2021")
if(!dir.exists(output_dir)){
    dir.create(output_dir, recursive = TRUE)
    print(paste0(output_dir, " created"))
}

Set the GUID#

GUID <- "SEZ2011"

Load Data#

Import the data#

# Load census data
census_indicator_data <- read.csv("../../2_pipeline/Italy/Milan/1a_CensusData/2021/censusDataZ.csv")
colnames(census_indicator_data)[colnames(census_indicator_data) == "GUID"] = "SA_GUID__1"
head(census_indicator_data)

# Load Coperncius data: tree cover density (TCD) and imperviousness density (IMP)
tcd_indicator_data <- st_read("../../2_pipeline/Italy/Milan/1b_Copernicus/2021/census_areas_TCD.geojson")
imd_indicator_data <- st_read("../../2_pipeline/Italy/Milan/1b_Copernicus/2021/census_areas_IMD.geojson")

# Get the geospatial data from the TCS data (the IMD data also has same spatial data)
oa <- subset(tcd_indicator_data, select = c(GUID, 'geometry'))

# Load vulnerability mapping information from the config file
## This mapping information is used to help guide the amalgamation of the data.
## Weighting can be changed in this file, depending on the scenario.
## Scenario 1 (best case scenario): Weighting values 1 or -1:
##  where 1 means no change
##  or -1 means all the indicator values are multiplied by -1, resulting in an inverse indicator.
## Scenario 2: Weighting values 0.5 or -0.5:
##  For domains with just a single indicators or where there is a lack of information related to missing indicators. 
##  For these domains the weights are halved using a weight of 0.5, or -0.5 for an inverse indicator.
##  Therefore the influence of these indicators are reduced in half.
## Other scenarios are supported by using other decimal numbers if decided for a particular dataset.
indicator_mapping <- read.csv("config/vulnerabilityIndicatorMappings.csv", header=TRUE, sep=",", stringsAsFactors = FALSE, fileEncoding="UTF-8-BOM")

# Print up to 100 rows of vulnerabiltiy mapping config file
head(indicator_mapping,100)

A data.frame: 6 × 11
	SEZ2011	early_childhood_boy	early_childhood_girl	age_middle_to_oldest_old_male	age_middle_to_oldest_old_female	dependants	unemployment	no_higher_education	foreign_nationals	primary_school_age	one_person_households
	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>
1	1.5146e+11	-1.230411	-1.064144	2.1196292	-1.3062152	-0.7801407	-0.5060886	-0.6075338	0.284861877	-1.458348	0.9333249
2	1.5146e+11	-1.230411	-1.064144	0.2302043	-0.3189938	0.1197864	1.3419462	0.8849880	0.768744204	-1.458348	-0.7026211
3	1.5146e+11	-1.230411	-1.064144	3.8043177	-1.3062152	-2.2200240	-0.2425543	-1.6458099	-1.081394102	-1.458348	3.2236494
4	1.5146e+11	-1.230411	-1.064144	2.6982091	-1.3062152	-0.5183437	-1.2391934	-1.6458099	-0.004949997	1.865648	0.2789465
5	1.5146e+11	-1.230411	-1.064144	19.6216703	-1.3062152	-2.2200240	-2.2981224	-1.6458099	-1.081394102	-1.458348	3.2236494
6	1.5146e+11	-1.230411	-1.064144	-1.0625601	-1.3062152	-2.2200240	-2.2981224	-1.6458099	2.865567617	-1.458348	0.9333249

Reading layer `census_areas_TCD' from data source 
  `/Cities/2_pipeline/Italy/Milan/1b_Copernicus/2021/census_areas_TCD.geojson' 
  using driver `GeoJSON'
Simple feature collection with 6079 features and 15 fields
Geometry type: POLYGON
Dimension:     XY
Bounding box:  xmin: 1503202 ymin: 5025952 xmax: 1521750 ymax: 5042528
Projected CRS: Monte Mario / Italy zone 1
Reading layer `census_areas_IMD' from data source 
  `/Cities/2_pipeline/Italy/Milan/1b_Copernicus/2021/census_areas_IMD.geojson' 
  using driver `GeoJSON'
Simple feature collection with 6079 features and 15 fields
Geometry type: POLYGON
Dimension:     XY
Bounding box:  xmin: 1503202 ymin: 5025952 xmax: 1521750 ymax: 5042528
Projected CRS: Monte Mario / Italy zone 1

A data.frame: 12 × 9
	domain	indicator	sensitivity	prepare	respond	recover	adaptive_capacity	enhanced_exposure	weight
	<chr>	<chr>	<int>	<int>	<int>	<int>	<int>	<int>	<dbl>
1	age	early_childhood_boy	1	0	0	0	0	0	1.0
2	age	early_childhood_girl	1	0	0	0	0	0	1.0
3	age	age_middle_to_oldest_old_male	1	0	0	0	0	0	1.0
4	age	age_middle_to_oldest_old_female	1	0	0	0	0	0	1.0
5	income	dependants	0	1	1	1	1	0	1.0
6	income	unemployment	0	1	1	1	1	0	1.0
7	info_access_use	no_higher_education	0	1	1	1	1	0	0.5
8	local_knowledge	foreign_nationals	0	1	1	0	1	0	0.5
9	social_network	primary_school_age	0	0	1	1	1	0	-1.0
10	social_network	one_person_households	0	0	1	1	1	0	1.0
11	physical_environment	impervious	0	0	0	0	0	1	1.0
12	physical_environment	tree_cover_density	0	0	0	0	0	1	1.0

Prepare Data#

Combine data into a single indicator dataset#

# combine census data with copernicus TCD and IMD data (without geospatial data to advoid duplication)
indicator_data <- merge(tcd_indicator_data, st_drop_geometry(census_indicator_data), by.x = GUID, by.y = GUID, all.x = TRUE)
indicator_data <- merge(imd_indicator_data, st_drop_geometry(indicator_data), by=GUID)

# drop the geometry
indicator_data <- st_drop_geometry(indicator_data)

# change the small area id column data type (GUID) to character string
indicator_data[GUID] <- lapply(indicator_data[GUID], as.character)

# trim the columns
indicator_data <- subset(indicator_data, select=c(names(census_indicator_data), 'tree_cover_density', 'impervious'))

# Set missing data fields to zero (0)
# Note: In Italian census the NA or empty data fields are areas with no population (e.g. parks, schools, etc.)
indicator_data[is.na(indicator_data)] <- 0

# Print the first part of the indicators, which are now collated into one table
head(indicator_data)

A data.frame: 6 × 13
	SEZ2011	early_childhood_boy	early_childhood_girl	age_middle_to_oldest_old_male	age_middle_to_oldest_old_female	dependants	unemployment	no_higher_education	foreign_nationals	primary_school_age	one_person_households	tree_cover_density	impervious
	<chr>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>
1	151460000001	-1.230411	-1.064144	2.1196292	-1.3062152	-0.7801407	-0.5060886	-0.6075338	0.284861877	-1.458348	0.9333249	0.6144226	1.409195
2	151460000002	-1.230411	-1.064144	0.2302043	-0.3189938	0.1197864	1.3419462	0.8849880	0.768744204	-1.458348	-0.7026211	0.6144226	1.469237
3	151460000003	-1.230411	-1.064144	3.8043177	-1.3062152	-2.2200240	-0.2425543	-1.6458099	-1.081394102	-1.458348	3.2236494	0.6144226	1.057469
4	151460000004	-1.230411	-1.064144	2.6982091	-1.3062152	-0.5183437	-1.2391934	-1.6458099	-0.004949997	1.865648	0.2789465	0.6144226	1.226182
5	151460000005	-1.230411	-1.064144	19.6216703	-1.3062152	-2.2200240	-2.2981224	-1.6458099	-1.081394102	-1.458348	3.2236494	0.6144226	1.319901
6	151460000006	0.000000	0.000000	0.0000000	0.0000000	0.0000000	0.0000000	0.0000000	0.000000000	0.000000	0.0000000	0.6144226	1.484096

Weight the indicator datas#

# Get the indicator weighting, previously loaded from the config file
indicator_weighting <- indicator_mapping %>% select('indicator', 'weight')
indicator_weighting <- indicator_weighting %>% spread(key = 'indicator', value = 'weight')

# Get the column names and weights
names <- names(indicator_weighting)
weights <- indicator_weighting[, names]

# Copy and rename the dataset
indicator_data_weighted <- indicator_data
head(indicator_data_weighted) 

# Multiply the indicators by the config file weighting
indicator_data_weighted[, names] <- sweep(indicator_data_weighted[, names], 2, unlist(weights[, names]), "*")
head(indicator_data_weighted)

A data.frame: 6 × 13
	SEZ2011	early_childhood_boy	early_childhood_girl	age_middle_to_oldest_old_male	age_middle_to_oldest_old_female	dependants	unemployment	no_higher_education	foreign_nationals	primary_school_age	one_person_households	tree_cover_density	impervious
	<chr>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>
1	151460000001	-1.230411	-1.064144	2.1196292	-1.3062152	-0.7801407	-0.5060886	-0.6075338	0.284861877	-1.458348	0.9333249	0.6144226	1.409195
2	151460000002	-1.230411	-1.064144	0.2302043	-0.3189938	0.1197864	1.3419462	0.8849880	0.768744204	-1.458348	-0.7026211	0.6144226	1.469237
3	151460000003	-1.230411	-1.064144	3.8043177	-1.3062152	-2.2200240	-0.2425543	-1.6458099	-1.081394102	-1.458348	3.2236494	0.6144226	1.057469
4	151460000004	-1.230411	-1.064144	2.6982091	-1.3062152	-0.5183437	-1.2391934	-1.6458099	-0.004949997	1.865648	0.2789465	0.6144226	1.226182
5	151460000005	-1.230411	-1.064144	19.6216703	-1.3062152	-2.2200240	-2.2981224	-1.6458099	-1.081394102	-1.458348	3.2236494	0.6144226	1.319901
6	151460000006	0.000000	0.000000	0.0000000	0.0000000	0.0000000	0.0000000	0.0000000	0.000000000	0.000000	0.0000000	0.6144226	1.484096

A data.frame: 6 × 13
	SEZ2011	early_childhood_boy	early_childhood_girl	age_middle_to_oldest_old_male	age_middle_to_oldest_old_female	dependants	unemployment	no_higher_education	foreign_nationals	primary_school_age	one_person_households	tree_cover_density	impervious
	<chr>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>
1	151460000001	-1.230411	-1.064144	2.1196292	-1.3062152	-0.7801407	-0.5060886	-0.3037669	0.142430939	1.458348	0.9333249	0.6144226	1.409195
2	151460000002	-1.230411	-1.064144	0.2302043	-0.3189938	0.1197864	1.3419462	0.4424940	0.384372102	1.458348	-0.7026211	0.6144226	1.469237
3	151460000003	-1.230411	-1.064144	3.8043177	-1.3062152	-2.2200240	-0.2425543	-0.8229049	-0.540697051	1.458348	3.2236494	0.6144226	1.057469
4	151460000004	-1.230411	-1.064144	2.6982091	-1.3062152	-0.5183437	-1.2391934	-0.8229049	-0.002474999	-1.865648	0.2789465	0.6144226	1.226182
5	151460000005	-1.230411	-1.064144	19.6216703	-1.3062152	-2.2200240	-2.2981224	-0.8229049	-0.540697051	1.458348	3.2236494	0.6144226	1.319901
6	151460000006	0.000000	0.000000	0.0000000	0.0000000	0.0000000	0.0000000	0.0000000	0.000000000	0.000000	0.0000000	0.6144226	1.484096

# Histogram visualisation of weighted indicators
indicator_columns <- colnames(indicator_data_weighted)[-1]
for( current_indicator_column in indicator_columns ) {
    indicator_filtered <- indicator_data_weighted[,current_indicator_column] 
    indicator_filtered[indicator_filtered == "NaN"] <- 0

    title <- paste("'", current_indicator_column, "' domain histogram", sep = "")
    x_label <- paste("'", current_indicator_column, "' z-score", sep = "")
    y_label <- paste("Count", sep = "")
    hist(indicator_filtered, breaks="FD", col="grey", labels = FALSE, main=title, xlab=x_label, ylab=y_label)
    box("figure", lwd = 4)
}

../../_images/40c6121ca79e1dc59977e40a7b44e8c7d5147dae78bc7070f47f978e1c64769c.png

../../_images/bcc8d2d1f7b31a506a37220180c22c624dba0aaa16c492a60361d41d7eed02a3.png

../../_images/93cc0c7c264523d7300ff6b4fa0629dfd11defb3ef226d1cbe378647d1ccba9f.png

../../_images/8548e6d43be69fbaceafe01521a8921fd6a65afa9859828bb1105fe415cbe9a6.png

../../_images/9f9acb8546a6728e406f4e77383177d5b48934ec1c2799f5012a39c59cc952a2.png

../../_images/7e6808255edfea73bf057b079461479b83c15d4ea133dd652c30aa5d56778477.png

../../_images/e3ff1fe4a6fec20803d784caeec75a77073d57a63df264f576288fe1e41b4251.png

../../_images/5b26306db690487c828f9df7f3684889fb6126fa7d21858f590d2c144650e75d.png

../../_images/1d9278dd4e11fe705059292720ee280da36ea7ce6c560c59ab28d1c3436693d0.png

../../_images/ad511a76fd79070c4700d2ac7b2cc8f638cd7b517703167a0e39f750961ceaad.png

../../_images/c17fbbd9cbd3e65181f99c5e2f9fbe0c9f2382cbf64fb470f00297dcaf436f81.png

../../_images/49aa3b063e98f21cf8d5ee1ef19b10582dbe6a6a7121589e908d2897f47d7ca6.png

Process social vulnerability scores#

Calculate domain scores#

# Get the domains and their associated indicator ID
domain_indicators <- indicator_mapping %>% select('domain', 'indicator')

# Get a vector/array of the unique domain names
unique_domains <- unique(domain_indicators$domain)

# Initialise the domain score dataset with the GUID
domain_scores <- indicator_data_weighted %>% select(all_of(GUID))

# Loop through each domain
for (current_domain in unique_domains) {
    # Identify which indicators are used within this domain (current_domain)
    current_domain_info <- domain_indicators %>% filter(domain == current_domain)

    # Count the number of indicators in this domain
    domain_indicator_count <- length(current_domain_info$indicator)

    # Get a vector/array of the indicators used by this domain, and add the GUID column name
    current_domain_indicators <- current_domain_info$indicator
    current_domain_indicators <- (c(GUID, current_domain_indicators))

    # filter the dataset to only use the indicators in the domain
    current_domain_data <- indicator_data_weighted[current_domain_indicators]

    # Calculate the internal weight distribution for the indicators within this domain,
    # using an equal weight distribution across this domain
    internal_domain_weight <- 1.0 / domain_indicator_count

    # Internally weight the data for this domain
    current_domain_data_weighted <- current_domain_data %>% mutate_if(is.numeric, function(x) {x*internal_domain_weight})

    # Sum each data row to get the total score for the domain
    current_domain_data_weighted[, current_domain] <- rowSums(current_domain_data_weighted[2:(domain_indicator_count+1)], na.rm = TRUE)

    # Add the current domain score to the overall results
    domain_indicator_score <- current_domain_data_weighted %>% select(all_of(GUID), all_of(current_domain))
    domain_scores <- merge(domain_scores, domain_indicator_score, by=GUID)
}

# Print the first part of the domain z-scores, which are now collated into one table
head(domain_scores)

A data.frame: 6 × 7
	SEZ2011	age	income	info_access_use	local_knowledge	social_network	physical_environment
	<chr>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>
1	151460000001	-0.37028523	-0.6431147	-0.3037669	0.142430939	1.1958366	1.0118090
2	151460000002	-0.59583610	0.7308663	0.4424940	0.384372102	0.3778636	1.0418299
3	151460000003	0.05088688	-1.2312892	-0.8229049	-0.540697051	2.3409988	0.8359458
4	151460000004	-0.22564026	-0.8787686	-0.8229049	-0.002474999	-0.7933508	0.9203024
5	151460000005	4.00522505	-2.2590732	-0.8229049	-0.540697051	2.3409988	0.9671620
6	151460000006	0.00000000	0.0000000	0.0000000	0.000000000	0.0000000	1.0492594

# Histogram visualisation of domain z-scores
for( current_domain in unique_domains ) {
    domain_scores_filtered <- domain_scores[,current_domain] 
    domain_scores_filtered[domain_scores_filtered == "NaN"] <- 0

    title <- paste("'", current_domain, "' domain histogram", sep = "")
    x_label <- paste("'", current_domain, "' z-score", sep = "")
    y_label <- paste("Count", sep = "")
    hist(domain_scores_filtered, breaks="FD", col="grey", labels=FALSE, main=title, xlab=x_label, ylab=y_label)
    box("figure", lwd = 4)
}

../../_images/ffc7d40d34ec1077ab2264bf4ba12ad31e5c41a820358b8f5f661375ae56c688.png

../../_images/063cafb70431d53c29c23fa131b96579f7bb7b7d99b678761ed02d68eacb83b6.png

../../_images/ef535c74dc7f11519a2c468540f8e711e31d306ec1817ca6d1c73987478f80fb.png

../../_images/80f0e62e3caf4ed6113ace797922aeb66486d74d01440d6f0be15197abc95431.png

../../_images/1bc9f1c86b82434f6d3f4268e233d09da45f64c3b58d3f728e216286ce3a558a.png

../../_images/f503cce2ad25fc324fddf8ef3e821e7293cb6586c7502af8d4f7f806cc0eac51.png

Calculate dimension scores#

Need to collate the domains into the dimensions

# Create a vector/array of the dimension names
dimensions <- c('sensitivity', 'prepare', 'respond', 'recover', 'adaptive_capacity', 'enhanced_exposure')

# Get the dimension and their associated indicator ID
dimension_indicators <- indicator_mapping %>% select(c('domain', all_of(dimensions)))
head(dimension_indicators)

# Initialise the dimensions score dataset with the GUID
dimension_scores <- indicator_data_weighted %>% select(all_of(GUID))

# loop through each of the dimensions and:
for (current_dimension in dimensions){
    # Identify which indicators are used within this dimension (current_dimension)
    # Then select the indicators marked with value 1, which means that the indicator is part of the dimension
    current_dimension_info <- dimension_indicators %>% select(c('domain', all_of(current_dimension)))
    current_dimension_info <- current_dimension_info %>% filter(dimension_indicators[, current_dimension] == 1)

    # Get a array/vector of the unique domains in this dimension
    current_dimension_domains <- unique(current_dimension_info$domain)

    # Count the number of domains in this dimension
    dimension_domain_count <- length(current_dimension_domains)

    # Filter the domain scores dataset to only use the domains in the dimension, and add the GUID column name
    current_dimension_data <- domain_scores %>% select(c(all_of(GUID), all_of(current_dimension_domains)))  

    # Sum each data row to get the total score for the dimension
    current_dimension_data[, current_dimension] <- rowSums(current_dimension_data[2:(dimension_domain_count+1)], na.rm = TRUE)

    # Add the current dimension score to the overall results
    dimension_indicator_score <- current_dimension_data %>% select(all_of(GUID), all_of(current_dimension))
    dimension_scores <- merge(dimension_scores, dimension_indicator_score, by=GUID)  
}

# generate z-scores with the scale function in order to standardise the dimension data
dimension_scores <- dimension_scores %>% mutate_if(is.numeric, scale)

# Print the first part of the dimension scores, which are now collated into one table
head(dimension_scores)

A data.frame: 6 × 7
	domain	sensitivity	prepare	respond	recover	adaptive_capacity	enhanced_exposure
	<chr>	<int>	<int>	<int>	<int>	<int>	<int>
1	age	1	0	0	0	0	0
2	age	1	0	0	0	0	0
3	age	1	0	0	0	0	0
4	age	1	0	0	0	0	0
5	income	0	1	1	1	1	0
6	income	0	1	1	1	1	0

A data.frame: 6 × 7
	SEZ2011	sensitivity	prepare	respond	recover	adaptive_capacity	enhanced_exposure
	<chr>	<dbl[,1]>	<dbl[,1]>	<dbl[,1]>	<dbl[,1]>	<dbl[,1]>	<dbl[,1]>
1	151460000001	-0.7647853635	-0.696485479	0.320951976	0.271253971	0.320951976	1.0934219
2	151460000002	-1.2304165745	1.355476641	1.575888423	1.676990485	1.575888423	1.1258642
3	151460000003	0.1046897905	-2.251790899	-0.203447695	0.312110916	-0.203447695	0.9033735
4	151460000004	-0.4661777348	-1.478027752	-2.026764566	-2.690739562	-2.026764566	0.9945343
5	151460000005	8.2680954025	-3.144598085	-1.038699169	-0.797332495	-1.038699169	1.0451736
6	151460000006	-0.0003619911	0.002318221	0.002883523	0.002519028	0.002883523	1.1338930

# Histogram visualisation of dimension z-scores
for( current_dimension in dimensions ){
    dimension_scores_filtered <- dimension_scores[,current_dimension] 
    dimension_scores_filtered[dimension_scores_filtered == "NaN"] <- 0
   
    title <- paste("'", current_dimension, "' dimension histogram", sep = "")
    x_label <- paste("'", current_dimension, "' z-score", sep = "")
    y_label <- paste("Count", sep = "")
    hist(dimension_scores_filtered, breaks="FD", col="grey", labels=FALSE, main=title, xlab=x_label, ylab=y_label)
    box("figure", lwd = 4)
}

../../_images/2efbe5c48c4dfa2afa8538b552234cc0352cf07b729b754d428898e7c76fce4c.png

../../_images/376a70d084f5846391486bdc6d4e397353b388b44b2df6bad5560ffa0312d994.png

../../_images/0e4e20ec6acd04cbdc0667919b3945123fa410747692f7b24d4867c9897f4d0d.png

../../_images/775f6d7c00a2ae25f952d86b6c3831d861fec032981b8893824b91385604587a.png

../../_images/aa0979cba35e60c2660d68f940adc01730e0d71df87c364c8350e110c960761d.png

../../_images/a730fe8ffbb76eb6a1f91d70c9fe388a306a37886983ea96097f86ea38dea591.png

Calculate vulnerability score#

# Initialise the vulnerability score dataset with the GUID
vulnerability_scores <- domain_scores %>% select(all_of(GUID))

#sum the domains to create a total overall score of vulnerability
vulnerability_scores$social_vulnerability <- rowSums(domain_scores[2:(ncol(domain_scores))], na.rm = TRUE)

# generate z-scores with the scale function in order to standardise the vulnerability data
vulnerability_scores <- vulnerability_scores %>% mutate_if(is.numeric, scale)

# Print the first part of the vulnerability scores, which are now collated into one table
head(vulnerability_scores)

A data.frame: 6 × 2
	SEZ2011	social_vulnerability
	<chr>	<dbl[,1]>
1	151460000001	0.6558794
2	151460000002	1.5094801
3	151460000003	0.4027326
4	151460000004	-1.1389091
5	151460000005	2.3380431
6	151460000006	0.6662274

# Histogram visualisation of Vulnerability z-scores
title <- paste("'Vulnerability' histogram", sep = "")
x_label <- paste("'Vulnerability' z-score", sep = "")
y_label <- paste("Count", sep = "")
hist(vulnerability_scores$social_vulnerability, breaks="FD", col="grey", labels=FALSE, main=title, xlab=x_label, ylab=y_label)
box("figure", lwd = 4)

../../_images/6d13650b2b35a628dabdf12745fd8d4318e01a2eb183cc299151475dddc323fe.png

# Merge all the indicators, domains, dimensions, and total vulnerability into one dataset
output_dataset <- merge(indicator_data_weighted, domain_scores, by=GUID)
output_dataset <- merge(output_dataset, dimension_scores, by=GUID)
output_dataset <- merge(output_dataset, vulnerability_scores, by=GUID)

head(output_dataset)

A data.frame: 6 × 26
	SEZ2011	early_childhood_boy	early_childhood_girl	age_middle_to_oldest_old_male	age_middle_to_oldest_old_female	dependants	unemployment	no_higher_education	foreign_nationals	primary_school_age	⋯	local_knowledge	social_network	physical_environment	sensitivity	prepare	respond	recover	adaptive_capacity	enhanced_exposure	social_vulnerability
	<chr>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	⋯	<dbl>	<dbl>	<dbl>	<dbl[,1]>	<dbl[,1]>	<dbl[,1]>	<dbl[,1]>	<dbl[,1]>	<dbl[,1]>	<dbl[,1]>
1	151460000001	-1.230411	-1.064144	2.1196292	-1.3062152	-0.7801407	-0.5060886	-0.3037669	0.142430939	1.458348	⋯	0.142430939	1.1958366	1.0118090	-0.7647853635	-0.696485479	0.320951976	0.271253971	0.320951976	1.0934219	0.6558794
2	151460000002	-1.230411	-1.064144	0.2302043	-0.3189938	0.1197864	1.3419462	0.4424940	0.384372102	1.458348	⋯	0.384372102	0.3778636	1.0418299	-1.2304165745	1.355476641	1.575888423	1.676990485	1.575888423	1.1258642	1.5094801
3	151460000003	-1.230411	-1.064144	3.8043177	-1.3062152	-2.2200240	-0.2425543	-0.8229049	-0.540697051	1.458348	⋯	-0.540697051	2.3409988	0.8359458	0.1046897905	-2.251790899	-0.203447695	0.312110916	-0.203447695	0.9033735	0.4027326
4	151460000004	-1.230411	-1.064144	2.6982091	-1.3062152	-0.5183437	-1.2391934	-0.8229049	-0.002474999	-1.865648	⋯	-0.002474999	-0.7933508	0.9203024	-0.4661777348	-1.478027752	-2.026764566	-2.690739562	-2.026764566	0.9945343	-1.1389091
5	151460000005	-1.230411	-1.064144	19.6216703	-1.3062152	-2.2200240	-2.2981224	-0.8229049	-0.540697051	1.458348	⋯	-0.540697051	2.3409988	0.9671620	8.2680954025	-3.144598085	-1.038699169	-0.797332495	-1.038699169	1.0451736	2.3380431
6	151460000006	0.000000	0.000000	0.0000000	0.0000000	0.0000000	0.0000000	0.0000000	0.000000000	0.000000	⋯	0.000000000	0.0000000	1.0492594	-0.0003619911	0.002318221	0.002883523	0.002519028	0.002883523	1.1338930	0.6662274

Correlations#

# check the correlations
correlation <- cor(output_dataset %>% select(-c(all_of(GUID))), use="pairwise.complete.obs")
correlation

A matrix: 25 × 25 of type dbl
	early_childhood_boy	early_childhood_girl	age_middle_to_oldest_old_male	age_middle_to_oldest_old_female	dependants	unemployment	no_higher_education	foreign_nationals	primary_school_age	one_person_households	⋯	local_knowledge	social_network	physical_environment	sensitivity	prepare	respond	recover	adaptive_capacity	enhanced_exposure	social_vulnerability
early_childhood_boy	1.00000000	0.229097528	-0.14133786	-0.152371506	0.479381856	-0.06813950	-0.05906216	0.06968821	-0.211541089	-0.053140400	⋯	0.06968821	-0.17126794	0.041952673	0.468965905	0.177996543	0.06209890	0.046053168	0.06209890	0.041952673	0.21671079
early_childhood_girl	0.22909753	1.000000000	-0.12233710	-0.115415283	0.447880059	-0.09983243	-0.07541606	0.02251899	-0.131044555	-0.087782855	⋯	0.02251899	-0.14149308	0.012169251	0.497075108	0.124612566	0.03031025	0.028487985	0.03031025	0.012169251	0.18312793
age_middle_to_oldest_old_male	-0.14133786	-0.122337104	1.00000000	0.291926773	-0.219142202	-0.20364703	0.01344422	-0.22114688	0.156731495	-0.058133618	⋯	-0.22114688	0.06398469	-0.130727845	0.515454373	-0.265588094	-0.20945491	-0.162603657	-0.20945491	-0.130727845	-0.08165958
age_middle_to_oldest_old_female	-0.15237151	-0.115415283	0.29192677	1.000000000	-0.235062655	-0.23129506	0.23646828	-0.25730892	0.166348557	-0.001316863	⋯	-0.25730892	0.10686905	-0.133976721	0.513279034	-0.205041719	-0.12666491	-0.033731192	-0.12666491	-0.133976721	-0.01975176
dependants	0.47938186	0.447880059	-0.21914220	-0.235062655	1.000000000	-0.08266693	0.11096832	0.08006488	-0.735608824	-0.291803934	⋯	0.08006488	-0.66460705	-0.024206633	0.237217276	0.467697674	0.03233285	0.001091004	0.03233285	-0.024206633	0.08373068
unemployment	-0.06813950	-0.099832433	-0.20364703	-0.231295057	-0.082666926	1.00000000	0.10782418	0.33788259	0.083462147	0.010301782	⋯	0.33788259	0.06069221	-0.046306921	-0.302233026	0.573835450	0.57384691	0.585589861	0.57384691	-0.046306921	0.32713626
no_higher_education	-0.05906216	-0.075416063	0.01344422	0.236468283	0.110968315	0.10782418	1.00000000	0.26173870	-0.045445576	-0.029993040	⋯	0.26173870	-0.04877900	-0.128676167	0.057830642	0.624357416	0.55436679	0.599521006	0.55436679	-0.128676167	0.37411283
foreign_nationals	0.06968821	0.022518991	-0.22114688	-0.257308923	0.080064879	0.33788259	0.26173870	1.00000000	-0.074132287	0.291800349	⋯	1.00000000	0.14025860	0.058567612	-0.193601159	0.707212143	0.74713737	0.469628941	0.74713737	0.058567612	0.55682335
primary_school_age	-0.21154109	-0.131044555	0.15673150	0.166348557	-0.735608824	0.08346215	-0.04544558	-0.07413229	1.000000000	0.196787249	⋯	-0.07413229	0.77451044	0.003812838	-0.009809013	-0.325644138	0.16757171	0.261335750	0.16757171	0.003812838	0.12973201
one_person_households	-0.05314040	-0.087782855	-0.05813362	-0.001316863	-0.291803934	0.01030178	-0.02999304	0.29180035	0.196787249	1.000000000	⋯	0.29180035	0.77260594	0.284224811	-0.100459534	-0.008700115	0.46292243	0.462342309	0.46292243	0.284224811	0.49619186
tree_cover_density	0.04948625	0.013555773	-0.11879223	-0.119645043	-0.001507900	-0.03736943	-0.08206047	0.05235133	-0.012114734	0.218214737	⋯	0.05235133	0.13294221	0.925360125	-0.087913902	-0.028978401	0.05394525	0.044286154	0.05394525	0.925360125	0.55702025
impervious	0.02815641	0.008966105	-0.12314844	-0.128308388	-0.043291805	-0.04833173	-0.15608312	0.05604093	0.019171231	0.307805877	⋯	0.05604093	0.21100349	0.925360125	-0.107434095	-0.080913361	0.05295268	0.041038921	0.05295268	0.925360125	0.55026267
age	0.46896590	0.497075108	0.51545437	0.513279034	0.237217276	-0.30223303	0.05783064	-0.19360116	-0.009809013	-0.100459534	⋯	-0.19360116	-0.07116596	-0.105552418	1.000000000	-0.084199177	-0.12216143	-0.061054149	-0.12216143	-0.105552418	0.14962341
income	0.30405399	0.257398729	-0.31214939	-0.344305665	0.678122645	0.67637489	0.16153269	0.30835420	-0.482128040	-0.208071286	⋯	0.30835420	-0.44644375	-0.052040916	-0.047564415	0.768857522	0.44709337	0.432663034	0.44709337	-0.052040916	0.30313843
info_access_use	-0.05906216	-0.075416063	0.01344422	0.236468283	0.110968315	0.10782418	1.00000000	0.26173870	-0.045445576	-0.029993040	⋯	0.26173870	-0.04877900	-0.128676167	0.057830642	0.624357416	0.55436679	0.599521006	0.55436679	-0.128676167	0.37411283
local_knowledge	0.06968821	0.022518991	-0.22114688	-0.257308923	0.080064879	0.33788259	0.26173870	1.00000000	-0.074132287	0.291800349	⋯	1.00000000	0.14025860	0.058567612	-0.193601159	0.707212143	0.74713737	0.469628941	0.74713737	0.058567612	0.55682335
social_network	-0.17126794	-0.141493083	0.06398469	0.106869046	-0.664607054	0.06069221	-0.04877900	0.14025860	0.774510442	0.772605938	⋯	0.14025860	1.00000000	0.185844241	-0.071165963	-0.216483284	0.40717750	0.467519929	0.40717750	0.185844241	0.40413915
physical_environment	0.04195267	0.012169251	-0.13072785	-0.133976721	-0.024206633	-0.04630692	-0.12867617	0.05856761	0.003812838	0.284224811	⋯	0.05856761	0.18584424	1.000000000	-0.105552418	-0.059377835	0.05776018	0.046103713	0.05776018	1.000000000	0.59829838
sensitivity	0.46896590	0.497075108	0.51545437	0.513279034	0.237217276	-0.30223303	0.05783064	-0.19360116	-0.009809013	-0.100459534	⋯	-0.19360116	-0.07116596	-0.105552418	1.000000000	-0.084199177	-0.12216143	-0.061054149	-0.12216143	-0.105552418	0.14962341
prepare	0.17799654	0.124612566	-0.26558809	-0.205041719	0.467697674	0.57383545	0.62435742	0.70721214	-0.325644138	-0.008700115	⋯	0.70721214	-0.21648328	-0.059377835	-0.084199177	1.000000000	0.80354306	0.697613287	0.80354306	-0.059377835	0.56521567
respond	0.06209890	0.030310255	-0.20945491	-0.126664909	0.032332845	0.57384691	0.55436679	0.74713737	0.167571709	0.462922431	⋯	0.74713737	0.40717750	0.057760176	-0.122161434	0.803543060	1.00000000	0.937690173	1.00000000	0.057760176	0.77518413
recover	0.04605317	0.028487985	-0.16260366	-0.033731192	0.001091004	0.58558986	0.59952101	0.46962894	0.261335750	0.462342309	⋯	0.46962894	0.46751993	0.046103713	-0.061054149	0.697613287	0.93769017	1.000000000	0.93769017	0.046103713	0.73856429
adaptive_capacity	0.06209890	0.030310255	-0.20945491	-0.126664909	0.032332845	0.57384691	0.55436679	0.74713737	0.167571709	0.462922431	⋯	0.74713737	0.40717750	0.057760176	-0.122161434	0.803543060	1.00000000	0.937690173	1.00000000	0.057760176	0.77518413
enhanced_exposure	0.04195267	0.012169251	-0.13072785	-0.133976721	-0.024206633	-0.04630692	-0.12867617	0.05856761	0.003812838	0.284224811	⋯	0.05856761	0.18584424	1.000000000	-0.105552418	-0.059377835	0.05776018	0.046103713	0.05776018	1.000000000	0.59829838
social_vulnerability	0.21671079	0.183127935	-0.08165958	-0.019751765	0.083730678	0.32713626	0.37411283	0.55682335	0.129732006	0.496191862	⋯	0.55682335	0.40413915	0.598298378	0.149623413	0.565215672	0.77518413	0.738564294	0.77518413	0.598298378	1.00000000

Add geometry#

# add st_drop_geometry
output_dataset_geom <- merge(output_dataset, oa, by.x=GUID, by.y=GUID, all.x = TRUE)
head(output_dataset_geom)

A data.frame: 6 × 27
	SEZ2011	early_childhood_boy	early_childhood_girl	age_middle_to_oldest_old_male	age_middle_to_oldest_old_female	dependants	unemployment	no_higher_education	foreign_nationals	primary_school_age	⋯	social_network	physical_environment	sensitivity	prepare	respond	recover	adaptive_capacity	enhanced_exposure	social_vulnerability	geometry
	<chr>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	<dbl>	⋯	<dbl>	<dbl>	<dbl[,1]>	<dbl[,1]>	<dbl[,1]>	<dbl[,1]>	<dbl[,1]>	<dbl[,1]>	<dbl[,1]>	<POLYGON [m]>
1	151460000001	-1.230411	-1.064144	2.1196292	-1.3062152	-0.7801407	-0.5060886	-0.3037669	0.142430939	1.458348	⋯	1.1958366	1.0118090	-0.7647853635	-0.696485479	0.320951976	0.271253971	0.320951976	1.0934219	0.6558794	POLYGON ((1515164 5034507, ...
2	151460000002	-1.230411	-1.064144	0.2302043	-0.3189938	0.1197864	1.3419462	0.4424940	0.384372102	1.458348	⋯	0.3778636	1.0418299	-1.2304165745	1.355476641	1.575888423	1.676990485	1.575888423	1.1258642	1.5094801	POLYGON ((1515138 5034525, ...
3	151460000003	-1.230411	-1.064144	3.8043177	-1.3062152	-2.2200240	-0.2425543	-0.8229049	-0.540697051	1.458348	⋯	2.3409988	0.8359458	0.1046897905	-2.251790899	-0.203447695	0.312110916	-0.203447695	0.9033735	0.4027326	POLYGON ((1515050 5034427, ...
4	151460000004	-1.230411	-1.064144	2.6982091	-1.3062152	-0.5183437	-1.2391934	-0.8229049	-0.002474999	-1.865648	⋯	-0.7933508	0.9203024	-0.4661777348	-1.478027752	-2.026764566	-2.690739562	-2.026764566	0.9945343	-1.1389091	POLYGON ((1515095 5034409, ...
5	151460000005	-1.230411	-1.064144	19.6216703	-1.3062152	-2.2200240	-2.2981224	-0.8229049	-0.540697051	1.458348	⋯	2.3409988	0.9671620	8.2680954025	-3.144598085	-1.038699169	-0.797332495	-1.038699169	1.0451736	2.3380431	POLYGON ((1514881 5034455, ...
6	151460000006	0.000000	0.000000	0.0000000	0.0000000	0.0000000	0.0000000	0.0000000	0.000000000	0.000000	⋯	0.0000000	1.0492594	-0.0003619911	0.002318221	0.002883523	0.002519028	0.002883523	1.1338930	0.6662274	POLYGON ((1514764 5034456, ...

Export#

# CSV
write.csv(output_dataset, file.path(output_dir, "social_vulnerability_index_milan_2021.csv"), row.names = FALSE)

# GeoJSON
st_write(output_dataset_geom, file.path(output_dir, "social_vulnerability_index_milan_2021.geojson"), delete_dsn=TRUE)

# Shapefile
# Need to manually rename these fields, otherwise we get a shapefile creation error
names(output_dataset_geom)[names(output_dataset_geom) == 'early_childhood_boy'] <- 'erly_cld_b'
names(output_dataset_geom)[names(output_dataset_geom) == 'early_childhood_girl'] <- 'erly_cld_g'
names(output_dataset_geom)[names(output_dataset_geom) == 'age_middle_to_oldest_old_male'] <- 'age_old_m'
names(output_dataset_geom)[names(output_dataset_geom) == 'age_middle_to_oldest_old_female'] <- 'age_old_f'
st_write(output_dataset_geom, file.path(output_dir, "social_vulnerability_index_milan_2021.shp"), append = FALSE)

Deleting source `../../3_outputs/Italy/Milan/2021/social_vulnerability_index_milan_2021.geojson' using driver `GeoJSON'
Writing layer `social_vulnerability_index_milan_2021' to data source 
  `../../3_outputs/Italy/Milan/2021/social_vulnerability_index_milan_2021.geojson' using driver `GeoJSON'
Writing 6079 features with 26 fields and geometry type Polygon.

Warning message in abbreviate_shapefile_names(obj):
“Field names abbreviated for ESRI Shapefile driver”

Deleting layer `social_vulnerability_index_milan_2021' using driver `ESRI Shapefile'
Writing layer `social_vulnerability_index_milan_2021' to data source 
  `../../3_outputs/Italy/Milan/2021/social_vulnerability_index_milan_2021.shp' using driver `ESRI Shapefile'
Writing 6079 features with 26 fields and geometry type Polygon.

END

Social Vulnerability Milan - Calculate Vulnerability

Contents

Social Vulnerability Milan - Calculate Vulnerability#

Environment#

R Libraries#

Output directory#

Set the GUID#

Load Data#

Import the data#

Prepare Data#

Combine data into a single indicator dataset#

Weight the indicator datas#

Process social vulnerability scores#

Calculate domain scores#

Calculate dimension scores#

Calculate vulnerability score#

Correlations#

Add geometry#

Export#