library(tidyverse)
library(readr)
library(ggplot2)
library(ggthemes)
library(gt)
library(gtExtras)
library(dplyr)
library(sf)
library(mapSpain)
library(rio)
library(plotly)
library(eurostat)
library(forcats)
library(scales)
# DATA ----
# Relative path to the CSV file, then import it and drop every row that
# contains a missing value.
ruta_ccaa_inflacion <- "./datos/ccaa_inflacion.csv"
ccaa_inflacion <- rio::import(ruta_ccaa_inflacion) %>%
  drop_na()

# National annual-variation series.
# Columns 2 to 5 of the raw file are kept; the first two are renamed by
# position and `Periodo` by name. `valor` is a copy of `Total` with the decimal
# comma replaced by a dot (it is still a character column at this point).
# The month suffix (M01 ... M12) is removed from `periodo` in a single pass, so
# only the year part remains.
ccaa_inflacion_an <- ccaa_inflacion %>%
  select(2:5) %>%
  rename(indice = 1, ccaa = 2, periodo = Periodo) %>%
  mutate(
    valor = gsub(",", ".", Total, fixed = TRUE),
    periodo = str_remove_all(periodo, "M(0[1-9]|1[0-2])"),
    indice = str_replace(indice, ".*Variaci.n anual.*", "Var_anual")
  ) %>%
  filter(ccaa == "Nacional", indice == "Var_anual")
# Rename the columns by position, keep the four we need and switch the decimal
# mark from comma to dot.
# Month suffixes (M01 ... M12) are removed so that `periodo` holds only the
# year, and labels containing odd characters are replaced by plain ones.
# Finally `periodo` and `valor` are converted to numeric.

# Pattern -> label for the kind of figure; patterns are applied in this order.
recod_indice <- c(
  ".*ndice.*" = "indice",
  ".*Variaci.n mensual.*" = "Var_mens",
  ".*Variaci.n anual.*" = "Var_anual"
)

# Pattern -> label for each region. A `.` stands in for characters that do not
# survive the import; patterns wrapped in `.*` replace the whole string, the
# others replace only the matched text.
recod_ccaa <- c(
  ".*16 Pa.s Vasco.*" = "PV",
  ".*14 Murcia, Regi.n de.*" = "Murcia",
  ".*01 Andaluc.a.*" = "Andalucia",
  ".*02 Arag.n.*" = "Aragon",
  ".*07 Castilla y Le.n.*" = "CyL",
  ".*09 Catalu.a.*" = "CAT",
  "03 Asturias, Principado de" = "Asturias",
  "04 Balears, Illes" = "Islas Baleares",
  "05 Canarias" = "Canarias",
  "06 Cantabria" = "Cantabria",
  "08 Castilla - La Mancha" = "Castilla La Mancha",
  "10 Comunitat Valenciana" = "Comunidad Valenciana",
  "11 Extremadura" = "Extremadura",
  "12 Galicia" = "Galicia",
  "13 Madrid, Comunidad de" = "Madrid",
  "15 Navarra, Comunidad Foral de" = "Navarra",
  "17 Rioja, La" = "La Rioja",
  "18 Ceuta" = "Ceuta",
  "19 Melilla" = "Melilla"
)

ccaa_inflacion <- ccaa_inflacion %>%
  rename(indice = 2, ccaa = 3, periodo = 4, valor = 5) %>%
  select(indice, ccaa, periodo, valor) %>%
  mutate(
    valor = as.numeric(gsub(",", ".", valor, fixed = TRUE)),
    periodo = as.numeric(str_remove_all(periodo, "M(0[1-9]|1[0-2])")),
    indice = str_replace_all(indice, recod_indice),
    ccaa = str_replace_all(ccaa, recod_ccaa)
  )
# Reference level for the index numbers: the mean of the 2002 "indice" values
# of each region. summarise() removes only the innermost grouping level
# (periodo), so the result is still grouped by ccaa.
ccaa_inflacion_base2002 <- ccaa_inflacion %>%
  filter(indice == "indice" & periodo == 2002) %>%
  group_by(ccaa, periodo) %>%
  summarise(base = mean(valor, na.rm = TRUE)) %>%
  select(ccaa, base)
# Index numbers with base 2002 = 100 for every year from 2002 to 2025.

# Build the table of one year.
#   anio   Year to process (numeric).
#   datos  Cleaned table with columns indice, ccaa, periodo and valor.
#   bases  Table with columns ccaa and base (the 2002 mean of each region).
# Returns a table with columns periodo, indice, ccaa and valor, one row per
# region and year, grouped by ccaa and periodo. Regions present in `bases` but
# absent from the year are kept by the full join with missing values.
calcular_indice_base2002 <- function(anio,
                                     datos = ccaa_inflacion,
                                     bases = ccaa_inflacion_base2002) {
  datos %>%
    filter(periodo == anio, indice == "indice") %>%
    # The yearly mean must be taken per region for every year; grouping by
    # periodo alone would give all regions the same pooled mean.
    group_by(ccaa, periodo) %>%
    mutate(media = mean(valor, na.rm = TRUE)) %>%
    full_join(bases, by = "ccaa") %>%
    mutate(valor = (media / base) * 100) %>%
    # After overwriting valor all rows of a group are identical.
    distinct() %>%
    select(periodo, indice, ccaa, valor)
}

anios <- 2002:2025
tablas_anuales <- lapply(anios, calcular_indice_base2002)
names(tablas_anuales) <- sprintf("ccaa_inflacion_%02d", anios %% 100L)

# Also expose each yearly table under its own name (ccaa_inflacion_02 ...
# ccaa_inflacion_25) so that code referring to them individually keeps working.
invisible(list2env(tablas_anuales, envir = environment()))

# Once the index numbers of every year are available, merge all the tables
# into a single data frame. The join keys are spelled out explicitly; they are
# all four columns, so the yearly tables are stacked one after another.
claves_union <- c("periodo", "indice", "ccaa", "valor")
original <- purrr::reduce(
  tablas_anuales,
  function(acumulado, tabla) full_join(acumulado, tabla, by = claves_union)
)