si.Rmd

title: "The energy and carbon inequality corridor for a 1.5°C compatible and just Europe: supplementary information"
author:
- Ingram S. Jaccard:
    email: jaccard@pik-potsdam.de
    institute: [PIK]
    correspondence: false
- Peter-Paul Pichler:
    email: pichler@pik-potsdam.de
    institute: [PIK]
    correspondence: false
- Johannes Többen:
    email: toebben@pik-potsdam.de
    institute: [PIK, GWS]
    correspondence: false
- Helga Weisz:
    email: weisz@pik-potsdam.de
    institute: [PIK, HU]
    correspondence: false
institute:
- PIK: Social Metabolism and Impacts, Potsdam Institute for Climate Impact Research, Member of the Leibniz Association, PO Box 60 12 03, Potsdam, 14412, Germany
- HU: Department of Cultural History & Theory and Department of Social Sciences, Humboldt University Berlin, Unter den Linden 6, Berlin, 10117, Germany
- GWS: Gesellschaft für Wirtschaftliche Strukturforschung (GWS) mbH, Heinrichstraße 30, 49080 Osnabrück, Germany
output:
  word_document:
    fig_caption: yes
    reference_docx: ../templates/template.docx
    pandoc_args:
    - --lua-filter=../templates/scholarly-metadata.lua
    - --lua-filter=../templates/author-info-blocks.lua
    - --lua-filter=../templates/pagebreak.lua
bibliography: references.bib
csl: ../templates/vancouver.csl
content: |
  35 pages, 13 tables, 7 figures
always_allow_html: yes

# Initial chunk default; the second opts_chunk$set() call further down
# overrides `echo` again.
knitr::opts_chunk$set(echo = TRUE)
# NOTE(review): source_gist() downloads and evaluates code from a GitHub gist
# at knit time, so rendering needs network access and trusts whatever the gist
# currently contains. Consider vendoring render_toc.R into the repository.
devtools::source_gist("c83e078bf8c81b035e32c3fc0cf04ee8",
                      filename = 'render_toc.R')


# render_toc() is defined by the gist sourced above; presumably it emits a
# table of contents for si.Rmd - confirm against the gist.
render_toc("si.Rmd")

# Chunk defaults applied to the rest of the document: hide code, warnings and
# messages, and write figures at 300 dpi under ../figures/.
knitr::opts_chunk$set(
  collapse = TRUE,
  warning = FALSE,
  message = FALSE,
  echo = FALSE,
  comment = "#>",
  fig.path = "../figures/",
  dpi = 300
)

# Install pacman when it cannot be loaded, then use it to load all other
# packages in a single call.
if (!require("pacman")) install.packages("pacman")
pacman::p_load(tidyverse,
               janitor,
               here,
               wbstats,
               ISOcodes,
               viridis,
               hrbrthemes,
               wesanderson,
               glue,
               ggridges,
               patchwork,
               kableExtra,
               readxl,
               flextable)

# Five-colour discrete palette; `pal[1]` is the fill colour of the plots below.
pal <- wes_palette("Cavalcanti1", 5, type = "discrete")
# NOTE(review): presumably needed so the "Liberation Sans Narrow" family used in
# the plot themes is available to the graphics device - confirm.
extrafont::loadfonts()

# High scipen penalty: prefer fixed over scientific notation when printing.
options(scipen=999)


# `here` is already in the p_load() list above, so this call is redundant but
# harmless.
library(here)

#"HBS structure with calculations of quintile shares per sector."

# Worked example, step 1: a toy household budget survey (HBS) with five
# quintiles and two sectors.
quintile <- paste0("q", 1:5)
pps_hh <- c(10, 13, 20, 33, 40)

# Per-mille (parts per 1000) split of each quintile's spending between the
# two sectors.
pm_sector1 <- c(200, 300, 400, 500, 600)
pm_sector2 <- c(800, 700, 600, 500, 400)

# Spending per sector and each quintile's share of the sector total; all
# numeric columns are rounded to two decimals for display.
hbs <- data.frame(quintile, pps_hh, pm_sector1, pm_sector2)
hbs <- mutate(
  hbs,
  pps_hh_sector1 = pps_hh * (pm_sector1 / 1000),
  sector_1_shares = pps_hh_sector1 / sum(pps_hh_sector1),
  pps_hh_sector2 = pps_hh * (pm_sector2 / 1000),
  sector_2_shares = pps_hh_sector2 / sum(pps_hh_sector2)
)
hbs <- mutate_if(hbs, is.numeric, round, digits = 2)

# Render the example as a table with short column headers.
hbs_table <- flextable(hbs)
hbs_table <- autofit(hbs_table)
hbs_table <- set_header_labels(
  hbs_table,
  quintile = "quintile",
  pps_hh = "pps hh",
  pm_sector1 = "s1 (pm)",
  pm_sector2 = "s2 (pm)",
  pps_hh_sector1 = "s1 (pps hh)",
  sector_1_shares = "s1 (q share)",
  pps_hh_sector2 = "s2 (pps hh)",
  sector_2_shares = "s2 (q share)"
)
fit_to_width(hbs_table, max_width = 6.8)

# Worked example, step 2: turn the HBS spending per sector into quintile
# shares of each sector, then use the shares to split the EE-MRIO household
# final demand of that sector across quintiles.

# Long format: one row per (quintile, sector), sectors recoded to 1 and 2.
sector_spending_long <- hbs %>%
  select(quintile, pps_hh_sector1, pps_hh_sector2) %>%
  gather(sector, value, -quintile) %>%
  mutate(sector = dplyr::recode(sector,
                                "pps_hh_sector1" = 1,
                                "pps_hh_sector2" = 2))

# Share of each quintile within its sector, spread back to one row per sector
# with one column per quintile.
q_share_of_sector <- sector_spending_long %>%
  group_by(sector) %>%
  mutate(q_share_of_sector = value / sum(value)) %>%
  select(-value) %>%
  spread(quintile, q_share_of_sector)

# Example household final demand per sector (row order: sector 1, sector 2).
eemrio_hh_fd <- c(300, 800)

eemrio <- data.frame(q_share_of_sector, eemrio_hh_fd)
eemrio <- mutate(
  eemrio,
  q1_eemrio = q1 * eemrio_hh_fd,
  q2_eemrio = q2 * eemrio_hh_fd,
  q3_eemrio = q3 * eemrio_hh_fd,
  q4_eemrio = q4 * eemrio_hh_fd,
  q5_eemrio = q5 * eemrio_hh_fd
)
eemrio <- mutate_if(eemrio, is.numeric, round, digits = 2)

eemrio_table <- autofit(flextable(eemrio), add_w = 0.5)
eemrio_table <- set_header_labels(
  eemrio_table,
  sector = "sector",
  q1 = "q1 share",
  q2 = "q2 share",
  q3 = "q3 share",
  q4 = "q4 share",
  q5 = "q5 share",
  eemrio_hh_fd = "eemrio hh fd",
  q1_eemrio = "q1 fd",
  q2_eemrio = "q2 fd",
  q3_eemrio = "q3 fd",
  q4_eemrio = "q4 fd",
  q5_eemrio = "q5 fd"
)
fit_to_width(eemrio_table, max_width = 6.8)

# Worked example, step 3: multiply each quintile's final demand per sector by
# the sector's intensity (TIV) to obtain footprints.

# Example intensity per sector (row order: sector 1, sector 2).
TIV <- c(0.2, 0.4)

footprint <- data.frame(eemrio, TIV)
# Drop the share columns; keep final demand per quintile and the intensity.
footprint <- select(
  footprint,
  sector,
  eemrio_hh_fd,
  q1_eemrio,
  q2_eemrio,
  q3_eemrio,
  q4_eemrio,
  q5_eemrio,
  TIV
)
footprint <- mutate(
  footprint,
  q1_footprint = q1_eemrio * TIV,
  q2_footprint = q2_eemrio * TIV,
  q3_footprint = q3_eemrio * TIV,
  q4_footprint = q4_eemrio * TIV,
  q5_footprint = q5_eemrio * TIV,
  total_footprint = eemrio_hh_fd * TIV
)
footprint <- mutate_if(footprint, is.numeric, round, digits = 2)

footprint_table <- autofit(flextable(footprint))
footprint_table <- set_header_labels(
  footprint_table,
  sector = "sector",
  eemrio_hh_fd = "eemrio hh fd",
  q1_eemrio = "q1 fd",
  q2_eemrio = "q2 fd",
  q3_eemrio = "q3 fd",
  q4_eemrio = "q4 fd",
  q5_eemrio = "q5 fd",
  TIV = "TIV",
  q1_footprint = "q1 fp",
  q2_footprint = "q2 fp",
  q3_footprint = "q3 fp",
  q4_footprint = "q4 fp",
  q5_footprint = "q5 fp",
  total_footprint = "total fp"
)
fit_to_width(footprint_table, max_width = 6.8)

# Mapping table: distinct combinations of EXIOBASE industry (V2), COICOP
# consumption category and aggregate consumption category.
#
# The path is passed to here() as separate components without a leading slash.
# A leading "/" makes the path absolute, and current here/rprojroot versions
# return absolute paths unchanged instead of resolving them against the
# project root, so the file would be looked up at the filesystem root.
labels = read.csv(here("analysis",
                       "preprocessing",
                       "income-stratified-footprints",
                       "Exiobase_T_labels_ixi_w_coicop_mapping.csv")) %>%
  select(V2,coicop,five_sectors) %>%
  unique()

# Fixed column widths: wide first column for the long industry names.
flextable(labels) %>%
  autofit() %>%
  set_header_labels(V2 = "exiobase industry production sector",
                    coicop = "coicop consumption category",
                    five_sectors = "aggregate consumption category") %>%
  width(j=1, width = 4) %>%
  width(j=2, width = 1.5) %>%
  width(j=3, width = 1.5)


# Country-by-year coverage table: an "x" marks a country/year combination
# that is covered, an empty string one that is not.
geo <- c(
  "Austria", "Belgium", "Bulgaria", "Cyprus", "Czech Rep.", "Germany",
  "Denmark", "Estonia", "Greece", "Spain", "Finland", "France",
  "Croatia", "Hungary", "Ireland", "Italy", "Lithuania", "Luxembourg",
  "Latvia", "Montenegro", "North Macedonia", "Malta", "Netherlands", "Norway",
  "Poland", "Portugal", "Romania", "Serbia", "Sweden", "Slovenia",
  "Slovakia", "Turkey", "UK", "Kosovo"
)

# Marker column for one year: "" for the listed countries, "x" for the rest.
coverage_marks <- function(not_covered) {
  ifelse(geo %in% not_covered, "", "x")
}

year_2015 <- coverage_marks("Italy")
year_2010 <- coverage_marks(c("Italy", "Luxembourg", "Serbia", "Kosovo"))
year_2005 <- coverage_marks(c("Montenegro", "Serbia", "Kosovo"))

country_year_coverage <- data.frame(geo,
                                    year_2015,
                                    year_2010,
                                    year_2005)

# Rows printed in red, looked up by name (rows 20, 21, 28 and 34 of `geo`).
red_rows <- match(c("Montenegro", "North Macedonia", "Serbia", "Kosovo"), geo)

coverage_table <- autofit(flextable(country_year_coverage))
coverage_table <- set_header_labels(
  coverage_table,
  geo = "Country",
  year_2015 = "2015",
  year_2010 = "2010",
  year_2005 = "2005"
)
coverage_table <- color(coverage_table, i = red_rows, color = 'red')
fit_to_width(coverage_table, max_width = 7.5)


# Worked example with a price conversion: each sector's spending is scaled by
# a "bp share in pp" factor (presumably basic-price share of purchaser-price
# spending - confirm against the text), here 0.5 for sector 1 and 1 for
# sector 2 in every quintile.
bp_share_in_pp_sector_1 <- rep(0.5, 5)
bp_share_in_pp_sector_2 <- rep(1, 5)

hbs_bp <- data.frame(quintile,
                     pps_hh,
                     pm_sector1,
                     pm_sector2,
                     bp_share_in_pp_sector_1,
                     bp_share_in_pp_sector_2)
# Spending per sector before and after the conversion, with the quintile
# shares of each sector total in both variants.
hbs_bp <- mutate(
  hbs_bp,
  pps_hh_sector1 = pps_hh * (pm_sector1 / 1000),
  pps_hh_sector1_bp = pps_hh_sector1 * bp_share_in_pp_sector_1,
  sector_1_shares = pps_hh_sector1 / sum(pps_hh_sector1),
  sector_1_shares_bp = pps_hh_sector1_bp / sum(pps_hh_sector1_bp),
  pps_hh_sector2 = pps_hh * (pm_sector2 / 1000),
  pps_hh_sector2_bp = pps_hh_sector2 * bp_share_in_pp_sector_2,
  sector_2_shares = pps_hh_sector2 / sum(pps_hh_sector2),
  sector_2_shares_bp = pps_hh_sector2_bp / sum(pps_hh_sector2_bp),
  pps_hh_bp = pps_hh_sector1_bp + pps_hh_sector2_bp
)

# Display subset: inputs, conversion factors and converted spending.
hbs_bp_pps <- select(
  hbs_bp,
  quintile,
  pps_hh,
  pm_sector1,
  pm_sector2,
  pps_hh_sector1,
  bp_share_in_pp_sector_1,
  pps_hh_sector1_bp,
  pps_hh_sector2,
  bp_share_in_pp_sector_2,
  pps_hh_sector2_bp
)
hbs_bp_pps <- mutate_if(hbs_bp_pps, is.numeric, round, digits = 2)

hbs_bp_pps_table <- autofit(flextable(hbs_bp_pps))
hbs_bp_pps_table <- set_header_labels(
  hbs_bp_pps_table,
  quintile = "quintile",
  pps_hh = "pps hh",
  pm_sector1 = "s1 (pm)",
  pm_sector2 = "s2 (pm)",
  pps_hh_sector1 = "s1 (pps hh)",
  bp_share_in_pp_sector_1 = "s1 bp",
  pps_hh_sector1_bp = "s1 (pps hh bp)",
  pps_hh_sector2 = "s2 (pps hh)",
  bp_share_in_pp_sector_2 = "s2 bp",
  pps_hh_sector2_bp = "s2 (pps hh bp)"
)
fit_to_width(hbs_bp_pps_table, max_width = 6.8)


# Converted spending per quintile together with the quintile shares of each
# sector, plus the per-mille split between the two sectors recomputed from
# the converted values.
hbs_bp_shares <- select(
  hbs_bp,
  quintile,
  pps_hh_bp,
  pps_hh_sector1_bp,
  sector_1_shares_bp,
  pps_hh_sector2_bp,
  sector_2_shares_bp
)
hbs_bp_shares <- mutate(
  hbs_bp_shares,
  pm_sector1_bp =
    (pps_hh_sector1_bp / (pps_hh_sector1_bp + pps_hh_sector2_bp)) * 1000,
  pm_sector2_bp =
    (pps_hh_sector2_bp / (pps_hh_sector1_bp + pps_hh_sector2_bp)) * 1000
)
hbs_bp_shares <- mutate_if(hbs_bp_shares, is.numeric, round, digits = 2)

hbs_bp_shares_table <- autofit(flextable(hbs_bp_shares))
hbs_bp_shares_table <- set_header_labels(
  hbs_bp_shares_table,
  quintile = "quintile",
  pps_hh_bp = "pps hh bp",
  pps_hh_sector1_bp = "s1 (pps hh bp)",
  sector_1_shares_bp = "s1 (q share bp)",
  pps_hh_sector2_bp = "s2 (pps hh bp)",
  sector_2_shares_bp = "s2 (q share bp)",
  pm_sector1_bp = "s1 (pm bp)",
  pm_sector2_bp = "s2 (pm bp)"
)
fit_to_width(hbs_bp_shares_table, max_width = 6.8)


# Same split of EE-MRIO household final demand across quintiles as in the
# first example, but using the converted ("bp") spending to form the shares.

# Long format: one row per (quintile, sector), sectors recoded to 1 and 2.
sector_spending_bp_long <- hbs_bp_shares %>%
  select(quintile, pps_hh_sector1_bp, pps_hh_sector2_bp) %>%
  gather(sector, value, -quintile) %>%
  mutate(sector = dplyr::recode(sector,
                                "pps_hh_sector1_bp" = 1,
                                "pps_hh_sector2_bp" = 2))

# Quintile share within each sector, one row per sector.
q_share_of_sector_bp <- sector_spending_bp_long %>%
  group_by(sector) %>%
  mutate(q_share_of_sector_bp = value / sum(value)) %>%
  select(-value) %>%
  spread(quintile, q_share_of_sector_bp)

# Example household final demand per sector (row order: sector 1, sector 2).
eemrio_hh_fd <- c(300, 800)

eemrio_bp <- data.frame(q_share_of_sector_bp, eemrio_hh_fd)
eemrio_bp <- mutate(
  eemrio_bp,
  q1_eemrio = q1 * eemrio_hh_fd,
  q2_eemrio = q2 * eemrio_hh_fd,
  q3_eemrio = q3 * eemrio_hh_fd,
  q4_eemrio = q4 * eemrio_hh_fd,
  q5_eemrio = q5 * eemrio_hh_fd
)
eemrio_bp <- mutate_if(eemrio_bp, is.numeric, round, digits = 2)

eemrio_bp_table <- autofit(flextable(eemrio_bp))
eemrio_bp_table <- set_header_labels(
  eemrio_bp_table,
  sector = "sector",
  q1 = "q1 share bp",
  q2 = "q2 share bp",
  q3 = "q3 share bp",
  q4 = "q4 share bp",
  q5 = "q5 share bp",
  eemrio_hh_fd = "eemrio hh fd",
  q1_eemrio = "q1 fd",
  q2_eemrio = "q2 fd",
  q3_eemrio = "q3 fd",
  q4_eemrio = "q4 fd",
  q5_eemrio = "q5 fd"
)
fit_to_width(eemrio_bp_table, max_width = 6.8)

# Load the project's data wrangling helpers (the get_*() loaders and
# pivot_results_longer_adorn() used below).
source(here("analysis", "R", "wrangler_functions.R"))

# Load result data for EU deciles (10 EU-wide quantiles).
eu_q_count <- 10

# Each result set is loaded in wide form (dat_*) and then pivoted to long
# format with readable indicator names attached (pdat_*); `cols_ex` is the
# vector of column names handed to the pivot helper for that result set.

# 1. Countries aggregated by country quintile and EU ntile.
dat_country_summary_by_cquint_and_euntile <-
  get_country_summary_by_cquint_and_euntile(eu_q_count)
cols_ex <- c("year", "iso2", "quint", "eu_q_rank")
pdat_country_summary_by_cquint_and_euntile <-
  pivot_results_longer_adorn(dat_country_summary_by_cquint_and_euntile,
                             cols_ex)

# 2. Countries by EU quantile, without sectoral resolution.
dat_country_summary_by_eu_ntile <- get_country_summary_by_eu_ntile(eu_q_count)
cols_ex <- c("year", "iso2", "eu_q_rank")
pdat_country_summary_by_eu_ntile <-
  pivot_results_longer_adorn(dat_country_summary_by_eu_ntile, cols_ex)

# 3. Countries by country quintile, with aggregate sectoral resolution.
dat_sector_summary_by_country_quintile <-
  get_sector_summary_by_country_quintile(eu_q_count)
cols_ex <- c("year", "iso2", "quint", "eu_q_rank", "sector_agg_id")
pdat_sector_summary_by_country_quintile <-
  pivot_results_longer_adorn(dat_sector_summary_by_country_quintile, cols_ex)

# 4. EU ntiles, with aggregate sectoral resolution.
dat_sector_summary_by_eu_ntile <- get_sector_summary_by_eu_ntile(eu_q_count)
cols_ex <- c("year", "eu_q_rank", "sector_agg_id")
pdat_sector_summary_by_eu_ntile <-
  pivot_results_longer_adorn(dat_sector_summary_by_eu_ntile, cols_ex)


# Map of the share of each country's population that falls into the bottom
# four European deciles in 2015.

# Country quintiles that sit in EU deciles 1-4. Each country quintile is
# counted as one fifth of the country, so n()/5*100 turns the number of such
# quintiles into a percentage.
tmp3 = pdat_country_summary_by_cquint_and_euntile %>%
  filter(eu_q_rank < 5, year== 2015,  indicator=="pae_fd_ke") %>%
  group_by(iso3, quint) %>%
  summarise(value = sum(value)) %>%
  group_by(iso3) %>%
  summarise(pop = n()/5*100)

# Start from the first-quintile rows of every country with a share of 0, then
# add the shares from tmp3; countries absent from tmp3 keep 0.
tmp4 = pdat_country_summary_by_cquint_and_euntile %>%
  ungroup() %>%
  filter(quint == 1, year== 2015,  indicator=="pae_fd_ke") %>%
  transmute(iso3, pop2 = 0) %>%
  left_join(tmp3, by="iso3") %>%
  transmute(iso3, popshare = if_else(is.na(pop), pop2, pop+pop2))

library(rworldmap)
library(ggthemes)

# Attach the shares to the world map by ISO3 code and extract the polygons.
quantile_rank_map = joinCountryData2Map(tmp4, joinCode = "ISO_A3", nameJoinColumn = "iso3")
quantile_rank_map_poly = fortify(quantile_rank_map) #extract polygons

# Bring the map attributes (including popshare) back onto the polygon points.
# TRUE is spelled out because `T` is an ordinary variable that can be
# reassigned.
quantile_rank_map_poly = merge(quantile_rank_map_poly, quantile_rank_map@data, by.x="id", by.y="ADMIN", all.x=TRUE)
# merge() does not keep row order; restore the drawing order within polygons.
quantile_rank_map_poly = quantile_rank_map_poly %>% arrange(id, order)


# First layer draws all polygons with a black outline, second layer fills them
# by population share (treated as a discrete scale).
map1 = ggplot() +
  geom_polygon(data = quantile_rank_map_poly, aes(long, lat, group = group), color="black") +
  geom_polygon(data = quantile_rank_map_poly, aes(long, lat, group = group,
                                        fill=factor(popshare))) +
  #scale_fill_gradient(name="Mean decile \nrank", low="skyblue", high = "skyblue4", na.value = "#EEEEEE") +
  scale_fill_viridis(direction = -1, discrete = TRUE, na.value = "white", name="Population\n share in\n bottom 4\n European\n deciles (%)") +
  theme_map() +
  coord_map("bonne", lat0 = 50,xlim = c(-9, 44), ylim = c(35, 70), clip="on") +
  theme(legend.position = c(0.75, 0.28))


map1

# Save this plot explicitly instead of relying on last_plot().
# NOTE(review): the same output path (figureS1.pdf) is written by another
# ggsave() call later in this file, so one figure overwrites the other -
# confirm the intended file name for each figure.
ggsave(here("analysis", "figures", "figureS1.pdf"), plot = map1, device=cairo_pdf)

# Price-conversion example (same inputs as the earlier hbs_bp example): each
# sector's spending is scaled by a "bp share in pp" factor - presumably the
# basic-price share of purchaser-price spending, confirm against the text.
bp_share_in_pp_sector_1 <- rep(0.5, 5)
bp_share_in_pp_sector_2 <- rep(1, 5)

hbs_bp <- data.frame(quintile,
                     pps_hh,
                     pm_sector1,
                     pm_sector2,
                     bp_share_in_pp_sector_1,
                     bp_share_in_pp_sector_2)
# Spending per sector before and after the conversion, with the quintile
# shares of each sector total in both variants.
hbs_bp <- mutate(
  hbs_bp,
  pps_hh_sector1 = pps_hh * (pm_sector1 / 1000),
  pps_hh_sector1_bp = pps_hh_sector1 * bp_share_in_pp_sector_1,
  sector_1_shares = pps_hh_sector1 / sum(pps_hh_sector1),
  sector_1_shares_bp = pps_hh_sector1_bp / sum(pps_hh_sector1_bp),
  pps_hh_sector2 = pps_hh * (pm_sector2 / 1000),
  pps_hh_sector2_bp = pps_hh_sector2 * bp_share_in_pp_sector_2,
  sector_2_shares = pps_hh_sector2 / sum(pps_hh_sector2),
  sector_2_shares_bp = pps_hh_sector2_bp / sum(pps_hh_sector2_bp),
  pps_hh_bp = pps_hh_sector1_bp + pps_hh_sector2_bp
)

# Table 1: inputs, conversion factors and converted spending.
hbs_bp_pps <- select(
  hbs_bp,
  quintile,
  pps_hh,
  pm_sector1,
  pm_sector2,
  pps_hh_sector1,
  bp_share_in_pp_sector_1,
  pps_hh_sector1_bp,
  pps_hh_sector2,
  bp_share_in_pp_sector_2,
  pps_hh_sector2_bp
)
hbs_bp_pps <- mutate_if(hbs_bp_pps, is.numeric, round, digits = 2)

hbs_bp_pps_table <- autofit(flextable(hbs_bp_pps))
hbs_bp_pps_table <- set_header_labels(
  hbs_bp_pps_table,
  quintile = "quintile",
  pps_hh = "pps hh",
  pm_sector1 = "s1 (pm)",
  pm_sector2 = "s2 (pm)",
  pps_hh_sector1 = "s1 (pps hh)",
  bp_share_in_pp_sector_1 = "s1 bp",
  pps_hh_sector1_bp = "s1 (pps hh bp)",
  pps_hh_sector2 = "s2 (pps hh)",
  bp_share_in_pp_sector_2 = "s2 bp",
  pps_hh_sector2_bp = "s2 (pps hh bp)"
)
fit_to_width(hbs_bp_pps_table, max_width = 7)


# Table 2: converted spending and the per-mille split between the two sectors
# recomputed from it (this variant omits the quintile-share columns).
hbs_bp_shares <- select(
  hbs_bp,
  quintile,
  pps_hh_bp,
  pps_hh_sector1_bp,
  pps_hh_sector2_bp
)
hbs_bp_shares <- mutate(
  hbs_bp_shares,
  pm_sector1_bp =
    (pps_hh_sector1_bp / (pps_hh_sector1_bp + pps_hh_sector2_bp)) * 1000,
  pm_sector2_bp =
    (pps_hh_sector2_bp / (pps_hh_sector1_bp + pps_hh_sector2_bp)) * 1000
)
hbs_bp_shares <- mutate_if(hbs_bp_shares, is.numeric, round, digits = 2)

hbs_bp_shares_table <- autofit(flextable(hbs_bp_shares))
hbs_bp_shares_table <- set_header_labels(
  hbs_bp_shares_table,
  quintile = "quintile",
  pps_hh_bp = "pps hh bp",
  pps_hh_sector1_bp = "s1 (pps hh bp)",
  pps_hh_sector2_bp = "s2 (pps hh bp)",
  pm_sector1_bp = "s1 (pm bp)",
  pm_sector2_bp = "s2 (pm bp)"
)
fit_to_width(hbs_bp_shares_table, max_width = 7.5)


# Alternative method example: instead of splitting each sector's final demand
# by quintile shares of that sector, total final demand is first split across
# quintiles by their share of total spending and then across sectors by each
# quintile's per-mille sector split.
quintile <- paste0("q", 1:5)
pps_hh <- c(9, 11, 16, 25, 28)

pm_sector1 <- c(111, 176, 250, 333, 429)
pm_sector2 <- c(889, 824, 750, 667, 571)

hbs_alt_method <- data.frame(quintile,
                             pps_hh,
                             pm_sector1,
                             pm_sector2,
                             bp_share_in_pp_sector_1,
                             bp_share_in_pp_sector_2)
# 1100 is the total final demand distributed across quintiles (it equals
# 300 + 800, the per-sector eemrio_hh_fd values of the earlier examples).
hbs_alt_method <- mutate(
  hbs_alt_method,
  mean_expenditure_share = pps_hh / sum(pps_hh),
  eemrio_hh_fd = 1100 * mean_expenditure_share,
  hh_sector1 = eemrio_hh_fd * (pm_sector1 / 1000),
  hh_sector1_bp = hh_sector1 * bp_share_in_pp_sector_1,
  hh_sector2 = eemrio_hh_fd * (pm_sector2 / 1000),
  hh_sector2_bp = hh_sector2 * bp_share_in_pp_sector_2
)

# Table 1: final demand per quintile and sector.
hbs_alt_method_fd <- select(
  hbs_alt_method,
  quintile,
  pps_hh,
  pm_sector1,
  pm_sector2,
  mean_expenditure_share,
  eemrio_hh_fd,
  hh_sector1,
  hh_sector2
)
hbs_alt_method_fd <- mutate_if(hbs_alt_method_fd, is.numeric, round, digits = 2)

alt_fd_table <- autofit(flextable(hbs_alt_method_fd))
alt_fd_table <- set_header_labels(
  alt_fd_table,
  quintile = "quintile",
  pps_hh = "pps hh",
  pm_sector1 = "s1 (pm)",
  pm_sector2 = "s2 (pm)",
  mean_expenditure_share = "mean exp",
  eemrio_hh_fd = "eemrio hh fd",
  hh_sector1 = "hh fd s1",
  hh_sector2 = "hh fd s2"
)
fit_to_width(alt_fd_table, max_width = 7.5)


# Table 2: the same final demand transposed to one row per sector and one
# column per quintile.
eemrio_alt_method <- hbs_alt_method %>%
  select(quintile, hh_sector1, hh_sector2) %>%
  gather(sector, value, -quintile) %>%
  spread(quintile, value)
eemrio_alt_method <- mutate(
  eemrio_alt_method,
  sector = dplyr::recode(sector,
                         "hh_sector1" = "1",
                         "hh_sector2" = "2")
)
eemrio_alt_method <- mutate_if(eemrio_alt_method, is.numeric, round, digits = 2)

alt_eemrio_table <- autofit(flextable(eemrio_alt_method))
alt_eemrio_table <- set_header_labels(
  alt_eemrio_table,
  sector = "sector",
  q1 = "q1 fd",
  q2 = "q2 fd",
  q3 = "q3 fd",
  q4 = "q4 fd",
  q5 = "q5 fd"
)
width(alt_eemrio_table, j = 1:6, width = 0.8)


# Table 3: footprints per quintile and sector, i.e. final demand times the
# sector intensity TIV defined in the first example.
footprint_alt_method <- data.frame(eemrio_alt_method, TIV)
footprint_alt_method <- mutate(
  footprint_alt_method,
  q1_footprint = q1 * TIV,
  q2_footprint = q2 * TIV,
  q3_footprint = q3 * TIV,
  q4_footprint = q4 * TIV,
  q5_footprint = q5 * TIV,
  total_footprint = q1_footprint +
    q2_footprint +
    q3_footprint +
    q4_footprint +
    q5_footprint
)
footprint_alt_method <- mutate_if(footprint_alt_method, is.numeric, round,
                                  digits = 2)

alt_footprint_table <- autofit(flextable(footprint_alt_method))
alt_footprint_table <- set_header_labels(
  alt_footprint_table,
  sector = "sector",
  q1 = "q1 fd",
  q2 = "q2 fd",
  q3 = "q3 fd",
  q4 = "q4 fd",
  q5 = "q5 fd",
  TIV = "TIV",
  q1_footprint = "q1 fp",
  q2_footprint = "q2 fp",
  q3_footprint = "q3 fp",
  q4_footprint = "q4 fp",
  q5_footprint = "q5 fp",
  total_footprint = "total fp"
)
fit_to_width(alt_footprint_table, max_width = 7.5)

# Load the project's data wrangling helpers (the get_*() loaders and
# pivot_results_longer_adorn() used below).
# NOTE(review): this sequence repeats an identical loading sequence earlier in
# the file; if both are evaluated in the same session the second run only
# recomputes the same objects - confirm whether both are needed.
source(here("analysis", "R", "wrangler_functions.R"))

# Load result data for EU deciles (10 EU-wide quantiles).
eu_q_count <- 10

# Each result set is loaded in wide form (dat_*) and then pivoted to long
# format with readable indicator names attached (pdat_*); `cols_ex` is the
# vector of column names handed to the pivot helper for that result set.

# 1. Countries aggregated by country quintile and EU ntile.
dat_country_summary_by_cquint_and_euntile <-
  get_country_summary_by_cquint_and_euntile(eu_q_count)
cols_ex <- c("year", "iso2", "quint", "eu_q_rank")
pdat_country_summary_by_cquint_and_euntile <-
  pivot_results_longer_adorn(dat_country_summary_by_cquint_and_euntile,
                             cols_ex)

# 2. Countries by EU quantile, without sectoral resolution.
dat_country_summary_by_eu_ntile <- get_country_summary_by_eu_ntile(eu_q_count)
cols_ex <- c("year", "iso2", "eu_q_rank")
pdat_country_summary_by_eu_ntile <-
  pivot_results_longer_adorn(dat_country_summary_by_eu_ntile, cols_ex)

# 3. Countries by country quintile, with aggregate sectoral resolution.
dat_sector_summary_by_country_quintile <-
  get_sector_summary_by_country_quintile(eu_q_count)
cols_ex <- c("year", "iso2", "quint", "eu_q_rank", "sector_agg_id")
pdat_sector_summary_by_country_quintile <-
  pivot_results_longer_adorn(dat_sector_summary_by_country_quintile, cols_ex)

# 4. EU ntiles, with aggregate sectoral resolution.
dat_sector_summary_by_eu_ntile <- get_sector_summary_by_eu_ntile(eu_q_count)
cols_ex <- c("year", "eu_q_rank", "sector_agg_id")
pdat_sector_summary_by_eu_ntile <-
  pivot_results_longer_adorn(dat_sector_summary_by_eu_ntile, cols_ex)


# Top row of the 2005 figure: bar charts of totals per European decile.

# Sum one indicator over all countries per EU decile for 2005, rescale it and
# draw it as a bar chart. `!!` forces the arguments to be taken from the
# function call and not from a data column of the same name.
decile_total_bars_2005 <- function(indicator_id, scale_factor, y_label) {
  decile_labels <- sprintf("D%02d", 1:10)

  pdat_country_summary_by_eu_ntile %>%
    filter(year == 2005,
           indicator == !!indicator_id) %>%
    group_by(eu_q_rank) %>%
    summarise(value = sum(value) * !!scale_factor,
              eu_ntile_name = first(eu_ntile_name)) %>%
    ggplot(aes(x = eu_ntile_name, y = value)) +
    geom_col(position = position_dodge(), fill = pal[1]) +
    theme_minimal() +
    theme(text = element_text(family = "Liberation Sans Narrow")) +
    labs(x = "", y = y_label) +
    theme(axis.text.x = element_text(angle = 90)) +
    scale_x_discrete(labels = decile_labels)
}

# The scale factors turn the stored units into the units shown on the axes
# (x 1e-6 for expenditure and energy, x 1e-9 for kg to Mt).
p1 <- decile_total_bars_2005("total_fd_me", 0.000001, "Expenditure (trn€)")
p2 <- decile_total_bars_2005("total_energy_use_tj", 0.000001,
                             "Energy footprint (EJ)")
p3 <- decile_total_bars_2005("total_co2eq_kg", 0.000000001,
                             "Carbon footprint (MtCO2eq)")

# patchwork: place the three panels side by side.
p_top <- p1 + p2 + p3


# Bottom row of the 2005 figure: distribution of intensities across countries
# within each European decile. Each panel shows a violin weighted by the
# denominator quantity, the individual country points, and a thick horizontal
# segment at the weighted mean of the decile.

# Carbon intensity of expenditure, weighted by expenditure.
p1 = dat_country_summary_by_eu_ntile %>%
  filter(year == 2005) %>%
  ggplot(aes(x=factor(eu_q_rank), y=pe_co2eq_kg)) +
  geom_violin(aes(weight=total_fd_me), fill=pal[1], color=pal[1], alpha=0.5) +
  geom_point( alpha=0.3) +
  geom_segment(data=dat_country_summary_by_eu_ntile %>%
                 filter(year == 2005) %>%
                 group_by(eu_q_rank) %>%
                 summarise(pe_co2eq_kg = weighted.mean(pe_co2eq_kg,total_fd_me)),
               aes(y=pe_co2eq_kg, yend=pe_co2eq_kg, x=eu_q_rank-0.3, xend=eu_q_rank+0.3), size=1.5) +
    theme_minimal() +
    theme(text=element_text(family="Liberation Sans Narrow")) +
    labs(x="", y="Carbon intensity per expenditure (kgCO2eq/€)") +
    theme(axis.text.x = element_text(angle = 90)) +
    scale_x_discrete(labels = c("D01","D02","D03","D04","D05","D06","D07","D08","D09","D10"))

# Energy intensity of expenditure, weighted by expenditure.
p2 = dat_country_summary_by_eu_ntile %>%
  filter(year == 2005) %>%
  ggplot(aes(x=factor(eu_q_rank), y=pe_energy_use_mj)) +
  geom_violin(aes(weight=total_fd_me), fill=pal[1], color=pal[1], alpha=0.5) +
  geom_point( alpha=0.3) +
  geom_segment(data=dat_country_summary_by_eu_ntile %>%
                 filter(year == 2005) %>%
                 group_by(eu_q_rank) %>%
                 summarise(pe_energy_use_mj = weighted.mean(pe_energy_use_mj,total_fd_me)),
               aes(y=pe_energy_use_mj, yend=pe_energy_use_mj, x=eu_q_rank-0.3, xend=eu_q_rank+0.3), size=1.5) +
    theme_minimal() +
    theme(text=element_text(family="Liberation Sans Narrow")) +
    labs(x="", y="Energy intensity per expenditure (MJ/€)") +
    theme(axis.text.x = element_text(angle = 90)) +
    scale_x_discrete(labels = c("D01","D02","D03","D04","D05","D06","D07","D08","D09","D10"))

# Carbon intensity of energy: kg * 0.001 gives tonnes, so the ratio is in
# t/TJ, which is numerically the same as g/MJ.
dat3 = dat_country_summary_by_eu_ntile %>%
  filter(year == 2005) %>%
  mutate(intensity_e_c = total_co2eq_kg*0.001/total_energy_use_tj)

# Carbon intensity of energy, weighted by energy use. The axis label states
# g/MJ to match the computed unit (the previous "gCO2eq/TJ" label was off by a
# factor of 1e6).
p3 = dat3 %>%
  ggplot(aes(x=factor(eu_q_rank), y=intensity_e_c)) +
  geom_violin(aes(weight=total_energy_use_tj), fill=pal[1], color=pal[1], alpha=0.5) +
  geom_point( alpha=0.3) +
  geom_segment(data=dat3 %>%
                 filter(year == 2005) %>%
                 group_by(eu_q_rank) %>%
                 summarise(intensity_e_c = weighted.mean(intensity_e_c,total_energy_use_tj)),
               aes(y=intensity_e_c, yend=intensity_e_c, x=eu_q_rank-0.3, xend=eu_q_rank+0.3), size=1.5) +
    theme_minimal() +
    theme(text=element_text(family="Liberation Sans Narrow")) +
    labs(x="", y="Carbon intensity per energy (gCO2eq/MJ)") +
    theme(axis.text.x = element_text(angle = 90)) +
    scale_x_discrete(labels = c("D01","D02","D03","D04","D05","D06","D07","D08","D09","D10"))

# Panel order: energy intensity, carbon intensity of expenditure, carbon
# intensity of energy.
p_bottom = p2 + p1 + p3


# values in text

# Value of `column` in the row(s) of `tbl` whose eu_q_rank equals `decile`.
# which() drops NA comparisons, so rows with a missing rank are never selected.
at_decile <- function(tbl, decile, column = "value") {
  tbl[[column]][which(tbl$eu_q_rank == decile)]
}

# EU-wide 2005 total of one indicator per decile, multiplied by `scale_factor`.
# `!!` forces the arguments to be taken from the call, not from a data column.
decile_totals_2005 <- function(indicator_id, scale_factor) {
  pdat_country_summary_by_eu_ntile %>%
    filter(year == 2005,
           indicator == !!indicator_id) %>%
    group_by(eu_q_rank) %>%
    summarise(value = sum(value) * !!scale_factor,
              eu_ntile_name = first(eu_ntile_name))
}

## inequality: totals per decile, overall total, and top-to-bottom decile ratio
exp <- decile_totals_2005("total_fd_me", 0.000001)
exp_total <- sum(exp$value)
exp_10_10 <- round(at_decile(exp, 10) / at_decile(exp, 1), digits = 1)

energy <- decile_totals_2005("total_energy_use_tj", 0.000001)
energy_total <- sum(energy$value)
energy_10_10 <- round(at_decile(energy, 10) / at_decile(energy, 1), digits = 1)

co2eq <- decile_totals_2005("total_co2eq_kg", 0.000000001)
co2eq_total <- sum(co2eq$value)
co2eq_10_10 <- round(at_decile(co2eq, 10) / at_decile(co2eq, 1), digits = 1)

## total per decile

exp_bottom_decile <- round(at_decile(exp, 1), digits = 1)
exp_top_decile <- round(at_decile(exp, 10), digits = 1)

energy_bottom_decile <- round(at_decile(energy, 1), digits = 1)
energy_top_decile <- round(at_decile(energy, 10), digits = 1)

co2eq_bottom_decile <- round(at_decile(co2eq, 1), digits = 1)
co2eq_top_decile <- round(at_decile(co2eq, 10), digits = 1)


## per adult equivalent per decile

# Number of adult equivalents per decile (unscaled sum).
aeu <- decile_totals_2005("total_adult_eq", 1)

# The multipliers undo the scaling applied to the totals above, so the
# per-adult-equivalent values come out in the units named in the column names.
exp_pae <- exp %>%
  rename(total_fd_me = value) %>%
  left_join(aeu, by = c("eu_q_rank", "eu_ntile_name")) %>%
  mutate(pae_fd_e = (total_fd_me / value) * 1000000000000)

fd_pae_bottom_decile <- round(at_decile(exp_pae, 1, "pae_fd_e"), digits = 0)
fd_pae_top_decile <- round(at_decile(exp_pae, 10, "pae_fd_e"), digits = 0)

energy_pae <- energy %>%
  rename(total_energy_use_tj = value) %>%
  left_join(aeu, by = c("eu_q_rank", "eu_ntile_name")) %>%
  mutate(pae_energy_use_gj = (total_energy_use_tj / value) * 1000000000)

energy_pae_bottom_decile <-
  round(at_decile(energy_pae, 1, "pae_energy_use_gj"), digits = 1)
energy_pae_top_decile <-
  round(at_decile(energy_pae, 10, "pae_energy_use_gj"), digits = 1)

co2eq_pae <- co2eq %>%
  rename(total_co2eq_kg = value) %>%
  left_join(aeu, by = c("eu_q_rank", "eu_ntile_name")) %>%
  mutate(pae_co2eq_t = (total_co2eq_kg / value) * 1000000)

co2eq_pae_bottom_decile <-
  round(at_decile(co2eq_pae, 1, "pae_co2eq_t"), digits = 1)
co2eq_pae_top_decile <-
  round(at_decile(co2eq_pae, 10, "pae_co2eq_t"), digits = 1)


## intensities

# Expenditure-weighted mean energy intensity per decile.
mean_energy_intens <- dat_country_summary_by_eu_ntile %>%
  filter(year == 2005) %>%
  group_by(eu_q_rank) %>%
  summarise(pe_energy_use_mj = weighted.mean(pe_energy_use_mj, total_fd_me))

mean_energy_intens_bottom_decile <-
  round(at_decile(mean_energy_intens, 1, "pe_energy_use_mj"), digits = 1)
mean_energy_intens_top_decile <-
  round(at_decile(mean_energy_intens, 10, "pe_energy_use_mj"), digits = 1)

# Energy-weighted mean carbon intensity of energy per decile.
mean_co2eq_of_energy_intens <- dat_country_summary_by_eu_ntile %>%
  filter(year == 2005) %>%
  mutate(intensity_e_c = total_co2eq_kg * 0.001 / total_energy_use_tj) %>%
  group_by(eu_q_rank) %>%
  summarise(intensity_e_c = weighted.mean(intensity_e_c, total_energy_use_tj))

mean_co2eq_of_energy_intens_bottom_decile <-
  round(at_decile(mean_co2eq_of_energy_intens, 1, "intensity_e_c"), digits = 1)
mean_co2eq_of_energy_intens_top_decile <-
  round(at_decile(mean_co2eq_of_energy_intens, 10, "intensity_e_c"), digits = 1)


# Stack the `p_top` row above the `p_bottom` row, tag the panels with
# lowercase letters, and apply one shared theme to every panel via `&`.
a <- p_top / p_bottom +
  plot_annotation(tag_levels = "a") +
  plot_layout(guides = "collect") &
  theme(
    plot.margin = unit(c(0.25, 0.25, 0.25, 0.25), "cm"),
    legend.position = "bottom",
    axis.title.y = element_text(size = 13, hjust = 0.5),
    axis.text.x = element_text(size = 12),
    axis.text.y = element_text(size = 12),
    legend.text = element_text(size = 12),
    legend.title = element_text(size = 13)
  )
a

# Pass the figure explicitly: without `plot =`, ggsave() writes whatever
# last_plot() currently returns, which depends on implicit session state.
ggsave(
  here("analysis", "figures", "figureS1.pdf"),
  plot = a,
  device = cairo_pdf
)


# Top row of the figure: one bar chart per indicator, showing the 2010
# total of each EU decile.

# Expenditure: decile sums of total_fd_me scaled by 1e-6.
p1 <- pdat_country_summary_by_eu_ntile %>%
  filter(year == 2010, indicator == "total_fd_me") %>%
  group_by(eu_q_rank) %>%
  summarise(
    value = sum(value) * 1e-6,
    eu_ntile_name = first(eu_ntile_name)
  ) %>%
  ggplot(aes(x = eu_ntile_name, y = value)) +
  geom_col(position = position_dodge(), fill = pal[1]) +
  theme_minimal() +
  theme(
    text = element_text(family = "Liberation Sans Narrow"),
    axis.text.x = element_text(angle = 90)
  ) +
  labs(x = "", y = "Expenditure (trn€)") +
  scale_x_discrete(labels = sprintf("D%02d", 1:10))

# Energy footprint: decile sums of total_energy_use_tj scaled by 1e-6.
p2 <- pdat_country_summary_by_eu_ntile %>%
  filter(year == 2010, indicator == "total_energy_use_tj") %>%
  group_by(eu_q_rank) %>%
  summarise(
    value = sum(value) * 1e-6,
    eu_ntile_name = first(eu_ntile_name)
  ) %>%
  ggplot(aes(x = eu_ntile_name, y = value)) +
  geom_col(position = position_dodge(), fill = pal[1]) +
  theme_minimal() +
  theme(
    text = element_text(family = "Liberation Sans Narrow"),
    axis.text.x = element_text(angle = 90)
  ) +
  labs(x = "", y = "Energy footprint (EJ)") +
  scale_x_discrete(labels = sprintf("D%02d", 1:10))

# Carbon footprint: decile sums of total_co2eq_kg scaled by 1e-9.
p3 <- pdat_country_summary_by_eu_ntile %>%
  filter(year == 2010, indicator == "total_co2eq_kg") %>%
  group_by(eu_q_rank) %>%
  summarise(
    value = sum(value) * 1e-9,
    eu_ntile_name = first(eu_ntile_name)
  ) %>%
  ggplot(aes(x = eu_ntile_name, y = value)) +
  geom_col(position = position_dodge(), fill = pal[1]) +
  theme_minimal() +
  theme(
    text = element_text(family = "Liberation Sans Narrow"),
    axis.text.x = element_text(angle = 90)
  ) +
  labs(x = "", y = "Carbon footprint (MtCO2eq)") +
  scale_x_discrete(labels = sprintf("D%02d", 1:10))

# Three panels side by side.
p_top <- p1 + p2 + p3


# Carbon intensity per expenditure by EU decile (2010): violins weighted by
# total_fd_me, the individual rows as points, and a horizontal segment at
# the total_fd_me-weighted mean of each decile.
p1 <- dat_country_summary_by_eu_ntile %>%
  filter(year == 2010) %>%
  ggplot(aes(x = factor(eu_q_rank), y = pe_co2eq_kg)) +
  geom_violin(
    aes(weight = total_fd_me),
    fill = pal[1], color = pal[1], alpha = 0.5
  ) +
  geom_point(alpha = 0.3) +
  geom_segment(
    data = dat_country_summary_by_eu_ntile %>%
      filter(year == 2010) %>%
      group_by(eu_q_rank) %>%
      summarise(pe_co2eq_kg = weighted.mean(pe_co2eq_kg, w = total_fd_me)),
    aes(
      y = pe_co2eq_kg, yend = pe_co2eq_kg,
      x = eu_q_rank - 0.3, xend = eu_q_rank + 0.3
    ),
    size = 1.5
  ) +
  theme_minimal() +
  theme(
    text = element_text(family = "Liberation Sans Narrow"),
    axis.text.x = element_text(angle = 90)
  ) +
  labs(x = "", y = "Carbon intensity per expenditure (kgCO2eq/€)") +
  scale_x_discrete(labels = sprintf("D%02d", 1:10))

# Energy intensity per expenditure by EU decile (2010), same layout.
p2 <- dat_country_summary_by_eu_ntile %>%
  filter(year == 2010) %>%
  ggplot(aes(x = factor(eu_q_rank), y = pe_energy_use_mj)) +
  geom_violin(
    aes(weight = total_fd_me),
    fill = pal[1], color = pal[1], alpha = 0.5
  ) +
  geom_point(alpha = 0.3) +
  geom_segment(
    data = dat_country_summary_by_eu_ntile %>%
      filter(year == 2010) %>%
      group_by(eu_q_rank) %>%
      summarise(
        pe_energy_use_mj = weighted.mean(pe_energy_use_mj, w = total_fd_me)
      ),
    aes(
      y = pe_energy_use_mj, yend = pe_energy_use_mj,
      x = eu_q_rank - 0.3, xend = eu_q_rank + 0.3
    ),
    size = 1.5
  ) +
  theme_minimal() +
  theme(
    text = element_text(family = "Liberation Sans Narrow"),
    axis.text.x = element_text(angle = 90)
  ) +
  labs(x = "", y = "Energy intensity per expenditure (MJ/€)") +
  scale_x_discrete(labels = sprintf("D%02d", 1:10))

# Carbon intensity of energy per row (2010). Going by the column names,
# total_co2eq_kg * 0.001 is tonnes CO2eq and total_energy_use_tj is TJ, so
# the ratio is tCO2eq per TJ (numerically equal to gCO2eq per MJ).
dat3 <- dat_country_summary_by_eu_ntile %>%
  filter(year == 2010) %>%
  mutate(intensity_e_c = total_co2eq_kg * 0.001 / total_energy_use_tj)

# Violins weighted by total_energy_use_tj, the individual rows as points,
# and a horizontal segment at the energy-weighted mean of each decile.
# `dat3` is already restricted to 2010, so no second year filter is needed.
p3 <- dat3 %>%
  ggplot(aes(x = factor(eu_q_rank), y = intensity_e_c)) +
  geom_violin(
    aes(weight = total_energy_use_tj),
    fill = pal[1], color = pal[1], alpha = 0.5
  ) +
  geom_point(alpha = 0.3) +
  geom_segment(
    data = dat3 %>%
      group_by(eu_q_rank) %>%
      summarise(
        intensity_e_c = weighted.mean(intensity_e_c, w = total_energy_use_tj)
      ),
    aes(
      y = intensity_e_c, yend = intensity_e_c,
      x = eu_q_rank - 0.3, xend = eu_q_rank + 0.3
    ),
    size = 1.5
  ) +
  theme_minimal() +
  theme(
    text = element_text(family = "Liberation Sans Narrow"),
    axis.text.x = element_text(angle = 90)
  ) +
  # The axis unit follows the computation above (t/TJ); the previous label
  # "gCO2eq/TJ" was off by a factor of 1e6.
  labs(x = "", y = "Carbon intensity per energy (tCO2eq/TJ)") +
  scale_x_discrete(labels = sprintf("D%02d", 1:10))

# Bottom row: energy intensity, carbon intensity, carbon intensity of energy.
p_bottom <- p2 + p1 + p3


# values in text

## inequality

# Expenditure per EU decile (2010), decile sums scaled by 1e-6.
# Note: `exp` shares its name with base::exp(); calls such as exp(x) still
# resolve to the function because R skips non-function objects there.
exp <- pdat_country_summary_by_eu_ntile %>%
  filter(year == 2010, indicator == "total_fd_me") %>%
  group_by(eu_q_rank) %>%
  summarise(
    value = sum(value) * 1e-6,
    eu_ntile_name = first(eu_ntile_name)
  )

exp_total <- exp %>%
  summarise(value = sum(value)) %>%
  pull(value)

# Ratio of the rank-10 decile total to the rank-1 decile total.
exp_10_10 <- round(
  pull(filter(exp, eu_q_rank == 10), value) /
    pull(filter(exp, eu_q_rank == 1), value),
  digits = 1
)

# Energy footprint per EU decile (2010), decile sums scaled by 1e-6.
energy <- pdat_country_summary_by_eu_ntile %>%
  filter(year == 2010, indicator == "total_energy_use_tj") %>%
  group_by(eu_q_rank) %>%
  summarise(
    value = sum(value) * 1e-6,
    eu_ntile_name = first(eu_ntile_name)
  )

energy_total <- energy %>%
  summarise(value = sum(value)) %>%
  pull(value)

energy_10_10 <- round(
  pull(filter(energy, eu_q_rank == 10), value) /
    pull(filter(energy, eu_q_rank == 1), value),
  digits = 1
)

# Carbon footprint per EU decile (2010), decile sums scaled by 1e-9.
co2eq <- pdat_country_summary_by_eu_ntile %>%
  filter(year == 2010, indicator == "total_co2eq_kg") %>%
  group_by(eu_q_rank) %>%
  summarise(
    value = sum(value) * 1e-9,
    eu_ntile_name = first(eu_ntile_name)
  )

co2eq_total <- co2eq %>%
  summarise(value = sum(value)) %>%
  pull(value)

co2eq_10_10 <- round(
  pull(filter(co2eq, eu_q_rank == 10), value) /
    pull(filter(co2eq, eu_q_rank == 1), value),
  digits = 1
)

## total per decile

# Value of the rank-1 and rank-10 decile for each indicator, rounded to
# one decimal place.
exp_bottom_decile <- exp %>%
  filter(eu_q_rank == 1) %>%
  pull(value) %>%
  round(digits = 1)

exp_top_decile <- exp %>%
  filter(eu_q_rank == 10) %>%
  pull(value) %>%
  round(digits = 1)

energy_bottom_decile <- energy %>%
  filter(eu_q_rank == 1) %>%
  pull(value) %>%
  round(digits = 1)

energy_top_decile <- energy %>%
  filter(eu_q_rank == 10) %>%
  pull(value) %>%
  round(digits = 1)

co2eq_bottom_decile <- co2eq %>%
  filter(eu_q_rank == 1) %>%
  pull(value) %>%
  round(digits = 1)

co2eq_top_decile <- co2eq %>%
  filter(eu_q_rank == 10) %>%
  pull(value) %>%
  round(digits = 1)


## per adult equivalent per decile

# Adult equivalents summed over all rows of each EU decile (2010).
aeu <- pdat_country_summary_by_eu_ntile %>%
  filter(year == 2010, indicator == "total_adult_eq") %>%
  group_by(eu_q_rank) %>%
  summarise(
    value = sum(value),
    eu_ntile_name = first(eu_ntile_name)
  )

# Expenditure per adult equivalent: decile total divided by the decile's
# adult equivalents (`value` comes from `aeu` after the join), times 1e12.
exp_pae <- exp %>%
  rename(total_fd_me = value) %>%
  left_join(aeu, by = c("eu_q_rank", "eu_ntile_name")) %>%
  mutate(pae_fd_e = (total_fd_me / value) * 1e12)

fd_pae_bottom_decile <- exp_pae %>%
  filter(eu_q_rank == 1) %>%
  pull(pae_fd_e) %>%
  round(digits = 0)

fd_pae_top_decile <- exp_pae %>%
  filter(eu_q_rank == 10) %>%
  pull(pae_fd_e) %>%
  round(digits = 0)

# Energy footprint per adult equivalent (same construction, factor 1e9).
energy_pae <- energy %>%
  rename(total_energy_use_tj = value) %>%
  left_join(aeu, by = c("eu_q_rank", "eu_ntile_name")) %>%
  mutate(pae_energy_use_gj = (total_energy_use_tj / value) * 1e9)

energy_pae_bottom_decile <- energy_pae %>%
  filter(eu_q_rank == 1) %>%
  pull(pae_energy_use_gj) %>%
  round(digits = 1)

energy_pae_top_decile <- energy_pae %>%
  filter(eu_q_rank == 10) %>%
  pull(pae_energy_use_gj) %>%
  round(digits = 1)

# Carbon footprint per adult equivalent (same construction, factor 1e6).
co2eq_pae <- co2eq %>%
  rename(total_co2eq_kg = value) %>%
  left_join(aeu, by = c("eu_q_rank", "eu_ntile_name")) %>%
  mutate(pae_co2eq_t = (total_co2eq_kg / value) * 1e6)

co2eq_pae_bottom_decile <- co2eq_pae %>%
  filter(eu_q_rank == 1) %>%
  pull(pae_co2eq_t) %>%
  round(digits = 1)

co2eq_pae_top_decile <- co2eq_pae %>%
  filter(eu_q_rank == 10) %>%
  pull(pae_co2eq_t) %>%
  round(digits = 1)


## intensities

# Mean energy intensity per EU decile (2010), weighted by total_fd_me.
mean_energy_intens <- dat_country_summary_by_eu_ntile %>%
  filter(year == 2010) %>%
  group_by(eu_q_rank) %>%
  summarise(
    pe_energy_use_mj = weighted.mean(pe_energy_use_mj, w = total_fd_me)
  )

mean_energy_intens_bottom_decile <- mean_energy_intens %>%
  filter(eu_q_rank == 1) %>%
  pull(pe_energy_use_mj) %>%
  round(digits = 1)

mean_energy_intens_top_decile <- mean_energy_intens %>%
  filter(eu_q_rank == 10) %>%
  pull(pe_energy_use_mj) %>%
  round(digits = 1)

# Mean carbon intensity of energy per EU decile (2010): the row-level
# ratio total_co2eq_kg * 0.001 / total_energy_use_tj, weighted by
# total_energy_use_tj.
mean_co2eq_of_energy_intens <- dat_country_summary_by_eu_ntile %>%
  filter(year == 2010) %>%
  mutate(intensity_e_c = total_co2eq_kg * 0.001 / total_energy_use_tj) %>%
  group_by(eu_q_rank) %>%
  summarise(
    intensity_e_c = weighted.mean(intensity_e_c, w = total_energy_use_tj)
  )

mean_co2eq_of_energy_intens_bottom_decile <- mean_co2eq_of_energy_intens %>%
  filter(eu_q_rank == 1) %>%
  pull(intensity_e_c) %>%
  round(digits = 1)

mean_co2eq_of_energy_intens_top_decile <- mean_co2eq_of_energy_intens %>%
  filter(eu_q_rank == 10) %>%
  pull(intensity_e_c) %>%
  round(digits = 1)


# Stack the `p_top` row above the `p_bottom` row, tag the panels with
# lowercase letters, and apply one shared theme to every panel via `&`.
a <- p_top / p_bottom +
  plot_annotation(tag_levels = "a") +
  plot_layout(guides = "collect") &
  theme(
    plot.margin = unit(c(0.25, 0.25, 0.25, 0.25), "cm"),
    legend.position = "bottom",
    axis.title.y = element_text(size = 13, hjust = 0.5),
    axis.text.x = element_text(size = 12),
    axis.text.y = element_text(size = 12),
    legend.text = element_text(size = 12),
    legend.title = element_text(size = 13)
  )

a

# Pass the figure explicitly: without `plot =`, ggsave() writes whatever
# last_plot() currently returns, which depends on implicit session state.
ggsave(
  here("analysis", "figures", "figureS2.pdf"),
  plot = a,
  device = cairo_pdf
)

# Load the data wrangling functions from the "pxp" script.
# NOTE(review): presumably this replaces the get_*() helpers loaded earlier
# in the document with their pxp variants -- confirm against the script.
source(here("analysis", "R", "si", "wrangler_functions_pxp.R"))

## Load result data for EU deciles (10 quantile groups).
eu_q_count <- 10

# Country summary by country quintile and EU ntile, then the long-format
# version for plotting (keeping `cols_ex` as identifier columns).
dat_country_summary_by_cquint_and_euntile <-
  get_country_summary_by_cquint_and_euntile(eu_q_count)
cols_ex <- c("year", "iso2", "quint", "eu_q_rank")
pdat_country_summary_by_cquint_and_euntile <- pivot_results_longer_adorn(
  dat_country_summary_by_cquint_and_euntile,
  cols_ex
)

# Country summary by EU ntile without sectoral resolution, plus long format.
dat_country_summary_by_eu_ntile <- get_country_summary_by_eu_ntile(eu_q_count)
cols_ex <- c("year", "iso2", "eu_q_rank")
pdat_country_summary_by_eu_ntile <- pivot_results_longer_adorn(
  dat_country_summary_by_eu_ntile,
  cols_ex
)

# Sector summary by country quintile (aggregate sectors), plus long format.
dat_sector_summary_by_country_quintile <-
  get_sector_summary_by_country_quintile(eu_q_count)
cols_ex <- c("year", "iso2", "quint", "eu_q_rank", "sector_agg_id")
pdat_sector_summary_by_country_quintile <- pivot_results_longer_adorn(
  dat_sector_summary_by_country_quintile,
  cols_ex
)

# Sector summary by EU ntile (aggregate sectors), plus long format.
dat_sector_summary_by_eu_ntile <- get_sector_summary_by_eu_ntile(eu_q_count)
cols_ex <- c("year", "eu_q_rank", "sector_agg_id")
pdat_sector_summary_by_eu_ntile <- pivot_results_longer_adorn(
  dat_sector_summary_by_eu_ntile,
  cols_ex
)


# Top row of the figure: one bar chart per indicator, showing the 2010
# total of each EU decile.

# Expenditure: decile sums of total_fd_me scaled by 1e-6.
p1 <- pdat_country_summary_by_eu_ntile %>%
  filter(year == 2010, indicator == "total_fd_me") %>%
  group_by(eu_q_rank) %>%
  summarise(
    value = sum(value) * 1e-6,
    eu_ntile_name = first(eu_ntile_name)
  ) %>%
  ggplot(aes(x = eu_ntile_name, y = value)) +
  geom_col(position = position_dodge(), fill = pal[1]) +
  theme_minimal() +
  theme(
    text = element_text(family = "Liberation Sans Narrow"),
    axis.text.x = element_text(angle = 90)
  ) +
  labs(x = "", y = "Expenditure (trn€)") +
  scale_x_discrete(labels = sprintf("D%02d", 1:10))

# Energy footprint: decile sums of total_energy_use_tj scaled by 1e-6.
p2 <- pdat_country_summary_by_eu_ntile %>%
  filter(year == 2010, indicator == "total_energy_use_tj") %>%
  group_by(eu_q_rank) %>%
  summarise(
    value = sum(value) * 1e-6,
    eu_ntile_name = first(eu_ntile_name)
  ) %>%
  ggplot(aes(x = eu_ntile_name, y = value)) +
  geom_col(position = position_dodge(), fill = pal[1]) +
  theme_minimal() +
  theme(
    text = element_text(family = "Liberation Sans Narrow"),
    axis.text.x = element_text(angle = 90)
  ) +
  labs(x = "", y = "Energy footprint (EJ)") +
  scale_x_discrete(labels = sprintf("D%02d", 1:10))


# Carbon footprint: decile sums of total_co2eq_kg scaled by 1e-9.
p3 <- pdat_country_summary_by_eu_ntile %>%
  filter(year == 2010, indicator == "total_co2eq_kg") %>%
  group_by(eu_q_rank) %>%
  summarise(
    value = sum(value) * 1e-9,
    eu_ntile_name = first(eu_ntile_name)
  ) %>%
  ggplot(aes(x = eu_ntile_name, y = value)) +
  geom_col(position = position_dodge(), fill = pal[1]) +
  theme_minimal() +
  theme(
    text = element_text(family = "Liberation Sans Narrow"),
    axis.text.x = element_text(angle = 90)
  ) +
  labs(x = "", y = "Carbon footprint (MtCO2eq)") +
  scale_x_discrete(labels = sprintf("D%02d", 1:10))

# Three panels side by side.
p_top <- p1 + p2 + p3


# Carbon intensity per expenditure by EU decile (2010): violins weighted by
# total_fd_me, the individual rows as points, and a horizontal segment at
# the total_fd_me-weighted mean of each decile.
p1 <- dat_country_summary_by_eu_ntile %>%
  filter(year == 2010) %>%
  ggplot(aes(x = factor(eu_q_rank), y = pe_co2eq_kg)) +
  geom_violin(
    aes(weight = total_fd_me),
    fill = pal[1], color = pal[1], alpha = 0.5
  ) +
  geom_point(alpha = 0.3) +
  geom_segment(
    data = dat_country_summary_by_eu_ntile %>%
      filter(year == 2010) %>%
      group_by(eu_q_rank) %>%
      summarise(pe_co2eq_kg = weighted.mean(pe_co2eq_kg, w = total_fd_me)),
    aes(
      y = pe_co2eq_kg, yend = pe_co2eq_kg,
      x = eu_q_rank - 0.3, xend = eu_q_rank + 0.3
    ),
    size = 1.5
  ) +
  theme_minimal() +
  theme(
    text = element_text(family = "Liberation Sans Narrow"),
    axis.text.x = element_text(angle = 90)
  ) +
  labs(x = "", y = "Carbon intensity per expenditure (kgCO2eq/€)") +
  scale_x_discrete(labels = sprintf("D%02d", 1:10))

# Energy intensity per expenditure by EU decile (2010), same layout.
p2 <- dat_country_summary_by_eu_ntile %>%
  filter(year == 2010) %>%
  ggplot(aes(x = factor(eu_q_rank), y = pe_energy_use_mj)) +
  geom_violin(
    aes(weight = total_fd_me),
    fill = pal[1], color = pal[1], alpha = 0.5
  ) +
  geom_point(alpha = 0.3) +
  geom_segment(
    data = dat_country_summary_by_eu_ntile %>%
      filter(year == 2010) %>%
      group_by(eu_q_rank) %>%
      summarise(
        pe_energy_use_mj = weighted.mean(pe_energy_use_mj, w = total_fd_me)
      ),
    aes(
      y = pe_energy_use_mj, yend = pe_energy_use_mj,
      x = eu_q_rank - 0.3, xend = eu_q_rank + 0.3
    ),
    size = 1.5
  ) +
  theme_minimal() +
  theme(
    text = element_text(family = "Liberation Sans Narrow"),
    axis.text.x = element_text(angle = 90)
  ) +
  labs(x = "", y = "Energy intensity per expenditure (MJ/€)") +
  scale_x_discrete(labels = sprintf("D%02d", 1:10))

# Carbon intensity of energy per row (2010). Going by the column names,
# total_co2eq_kg * 0.001 is tonnes CO2eq and total_energy_use_tj is TJ, so
# the ratio is tCO2eq per TJ (numerically equal to gCO2eq per MJ).
dat3 <- dat_country_summary_by_eu_ntile %>%
  filter(year == 2010) %>%
  mutate(intensity_e_c = total_co2eq_kg * 0.001 / total_energy_use_tj)

# Violins weighted by total_energy_use_tj, the individual rows as points,
# and a horizontal segment at the energy-weighted mean of each decile.
# `dat3` is already restricted to 2010, so no second year filter is needed.
p3 <- dat3 %>%
  ggplot(aes(x = factor(eu_q_rank), y = intensity_e_c)) +
  geom_violin(
    aes(weight = total_energy_use_tj),
    fill = pal[1], color = pal[1], alpha = 0.5
  ) +
  geom_point(alpha = 0.3) +
  geom_segment(
    data = dat3 %>%
      group_by(eu_q_rank) %>%
      summarise(
        intensity_e_c = weighted.mean(intensity_e_c, w = total_energy_use_tj)
      ),
    aes(
      y = intensity_e_c, yend = intensity_e_c,
      x = eu_q_rank - 0.3, xend = eu_q_rank + 0.3
    ),
    size = 1.5
  ) +
  theme_minimal() +
  theme(
    text = element_text(family = "Liberation Sans Narrow"),
    axis.text.x = element_text(angle = 90)
  ) +
  # The axis unit follows the computation above (t/TJ); the previous label
  # "gCO2eq/TJ" was off by a factor of 1e6.
  labs(x = "", y = "Carbon intensity per energy (tCO2eq/TJ)") +
  scale_x_discrete(labels = sprintf("D%02d", 1:10))

# Bottom row: energy intensity, carbon intensity, carbon intensity of energy.
p_bottom <- p2 + p1 + p3


# values in text

## inequality

# Expenditure per EU decile (2010), decile sums scaled by 1e-6.
# Note: `exp` shares its name with base::exp(); calls such as exp(x) still
# resolve to the function because R skips non-function objects there.
exp <- pdat_country_summary_by_eu_ntile %>%
  filter(year == 2010, indicator == "total_fd_me") %>%
  group_by(eu_q_rank) %>%
  summarise(
    value = sum(value) * 1e-6,
    eu_ntile_name = first(eu_ntile_name)
  )

exp_total <- exp %>%
  summarise(value = sum(value)) %>%
  pull(value)

# Ratio of the rank-10 decile total to the rank-1 decile total.
exp_10_10 <- round(
  pull(filter(exp, eu_q_rank == 10), value) /
    pull(filter(exp, eu_q_rank == 1), value),
  digits = 1
)

# Energy footprint per EU decile (2010), decile sums scaled by 1e-6.
energy <- pdat_country_summary_by_eu_ntile %>%
  filter(year == 2010, indicator == "total_energy_use_tj") %>%
  group_by(eu_q_rank) %>%
  summarise(
    value = sum(value) * 1e-6,
    eu_ntile_name = first(eu_ntile_name)
  )

energy_total <- energy %>%
  summarise(value = sum(value)) %>%
  pull(value)

energy_10_10 <- round(
  pull(filter(energy, eu_q_rank == 10), value) /
    pull(filter(energy, eu_q_rank == 1), value),
  digits = 1
)

# Carbon footprint per EU decile (2010), decile sums scaled by 1e-9.
co2eq <- pdat_country_summary_by_eu_ntile %>%
  filter(year == 2010, indicator == "total_co2eq_kg") %>%
  group_by(eu_q_rank) %>%
  summarise(
    value = sum(value) * 1e-9,
    eu_ntile_name = first(eu_ntile_name)
  )

co2eq_total <- co2eq %>%
  summarise(value = sum(value)) %>%
  pull(value)

co2eq_10_10 <- round(
  pull(filter(co2eq, eu_q_rank == 10), value) /
    pull(filter(co2eq, eu_q_rank == 1), value),
  digits = 1
)

## total per decile

# Value of the rank-1 and rank-10 decile for each indicator, rounded to
# one decimal place.
exp_bottom_decile <- exp %>%
  filter(eu_q_rank == 1) %>%
  pull(value) %>%
  round(digits = 1)

exp_top_decile <- exp %>%
  filter(eu_q_rank == 10) %>%
  pull(value) %>%
  round(digits = 1)

energy_bottom_decile <- energy %>%
  filter(eu_q_rank == 1) %>%
  pull(value) %>%
  round(digits = 1)

energy_top_decile <- energy %>%
  filter(eu_q_rank == 10) %>%
  pull(value) %>%
  round(digits = 1)

co2eq_bottom_decile <- co2eq %>%
  filter(eu_q_rank == 1) %>%
  pull(value) %>%
  round(digits = 1)

co2eq_top_decile <- co2eq %>%
  filter(eu_q_rank == 10) %>%
  pull(value) %>%
  round(digits = 1)


## per adult equivalent per decile

# Adult equivalents summed over all rows of each EU decile (2010).
aeu <- pdat_country_summary_by_eu_ntile %>%
  filter(year == 2010, indicator == "total_adult_eq") %>%
  group_by(eu_q_rank) %>%
  summarise(
    value = sum(value),
    eu_ntile_name = first(eu_ntile_name)
  )

# Expenditure per adult equivalent: decile total divided by the decile's
# adult equivalents (`value` comes from `aeu` after the join), times 1e12.
exp_pae <- exp %>%
  rename(total_fd_me = value) %>%
  left_join(aeu, by = c("eu_q_rank", "eu_ntile_name")) %>%
  mutate(pae_fd_e = (total_fd_me / value) * 1e12)

fd_pae_bottom_decile <- exp_pae %>%
  filter(eu_q_rank == 1) %>%
  pull(pae_fd_e) %>%
  round(digits = 0)

fd_pae_top_decile <- exp_pae %>%
  filter(eu_q_rank == 10) %>%
  pull(pae_fd_e) %>%
  round(digits = 0)

# Energy footprint per adult equivalent (same construction, factor 1e9).
energy_pae <- energy %>%
  rename(total_energy_use_tj = value) %>%
  left_join(aeu, by = c("eu_q_rank", "eu_ntile_name")) %>%
  mutate(pae_energy_use_gj = (total_energy_use_tj / value) * 1e9)

energy_pae_bottom_decile <- energy_pae %>%
  filter(eu_q_rank == 1) %>%
  pull(pae_energy_use_gj) %>%
  round(digits = 1)

energy_pae_top_decile <- energy_pae %>%
  filter(eu_q_rank == 10) %>%
  pull(pae_energy_use_gj) %>%
  round(digits = 1)

# Carbon footprint per adult equivalent (same construction, factor 1e6).
co2eq_pae <- co2eq %>%
  rename(total_co2eq_kg = value) %>%
  left_join(aeu, by = c("eu_q_rank", "eu_ntile_name")) %>%
  mutate(pae_co2eq_t = (total_co2eq_kg / value) * 1e6)

co2eq_pae_bottom_decile <- co2eq_pae %>%
  filter(eu_q_rank == 1) %>%
  pull(pae_co2eq_t) %>%
  round(digits = 1)

co2eq_pae_top_decile <- co2eq_pae %>%
  filter(eu_q_rank == 10) %>%
  pull(pae_co2eq_t) %>%
  round(digits = 1)


## intensities

# Mean energy intensity per EU decile (2010), weighted by total_fd_me.
mean_energy_intens <- dat_country_summary_by_eu_ntile %>%
  filter(year == 2010) %>%
  group_by(eu_q_rank) %>%
  summarise(
    pe_energy_use_mj = weighted.mean(pe_energy_use_mj, w = total_fd_me)
  )

mean_energy_intens_bottom_decile <- mean_energy_intens %>%
  filter(eu_q_rank == 1) %>%
  pull(pe_energy_use_mj) %>%
  round(digits = 1)

mean_energy_intens_top_decile <- mean_energy_intens %>%
  filter(eu_q_rank == 10) %>%
  pull(pe_energy_use_mj) %>%
  round(digits = 1)

# Mean carbon intensity of energy per EU decile (2010): the row-level
# ratio total_co2eq_kg * 0.001 / total_energy_use_tj, weighted by
# total_energy_use_tj.
mean_co2eq_of_energy_intens <- dat_country_summary_by_eu_ntile %>%
  filter(year == 2010) %>%
  mutate(intensity_e_c = total_co2eq_kg * 0.001 / total_energy_use_tj) %>%
  group_by(eu_q_rank) %>%
  summarise(
    intensity_e_c = weighted.mean(intensity_e_c, w = total_energy_use_tj)
  )

mean_co2eq_of_energy_intens_bottom_decile <- mean_co2eq_of_energy_intens %>%
  filter(eu_q_rank == 1) %>%
  pull(intensity_e_c) %>%
  round(digits = 1)

mean_co2eq_of_energy_intens_top_decile <- mean_co2eq_of_energy_intens %>%
  filter(eu_q_rank == 10) %>%
  pull(intensity_e_c) %>%
  round(digits = 1)


# Stack the `p_top` row above the `p_bottom` row, tag the panels with
# lowercase letters, and apply one shared theme to every panel via `&`.
a <- p_top / p_bottom +
  plot_annotation(tag_levels = "a") +
  plot_layout(guides = "collect") &
  theme(
    plot.margin = unit(c(0.25, 0.25, 0.25, 0.25), "cm"),
    legend.position = "bottom",
    axis.title.y = element_text(size = 13, hjust = 0.5),
    axis.text.x = element_text(size = 12),
    axis.text.y = element_text(size = 12),
    legend.text = element_text(size = 12),
    legend.title = element_text(size = 13)
  )

a

# Pass the figure explicitly: without `plot =`, ggsave() writes whatever
# last_plot() currently returns, which depends on implicit session state.
ggsave(
  here("analysis", "figures", "figureS3.pdf"),
  plot = a,
  device = cairo_pdf
)